diff --git "a/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" "b/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" --- "a/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" +++ "b/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3001, "train/learning_rate": 6.728971962616822e-06, "train/epoch": 0.84, "train/global_step": 1500, "_runtime": 7542, "_timestamp": 1646105814, "_step": 1502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 914.0, 99.0], "bins": [-1145.5391845703125, -1127.27197265625, -1109.0047607421875, -1090.7374267578125, -1072.47021484375, -1054.2030029296875, -1035.935791015625, -1017.6685180664062, -999.4013061523438, -981.1340942382812, -962.8668212890625, -944.599609375, -926.3323974609375, -908.0651245117188, -889.7979125976562, -871.5306396484375, -853.263427734375, -834.9962158203125, -816.7289428710938, -798.4617309570312, -780.1944580078125, -761.92724609375, -743.6600341796875, -725.3927612304688, -707.1255493164062, -688.8583374023438, -670.591064453125, -652.3238525390625, -634.056640625, -615.7893676757812, -597.5221557617188, -579.2548828125, -560.9877319335938, -542.7205200195312, -524.4532470703125, -506.18603515625, -487.9187927246094, -469.65155029296875, -451.38433837890625, -433.1170959472656, -414.8498229980469, -396.58258056640625, -378.31536865234375, -360.0481262207031, -341.7808837890625, -323.5136413574219, -305.24639892578125, -286.97918701171875, -268.7119445800781, -250.4447021484375, -232.17747497558594, -213.91024780273438, -195.64300537109375, -177.37576293945312, -159.10853576660156, -140.84130859375, -122.57406616210938, -104.30683135986328, -86.03959655761719, -67.7723617553711, -49.505126953125, -31.237892150878906, -12.970657348632812, 5.296577453613281, 23.56380844116211]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 11.0, 27.0, 24.0, 28.0, 45.0, 43.0, 45.0, 55.0, 56.0, 44.0, 76.0, 71.0, 68.0, 82.0, 68.0, 51.0, 42.0, 39.0, 23.0, 21.0, 24.0, 10.0, 11.0, 8.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.8681640625, -99.92489624023438, -96.98162078857422, -94.03834533691406, -91.09507751464844, -88.15180969238281, -85.20853424072266, -82.2652587890625, -79.32199096679688, -76.37872314453125, -73.4354476928711, -70.49217224121094, -67.54890441894531, -64.60563659667969, -61.66236114501953, -58.71908950805664, -55.77581787109375, -52.83254623413086, -49.88927459716797, -46.94600296020508, -44.00273132324219, -41.0594596862793, -38.116188049316406, -35.172916412353516, -32.229644775390625, -29.286373138427734, -26.343101501464844, -23.399829864501953, -20.456558227539062, -17.513286590576172, -14.570014953613281, -11.62674331665039, -8.6834716796875, -5.740200042724609, -2.7969284057617188, 0.14634323120117188, 3.0896148681640625, 6.032886505126953, 8.976158142089844, 11.919429779052734, 14.862701416015625, 17.805973052978516, 20.749244689941406, 23.692516326904297, 26.635787963867188, 29.579059600830078, 32.52233123779297, 35.46560287475586, 38.40887451171875, 41.35214614868164, 44.29541778564453, 47.23868942260742, 50.18196105957031, 53.1252326965332, 56.068504333496094, 59.011775970458984, 61.955047607421875, 64.8983154296875, 67.84159088134766, 70.78486633300781, 73.72813415527344, 76.67140197753906, 79.61467742919922, 82.55795288085938, 85.501220703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 6.0, 7.0, 13.0, 21.0, 16.0, 10.0, 21.0, 18.0, 21.0, 21.0, 21.0, 27.0, 35.0, 25.0, 39.0, 32.0, 26.0, 34.0, 31.0, 47.0, 28.0, 44.0, 39.0, 37.0, 38.0, 37.0, 36.0, 31.0, 34.0, 30.0, 23.0, 25.0, 17.0, 12.0, 13.0, 15.0, 12.0, 8.0, 4.0, 4.0, 7.0, 5.0, 2.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.73828125, -2.65740966796875, -2.5765380859375, -2.49566650390625, -2.414794921875, -2.33392333984375, -2.2530517578125, -2.17218017578125, -2.09130859375, -2.01043701171875, -1.9295654296875, -1.84869384765625, -1.767822265625, -1.68695068359375, -1.6060791015625, -1.52520751953125, -1.4443359375, -1.36346435546875, -1.2825927734375, -1.20172119140625, -1.120849609375, -1.03997802734375, -0.9591064453125, -0.87823486328125, -0.79736328125, -0.71649169921875, -0.6356201171875, -0.55474853515625, -0.473876953125, -0.39300537109375, -0.3121337890625, -0.23126220703125, -0.150390625, -0.06951904296875, 0.0113525390625, 0.09222412109375, 0.173095703125, 0.25396728515625, 0.3348388671875, 0.41571044921875, 0.49658203125, 0.57745361328125, 0.6583251953125, 0.73919677734375, 0.820068359375, 0.90093994140625, 0.9818115234375, 1.06268310546875, 1.1435546875, 1.22442626953125, 1.3052978515625, 1.38616943359375, 1.467041015625, 1.54791259765625, 1.6287841796875, 1.70965576171875, 1.79052734375, 1.87139892578125, 1.9522705078125, 2.03314208984375, 2.114013671875, 2.19488525390625, 2.2757568359375, 2.35662841796875, 2.4375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 4.0, 7.0, 7.0, 9.0, 13.0, 25.0, 28.0, 37.0, 49.0, 71.0, 95.0, 108.0, 172.0, 217.0, 325.0, 522.0, 709.0, 1342.0, 2427.0, 5240.0, 14277.0, 51764.0, 348085.0, 2808169.0, 839888.0, 86155.0, 20351.0, 7041.0, 2972.0, 1582.0, 824.0, 543.0, 352.0, 260.0, 168.0, 100.0, 86.0, 75.0, 52.0, 30.0, 21.0, 22.0, 14.0, 12.0, 11.0, 4.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.34375, -10.9854736328125, -10.627197265625, -10.2689208984375, -9.91064453125, -9.5523681640625, -9.194091796875, -8.8358154296875, -8.4775390625, -8.1192626953125, -7.760986328125, -7.4027099609375, -7.04443359375, -6.6861572265625, -6.327880859375, -5.9696044921875, -5.611328125, -5.2530517578125, -4.894775390625, -4.5364990234375, -4.17822265625, -3.8199462890625, -3.461669921875, -3.1033935546875, -2.7451171875, -2.3868408203125, -2.028564453125, -1.6702880859375, -1.31201171875, -0.9537353515625, -0.595458984375, -0.2371826171875, 0.12109375, 0.4793701171875, 0.837646484375, 1.1959228515625, 1.55419921875, 1.9124755859375, 2.270751953125, 2.6290283203125, 2.9873046875, 3.3455810546875, 3.703857421875, 4.0621337890625, 4.42041015625, 4.7786865234375, 5.136962890625, 5.4952392578125, 5.853515625, 6.2117919921875, 6.570068359375, 6.9283447265625, 7.28662109375, 7.6448974609375, 8.003173828125, 8.3614501953125, 8.7197265625, 9.0780029296875, 9.436279296875, 9.7945556640625, 10.15283203125, 10.5111083984375, 10.869384765625, 11.2276611328125, 11.5859375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 23.0, 78.0, 198.0, 419.0, 934.0, 1280.0, 664.0, 269.0, 108.0, 46.0, 16.0, 17.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.53125, -38.5498046875, -37.568359375, -36.5869140625, -35.60546875, -34.6240234375, -33.642578125, -32.6611328125, -31.6796875, -30.6982421875, -29.716796875, -28.7353515625, -27.75390625, -26.7724609375, -25.791015625, -24.8095703125, -23.828125, -22.8466796875, -21.865234375, -20.8837890625, -19.90234375, -18.9208984375, -17.939453125, -16.9580078125, -15.9765625, -14.9951171875, -14.013671875, -13.0322265625, -12.05078125, -11.0693359375, -10.087890625, -9.1064453125, -8.125, -7.1435546875, -6.162109375, -5.1806640625, -4.19921875, -3.2177734375, -2.236328125, -1.2548828125, -0.2734375, 0.7080078125, 1.689453125, 2.6708984375, 3.65234375, 4.6337890625, 5.615234375, 6.5966796875, 7.578125, 8.5595703125, 9.541015625, 10.5224609375, 11.50390625, 12.4853515625, 13.466796875, 14.4482421875, 15.4296875, 16.4111328125, 17.392578125, 18.3740234375, 19.35546875, 20.3369140625, 21.318359375, 22.2998046875, 23.28125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 11.0, 20.0, 26.0, 97.0, 190.0, 700.0, 2533.0, 1136635.0, 3050088.0, 2832.0, 732.0, 232.0, 115.0, 38.0, 11.0, 9.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.375, -113.9267578125, -110.478515625, -107.0302734375, -103.58203125, -100.1337890625, -96.685546875, -93.2373046875, -89.7890625, -86.3408203125, -82.892578125, -79.4443359375, -75.99609375, -72.5478515625, -69.099609375, -65.6513671875, -62.203125, -58.7548828125, -55.306640625, -51.8583984375, -48.41015625, -44.9619140625, -41.513671875, -38.0654296875, -34.6171875, -31.1689453125, -27.720703125, -24.2724609375, -20.82421875, -17.3759765625, -13.927734375, -10.4794921875, -7.03125, -3.5830078125, -0.134765625, 3.3134765625, 6.76171875, 10.2099609375, 13.658203125, 17.1064453125, 20.5546875, 24.0029296875, 27.451171875, 30.8994140625, 34.34765625, 37.7958984375, 41.244140625, 44.6923828125, 48.140625, 51.5888671875, 55.037109375, 58.4853515625, 61.93359375, 65.3818359375, 68.830078125, 72.2783203125, 75.7265625, 79.1748046875, 82.623046875, 86.0712890625, 89.51953125, 92.9677734375, 96.416015625, 99.8642578125, 103.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [3.0, 94.0, 674.0, 229.0, 13.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.627187728881836, -12.197919845581055, -4.768651008605957, 2.6606178283691406, 10.089885711669922, 17.519155502319336, 24.948423385620117, 32.37769317626953, 39.80696105957031, 47.236228942871094, 54.665496826171875, 62.094764709472656, 69.52403259277344, 76.95330810546875, 84.382568359375, 91.81184387207031, 99.24110412597656, 106.67037200927734, 114.09963989257812, 121.5289077758789, 128.9581756591797, 136.387451171875, 143.81671142578125, 151.24598693847656, 158.6752471923828, 166.10452270507812, 173.53378295898438, 180.9630584716797, 188.39231872558594, 195.82159423828125, 203.2508544921875, 210.6801300048828, 218.10939025878906, 225.53866577148438, 232.96792602539062, 240.39720153808594, 247.8264617919922, 255.2557373046875, 262.68499755859375, 270.1142578125, 277.5435485839844, 284.9728088378906, 292.402099609375, 299.83135986328125, 307.2606201171875, 314.68988037109375, 322.1191711425781, 329.5484313964844, 336.9776916503906, 344.4069519042969, 351.83624267578125, 359.2655029296875, 366.69476318359375, 374.1240234375, 381.5533142089844, 388.9825744628906, 396.4118347167969, 403.8410949707031, 411.2703857421875, 418.69964599609375, 426.12890625, 433.55816650390625, 440.9874572753906, 448.4167175292969, 455.8459777832031]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 4.0, 8.0, 10.0, 10.0, 18.0, 17.0, 30.0, 24.0, 31.0, 21.0, 29.0, 37.0, 25.0, 40.0, 46.0, 37.0, 32.0, 34.0, 43.0, 51.0, 43.0, 46.0, 39.0, 41.0, 42.0, 34.0, 37.0, 26.0, 18.0, 25.0, 25.0, 13.0, 10.0, 14.0, 10.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-43.10028076171875, -41.78769302368164, -40.4751091003418, -39.16252136230469, -37.849937438964844, -36.537349700927734, -35.224761962890625, -33.91217803955078, -32.59959030151367, -31.287004470825195, -29.97441864013672, -28.66183090209961, -27.349245071411133, -26.036659240722656, -24.724071502685547, -23.41148567199707, -22.098899841308594, -20.786314010620117, -19.47372817993164, -18.16114044189453, -16.848554611206055, -15.535968780517578, -14.223381996154785, -12.910795211791992, -11.598209381103516, -10.285623550415039, -8.973036766052246, -7.660450458526611, -6.347864151000977, -5.035277843475342, -3.722691535949707, -2.410104751586914, -1.0975189208984375, 0.21506738662719727, 1.527653694152832, 2.840240001678467, 4.152826309204102, 5.465412616729736, 6.777998924255371, 8.090585708618164, 9.40317153930664, 10.715757369995117, 12.02834415435791, 13.340930938720703, 14.65351676940918, 15.966102600097656, 17.278690338134766, 18.591276168823242, 19.90386199951172, 21.216447830200195, 22.529033660888672, 23.84162139892578, 25.154207229614258, 26.466793060302734, 27.779380798339844, 29.09196662902832, 30.404552459716797, 31.717138290405273, 33.02972412109375, 34.34231185913086, 35.65489959716797, 36.96748352050781, 38.28007125854492, 39.59265899658203, 40.905242919921875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 5.0, 3.0, 14.0, 14.0, 8.0, 11.0, 15.0, 22.0, 19.0, 13.0, 17.0, 23.0, 22.0, 30.0, 30.0, 23.0, 37.0, 26.0, 31.0, 50.0, 29.0, 37.0, 37.0, 35.0, 37.0, 36.0, 31.0, 37.0, 32.0, 36.0, 38.0, 27.0, 22.0, 20.0, 18.0, 20.0, 10.0, 9.0, 8.0, 11.0, 13.0, 7.0, 8.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.578125, -2.496978759765625, -2.41583251953125, -2.334686279296875, -2.2535400390625, -2.172393798828125, -2.09124755859375, -2.010101318359375, -1.928955078125, -1.847808837890625, -1.76666259765625, -1.685516357421875, -1.6043701171875, -1.523223876953125, -1.44207763671875, -1.360931396484375, -1.27978515625, -1.198638916015625, -1.11749267578125, -1.036346435546875, -0.9552001953125, -0.874053955078125, -0.79290771484375, -0.711761474609375, -0.630615234375, -0.549468994140625, -0.46832275390625, -0.387176513671875, -0.3060302734375, -0.224884033203125, -0.14373779296875, -0.062591552734375, 0.0185546875, 0.099700927734375, 0.18084716796875, 0.261993408203125, 0.3431396484375, 0.424285888671875, 0.50543212890625, 0.586578369140625, 0.667724609375, 0.748870849609375, 0.83001708984375, 0.911163330078125, 0.9923095703125, 1.073455810546875, 1.15460205078125, 1.235748291015625, 1.31689453125, 1.398040771484375, 1.47918701171875, 1.560333251953125, 1.6414794921875, 1.722625732421875, 1.80377197265625, 1.884918212890625, 1.966064453125, 2.047210693359375, 2.12835693359375, 2.209503173828125, 2.2906494140625, 2.371795654296875, 2.45294189453125, 2.534088134765625, 2.615234375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 12.0, 21.0, 35.0, 33.0, 54.0, 79.0, 137.0, 189.0, 308.0, 465.0, 745.0, 1160.0, 1716.0, 2734.0, 4459.0, 6872.0, 10759.0, 17263.0, 27949.0, 46372.0, 76155.0, 121661.0, 173421.0, 186872.0, 138632.0, 88874.0, 53947.0, 32993.0, 20109.0, 12365.0, 8115.0, 5088.0, 3147.0, 2114.0, 1313.0, 811.0, 523.0, 412.0, 242.0, 139.0, 81.0, 75.0, 33.0, 26.0, 13.0, 10.0, 10.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3125, -0.3024711608886719, -0.29244232177734375, -0.2824134826660156, -0.2723846435546875, -0.2623558044433594, -0.25232696533203125, -0.24229812622070312, -0.232269287109375, -0.22224044799804688, -0.21221160888671875, -0.20218276977539062, -0.1921539306640625, -0.18212509155273438, -0.17209625244140625, -0.16206741333007812, -0.15203857421875, -0.14200973510742188, -0.13198089599609375, -0.12195205688476562, -0.1119232177734375, -0.10189437866210938, -0.09186553955078125, -0.08183670043945312, -0.071807861328125, -0.061779022216796875, -0.05175018310546875, -0.041721343994140625, -0.0316925048828125, -0.021663665771484375, -0.01163482666015625, -0.001605987548828125, 0.0084228515625, 0.018451690673828125, 0.02848052978515625, 0.038509368896484375, 0.0485382080078125, 0.058567047119140625, 0.06859588623046875, 0.07862472534179688, 0.088653564453125, 0.09868240356445312, 0.10871124267578125, 0.11874008178710938, 0.1287689208984375, 0.13879776000976562, 0.14882659912109375, 0.15885543823242188, 0.16888427734375, 0.17891311645507812, 0.18894195556640625, 0.19897079467773438, 0.2089996337890625, 0.21902847290039062, 0.22905731201171875, 0.23908615112304688, 0.249114990234375, 0.2591438293457031, 0.26917266845703125, 0.2792015075683594, 0.2892303466796875, 0.2992591857910156, 0.30928802490234375, 0.3193168640136719, 0.329345703125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 10.0, 12.0, 9.0, 14.0, 14.0, 10.0, 17.0, 19.0, 24.0, 22.0, 26.0, 31.0, 28.0, 28.0, 41.0, 22.0, 35.0, 36.0, 34.0, 47.0, 1059.0, 22.0, 28.0, 40.0, 39.0, 34.0, 34.0, 28.0, 21.0, 27.0, 24.0, 22.0, 22.0, 21.0, 10.0, 18.0, 17.0, 17.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.697265625, -1.643218994140625, -1.58917236328125, -1.535125732421875, -1.4810791015625, -1.427032470703125, -1.37298583984375, -1.318939208984375, -1.264892578125, -1.210845947265625, -1.15679931640625, -1.102752685546875, -1.0487060546875, -0.994659423828125, -0.94061279296875, -0.886566162109375, -0.83251953125, -0.778472900390625, -0.72442626953125, -0.670379638671875, -0.6163330078125, -0.562286376953125, -0.50823974609375, -0.454193115234375, -0.400146484375, -0.346099853515625, -0.29205322265625, -0.238006591796875, -0.1839599609375, -0.129913330078125, -0.07586669921875, -0.021820068359375, 0.0322265625, 0.086273193359375, 0.14031982421875, 0.194366455078125, 0.2484130859375, 0.302459716796875, 0.35650634765625, 0.410552978515625, 0.464599609375, 0.518646240234375, 0.57269287109375, 0.626739501953125, 0.6807861328125, 0.734832763671875, 0.78887939453125, 0.842926025390625, 0.89697265625, 0.951019287109375, 1.00506591796875, 1.059112548828125, 1.1131591796875, 1.167205810546875, 1.22125244140625, 1.275299072265625, 1.329345703125, 1.383392333984375, 1.43743896484375, 1.491485595703125, 1.5455322265625, 1.599578857421875, 1.65362548828125, 1.707672119140625, 1.76171875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 9.0, 10.0, 15.0, 28.0, 37.0, 62.0, 77.0, 122.0, 164.0, 280.0, 462.0, 672.0, 1088.0, 1698.0, 2653.0, 4438.0, 7105.0, 11548.0, 19105.0, 31293.0, 50015.0, 76610.0, 111930.0, 148614.0, 1204480.0, 137255.0, 102505.0, 69219.0, 44076.0, 27472.0, 16927.0, 10349.0, 6321.0, 3848.0, 2449.0, 1572.0, 943.0, 596.0, 436.0, 240.0, 158.0, 91.0, 63.0, 35.0, 20.0, 14.0, 12.0, 3.0, 6.0, 7.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22133636474609375, -0.2142791748046875, -0.20722198486328125, -0.200164794921875, -0.19310760498046875, -0.1860504150390625, -0.17899322509765625, -0.17193603515625, -0.16487884521484375, -0.1578216552734375, -0.15076446533203125, -0.143707275390625, -0.13665008544921875, -0.1295928955078125, -0.12253570556640625, -0.115478515625, -0.10842132568359375, -0.1013641357421875, -0.09430694580078125, -0.087249755859375, -0.08019256591796875, -0.0731353759765625, -0.06607818603515625, -0.05902099609375, -0.05196380615234375, -0.0449066162109375, -0.03784942626953125, -0.030792236328125, -0.02373504638671875, -0.0166778564453125, -0.00962066650390625, -0.0025634765625, 0.00449371337890625, 0.0115509033203125, 0.01860809326171875, 0.025665283203125, 0.03272247314453125, 0.0397796630859375, 0.04683685302734375, 0.05389404296875, 0.06095123291015625, 0.0680084228515625, 0.07506561279296875, 0.082122802734375, 0.08917999267578125, 0.0962371826171875, 0.10329437255859375, 0.1103515625, 0.11740875244140625, 0.1244659423828125, 0.13152313232421875, 0.138580322265625, 0.14563751220703125, 0.1526947021484375, 0.15975189208984375, 0.16680908203125, 0.17386627197265625, 0.1809234619140625, 0.18798065185546875, 0.195037841796875, 0.20209503173828125, 0.2091522216796875, 0.21620941162109375, 0.2232666015625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 10.0, 16.0, 18.0, 18.0, 20.0, 30.0, 45.0, 53.0, 61.0, 99.0, 100.0, 105.0, 92.0, 65.0, 58.0, 42.0, 27.0, 25.0, 15.0, 16.0, 12.0, 13.0, 6.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033206939697265625, -0.003222554922103882, -0.003124415874481201, -0.0030262768268585205, -0.00292813777923584, -0.002829998731613159, -0.0027318596839904785, -0.002633720636367798, -0.002535581588745117, -0.0024374425411224365, -0.002339303493499756, -0.002241164445877075, -0.0021430253982543945, -0.002044886350631714, -0.0019467473030090332, -0.0018486082553863525, -0.0017504692077636719, -0.0016523301601409912, -0.0015541911125183105, -0.0014560520648956299, -0.0013579130172729492, -0.0012597739696502686, -0.0011616349220275879, -0.0010634958744049072, -0.0009653568267822266, -0.0008672177791595459, -0.0007690787315368652, -0.0006709396839141846, -0.0005728006362915039, -0.00047466158866882324, -0.0003765225410461426, -0.0002783834934234619, -0.00018024444580078125, -8.210539817810059e-05, 1.6033649444580078e-05, 0.00011417269706726074, 0.0002123117446899414, 0.00031045079231262207, 0.00040858983993530273, 0.0005067288875579834, 0.0006048679351806641, 0.0007030069828033447, 0.0008011460304260254, 0.0008992850780487061, 0.0009974241256713867, 0.0010955631732940674, 0.001193702220916748, 0.0012918412685394287, 0.0013899803161621094, 0.00148811936378479, 0.0015862584114074707, 0.0016843974590301514, 0.001782536506652832, 0.0018806755542755127, 0.0019788146018981934, 0.002076953649520874, 0.0021750926971435547, 0.0022732317447662354, 0.002371370792388916, 0.0024695098400115967, 0.0025676488876342773, 0.002665787935256958, 0.0027639269828796387, 0.0028620660305023193, 0.002960205078125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 17.0, 19.0, 21.0, 28.0, 31.0, 50.0, 72.0, 88.0, 131.0, 215.0, 286.0, 582.0, 236639.0, 808657.0, 696.0, 326.0, 200.0, 134.0, 83.0, 69.0, 53.0, 30.0, 25.0, 25.0, 12.0, 12.0, 9.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.060713768005371094, -0.05862236022949219, -0.05653095245361328, -0.054439544677734375, -0.05234813690185547, -0.05025672912597656, -0.048165321350097656, -0.04607391357421875, -0.043982505798339844, -0.04189109802246094, -0.03979969024658203, -0.037708282470703125, -0.03561687469482422, -0.03352546691894531, -0.031434059143066406, -0.0293426513671875, -0.027251243591308594, -0.025159835815429688, -0.02306842803955078, -0.020977020263671875, -0.01888561248779297, -0.016794204711914062, -0.014702796936035156, -0.01261138916015625, -0.010519981384277344, -0.008428573608398438, -0.006337165832519531, -0.004245758056640625, -0.0021543502807617188, -6.29425048828125e-05, 0.0020284652709960938, 0.004119873046875, 0.006211280822753906, 0.008302688598632812, 0.010394096374511719, 0.012485504150390625, 0.014576911926269531, 0.016668319702148438, 0.018759727478027344, 0.02085113525390625, 0.022942543029785156, 0.025033950805664062, 0.02712535858154297, 0.029216766357421875, 0.03130817413330078, 0.03339958190917969, 0.035490989685058594, 0.0375823974609375, 0.039673805236816406, 0.04176521301269531, 0.04385662078857422, 0.045948028564453125, 0.04803943634033203, 0.05013084411621094, 0.052222251892089844, 0.05431365966796875, 0.056405067443847656, 0.05849647521972656, 0.06058788299560547, 0.06267929077148438, 0.06477069854736328, 0.06686210632324219, 0.0689535140991211, 0.071044921875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1014.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003435449907556176, -0.002493355656042695, -0.0015512615209445357, -0.0006091673858463764, 0.0003329268656671047, 0.0012750208843499422, 0.0022171151358634233, 0.0031592093873769045, 0.004101303406059742, 0.005043397657573223, 0.005985491909086704, 0.006927586160600185, 0.007869680412113667, 0.008811773732304573, 0.009753867983818054, 0.010695962235331535, 0.011638057418167591, 0.012580151669681072, 0.013522245921194553, 0.014464340172708035, 0.015406434424221516, 0.016348527744412422, 0.017290621995925903, 0.018232716247439384, 0.019174810498952866, 0.020116904750466347, 0.021058999001979828, 0.02200109325349331, 0.02294318750500679, 0.02388528175652027, 0.024827376008033752, 0.025769470259547234, 0.026711562648415565, 0.027653656899929047, 0.028595751151442528, 0.02953784540295601, 0.03047993965446949, 0.03142203390598297, 0.0323641262948513, 0.033306222409009933, 0.034248314797878265, 0.0351904071867466, 0.03613250330090523, 0.03707459568977356, 0.03801669180393219, 0.03895878419280052, 0.03990088030695915, 0.040842972695827484, 0.041785068809986115, 0.042727161198854446, 0.04366925731301308, 0.04461134970188141, 0.04555344581604004, 0.04649553820490837, 0.047437634319067, 0.04837972670793533, 0.049321822822093964, 0.050263915210962296, 0.051206011325120926, 0.05214810371398926, 0.05309019982814789, 0.05403229221701622, 0.05497438833117485, 0.05591648072004318, 0.05685857683420181]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 12.0, 14.0, 25.0, 31.0, 47.0, 37.0, 59.0, 48.0, 62.0, 78.0, 65.0, 69.0, 74.0, 67.0, 47.0, 54.0, 49.0, 30.0, 27.0, 30.0, 23.0, 10.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0030438899993896484, -0.002973015420138836, -0.0029021408408880234, -0.002831266261637211, -0.0027603916823863983, -0.002689517103135586, -0.0026186425238847733, -0.0025477679446339607, -0.002476893365383148, -0.0024060187861323357, -0.002335144206881523, -0.0022642696276307106, -0.002193395048379898, -0.0021225204691290855, -0.002051645889878273, -0.0019807713106274605, -0.001909896731376648, -0.0018390221521258354, -0.0017681475728750229, -0.0016972729936242104, -0.0016263984143733978, -0.0015555238351225853, -0.0014846492558717728, -0.0014137746766209602, -0.0013429000973701477, -0.0012720255181193352, -0.0012011509388685226, -0.0011302763596177101, -0.0010594017803668976, -0.000988527201116085, -0.0009176526218652725, -0.00084677804261446, -0.0007759034633636475, -0.0007050288841128349, -0.0006341543048620224, -0.0005632797256112099, -0.0004924051463603973, -0.0004215305671095848, -0.0003506559878587723, -0.00027978140860795975, -0.00020890682935714722, -0.00013803225010633469, -6.715767085552216e-05, 3.7169083952903748e-06, 7.45914876461029e-05, 0.00014546606689691544, 0.00021634064614772797, 0.0002872152253985405, 0.00035808980464935303, 0.00042896438390016556, 0.0004998389631509781, 0.0005707135424017906, 0.0006415881216526031, 0.0007124627009034157, 0.0007833372801542282, 0.0008542118594050407, 0.0009250864386558533, 0.0009959610179066658, 0.0010668355971574783, 0.0011377101764082909, 0.0012085847556591034, 0.001279459334909916, 0.0013503339141607285, 0.001421208493411541, 0.0014920830726623535]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 5.0, 3.0, 14.0, 14.0, 8.0, 11.0, 15.0, 22.0, 19.0, 13.0, 17.0, 23.0, 22.0, 30.0, 30.0, 23.0, 37.0, 26.0, 31.0, 50.0, 29.0, 37.0, 37.0, 35.0, 37.0, 36.0, 31.0, 37.0, 32.0, 36.0, 38.0, 27.0, 22.0, 20.0, 18.0, 20.0, 10.0, 9.0, 8.0, 11.0, 13.0, 7.0, 8.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.578125, -2.496978759765625, -2.41583251953125, -2.334686279296875, -2.2535400390625, -2.172393798828125, -2.09124755859375, -2.010101318359375, -1.928955078125, -1.847808837890625, -1.76666259765625, -1.685516357421875, -1.6043701171875, -1.523223876953125, -1.44207763671875, -1.360931396484375, -1.27978515625, -1.198638916015625, -1.11749267578125, -1.036346435546875, -0.9552001953125, -0.874053955078125, -0.79290771484375, -0.711761474609375, -0.630615234375, -0.549468994140625, -0.46832275390625, -0.387176513671875, -0.3060302734375, -0.224884033203125, -0.14373779296875, -0.062591552734375, 0.0185546875, 0.099700927734375, 0.18084716796875, 0.261993408203125, 0.3431396484375, 0.424285888671875, 0.50543212890625, 0.586578369140625, 0.667724609375, 0.748870849609375, 0.83001708984375, 0.911163330078125, 0.9923095703125, 1.073455810546875, 1.15460205078125, 1.235748291015625, 1.31689453125, 1.398040771484375, 1.47918701171875, 1.560333251953125, 1.6414794921875, 1.722625732421875, 1.80377197265625, 1.884918212890625, 1.966064453125, 2.047210693359375, 2.12835693359375, 2.209503173828125, 2.2906494140625, 2.371795654296875, 2.45294189453125, 2.534088134765625, 2.615234375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 20.0, 21.0, 19.0, 29.0, 37.0, 67.0, 75.0, 84.0, 119.0, 169.0, 268.0, 323.0, 444.0, 637.0, 905.0, 1319.0, 1971.0, 3103.0, 4794.0, 8179.0, 15893.0, 46661.0, 428736.0, 447634.0, 48069.0, 16024.0, 8289.0, 4848.0, 3108.0, 2085.0, 1329.0, 959.0, 646.0, 445.0, 296.0, 253.0, 177.0, 118.0, 93.0, 68.0, 43.0, 46.0, 32.0, 29.0, 21.0, 13.0, 10.0, 9.0, 11.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-13.3359375, -12.9193115234375, -12.502685546875, -12.0860595703125, -11.66943359375, -11.2528076171875, -10.836181640625, -10.4195556640625, -10.0029296875, -9.5863037109375, -9.169677734375, -8.7530517578125, -8.33642578125, -7.9197998046875, -7.503173828125, -7.0865478515625, -6.669921875, -6.2532958984375, -5.836669921875, -5.4200439453125, -5.00341796875, -4.5867919921875, -4.170166015625, -3.7535400390625, -3.3369140625, -2.9202880859375, -2.503662109375, -2.0870361328125, -1.67041015625, -1.2537841796875, -0.837158203125, -0.4205322265625, -0.00390625, 0.4127197265625, 0.829345703125, 1.2459716796875, 1.66259765625, 2.0792236328125, 2.495849609375, 2.9124755859375, 3.3291015625, 3.7457275390625, 4.162353515625, 4.5789794921875, 4.99560546875, 5.4122314453125, 5.828857421875, 6.2454833984375, 6.662109375, 7.0787353515625, 7.495361328125, 7.9119873046875, 8.32861328125, 8.7452392578125, 9.161865234375, 9.5784912109375, 9.9951171875, 10.4117431640625, 10.828369140625, 11.2449951171875, 11.66162109375, 12.0782470703125, 12.494873046875, 12.9114990234375, 13.328125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 1.0, 7.0, 11.0, 15.0, 16.0, 19.0, 15.0, 21.0, 24.0, 29.0, 29.0, 42.0, 40.0, 72.0, 67.0, 93.0, 175.0, 1487.0, 307.0, 133.0, 98.0, 57.0, 28.0, 42.0, 43.0, 35.0, 19.0, 21.0, 19.0, 20.0, 20.0, 13.0, 10.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.131591796875, -10.80224609375, -10.472900390625, -10.1435546875, -9.814208984375, -9.48486328125, -9.155517578125, -8.826171875, -8.496826171875, -8.16748046875, -7.838134765625, -7.5087890625, -7.179443359375, -6.85009765625, -6.520751953125, -6.19140625, -5.862060546875, -5.53271484375, -5.203369140625, -4.8740234375, -4.544677734375, -4.21533203125, -3.885986328125, -3.556640625, -3.227294921875, -2.89794921875, -2.568603515625, -2.2392578125, -1.909912109375, -1.58056640625, -1.251220703125, -0.921875, -0.592529296875, -0.26318359375, 0.066162109375, 0.3955078125, 0.724853515625, 1.05419921875, 1.383544921875, 1.712890625, 2.042236328125, 2.37158203125, 2.700927734375, 3.0302734375, 3.359619140625, 3.68896484375, 4.018310546875, 4.34765625, 4.677001953125, 5.00634765625, 5.335693359375, 5.6650390625, 5.994384765625, 6.32373046875, 6.653076171875, 6.982421875, 7.311767578125, 7.64111328125, 7.970458984375, 8.2998046875, 8.629150390625, 8.95849609375, 9.287841796875, 9.6171875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 11.0, 12.0, 19.0, 18.0, 18.0, 22.0, 37.0, 32.0, 50.0, 58.0, 115.0, 299.0, 1476.0, 223363.0, 2916740.0, 2435.0, 441.0, 181.0, 82.0, 51.0, 33.0, 34.0, 36.0, 21.0, 15.0, 16.0, 16.0, 15.0, 15.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.6142578125, -40.134765625, -38.6552734375, -37.17578125, -35.6962890625, -34.216796875, -32.7373046875, -31.2578125, -29.7783203125, -28.298828125, -26.8193359375, -25.33984375, -23.8603515625, -22.380859375, -20.9013671875, -19.421875, -17.9423828125, -16.462890625, -14.9833984375, -13.50390625, -12.0244140625, -10.544921875, -9.0654296875, -7.5859375, -6.1064453125, -4.626953125, -3.1474609375, -1.66796875, -0.1884765625, 1.291015625, 2.7705078125, 4.25, 5.7294921875, 7.208984375, 8.6884765625, 10.16796875, 11.6474609375, 13.126953125, 14.6064453125, 16.0859375, 17.5654296875, 19.044921875, 20.5244140625, 22.00390625, 23.4833984375, 24.962890625, 26.4423828125, 27.921875, 29.4013671875, 30.880859375, 32.3603515625, 33.83984375, 35.3193359375, 36.798828125, 38.2783203125, 39.7578125, 41.2373046875, 42.716796875, 44.1962890625, 45.67578125, 47.1552734375, 48.634765625, 50.1142578125, 51.59375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 222.0, 789.0, 6.0, 1.0], "bins": [-255.08868408203125, -250.92105102539062, -246.75341796875, -242.58578491210938, -238.41815185546875, -234.25051879882812, -230.0828857421875, -225.91525268554688, -221.74761962890625, -217.57998657226562, -213.412353515625, -209.24472045898438, -205.07708740234375, -200.90945434570312, -196.7418212890625, -192.57418823242188, -188.4065399169922, -184.23890686035156, -180.07127380371094, -175.9036407470703, -171.7360076904297, -167.56837463378906, -163.40074157714844, -159.23309326171875, -155.06546020507812, -150.8978271484375, -146.73019409179688, -142.56256103515625, -138.39492797851562, -134.227294921875, -130.05966186523438, -125.89202117919922, -121.72441101074219, -117.55677795410156, -113.38914489746094, -109.22151184082031, -105.05387878417969, -100.88624572753906, -96.7186050415039, -92.55097198486328, -88.38333892822266, -84.21570587158203, -80.0480728149414, -75.88043975830078, -71.71279907226562, -67.545166015625, -63.377532958984375, -59.20989990234375, -55.04226303100586, -50.874629974365234, -46.706993103027344, -42.53936004638672, -38.371726989746094, -34.20409393310547, -30.03645896911621, -25.868824005126953, -21.701190948486328, -17.533557891845703, -13.365922927856445, -9.198288917541504, -5.0306549072265625, -0.8630218505859375, 3.3046131134033203, 7.472248077392578, 11.639880180358887]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 5.0, 9.0, 10.0, 9.0, 11.0, 20.0, 21.0, 17.0, 22.0, 26.0, 24.0, 30.0, 39.0, 37.0, 27.0, 44.0, 43.0, 38.0, 40.0, 43.0, 55.0, 43.0, 32.0, 40.0, 31.0, 38.0, 24.0, 30.0, 30.0, 21.0, 30.0, 18.0, 18.0, 13.0, 11.0, 13.0, 11.0, 6.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.167083740234375, -26.251102447509766, -25.33512306213379, -24.41914176940918, -23.503162384033203, -22.587181091308594, -21.671199798583984, -20.755220413208008, -19.83924102783203, -18.923259735107422, -18.007280349731445, -17.091299057006836, -16.17531967163086, -15.25933837890625, -14.343358039855957, -13.427377700805664, -12.511396408081055, -11.595416069030762, -10.679435729980469, -9.76345443725586, -8.847475051879883, -7.931494235992432, -7.0155134201049805, -6.0995330810546875, -5.1835527420043945, -4.267572402954102, -3.3515918254852295, -2.4356112480163574, -1.5196309089660645, -0.6036505699157715, 0.3123302459716797, 1.2283105850219727, 2.1442909240722656, 3.0602712631225586, 3.9762518405914307, 4.892232418060303, 5.808212757110596, 6.724193096160889, 7.64017391204834, 8.556154251098633, 9.472134590148926, 10.388114929199219, 11.304095268249512, 12.220075607299805, 13.136056900024414, 14.05203628540039, 14.968017578125, 15.883997917175293, 16.799978256225586, 17.715959548950195, 18.631938934326172, 19.54792022705078, 20.463899612426758, 21.379880905151367, 22.295860290527344, 23.211841583251953, 24.127822875976562, 25.043804168701172, 25.95978355407715, 26.875764846801758, 27.791744232177734, 28.707725524902344, 29.623706817626953, 30.53968620300293, 31.455665588378906]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 6.0, 2.0, 6.0, 6.0, 10.0, 10.0, 14.0, 20.0, 17.0, 15.0, 11.0, 25.0, 17.0, 22.0, 16.0, 25.0, 31.0, 30.0, 36.0, 38.0, 41.0, 25.0, 43.0, 43.0, 32.0, 35.0, 40.0, 30.0, 38.0, 40.0, 33.0, 32.0, 33.0, 32.0, 13.0, 21.0, 15.0, 20.0, 12.0, 10.0, 15.0, 7.0, 9.0, 5.0, 7.0, 4.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.787109375, -2.6983642578125, -2.609619140625, -2.5208740234375, -2.43212890625, -2.3433837890625, -2.254638671875, -2.1658935546875, -2.0771484375, -1.9884033203125, -1.899658203125, -1.8109130859375, -1.72216796875, -1.6334228515625, -1.544677734375, -1.4559326171875, -1.3671875, -1.2784423828125, -1.189697265625, -1.1009521484375, -1.01220703125, -0.9234619140625, -0.834716796875, -0.7459716796875, -0.6572265625, -0.5684814453125, -0.479736328125, -0.3909912109375, -0.30224609375, -0.2135009765625, -0.124755859375, -0.0360107421875, 0.052734375, 0.1414794921875, 0.230224609375, 0.3189697265625, 0.40771484375, 0.4964599609375, 0.585205078125, 0.6739501953125, 0.7626953125, 0.8514404296875, 0.940185546875, 1.0289306640625, 1.11767578125, 1.2064208984375, 1.295166015625, 1.3839111328125, 1.47265625, 1.5614013671875, 1.650146484375, 1.7388916015625, 1.82763671875, 1.9163818359375, 2.005126953125, 2.0938720703125, 2.1826171875, 2.2713623046875, 2.360107421875, 2.4488525390625, 2.53759765625, 2.6263427734375, 2.715087890625, 2.8038330078125, 2.892578125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 8.0, 11.0, 7.0, 7.0, 11.0, 21.0, 19.0, 29.0, 38.0, 51.0, 56.0, 68.0, 123.0, 140.0, 202.0, 305.0, 455.0, 775.0, 1378.0, 2558.0, 5626.0, 13864.0, 46229.0, 244297.0, 2517547.0, 1193416.0, 119457.0, 28417.0, 9725.0, 4197.0, 2081.0, 1128.0, 620.0, 411.0, 263.0, 201.0, 140.0, 102.0, 71.0, 55.0, 43.0, 26.0, 22.0, 16.0, 15.0, 12.0, 9.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-13.15625, -12.74267578125, -12.3291015625, -11.91552734375, -11.501953125, -11.08837890625, -10.6748046875, -10.26123046875, -9.84765625, -9.43408203125, -9.0205078125, -8.60693359375, -8.193359375, -7.77978515625, -7.3662109375, -6.95263671875, -6.5390625, -6.12548828125, -5.7119140625, -5.29833984375, -4.884765625, -4.47119140625, -4.0576171875, -3.64404296875, -3.23046875, -2.81689453125, -2.4033203125, -1.98974609375, -1.576171875, -1.16259765625, -0.7490234375, -0.33544921875, 0.078125, 0.49169921875, 0.9052734375, 1.31884765625, 1.732421875, 2.14599609375, 2.5595703125, 2.97314453125, 3.38671875, 3.80029296875, 4.2138671875, 4.62744140625, 5.041015625, 5.45458984375, 5.8681640625, 6.28173828125, 6.6953125, 7.10888671875, 7.5224609375, 7.93603515625, 8.349609375, 8.76318359375, 9.1767578125, 9.59033203125, 10.00390625, 10.41748046875, 10.8310546875, 11.24462890625, 11.658203125, 12.07177734375, 12.4853515625, 12.89892578125, 13.3125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 13.0, 13.0, 25.0, 41.0, 60.0, 71.0, 119.0, 179.0, 226.0, 370.0, 506.0, 647.0, 586.0, 394.0, 292.0, 177.0, 131.0, 69.0, 42.0, 34.0, 35.0, 14.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.681884765625, -20.16064453125, -19.639404296875, -19.1181640625, -18.596923828125, -18.07568359375, -17.554443359375, -17.033203125, -16.511962890625, -15.99072265625, -15.469482421875, -14.9482421875, -14.427001953125, -13.90576171875, -13.384521484375, -12.86328125, -12.342041015625, -11.82080078125, -11.299560546875, -10.7783203125, -10.257080078125, -9.73583984375, -9.214599609375, -8.693359375, -8.172119140625, -7.65087890625, -7.129638671875, -6.6083984375, -6.087158203125, -5.56591796875, -5.044677734375, -4.5234375, -4.002197265625, -3.48095703125, -2.959716796875, -2.4384765625, -1.917236328125, -1.39599609375, -0.874755859375, -0.353515625, 0.167724609375, 0.68896484375, 1.210205078125, 1.7314453125, 2.252685546875, 2.77392578125, 3.295166015625, 3.81640625, 4.337646484375, 4.85888671875, 5.380126953125, 5.9013671875, 6.422607421875, 6.94384765625, 7.465087890625, 7.986328125, 8.507568359375, 9.02880859375, 9.550048828125, 10.0712890625, 10.592529296875, 11.11376953125, 11.635009765625, 12.15625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 10.0, 9.0, 22.0, 30.0, 53.0, 89.0, 192.0, 407.0, 1831.0, 632291.0, 3554908.0, 3256.0, 611.0, 239.0, 136.0, 70.0, 40.0, 31.0, 15.0, 20.0, 11.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5, -49.888671875, -47.27734375, -44.666015625, -42.0546875, -39.443359375, -36.83203125, -34.220703125, -31.609375, -28.998046875, -26.38671875, -23.775390625, -21.1640625, -18.552734375, -15.94140625, -13.330078125, -10.71875, -8.107421875, -5.49609375, -2.884765625, -0.2734375, 2.337890625, 4.94921875, 7.560546875, 10.171875, 12.783203125, 15.39453125, 18.005859375, 20.6171875, 23.228515625, 25.83984375, 28.451171875, 31.0625, 33.673828125, 36.28515625, 38.896484375, 41.5078125, 44.119140625, 46.73046875, 49.341796875, 51.953125, 54.564453125, 57.17578125, 59.787109375, 62.3984375, 65.009765625, 67.62109375, 70.232421875, 72.84375, 75.455078125, 78.06640625, 80.677734375, 83.2890625, 85.900390625, 88.51171875, 91.123046875, 93.734375, 96.345703125, 98.95703125, 101.568359375, 104.1796875, 106.791015625, 109.40234375, 112.013671875, 114.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 38.0, 122.0, 317.0, 327.0, 153.0, 43.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.57981872558594, -143.98806762695312, -140.3963165283203, -136.8045654296875, -133.2128143310547, -129.62106323242188, -126.02931213378906, -122.43756103515625, -118.84580993652344, -115.25405883789062, -111.66230773925781, -108.070556640625, -104.47880554199219, -100.88705444335938, -97.29530334472656, -93.70355224609375, -90.11180877685547, -86.52005767822266, -82.92830657958984, -79.33655548095703, -75.74480438232422, -72.1530532836914, -68.56130981445312, -64.96955871582031, -61.377803802490234, -57.78605270385742, -54.19430160522461, -50.60255432128906, -47.01080322265625, -43.41905212402344, -39.827301025390625, -36.23554992675781, -32.64380645751953, -29.05205535888672, -25.460304260253906, -21.868555068969727, -18.276803970336914, -14.685052871704102, -11.093303680419922, -7.501552581787109, -3.909801483154297, -0.3180508613586426, 3.2736997604370117, 6.865449905395508, 10.45720100402832, 14.048952102661133, 17.640701293945312, 21.232452392578125, 24.824203491210938, 28.41595458984375, 32.00770568847656, 35.599456787109375, 39.19120788574219, 42.782958984375, 46.37470626831055, 49.96645736694336, 53.55820846557617, 57.149959564208984, 60.7417106628418, 64.33345794677734, 67.92520904541016, 71.51696014404297, 75.10871124267578, 78.7004623413086, 82.2922134399414]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 3.0, 9.0, 7.0, 7.0, 16.0, 14.0, 18.0, 19.0, 14.0, 25.0, 18.0, 22.0, 29.0, 25.0, 21.0, 55.0, 31.0, 35.0, 42.0, 42.0, 37.0, 38.0, 35.0, 32.0, 37.0, 41.0, 42.0, 25.0, 28.0, 24.0, 31.0, 29.0, 31.0, 14.0, 14.0, 15.0, 10.0, 14.0, 8.0, 13.0, 6.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.5201416015625, -44.14002990722656, -42.75992202758789, -41.37981414794922, -39.99970245361328, -38.619590759277344, -37.23948287963867, -35.859375, -34.47926330566406, -33.099151611328125, -31.719043731689453, -30.33893394470215, -28.958824157714844, -27.57871437072754, -26.198604583740234, -24.81849479675293, -23.438385009765625, -22.05827522277832, -20.678165435791016, -19.29805564880371, -17.917945861816406, -16.5378360748291, -15.157726287841797, -13.777616500854492, -12.397506713867188, -11.017396926879883, -9.637287139892578, -8.257177352905273, -6.877067565917969, -5.496957778930664, -4.116847991943359, -2.7367382049560547, -1.35662841796875, 0.023481369018554688, 1.4035911560058594, 2.783700942993164, 4.163810729980469, 5.543920516967773, 6.924030303955078, 8.304140090942383, 9.684249877929688, 11.064359664916992, 12.444469451904297, 13.824579238891602, 15.204689025878906, 16.58479881286621, 17.964908599853516, 19.34501838684082, 20.725128173828125, 22.10523796081543, 23.485347747802734, 24.86545753479004, 26.245567321777344, 27.62567710876465, 29.005786895751953, 30.385896682739258, 31.766006469726562, 33.1461181640625, 34.52622604370117, 35.906333923339844, 37.28644561767578, 38.66655731201172, 40.04666519165039, 41.42677307128906, 42.806884765625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 3.0, 7.0, 8.0, 11.0, 8.0, 16.0, 12.0, 17.0, 17.0, 19.0, 20.0, 26.0, 40.0, 23.0, 39.0, 32.0, 37.0, 44.0, 45.0, 36.0, 43.0, 42.0, 35.0, 36.0, 25.0, 45.0, 36.0, 32.0, 30.0, 36.0, 29.0, 25.0, 19.0, 19.0, 16.0, 17.0, 14.0, 6.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.7310791015625, -2.632080078125, -2.5330810546875, -2.43408203125, -2.3350830078125, -2.236083984375, -2.1370849609375, -2.0380859375, -1.9390869140625, -1.840087890625, -1.7410888671875, -1.64208984375, -1.5430908203125, -1.444091796875, -1.3450927734375, -1.24609375, -1.1470947265625, -1.048095703125, -0.9490966796875, -0.85009765625, -0.7510986328125, -0.652099609375, -0.5531005859375, -0.4541015625, -0.3551025390625, -0.256103515625, -0.1571044921875, -0.05810546875, 0.0408935546875, 0.139892578125, 0.2388916015625, 0.337890625, 0.4368896484375, 0.535888671875, 0.6348876953125, 0.73388671875, 0.8328857421875, 0.931884765625, 1.0308837890625, 1.1298828125, 1.2288818359375, 1.327880859375, 1.4268798828125, 1.52587890625, 1.6248779296875, 1.723876953125, 1.8228759765625, 1.921875, 2.0208740234375, 2.119873046875, 2.2188720703125, 2.31787109375, 2.4168701171875, 2.515869140625, 2.6148681640625, 2.7138671875, 2.8128662109375, 2.911865234375, 3.0108642578125, 3.10986328125, 3.2088623046875, 3.307861328125, 3.4068603515625, 3.505859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 7.0, 11.0, 23.0, 24.0, 47.0, 63.0, 84.0, 128.0, 157.0, 295.0, 506.0, 724.0, 1187.0, 1949.0, 3185.0, 5290.0, 8806.0, 14929.0, 24821.0, 42556.0, 72856.0, 120541.0, 177031.0, 198983.0, 147241.0, 93294.0, 54634.0, 31969.0, 18987.0, 11025.0, 6735.0, 3957.0, 2505.0, 1444.0, 921.0, 586.0, 364.0, 232.0, 137.0, 119.0, 68.0, 47.0, 27.0, 14.0, 17.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3442039489746094, -0.33318328857421875, -0.3221626281738281, -0.3111419677734375, -0.3001213073730469, -0.28910064697265625, -0.2780799865722656, -0.267059326171875, -0.2560386657714844, -0.24501800537109375, -0.23399734497070312, -0.2229766845703125, -0.21195602416992188, -0.20093536376953125, -0.18991470336914062, -0.17889404296875, -0.16787338256835938, -0.15685272216796875, -0.14583206176757812, -0.1348114013671875, -0.12379074096679688, -0.11277008056640625, -0.10174942016601562, -0.090728759765625, -0.07970809936523438, -0.06868743896484375, -0.057666778564453125, -0.0466461181640625, -0.035625457763671875, -0.02460479736328125, -0.013584136962890625, -0.0025634765625, 0.008457183837890625, 0.01947784423828125, 0.030498504638671875, 0.0415191650390625, 0.052539825439453125, 0.06356048583984375, 0.07458114624023438, 0.085601806640625, 0.09662246704101562, 0.10764312744140625, 0.11866378784179688, 0.1296844482421875, 0.14070510864257812, 0.15172576904296875, 0.16274642944335938, 0.17376708984375, 0.18478775024414062, 0.19580841064453125, 0.20682907104492188, 0.2178497314453125, 0.22887039184570312, 0.23989105224609375, 0.2509117126464844, 0.261932373046875, 0.2729530334472656, 0.28397369384765625, 0.2949943542480469, 0.3060150146484375, 0.3170356750488281, 0.32805633544921875, 0.3390769958496094, 0.35009765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 4.0, 6.0, 10.0, 9.0, 11.0, 11.0, 24.0, 23.0, 13.0, 24.0, 27.0, 22.0, 41.0, 32.0, 31.0, 30.0, 42.0, 45.0, 35.0, 32.0, 1072.0, 41.0, 38.0, 37.0, 37.0, 36.0, 34.0, 36.0, 24.0, 27.0, 27.0, 19.0, 16.0, 13.0, 25.0, 15.0, 7.0, 12.0, 4.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.2578125, -2.1920928955078125, -2.126373291015625, -2.0606536865234375, -1.99493408203125, -1.9292144775390625, -1.863494873046875, -1.7977752685546875, -1.7320556640625, -1.6663360595703125, -1.600616455078125, -1.5348968505859375, -1.46917724609375, -1.4034576416015625, -1.337738037109375, -1.2720184326171875, -1.206298828125, -1.1405792236328125, -1.074859619140625, -1.0091400146484375, -0.94342041015625, -0.8777008056640625, -0.811981201171875, -0.7462615966796875, -0.6805419921875, -0.6148223876953125, -0.549102783203125, -0.4833831787109375, -0.41766357421875, -0.3519439697265625, -0.286224365234375, -0.2205047607421875, -0.15478515625, -0.0890655517578125, -0.023345947265625, 0.0423736572265625, 0.10809326171875, 0.1738128662109375, 0.239532470703125, 0.3052520751953125, 0.3709716796875, 0.4366912841796875, 0.502410888671875, 0.5681304931640625, 0.63385009765625, 0.6995697021484375, 0.765289306640625, 0.8310089111328125, 0.896728515625, 0.9624481201171875, 1.028167724609375, 1.0938873291015625, 1.15960693359375, 1.2253265380859375, 1.291046142578125, 1.3567657470703125, 1.4224853515625, 1.4882049560546875, 1.553924560546875, 1.6196441650390625, 1.68536376953125, 1.7510833740234375, 1.816802978515625, 1.8825225830078125, 1.9482421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 33.0, 35.0, 77.0, 98.0, 170.0, 247.0, 345.0, 483.0, 717.0, 953.0, 1462.0, 2170.0, 3054.0, 4441.0, 6584.0, 9438.0, 13686.0, 20246.0, 29339.0, 42698.0, 60178.0, 82444.0, 106177.0, 160178.0, 1137624.0, 111879.0, 88215.0, 65139.0, 46561.0, 32240.0, 22117.0, 15087.0, 10263.0, 7053.0, 5035.0, 3302.0, 2240.0, 1615.0, 1098.0, 771.0, 519.0, 361.0, 251.0, 180.0, 127.0, 62.0, 40.0, 31.0, 24.0, 12.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1912841796875, -0.18532752990722656, -0.17937088012695312, -0.1734142303466797, -0.16745758056640625, -0.1615009307861328, -0.15554428100585938, -0.14958763122558594, -0.1436309814453125, -0.13767433166503906, -0.13171768188476562, -0.1257610321044922, -0.11980438232421875, -0.11384773254394531, -0.10789108276367188, -0.10193443298339844, -0.095977783203125, -0.09002113342285156, -0.08406448364257812, -0.07810783386230469, -0.07215118408203125, -0.06619453430175781, -0.060237884521484375, -0.05428123474121094, -0.0483245849609375, -0.04236793518066406, -0.036411285400390625, -0.030454635620117188, -0.02449798583984375, -0.018541336059570312, -0.012584686279296875, -0.0066280364990234375, -0.00067138671875, 0.0052852630615234375, 0.011241912841796875, 0.017198562622070312, 0.02315521240234375, 0.029111862182617188, 0.035068511962890625, 0.04102516174316406, 0.0469818115234375, 0.05293846130371094, 0.058895111083984375, 0.06485176086425781, 0.07080841064453125, 0.07676506042480469, 0.08272171020507812, 0.08867835998535156, 0.094635009765625, 0.10059165954589844, 0.10654830932617188, 0.11250495910644531, 0.11846160888671875, 0.12441825866699219, 0.13037490844726562, 0.13633155822753906, 0.1422882080078125, 0.14824485778808594, 0.15420150756835938, 0.1601581573486328, 0.16611480712890625, 0.1720714569091797, 0.17802810668945312, 0.18398475646972656, 0.18994140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 3.0, 8.0, 7.0, 11.0, 7.0, 8.0, 11.0, 15.0, 28.0, 31.0, 29.0, 34.0, 49.0, 53.0, 64.0, 66.0, 87.0, 56.0, 67.0, 45.0, 46.0, 53.0, 39.0, 29.0, 27.0, 20.0, 14.0, 16.0, 10.0, 13.0, 15.0, 9.0, 2.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00189208984375, -0.001834481954574585, -0.00177687406539917, -0.0017192661762237549, -0.0016616582870483398, -0.0016040503978729248, -0.0015464425086975098, -0.0014888346195220947, -0.0014312267303466797, -0.0013736188411712646, -0.0013160109519958496, -0.0012584030628204346, -0.0012007951736450195, -0.0011431872844696045, -0.0010855793952941895, -0.0010279715061187744, -0.0009703636169433594, -0.0009127557277679443, -0.0008551478385925293, -0.0007975399494171143, -0.0007399320602416992, -0.0006823241710662842, -0.0006247162818908691, -0.0005671083927154541, -0.0005095005035400391, -0.000451892614364624, -0.000394284725189209, -0.00033667683601379395, -0.0002790689468383789, -0.00022146105766296387, -0.00016385316848754883, -0.00010624527931213379, -4.863739013671875e-05, 8.970499038696289e-06, 6.657838821411133e-05, 0.00012418627738952637, 0.0001817941665649414, 0.00023940205574035645, 0.0002970099449157715, 0.0003546178340911865, 0.00041222572326660156, 0.0004698336124420166, 0.0005274415016174316, 0.0005850493907928467, 0.0006426572799682617, 0.0007002651691436768, 0.0007578730583190918, 0.0008154809474945068, 0.0008730888366699219, 0.0009306967258453369, 0.000988304615020752, 0.001045912504196167, 0.001103520393371582, 0.001161128282546997, 0.0012187361717224121, 0.0012763440608978271, 0.0013339519500732422, 0.0013915598392486572, 0.0014491677284240723, 0.0015067756175994873, 0.0015643835067749023, 0.0016219913959503174, 0.0016795992851257324, 0.0017372071743011475, 0.0017948150634765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 11.0, 7.0, 18.0, 17.0, 20.0, 26.0, 35.0, 40.0, 70.0, 99.0, 130.0, 133.0, 221.0, 403.0, 1062.0, 640937.0, 403129.0, 927.0, 387.0, 219.0, 157.0, 120.0, 82.0, 77.0, 52.0, 39.0, 22.0, 23.0, 8.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0408935546875, -0.03969001770019531, -0.038486480712890625, -0.03728294372558594, -0.03607940673828125, -0.03487586975097656, -0.033672332763671875, -0.03246879577636719, -0.0312652587890625, -0.030061721801757812, -0.028858184814453125, -0.027654647827148438, -0.02645111083984375, -0.025247573852539062, -0.024044036865234375, -0.022840499877929688, -0.021636962890625, -0.020433425903320312, -0.019229888916015625, -0.018026351928710938, -0.01682281494140625, -0.015619277954101562, -0.014415740966796875, -0.013212203979492188, -0.0120086669921875, -0.010805130004882812, -0.009601593017578125, -0.008398056030273438, -0.00719451904296875, -0.0059909820556640625, -0.004787445068359375, -0.0035839080810546875, -0.00238037109375, -0.0011768341064453125, 2.6702880859375e-05, 0.0012302398681640625, 0.00243377685546875, 0.0036373138427734375, 0.004840850830078125, 0.0060443878173828125, 0.0072479248046875, 0.008451461791992188, 0.009654998779296875, 0.010858535766601562, 0.01206207275390625, 0.013265609741210938, 0.014469146728515625, 0.015672683715820312, 0.016876220703125, 0.018079757690429688, 0.019283294677734375, 0.020486831665039062, 0.02169036865234375, 0.022893905639648438, 0.024097442626953125, 0.025300979614257812, 0.0265045166015625, 0.027708053588867188, 0.028911590576171875, 0.030115127563476562, 0.03131866455078125, 0.03252220153808594, 0.033725738525390625, 0.03492927551269531, 0.0361328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 680.0, 336.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014875168912112713, -0.014461212791502476, -0.014047256670892239, -0.013633300550282001, -0.013219344429671764, -0.012805388309061527, -0.01239143218845129, -0.011977476067841053, -0.011563519947230816, -0.011149563826620579, -0.010735607706010342, -0.010321651585400105, -0.009907695464789867, -0.00949373934417963, -0.009079783223569393, -0.008665827102959156, -0.008251871913671494, -0.007837915793061256, -0.007423959672451019, -0.007010003551840782, -0.006596047431230545, -0.006182091310620308, -0.005768135190010071, -0.005354179069399834, -0.0049402229487895966, -0.0045262668281793594, -0.004112310707569122, -0.003698354586958885, -0.003284398466348648, -0.0028704425785690546, -0.0024564864579588175, -0.0020425303373485804, -0.0016285739839076996, -0.0012146178632974625, -0.0008006618008948863, -0.00038670573849231005, 2.7250382117927074e-05, 0.00044120638631284237, 0.0008551625069230795, 0.0012691186275333166, 0.0016830747481435537, 0.002097030868753791, 0.002510986989364028, 0.0029249428771436214, 0.0033388989977538586, 0.0037528551183640957, 0.004166811238974333, 0.00458076735958457, 0.004994723480194807, 0.005408679600805044, 0.005822635721415281, 0.006236591842025518, 0.0066505479626357555, 0.007064503617584705, 0.0074784597381949425, 0.00789241585880518, 0.008306371979415417, 0.008720328100025654, 0.009134284220635891, 0.009548240341246128, 0.009962196461856365, 0.010376152582466602, 0.01079010870307684, 0.011204064823687077, 0.011618020944297314]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 17.0, 12.0, 13.0, 14.0, 17.0, 17.0, 27.0, 20.0, 18.0, 29.0, 36.0, 27.0, 35.0, 28.0, 45.0, 46.0, 43.0, 40.0, 46.0, 41.0, 51.0, 38.0, 43.0, 44.0, 33.0, 36.0, 26.0, 21.0, 20.0, 23.0, 21.0, 12.0, 9.0, 9.0, 7.0, 4.0, 6.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009607076644897461, -0.0009289132431149483, -0.0008971188217401505, -0.0008653244003653526, -0.0008335299789905548, -0.000801735557615757, -0.0007699411362409592, -0.0007381467148661613, -0.0007063522934913635, -0.0006745578721165657, -0.0006427634507417679, -0.0006109690293669701, -0.0005791746079921722, -0.0005473801866173744, -0.0005155857652425766, -0.0004837913438677788, -0.00045199692249298096, -0.00042020250111818314, -0.0003884080797433853, -0.0003566136583685875, -0.00032481923699378967, -0.00029302481561899185, -0.00026123039424419403, -0.0002294359728693962, -0.0001976415514945984, -0.00016584713011980057, -0.00013405270874500275, -0.00010225828737020493, -7.04638659954071e-05, -3.8669444620609283e-05, -6.875023245811462e-06, 2.491939812898636e-05, 5.671381950378418e-05, 8.8508240878582e-05, 0.00012030266225337982, 0.00015209708362817764, 0.00018389150500297546, 0.00021568592637777328, 0.0002474803477525711, 0.0002792747691273689, 0.00031106919050216675, 0.00034286361187696457, 0.0003746580332517624, 0.0004064524546265602, 0.00043824687600135803, 0.00047004129737615585, 0.0005018357187509537, 0.0005336301401257515, 0.0005654245615005493, 0.0005972189828753471, 0.000629013404250145, 0.0006608078256249428, 0.0006926022469997406, 0.0007243966683745384, 0.0007561910897493362, 0.0007879855111241341, 0.0008197799324989319, 0.0008515743538737297, 0.0008833687752485275, 0.0009151631966233253, 0.0009469576179981232, 0.000978752039372921, 0.0010105464607477188, 0.0010423408821225166, 0.0010741353034973145]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 3.0, 7.0, 8.0, 11.0, 8.0, 16.0, 12.0, 17.0, 17.0, 19.0, 20.0, 26.0, 40.0, 23.0, 39.0, 32.0, 37.0, 44.0, 45.0, 36.0, 43.0, 42.0, 35.0, 36.0, 25.0, 45.0, 36.0, 32.0, 30.0, 36.0, 29.0, 25.0, 19.0, 19.0, 16.0, 17.0, 14.0, 6.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.7310791015625, -2.632080078125, -2.5330810546875, -2.43408203125, -2.3350830078125, -2.236083984375, -2.1370849609375, -2.0380859375, -1.9390869140625, -1.840087890625, -1.7410888671875, -1.64208984375, -1.5430908203125, -1.444091796875, -1.3450927734375, -1.24609375, -1.1470947265625, -1.048095703125, -0.9490966796875, -0.85009765625, -0.7510986328125, -0.652099609375, -0.5531005859375, -0.4541015625, -0.3551025390625, -0.256103515625, -0.1571044921875, -0.05810546875, 0.0408935546875, 0.139892578125, 0.2388916015625, 0.337890625, 0.4368896484375, 0.535888671875, 0.6348876953125, 0.73388671875, 0.8328857421875, 0.931884765625, 1.0308837890625, 1.1298828125, 1.2288818359375, 1.327880859375, 1.4268798828125, 1.52587890625, 1.6248779296875, 1.723876953125, 1.8228759765625, 1.921875, 2.0208740234375, 2.119873046875, 2.2188720703125, 2.31787109375, 2.4168701171875, 2.515869140625, 2.6148681640625, 2.7138671875, 2.8128662109375, 2.911865234375, 3.0108642578125, 3.10986328125, 3.2088623046875, 3.307861328125, 3.4068603515625, 3.505859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 13.0, 5.0, 20.0, 22.0, 29.0, 37.0, 60.0, 81.0, 103.0, 127.0, 194.0, 283.0, 391.0, 681.0, 1263.0, 2626.0, 6075.0, 15959.0, 45801.0, 140646.0, 380531.0, 298963.0, 99846.0, 33083.0, 12030.0, 4722.0, 2082.0, 1002.0, 628.0, 370.0, 255.0, 191.0, 132.0, 79.0, 67.0, 49.0, 25.0, 23.0, 17.0, 12.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.807403564453125, -2.70660400390625, -2.605804443359375, -2.5050048828125, -2.404205322265625, -2.30340576171875, -2.202606201171875, -2.101806640625, -2.001007080078125, -1.90020751953125, -1.799407958984375, -1.6986083984375, -1.597808837890625, -1.49700927734375, -1.396209716796875, -1.29541015625, -1.194610595703125, -1.09381103515625, -0.993011474609375, -0.8922119140625, -0.791412353515625, -0.69061279296875, -0.589813232421875, -0.489013671875, -0.388214111328125, -0.28741455078125, -0.186614990234375, -0.0858154296875, 0.014984130859375, 0.11578369140625, 0.216583251953125, 0.3173828125, 0.418182373046875, 0.51898193359375, 0.619781494140625, 0.7205810546875, 0.821380615234375, 0.92218017578125, 1.022979736328125, 1.123779296875, 1.224578857421875, 1.32537841796875, 1.426177978515625, 1.5269775390625, 1.627777099609375, 1.72857666015625, 1.829376220703125, 1.93017578125, 2.030975341796875, 2.13177490234375, 2.232574462890625, 2.3333740234375, 2.434173583984375, 2.53497314453125, 2.635772705078125, 2.736572265625, 2.837371826171875, 2.93817138671875, 3.038970947265625, 3.1397705078125, 3.240570068359375, 3.34136962890625, 3.442169189453125, 3.54296875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 11.0, 15.0, 14.0, 21.0, 26.0, 22.0, 23.0, 28.0, 27.0, 27.0, 30.0, 36.0, 52.0, 68.0, 110.0, 336.0, 1541.0, 154.0, 82.0, 40.0, 45.0, 35.0, 36.0, 32.0, 30.0, 31.0, 27.0, 18.0, 19.0, 20.0, 9.0, 9.0, 13.0, 9.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.2265625, -10.8775634765625, -10.528564453125, -10.1795654296875, -9.83056640625, -9.4815673828125, -9.132568359375, -8.7835693359375, -8.4345703125, -8.0855712890625, -7.736572265625, -7.3875732421875, -7.03857421875, -6.6895751953125, -6.340576171875, -5.9915771484375, -5.642578125, -5.2935791015625, -4.944580078125, -4.5955810546875, -4.24658203125, -3.8975830078125, -3.548583984375, -3.1995849609375, -2.8505859375, -2.5015869140625, -2.152587890625, -1.8035888671875, -1.45458984375, -1.1055908203125, -0.756591796875, -0.4075927734375, -0.05859375, 0.2904052734375, 0.639404296875, 0.9884033203125, 1.33740234375, 1.6864013671875, 2.035400390625, 2.3843994140625, 2.7333984375, 3.0823974609375, 3.431396484375, 3.7803955078125, 4.12939453125, 4.4783935546875, 4.827392578125, 5.1763916015625, 5.525390625, 5.8743896484375, 6.223388671875, 6.5723876953125, 6.92138671875, 7.2703857421875, 7.619384765625, 7.9683837890625, 8.3173828125, 8.6663818359375, 9.015380859375, 9.3643798828125, 9.71337890625, 10.0623779296875, 10.411376953125, 10.7603759765625, 11.109375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 7.0, 6.0, 6.0, 14.0, 9.0, 13.0, 19.0, 15.0, 21.0, 32.0, 36.0, 30.0, 51.0, 61.0, 79.0, 129.0, 213.0, 495.0, 1673.0, 24114.0, 3091949.0, 23762.0, 1669.0, 549.0, 205.0, 141.0, 88.0, 54.0, 40.0, 41.0, 26.0, 21.0, 23.0, 22.0, 21.0, 11.0, 9.0, 14.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-24.390625, -23.64013671875, -22.8896484375, -22.13916015625, -21.388671875, -20.63818359375, -19.8876953125, -19.13720703125, -18.38671875, -17.63623046875, -16.8857421875, -16.13525390625, -15.384765625, -14.63427734375, -13.8837890625, -13.13330078125, -12.3828125, -11.63232421875, -10.8818359375, -10.13134765625, -9.380859375, -8.63037109375, -7.8798828125, -7.12939453125, -6.37890625, -5.62841796875, -4.8779296875, -4.12744140625, -3.376953125, -2.62646484375, -1.8759765625, -1.12548828125, -0.375, 0.37548828125, 1.1259765625, 1.87646484375, 2.626953125, 3.37744140625, 4.1279296875, 4.87841796875, 5.62890625, 6.37939453125, 7.1298828125, 7.88037109375, 8.630859375, 9.38134765625, 10.1318359375, 10.88232421875, 11.6328125, 12.38330078125, 13.1337890625, 13.88427734375, 14.634765625, 15.38525390625, 16.1357421875, 16.88623046875, 17.63671875, 18.38720703125, 19.1376953125, 19.88818359375, 20.638671875, 21.38916015625, 22.1396484375, 22.89013671875, 23.640625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 53.0, 226.0, 390.0, 259.0, 64.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.25820255279541, -14.2777738571167, -13.297345161437988, -12.316917419433594, -11.336488723754883, -10.356060028076172, -9.375631332397461, -8.39520263671875, -7.414774417877197, -6.434345722198486, -5.453917503356934, -4.473488807678223, -3.493060350418091, -2.512631893157959, -1.532203197479248, -0.5517749786376953, 0.4286537170410156, 1.4090821743011475, 2.3895106315612793, 3.3699393272399902, 4.350367546081543, 5.330796241760254, 6.311224937438965, 7.291653156280518, 8.27208137512207, 9.252510070800781, 10.232938766479492, 11.213367462158203, 12.193795204162598, 13.174223899841309, 14.15465259552002, 15.135080337524414, 16.115510940551758, 17.09593963623047, 18.07636833190918, 19.05679702758789, 20.0372257232666, 21.017654418945312, 21.99808120727539, 22.9785099029541, 23.958938598632812, 24.939367294311523, 25.919795989990234, 26.900224685668945, 27.880653381347656, 28.861080169677734, 29.841510772705078, 30.821937561035156, 31.8023681640625, 32.78279495239258, 33.76322555541992, 34.74365234375, 35.724082946777344, 36.70450973510742, 37.684940338134766, 38.665367126464844, 39.64579391479492, 40.626220703125, 41.606651306152344, 42.58707809448242, 43.567508697509766, 44.547935485839844, 45.52836608886719, 46.508792877197266, 47.48922348022461]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 4.0, 0.0, 10.0, 9.0, 11.0, 12.0, 28.0, 28.0, 27.0, 20.0, 35.0, 35.0, 35.0, 37.0, 46.0, 40.0, 51.0, 45.0, 43.0, 37.0, 45.0, 51.0, 33.0, 38.0, 31.0, 33.0, 28.0, 24.0, 23.0, 21.0, 23.0, 16.0, 14.0, 15.0, 12.0, 2.0, 7.0, 6.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.05988311767578, -31.94179916381836, -30.823713302612305, -29.705629348754883, -28.587543487548828, -27.469459533691406, -26.351375579833984, -25.23328971862793, -24.115203857421875, -22.997119903564453, -21.8790340423584, -20.760950088500977, -19.642864227294922, -18.5247802734375, -17.406696319580078, -16.288610458374023, -15.170526504516602, -14.052441596984863, -12.934356689453125, -11.816272735595703, -10.698186874389648, -9.580102920532227, -8.462018013000488, -7.34393310546875, -6.225848197937012, -5.107763290405273, -3.9896786212921143, -2.871593952178955, -1.7535090446472168, -0.6354241371154785, 0.48266029357910156, 1.6007452011108398, 2.718830108642578, 3.8369150161743164, 4.954999923706055, 6.073084354400635, 7.191169261932373, 8.309253692626953, 9.427338600158691, 10.54542350769043, 11.663508415222168, 12.781593322753906, 13.899678230285645, 15.017763137817383, 16.135847091674805, 17.25393295288086, 18.37201690673828, 19.490100860595703, 20.608186721801758, 21.72627067565918, 22.844356536865234, 23.962440490722656, 25.08052635192871, 26.198610305786133, 27.316696166992188, 28.43478012084961, 29.55286407470703, 30.670948028564453, 31.789033889770508, 32.90711975097656, 34.025203704833984, 35.143287658691406, 36.26137161254883, 37.37945556640625, 38.49754333496094]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 8.0, 5.0, 7.0, 10.0, 9.0, 14.0, 11.0, 22.0, 15.0, 24.0, 21.0, 27.0, 28.0, 33.0, 36.0, 40.0, 44.0, 34.0, 44.0, 38.0, 42.0, 45.0, 31.0, 37.0, 42.0, 33.0, 28.0, 37.0, 30.0, 35.0, 28.0, 20.0, 27.0, 21.0, 12.0, 10.0, 15.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.792388916015625, -2.69024658203125, -2.588104248046875, -2.4859619140625, -2.383819580078125, -2.28167724609375, -2.179534912109375, -2.077392578125, -1.975250244140625, -1.87310791015625, -1.770965576171875, -1.6688232421875, -1.566680908203125, -1.46453857421875, -1.362396240234375, -1.26025390625, -1.158111572265625, -1.05596923828125, -0.953826904296875, -0.8516845703125, -0.749542236328125, -0.64739990234375, -0.545257568359375, -0.443115234375, -0.340972900390625, -0.23883056640625, -0.136688232421875, -0.0345458984375, 0.067596435546875, 0.16973876953125, 0.271881103515625, 0.3740234375, 0.476165771484375, 0.57830810546875, 0.680450439453125, 0.7825927734375, 0.884735107421875, 0.98687744140625, 1.089019775390625, 1.191162109375, 1.293304443359375, 1.39544677734375, 1.497589111328125, 1.5997314453125, 1.701873779296875, 1.80401611328125, 1.906158447265625, 2.00830078125, 2.110443115234375, 2.21258544921875, 2.314727783203125, 2.4168701171875, 2.519012451171875, 2.62115478515625, 2.723297119140625, 2.825439453125, 2.927581787109375, 3.02972412109375, 3.131866455078125, 3.2340087890625, 3.336151123046875, 3.43829345703125, 3.540435791015625, 3.642578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 3.0, 4.0, 9.0, 11.0, 18.0, 22.0, 20.0, 28.0, 35.0, 37.0, 50.0, 58.0, 81.0, 145.0, 212.0, 498.0, 1379.0, 5353.0, 26300.0, 205500.0, 2474710.0, 1358673.0, 100318.0, 15271.0, 3376.0, 1047.0, 404.0, 208.0, 121.0, 89.0, 59.0, 51.0, 34.0, 28.0, 34.0, 12.0, 16.0, 16.0, 9.0, 9.0, 10.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.140625, -10.767333984375, -10.39404296875, -10.020751953125, -9.6474609375, -9.274169921875, -8.90087890625, -8.527587890625, -8.154296875, -7.781005859375, -7.40771484375, -7.034423828125, -6.6611328125, -6.287841796875, -5.91455078125, -5.541259765625, -5.16796875, -4.794677734375, -4.42138671875, -4.048095703125, -3.6748046875, -3.301513671875, -2.92822265625, -2.554931640625, -2.181640625, -1.808349609375, -1.43505859375, -1.061767578125, -0.6884765625, -0.315185546875, 0.05810546875, 0.431396484375, 0.8046875, 1.177978515625, 1.55126953125, 1.924560546875, 2.2978515625, 2.671142578125, 3.04443359375, 3.417724609375, 3.791015625, 4.164306640625, 4.53759765625, 4.910888671875, 5.2841796875, 5.657470703125, 6.03076171875, 6.404052734375, 6.77734375, 7.150634765625, 7.52392578125, 7.897216796875, 8.2705078125, 8.643798828125, 9.01708984375, 9.390380859375, 9.763671875, 10.136962890625, 10.51025390625, 10.883544921875, 11.2568359375, 11.630126953125, 12.00341796875, 12.376708984375, 12.75]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 6.0, 9.0, 24.0, 16.0, 43.0, 53.0, 43.0, 69.0, 87.0, 123.0, 131.0, 188.0, 240.0, 275.0, 311.0, 377.0, 376.0, 348.0, 272.0, 209.0, 196.0, 159.0, 110.0, 100.0, 66.0, 48.0, 36.0, 35.0, 20.0, 17.0, 10.0, 16.0, 7.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.3206787109375, -8.024169921875, -7.7276611328125, -7.43115234375, -7.1346435546875, -6.838134765625, -6.5416259765625, -6.2451171875, -5.9486083984375, -5.652099609375, -5.3555908203125, -5.05908203125, -4.7625732421875, -4.466064453125, -4.1695556640625, -3.873046875, -3.5765380859375, -3.280029296875, -2.9835205078125, -2.68701171875, -2.3905029296875, -2.093994140625, -1.7974853515625, -1.5009765625, -1.2044677734375, -0.907958984375, -0.6114501953125, -0.31494140625, -0.0184326171875, 0.278076171875, 0.5745849609375, 0.87109375, 1.1676025390625, 1.464111328125, 1.7606201171875, 2.05712890625, 2.3536376953125, 2.650146484375, 2.9466552734375, 3.2431640625, 3.5396728515625, 3.836181640625, 4.1326904296875, 4.42919921875, 4.7257080078125, 5.022216796875, 5.3187255859375, 5.615234375, 5.9117431640625, 6.208251953125, 6.5047607421875, 6.80126953125, 7.0977783203125, 7.394287109375, 7.6907958984375, 7.9873046875, 8.2838134765625, 8.580322265625, 8.8768310546875, 9.17333984375, 9.4698486328125, 9.766357421875, 10.0628662109375, 10.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 11.0, 19.0, 22.0, 49.0, 80.0, 125.0, 224.0, 530.0, 1896.0, 37236.0, 3776137.0, 371070.0, 5271.0, 854.0, 306.0, 187.0, 102.0, 65.0, 29.0, 26.0, 11.0, 9.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -33.9443359375, -32.513671875, -31.0830078125, -29.65234375, -28.2216796875, -26.791015625, -25.3603515625, -23.9296875, -22.4990234375, -21.068359375, -19.6376953125, -18.20703125, -16.7763671875, -15.345703125, -13.9150390625, -12.484375, -11.0537109375, -9.623046875, -8.1923828125, -6.76171875, -5.3310546875, -3.900390625, -2.4697265625, -1.0390625, 0.3916015625, 1.822265625, 3.2529296875, 4.68359375, 6.1142578125, 7.544921875, 8.9755859375, 10.40625, 11.8369140625, 13.267578125, 14.6982421875, 16.12890625, 17.5595703125, 18.990234375, 20.4208984375, 21.8515625, 23.2822265625, 24.712890625, 26.1435546875, 27.57421875, 29.0048828125, 30.435546875, 31.8662109375, 33.296875, 34.7275390625, 36.158203125, 37.5888671875, 39.01953125, 40.4501953125, 41.880859375, 43.3115234375, 44.7421875, 46.1728515625, 47.603515625, 49.0341796875, 50.46484375, 51.8955078125, 53.326171875, 54.7568359375, 56.1875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 17.0, 37.0, 126.0, 229.0, 277.0, 192.0, 95.0, 26.0, 12.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.86409759521484, -93.87129974365234, -90.87850189208984, -87.88570404052734, -84.89290618896484, -81.90010833740234, -78.90731811523438, -75.91452026367188, -72.92172241210938, -69.92892456054688, -66.93612670898438, -63.943328857421875, -60.950531005859375, -57.957733154296875, -54.96493911743164, -51.97214126586914, -48.979339599609375, -45.986541748046875, -42.993743896484375, -40.000946044921875, -37.008148193359375, -34.015350341796875, -31.02255630493164, -28.02975845336914, -25.03696060180664, -22.04416275024414, -19.05136489868164, -16.058568954467773, -13.065771102905273, -10.072973251342773, -7.080177307128906, -4.087379455566406, -1.094573974609375, 1.8982234001159668, 4.891020774841309, 7.883817672729492, 10.876615524291992, 13.869413375854492, 16.86220932006836, 19.85500717163086, 22.84780502319336, 25.84060287475586, 28.83340072631836, 31.826196670532227, 34.818992614746094, 37.811790466308594, 40.804588317871094, 43.797386169433594, 46.790184020996094, 49.782981872558594, 52.775779724121094, 55.768577575683594, 58.761375427246094, 61.754173278808594, 64.74696350097656, 67.73976135253906, 70.73255920410156, 73.72535705566406, 76.71815490722656, 79.71095275878906, 82.70375061035156, 85.69654846191406, 88.68934631347656, 91.68214416503906, 94.67494201660156]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 5.0, 5.0, 10.0, 16.0, 8.0, 22.0, 18.0, 21.0, 32.0, 24.0, 39.0, 38.0, 33.0, 37.0, 46.0, 31.0, 41.0, 35.0, 30.0, 45.0, 48.0, 41.0, 40.0, 25.0, 35.0, 30.0, 33.0, 33.0, 26.0, 22.0, 12.0, 17.0, 14.0, 18.0, 11.0, 12.0, 14.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-38.133087158203125, -36.98931884765625, -35.84555435180664, -34.701786041259766, -33.558021545410156, -32.41425323486328, -31.270484924316406, -30.126718521118164, -28.982952117919922, -27.83918571472168, -26.695419311523438, -25.551651000976562, -24.40788459777832, -23.264118194580078, -22.120349884033203, -20.97658348083496, -19.83281707763672, -18.689050674438477, -17.545284271240234, -16.40151596069336, -15.257749557495117, -14.113983154296875, -12.970215797424316, -11.826448440551758, -10.682682037353516, -9.538915634155273, -8.395148277282715, -7.2513813972473145, -6.107614517211914, -4.963847637176514, -3.8200807571411133, -2.6763134002685547, -1.5325469970703125, -0.3887801170349121, 0.7549867630004883, 1.8987536430358887, 3.042520523071289, 4.1862874031066895, 5.33005428314209, 6.473821640014648, 7.617588043212891, 8.761354446411133, 9.905121803283691, 11.04888916015625, 12.192655563354492, 13.336421966552734, 14.480189323425293, 15.623956680297852, 16.767723083496094, 17.911489486694336, 19.055255889892578, 20.199024200439453, 21.342790603637695, 22.486557006835938, 23.630325317382812, 24.774091720581055, 25.917858123779297, 27.06162452697754, 28.20539093017578, 29.349159240722656, 30.4929256439209, 31.63669204711914, 32.780460357666016, 33.924224853515625, 35.0679931640625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 12.0, 14.0, 14.0, 19.0, 19.0, 28.0, 23.0, 32.0, 28.0, 37.0, 35.0, 38.0, 33.0, 43.0, 45.0, 40.0, 40.0, 46.0, 28.0, 34.0, 49.0, 38.0, 32.0, 28.0, 28.0, 24.0, 33.0, 15.0, 26.0, 16.0, 15.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.858154296875, -2.75146484375, -2.644775390625, -2.5380859375, -2.431396484375, -2.32470703125, -2.218017578125, -2.111328125, -2.004638671875, -1.89794921875, -1.791259765625, -1.6845703125, -1.577880859375, -1.47119140625, -1.364501953125, -1.2578125, -1.151123046875, -1.04443359375, -0.937744140625, -0.8310546875, -0.724365234375, -0.61767578125, -0.510986328125, -0.404296875, -0.297607421875, -0.19091796875, -0.084228515625, 0.0224609375, 0.129150390625, 0.23583984375, 0.342529296875, 0.44921875, 0.555908203125, 0.66259765625, 0.769287109375, 0.8759765625, 0.982666015625, 1.08935546875, 1.196044921875, 1.302734375, 1.409423828125, 1.51611328125, 1.622802734375, 1.7294921875, 1.836181640625, 1.94287109375, 2.049560546875, 2.15625, 2.262939453125, 2.36962890625, 2.476318359375, 2.5830078125, 2.689697265625, 2.79638671875, 2.903076171875, 3.009765625, 3.116455078125, 3.22314453125, 3.329833984375, 3.4365234375, 3.543212890625, 3.64990234375, 3.756591796875, 3.86328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 11.0, 20.0, 15.0, 38.0, 45.0, 77.0, 98.0, 162.0, 223.0, 307.0, 469.0, 702.0, 1054.0, 1501.0, 2290.0, 3444.0, 4905.0, 7341.0, 11159.0, 17050.0, 26151.0, 39826.0, 62347.0, 95053.0, 134413.0, 164827.0, 150797.0, 111206.0, 74123.0, 48114.0, 30814.0, 20263.0, 13096.0, 8668.0, 5771.0, 4060.0, 2673.0, 1691.0, 1192.0, 790.0, 561.0, 352.0, 242.0, 205.0, 137.0, 76.0, 56.0, 37.0, 35.0, 16.0, 10.0, 8.0, 8.0, 8.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.29833984375, -0.2889289855957031, -0.27951812744140625, -0.2701072692871094, -0.2606964111328125, -0.2512855529785156, -0.24187469482421875, -0.23246383666992188, -0.223052978515625, -0.21364212036132812, -0.20423126220703125, -0.19482040405273438, -0.1854095458984375, -0.17599868774414062, -0.16658782958984375, -0.15717697143554688, -0.14776611328125, -0.13835525512695312, -0.12894439697265625, -0.11953353881835938, -0.1101226806640625, -0.10071182250976562, -0.09130096435546875, -0.08189010620117188, -0.072479248046875, -0.06306838989257812, -0.05365753173828125, -0.044246673583984375, -0.0348358154296875, -0.025424957275390625, -0.01601409912109375, -0.006603240966796875, 0.0028076171875, 0.012218475341796875, 0.02162933349609375, 0.031040191650390625, 0.0404510498046875, 0.049861907958984375, 0.05927276611328125, 0.06868362426757812, 0.078094482421875, 0.08750534057617188, 0.09691619873046875, 0.10632705688476562, 0.1157379150390625, 0.12514877319335938, 0.13455963134765625, 0.14397048950195312, 0.15338134765625, 0.16279220581054688, 0.17220306396484375, 0.18161392211914062, 0.1910247802734375, 0.20043563842773438, 0.20984649658203125, 0.21925735473632812, 0.228668212890625, 0.23807907104492188, 0.24748992919921875, 0.2569007873535156, 0.2663116455078125, 0.2757225036621094, 0.28513336181640625, 0.2945442199707031, 0.303955078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 0.0, 4.0, 8.0, 8.0, 10.0, 7.0, 8.0, 10.0, 13.0, 12.0, 15.0, 23.0, 21.0, 29.0, 32.0, 34.0, 34.0, 39.0, 39.0, 43.0, 40.0, 34.0, 1062.0, 37.0, 38.0, 41.0, 31.0, 42.0, 39.0, 32.0, 32.0, 30.0, 24.0, 20.0, 23.0, 14.0, 13.0, 15.0, 16.0, 10.0, 7.0, 10.0, 6.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0], "bins": [-2.20703125, -2.1419830322265625, -2.076934814453125, -2.0118865966796875, -1.94683837890625, -1.8817901611328125, -1.816741943359375, -1.7516937255859375, -1.6866455078125, -1.6215972900390625, -1.556549072265625, -1.4915008544921875, -1.42645263671875, -1.3614044189453125, -1.296356201171875, -1.2313079833984375, -1.166259765625, -1.1012115478515625, -1.036163330078125, -0.9711151123046875, -0.90606689453125, -0.8410186767578125, -0.775970458984375, -0.7109222412109375, -0.6458740234375, -0.5808258056640625, -0.515777587890625, -0.4507293701171875, -0.38568115234375, -0.3206329345703125, -0.255584716796875, -0.1905364990234375, -0.12548828125, -0.0604400634765625, 0.004608154296875, 0.0696563720703125, 0.13470458984375, 0.1997528076171875, 0.264801025390625, 0.3298492431640625, 0.3948974609375, 0.4599456787109375, 0.524993896484375, 0.5900421142578125, 0.65509033203125, 0.7201385498046875, 0.785186767578125, 0.8502349853515625, 0.915283203125, 0.9803314208984375, 1.045379638671875, 1.1104278564453125, 1.17547607421875, 1.2405242919921875, 1.305572509765625, 1.3706207275390625, 1.4356689453125, 1.5007171630859375, 1.565765380859375, 1.6308135986328125, 1.69586181640625, 1.7609100341796875, 1.825958251953125, 1.8910064697265625, 1.9560546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 13.0, 19.0, 26.0, 30.0, 44.0, 107.0, 144.0, 206.0, 323.0, 498.0, 642.0, 915.0, 1439.0, 2136.0, 2944.0, 4393.0, 6447.0, 9795.0, 14689.0, 21842.0, 32012.0, 46943.0, 66101.0, 89386.0, 113710.0, 1170753.0, 133089.0, 106995.0, 82325.0, 59643.0, 41785.0, 28588.0, 19420.0, 12934.0, 8761.0, 5842.0, 3886.0, 2568.0, 1826.0, 1262.0, 875.0, 594.0, 376.0, 276.0, 183.0, 116.0, 77.0, 56.0, 37.0, 24.0, 19.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.20361328125, -0.1972198486328125, -0.190826416015625, -0.1844329833984375, -0.17803955078125, -0.1716461181640625, -0.165252685546875, -0.1588592529296875, -0.1524658203125, -0.1460723876953125, -0.139678955078125, -0.1332855224609375, -0.12689208984375, -0.1204986572265625, -0.114105224609375, -0.1077117919921875, -0.101318359375, -0.0949249267578125, -0.088531494140625, -0.0821380615234375, -0.07574462890625, -0.0693511962890625, -0.062957763671875, -0.0565643310546875, -0.0501708984375, -0.0437774658203125, -0.037384033203125, -0.0309906005859375, -0.02459716796875, -0.0182037353515625, -0.011810302734375, -0.0054168701171875, 0.0009765625, 0.0073699951171875, 0.013763427734375, 0.0201568603515625, 0.02655029296875, 0.0329437255859375, 0.039337158203125, 0.0457305908203125, 0.0521240234375, 0.0585174560546875, 0.064910888671875, 0.0713043212890625, 0.07769775390625, 0.0840911865234375, 0.090484619140625, 0.0968780517578125, 0.103271484375, 0.1096649169921875, 0.116058349609375, 0.1224517822265625, 0.12884521484375, 0.1352386474609375, 0.141632080078125, 0.1480255126953125, 0.1544189453125, 0.1608123779296875, 0.167205810546875, 0.1735992431640625, 0.17999267578125, 0.1863861083984375, 0.192779541015625, 0.1991729736328125, 0.20556640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 9.0, 3.0, 9.0, 10.0, 15.0, 11.0, 13.0, 22.0, 28.0, 27.0, 44.0, 51.0, 55.0, 70.0, 75.0, 80.0, 67.0, 73.0, 58.0, 59.0, 51.0, 28.0, 22.0, 29.0, 26.0, 17.0, 17.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0017871856689453125, -0.0017337799072265625, -0.0016803741455078125, -0.0016269683837890625, -0.0015735626220703125, -0.0015201568603515625, -0.0014667510986328125, -0.0014133453369140625, -0.0013599395751953125, -0.0013065338134765625, -0.0012531280517578125, -0.0011997222900390625, -0.0011463165283203125, -0.0010929107666015625, -0.0010395050048828125, -0.0009860992431640625, -0.0009326934814453125, -0.0008792877197265625, -0.0008258819580078125, -0.0007724761962890625, -0.0007190704345703125, -0.0006656646728515625, -0.0006122589111328125, -0.0005588531494140625, -0.0005054473876953125, -0.0004520416259765625, -0.0003986358642578125, -0.0003452301025390625, -0.0002918243408203125, -0.0002384185791015625, -0.0001850128173828125, -0.0001316070556640625, -7.82012939453125e-05, -2.47955322265625e-05, 2.86102294921875e-05, 8.20159912109375e-05, 0.0001354217529296875, 0.0001888275146484375, 0.0002422332763671875, 0.0002956390380859375, 0.0003490447998046875, 0.0004024505615234375, 0.0004558563232421875, 0.0005092620849609375, 0.0005626678466796875, 0.0006160736083984375, 0.0006694793701171875, 0.0007228851318359375, 0.0007762908935546875, 0.0008296966552734375, 0.0008831024169921875, 0.0009365081787109375, 0.0009899139404296875, 0.0010433197021484375, 0.0010967254638671875, 0.0011501312255859375, 0.0012035369873046875, 0.0012569427490234375, 0.0013103485107421875, 0.0013637542724609375, 0.0014171600341796875, 0.0014705657958984375, 0.0015239715576171875, 0.0015773773193359375, 0.0016307830810546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 15.0, 19.0, 25.0, 46.0, 63.0, 77.0, 166.0, 289.0, 487.0, 7402.0, 1037665.0, 1265.0, 415.0, 217.0, 109.0, 95.0, 60.0, 22.0, 24.0, 12.0, 23.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0443115234375, -0.042896270751953125, -0.04148101806640625, -0.040065765380859375, -0.0386505126953125, -0.037235260009765625, -0.03582000732421875, -0.034404754638671875, -0.032989501953125, -0.031574249267578125, -0.03015899658203125, -0.028743743896484375, -0.0273284912109375, -0.025913238525390625, -0.02449798583984375, -0.023082733154296875, -0.02166748046875, -0.020252227783203125, -0.01883697509765625, -0.017421722412109375, -0.0160064697265625, -0.014591217041015625, -0.01317596435546875, -0.011760711669921875, -0.010345458984375, -0.008930206298828125, -0.00751495361328125, -0.006099700927734375, -0.0046844482421875, -0.003269195556640625, -0.00185394287109375, -0.000438690185546875, 0.0009765625, 0.002391815185546875, 0.00380706787109375, 0.005222320556640625, 0.0066375732421875, 0.008052825927734375, 0.00946807861328125, 0.010883331298828125, 0.012298583984375, 0.013713836669921875, 0.01512908935546875, 0.016544342041015625, 0.0179595947265625, 0.019374847412109375, 0.02079010009765625, 0.022205352783203125, 0.02362060546875, 0.025035858154296875, 0.02645111083984375, 0.027866363525390625, 0.0292816162109375, 0.030696868896484375, 0.03211212158203125, 0.033527374267578125, 0.034942626953125, 0.036357879638671875, 0.03777313232421875, 0.039188385009765625, 0.0406036376953125, 0.042018890380859375, 0.04343414306640625, 0.044849395751953125, 0.0462646484375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 201.0, 788.0, 27.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0068946522660553455, -0.006659148260951042, -0.006423644255846739, -0.0061881402507424355, -0.005952636711299419, -0.005717132240533829, -0.005481628701090813, -0.005246124695986509, -0.005010620690882206, -0.004775116685777903, -0.004539612680673599, -0.004304108675569296, -0.0040686046704649925, -0.003833100898191333, -0.003597597125917673, -0.0033620931208133698, -0.0031265891157090664, -0.002891085110604763, -0.0026555811055004597, -0.0024200773332268, -0.0021845733281224966, -0.0019490693230181932, -0.0017135654343292117, -0.0014780615456402302, -0.0012425575405359268, -0.0010070535354316235, -0.0007715496467426419, -0.0005360456998459995, -0.00030054175294935703, -6.503774784505367e-05, 0.00017046614084392786, 0.0004059700295329094, 0.0006414745002985001, 0.0008769784471951425, 0.001112482394091785, 0.0013479862827807665, 0.0015834902878850698, 0.0018189942929893732, 0.002054498065263033, 0.0022900020703673363, 0.0025255060754716396, 0.002761010080575943, 0.0029965140856802464, 0.003232017857953906, 0.0034675218630582094, 0.0037030258681625128, 0.0039385296404361725, 0.004174033645540476, 0.004409537650644779, 0.0046450416557490826, 0.004880545660853386, 0.005116049665957689, 0.005351553671061993, 0.005587057210505009, 0.005822561215609312, 0.006058065220713615, 0.006293569225817919, 0.006529073230922222, 0.0067645772360265255, 0.007000081241130829, 0.007235584780573845, 0.007471089251339436, 0.007706592790782452, 0.007942097261548042, 0.008177600800991058]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 9.0, 6.0, 11.0, 8.0, 12.0, 9.0, 17.0, 25.0, 17.0, 31.0, 19.0, 24.0, 25.0, 31.0, 27.0, 35.0, 33.0, 35.0, 44.0, 38.0, 47.0, 45.0, 38.0, 35.0, 31.0, 29.0, 43.0, 50.0, 37.0, 27.0, 33.0, 24.0, 26.0, 14.0, 11.0, 9.0, 6.0, 10.0, 11.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0009272098541259766, -0.0009017828851938248, -0.000876355916261673, -0.0008509289473295212, -0.0008255019783973694, -0.0008000750094652176, -0.0007746480405330658, -0.000749221071600914, -0.0007237941026687622, -0.0006983671337366104, -0.0006729401648044586, -0.0006475131958723068, -0.000622086226940155, -0.0005966592580080032, -0.0005712322890758514, -0.0005458053201436996, -0.0005203783512115479, -0.0004949513822793961, -0.00046952441334724426, -0.00044409744441509247, -0.0004186704754829407, -0.0003932435065507889, -0.0003678165376186371, -0.0003423895686864853, -0.0003169625997543335, -0.0002915356308221817, -0.0002661086618900299, -0.0002406816929578781, -0.00021525472402572632, -0.00018982775509357452, -0.00016440078616142273, -0.00013897381722927094, -0.00011354684829711914, -8.811987936496735e-05, -6.269291043281555e-05, -3.726594150066376e-05, -1.1838972568511963e-05, 1.3587996363639832e-05, 3.9014965295791626e-05, 6.444193422794342e-05, 8.986890316009521e-05, 0.00011529587209224701, 0.0001407228410243988, 0.0001661498099565506, 0.0001915767788887024, 0.0002170037478208542, 0.00024243071675300598, 0.0002678576856851578, 0.00029328465461730957, 0.00031871162354946136, 0.00034413859248161316, 0.00036956556141376495, 0.00039499253034591675, 0.00042041949927806854, 0.00044584646821022034, 0.00047127343714237213, 0.0004967004060745239, 0.0005221273750066757, 0.0005475543439388275, 0.0005729813128709793, 0.0005984082818031311, 0.0006238352507352829, 0.0006492622196674347, 0.0006746891885995865, 0.0007001161575317383]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 12.0, 14.0, 14.0, 19.0, 19.0, 28.0, 23.0, 32.0, 28.0, 37.0, 35.0, 38.0, 33.0, 43.0, 45.0, 40.0, 40.0, 46.0, 28.0, 34.0, 49.0, 38.0, 32.0, 28.0, 28.0, 24.0, 33.0, 15.0, 26.0, 16.0, 15.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.858154296875, -2.75146484375, -2.644775390625, -2.5380859375, -2.431396484375, -2.32470703125, -2.218017578125, -2.111328125, -2.004638671875, -1.89794921875, -1.791259765625, -1.6845703125, -1.577880859375, -1.47119140625, -1.364501953125, -1.2578125, -1.151123046875, -1.04443359375, -0.937744140625, -0.8310546875, -0.724365234375, -0.61767578125, -0.510986328125, -0.404296875, -0.297607421875, -0.19091796875, -0.084228515625, 0.0224609375, 0.129150390625, 0.23583984375, 0.342529296875, 0.44921875, 0.555908203125, 0.66259765625, 0.769287109375, 0.8759765625, 0.982666015625, 1.08935546875, 1.196044921875, 1.302734375, 1.409423828125, 1.51611328125, 1.622802734375, 1.7294921875, 1.836181640625, 1.94287109375, 2.049560546875, 2.15625, 2.262939453125, 2.36962890625, 2.476318359375, 2.5830078125, 2.689697265625, 2.79638671875, 2.903076171875, 3.009765625, 3.116455078125, 3.22314453125, 3.329833984375, 3.4365234375, 3.543212890625, 3.64990234375, 3.756591796875, 3.86328125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 14.0, 32.0, 36.0, 48.0, 84.0, 112.0, 206.0, 272.0, 448.0, 695.0, 1164.0, 1931.0, 3224.0, 5627.0, 9836.0, 18218.0, 37799.0, 89464.0, 263893.0, 380429.0, 130761.0, 51160.0, 23734.0, 12276.0, 6939.0, 3890.0, 2373.0, 1445.0, 894.0, 526.0, 321.0, 218.0, 157.0, 103.0, 59.0, 48.0, 32.0, 21.0, 8.0, 14.0, 7.0, 7.0, 7.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-2.791015625, -2.711700439453125, -2.63238525390625, -2.553070068359375, -2.4737548828125, -2.394439697265625, -2.31512451171875, -2.235809326171875, -2.156494140625, -2.077178955078125, -1.99786376953125, -1.918548583984375, -1.8392333984375, -1.759918212890625, -1.68060302734375, -1.601287841796875, -1.52197265625, -1.442657470703125, -1.36334228515625, -1.284027099609375, -1.2047119140625, -1.125396728515625, -1.04608154296875, -0.966766357421875, -0.887451171875, -0.808135986328125, -0.72882080078125, -0.649505615234375, -0.5701904296875, -0.490875244140625, -0.41156005859375, -0.332244873046875, -0.2529296875, -0.173614501953125, -0.09429931640625, -0.014984130859375, 0.0643310546875, 0.143646240234375, 0.22296142578125, 0.302276611328125, 0.381591796875, 0.460906982421875, 0.54022216796875, 0.619537353515625, 0.6988525390625, 0.778167724609375, 0.85748291015625, 0.936798095703125, 1.01611328125, 1.095428466796875, 1.17474365234375, 1.254058837890625, 1.3333740234375, 1.412689208984375, 1.49200439453125, 1.571319580078125, 1.650634765625, 1.729949951171875, 1.80926513671875, 1.888580322265625, 1.9678955078125, 2.047210693359375, 2.12652587890625, 2.205841064453125, 2.28515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 13.0, 10.0, 23.0, 23.0, 25.0, 15.0, 29.0, 27.0, 33.0, 43.0, 46.0, 41.0, 38.0, 69.0, 70.0, 204.0, 1726.0, 126.0, 72.0, 55.0, 40.0, 32.0, 22.0, 35.0, 22.0, 23.0, 19.0, 21.0, 22.0, 21.0, 10.0, 14.0, 12.0, 6.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.734375, -11.3714599609375, -11.008544921875, -10.6456298828125, -10.28271484375, -9.9197998046875, -9.556884765625, -9.1939697265625, -8.8310546875, -8.4681396484375, -8.105224609375, -7.7423095703125, -7.37939453125, -7.0164794921875, -6.653564453125, -6.2906494140625, -5.927734375, -5.5648193359375, -5.201904296875, -4.8389892578125, -4.47607421875, -4.1131591796875, -3.750244140625, -3.3873291015625, -3.0244140625, -2.6614990234375, -2.298583984375, -1.9356689453125, -1.57275390625, -1.2098388671875, -0.846923828125, -0.4840087890625, -0.12109375, 0.2418212890625, 0.604736328125, 0.9676513671875, 1.33056640625, 1.6934814453125, 2.056396484375, 2.4193115234375, 2.7822265625, 3.1451416015625, 3.508056640625, 3.8709716796875, 4.23388671875, 4.5968017578125, 4.959716796875, 5.3226318359375, 5.685546875, 6.0484619140625, 6.411376953125, 6.7742919921875, 7.13720703125, 7.5001220703125, 7.863037109375, 8.2259521484375, 8.5888671875, 8.9517822265625, 9.314697265625, 9.6776123046875, 10.04052734375, 10.4034423828125, 10.766357421875, 11.1292724609375, 11.4921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 5.0, 4.0, 7.0, 5.0, 10.0, 12.0, 11.0, 17.0, 21.0, 32.0, 32.0, 31.0, 44.0, 66.0, 92.0, 124.0, 208.0, 470.0, 1295.0, 11317.0, 1842131.0, 1276330.0, 10820.0, 1377.0, 470.0, 207.0, 132.0, 99.0, 72.0, 44.0, 34.0, 25.0, 30.0, 29.0, 20.0, 13.0, 14.0, 13.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.193115234375, -18.57373046875, -17.954345703125, -17.3349609375, -16.715576171875, -16.09619140625, -15.476806640625, -14.857421875, -14.238037109375, -13.61865234375, -12.999267578125, -12.3798828125, -11.760498046875, -11.14111328125, -10.521728515625, -9.90234375, -9.282958984375, -8.66357421875, -8.044189453125, -7.4248046875, -6.805419921875, -6.18603515625, -5.566650390625, -4.947265625, -4.327880859375, -3.70849609375, -3.089111328125, -2.4697265625, -1.850341796875, -1.23095703125, -0.611572265625, 0.0078125, 0.627197265625, 1.24658203125, 1.865966796875, 2.4853515625, 3.104736328125, 3.72412109375, 4.343505859375, 4.962890625, 5.582275390625, 6.20166015625, 6.821044921875, 7.4404296875, 8.059814453125, 8.67919921875, 9.298583984375, 9.91796875, 10.537353515625, 11.15673828125, 11.776123046875, 12.3955078125, 13.014892578125, 13.63427734375, 14.253662109375, 14.873046875, 15.492431640625, 16.11181640625, 16.731201171875, 17.3505859375, 17.969970703125, 18.58935546875, 19.208740234375, 19.828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 771.0, 246.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-383.4617919921875, -376.8341369628906, -370.2064514160156, -363.57879638671875, -356.9511413574219, -350.3234558105469, -343.69580078125, -337.068115234375, -330.4404602050781, -323.81280517578125, -317.18511962890625, -310.5574645996094, -303.9298095703125, -297.3021240234375, -290.6744689941406, -284.04681396484375, -277.41912841796875, -270.7914733886719, -264.1637878417969, -257.5361328125, -250.90846252441406, -244.28079223632812, -237.65313720703125, -231.0254669189453, -224.39781188964844, -217.7701416015625, -211.14248657226562, -204.5148162841797, -197.88714599609375, -191.25949096679688, -184.63182067871094, -178.004150390625, -171.37648010253906, -164.74880981445312, -158.12115478515625, -151.4934844970703, -144.86581420898438, -138.2381591796875, -131.61048889160156, -124.98281860351562, -118.35514831542969, -111.72748565673828, -105.09981536865234, -98.47215270996094, -91.844482421875, -85.2168197631836, -78.58915710449219, -71.96148681640625, -65.33381652832031, -58.70615005493164, -52.07848358154297, -45.45082092285156, -38.823150634765625, -32.19548797607422, -25.567821502685547, -18.940155029296875, -12.312492370605469, -5.684826374053955, 0.9428396224975586, 7.570505142211914, 14.198171615600586, 20.825836181640625, 27.453502655029297, 34.08116912841797, 40.70883560180664]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 14.0, 10.0, 14.0, 7.0, 19.0, 26.0, 18.0, 29.0, 21.0, 37.0, 31.0, 47.0, 35.0, 35.0, 39.0, 50.0, 40.0, 44.0, 41.0, 41.0, 33.0, 34.0, 36.0, 33.0, 35.0, 23.0, 21.0, 29.0, 21.0, 24.0, 24.0, 12.0, 11.0, 11.0, 9.0, 6.0, 8.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.72179412841797, -35.518733978271484, -34.315677642822266, -33.11261749267578, -31.909557342529297, -30.706499099731445, -29.503440856933594, -28.30038070678711, -27.097322463989258, -25.894264221191406, -24.691204071044922, -23.48814582824707, -22.28508758544922, -21.082027435302734, -19.878969192504883, -18.67591094970703, -17.472850799560547, -16.269792556762695, -15.066732406616211, -13.86367416381836, -12.660614967346191, -11.457555770874023, -10.254497528076172, -9.051438331604004, -7.848379135131836, -6.645319938659668, -5.442261219024658, -4.239202499389648, -3.0361433029174805, -1.8330841064453125, -0.6300253868103027, 0.573033332824707, 1.776092529296875, 2.979151487350464, 4.182210445404053, 5.3852691650390625, 6.5883283615112305, 7.791387557983398, 8.99444580078125, 10.197504997253418, 11.400564193725586, 12.603623390197754, 13.806682586669922, 15.009740829467773, 16.212799072265625, 17.41585922241211, 18.61891746520996, 19.821975708007812, 21.025035858154297, 22.22809410095215, 23.431154251098633, 24.634212493896484, 25.83727264404297, 27.04033088684082, 28.243389129638672, 29.446449279785156, 30.649507522583008, 31.85256576538086, 33.055625915527344, 34.25868606567383, 35.46174240112305, 36.66480255126953, 37.867862701416016, 39.070919036865234, 40.27397918701172]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 7.0, 10.0, 11.0, 13.0, 15.0, 15.0, 18.0, 27.0, 21.0, 30.0, 25.0, 31.0, 37.0, 41.0, 33.0, 33.0, 34.0, 49.0, 41.0, 39.0, 44.0, 28.0, 42.0, 36.0, 34.0, 31.0, 30.0, 35.0, 38.0, 12.0, 27.0, 23.0, 15.0, 15.0, 9.0, 12.0, 9.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.91986083984375, -2.8104248046875, -2.70098876953125, -2.591552734375, -2.48211669921875, -2.3726806640625, -2.26324462890625, -2.15380859375, -2.04437255859375, -1.9349365234375, -1.82550048828125, -1.716064453125, -1.60662841796875, -1.4971923828125, -1.38775634765625, -1.2783203125, -1.16888427734375, -1.0594482421875, -0.95001220703125, -0.840576171875, -0.73114013671875, -0.6217041015625, -0.51226806640625, -0.40283203125, -0.29339599609375, -0.1839599609375, -0.07452392578125, 0.034912109375, 0.14434814453125, 0.2537841796875, 0.36322021484375, 0.47265625, 0.58209228515625, 0.6915283203125, 0.80096435546875, 0.910400390625, 1.01983642578125, 1.1292724609375, 1.23870849609375, 1.34814453125, 1.45758056640625, 1.5670166015625, 1.67645263671875, 1.785888671875, 1.89532470703125, 2.0047607421875, 2.11419677734375, 2.2236328125, 2.33306884765625, 2.4425048828125, 2.55194091796875, 2.661376953125, 2.77081298828125, 2.8802490234375, 2.98968505859375, 3.09912109375, 3.20855712890625, 3.3179931640625, 3.42742919921875, 3.536865234375, 3.64630126953125, 3.7557373046875, 3.86517333984375, 3.974609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 7.0, 12.0, 8.0, 13.0, 10.0, 21.0, 14.0, 18.0, 22.0, 24.0, 36.0, 43.0, 60.0, 101.0, 193.0, 586.0, 3151.0, 27434.0, 808404.0, 3236244.0, 107610.0, 8255.0, 1223.0, 285.0, 121.0, 80.0, 55.0, 37.0, 27.0, 22.0, 24.0, 22.0, 23.0, 22.0, 12.0, 11.0, 10.0, 7.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.89111328125, -16.3134765625, -15.73583984375, -15.158203125, -14.58056640625, -14.0029296875, -13.42529296875, -12.84765625, -12.27001953125, -11.6923828125, -11.11474609375, -10.537109375, -9.95947265625, -9.3818359375, -8.80419921875, -8.2265625, -7.64892578125, -7.0712890625, -6.49365234375, -5.916015625, -5.33837890625, -4.7607421875, -4.18310546875, -3.60546875, -3.02783203125, -2.4501953125, -1.87255859375, -1.294921875, -0.71728515625, -0.1396484375, 0.43798828125, 1.015625, 1.59326171875, 2.1708984375, 2.74853515625, 3.326171875, 3.90380859375, 4.4814453125, 5.05908203125, 5.63671875, 6.21435546875, 6.7919921875, 7.36962890625, 7.947265625, 8.52490234375, 9.1025390625, 9.68017578125, 10.2578125, 10.83544921875, 11.4130859375, 11.99072265625, 12.568359375, 13.14599609375, 13.7236328125, 14.30126953125, 14.87890625, 15.45654296875, 16.0341796875, 16.61181640625, 17.189453125, 17.76708984375, 18.3447265625, 18.92236328125, 19.5]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 8.0, 24.0, 28.0, 48.0, 62.0, 86.0, 132.0, 145.0, 186.0, 273.0, 367.0, 435.0, 493.0, 423.0, 357.0, 292.0, 198.0, 131.0, 94.0, 82.0, 50.0, 43.0, 22.0, 21.0, 13.0, 6.0, 10.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3984375, -14.033447265625, -13.66845703125, -13.303466796875, -12.9384765625, -12.573486328125, -12.20849609375, -11.843505859375, -11.478515625, -11.113525390625, -10.74853515625, -10.383544921875, -10.0185546875, -9.653564453125, -9.28857421875, -8.923583984375, -8.55859375, -8.193603515625, -7.82861328125, -7.463623046875, -7.0986328125, -6.733642578125, -6.36865234375, -6.003662109375, -5.638671875, -5.273681640625, -4.90869140625, -4.543701171875, -4.1787109375, -3.813720703125, -3.44873046875, -3.083740234375, -2.71875, -2.353759765625, -1.98876953125, -1.623779296875, -1.2587890625, -0.893798828125, -0.52880859375, -0.163818359375, 0.201171875, 0.566162109375, 0.93115234375, 1.296142578125, 1.6611328125, 2.026123046875, 2.39111328125, 2.756103515625, 3.12109375, 3.486083984375, 3.85107421875, 4.216064453125, 4.5810546875, 4.946044921875, 5.31103515625, 5.676025390625, 6.041015625, 6.406005859375, 6.77099609375, 7.135986328125, 7.5009765625, 7.865966796875, 8.23095703125, 8.595947265625, 8.9609375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 8.0, 3.0, 4.0, 7.0, 9.0, 15.0, 18.0, 18.0, 30.0, 48.0, 55.0, 90.0, 134.0, 240.0, 457.0, 1048.0, 4720.0, 101132.0, 3710549.0, 363300.0, 9457.0, 1502.0, 563.0, 296.0, 186.0, 120.0, 102.0, 49.0, 44.0, 23.0, 16.0, 18.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.562255859375, -22.42138671875, -21.280517578125, -20.1396484375, -18.998779296875, -17.85791015625, -16.717041015625, -15.576171875, -14.435302734375, -13.29443359375, -12.153564453125, -11.0126953125, -9.871826171875, -8.73095703125, -7.590087890625, -6.44921875, -5.308349609375, -4.16748046875, -3.026611328125, -1.8857421875, -0.744873046875, 0.39599609375, 1.536865234375, 2.677734375, 3.818603515625, 4.95947265625, 6.100341796875, 7.2412109375, 8.382080078125, 9.52294921875, 10.663818359375, 11.8046875, 12.945556640625, 14.08642578125, 15.227294921875, 16.3681640625, 17.509033203125, 18.64990234375, 19.790771484375, 20.931640625, 22.072509765625, 23.21337890625, 24.354248046875, 25.4951171875, 26.635986328125, 27.77685546875, 28.917724609375, 30.05859375, 31.199462890625, 32.34033203125, 33.481201171875, 34.6220703125, 35.762939453125, 36.90380859375, 38.044677734375, 39.185546875, 40.326416015625, 41.46728515625, 42.608154296875, 43.7490234375, 44.889892578125, 46.03076171875, 47.171630859375, 48.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 34.0, 110.0, 278.0, 336.0, 181.0, 55.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.61972045898438, -94.37468719482422, -90.12965393066406, -85.8846206665039, -81.63958740234375, -77.39456176757812, -73.14952850341797, -68.90449523925781, -64.65946197509766, -60.4144287109375, -56.169395446777344, -51.92436599731445, -47.6793327331543, -43.43429946899414, -39.18927001953125, -34.944236755371094, -30.699203491210938, -26.45417022705078, -22.209138870239258, -17.964107513427734, -13.719074249267578, -9.474040985107422, -5.229009628295898, -0.983978271484375, 3.2610549926757812, 7.506087303161621, 11.751119613647461, 15.9961519241333, 20.24118423461914, 24.486217498779297, 28.73124885559082, 32.976280212402344, 37.22132873535156, 41.46636199951172, 45.711395263671875, 49.956424713134766, 54.20145797729492, 58.44649124145508, 62.69152069091797, 66.93655395507812, 71.18158721923828, 75.42662048339844, 79.6716537475586, 83.91668701171875, 88.16171264648438, 92.40675354003906, 96.65177917480469, 100.89681243896484, 105.141845703125, 109.38687896728516, 113.63191223144531, 117.87694549560547, 122.12197875976562, 126.36700439453125, 130.61204528808594, 134.85707092285156, 139.10211181640625, 143.34713745117188, 147.59217834472656, 151.8372039794922, 156.08224487304688, 160.3272705078125, 164.5723114013672, 168.8173370361328, 173.06236267089844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 5.0, 11.0, 17.0, 13.0, 14.0, 14.0, 24.0, 23.0, 26.0, 44.0, 37.0, 39.0, 39.0, 50.0, 48.0, 45.0, 42.0, 38.0, 37.0, 41.0, 47.0, 34.0, 31.0, 21.0, 27.0, 31.0, 21.0, 29.0, 29.0, 23.0, 15.0, 13.0, 10.0, 9.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.396240234375, -37.092552185058594, -35.78886413574219, -34.48517608642578, -33.181488037109375, -31.877798080444336, -30.574108123779297, -29.27042007446289, -27.966732025146484, -26.663043975830078, -25.359355926513672, -24.055665969848633, -22.751977920532227, -21.44828987121582, -20.14459991455078, -18.840911865234375, -17.53722381591797, -16.233535766601562, -14.92984676361084, -13.626157760620117, -12.322469711303711, -11.018781661987305, -9.715092658996582, -8.41140365600586, -7.107715606689453, -5.804027080535889, -4.500338554382324, -3.1966500282287598, -1.8929615020751953, -0.5892729759216309, 0.7144155502319336, 2.0181045532226562, 3.3217926025390625, 4.625481128692627, 5.929169654846191, 7.232858180999756, 8.53654670715332, 9.840234756469727, 11.14392375946045, 12.447612762451172, 13.751300811767578, 15.054988861083984, 16.35867691040039, 17.66236686706543, 18.966054916381836, 20.269742965698242, 21.57343292236328, 22.877120971679688, 24.180809020996094, 25.4844970703125, 26.788185119628906, 28.091875076293945, 29.39556312561035, 30.699251174926758, 32.0029411315918, 33.3066291809082, 34.61031723022461, 35.914005279541016, 37.21769332885742, 38.52138137817383, 39.8250732421875, 41.128761291503906, 42.43244934082031, 43.73613739013672, 45.039825439453125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 9.0, 14.0, 7.0, 14.0, 11.0, 24.0, 24.0, 26.0, 27.0, 24.0, 37.0, 36.0, 29.0, 31.0, 38.0, 33.0, 48.0, 36.0, 45.0, 41.0, 41.0, 40.0, 32.0, 36.0, 33.0, 27.0, 29.0, 27.0, 32.0, 17.0, 18.0, 18.0, 15.0, 13.0, 14.0, 10.0, 8.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.391357421875, -3.27880859375, -3.166259765625, -3.0537109375, -2.941162109375, -2.82861328125, -2.716064453125, -2.603515625, -2.490966796875, -2.37841796875, -2.265869140625, -2.1533203125, -2.040771484375, -1.92822265625, -1.815673828125, -1.703125, -1.590576171875, -1.47802734375, -1.365478515625, -1.2529296875, -1.140380859375, -1.02783203125, -0.915283203125, -0.802734375, -0.690185546875, -0.57763671875, -0.465087890625, -0.3525390625, -0.239990234375, -0.12744140625, -0.014892578125, 0.09765625, 0.210205078125, 0.32275390625, 0.435302734375, 0.5478515625, 0.660400390625, 0.77294921875, 0.885498046875, 0.998046875, 1.110595703125, 1.22314453125, 1.335693359375, 1.4482421875, 1.560791015625, 1.67333984375, 1.785888671875, 1.8984375, 2.010986328125, 2.12353515625, 2.236083984375, 2.3486328125, 2.461181640625, 2.57373046875, 2.686279296875, 2.798828125, 2.911376953125, 3.02392578125, 3.136474609375, 3.2490234375, 3.361572265625, 3.47412109375, 3.586669921875, 3.69921875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 9.0, 9.0, 10.0, 15.0, 26.0, 39.0, 42.0, 67.0, 124.0, 176.0, 279.0, 365.0, 590.0, 900.0, 1421.0, 2268.0, 3491.0, 5553.0, 8798.0, 13740.0, 21860.0, 34437.0, 54994.0, 86747.0, 128681.0, 166960.0, 164962.0, 124939.0, 83766.0, 53244.0, 32825.0, 20669.0, 13184.0, 8207.0, 5436.0, 3408.0, 2273.0, 1409.0, 937.0, 606.0, 376.0, 247.0, 165.0, 104.0, 72.0, 55.0, 33.0, 16.0, 10.0, 7.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31689453125, -0.3063163757324219, -0.29573822021484375, -0.2851600646972656, -0.2745819091796875, -0.2640037536621094, -0.25342559814453125, -0.24284744262695312, -0.232269287109375, -0.22169113159179688, -0.21111297607421875, -0.20053482055664062, -0.1899566650390625, -0.17937850952148438, -0.16880035400390625, -0.15822219848632812, -0.14764404296875, -0.13706588745117188, -0.12648773193359375, -0.11590957641601562, -0.1053314208984375, -0.09475326538085938, -0.08417510986328125, -0.07359695434570312, -0.063018798828125, -0.052440643310546875, -0.04186248779296875, -0.031284332275390625, -0.0207061767578125, -0.010128021240234375, 0.00045013427734375, 0.011028289794921875, 0.0216064453125, 0.032184600830078125, 0.04276275634765625, 0.053340911865234375, 0.0639190673828125, 0.07449722290039062, 0.08507537841796875, 0.09565353393554688, 0.106231689453125, 0.11680984497070312, 0.12738800048828125, 0.13796615600585938, 0.1485443115234375, 0.15912246704101562, 0.16970062255859375, 0.18027877807617188, 0.19085693359375, 0.20143508911132812, 0.21201324462890625, 0.22259140014648438, 0.2331695556640625, 0.24374771118164062, 0.25432586669921875, 0.2649040222167969, 0.275482177734375, 0.2860603332519531, 0.29663848876953125, 0.3072166442871094, 0.3177947998046875, 0.3283729553222656, 0.33895111083984375, 0.3495292663574219, 0.360107421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 1.0, 5.0, 6.0, 7.0, 6.0, 12.0, 12.0, 16.0, 19.0, 20.0, 20.0, 14.0, 17.0, 22.0, 26.0, 31.0, 34.0, 47.0, 34.0, 34.0, 37.0, 36.0, 23.0, 1070.0, 39.0, 31.0, 40.0, 35.0, 38.0, 28.0, 31.0, 32.0, 22.0, 20.0, 24.0, 12.0, 20.0, 18.0, 10.0, 10.0, 10.0, 13.0, 6.0, 8.0, 6.0, 7.0, 3.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.13671875, -2.070220947265625, -2.00372314453125, -1.937225341796875, -1.8707275390625, -1.804229736328125, -1.73773193359375, -1.671234130859375, -1.604736328125, -1.538238525390625, -1.47174072265625, -1.405242919921875, -1.3387451171875, -1.272247314453125, -1.20574951171875, -1.139251708984375, -1.07275390625, -1.006256103515625, -0.93975830078125, -0.873260498046875, -0.8067626953125, -0.740264892578125, -0.67376708984375, -0.607269287109375, -0.540771484375, -0.474273681640625, -0.40777587890625, -0.341278076171875, -0.2747802734375, -0.208282470703125, -0.14178466796875, -0.075286865234375, -0.0087890625, 0.057708740234375, 0.12420654296875, 0.190704345703125, 0.2572021484375, 0.323699951171875, 0.39019775390625, 0.456695556640625, 0.523193359375, 0.589691162109375, 0.65618896484375, 0.722686767578125, 0.7891845703125, 0.855682373046875, 0.92218017578125, 0.988677978515625, 1.05517578125, 1.121673583984375, 1.18817138671875, 1.254669189453125, 1.3211669921875, 1.387664794921875, 1.45416259765625, 1.520660400390625, 1.587158203125, 1.653656005859375, 1.72015380859375, 1.786651611328125, 1.8531494140625, 1.919647216796875, 1.98614501953125, 2.052642822265625, 2.119140625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 12.0, 9.0, 26.0, 40.0, 47.0, 71.0, 113.0, 189.0, 288.0, 392.0, 596.0, 898.0, 1276.0, 1980.0, 2923.0, 4484.0, 6750.0, 10392.0, 16044.0, 24488.0, 37486.0, 56461.0, 82342.0, 112032.0, 140137.0, 1187833.0, 122692.0, 93895.0, 65636.0, 44116.0, 28609.0, 19140.0, 12333.0, 7898.0, 5185.0, 3430.0, 2292.0, 1509.0, 1023.0, 690.0, 478.0, 279.0, 221.0, 144.0, 86.0, 58.0, 40.0, 27.0, 24.0, 9.0, 9.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2218017578125, -0.2142047882080078, -0.20660781860351562, -0.19901084899902344, -0.19141387939453125, -0.18381690979003906, -0.17621994018554688, -0.1686229705810547, -0.1610260009765625, -0.1534290313720703, -0.14583206176757812, -0.13823509216308594, -0.13063812255859375, -0.12304115295410156, -0.11544418334960938, -0.10784721374511719, -0.100250244140625, -0.09265327453613281, -0.08505630493164062, -0.07745933532714844, -0.06986236572265625, -0.06226539611816406, -0.054668426513671875, -0.04707145690917969, -0.0394744873046875, -0.03187751770019531, -0.024280548095703125, -0.016683578491210938, -0.00908660888671875, -0.0014896392822265625, 0.006107330322265625, 0.013704299926757812, 0.02130126953125, 0.028898239135742188, 0.036495208740234375, 0.04409217834472656, 0.05168914794921875, 0.05928611755371094, 0.06688308715820312, 0.07448005676269531, 0.0820770263671875, 0.08967399597167969, 0.09727096557617188, 0.10486793518066406, 0.11246490478515625, 0.12006187438964844, 0.12765884399414062, 0.1352558135986328, 0.142852783203125, 0.1504497528076172, 0.15804672241210938, 0.16564369201660156, 0.17324066162109375, 0.18083763122558594, 0.18843460083007812, 0.1960315704345703, 0.2036285400390625, 0.2112255096435547, 0.21882247924804688, 0.22641944885253906, 0.23401641845703125, 0.24161338806152344, 0.24921035766601562, 0.2568073272705078, 0.264404296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 12.0, 13.0, 33.0, 29.0, 54.0, 40.0, 51.0, 69.0, 74.0, 61.0, 69.0, 72.0, 71.0, 56.0, 39.0, 49.0, 25.0, 37.0, 23.0, 19.0, 11.0, 11.0, 11.0, 7.0, 4.0, 7.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.001743316650390625, -0.0016871243715286255, -0.001630932092666626, -0.0015747398138046265, -0.001518547534942627, -0.0014623552560806274, -0.001406162977218628, -0.0013499706983566284, -0.001293778419494629, -0.0012375861406326294, -0.0011813938617706299, -0.0011252015829086304, -0.0010690093040466309, -0.0010128170251846313, -0.0009566247463226318, -0.0009004324674606323, -0.0008442401885986328, -0.0007880479097366333, -0.0007318556308746338, -0.0006756633520126343, -0.0006194710731506348, -0.0005632787942886353, -0.0005070865154266357, -0.00045089423656463623, -0.0003947019577026367, -0.0003385096788406372, -0.0002823173999786377, -0.00022612512111663818, -0.00016993284225463867, -0.00011374056339263916, -5.754828453063965e-05, -1.3560056686401367e-06, 5.4836273193359375e-05, 0.00011102855205535889, 0.0001672208309173584, 0.0002234131097793579, 0.0002796053886413574, 0.00033579766750335693, 0.00039198994636535645, 0.00044818222522735596, 0.0005043745040893555, 0.000560566782951355, 0.0006167590618133545, 0.000672951340675354, 0.0007291436195373535, 0.000785335898399353, 0.0008415281772613525, 0.000897720456123352, 0.0009539127349853516, 0.001010105013847351, 0.0010662972927093506, 0.00112248957157135, 0.0011786818504333496, 0.0012348741292953491, 0.0012910664081573486, 0.0013472586870193481, 0.0014034509658813477, 0.0014596432447433472, 0.0015158355236053467, 0.0015720278024673462, 0.0016282200813293457, 0.0016844123601913452, 0.0017406046390533447, 0.0017967969179153442, 0.0018529891967773438]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 7.0, 6.0, 6.0, 14.0, 9.0, 22.0, 22.0, 37.0, 52.0, 47.0, 95.0, 132.0, 274.0, 534.0, 2215.0, 1027659.0, 15870.0, 637.0, 286.0, 182.0, 139.0, 89.0, 64.0, 42.0, 29.0, 13.0, 23.0, 14.0, 4.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.041717529296875, -0.04047822952270508, -0.039238929748535156, -0.037999629974365234, -0.03676033020019531, -0.03552103042602539, -0.03428173065185547, -0.03304243087768555, -0.031803131103515625, -0.030563831329345703, -0.02932453155517578, -0.02808523178100586, -0.026845932006835938, -0.025606632232666016, -0.024367332458496094, -0.023128032684326172, -0.02188873291015625, -0.020649433135986328, -0.019410133361816406, -0.018170833587646484, -0.016931533813476562, -0.01569223403930664, -0.014452934265136719, -0.013213634490966797, -0.011974334716796875, -0.010735034942626953, -0.009495735168457031, -0.00825643539428711, -0.0070171356201171875, -0.005777835845947266, -0.004538536071777344, -0.003299236297607422, -0.0020599365234375, -0.0008206367492675781, 0.00041866302490234375, 0.0016579627990722656, 0.0028972625732421875, 0.004136562347412109, 0.005375862121582031, 0.006615161895751953, 0.007854461669921875, 0.009093761444091797, 0.010333061218261719, 0.01157236099243164, 0.012811660766601562, 0.014050960540771484, 0.015290260314941406, 0.016529560089111328, 0.01776885986328125, 0.019008159637451172, 0.020247459411621094, 0.021486759185791016, 0.022726058959960938, 0.02396535873413086, 0.02520465850830078, 0.026443958282470703, 0.027683258056640625, 0.028922557830810547, 0.03016185760498047, 0.03140115737915039, 0.03264045715332031, 0.033879756927490234, 0.035119056701660156, 0.03635835647583008, 0.03759765625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 103.0, 856.0, 55.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00784197449684143, -0.007533687632530928, -0.007225400302559137, -0.006917113438248634, -0.006608826108276844, -0.006300539243966341, -0.005992252379655838, -0.005683965049684048, -0.005375677719712257, -0.005067390855401754, -0.004759103525429964, -0.004450816661119461, -0.004142529331147671, -0.0038342424668371677, -0.003525955369696021, -0.0032176682725548744, -0.0029093814082443714, -0.0026010943111032248, -0.002292807213962078, -0.001984520349651575, -0.0016762331360951066, -0.00136794603895396, -0.0010596590582281351, -0.0007513719610869884, -0.0004430848639458418, -0.00013479779590852559, 0.00017348927212879062, 0.00048177631106227636, 0.000790063408203423, 0.0010983505053445697, 0.0014066374860703945, 0.0017149245832115412, 0.002023211680352688, 0.0023314987774938345, 0.002639785874634981, 0.002948072738945484, 0.0032563600689172745, 0.0035646469332277775, 0.003872934030368924, 0.004181221127510071, 0.004489508457481861, 0.004797795321792364, 0.0051060826517641544, 0.0054143695160746574, 0.005722656846046448, 0.006030943710356951, 0.006339230574667454, 0.006647517904639244, 0.006955804768949747, 0.00726409163326025, 0.00757237896323204, 0.00788066629320383, 0.008188952691853046, 0.008497240021824837, 0.008805527351796627, 0.009113814681768417, 0.009422101080417633, 0.009730388410389423, 0.010038674809038639, 0.01034696213901043, 0.01065524946898222, 0.01096353679895401, 0.011271823197603226, 0.011580110527575016, 0.011888397857546806]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 11.0, 8.0, 14.0, 15.0, 8.0, 17.0, 21.0, 17.0, 16.0, 21.0, 26.0, 26.0, 18.0, 23.0, 36.0, 42.0, 36.0, 39.0, 32.0, 29.0, 43.0, 45.0, 40.0, 45.0, 37.0, 34.0, 37.0, 35.0, 18.0, 29.0, 25.0, 24.0, 19.0, 11.0, 15.0, 16.0, 11.0, 7.0, 9.0, 6.0, 4.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0008956789970397949, -0.0008698729798197746, -0.0008440669625997543, -0.000818260945379734, -0.0007924549281597137, -0.0007666489109396935, -0.0007408428937196732, -0.0007150368764996529, -0.0006892308592796326, -0.0006634248420596123, -0.000637618824839592, -0.0006118128076195717, -0.0005860067903995514, -0.0005602007731795311, -0.0005343947559595108, -0.0005085887387394905, -0.0004827827215194702, -0.0004569767042994499, -0.0004311706870794296, -0.00040536466985940933, -0.00037955865263938904, -0.00035375263541936874, -0.00032794661819934845, -0.00030214060097932816, -0.00027633458375930786, -0.00025052856653928757, -0.00022472254931926727, -0.00019891653209924698, -0.00017311051487922668, -0.0001473044976592064, -0.0001214984804391861, -9.56924632191658e-05, -6.988644599914551e-05, -4.4080428779125214e-05, -1.827441155910492e-05, 7.531605660915375e-06, 3.333762288093567e-05, 5.914364010095596e-05, 8.494965732097626e-05, 0.00011075567454099655, 0.00013656169176101685, 0.00016236770898103714, 0.00018817372620105743, 0.00021397974342107773, 0.00023978576064109802, 0.0002655917778611183, 0.0002913977950811386, 0.0003172038123011589, 0.0003430098295211792, 0.0003688158467411995, 0.0003946218639612198, 0.0004204278811812401, 0.0004462338984012604, 0.00047203991562128067, 0.000497845932841301, 0.0005236519500613213, 0.0005494579672813416, 0.0005752639845013618, 0.0006010700017213821, 0.0006268760189414024, 0.0006526820361614227, 0.000678488053381443, 0.0007042940706014633, 0.0007301000878214836, 0.0007559061050415039]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 9.0, 14.0, 7.0, 14.0, 11.0, 24.0, 24.0, 26.0, 27.0, 24.0, 37.0, 36.0, 29.0, 31.0, 38.0, 33.0, 48.0, 36.0, 45.0, 41.0, 41.0, 40.0, 32.0, 36.0, 33.0, 27.0, 29.0, 27.0, 32.0, 17.0, 18.0, 18.0, 15.0, 13.0, 14.0, 10.0, 8.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.391357421875, -3.27880859375, -3.166259765625, -3.0537109375, -2.941162109375, -2.82861328125, -2.716064453125, -2.603515625, -2.490966796875, -2.37841796875, -2.265869140625, -2.1533203125, -2.040771484375, -1.92822265625, -1.815673828125, -1.703125, -1.590576171875, -1.47802734375, -1.365478515625, -1.2529296875, -1.140380859375, -1.02783203125, -0.915283203125, -0.802734375, -0.690185546875, -0.57763671875, -0.465087890625, -0.3525390625, -0.239990234375, -0.12744140625, -0.014892578125, 0.09765625, 0.210205078125, 0.32275390625, 0.435302734375, 0.5478515625, 0.660400390625, 0.77294921875, 0.885498046875, 0.998046875, 1.110595703125, 1.22314453125, 1.335693359375, 1.4482421875, 1.560791015625, 1.67333984375, 1.785888671875, 1.8984375, 2.010986328125, 2.12353515625, 2.236083984375, 2.3486328125, 2.461181640625, 2.57373046875, 2.686279296875, 2.798828125, 2.911376953125, 3.02392578125, 3.136474609375, 3.2490234375, 3.361572265625, 3.47412109375, 3.586669921875, 3.69921875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 8.0, 12.0, 22.0, 36.0, 47.0, 75.0, 93.0, 154.0, 202.0, 347.0, 506.0, 805.0, 1379.0, 2394.0, 4576.0, 9441.0, 22433.0, 57473.0, 170589.0, 427398.0, 224800.0, 74072.0, 27449.0, 11618.0, 5589.0, 2877.0, 1595.0, 936.0, 543.0, 357.0, 225.0, 170.0, 106.0, 70.0, 52.0, 44.0, 15.0, 15.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.771484375, -2.683837890625, -2.59619140625, -2.508544921875, -2.4208984375, -2.333251953125, -2.24560546875, -2.157958984375, -2.0703125, -1.982666015625, -1.89501953125, -1.807373046875, -1.7197265625, -1.632080078125, -1.54443359375, -1.456787109375, -1.369140625, -1.281494140625, -1.19384765625, -1.106201171875, -1.0185546875, -0.930908203125, -0.84326171875, -0.755615234375, -0.66796875, -0.580322265625, -0.49267578125, -0.405029296875, -0.3173828125, -0.229736328125, -0.14208984375, -0.054443359375, 0.033203125, 0.120849609375, 0.20849609375, 0.296142578125, 0.3837890625, 0.471435546875, 0.55908203125, 0.646728515625, 0.734375, 0.822021484375, 0.90966796875, 0.997314453125, 1.0849609375, 1.172607421875, 1.26025390625, 1.347900390625, 1.435546875, 1.523193359375, 1.61083984375, 1.698486328125, 1.7861328125, 1.873779296875, 1.96142578125, 2.049072265625, 2.13671875, 2.224365234375, 2.31201171875, 2.399658203125, 2.4873046875, 2.574951171875, 2.66259765625, 2.750244140625, 2.837890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 14.0, 16.0, 10.0, 20.0, 20.0, 21.0, 22.0, 33.0, 33.0, 32.0, 35.0, 46.0, 47.0, 73.0, 109.0, 1749.0, 286.0, 90.0, 50.0, 55.0, 56.0, 45.0, 37.0, 23.0, 20.0, 23.0, 15.0, 15.0, 17.0, 10.0, 10.0, 6.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.906005859375, -12.40576171875, -11.905517578125, -11.4052734375, -10.905029296875, -10.40478515625, -9.904541015625, -9.404296875, -8.904052734375, -8.40380859375, -7.903564453125, -7.4033203125, -6.903076171875, -6.40283203125, -5.902587890625, -5.40234375, -4.902099609375, -4.40185546875, -3.901611328125, -3.4013671875, -2.901123046875, -2.40087890625, -1.900634765625, -1.400390625, -0.900146484375, -0.39990234375, 0.100341796875, 0.6005859375, 1.100830078125, 1.60107421875, 2.101318359375, 2.6015625, 3.101806640625, 3.60205078125, 4.102294921875, 4.6025390625, 5.102783203125, 5.60302734375, 6.103271484375, 6.603515625, 7.103759765625, 7.60400390625, 8.104248046875, 8.6044921875, 9.104736328125, 9.60498046875, 10.105224609375, 10.60546875, 11.105712890625, 11.60595703125, 12.106201171875, 12.6064453125, 13.106689453125, 13.60693359375, 14.107177734375, 14.607421875, 15.107666015625, 15.60791015625, 16.108154296875, 16.6083984375, 17.108642578125, 17.60888671875, 18.109130859375, 18.609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 7.0, 20.0, 14.0, 17.0, 30.0, 28.0, 37.0, 56.0, 76.0, 118.0, 205.0, 407.0, 1343.0, 24443.0, 3095118.0, 21446.0, 1240.0, 421.0, 220.0, 128.0, 68.0, 45.0, 43.0, 29.0, 28.0, 23.0, 19.0, 17.0, 7.0, 17.0, 9.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.357177734375, -27.55810546875, -26.759033203125, -25.9599609375, -25.160888671875, -24.36181640625, -23.562744140625, -22.763671875, -21.964599609375, -21.16552734375, -20.366455078125, -19.5673828125, -18.768310546875, -17.96923828125, -17.170166015625, -16.37109375, -15.572021484375, -14.77294921875, -13.973876953125, -13.1748046875, -12.375732421875, -11.57666015625, -10.777587890625, -9.978515625, -9.179443359375, -8.38037109375, -7.581298828125, -6.7822265625, -5.983154296875, -5.18408203125, -4.385009765625, -3.5859375, -2.786865234375, -1.98779296875, -1.188720703125, -0.3896484375, 0.409423828125, 1.20849609375, 2.007568359375, 2.806640625, 3.605712890625, 4.40478515625, 5.203857421875, 6.0029296875, 6.802001953125, 7.60107421875, 8.400146484375, 9.19921875, 9.998291015625, 10.79736328125, 11.596435546875, 12.3955078125, 13.194580078125, 13.99365234375, 14.792724609375, 15.591796875, 16.390869140625, 17.18994140625, 17.989013671875, 18.7880859375, 19.587158203125, 20.38623046875, 21.185302734375, 21.984375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 384.0, 623.0, 9.0], "bins": [-227.7459716796875, -224.0773468017578, -220.40872192382812, -216.74009704589844, -213.07147216796875, -209.40286254882812, -205.73423767089844, -202.06561279296875, -198.39698791503906, -194.72836303710938, -191.0597381591797, -187.39111328125, -183.72250366210938, -180.0538787841797, -176.38525390625, -172.7166290283203, -169.04800415039062, -165.37937927246094, -161.71075439453125, -158.04212951660156, -154.37350463867188, -150.70489501953125, -147.03627014160156, -143.36764526367188, -139.6990203857422, -136.0303955078125, -132.3617706298828, -128.69314575195312, -125.02452850341797, -121.35590362548828, -117.68728637695312, -114.01866149902344, -110.35004425048828, -106.6814193725586, -103.01280212402344, -99.34417724609375, -95.67555236816406, -92.00692749023438, -88.33830261230469, -84.66968536376953, -81.00106048583984, -77.33243560791016, -73.663818359375, -69.99519348144531, -66.32656860351562, -62.65794372558594, -58.989322662353516, -55.320701599121094, -51.652076721191406, -47.98345184326172, -44.3148307800293, -40.646209716796875, -36.97758483886719, -33.3089599609375, -29.640338897705078, -25.971715927124023, -22.30309295654297, -18.634469985961914, -14.96584701538086, -11.297224044799805, -7.62860107421875, -3.9599781036376953, -0.2913551330566406, 3.377267837524414, 7.045891284942627]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 8.0, 5.0, 11.0, 16.0, 14.0, 16.0, 15.0, 14.0, 19.0, 26.0, 35.0, 39.0, 33.0, 35.0, 27.0, 32.0, 37.0, 39.0, 28.0, 37.0, 45.0, 46.0, 32.0, 36.0, 41.0, 32.0, 33.0, 25.0, 20.0, 27.0, 20.0, 22.0, 28.0, 10.0, 12.0, 10.0, 9.0, 8.0, 11.0, 8.0, 6.0, 9.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.27000427246094, -34.0894775390625, -32.90895080566406, -31.728422164916992, -30.547895431518555, -29.367368698120117, -28.186840057373047, -27.00631332397461, -25.825786590576172, -24.645259857177734, -23.464733123779297, -22.284204483032227, -21.10367774963379, -19.92315101623535, -18.74262237548828, -17.562095642089844, -16.381568908691406, -15.201042175292969, -14.020514488220215, -12.839986801147461, -11.659460067749023, -10.478933334350586, -9.298405647277832, -8.117877960205078, -6.937351226806641, -5.756824016571045, -4.576296806335449, -3.3957695960998535, -2.215242385864258, -1.034715175628662, 0.1458120346069336, 1.3263397216796875, 2.5068702697753906, 3.6873974800109863, 4.867924690246582, 6.048451900482178, 7.228979110717773, 8.409505844116211, 9.590033531188965, 10.770561218261719, 11.951087951660156, 13.131614685058594, 14.312142372131348, 15.492670059204102, 16.67319679260254, 17.853723526000977, 19.034252166748047, 20.214778900146484, 21.395305633544922, 22.57583236694336, 23.756359100341797, 24.936887741088867, 26.117414474487305, 27.297941207885742, 28.478469848632812, 29.65899658203125, 30.839523315429688, 32.020050048828125, 33.20057678222656, 34.381103515625, 35.56163024902344, 36.74216079711914, 37.92268753051758, 39.103214263916016, 40.28374099731445]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 11.0, 7.0, 16.0, 12.0, 9.0, 15.0, 24.0, 23.0, 30.0, 27.0, 25.0, 36.0, 31.0, 28.0, 45.0, 34.0, 35.0, 43.0, 46.0, 48.0, 41.0, 37.0, 48.0, 29.0, 38.0, 28.0, 25.0, 28.0, 31.0, 25.0, 25.0, 13.0, 12.0, 21.0, 11.0, 11.0, 13.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65234375, -3.5338134765625, -3.415283203125, -3.2967529296875, -3.17822265625, -3.0596923828125, -2.941162109375, -2.8226318359375, -2.7041015625, -2.5855712890625, -2.467041015625, -2.3485107421875, -2.22998046875, -2.1114501953125, -1.992919921875, -1.8743896484375, -1.755859375, -1.6373291015625, -1.518798828125, -1.4002685546875, -1.28173828125, -1.1632080078125, -1.044677734375, -0.9261474609375, -0.8076171875, -0.6890869140625, -0.570556640625, -0.4520263671875, -0.33349609375, -0.2149658203125, -0.096435546875, 0.0220947265625, 0.140625, 0.2591552734375, 0.377685546875, 0.4962158203125, 0.61474609375, 0.7332763671875, 0.851806640625, 0.9703369140625, 1.0888671875, 1.2073974609375, 1.325927734375, 1.4444580078125, 1.56298828125, 1.6815185546875, 1.800048828125, 1.9185791015625, 2.037109375, 2.1556396484375, 2.274169921875, 2.3927001953125, 2.51123046875, 2.6297607421875, 2.748291015625, 2.8668212890625, 2.9853515625, 3.1038818359375, 3.222412109375, 3.3409423828125, 3.45947265625, 3.5780029296875, 3.696533203125, 3.8150634765625, 3.93359375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 9.0, 15.0, 9.0, 17.0, 22.0, 25.0, 48.0, 57.0, 97.0, 157.0, 327.0, 718.0, 1702.0, 4850.0, 15756.0, 57083.0, 306449.0, 1825947.0, 1646359.0, 262055.0, 50948.0, 14188.0, 4322.0, 1683.0, 633.0, 297.0, 152.0, 94.0, 74.0, 41.0, 22.0, 26.0, 20.0, 12.0, 12.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7567138671875, -7.497802734375, -7.2388916015625, -6.97998046875, -6.7210693359375, -6.462158203125, -6.2032470703125, -5.9443359375, -5.6854248046875, -5.426513671875, -5.1676025390625, -4.90869140625, -4.6497802734375, -4.390869140625, -4.1319580078125, -3.873046875, -3.6141357421875, -3.355224609375, -3.0963134765625, -2.83740234375, -2.5784912109375, -2.319580078125, -2.0606689453125, -1.8017578125, -1.5428466796875, -1.283935546875, -1.0250244140625, -0.76611328125, -0.5072021484375, -0.248291015625, 0.0106201171875, 0.26953125, 0.5284423828125, 0.787353515625, 1.0462646484375, 1.30517578125, 1.5640869140625, 1.822998046875, 2.0819091796875, 2.3408203125, 2.5997314453125, 2.858642578125, 3.1175537109375, 3.37646484375, 3.6353759765625, 3.894287109375, 4.1531982421875, 4.412109375, 4.6710205078125, 4.929931640625, 5.1888427734375, 5.44775390625, 5.7066650390625, 5.965576171875, 6.2244873046875, 6.4833984375, 6.7423095703125, 7.001220703125, 7.2601318359375, 7.51904296875, 7.7779541015625, 8.036865234375, 8.2957763671875, 8.5546875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 3.0, 11.0, 17.0, 29.0, 59.0, 84.0, 96.0, 180.0, 282.0, 399.0, 575.0, 616.0, 551.0, 385.0, 272.0, 176.0, 120.0, 76.0, 45.0, 23.0, 24.0, 13.0, 12.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.5657958984375, -16.084716796875, -15.6036376953125, -15.12255859375, -14.6414794921875, -14.160400390625, -13.6793212890625, -13.1982421875, -12.7171630859375, -12.236083984375, -11.7550048828125, -11.27392578125, -10.7928466796875, -10.311767578125, -9.8306884765625, -9.349609375, -8.8685302734375, -8.387451171875, -7.9063720703125, -7.42529296875, -6.9442138671875, -6.463134765625, -5.9820556640625, -5.5009765625, -5.0198974609375, -4.538818359375, -4.0577392578125, -3.57666015625, -3.0955810546875, -2.614501953125, -2.1334228515625, -1.65234375, -1.1712646484375, -0.690185546875, -0.2091064453125, 0.27197265625, 0.7530517578125, 1.234130859375, 1.7152099609375, 2.1962890625, 2.6773681640625, 3.158447265625, 3.6395263671875, 4.12060546875, 4.6016845703125, 5.082763671875, 5.5638427734375, 6.044921875, 6.5260009765625, 7.007080078125, 7.4881591796875, 7.96923828125, 8.4503173828125, 8.931396484375, 9.4124755859375, 9.8935546875, 10.3746337890625, 10.855712890625, 11.3367919921875, 11.81787109375, 12.2989501953125, 12.780029296875, 13.2611083984375, 13.7421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 6.0, 8.0, 12.0, 21.0, 42.0, 44.0, 83.0, 163.0, 243.0, 512.0, 1429.0, 9940.0, 1166668.0, 2993595.0, 18447.0, 1790.0, 602.0, 258.0, 152.0, 102.0, 49.0, 45.0, 15.0, 17.0, 5.0, 9.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.59375, -32.19921875, -30.8046875, -29.41015625, -28.015625, -26.62109375, -25.2265625, -23.83203125, -22.4375, -21.04296875, -19.6484375, -18.25390625, -16.859375, -15.46484375, -14.0703125, -12.67578125, -11.28125, -9.88671875, -8.4921875, -7.09765625, -5.703125, -4.30859375, -2.9140625, -1.51953125, -0.125, 1.26953125, 2.6640625, 4.05859375, 5.453125, 6.84765625, 8.2421875, 9.63671875, 11.03125, 12.42578125, 13.8203125, 15.21484375, 16.609375, 18.00390625, 19.3984375, 20.79296875, 22.1875, 23.58203125, 24.9765625, 26.37109375, 27.765625, 29.16015625, 30.5546875, 31.94921875, 33.34375, 34.73828125, 36.1328125, 37.52734375, 38.921875, 40.31640625, 41.7109375, 43.10546875, 44.5, 45.89453125, 47.2890625, 48.68359375, 50.078125, 51.47265625, 52.8671875, 54.26171875, 55.65625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 25.0, 157.0, 381.0, 330.0, 100.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-297.197998046875, -291.6805114746094, -286.1630554199219, -280.64556884765625, -275.12811279296875, -269.6106262207031, -264.0931701660156, -258.57568359375, -253.05821228027344, -247.54074096679688, -242.0232696533203, -236.50579833984375, -230.9883270263672, -225.47085571289062, -219.953369140625, -214.43589782714844, -208.91842651367188, -203.4009552001953, -197.88348388671875, -192.3660125732422, -186.84854125976562, -181.3310546875, -175.8135986328125, -170.29611206054688, -164.77865600585938, -159.2611846923828, -153.74371337890625, -148.2262420654297, -142.70877075195312, -137.1912841796875, -131.673828125, -126.15634155273438, -120.63887786865234, -115.12140655517578, -109.60393524169922, -104.08645629882812, -98.56898498535156, -93.051513671875, -87.53404235839844, -82.01657104492188, -76.49909973144531, -70.98162841796875, -65.46415710449219, -59.94668197631836, -54.42920684814453, -48.91173553466797, -43.394264221191406, -37.87678909301758, -32.35931396484375, -26.841840744018555, -21.32436752319336, -15.806896209716797, -10.289422988891602, -4.771949768066406, 0.7455215454101562, 6.262996673583984, 11.780467987060547, 17.297941207885742, 22.815414428710938, 28.3328857421875, 33.85035705566406, 39.36783218383789, 44.88530349731445, 50.40277862548828, 55.920249938964844]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 10.0, 15.0, 8.0, 16.0, 15.0, 12.0, 28.0, 20.0, 29.0, 29.0, 18.0, 25.0, 30.0, 37.0, 33.0, 26.0, 45.0, 41.0, 39.0, 48.0, 28.0, 46.0, 43.0, 32.0, 50.0, 34.0, 34.0, 20.0, 25.0, 20.0, 18.0, 14.0, 17.0, 20.0, 12.0, 11.0, 9.0, 3.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.244903564453125, -32.07333755493164, -30.90176773071289, -29.730201721191406, -28.55863380432129, -27.387065887451172, -26.215499877929688, -25.04393196105957, -23.872364044189453, -22.700796127319336, -21.52922821044922, -20.357662200927734, -19.186094284057617, -18.0145263671875, -16.842960357666016, -15.671392440795898, -14.499824523925781, -13.328256607055664, -12.156689643859863, -10.985122680664062, -9.813554763793945, -8.641986846923828, -7.470419883728027, -6.298852920532227, -5.127285003662109, -3.9557175636291504, -2.7841501235961914, -1.6125826835632324, -0.44101524353027344, 0.7305521965026855, 1.9021196365356445, 3.0736865997314453, 4.2452545166015625, 5.4168219566345215, 6.5883893966674805, 7.7599568367004395, 8.931524276733398, 10.103092193603516, 11.274659156799316, 12.446226119995117, 13.617794036865234, 14.789361953735352, 15.960928916931152, 17.132495880126953, 18.30406379699707, 19.475631713867188, 20.647197723388672, 21.81876564025879, 22.990333557128906, 24.161901473999023, 25.33346939086914, 26.505035400390625, 27.676603317260742, 28.84817123413086, 30.019737243652344, 31.19130516052246, 32.36287307739258, 33.53443908691406, 34.70600891113281, 35.8775749206543, 37.04914093017578, 38.22071075439453, 39.392276763916016, 40.5638427734375, 41.73541259765625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 12.0, 17.0, 5.0, 17.0, 20.0, 19.0, 23.0, 25.0, 21.0, 23.0, 39.0, 34.0, 32.0, 42.0, 35.0, 43.0, 36.0, 44.0, 42.0, 47.0, 37.0, 43.0, 34.0, 32.0, 40.0, 28.0, 38.0, 22.0, 28.0, 23.0, 22.0, 14.0, 15.0, 9.0, 7.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.0234375, -3.89739990234375, -3.7713623046875, -3.64532470703125, -3.519287109375, -3.39324951171875, -3.2672119140625, -3.14117431640625, -3.01513671875, -2.88909912109375, -2.7630615234375, -2.63702392578125, -2.510986328125, -2.38494873046875, -2.2589111328125, -2.13287353515625, -2.0068359375, -1.88079833984375, -1.7547607421875, -1.62872314453125, -1.502685546875, -1.37664794921875, -1.2506103515625, -1.12457275390625, -0.99853515625, -0.87249755859375, -0.7464599609375, -0.62042236328125, -0.494384765625, -0.36834716796875, -0.2423095703125, -0.11627197265625, 0.009765625, 0.13580322265625, 0.2618408203125, 0.38787841796875, 0.513916015625, 0.63995361328125, 0.7659912109375, 0.89202880859375, 1.01806640625, 1.14410400390625, 1.2701416015625, 1.39617919921875, 1.522216796875, 1.64825439453125, 1.7742919921875, 1.90032958984375, 2.0263671875, 2.15240478515625, 2.2784423828125, 2.40447998046875, 2.530517578125, 2.65655517578125, 2.7825927734375, 2.90863037109375, 3.03466796875, 3.16070556640625, 3.2867431640625, 3.41278076171875, 3.538818359375, 3.66485595703125, 3.7908935546875, 3.91693115234375, 4.04296875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 7.0, 9.0, 23.0, 26.0, 28.0, 45.0, 77.0, 102.0, 139.0, 204.0, 276.0, 426.0, 572.0, 887.0, 1217.0, 1689.0, 2660.0, 3941.0, 5714.0, 8150.0, 12178.0, 18408.0, 28168.0, 43013.0, 65686.0, 96781.0, 133603.0, 158128.0, 142731.0, 106426.0, 73726.0, 48252.0, 31602.0, 20491.0, 14025.0, 9076.0, 6227.0, 4361.0, 2948.0, 1976.0, 1379.0, 933.0, 670.0, 484.0, 332.0, 249.0, 169.0, 114.0, 64.0, 53.0, 35.0, 20.0, 18.0, 15.0, 9.0, 6.0, 3.0, 6.0], "bins": [-0.355712890625, -0.3451385498046875, -0.334564208984375, -0.3239898681640625, -0.31341552734375, -0.3028411865234375, -0.292266845703125, -0.2816925048828125, -0.2711181640625, -0.2605438232421875, -0.249969482421875, -0.2393951416015625, -0.22882080078125, -0.2182464599609375, -0.207672119140625, -0.1970977783203125, -0.1865234375, -0.1759490966796875, -0.165374755859375, -0.1548004150390625, -0.14422607421875, -0.1336517333984375, -0.123077392578125, -0.1125030517578125, -0.1019287109375, -0.0913543701171875, -0.080780029296875, -0.0702056884765625, -0.05963134765625, -0.0490570068359375, -0.038482666015625, -0.0279083251953125, -0.017333984375, -0.0067596435546875, 0.003814697265625, 0.0143890380859375, 0.02496337890625, 0.0355377197265625, 0.046112060546875, 0.0566864013671875, 0.0672607421875, 0.0778350830078125, 0.088409423828125, 0.0989837646484375, 0.10955810546875, 0.1201324462890625, 0.130706787109375, 0.1412811279296875, 0.15185546875, 0.1624298095703125, 0.173004150390625, 0.1835784912109375, 0.19415283203125, 0.2047271728515625, 0.215301513671875, 0.2258758544921875, 0.2364501953125, 0.2470245361328125, 0.257598876953125, 0.2681732177734375, 0.27874755859375, 0.2893218994140625, 0.299896240234375, 0.3104705810546875, 0.321044921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 9.0, 7.0, 8.0, 8.0, 20.0, 14.0, 23.0, 16.0, 17.0, 26.0, 38.0, 35.0, 32.0, 51.0, 45.0, 52.0, 48.0, 31.0, 33.0, 1069.0, 28.0, 44.0, 35.0, 47.0, 35.0, 32.0, 31.0, 26.0, 31.0, 25.0, 18.0, 15.0, 21.0, 17.0, 10.0, 14.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-3.2734375, -3.187713623046875, -3.10198974609375, -3.016265869140625, -2.9305419921875, -2.844818115234375, -2.75909423828125, -2.673370361328125, -2.587646484375, -2.501922607421875, -2.41619873046875, -2.330474853515625, -2.2447509765625, -2.159027099609375, -2.07330322265625, -1.987579345703125, -1.90185546875, -1.816131591796875, -1.73040771484375, -1.644683837890625, -1.5589599609375, -1.473236083984375, -1.38751220703125, -1.301788330078125, -1.216064453125, -1.130340576171875, -1.04461669921875, -0.958892822265625, -0.8731689453125, -0.787445068359375, -0.70172119140625, -0.615997314453125, -0.5302734375, -0.444549560546875, -0.35882568359375, -0.273101806640625, -0.1873779296875, -0.101654052734375, -0.01593017578125, 0.069793701171875, 0.155517578125, 0.241241455078125, 0.32696533203125, 0.412689208984375, 0.4984130859375, 0.584136962890625, 0.66986083984375, 0.755584716796875, 0.84130859375, 0.927032470703125, 1.01275634765625, 1.098480224609375, 1.1842041015625, 1.269927978515625, 1.35565185546875, 1.441375732421875, 1.527099609375, 1.612823486328125, 1.69854736328125, 1.784271240234375, 1.8699951171875, 1.955718994140625, 2.04144287109375, 2.127166748046875, 2.212890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 12.0, 31.0, 51.0, 93.0, 109.0, 184.0, 259.0, 407.0, 617.0, 942.0, 1410.0, 2158.0, 3414.0, 5263.0, 8228.0, 12297.0, 19426.0, 29780.0, 44628.0, 64965.0, 90933.0, 118383.0, 1176537.0, 145716.0, 111943.0, 84123.0, 59332.0, 40206.0, 26304.0, 17317.0, 11234.0, 7292.0, 4738.0, 3107.0, 1993.0, 1238.0, 843.0, 564.0, 376.0, 238.0, 125.0, 113.0, 77.0, 49.0, 19.0, 22.0, 10.0, 8.0, 2.0, 4.0], "bins": [-0.30224609375, -0.2940483093261719, -0.28585052490234375, -0.2776527404785156, -0.2694549560546875, -0.2612571716308594, -0.25305938720703125, -0.24486160278320312, -0.236663818359375, -0.22846603393554688, -0.22026824951171875, -0.21207046508789062, -0.2038726806640625, -0.19567489624023438, -0.18747711181640625, -0.17927932739257812, -0.17108154296875, -0.16288375854492188, -0.15468597412109375, -0.14648818969726562, -0.1382904052734375, -0.13009262084960938, -0.12189483642578125, -0.11369705200195312, -0.105499267578125, -0.09730148315429688, -0.08910369873046875, -0.08090591430664062, -0.0727081298828125, -0.06451034545898438, -0.05631256103515625, -0.048114776611328125, -0.0399169921875, -0.031719207763671875, -0.02352142333984375, -0.015323638916015625, -0.0071258544921875, 0.001071929931640625, 0.00926971435546875, 0.017467498779296875, 0.025665283203125, 0.033863067626953125, 0.04206085205078125, 0.050258636474609375, 0.0584564208984375, 0.06665420532226562, 0.07485198974609375, 0.08304977416992188, 0.09124755859375, 0.09944534301757812, 0.10764312744140625, 0.11584091186523438, 0.1240386962890625, 0.13223648071289062, 0.14043426513671875, 0.14863204956054688, 0.156829833984375, 0.16502761840820312, 0.17322540283203125, 0.18142318725585938, 0.1896209716796875, 0.19781875610351562, 0.20601654052734375, 0.21421432495117188, 0.222412109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 1.0, 4.0, 1.0, 6.0, 4.0, 14.0, 12.0, 13.0, 18.0, 18.0, 14.0, 15.0, 28.0, 36.0, 41.0, 52.0, 53.0, 51.0, 50.0, 43.0, 51.0, 57.0, 58.0, 40.0, 53.0, 38.0, 29.0, 24.0, 27.0, 24.0, 19.0, 15.0, 20.0, 9.0, 11.0, 8.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.001674652099609375, -0.0016236752271652222, -0.0015726983547210693, -0.0015217214822769165, -0.0014707446098327637, -0.0014197677373886108, -0.001368790864944458, -0.0013178139925003052, -0.0012668371200561523, -0.0012158602476119995, -0.0011648833751678467, -0.0011139065027236938, -0.001062929630279541, -0.0010119527578353882, -0.0009609758853912354, -0.0009099990129470825, -0.0008590221405029297, -0.0008080452680587769, -0.000757068395614624, -0.0007060915231704712, -0.0006551146507263184, -0.0006041377782821655, -0.0005531609058380127, -0.0005021840333938599, -0.00045120716094970703, -0.0004002302885055542, -0.00034925341606140137, -0.00029827654361724854, -0.0002472996711730957, -0.00019632279872894287, -0.00014534592628479004, -9.436905384063721e-05, -4.3392181396484375e-05, 7.584691047668457e-06, 5.856156349182129e-05, 0.00010953843593597412, 0.00016051530838012695, 0.00021149218082427979, 0.0002624690532684326, 0.00031344592571258545, 0.0003644227981567383, 0.0004153996706008911, 0.00046637654304504395, 0.0005173534154891968, 0.0005683302879333496, 0.0006193071603775024, 0.0006702840328216553, 0.0007212609052658081, 0.0007722377777099609, 0.0008232146501541138, 0.0008741915225982666, 0.0009251683950424194, 0.0009761452674865723, 0.001027122139930725, 0.001078099012374878, 0.0011290758848190308, 0.0011800527572631836, 0.0012310296297073364, 0.0012820065021514893, 0.001332983374595642, 0.001383960247039795, 0.0014349371194839478, 0.0014859139919281006, 0.0015368908643722534, 0.0015878677368164062]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 1.0, 6.0, 9.0, 4.0, 7.0, 16.0, 8.0, 14.0, 15.0, 28.0, 36.0, 33.0, 57.0, 74.0, 106.0, 150.0, 230.0, 415.0, 990.0, 91492.0, 950934.0, 2458.0, 512.0, 281.0, 209.0, 139.0, 71.0, 55.0, 43.0, 41.0, 23.0, 26.0, 15.0, 12.0, 11.0, 5.0, 6.0, 1.0, 0.0, 4.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 3.0], "bins": [-0.043243408203125, -0.042081356048583984, -0.04091930389404297, -0.03975725173950195, -0.03859519958496094, -0.03743314743041992, -0.036271095275878906, -0.03510904312133789, -0.033946990966796875, -0.03278493881225586, -0.031622886657714844, -0.030460834503173828, -0.029298782348632812, -0.028136730194091797, -0.02697467803955078, -0.025812625885009766, -0.02465057373046875, -0.023488521575927734, -0.02232646942138672, -0.021164417266845703, -0.020002365112304688, -0.018840312957763672, -0.017678260803222656, -0.01651620864868164, -0.015354156494140625, -0.01419210433959961, -0.013030052185058594, -0.011868000030517578, -0.010705947875976562, -0.009543895721435547, -0.008381843566894531, -0.007219791412353516, -0.0060577392578125, -0.004895687103271484, -0.0037336349487304688, -0.002571582794189453, -0.0014095306396484375, -0.0002474784851074219, 0.0009145736694335938, 0.0020766258239746094, 0.003238677978515625, 0.004400730133056641, 0.005562782287597656, 0.006724834442138672, 0.007886886596679688, 0.009048938751220703, 0.010210990905761719, 0.011373043060302734, 0.01253509521484375, 0.013697147369384766, 0.014859199523925781, 0.016021251678466797, 0.017183303833007812, 0.018345355987548828, 0.019507408142089844, 0.02066946029663086, 0.021831512451171875, 0.02299356460571289, 0.024155616760253906, 0.025317668914794922, 0.026479721069335938, 0.027641773223876953, 0.02880382537841797, 0.029965877532958984, 0.0311279296875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 15.0, 698.0, 302.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001784109277650714, -0.0014131686184555292, -0.0010422280756756663, -0.0006712875328958035, -0.00030034687370061874, 7.059378549456596e-05, 0.000441534211859107, 0.0008124748710542917, 0.0011834155302494764, 0.0015543561894446611, 0.001925296732224524, 0.002296237275004387, 0.0026671779341995716, 0.0030381185933947563, 0.0034090590197592974, 0.003779999678954482, 0.004150940105319023, 0.004521880764514208, 0.0048928214237093925, 0.00526376161724329, 0.005634702742099762, 0.006005642935633659, 0.006376583594828844, 0.006747524254024029, 0.007118465378880501, 0.0074894060380756855, 0.00786034669727087, 0.008231286890804768, 0.00860222801566124, 0.008973168209195137, 0.009344108402729034, 0.009715049527585506, 0.010085990652441978, 0.010456930845975876, 0.010827871970832348, 0.011198812164366245, 0.011569753289222717, 0.011940693482756615, 0.012311633676290512, 0.012682574801146984, 0.013053515926003456, 0.013424456119537354, 0.013795397244393826, 0.014166337437927723, 0.014537278562784195, 0.014908218756318092, 0.01527915894985199, 0.015650101006031036, 0.016021039336919785, 0.016391979530453682, 0.01676291972398758, 0.017133861780166626, 0.017504801973700523, 0.01787574216723442, 0.018246682360768318, 0.018617622554302216, 0.018988564610481262, 0.01935950480401516, 0.019730444997549057, 0.020101387053728104, 0.020472327247262, 0.0208432674407959, 0.021214207634329796, 0.021585147827863693, 0.02195608988404274]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 13.0, 7.0, 9.0, 8.0, 13.0, 14.0, 21.0, 23.0, 21.0, 26.0, 32.0, 37.0, 37.0, 32.0, 39.0, 43.0, 28.0, 41.0, 42.0, 39.0, 37.0, 36.0, 42.0, 49.0, 34.0, 34.0, 28.0, 24.0, 16.0, 32.0, 15.0, 19.0, 18.0, 8.0, 17.0, 10.0, 9.0, 10.0, 7.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000985562801361084, -0.0009541893377900124, -0.0009228158742189407, -0.0008914424106478691, -0.0008600689470767975, -0.0008286954835057259, -0.0007973220199346542, -0.0007659485563635826, -0.000734575092792511, -0.0007032016292214394, -0.0006718281656503677, -0.0006404547020792961, -0.0006090812385082245, -0.0005777077749371529, -0.0005463343113660812, -0.0005149608477950096, -0.000483587384223938, -0.00045221392065286636, -0.00042084045708179474, -0.0003894669935107231, -0.0003580935299396515, -0.00032672006636857986, -0.00029534660279750824, -0.0002639731392264366, -0.000232599675655365, -0.00020122621208429337, -0.00016985274851322174, -0.00013847928494215012, -0.00010710582137107849, -7.573235780000687e-05, -4.435889422893524e-05, -1.2985430657863617e-05, 1.8388032913208008e-05, 4.976149648427963e-05, 8.113496005535126e-05, 0.00011250842362642288, 0.0001438818871974945, 0.00017525535076856613, 0.00020662881433963776, 0.00023800227791070938, 0.000269375741481781, 0.00030074920505285263, 0.00033212266862392426, 0.0003634961321949959, 0.0003948695957660675, 0.00042624305933713913, 0.00045761652290821075, 0.0004889899864792824, 0.000520363450050354, 0.0005517369136214256, 0.0005831103771924973, 0.0006144838407635689, 0.0006458573043346405, 0.0006772307679057121, 0.0007086042314767838, 0.0007399776950478554, 0.000771351158618927, 0.0008027246221899986, 0.0008340980857610703, 0.0008654715493321419, 0.0008968450129032135, 0.0009282184764742851, 0.0009595919400453568, 0.0009909654036164284, 0.0010223388671875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 12.0, 17.0, 5.0, 17.0, 20.0, 19.0, 23.0, 25.0, 21.0, 23.0, 39.0, 34.0, 32.0, 42.0, 35.0, 43.0, 36.0, 44.0, 42.0, 47.0, 37.0, 43.0, 34.0, 32.0, 40.0, 28.0, 38.0, 23.0, 27.0, 23.0, 22.0, 14.0, 15.0, 9.0, 7.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.0234375, -3.89739990234375, -3.7713623046875, -3.64532470703125, -3.519287109375, -3.39324951171875, -3.2672119140625, -3.14117431640625, -3.01513671875, -2.88909912109375, -2.7630615234375, -2.63702392578125, -2.510986328125, -2.38494873046875, -2.2589111328125, -2.13287353515625, -2.0068359375, -1.88079833984375, -1.7547607421875, -1.62872314453125, -1.502685546875, -1.37664794921875, -1.2506103515625, -1.12457275390625, -0.99853515625, -0.87249755859375, -0.7464599609375, -0.62042236328125, -0.494384765625, -0.36834716796875, -0.2423095703125, -0.11627197265625, 0.009765625, 0.13580322265625, 0.2618408203125, 0.38787841796875, 0.513916015625, 0.63995361328125, 0.7659912109375, 0.89202880859375, 1.01806640625, 1.14410400390625, 1.2701416015625, 1.39617919921875, 1.522216796875, 1.64825439453125, 1.7742919921875, 1.90032958984375, 2.0263671875, 2.15240478515625, 2.2784423828125, 2.40447998046875, 2.530517578125, 2.65655517578125, 2.7825927734375, 2.90863037109375, 3.03466796875, 3.16070556640625, 3.2867431640625, 3.41278076171875, 3.538818359375, 3.66485595703125, 3.7908935546875, 3.91693115234375, 4.04296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 11.0, 25.0, 39.0, 40.0, 68.0, 90.0, 139.0, 185.0, 267.0, 431.0, 691.0, 1158.0, 1726.0, 2802.0, 4685.0, 8460.0, 16541.0, 38807.0, 105990.0, 297786.0, 346544.0, 132329.0, 47014.0, 19378.0, 9633.0, 5228.0, 3053.0, 1947.0, 1183.0, 775.0, 518.0, 293.0, 198.0, 150.0, 89.0, 68.0, 46.0, 45.0, 31.0, 20.0, 12.0, 8.0, 9.0, 9.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.10546875, -3.016998291015625, -2.92852783203125, -2.840057373046875, -2.7515869140625, -2.663116455078125, -2.57464599609375, -2.486175537109375, -2.397705078125, -2.309234619140625, -2.22076416015625, -2.132293701171875, -2.0438232421875, -1.955352783203125, -1.86688232421875, -1.778411865234375, -1.68994140625, -1.601470947265625, -1.51300048828125, -1.424530029296875, -1.3360595703125, -1.247589111328125, -1.15911865234375, -1.070648193359375, -0.982177734375, -0.893707275390625, -0.80523681640625, -0.716766357421875, -0.6282958984375, -0.539825439453125, -0.45135498046875, -0.362884521484375, -0.2744140625, -0.185943603515625, -0.09747314453125, -0.009002685546875, 0.0794677734375, 0.167938232421875, 0.25640869140625, 0.344879150390625, 0.433349609375, 0.521820068359375, 0.61029052734375, 0.698760986328125, 0.7872314453125, 0.875701904296875, 0.96417236328125, 1.052642822265625, 1.14111328125, 1.229583740234375, 1.31805419921875, 1.406524658203125, 1.4949951171875, 1.583465576171875, 1.67193603515625, 1.760406494140625, 1.848876953125, 1.937347412109375, 2.02581787109375, 2.114288330078125, 2.2027587890625, 2.291229248046875, 2.37969970703125, 2.468170166015625, 2.556640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 10.0, 9.0, 23.0, 18.0, 23.0, 24.0, 28.0, 30.0, 35.0, 29.0, 33.0, 57.0, 42.0, 62.0, 242.0, 1711.0, 189.0, 64.0, 48.0, 48.0, 53.0, 33.0, 32.0, 35.0, 20.0, 24.0, 24.0, 16.0, 23.0, 12.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.15625, -15.6727294921875, -15.189208984375, -14.7056884765625, -14.22216796875, -13.7386474609375, -13.255126953125, -12.7716064453125, -12.2880859375, -11.8045654296875, -11.321044921875, -10.8375244140625, -10.35400390625, -9.8704833984375, -9.386962890625, -8.9034423828125, -8.419921875, -7.9364013671875, -7.452880859375, -6.9693603515625, -6.48583984375, -6.0023193359375, -5.518798828125, -5.0352783203125, -4.5517578125, -4.0682373046875, -3.584716796875, -3.1011962890625, -2.61767578125, -2.1341552734375, -1.650634765625, -1.1671142578125, -0.68359375, -0.2000732421875, 0.283447265625, 0.7669677734375, 1.25048828125, 1.7340087890625, 2.217529296875, 2.7010498046875, 3.1845703125, 3.6680908203125, 4.151611328125, 4.6351318359375, 5.11865234375, 5.6021728515625, 6.085693359375, 6.5692138671875, 7.052734375, 7.5362548828125, 8.019775390625, 8.5032958984375, 8.98681640625, 9.4703369140625, 9.953857421875, 10.4373779296875, 10.9208984375, 11.4044189453125, 11.887939453125, 12.3714599609375, 12.85498046875, 13.3385009765625, 13.822021484375, 14.3055419921875, 14.7890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 3.0, 7.0, 11.0, 17.0, 19.0, 20.0, 29.0, 29.0, 35.0, 64.0, 58.0, 88.0, 146.0, 248.0, 468.0, 1498.0, 24581.0, 3053247.0, 61447.0, 2345.0, 536.0, 243.0, 144.0, 87.0, 63.0, 57.0, 41.0, 30.0, 29.0, 23.0, 21.0, 12.0, 12.0, 9.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.83056640625, -21.0673828125, -20.30419921875, -19.541015625, -18.77783203125, -18.0146484375, -17.25146484375, -16.48828125, -15.72509765625, -14.9619140625, -14.19873046875, -13.435546875, -12.67236328125, -11.9091796875, -11.14599609375, -10.3828125, -9.61962890625, -8.8564453125, -8.09326171875, -7.330078125, -6.56689453125, -5.8037109375, -5.04052734375, -4.27734375, -3.51416015625, -2.7509765625, -1.98779296875, -1.224609375, -0.46142578125, 0.3017578125, 1.06494140625, 1.828125, 2.59130859375, 3.3544921875, 4.11767578125, 4.880859375, 5.64404296875, 6.4072265625, 7.17041015625, 7.93359375, 8.69677734375, 9.4599609375, 10.22314453125, 10.986328125, 11.74951171875, 12.5126953125, 13.27587890625, 14.0390625, 14.80224609375, 15.5654296875, 16.32861328125, 17.091796875, 17.85498046875, 18.6181640625, 19.38134765625, 20.14453125, 20.90771484375, 21.6708984375, 22.43408203125, 23.197265625, 23.96044921875, 24.7236328125, 25.48681640625, 26.25]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 912.0, 101.0, 1.0], "bins": [-461.7902526855469, -454.3035583496094, -446.8168640136719, -439.33013916015625, -431.84344482421875, -424.35675048828125, -416.87005615234375, -409.38336181640625, -401.89666748046875, -394.40997314453125, -386.92327880859375, -379.4365539550781, -371.9498596191406, -364.4631652832031, -356.9764709472656, -349.4897766113281, -342.0030517578125, -334.516357421875, -327.0296630859375, -319.5429382324219, -312.0562438964844, -304.5695495605469, -297.0828552246094, -289.5961608886719, -282.10943603515625, -274.62274169921875, -267.13604736328125, -259.6493225097656, -252.16262817382812, -244.67593383789062, -237.18923950195312, -229.70254516601562, -222.21585083007812, -214.72915649414062, -207.24244689941406, -199.75575256347656, -192.26904296875, -184.7823486328125, -177.295654296875, -169.8089599609375, -162.322265625, -154.8355712890625, -147.34886169433594, -139.86216735839844, -132.37545776367188, -124.88876342773438, -117.40206909179688, -109.91536712646484, -102.42865753173828, -94.94195556640625, -87.45526123046875, -79.96855926513672, -72.48185729980469, -64.99515533447266, -57.50845718383789, -50.021759033203125, -42.535057067871094, -35.04835510253906, -27.561656951904297, -20.0749568939209, -12.5882568359375, -5.101554870605469, 2.385143280029297, 9.871841430664062, 17.358543395996094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 3.0, 9.0, 5.0, 7.0, 10.0, 18.0, 18.0, 11.0, 28.0, 9.0, 20.0, 22.0, 26.0, 31.0, 27.0, 26.0, 33.0, 29.0, 43.0, 38.0, 41.0, 44.0, 40.0, 36.0, 28.0, 43.0, 24.0, 30.0, 28.0, 43.0, 20.0, 24.0, 26.0, 19.0, 27.0, 21.0, 19.0, 8.0, 12.0, 9.0, 11.0, 10.0, 5.0, 3.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0], "bins": [-45.746849060058594, -44.42184829711914, -43.09684371948242, -41.77184295654297, -40.44683837890625, -39.1218376159668, -37.79683303833008, -36.471832275390625, -35.146827697753906, -33.82182693481445, -32.496822357177734, -31.17181968688965, -29.846817016601562, -28.52181625366211, -27.196813583374023, -25.871810913085938, -24.546810150146484, -23.2218074798584, -21.896804809570312, -20.571802139282227, -19.24679946899414, -17.921798706054688, -16.5967960357666, -15.271793365478516, -13.94679069519043, -12.621788024902344, -11.296785354614258, -9.971783638000488, -8.646780967712402, -7.321778297424316, -5.996776103973389, -4.671773910522461, -3.346771240234375, -2.021768808364868, -0.6967663764953613, 0.6282360553741455, 1.9532384872436523, 3.2782411575317383, 4.603243350982666, 5.928245544433594, 7.25324821472168, 8.578250885009766, 9.903253555297852, 11.228255271911621, 12.553257942199707, 13.878260612487793, 15.203262329101562, 16.52826499938965, 17.853267669677734, 19.17827033996582, 20.503273010253906, 21.828275680541992, 23.153278350830078, 24.47827911376953, 25.803281784057617, 27.128284454345703, 28.45328712463379, 29.778289794921875, 31.10329246520996, 32.42829513549805, 33.7532958984375, 35.07830047607422, 36.40330123901367, 37.728302001953125, 39.053306579589844]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 9.0, 10.0, 7.0, 15.0, 16.0, 19.0, 23.0, 23.0, 19.0, 24.0, 22.0, 26.0, 41.0, 36.0, 44.0, 36.0, 43.0, 45.0, 30.0, 44.0, 44.0, 44.0, 30.0, 28.0, 39.0, 35.0, 35.0, 36.0, 29.0, 19.0, 20.0, 19.0, 17.0, 16.0, 10.0, 11.0, 12.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1328125, -4.007080078125, -3.88134765625, -3.755615234375, -3.6298828125, -3.504150390625, -3.37841796875, -3.252685546875, -3.126953125, -3.001220703125, -2.87548828125, -2.749755859375, -2.6240234375, -2.498291015625, -2.37255859375, -2.246826171875, -2.12109375, -1.995361328125, -1.86962890625, -1.743896484375, -1.6181640625, -1.492431640625, -1.36669921875, -1.240966796875, -1.115234375, -0.989501953125, -0.86376953125, -0.738037109375, -0.6123046875, -0.486572265625, -0.36083984375, -0.235107421875, -0.109375, 0.016357421875, 0.14208984375, 0.267822265625, 0.3935546875, 0.519287109375, 0.64501953125, 0.770751953125, 0.896484375, 1.022216796875, 1.14794921875, 1.273681640625, 1.3994140625, 1.525146484375, 1.65087890625, 1.776611328125, 1.90234375, 2.028076171875, 2.15380859375, 2.279541015625, 2.4052734375, 2.531005859375, 2.65673828125, 2.782470703125, 2.908203125, 3.033935546875, 3.15966796875, 3.285400390625, 3.4111328125, 3.536865234375, 3.66259765625, 3.788330078125, 3.9140625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 10.0, 6.0, 9.0, 12.0, 20.0, 24.0, 20.0, 17.0, 33.0, 46.0, 53.0, 125.0, 232.0, 617.0, 2085.0, 9640.0, 58041.0, 618730.0, 2918845.0, 522136.0, 51444.0, 8883.0, 1997.0, 587.0, 270.0, 110.0, 70.0, 43.0, 34.0, 28.0, 23.0, 23.0, 6.0, 16.0, 9.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.25, -12.8656005859375, -12.481201171875, -12.0968017578125, -11.71240234375, -11.3280029296875, -10.943603515625, -10.5592041015625, -10.1748046875, -9.7904052734375, -9.406005859375, -9.0216064453125, -8.63720703125, -8.2528076171875, -7.868408203125, -7.4840087890625, -7.099609375, -6.7152099609375, -6.330810546875, -5.9464111328125, -5.56201171875, -5.1776123046875, -4.793212890625, -4.4088134765625, -4.0244140625, -3.6400146484375, -3.255615234375, -2.8712158203125, -2.48681640625, -2.1024169921875, -1.718017578125, -1.3336181640625, -0.94921875, -0.5648193359375, -0.180419921875, 0.2039794921875, 0.58837890625, 0.9727783203125, 1.357177734375, 1.7415771484375, 2.1259765625, 2.5103759765625, 2.894775390625, 3.2791748046875, 3.66357421875, 4.0479736328125, 4.432373046875, 4.8167724609375, 5.201171875, 5.5855712890625, 5.969970703125, 6.3543701171875, 6.73876953125, 7.1231689453125, 7.507568359375, 7.8919677734375, 8.2763671875, 8.6607666015625, 9.045166015625, 9.4295654296875, 9.81396484375, 10.1983642578125, 10.582763671875, 10.9671630859375, 11.3515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 7.0, 9.0, 14.0, 16.0, 28.0, 30.0, 43.0, 49.0, 65.0, 98.0, 103.0, 150.0, 196.0, 276.0, 350.0, 417.0, 472.0, 410.0, 345.0, 229.0, 186.0, 159.0, 108.0, 82.0, 54.0, 40.0, 32.0, 29.0, 26.0, 13.0, 20.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.331298828125, -12.97509765625, -12.618896484375, -12.2626953125, -11.906494140625, -11.55029296875, -11.194091796875, -10.837890625, -10.481689453125, -10.12548828125, -9.769287109375, -9.4130859375, -9.056884765625, -8.70068359375, -8.344482421875, -7.98828125, -7.632080078125, -7.27587890625, -6.919677734375, -6.5634765625, -6.207275390625, -5.85107421875, -5.494873046875, -5.138671875, -4.782470703125, -4.42626953125, -4.070068359375, -3.7138671875, -3.357666015625, -3.00146484375, -2.645263671875, -2.2890625, -1.932861328125, -1.57666015625, -1.220458984375, -0.8642578125, -0.508056640625, -0.15185546875, 0.204345703125, 0.560546875, 0.916748046875, 1.27294921875, 1.629150390625, 1.9853515625, 2.341552734375, 2.69775390625, 3.053955078125, 3.41015625, 3.766357421875, 4.12255859375, 4.478759765625, 4.8349609375, 5.191162109375, 5.54736328125, 5.903564453125, 6.259765625, 6.615966796875, 6.97216796875, 7.328369140625, 7.6845703125, 8.040771484375, 8.39697265625, 8.753173828125, 9.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 18.0, 12.0, 20.0, 42.0, 54.0, 44.0, 81.0, 106.0, 145.0, 223.0, 374.0, 690.0, 2947.0, 26912.0, 732220.0, 3301322.0, 118559.0, 7753.0, 1337.0, 473.0, 263.0, 185.0, 131.0, 80.0, 75.0, 48.0, 33.0, 23.0, 21.0, 17.0, 19.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.53125, -24.59423828125, -23.6572265625, -22.72021484375, -21.783203125, -20.84619140625, -19.9091796875, -18.97216796875, -18.03515625, -17.09814453125, -16.1611328125, -15.22412109375, -14.287109375, -13.35009765625, -12.4130859375, -11.47607421875, -10.5390625, -9.60205078125, -8.6650390625, -7.72802734375, -6.791015625, -5.85400390625, -4.9169921875, -3.97998046875, -3.04296875, -2.10595703125, -1.1689453125, -0.23193359375, 0.705078125, 1.64208984375, 2.5791015625, 3.51611328125, 4.453125, 5.39013671875, 6.3271484375, 7.26416015625, 8.201171875, 9.13818359375, 10.0751953125, 11.01220703125, 11.94921875, 12.88623046875, 13.8232421875, 14.76025390625, 15.697265625, 16.63427734375, 17.5712890625, 18.50830078125, 19.4453125, 20.38232421875, 21.3193359375, 22.25634765625, 23.193359375, 24.13037109375, 25.0673828125, 26.00439453125, 26.94140625, 27.87841796875, 28.8154296875, 29.75244140625, 30.689453125, 31.62646484375, 32.5634765625, 33.50048828125, 34.4375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 14.0, 26.0, 41.0, 65.0, 75.0, 86.0, 111.0, 132.0, 115.0, 112.0, 81.0, 61.0, 37.0, 23.0, 8.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.14889526367188, -70.2784423828125, -68.40798950195312, -66.53753662109375, -64.66708374023438, -62.796627044677734, -60.92617416381836, -59.055721282958984, -57.185264587402344, -55.31481170654297, -53.444358825683594, -51.57390594482422, -49.70344924926758, -47.8329963684082, -45.96254348754883, -44.09209060668945, -42.22163772583008, -40.3511848449707, -38.48073196411133, -36.61027526855469, -34.73982238769531, -32.86936950683594, -30.998916625976562, -29.128463745117188, -27.25800895690918, -25.387556076049805, -23.517101287841797, -21.646648406982422, -19.776195526123047, -17.90574073791504, -16.035287857055664, -14.164834022521973, -12.294384002685547, -10.423930168151855, -8.553476333618164, -6.683023452758789, -4.812569618225098, -2.9421157836914062, -1.0716629028320312, 0.7987909317016602, 2.6692447662353516, 4.539698600769043, 6.410151958465576, 8.28060531616211, 10.1510591506958, 12.021512985229492, 13.891965866088867, 15.762419700622559, 17.63287353515625, 19.503326416015625, 21.373781204223633, 23.244234085083008, 25.114688873291016, 26.98514175415039, 28.855594635009766, 30.72604751586914, 32.59650421142578, 34.466957092285156, 36.33740997314453, 38.207862854003906, 40.07831954956055, 41.94877243041992, 43.8192253112793, 45.68967819213867, 47.56013107299805]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 5.0, 4.0, 2.0, 9.0, 6.0, 9.0, 10.0, 16.0, 10.0, 20.0, 16.0, 22.0, 21.0, 22.0, 31.0, 40.0, 33.0, 19.0, 34.0, 32.0, 46.0, 39.0, 33.0, 32.0, 43.0, 44.0, 37.0, 37.0, 36.0, 26.0, 26.0, 29.0, 39.0, 33.0, 21.0, 14.0, 13.0, 17.0, 16.0, 11.0, 9.0, 12.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-36.4029541015625, -35.30902862548828, -34.21510314941406, -33.121177673339844, -32.027252197265625, -30.933326721191406, -29.839401245117188, -28.74547576904297, -27.65155029296875, -26.55762481689453, -25.463699340820312, -24.369773864746094, -23.275848388671875, -22.181922912597656, -21.087997436523438, -19.99407196044922, -18.900146484375, -17.80622100830078, -16.712295532226562, -15.618370056152344, -14.524444580078125, -13.430519104003906, -12.336593627929688, -11.242668151855469, -10.14874267578125, -9.054817199707031, -7.9608917236328125, -6.866966247558594, -5.773040771484375, -4.679115295410156, -3.5851898193359375, -2.4912643432617188, -1.3973388671875, -0.30341339111328125, 0.7905120849609375, 1.8844375610351562, 2.978363037109375, 4.072288513183594, 5.1662139892578125, 6.260139465332031, 7.35406494140625, 8.447990417480469, 9.541915893554688, 10.635841369628906, 11.729766845703125, 12.823692321777344, 13.917617797851562, 15.011543273925781, 16.10546875, 17.19939422607422, 18.293319702148438, 19.387245178222656, 20.481170654296875, 21.575096130371094, 22.669021606445312, 23.76294708251953, 24.85687255859375, 25.95079803466797, 27.044723510742188, 28.138648986816406, 29.232574462890625, 30.326499938964844, 31.420425415039062, 32.51435089111328, 33.6082763671875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 4.0, 9.0, 11.0, 5.0, 9.0, 12.0, 14.0, 20.0, 18.0, 19.0, 30.0, 28.0, 26.0, 28.0, 26.0, 25.0, 27.0, 40.0, 40.0, 34.0, 46.0, 34.0, 37.0, 45.0, 32.0, 29.0, 28.0, 29.0, 35.0, 38.0, 26.0, 24.0, 27.0, 19.0, 32.0, 11.0, 8.0, 18.0, 9.0, 13.0, 7.0, 4.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.833984375, -3.71551513671875, -3.5970458984375, -3.47857666015625, -3.360107421875, -3.24163818359375, -3.1231689453125, -3.00469970703125, -2.88623046875, -2.76776123046875, -2.6492919921875, -2.53082275390625, -2.412353515625, -2.29388427734375, -2.1754150390625, -2.05694580078125, -1.9384765625, -1.82000732421875, -1.7015380859375, -1.58306884765625, -1.464599609375, -1.34613037109375, -1.2276611328125, -1.10919189453125, -0.99072265625, -0.87225341796875, -0.7537841796875, -0.63531494140625, -0.516845703125, -0.39837646484375, -0.2799072265625, -0.16143798828125, -0.04296875, 0.07550048828125, 0.1939697265625, 0.31243896484375, 0.430908203125, 0.54937744140625, 0.6678466796875, 0.78631591796875, 0.90478515625, 1.02325439453125, 1.1417236328125, 1.26019287109375, 1.378662109375, 1.49713134765625, 1.6156005859375, 1.73406982421875, 1.8525390625, 1.97100830078125, 2.0894775390625, 2.20794677734375, 2.326416015625, 2.44488525390625, 2.5633544921875, 2.68182373046875, 2.80029296875, 2.91876220703125, 3.0372314453125, 3.15570068359375, 3.274169921875, 3.39263916015625, 3.5111083984375, 3.62957763671875, 3.748046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 19.0, 22.0, 33.0, 56.0, 71.0, 126.0, 163.0, 215.0, 331.0, 473.0, 703.0, 952.0, 1398.0, 2096.0, 3051.0, 4271.0, 6530.0, 9573.0, 14044.0, 20729.0, 30988.0, 46430.0, 68599.0, 98186.0, 130051.0, 147737.0, 134052.0, 103295.0, 72891.0, 48943.0, 33288.0, 22380.0, 14864.0, 10145.0, 6870.0, 4752.0, 3222.0, 2151.0, 1560.0, 982.0, 716.0, 515.0, 338.0, 209.0, 166.0, 109.0, 81.0, 60.0, 35.0, 20.0, 19.0, 16.0, 9.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.329345703125, -0.31891632080078125, -0.3084869384765625, -0.29805755615234375, -0.287628173828125, -0.27719879150390625, -0.2667694091796875, -0.25634002685546875, -0.24591064453125, -0.23548126220703125, -0.2250518798828125, -0.21462249755859375, -0.204193115234375, -0.19376373291015625, -0.1833343505859375, -0.17290496826171875, -0.1624755859375, -0.15204620361328125, -0.1416168212890625, -0.13118743896484375, -0.120758056640625, -0.11032867431640625, -0.0998992919921875, -0.08946990966796875, -0.07904052734375, -0.06861114501953125, -0.0581817626953125, -0.04775238037109375, -0.037322998046875, -0.02689361572265625, -0.0164642333984375, -0.00603485107421875, 0.00439453125, 0.01482391357421875, 0.0252532958984375, 0.03568267822265625, 0.046112060546875, 0.05654144287109375, 0.0669708251953125, 0.07740020751953125, 0.08782958984375, 0.09825897216796875, 0.1086883544921875, 0.11911773681640625, 0.129547119140625, 0.13997650146484375, 0.1504058837890625, 0.16083526611328125, 0.1712646484375, 0.18169403076171875, 0.1921234130859375, 0.20255279541015625, 0.212982177734375, 0.22341156005859375, 0.2338409423828125, 0.24427032470703125, 0.25469970703125, 0.26512908935546875, 0.2755584716796875, 0.28598785400390625, 0.296417236328125, 0.30684661865234375, 0.3172760009765625, 0.32770538330078125, 0.338134765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 8.0, 3.0, 7.0, 7.0, 15.0, 10.0, 10.0, 13.0, 21.0, 20.0, 18.0, 17.0, 30.0, 28.0, 26.0, 24.0, 26.0, 46.0, 29.0, 49.0, 52.0, 1067.0, 43.0, 50.0, 41.0, 46.0, 36.0, 37.0, 28.0, 38.0, 31.0, 23.0, 20.0, 16.0, 14.0, 19.0, 15.0, 13.0, 10.0, 10.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.71875, -2.63446044921875, -2.5501708984375, -2.46588134765625, -2.381591796875, -2.29730224609375, -2.2130126953125, -2.12872314453125, -2.04443359375, -1.96014404296875, -1.8758544921875, -1.79156494140625, -1.707275390625, -1.62298583984375, -1.5386962890625, -1.45440673828125, -1.3701171875, -1.28582763671875, -1.2015380859375, -1.11724853515625, -1.032958984375, -0.94866943359375, -0.8643798828125, -0.78009033203125, -0.69580078125, -0.61151123046875, -0.5272216796875, -0.44293212890625, -0.358642578125, -0.27435302734375, -0.1900634765625, -0.10577392578125, -0.021484375, 0.06280517578125, 0.1470947265625, 0.23138427734375, 0.315673828125, 0.39996337890625, 0.4842529296875, 0.56854248046875, 0.65283203125, 0.73712158203125, 0.8214111328125, 0.90570068359375, 0.989990234375, 1.07427978515625, 1.1585693359375, 1.24285888671875, 1.3271484375, 1.41143798828125, 1.4957275390625, 1.58001708984375, 1.664306640625, 1.74859619140625, 1.8328857421875, 1.91717529296875, 2.00146484375, 2.08575439453125, 2.1700439453125, 2.25433349609375, 2.338623046875, 2.42291259765625, 2.5072021484375, 2.59149169921875, 2.67578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 12.0, 15.0, 20.0, 29.0, 37.0, 65.0, 109.0, 182.0, 252.0, 371.0, 561.0, 805.0, 1246.0, 1823.0, 2621.0, 3941.0, 5763.0, 8756.0, 13080.0, 19654.0, 29421.0, 43274.0, 62596.0, 87080.0, 112789.0, 656363.0, 655064.0, 111834.0, 86623.0, 61917.0, 43008.0, 29228.0, 19592.0, 12864.0, 8642.0, 5573.0, 3894.0, 2528.0, 1799.0, 1221.0, 791.0, 553.0, 378.0, 265.0, 170.0, 112.0, 88.0, 52.0, 33.0, 21.0, 7.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26220703125, -0.2540130615234375, -0.245819091796875, -0.2376251220703125, -0.22943115234375, -0.2212371826171875, -0.213043212890625, -0.2048492431640625, -0.1966552734375, -0.1884613037109375, -0.180267333984375, -0.1720733642578125, -0.16387939453125, -0.1556854248046875, -0.147491455078125, -0.1392974853515625, -0.131103515625, -0.1229095458984375, -0.114715576171875, -0.1065216064453125, -0.09832763671875, -0.0901336669921875, -0.081939697265625, -0.0737457275390625, -0.0655517578125, -0.0573577880859375, -0.049163818359375, -0.0409698486328125, -0.03277587890625, -0.0245819091796875, -0.016387939453125, -0.0081939697265625, 0.0, 0.0081939697265625, 0.016387939453125, 0.0245819091796875, 0.03277587890625, 0.0409698486328125, 0.049163818359375, 0.0573577880859375, 0.0655517578125, 0.0737457275390625, 0.081939697265625, 0.0901336669921875, 0.09832763671875, 0.1065216064453125, 0.114715576171875, 0.1229095458984375, 0.131103515625, 0.1392974853515625, 0.147491455078125, 0.1556854248046875, 0.16387939453125, 0.1720733642578125, 0.180267333984375, 0.1884613037109375, 0.1966552734375, 0.2048492431640625, 0.213043212890625, 0.2212371826171875, 0.22943115234375, 0.2376251220703125, 0.245819091796875, 0.2540130615234375, 0.26220703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 3.0, 3.0, 5.0, 10.0, 12.0, 11.0, 10.0, 20.0, 16.0, 21.0, 20.0, 32.0, 37.0, 54.0, 47.0, 56.0, 53.0, 50.0, 58.0, 65.0, 40.0, 51.0, 48.0, 42.0, 43.0, 27.0, 34.0, 15.0, 20.0, 20.0, 14.0, 7.0, 6.0, 12.0, 6.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001995086669921875, -0.0019290149211883545, -0.001862943172454834, -0.0017968714237213135, -0.001730799674987793, -0.0016647279262542725, -0.001598656177520752, -0.0015325844287872314, -0.001466512680053711, -0.0014004409313201904, -0.00133436918258667, -0.0012682974338531494, -0.001202225685119629, -0.0011361539363861084, -0.0010700821876525879, -0.0010040104389190674, -0.0009379386901855469, -0.0008718669414520264, -0.0008057951927185059, -0.0007397234439849854, -0.0006736516952514648, -0.0006075799465179443, -0.0005415081977844238, -0.0004754364490509033, -0.0004093647003173828, -0.0003432929515838623, -0.0002772212028503418, -0.0002111494541168213, -0.00014507770538330078, -7.900595664978027e-05, -1.2934207916259766e-05, 5.313754081726074e-05, 0.00011920928955078125, 0.00018528103828430176, 0.00025135278701782227, 0.0003174245357513428, 0.0003834962844848633, 0.0004495680332183838, 0.0005156397819519043, 0.0005817115306854248, 0.0006477832794189453, 0.0007138550281524658, 0.0007799267768859863, 0.0008459985256195068, 0.0009120702743530273, 0.0009781420230865479, 0.0010442137718200684, 0.0011102855205535889, 0.0011763572692871094, 0.0012424290180206299, 0.0013085007667541504, 0.001374572515487671, 0.0014406442642211914, 0.001506716012954712, 0.0015727877616882324, 0.001638859510421753, 0.0017049312591552734, 0.001771003007888794, 0.0018370747566223145, 0.001903146505355835, 0.0019692182540893555, 0.002035290002822876, 0.0021013617515563965, 0.002167433500289917, 0.0022335052490234375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 15.0, 23.0, 21.0, 33.0, 41.0, 64.0, 95.0, 146.0, 200.0, 354.0, 848.0, 37243.0, 1005261.0, 2748.0, 536.0, 309.0, 169.0, 109.0, 90.0, 49.0, 34.0, 36.0, 20.0, 14.0, 7.0, 8.0, 11.0, 4.0, 6.0, 4.0, 4.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05303955078125, -0.05149269104003906, -0.049945831298828125, -0.04839897155761719, -0.04685211181640625, -0.04530525207519531, -0.043758392333984375, -0.04221153259277344, -0.0406646728515625, -0.03911781311035156, -0.037570953369140625, -0.03602409362792969, -0.03447723388671875, -0.03293037414550781, -0.031383514404296875, -0.029836654663085938, -0.028289794921875, -0.026742935180664062, -0.025196075439453125, -0.023649215698242188, -0.02210235595703125, -0.020555496215820312, -0.019008636474609375, -0.017461776733398438, -0.0159149169921875, -0.014368057250976562, -0.012821197509765625, -0.011274337768554688, -0.00972747802734375, -0.008180618286132812, -0.006633758544921875, -0.0050868988037109375, -0.0035400390625, -0.0019931793212890625, -0.000446319580078125, 0.0011005401611328125, 0.00264739990234375, 0.0041942596435546875, 0.005741119384765625, 0.0072879791259765625, 0.0088348388671875, 0.010381698608398438, 0.011928558349609375, 0.013475418090820312, 0.01502227783203125, 0.016569137573242188, 0.018115997314453125, 0.019662857055664062, 0.021209716796875, 0.022756576538085938, 0.024303436279296875, 0.025850296020507812, 0.02739715576171875, 0.028944015502929688, 0.030490875244140625, 0.03203773498535156, 0.0335845947265625, 0.03513145446777344, 0.036678314208984375, 0.03822517395019531, 0.03977203369140625, 0.04131889343261719, 0.042865753173828125, 0.04441261291503906, 0.04595947265625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 116.0, 849.0, 51.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007227916736155748, -0.0067589376121759415, -0.006289958488196135, -0.005820979364216328, -0.0053519997745752335, -0.004883021116256714, -0.00441404152661562, -0.003945062402635813, -0.003476083278656006, -0.003007104154676199, -0.002538125030696392, -0.0020691456738859415, -0.0016001665499061346, -0.0011311874259263277, -0.0006622080691158772, -0.00019322894513607025, 0.00027575017884373665, 0.0007447293610312045, 0.0012137085432186723, 0.001682687783613801, 0.002151666907593608, 0.002620646031573415, 0.0030896253883838654, 0.0035586045123636723, 0.004027583636343479, 0.004496562760323286, 0.004965541884303093, 0.005434521473944187, 0.005903500132262707, 0.006372479721903801, 0.006841458845883608, 0.007310437969863415, 0.007779417559504509, 0.008248397149145603, 0.008717375807464123, 0.009186355397105217, 0.009655334055423737, 0.01012431364506483, 0.010593293234705925, 0.011062271893024445, 0.011531250551342964, 0.012000230140984058, 0.012469208799302578, 0.012938188388943672, 0.013407167047262192, 0.013876146636903286, 0.01434512622654438, 0.0148141048848629, 0.015283084474503994, 0.015752064064145088, 0.016221042722463608, 0.016690021380782127, 0.017159001901745796, 0.017627980560064316, 0.018096959218382835, 0.018565937876701355, 0.019034918397665024, 0.019503897055983543, 0.019972877576947212, 0.020441856235265732, 0.02091083489358425, 0.02137981355190277, 0.02184879407286644, 0.02231777273118496, 0.02278675138950348]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 4.0, 12.0, 19.0, 9.0, 14.0, 22.0, 12.0, 25.0, 35.0, 24.0, 29.0, 29.0, 45.0, 42.0, 40.0, 34.0, 47.0, 38.0, 40.0, 51.0, 44.0, 46.0, 38.0, 38.0, 31.0, 34.0, 28.0, 22.0, 17.0, 20.0, 14.0, 18.0, 16.0, 12.0, 12.0, 6.0, 11.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013287067413330078, -0.0012872889637947083, -0.0012458711862564087, -0.0012044534087181091, -0.0011630356311798096, -0.00112161785364151, -0.0010802000761032104, -0.0010387822985649109, -0.0009973645210266113, -0.0009559467434883118, -0.0009145289659500122, -0.0008731111884117126, -0.0008316934108734131, -0.0007902756333351135, -0.000748857855796814, -0.0007074400782585144, -0.0006660223007202148, -0.0006246045231819153, -0.0005831867456436157, -0.0005417689681053162, -0.0005003511905670166, -0.00045893341302871704, -0.0004175156354904175, -0.0003760978579521179, -0.00033468008041381836, -0.0002932623028755188, -0.00025184452533721924, -0.00021042674779891968, -0.00016900897026062012, -0.00012759119272232056, -8.6173415184021e-05, -4.4755637645721436e-05, -3.337860107421875e-06, 3.8079917430877686e-05, 7.949769496917725e-05, 0.0001209154725074768, 0.00016233325004577637, 0.00020375102758407593, 0.0002451688051223755, 0.00028658658266067505, 0.0003280043601989746, 0.00036942213773727417, 0.00041083991527557373, 0.0004522576928138733, 0.0004936754703521729, 0.0005350932478904724, 0.000576511025428772, 0.0006179288029670715, 0.0006593465805053711, 0.0007007643580436707, 0.0007421821355819702, 0.0007835999131202698, 0.0008250176906585693, 0.0008664354681968689, 0.0009078532457351685, 0.000949271023273468, 0.0009906888008117676, 0.0010321065783500671, 0.0010735243558883667, 0.0011149421334266663, 0.0011563599109649658, 0.0011977776885032654, 0.001239195466041565, 0.0012806132435798645, 0.001322031021118164]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 4.0, 9.0, 11.0, 5.0, 9.0, 12.0, 14.0, 20.0, 18.0, 19.0, 30.0, 28.0, 26.0, 28.0, 26.0, 25.0, 27.0, 40.0, 40.0, 34.0, 45.0, 35.0, 37.0, 45.0, 32.0, 29.0, 28.0, 29.0, 35.0, 38.0, 26.0, 24.0, 27.0, 19.0, 32.0, 11.0, 8.0, 18.0, 9.0, 13.0, 7.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.833984375, -3.71551513671875, -3.5970458984375, -3.47857666015625, -3.360107421875, -3.24163818359375, -3.1231689453125, -3.00469970703125, -2.88623046875, -2.76776123046875, -2.6492919921875, -2.53082275390625, -2.412353515625, -2.29388427734375, -2.1754150390625, -2.05694580078125, -1.9384765625, -1.82000732421875, -1.7015380859375, -1.58306884765625, -1.464599609375, -1.34613037109375, -1.2276611328125, -1.10919189453125, -0.99072265625, -0.87225341796875, -0.7537841796875, -0.63531494140625, -0.516845703125, -0.39837646484375, -0.2799072265625, -0.16143798828125, -0.04296875, 0.07550048828125, 0.1939697265625, 0.31243896484375, 0.430908203125, 0.54937744140625, 0.6678466796875, 0.78631591796875, 0.90478515625, 1.02325439453125, 1.1417236328125, 1.26019287109375, 1.378662109375, 1.49713134765625, 1.6156005859375, 1.73406982421875, 1.8525390625, 1.97100830078125, 2.0894775390625, 2.20794677734375, 2.326416015625, 2.44488525390625, 2.5633544921875, 2.68182373046875, 2.80029296875, 2.91876220703125, 3.0372314453125, 3.15570068359375, 3.274169921875, 3.39263916015625, 3.5111083984375, 3.62957763671875, 3.748046875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 6.0, 2.0, 11.0, 20.0, 23.0, 29.0, 53.0, 76.0, 112.0, 164.0, 228.0, 320.0, 516.0, 785.0, 1125.0, 1675.0, 2590.0, 3931.0, 6494.0, 11288.0, 23107.0, 57095.0, 192003.0, 503440.0, 148526.0, 48109.0, 20066.0, 10175.0, 5854.0, 3522.0, 2346.0, 1624.0, 1093.0, 655.0, 473.0, 311.0, 211.0, 173.0, 105.0, 75.0, 55.0, 27.0, 16.0, 9.0, 17.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.02392578125, -3.8916015625, -3.75927734375, -3.626953125, -3.49462890625, -3.3623046875, -3.22998046875, -3.09765625, -2.96533203125, -2.8330078125, -2.70068359375, -2.568359375, -2.43603515625, -2.3037109375, -2.17138671875, -2.0390625, -1.90673828125, -1.7744140625, -1.64208984375, -1.509765625, -1.37744140625, -1.2451171875, -1.11279296875, -0.98046875, -0.84814453125, -0.7158203125, -0.58349609375, -0.451171875, -0.31884765625, -0.1865234375, -0.05419921875, 0.078125, 0.21044921875, 0.3427734375, 0.47509765625, 0.607421875, 0.73974609375, 0.8720703125, 1.00439453125, 1.13671875, 1.26904296875, 1.4013671875, 1.53369140625, 1.666015625, 1.79833984375, 1.9306640625, 2.06298828125, 2.1953125, 2.32763671875, 2.4599609375, 2.59228515625, 2.724609375, 2.85693359375, 2.9892578125, 3.12158203125, 3.25390625, 3.38623046875, 3.5185546875, 3.65087890625, 3.783203125, 3.91552734375, 4.0478515625, 4.18017578125, 4.3125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 13.0, 6.0, 13.0, 10.0, 14.0, 17.0, 22.0, 19.0, 31.0, 34.0, 27.0, 37.0, 36.0, 43.0, 50.0, 68.0, 91.0, 293.0, 1580.0, 140.0, 73.0, 54.0, 34.0, 48.0, 44.0, 30.0, 30.0, 25.0, 25.0, 21.0, 27.0, 12.0, 16.0, 7.0, 6.0, 9.0, 9.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.55078125, -13.1171875, -12.68359375, -12.25, -11.81640625, -11.3828125, -10.94921875, -10.515625, -10.08203125, -9.6484375, -9.21484375, -8.78125, -8.34765625, -7.9140625, -7.48046875, -7.046875, -6.61328125, -6.1796875, -5.74609375, -5.3125, -4.87890625, -4.4453125, -4.01171875, -3.578125, -3.14453125, -2.7109375, -2.27734375, -1.84375, -1.41015625, -0.9765625, -0.54296875, -0.109375, 0.32421875, 0.7578125, 1.19140625, 1.625, 2.05859375, 2.4921875, 2.92578125, 3.359375, 3.79296875, 4.2265625, 4.66015625, 5.09375, 5.52734375, 5.9609375, 6.39453125, 6.828125, 7.26171875, 7.6953125, 8.12890625, 8.5625, 8.99609375, 9.4296875, 9.86328125, 10.296875, 10.73046875, 11.1640625, 11.59765625, 12.03125, 12.46484375, 12.8984375, 13.33203125, 13.765625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 7.0, 22.0, 11.0, 21.0, 23.0, 47.0, 68.0, 102.0, 162.0, 209.0, 520.0, 2423.0, 66256.0, 3057852.0, 15686.0, 1264.0, 365.0, 201.0, 138.0, 83.0, 66.0, 40.0, 33.0, 27.0, 19.0, 13.0, 13.0, 10.0, 8.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.84375, -32.64892578125, -31.4541015625, -30.25927734375, -29.064453125, -27.86962890625, -26.6748046875, -25.47998046875, -24.28515625, -23.09033203125, -21.8955078125, -20.70068359375, -19.505859375, -18.31103515625, -17.1162109375, -15.92138671875, -14.7265625, -13.53173828125, -12.3369140625, -11.14208984375, -9.947265625, -8.75244140625, -7.5576171875, -6.36279296875, -5.16796875, -3.97314453125, -2.7783203125, -1.58349609375, -0.388671875, 0.80615234375, 2.0009765625, 3.19580078125, 4.390625, 5.58544921875, 6.7802734375, 7.97509765625, 9.169921875, 10.36474609375, 11.5595703125, 12.75439453125, 13.94921875, 15.14404296875, 16.3388671875, 17.53369140625, 18.728515625, 19.92333984375, 21.1181640625, 22.31298828125, 23.5078125, 24.70263671875, 25.8974609375, 27.09228515625, 28.287109375, 29.48193359375, 30.6767578125, 31.87158203125, 33.06640625, 34.26123046875, 35.4560546875, 36.65087890625, 37.845703125, 39.04052734375, 40.2353515625, 41.43017578125, 42.625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 80.0, 439.0, 420.0, 66.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-116.98042297363281, -114.25823974609375, -111.53604888916016, -108.8138656616211, -106.0916748046875, -103.36949157714844, -100.64730834960938, -97.92511749267578, -95.20292663574219, -92.48074340820312, -89.75855255126953, -87.03636932373047, -84.31417846679688, -81.59199523925781, -78.86981201171875, -76.14762115478516, -73.4254379272461, -70.70325469970703, -67.98106384277344, -65.25888061523438, -62.53668975830078, -59.81450653076172, -57.09231948852539, -54.37013244628906, -51.647945404052734, -48.925758361816406, -46.20357131958008, -43.48138427734375, -40.75920104980469, -38.037010192871094, -35.31482696533203, -32.5926399230957, -29.87045669555664, -27.148269653320312, -24.426082611083984, -21.70389747619629, -18.98171043395996, -16.259523391723633, -13.537338256835938, -10.81515121459961, -8.092964172363281, -5.370777606964111, -2.6485910415649414, 0.07359504699707031, 2.7957820892333984, 5.517969131469727, 8.240154266357422, 10.96234130859375, 13.684528350830078, 16.406715393066406, 19.128902435302734, 21.85108757019043, 24.573274612426758, 27.295461654663086, 30.01764678955078, 32.73983383178711, 35.46202087402344, 38.184207916259766, 40.906394958496094, 43.628578186035156, 46.35076904296875, 49.07295227050781, 51.79513931274414, 54.51732635498047, 57.2395133972168]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 13.0, 5.0, 10.0, 8.0, 11.0, 11.0, 18.0, 18.0, 21.0, 22.0, 23.0, 24.0, 30.0, 46.0, 40.0, 33.0, 27.0, 35.0, 36.0, 44.0, 43.0, 40.0, 45.0, 40.0, 30.0, 37.0, 31.0, 35.0, 19.0, 22.0, 29.0, 22.0, 21.0, 12.0, 13.0, 15.0, 17.0, 9.0, 8.0, 5.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-39.202178955078125, -37.93834686279297, -36.67451477050781, -35.410682678222656, -34.146846771240234, -32.88301467895508, -31.619182586669922, -30.355350494384766, -29.09151840209961, -27.827686309814453, -26.563852310180664, -25.300020217895508, -24.03618812561035, -22.772354125976562, -21.508522033691406, -20.24468994140625, -18.98085594177246, -17.717023849487305, -16.453189849853516, -15.18935775756836, -13.925525665283203, -12.66169261932373, -11.397859573364258, -10.134027481079102, -8.870194435119629, -7.6063618659973145, -6.342529296875, -5.078696250915527, -3.814863681793213, -2.5510311126708984, -1.2871980667114258, -0.02336597442626953, 1.2404670715332031, 2.5042996406555176, 3.768132448196411, 5.031965255737305, 6.295797824859619, 7.559630393981934, 8.823463439941406, 10.087295532226562, 11.351128578186035, 12.614961624145508, 13.878793716430664, 15.142626762390137, 16.40645980834961, 17.670291900634766, 18.934123992919922, 20.197956085205078, 21.461790084838867, 22.725622177124023, 23.989456176757812, 25.25328826904297, 26.517120361328125, 27.78095245361328, 29.04478645324707, 30.308618545532227, 31.572452545166016, 32.83628463745117, 34.10011672973633, 35.36395263671875, 36.627784729003906, 37.89161682128906, 39.15544891357422, 40.419281005859375, 41.68311309814453]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 12.0, 9.0, 10.0, 6.0, 15.0, 20.0, 12.0, 25.0, 27.0, 23.0, 26.0, 25.0, 28.0, 32.0, 31.0, 38.0, 44.0, 33.0, 52.0, 43.0, 38.0, 34.0, 37.0, 32.0, 34.0, 43.0, 33.0, 30.0, 20.0, 32.0, 20.0, 21.0, 18.0, 15.0, 16.0, 13.0, 7.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.28515625, -4.15667724609375, -4.0281982421875, -3.89971923828125, -3.771240234375, -3.64276123046875, -3.5142822265625, -3.38580322265625, -3.25732421875, -3.12884521484375, -3.0003662109375, -2.87188720703125, -2.743408203125, -2.61492919921875, -2.4864501953125, -2.35797119140625, -2.2294921875, -2.10101318359375, -1.9725341796875, -1.84405517578125, -1.715576171875, -1.58709716796875, -1.4586181640625, -1.33013916015625, -1.20166015625, -1.07318115234375, -0.9447021484375, -0.81622314453125, -0.687744140625, -0.55926513671875, -0.4307861328125, -0.30230712890625, -0.173828125, -0.04534912109375, 0.0831298828125, 0.21160888671875, 0.340087890625, 0.46856689453125, 0.5970458984375, 0.72552490234375, 0.85400390625, 0.98248291015625, 1.1109619140625, 1.23944091796875, 1.367919921875, 1.49639892578125, 1.6248779296875, 1.75335693359375, 1.8818359375, 2.01031494140625, 2.1387939453125, 2.26727294921875, 2.395751953125, 2.52423095703125, 2.6527099609375, 2.78118896484375, 2.90966796875, 3.03814697265625, 3.1666259765625, 3.29510498046875, 3.423583984375, 3.55206298828125, 3.6805419921875, 3.80902099609375, 3.9375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 17.0, 26.0, 42.0, 59.0, 89.0, 109.0, 179.0, 271.0, 393.0, 706.0, 1278.0, 2405.0, 5039.0, 10655.0, 24160.0, 59571.0, 169230.0, 544132.0, 1273086.0, 1277046.0, 549004.0, 171296.0, 59944.0, 24346.0, 10539.0, 5042.0, 2493.0, 1198.0, 683.0, 418.0, 226.0, 177.0, 122.0, 90.0, 54.0, 34.0, 22.0, 30.0, 10.0, 12.0, 12.0, 3.0, 5.0, 2.0, 6.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.50604248046875, -5.3441162109375, -5.18218994140625, -5.020263671875, -4.85833740234375, -4.6964111328125, -4.53448486328125, -4.37255859375, -4.21063232421875, -4.0487060546875, -3.88677978515625, -3.724853515625, -3.56292724609375, -3.4010009765625, -3.23907470703125, -3.0771484375, -2.91522216796875, -2.7532958984375, -2.59136962890625, -2.429443359375, -2.26751708984375, -2.1055908203125, -1.94366455078125, -1.78173828125, -1.61981201171875, -1.4578857421875, -1.29595947265625, -1.134033203125, -0.97210693359375, -0.8101806640625, -0.64825439453125, -0.486328125, -0.32440185546875, -0.1624755859375, -0.00054931640625, 0.161376953125, 0.32330322265625, 0.4852294921875, 0.64715576171875, 0.80908203125, 0.97100830078125, 1.1329345703125, 1.29486083984375, 1.456787109375, 1.61871337890625, 1.7806396484375, 1.94256591796875, 2.1044921875, 2.26641845703125, 2.4283447265625, 2.59027099609375, 2.752197265625, 2.91412353515625, 3.0760498046875, 3.23797607421875, 3.39990234375, 3.56182861328125, 3.7237548828125, 3.88568115234375, 4.047607421875, 4.20953369140625, 4.3714599609375, 4.53338623046875, 4.6953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 25.0, 35.0, 34.0, 72.0, 113.0, 167.0, 230.0, 344.0, 465.0, 601.0, 572.0, 448.0, 315.0, 213.0, 139.0, 104.0, 57.0, 42.0, 25.0, 20.0, 13.0, 11.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.34912109375, -11.8701171875, -11.39111328125, -10.912109375, -10.43310546875, -9.9541015625, -9.47509765625, -8.99609375, -8.51708984375, -8.0380859375, -7.55908203125, -7.080078125, -6.60107421875, -6.1220703125, -5.64306640625, -5.1640625, -4.68505859375, -4.2060546875, -3.72705078125, -3.248046875, -2.76904296875, -2.2900390625, -1.81103515625, -1.33203125, -0.85302734375, -0.3740234375, 0.10498046875, 0.583984375, 1.06298828125, 1.5419921875, 2.02099609375, 2.5, 2.97900390625, 3.4580078125, 3.93701171875, 4.416015625, 4.89501953125, 5.3740234375, 5.85302734375, 6.33203125, 6.81103515625, 7.2900390625, 7.76904296875, 8.248046875, 8.72705078125, 9.2060546875, 9.68505859375, 10.1640625, 10.64306640625, 11.1220703125, 11.60107421875, 12.080078125, 12.55908203125, 13.0380859375, 13.51708984375, 13.99609375, 14.47509765625, 14.9541015625, 15.43310546875, 15.912109375, 16.39111328125, 16.8701171875, 17.34912109375, 17.828125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 12.0, 12.0, 18.0, 22.0, 23.0, 43.0, 53.0, 75.0, 91.0, 174.0, 282.0, 649.0, 2350.0, 26158.0, 1280515.0, 2827731.0, 50960.0, 3466.0, 781.0, 317.0, 183.0, 98.0, 52.0, 54.0, 48.0, 29.0, 19.0, 24.0, 15.0, 9.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.671875, -27.614013671875, -26.55615234375, -25.498291015625, -24.4404296875, -23.382568359375, -22.32470703125, -21.266845703125, -20.208984375, -19.151123046875, -18.09326171875, -17.035400390625, -15.9775390625, -14.919677734375, -13.86181640625, -12.803955078125, -11.74609375, -10.688232421875, -9.63037109375, -8.572509765625, -7.5146484375, -6.456787109375, -5.39892578125, -4.341064453125, -3.283203125, -2.225341796875, -1.16748046875, -0.109619140625, 0.9482421875, 2.006103515625, 3.06396484375, 4.121826171875, 5.1796875, 6.237548828125, 7.29541015625, 8.353271484375, 9.4111328125, 10.468994140625, 11.52685546875, 12.584716796875, 13.642578125, 14.700439453125, 15.75830078125, 16.816162109375, 17.8740234375, 18.931884765625, 19.98974609375, 21.047607421875, 22.10546875, 23.163330078125, 24.22119140625, 25.279052734375, 26.3369140625, 27.394775390625, 28.45263671875, 29.510498046875, 30.568359375, 31.626220703125, 32.68408203125, 33.741943359375, 34.7998046875, 35.857666015625, 36.91552734375, 37.973388671875, 39.03125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 17.0, 36.0, 80.0, 146.0, 189.0, 191.0, 150.0, 96.0, 52.0, 22.0, 12.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-143.0394744873047, -140.17984008789062, -137.32020568847656, -134.4605712890625, -131.60093688964844, -128.74130249023438, -125.88166809082031, -123.02203369140625, -120.16239929199219, -117.30276489257812, -114.44313049316406, -111.58349609375, -108.72386169433594, -105.86422729492188, -103.00459289550781, -100.14495849609375, -97.28532409667969, -94.42568969726562, -91.56605529785156, -88.7064208984375, -85.84678649902344, -82.98715209960938, -80.12751770019531, -77.26788330078125, -74.40825653076172, -71.54862213134766, -68.6889877319336, -65.82935333251953, -62.96971893310547, -60.110084533691406, -57.250450134277344, -54.39081573486328, -51.531185150146484, -48.67155075073242, -45.81191635131836, -42.9522819519043, -40.092647552490234, -37.23301315307617, -34.373382568359375, -31.51374626159668, -28.654111862182617, -25.794477462768555, -22.934843063354492, -20.075210571289062, -17.215576171875, -14.355940818786621, -11.496307373046875, -8.636672973632812, -5.77703857421875, -2.9174044132232666, -0.0577702522277832, 2.801863670349121, 5.661498069763184, 8.521132469177246, 11.380765914916992, 14.240400314331055, 17.100034713745117, 19.95966911315918, 22.819303512573242, 25.678936004638672, 28.538570404052734, 31.398204803466797, 34.25783920288086, 37.11747360229492, 39.977108001708984]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 8.0, 9.0, 8.0, 10.0, 15.0, 17.0, 17.0, 27.0, 21.0, 25.0, 32.0, 22.0, 28.0, 30.0, 30.0, 34.0, 35.0, 42.0, 37.0, 34.0, 33.0, 46.0, 41.0, 52.0, 23.0, 34.0, 41.0, 29.0, 24.0, 36.0, 28.0, 20.0, 14.0, 12.0, 12.0, 16.0, 11.0, 10.0, 13.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-41.2037353515625, -40.072757720947266, -38.94178009033203, -37.8108024597168, -36.67982482910156, -35.54884719848633, -34.417869567871094, -33.28689193725586, -32.155914306640625, -31.02493667602539, -29.893959045410156, -28.762981414794922, -27.632003784179688, -26.501026153564453, -25.37004852294922, -24.239070892333984, -23.10809326171875, -21.977115631103516, -20.84613800048828, -19.715160369873047, -18.584182739257812, -17.453205108642578, -16.322227478027344, -15.19124984741211, -14.060272216796875, -12.92929458618164, -11.798316955566406, -10.667339324951172, -9.536361694335938, -8.405384063720703, -7.274406433105469, -6.143428802490234, -5.012451171875, -3.8814735412597656, -2.7504959106445312, -1.6195182800292969, -0.4885406494140625, 0.6424369812011719, 1.7734146118164062, 2.9043922424316406, 4.035369873046875, 5.166347503662109, 6.297325134277344, 7.428302764892578, 8.559280395507812, 9.690258026123047, 10.821235656738281, 11.952213287353516, 13.08319091796875, 14.214168548583984, 15.345146179199219, 16.476123809814453, 17.607101440429688, 18.738079071044922, 19.869056701660156, 21.00003433227539, 22.131011962890625, 23.26198959350586, 24.392967224121094, 25.523944854736328, 26.654922485351562, 27.785900115966797, 28.91687774658203, 30.047855377197266, 31.1788330078125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 7.0, 6.0, 10.0, 5.0, 8.0, 11.0, 14.0, 17.0, 17.0, 25.0, 22.0, 17.0, 25.0, 34.0, 26.0, 24.0, 27.0, 35.0, 43.0, 35.0, 37.0, 45.0, 51.0, 31.0, 41.0, 40.0, 40.0, 31.0, 28.0, 25.0, 32.0, 23.0, 28.0, 19.0, 25.0, 15.0, 12.0, 12.0, 12.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99859619140625, -3.8682861328125, -3.73797607421875, -3.607666015625, -3.47735595703125, -3.3470458984375, -3.21673583984375, -3.08642578125, -2.95611572265625, -2.8258056640625, -2.69549560546875, -2.565185546875, -2.43487548828125, -2.3045654296875, -2.17425537109375, -2.0439453125, -1.91363525390625, -1.7833251953125, -1.65301513671875, -1.522705078125, -1.39239501953125, -1.2620849609375, -1.13177490234375, -1.00146484375, -0.87115478515625, -0.7408447265625, -0.61053466796875, -0.480224609375, -0.34991455078125, -0.2196044921875, -0.08929443359375, 0.041015625, 0.17132568359375, 0.3016357421875, 0.43194580078125, 0.562255859375, 0.69256591796875, 0.8228759765625, 0.95318603515625, 1.08349609375, 1.21380615234375, 1.3441162109375, 1.47442626953125, 1.604736328125, 1.73504638671875, 1.8653564453125, 1.99566650390625, 2.1259765625, 2.25628662109375, 2.3865966796875, 2.51690673828125, 2.647216796875, 2.77752685546875, 2.9078369140625, 3.03814697265625, 3.16845703125, 3.29876708984375, 3.4290771484375, 3.55938720703125, 3.689697265625, 3.82000732421875, 3.9503173828125, 4.08062744140625, 4.2109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 17.0, 35.0, 54.0, 80.0, 117.0, 164.0, 265.0, 330.0, 515.0, 738.0, 1091.0, 1510.0, 2131.0, 3121.0, 4446.0, 6285.0, 8877.0, 12801.0, 18040.0, 25819.0, 37011.0, 52927.0, 75539.0, 103905.0, 129966.0, 138921.0, 119504.0, 89961.0, 64397.0, 44958.0, 31551.0, 21797.0, 15303.0, 10918.0, 7594.0, 5385.0, 3715.0, 2742.0, 1853.0, 1327.0, 890.0, 580.0, 449.0, 307.0, 201.0, 127.0, 83.0, 71.0, 42.0, 31.0, 16.0, 15.0, 9.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.347900390625, -0.33712005615234375, -0.3263397216796875, -0.31555938720703125, -0.304779052734375, -0.29399871826171875, -0.2832183837890625, -0.27243804931640625, -0.26165771484375, -0.25087738037109375, -0.2400970458984375, -0.22931671142578125, -0.218536376953125, -0.20775604248046875, -0.1969757080078125, -0.18619537353515625, -0.1754150390625, -0.16463470458984375, -0.1538543701171875, -0.14307403564453125, -0.132293701171875, -0.12151336669921875, -0.1107330322265625, -0.09995269775390625, -0.08917236328125, -0.07839202880859375, -0.0676116943359375, -0.05683135986328125, -0.046051025390625, -0.03527069091796875, -0.0244903564453125, -0.01371002197265625, -0.0029296875, 0.00785064697265625, 0.0186309814453125, 0.02941131591796875, 0.040191650390625, 0.05097198486328125, 0.0617523193359375, 0.07253265380859375, 0.08331298828125, 0.09409332275390625, 0.1048736572265625, 0.11565399169921875, 0.126434326171875, 0.13721466064453125, 0.1479949951171875, 0.15877532958984375, 0.1695556640625, 0.18033599853515625, 0.1911163330078125, 0.20189666748046875, 0.212677001953125, 0.22345733642578125, 0.2342376708984375, 0.24501800537109375, 0.25579833984375, 0.26657867431640625, 0.2773590087890625, 0.28813934326171875, 0.298919677734375, 0.30970001220703125, 0.3204803466796875, 0.33126068115234375, 0.342041015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 5.0, 4.0, 10.0, 11.0, 8.0, 11.0, 14.0, 16.0, 20.0, 23.0, 24.0, 31.0, 20.0, 38.0, 29.0, 29.0, 26.0, 27.0, 36.0, 42.0, 45.0, 1065.0, 47.0, 37.0, 40.0, 44.0, 32.0, 32.0, 34.0, 28.0, 26.0, 28.0, 24.0, 19.0, 16.0, 10.0, 11.0, 8.0, 10.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.69140625, -2.60797119140625, -2.5245361328125, -2.44110107421875, -2.357666015625, -2.27423095703125, -2.1907958984375, -2.10736083984375, -2.02392578125, -1.94049072265625, -1.8570556640625, -1.77362060546875, -1.690185546875, -1.60675048828125, -1.5233154296875, -1.43988037109375, -1.3564453125, -1.27301025390625, -1.1895751953125, -1.10614013671875, -1.022705078125, -0.93927001953125, -0.8558349609375, -0.77239990234375, -0.68896484375, -0.60552978515625, -0.5220947265625, -0.43865966796875, -0.355224609375, -0.27178955078125, -0.1883544921875, -0.10491943359375, -0.021484375, 0.06195068359375, 0.1453857421875, 0.22882080078125, 0.312255859375, 0.39569091796875, 0.4791259765625, 0.56256103515625, 0.64599609375, 0.72943115234375, 0.8128662109375, 0.89630126953125, 0.979736328125, 1.06317138671875, 1.1466064453125, 1.23004150390625, 1.3134765625, 1.39691162109375, 1.4803466796875, 1.56378173828125, 1.647216796875, 1.73065185546875, 1.8140869140625, 1.89752197265625, 1.98095703125, 2.06439208984375, 2.1478271484375, 2.23126220703125, 2.314697265625, 2.39813232421875, 2.4815673828125, 2.56500244140625, 2.6484375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 12.0, 5.0, 17.0, 28.0, 53.0, 64.0, 89.0, 165.0, 262.0, 374.0, 526.0, 835.0, 1143.0, 1747.0, 2575.0, 3714.0, 5847.0, 8698.0, 12935.0, 19500.0, 29375.0, 43684.0, 62927.0, 87119.0, 113377.0, 920167.0, 392936.0, 112132.0, 86078.0, 62037.0, 42681.0, 28773.0, 19044.0, 12495.0, 8596.0, 5622.0, 3736.0, 2615.0, 1720.0, 1120.0, 825.0, 523.0, 340.0, 233.0, 132.0, 106.0, 65.0, 35.0, 21.0, 16.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.285888671875, -0.2772178649902344, -0.26854705810546875, -0.2598762512207031, -0.2512054443359375, -0.24253463745117188, -0.23386383056640625, -0.22519302368164062, -0.216522216796875, -0.20785140991210938, -0.19918060302734375, -0.19050979614257812, -0.1818389892578125, -0.17316818237304688, -0.16449737548828125, -0.15582656860351562, -0.14715576171875, -0.13848495483398438, -0.12981414794921875, -0.12114334106445312, -0.1124725341796875, -0.10380172729492188, -0.09513092041015625, -0.08646011352539062, -0.077789306640625, -0.06911849975585938, -0.06044769287109375, -0.051776885986328125, -0.0431060791015625, -0.034435272216796875, -0.02576446533203125, -0.017093658447265625, -0.0084228515625, 0.000247955322265625, 0.00891876220703125, 0.017589569091796875, 0.0262603759765625, 0.034931182861328125, 0.04360198974609375, 0.052272796630859375, 0.060943603515625, 0.06961441040039062, 0.07828521728515625, 0.08695602416992188, 0.0956268310546875, 0.10429763793945312, 0.11296844482421875, 0.12163925170898438, 0.13031005859375, 0.13898086547851562, 0.14765167236328125, 0.15632247924804688, 0.1649932861328125, 0.17366409301757812, 0.18233489990234375, 0.19100570678710938, 0.199676513671875, 0.20834732055664062, 0.21701812744140625, 0.22568893432617188, 0.2343597412109375, 0.24303054809570312, 0.25170135498046875, 0.2603721618652344, 0.26904296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 2.0, 5.0, 13.0, 10.0, 20.0, 25.0, 30.0, 38.0, 66.0, 90.0, 112.0, 111.0, 97.0, 97.0, 78.0, 50.0, 43.0, 20.0, 25.0, 14.0, 8.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00553131103515625, -0.005381345748901367, -0.005231380462646484, -0.0050814151763916016, -0.004931449890136719, -0.004781484603881836, -0.004631519317626953, -0.00448155403137207, -0.0043315887451171875, -0.004181623458862305, -0.004031658172607422, -0.003881692886352539, -0.0037317276000976562, -0.0035817623138427734, -0.0034317970275878906, -0.003281831741333008, -0.003131866455078125, -0.002981901168823242, -0.0028319358825683594, -0.0026819705963134766, -0.0025320053100585938, -0.002382040023803711, -0.002232074737548828, -0.0020821094512939453, -0.0019321441650390625, -0.0017821788787841797, -0.0016322135925292969, -0.001482248306274414, -0.0013322830200195312, -0.0011823177337646484, -0.0010323524475097656, -0.0008823871612548828, -0.000732421875, -0.0005824565887451172, -0.0004324913024902344, -0.00028252601623535156, -0.00013256072998046875, 1.7404556274414062e-05, 0.00016736984252929688, 0.0003173351287841797, 0.0004673004150390625, 0.0006172657012939453, 0.0007672309875488281, 0.0009171962738037109, 0.0010671615600585938, 0.0012171268463134766, 0.0013670921325683594, 0.0015170574188232422, 0.001667022705078125, 0.0018169879913330078, 0.0019669532775878906, 0.0021169185638427734, 0.0022668838500976562, 0.002416849136352539, 0.002566814422607422, 0.0027167797088623047, 0.0028667449951171875, 0.0030167102813720703, 0.003166675567626953, 0.003316640853881836, 0.0034666061401367188, 0.0036165714263916016, 0.0037665367126464844, 0.003916501998901367, 0.00406646728515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 11.0, 8.0, 16.0, 24.0, 44.0, 41.0, 82.0, 144.0, 274.0, 794.0, 189901.0, 855445.0, 1012.0, 307.0, 166.0, 95.0, 54.0, 30.0, 28.0, 13.0, 13.0, 11.0, 5.0, 5.0, 0.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08229255676269531, -0.07913589477539062, -0.07597923278808594, -0.07282257080078125, -0.06966590881347656, -0.06650924682617188, -0.06335258483886719, -0.0601959228515625, -0.05703926086425781, -0.053882598876953125, -0.05072593688964844, -0.04756927490234375, -0.04441261291503906, -0.041255950927734375, -0.03809928894042969, -0.034942626953125, -0.03178596496582031, -0.028629302978515625, -0.025472640991210938, -0.02231597900390625, -0.019159317016601562, -0.016002655029296875, -0.012845993041992188, -0.0096893310546875, -0.0065326690673828125, -0.003376007080078125, -0.0002193450927734375, 0.00293731689453125, 0.0060939788818359375, 0.009250640869140625, 0.012407302856445312, 0.01556396484375, 0.018720626831054688, 0.021877288818359375, 0.025033950805664062, 0.02819061279296875, 0.03134727478027344, 0.034503936767578125, 0.03766059875488281, 0.0408172607421875, 0.04397392272949219, 0.047130584716796875, 0.05028724670410156, 0.05344390869140625, 0.05660057067871094, 0.059757232666015625, 0.06291389465332031, 0.066070556640625, 0.06922721862792969, 0.07238388061523438, 0.07554054260253906, 0.07869720458984375, 0.08185386657714844, 0.08501052856445312, 0.08816719055175781, 0.0913238525390625, 0.09448051452636719, 0.09763717651367188, 0.10079383850097656, 0.10395050048828125, 0.10710716247558594, 0.11026382446289062, 0.11342048645019531, 0.1165771484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 947.0, 67.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006667268928140402, -0.005268405191600323, -0.0038695409893989563, -0.002470677252858877, -0.0010718130506575108, 0.00032705115154385567, 0.0017259144224226475, 0.003124778624624014, 0.00452364282682538, 0.0059225065633654594, 0.007321370765566826, 0.008720234036445618, 0.010119099169969559, 0.01151796244084835, 0.012916825711727142, 0.014315690845251083, 0.015714554116129875, 0.017113417387008667, 0.018512282520532608, 0.0199111457914114, 0.02131000906229019, 0.022708874195814133, 0.024107737466692924, 0.025506600737571716, 0.026905465871095657, 0.02830432914197445, 0.02970319427549839, 0.031102057546377182, 0.03250092267990112, 0.033899784088134766, 0.03529864922165871, 0.03669751435518265, 0.03809637576341629, 0.03949524089694023, 0.040894102305173874, 0.042292967438697815, 0.043691832572221756, 0.0450906977057457, 0.04648955911397934, 0.04788842424750328, 0.04928728938102722, 0.05068615451455116, 0.052085015922784805, 0.053483881056308746, 0.05488274618983269, 0.05628161132335663, 0.05768047273159027, 0.05907933786511421, 0.060478199273347855, 0.061877064406871796, 0.06327592581510544, 0.06467479467391968, 0.06607365608215332, 0.06747251749038696, 0.0688713788986206, 0.07027024775743484, 0.07166910916566849, 0.07306797057390213, 0.07446683943271637, 0.07586570084095001, 0.07726456224918365, 0.0786634311079979, 0.08006229251623154, 0.08146115392446518, 0.08286002278327942]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 14.0, 15.0, 19.0, 31.0, 38.0, 37.0, 47.0, 51.0, 57.0, 54.0, 62.0, 70.0, 55.0, 65.0, 55.0, 51.0, 48.0, 56.0, 28.0, 22.0, 28.0, 19.0, 14.0, 8.0, 13.0, 4.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.003915548324584961, -0.0038236798718571663, -0.0037318114191293716, -0.003639942966401577, -0.0035480745136737823, -0.0034562060609459877, -0.003364337608218193, -0.0032724691554903984, -0.0031806007027626038, -0.003088732250034809, -0.0029968637973070145, -0.00290499534457922, -0.002813126891851425, -0.0027212584391236305, -0.002629389986395836, -0.0025375215336680412, -0.0024456530809402466, -0.002353784628212452, -0.0022619161754846573, -0.0021700477227568626, -0.002078179270029068, -0.0019863108173012733, -0.0018944423645734787, -0.001802573911845684, -0.0017107054591178894, -0.0016188370063900948, -0.0015269685536623001, -0.0014351001009345055, -0.0013432316482067108, -0.0012513631954789162, -0.0011594947427511215, -0.0010676262900233269, -0.0009757578372955322, -0.0008838893845677376, -0.0007920209318399429, -0.0007001524791121483, -0.0006082840263843536, -0.000516415573656559, -0.00042454712092876434, -0.0003326786682009697, -0.00024081021547317505, -0.0001489417627453804, -5.7073310017585754e-05, 3.479514271020889e-05, 0.00012666359543800354, 0.0002185320481657982, 0.00031040050089359283, 0.0004022689536213875, 0.0004941374063491821, 0.0005860058590769768, 0.0006778743118047714, 0.0007697427645325661, 0.0008616112172603607, 0.0009534796699881554, 0.00104534812271595, 0.0011372165754437447, 0.0012290850281715393, 0.001320953480899334, 0.0014128219336271286, 0.0015046903863549232, 0.001596558839082718, 0.0016884272918105125, 0.0017802957445383072, 0.0018721641972661018, 0.0019640326499938965]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 7.0, 6.0, 10.0, 5.0, 8.0, 11.0, 14.0, 17.0, 17.0, 25.0, 22.0, 17.0, 25.0, 34.0, 26.0, 24.0, 27.0, 35.0, 43.0, 35.0, 37.0, 45.0, 51.0, 31.0, 41.0, 41.0, 39.0, 31.0, 28.0, 25.0, 32.0, 23.0, 28.0, 19.0, 25.0, 15.0, 12.0, 12.0, 12.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99859619140625, -3.8682861328125, -3.73797607421875, -3.607666015625, -3.47735595703125, -3.3470458984375, -3.21673583984375, -3.08642578125, -2.95611572265625, -2.8258056640625, -2.69549560546875, -2.565185546875, -2.43487548828125, -2.3045654296875, -2.17425537109375, -2.0439453125, -1.91363525390625, -1.7833251953125, -1.65301513671875, -1.522705078125, -1.39239501953125, -1.2620849609375, -1.13177490234375, -1.00146484375, -0.87115478515625, -0.7408447265625, -0.61053466796875, -0.480224609375, -0.34991455078125, -0.2196044921875, -0.08929443359375, 0.041015625, 0.17132568359375, 0.3016357421875, 0.43194580078125, 0.562255859375, 0.69256591796875, 0.8228759765625, 0.95318603515625, 1.08349609375, 1.21380615234375, 1.3441162109375, 1.47442626953125, 1.604736328125, 1.73504638671875, 1.8653564453125, 1.99566650390625, 2.1259765625, 2.25628662109375, 2.3865966796875, 2.51690673828125, 2.647216796875, 2.77752685546875, 2.9078369140625, 3.03814697265625, 3.16845703125, 3.29876708984375, 3.4290771484375, 3.55938720703125, 3.689697265625, 3.82000732421875, 3.9503173828125, 4.08062744140625, 4.2109375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 5.0, 10.0, 8.0, 13.0, 17.0, 17.0, 28.0, 48.0, 70.0, 71.0, 120.0, 125.0, 200.0, 307.0, 422.0, 689.0, 1124.0, 1761.0, 3305.0, 5811.0, 11400.0, 23870.0, 59501.0, 180321.0, 431481.0, 207831.0, 66272.0, 26337.0, 12304.0, 6257.0, 3429.0, 1921.0, 1186.0, 727.0, 426.0, 319.0, 230.0, 148.0, 118.0, 79.0, 53.0, 51.0, 33.0, 26.0, 23.0, 15.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.01171875, -3.88043212890625, -3.7491455078125, -3.61785888671875, -3.486572265625, -3.35528564453125, -3.2239990234375, -3.09271240234375, -2.96142578125, -2.83013916015625, -2.6988525390625, -2.56756591796875, -2.436279296875, -2.30499267578125, -2.1737060546875, -2.04241943359375, -1.9111328125, -1.77984619140625, -1.6485595703125, -1.51727294921875, -1.385986328125, -1.25469970703125, -1.1234130859375, -0.99212646484375, -0.86083984375, -0.72955322265625, -0.5982666015625, -0.46697998046875, -0.335693359375, -0.20440673828125, -0.0731201171875, 0.05816650390625, 0.189453125, 0.32073974609375, 0.4520263671875, 0.58331298828125, 0.714599609375, 0.84588623046875, 0.9771728515625, 1.10845947265625, 1.23974609375, 1.37103271484375, 1.5023193359375, 1.63360595703125, 1.764892578125, 1.89617919921875, 2.0274658203125, 2.15875244140625, 2.2900390625, 2.42132568359375, 2.5526123046875, 2.68389892578125, 2.815185546875, 2.94647216796875, 3.0777587890625, 3.20904541015625, 3.34033203125, 3.47161865234375, 3.6029052734375, 3.73419189453125, 3.865478515625, 3.99676513671875, 4.1280517578125, 4.25933837890625, 4.390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 7.0, 11.0, 25.0, 16.0, 18.0, 29.0, 28.0, 31.0, 39.0, 33.0, 42.0, 31.0, 45.0, 93.0, 163.0, 1562.0, 292.0, 129.0, 69.0, 50.0, 40.0, 43.0, 30.0, 39.0, 24.0, 27.0, 16.0, 16.0, 10.0, 16.0, 6.0, 12.0, 5.0, 6.0, 6.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-16.5, -15.98046875, -15.4609375, -14.94140625, -14.421875, -13.90234375, -13.3828125, -12.86328125, -12.34375, -11.82421875, -11.3046875, -10.78515625, -10.265625, -9.74609375, -9.2265625, -8.70703125, -8.1875, -7.66796875, -7.1484375, -6.62890625, -6.109375, -5.58984375, -5.0703125, -4.55078125, -4.03125, -3.51171875, -2.9921875, -2.47265625, -1.953125, -1.43359375, -0.9140625, -0.39453125, 0.125, 0.64453125, 1.1640625, 1.68359375, 2.203125, 2.72265625, 3.2421875, 3.76171875, 4.28125, 4.80078125, 5.3203125, 5.83984375, 6.359375, 6.87890625, 7.3984375, 7.91796875, 8.4375, 8.95703125, 9.4765625, 9.99609375, 10.515625, 11.03515625, 11.5546875, 12.07421875, 12.59375, 13.11328125, 13.6328125, 14.15234375, 14.671875, 15.19140625, 15.7109375, 16.23046875, 16.75]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 16.0, 30.0, 29.0, 46.0, 57.0, 109.0, 123.0, 213.0, 316.0, 828.0, 4674.0, 500961.0, 2628223.0, 7828.0, 998.0, 370.0, 267.0, 137.0, 109.0, 62.0, 48.0, 39.0, 19.0, 28.0, 28.0, 19.0, 8.0, 10.0, 9.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.73486328125, -30.5634765625, -29.39208984375, -28.220703125, -27.04931640625, -25.8779296875, -24.70654296875, -23.53515625, -22.36376953125, -21.1923828125, -20.02099609375, -18.849609375, -17.67822265625, -16.5068359375, -15.33544921875, -14.1640625, -12.99267578125, -11.8212890625, -10.64990234375, -9.478515625, -8.30712890625, -7.1357421875, -5.96435546875, -4.79296875, -3.62158203125, -2.4501953125, -1.27880859375, -0.107421875, 1.06396484375, 2.2353515625, 3.40673828125, 4.578125, 5.74951171875, 6.9208984375, 8.09228515625, 9.263671875, 10.43505859375, 11.6064453125, 12.77783203125, 13.94921875, 15.12060546875, 16.2919921875, 17.46337890625, 18.634765625, 19.80615234375, 20.9775390625, 22.14892578125, 23.3203125, 24.49169921875, 25.6630859375, 26.83447265625, 28.005859375, 29.17724609375, 30.3486328125, 31.52001953125, 32.69140625, 33.86279296875, 35.0341796875, 36.20556640625, 37.376953125, 38.54833984375, 39.7197265625, 40.89111328125, 42.0625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 710.0, 300.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-384.8196716308594, -378.04766845703125, -371.2756652832031, -364.5036926269531, -357.731689453125, -350.9596862792969, -344.18768310546875, -337.4156799316406, -330.6436767578125, -323.8716735839844, -317.09967041015625, -310.32769775390625, -303.5556945800781, -296.78369140625, -290.0116882324219, -283.23968505859375, -276.46771240234375, -269.6957092285156, -262.9237060546875, -256.1517333984375, -249.37973022460938, -242.60772705078125, -235.83572387695312, -229.063720703125, -222.29173278808594, -215.5197296142578, -208.74774169921875, -201.97573852539062, -195.2037353515625, -188.43174743652344, -181.6597442626953, -174.88775634765625, -168.11575317382812, -161.34375, -154.57176208496094, -147.7997589111328, -141.02777099609375, -134.25576782226562, -127.4837646484375, -120.7117691040039, -113.93977355957031, -107.16777801513672, -100.39578247070312, -93.623779296875, -86.8517837524414, -80.07978820800781, -73.30778503417969, -66.5357894897461, -59.7637939453125, -52.991798400878906, -46.21979904174805, -39.44779968261719, -32.675804138183594, -25.90380859375, -19.13180923461914, -12.359809875488281, -5.5878143310546875, 1.184183120727539, 7.956180572509766, 14.728178024291992, 21.50017547607422, 28.272171020507812, 35.04417037963867, 41.81616973876953, 48.588165283203125]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 12.0, 6.0, 13.0, 7.0, 9.0, 17.0, 17.0, 19.0, 17.0, 32.0, 35.0, 28.0, 31.0, 32.0, 36.0, 35.0, 32.0, 44.0, 47.0, 46.0, 48.0, 40.0, 33.0, 29.0, 44.0, 53.0, 34.0, 33.0, 29.0, 18.0, 23.0, 14.0, 18.0, 10.0, 13.0, 17.0, 7.0, 5.0, 7.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-45.09357452392578, -43.77781677246094, -42.462059020996094, -41.146297454833984, -39.83053970336914, -38.5147819519043, -37.19902038574219, -35.883262634277344, -34.5675048828125, -33.251747131347656, -31.93598747253418, -30.620227813720703, -29.30447006225586, -27.988712310791016, -26.67295265197754, -25.357192993164062, -24.04143524169922, -22.725677490234375, -21.4099178314209, -20.094158172607422, -18.778400421142578, -17.462642669677734, -16.146883010864258, -14.831124305725098, -13.515365600585938, -12.199606895446777, -10.883848190307617, -9.568089485168457, -8.252330780029297, -6.936572074890137, -5.620813369750977, -4.305054664611816, -2.9892959594726562, -1.673537254333496, -0.35777854919433594, 0.9579801559448242, 2.2737388610839844, 3.5894975662231445, 4.905256271362305, 6.221014976501465, 7.536773681640625, 8.852532386779785, 10.168291091918945, 11.484049797058105, 12.799808502197266, 14.115567207336426, 15.431325912475586, 16.747085571289062, 18.062843322753906, 19.37860107421875, 20.694360733032227, 22.010120391845703, 23.325878143310547, 24.64163589477539, 25.957395553588867, 27.273155212402344, 28.588912963867188, 29.90467071533203, 31.220430374145508, 32.536190032958984, 33.85194778442383, 35.16770553588867, 36.48346710205078, 37.799224853515625, 39.11498260498047]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 4.0, 4.0, 10.0, 7.0, 9.0, 5.0, 15.0, 10.0, 18.0, 11.0, 27.0, 14.0, 29.0, 21.0, 27.0, 27.0, 27.0, 31.0, 27.0, 33.0, 44.0, 31.0, 36.0, 47.0, 52.0, 43.0, 34.0, 30.0, 29.0, 37.0, 25.0, 29.0, 20.0, 25.0, 34.0, 17.0, 15.0, 16.0, 10.0, 13.0, 13.0, 6.0, 9.0, 9.0, 2.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.2421875, -4.11016845703125, -3.9781494140625, -3.84613037109375, -3.714111328125, -3.58209228515625, -3.4500732421875, -3.31805419921875, -3.18603515625, -3.05401611328125, -2.9219970703125, -2.78997802734375, -2.657958984375, -2.52593994140625, -2.3939208984375, -2.26190185546875, -2.1298828125, -1.99786376953125, -1.8658447265625, -1.73382568359375, -1.601806640625, -1.46978759765625, -1.3377685546875, -1.20574951171875, -1.07373046875, -0.94171142578125, -0.8096923828125, -0.67767333984375, -0.545654296875, -0.41363525390625, -0.2816162109375, -0.14959716796875, -0.017578125, 0.11444091796875, 0.2464599609375, 0.37847900390625, 0.510498046875, 0.64251708984375, 0.7745361328125, 0.90655517578125, 1.03857421875, 1.17059326171875, 1.3026123046875, 1.43463134765625, 1.566650390625, 1.69866943359375, 1.8306884765625, 1.96270751953125, 2.0947265625, 2.22674560546875, 2.3587646484375, 2.49078369140625, 2.622802734375, 2.75482177734375, 2.8868408203125, 3.01885986328125, 3.15087890625, 3.28289794921875, 3.4149169921875, 3.54693603515625, 3.678955078125, 3.81097412109375, 3.9429931640625, 4.07501220703125, 4.20703125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 2.0, 8.0, 7.0, 9.0, 21.0, 20.0, 13.0, 20.0, 17.0, 31.0, 34.0, 43.0, 31.0, 61.0, 104.0, 152.0, 265.0, 1105.0, 6439.0, 91973.0, 2947615.0, 1111563.0, 30169.0, 3170.0, 657.0, 215.0, 117.0, 75.0, 49.0, 51.0, 48.0, 30.0, 25.0, 27.0, 18.0, 15.0, 11.0, 11.0, 11.0, 6.0, 5.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.15625, -19.502197265625, -18.84814453125, -18.194091796875, -17.5400390625, -16.885986328125, -16.23193359375, -15.577880859375, -14.923828125, -14.269775390625, -13.61572265625, -12.961669921875, -12.3076171875, -11.653564453125, -10.99951171875, -10.345458984375, -9.69140625, -9.037353515625, -8.38330078125, -7.729248046875, -7.0751953125, -6.421142578125, -5.76708984375, -5.113037109375, -4.458984375, -3.804931640625, -3.15087890625, -2.496826171875, -1.8427734375, -1.188720703125, -0.53466796875, 0.119384765625, 0.7734375, 1.427490234375, 2.08154296875, 2.735595703125, 3.3896484375, 4.043701171875, 4.69775390625, 5.351806640625, 6.005859375, 6.659912109375, 7.31396484375, 7.968017578125, 8.6220703125, 9.276123046875, 9.93017578125, 10.584228515625, 11.23828125, 11.892333984375, 12.54638671875, 13.200439453125, 13.8544921875, 14.508544921875, 15.16259765625, 15.816650390625, 16.470703125, 17.124755859375, 17.77880859375, 18.432861328125, 19.0869140625, 19.740966796875, 20.39501953125, 21.049072265625, 21.703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 17.0, 12.0, 27.0, 27.0, 49.0, 70.0, 101.0, 124.0, 181.0, 264.0, 374.0, 530.0, 565.0, 537.0, 363.0, 278.0, 188.0, 104.0, 81.0, 62.0, 37.0, 28.0, 12.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.734375, -16.274658203125, -15.81494140625, -15.355224609375, -14.8955078125, -14.435791015625, -13.97607421875, -13.516357421875, -13.056640625, -12.596923828125, -12.13720703125, -11.677490234375, -11.2177734375, -10.758056640625, -10.29833984375, -9.838623046875, -9.37890625, -8.919189453125, -8.45947265625, -7.999755859375, -7.5400390625, -7.080322265625, -6.62060546875, -6.160888671875, -5.701171875, -5.241455078125, -4.78173828125, -4.322021484375, -3.8623046875, -3.402587890625, -2.94287109375, -2.483154296875, -2.0234375, -1.563720703125, -1.10400390625, -0.644287109375, -0.1845703125, 0.275146484375, 0.73486328125, 1.194580078125, 1.654296875, 2.114013671875, 2.57373046875, 3.033447265625, 3.4931640625, 3.952880859375, 4.41259765625, 4.872314453125, 5.33203125, 5.791748046875, 6.25146484375, 6.711181640625, 7.1708984375, 7.630615234375, 8.09033203125, 8.550048828125, 9.009765625, 9.469482421875, 9.92919921875, 10.388916015625, 10.8486328125, 11.308349609375, 11.76806640625, 12.227783203125, 12.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 10.0, 8.0, 12.0, 12.0, 34.0, 37.0, 38.0, 51.0, 77.0, 107.0, 161.0, 258.0, 497.0, 1272.0, 6618.0, 255793.0, 3822358.0, 100643.0, 4110.0, 934.0, 439.0, 245.0, 163.0, 106.0, 84.0, 61.0, 45.0, 36.0, 30.0, 13.0, 11.0, 8.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.06396484375, -33.7841796875, -32.50439453125, -31.224609375, -29.94482421875, -28.6650390625, -27.38525390625, -26.10546875, -24.82568359375, -23.5458984375, -22.26611328125, -20.986328125, -19.70654296875, -18.4267578125, -17.14697265625, -15.8671875, -14.58740234375, -13.3076171875, -12.02783203125, -10.748046875, -9.46826171875, -8.1884765625, -6.90869140625, -5.62890625, -4.34912109375, -3.0693359375, -1.78955078125, -0.509765625, 0.77001953125, 2.0498046875, 3.32958984375, 4.609375, 5.88916015625, 7.1689453125, 8.44873046875, 9.728515625, 11.00830078125, 12.2880859375, 13.56787109375, 14.84765625, 16.12744140625, 17.4072265625, 18.68701171875, 19.966796875, 21.24658203125, 22.5263671875, 23.80615234375, 25.0859375, 26.36572265625, 27.6455078125, 28.92529296875, 30.205078125, 31.48486328125, 32.7646484375, 34.04443359375, 35.32421875, 36.60400390625, 37.8837890625, 39.16357421875, 40.443359375, 41.72314453125, 43.0029296875, 44.28271484375, 45.5625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 15.0, 44.0, 56.0, 81.0, 102.0, 162.0, 142.0, 131.0, 101.0, 76.0, 46.0, 18.0, 10.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.72013473510742, -57.4682731628418, -55.216407775878906, -52.96454620361328, -50.71268081665039, -48.460819244384766, -46.208953857421875, -43.95709228515625, -41.705230712890625, -39.453369140625, -37.20150375366211, -34.949642181396484, -32.697776794433594, -30.44591522216797, -28.19405174255371, -25.942188262939453, -23.690322875976562, -21.438459396362305, -19.186595916748047, -16.934734344482422, -14.682869911193848, -12.43100643157959, -10.179143905639648, -7.927280426025391, -5.675416946411133, -3.423553705215454, -1.1716904640197754, 1.0801725387573242, 3.332036018371582, 5.58389949798584, 7.835762023925781, 10.087625503540039, 12.339492797851562, 14.59135627746582, 16.843219757080078, 19.095081329345703, 21.346946716308594, 23.59880828857422, 25.850671768188477, 28.102535247802734, 30.354398727416992, 32.60626220703125, 34.858123779296875, 37.109989166259766, 39.36185073852539, 41.61371612548828, 43.865577697753906, 46.11743927001953, 48.36930465698242, 50.62116622924805, 52.87303161621094, 55.12489318847656, 57.37675857543945, 59.62862014770508, 61.88048553466797, 64.1323471069336, 66.38420867919922, 68.63607025146484, 70.88793182373047, 73.13980102539062, 75.39166259765625, 77.64352416992188, 79.8953857421875, 82.14724731445312, 84.39911651611328]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 8.0, 4.0, 8.0, 13.0, 14.0, 11.0, 22.0, 21.0, 14.0, 19.0, 26.0, 19.0, 31.0, 31.0, 33.0, 23.0, 36.0, 40.0, 31.0, 31.0, 37.0, 41.0, 37.0, 35.0, 40.0, 41.0, 41.0, 34.0, 29.0, 26.0, 26.0, 28.0, 27.0, 11.0, 9.0, 20.0, 9.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-38.279693603515625, -37.09001922607422, -35.90034866333008, -34.71067428588867, -33.52100372314453, -32.331329345703125, -31.14165496826172, -29.951982498168945, -28.762310028076172, -27.5726375579834, -26.382965087890625, -25.19329071044922, -24.003618240356445, -22.813945770263672, -21.624271392822266, -20.434598922729492, -19.24492645263672, -18.055253982543945, -16.865581512451172, -15.675907135009766, -14.486234664916992, -13.296562194824219, -12.106888771057129, -10.917215347290039, -9.727542877197266, -8.537870407104492, -7.348196983337402, -6.158524036407471, -4.968851089477539, -3.7791781425476074, -2.589505195617676, -1.399831771850586, -0.2101593017578125, 0.9795136451721191, 2.169186592102051, 3.3588595390319824, 4.548532485961914, 5.738205432891846, 6.927878379821777, 8.117551803588867, 9.30722427368164, 10.496896743774414, 11.686570167541504, 12.876243591308594, 14.065916061401367, 15.25558853149414, 16.445262908935547, 17.63493537902832, 18.824607849121094, 20.014280319213867, 21.20395278930664, 22.393627166748047, 23.58329963684082, 24.772972106933594, 25.962646484375, 27.152318954467773, 28.341991424560547, 29.53166389465332, 30.721336364746094, 31.9110107421875, 33.100685119628906, 34.29035568237305, 35.48003005981445, 36.669700622558594, 37.859375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 7.0, 9.0, 3.0, 14.0, 11.0, 16.0, 14.0, 17.0, 25.0, 10.0, 21.0, 23.0, 33.0, 33.0, 33.0, 25.0, 29.0, 31.0, 45.0, 36.0, 35.0, 42.0, 39.0, 36.0, 40.0, 34.0, 34.0, 44.0, 20.0, 29.0, 35.0, 26.0, 22.0, 20.0, 17.0, 20.0, 18.0, 11.0, 9.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.33807373046875, -4.1995849609375, -4.06109619140625, -3.922607421875, -3.78411865234375, -3.6456298828125, -3.50714111328125, -3.36865234375, -3.23016357421875, -3.0916748046875, -2.95318603515625, -2.814697265625, -2.67620849609375, -2.5377197265625, -2.39923095703125, -2.2607421875, -2.12225341796875, -1.9837646484375, -1.84527587890625, -1.706787109375, -1.56829833984375, -1.4298095703125, -1.29132080078125, -1.15283203125, -1.01434326171875, -0.8758544921875, -0.73736572265625, -0.598876953125, -0.46038818359375, -0.3218994140625, -0.18341064453125, -0.044921875, 0.09356689453125, 0.2320556640625, 0.37054443359375, 0.509033203125, 0.64752197265625, 0.7860107421875, 0.92449951171875, 1.06298828125, 1.20147705078125, 1.3399658203125, 1.47845458984375, 1.616943359375, 1.75543212890625, 1.8939208984375, 2.03240966796875, 2.1708984375, 2.30938720703125, 2.4478759765625, 2.58636474609375, 2.724853515625, 2.86334228515625, 3.0018310546875, 3.14031982421875, 3.27880859375, 3.41729736328125, 3.5557861328125, 3.69427490234375, 3.832763671875, 3.97125244140625, 4.1097412109375, 4.24822998046875, 4.38671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 8.0, 20.0, 27.0, 33.0, 60.0, 75.0, 124.0, 144.0, 270.0, 433.0, 669.0, 1031.0, 1668.0, 2630.0, 3945.0, 6294.0, 9757.0, 15310.0, 24087.0, 37600.0, 58950.0, 91491.0, 133059.0, 167645.0, 158597.0, 117634.0, 78265.0, 50238.0, 31966.0, 20191.0, 13017.0, 8297.0, 5275.0, 3501.0, 2236.0, 1532.0, 895.0, 587.0, 375.0, 225.0, 144.0, 80.0, 49.0, 37.0, 28.0, 15.0, 16.0, 7.0, 10.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0], "bins": [-0.468994140625, -0.45470428466796875, -0.4404144287109375, -0.42612457275390625, -0.411834716796875, -0.39754486083984375, -0.3832550048828125, -0.36896514892578125, -0.35467529296875, -0.34038543701171875, -0.3260955810546875, -0.31180572509765625, -0.297515869140625, -0.28322601318359375, -0.2689361572265625, -0.25464630126953125, -0.2403564453125, -0.22606658935546875, -0.2117767333984375, -0.19748687744140625, -0.183197021484375, -0.16890716552734375, -0.1546173095703125, -0.14032745361328125, -0.12603759765625, -0.11174774169921875, -0.0974578857421875, -0.08316802978515625, -0.068878173828125, -0.05458831787109375, -0.0402984619140625, -0.02600860595703125, -0.01171875, 0.00257110595703125, 0.0168609619140625, 0.03115081787109375, 0.045440673828125, 0.05973052978515625, 0.0740203857421875, 0.08831024169921875, 0.10260009765625, 0.11688995361328125, 0.1311798095703125, 0.14546966552734375, 0.159759521484375, 0.17404937744140625, 0.1883392333984375, 0.20262908935546875, 0.2169189453125, 0.23120880126953125, 0.2454986572265625, 0.25978851318359375, 0.274078369140625, 0.28836822509765625, 0.3026580810546875, 0.31694793701171875, 0.33123779296875, 0.34552764892578125, 0.3598175048828125, 0.37410736083984375, 0.388397216796875, 0.40268707275390625, 0.4169769287109375, 0.43126678466796875, 0.445556640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 10.0, 12.0, 12.0, 21.0, 22.0, 25.0, 33.0, 18.0, 29.0, 32.0, 36.0, 37.0, 49.0, 50.0, 32.0, 37.0, 1073.0, 47.0, 39.0, 52.0, 27.0, 40.0, 22.0, 32.0, 34.0, 33.0, 27.0, 21.0, 15.0, 8.0, 13.0, 8.0, 15.0, 6.0, 6.0, 5.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.46282958984375, -3.3651123046875, -3.26739501953125, -3.169677734375, -3.07196044921875, -2.9742431640625, -2.87652587890625, -2.77880859375, -2.68109130859375, -2.5833740234375, -2.48565673828125, -2.387939453125, -2.29022216796875, -2.1925048828125, -2.09478759765625, -1.9970703125, -1.89935302734375, -1.8016357421875, -1.70391845703125, -1.606201171875, -1.50848388671875, -1.4107666015625, -1.31304931640625, -1.21533203125, -1.11761474609375, -1.0198974609375, -0.92218017578125, -0.824462890625, -0.72674560546875, -0.6290283203125, -0.53131103515625, -0.43359375, -0.33587646484375, -0.2381591796875, -0.14044189453125, -0.042724609375, 0.05499267578125, 0.1527099609375, 0.25042724609375, 0.34814453125, 0.44586181640625, 0.5435791015625, 0.64129638671875, 0.739013671875, 0.83673095703125, 0.9344482421875, 1.03216552734375, 1.1298828125, 1.22760009765625, 1.3253173828125, 1.42303466796875, 1.520751953125, 1.61846923828125, 1.7161865234375, 1.81390380859375, 1.91162109375, 2.00933837890625, 2.1070556640625, 2.20477294921875, 2.302490234375, 2.40020751953125, 2.4979248046875, 2.59564208984375, 2.693359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 6.0, 16.0, 9.0, 23.0, 26.0, 51.0, 77.0, 112.0, 180.0, 251.0, 386.0, 540.0, 750.0, 1073.0, 1530.0, 2197.0, 3167.0, 4538.0, 6674.0, 9379.0, 13592.0, 19943.0, 28496.0, 40419.0, 56414.0, 76108.0, 97565.0, 115900.0, 1169270.0, 111179.0, 92043.0, 70958.0, 52097.0, 37286.0, 26169.0, 18051.0, 12435.0, 8656.0, 5911.0, 4153.0, 2899.0, 2074.0, 1353.0, 931.0, 725.0, 487.0, 320.0, 242.0, 162.0, 109.0, 69.0, 53.0, 43.0, 19.0, 11.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.2626953125, -0.2543220520019531, -0.24594879150390625, -0.23757553100585938, -0.2292022705078125, -0.22082901000976562, -0.21245574951171875, -0.20408248901367188, -0.195709228515625, -0.18733596801757812, -0.17896270751953125, -0.17058944702148438, -0.1622161865234375, -0.15384292602539062, -0.14546966552734375, -0.13709640502929688, -0.12872314453125, -0.12034988403320312, -0.11197662353515625, -0.10360336303710938, -0.0952301025390625, -0.08685684204101562, -0.07848358154296875, -0.07011032104492188, -0.061737060546875, -0.053363800048828125, -0.04499053955078125, -0.036617279052734375, -0.0282440185546875, -0.019870758056640625, -0.01149749755859375, -0.003124237060546875, 0.0052490234375, 0.013622283935546875, 0.02199554443359375, 0.030368804931640625, 0.0387420654296875, 0.047115325927734375, 0.05548858642578125, 0.06386184692382812, 0.072235107421875, 0.08060836791992188, 0.08898162841796875, 0.09735488891601562, 0.1057281494140625, 0.11410140991210938, 0.12247467041015625, 0.13084793090820312, 0.13922119140625, 0.14759445190429688, 0.15596771240234375, 0.16434097290039062, 0.1727142333984375, 0.18108749389648438, 0.18946075439453125, 0.19783401489257812, 0.206207275390625, 0.21458053588867188, 0.22295379638671875, 0.23132705688476562, 0.2397003173828125, 0.24807357788085938, 0.25644683837890625, 0.2648200988769531, 0.273193359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 8.0, 4.0, 2.0, 4.0, 6.0, 14.0, 9.0, 9.0, 11.0, 23.0, 19.0, 39.0, 35.0, 37.0, 59.0, 60.0, 78.0, 85.0, 85.0, 76.0, 80.0, 44.0, 47.0, 44.0, 28.0, 23.0, 15.0, 13.0, 9.0, 14.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031223297119140625, -0.003030925989151001, -0.0029395222663879395, -0.002848118543624878, -0.0027567148208618164, -0.002665311098098755, -0.0025739073753356934, -0.002482503652572632, -0.0023910999298095703, -0.002299696207046509, -0.0022082924842834473, -0.0021168887615203857, -0.0020254850387573242, -0.0019340813159942627, -0.0018426775932312012, -0.0017512738704681396, -0.0016598701477050781, -0.0015684664249420166, -0.001477062702178955, -0.0013856589794158936, -0.001294255256652832, -0.0012028515338897705, -0.001111447811126709, -0.0010200440883636475, -0.0009286403656005859, -0.0008372366428375244, -0.0007458329200744629, -0.0006544291973114014, -0.0005630254745483398, -0.0004716217517852783, -0.0003802180290222168, -0.0002888143062591553, -0.00019741058349609375, -0.00010600686073303223, -1.4603137969970703e-05, 7.680058479309082e-05, 0.00016820430755615234, 0.00025960803031921387, 0.0003510117530822754, 0.0004424154758453369, 0.0005338191986083984, 0.00062522292137146, 0.0007166266441345215, 0.000808030366897583, 0.0008994340896606445, 0.000990837812423706, 0.0010822415351867676, 0.001173645257949829, 0.0012650489807128906, 0.0013564527034759521, 0.0014478564262390137, 0.0015392601490020752, 0.0016306638717651367, 0.0017220675945281982, 0.0018134713172912598, 0.0019048750400543213, 0.001996278762817383, 0.0020876824855804443, 0.002179086208343506, 0.0022704899311065674, 0.002361893653869629, 0.0024532973766326904, 0.002544701099395752, 0.0026361048221588135, 0.002727508544921875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 8.0, 14.0, 14.0, 18.0, 26.0, 38.0, 47.0, 95.0, 139.0, 268.0, 607.0, 4460.0, 1006589.0, 34455.0, 877.0, 357.0, 165.0, 97.0, 72.0, 41.0, 38.0, 15.0, 17.0, 20.0, 11.0, 10.0, 9.0, 10.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0506591796875, -0.048760414123535156, -0.04686164855957031, -0.04496288299560547, -0.043064117431640625, -0.04116535186767578, -0.03926658630371094, -0.037367820739746094, -0.03546905517578125, -0.033570289611816406, -0.03167152404785156, -0.02977275848388672, -0.027873992919921875, -0.02597522735595703, -0.024076461791992188, -0.022177696228027344, -0.0202789306640625, -0.018380165100097656, -0.016481399536132812, -0.014582633972167969, -0.012683868408203125, -0.010785102844238281, -0.008886337280273438, -0.006987571716308594, -0.00508880615234375, -0.0031900405883789062, -0.0012912750244140625, 0.0006074905395507812, 0.002506256103515625, 0.004405021667480469, 0.0063037872314453125, 0.008202552795410156, 0.010101318359375, 0.012000083923339844, 0.013898849487304688, 0.01579761505126953, 0.017696380615234375, 0.01959514617919922, 0.021493911743164062, 0.023392677307128906, 0.02529144287109375, 0.027190208435058594, 0.029088973999023438, 0.03098773956298828, 0.032886505126953125, 0.03478527069091797, 0.03668403625488281, 0.038582801818847656, 0.0404815673828125, 0.042380332946777344, 0.04427909851074219, 0.04617786407470703, 0.048076629638671875, 0.04997539520263672, 0.05187416076660156, 0.053772926330566406, 0.05567169189453125, 0.057570457458496094, 0.05946922302246094, 0.06136798858642578, 0.06326675415039062, 0.06516551971435547, 0.06706428527832031, 0.06896305084228516, 0.07086181640625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 71.0, 264.0, 471.0, 165.0, 28.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012221758253872395, -0.011974196881055832, -0.01172663550823927, -0.011479075066745281, -0.011231513693928719, -0.010983952321112156, -0.010736390948295593, -0.010488830506801605, -0.010241269133985043, -0.00999370776116848, -0.009746146388351917, -0.00949858594685793, -0.009251024574041367, -0.009003463201224804, -0.008755901828408241, -0.008508341386914253, -0.008260779082775116, -0.008013217709958553, -0.007765656802803278, -0.007518095429986715, -0.00727053452283144, -0.007022973150014877, -0.006775411777198315, -0.006527850870043039, -0.006280289962887764, -0.006032728590071201, -0.005785167682915926, -0.005537606310099363, -0.005290045402944088, -0.005042484030127525, -0.004794922657310963, -0.004547361750155687, -0.004299800843000412, -0.004052239470183849, -0.003804678563028574, -0.0035571171902120113, -0.003309556283056736, -0.0030619949102401733, -0.0028144337702542543, -0.0025668726302683353, -0.00231931172311306, -0.002071750583127141, -0.001824189443141222, -0.0015766281867399812, -0.0013290670467540622, -0.0010815059067681432, -0.0008339446503669024, -0.0005863835103809834, -0.00033882237039506435, -9.12612013053149e-05, 0.00015629996778443456, 0.00040386116597801447, 0.0006514223059639335, 0.0008989834459498525, 0.0011465447023510933, 0.0013941058423370123, 0.0016416669823229313, 0.0018892281223088503, 0.0021367892622947693, 0.002384350635111332, 0.0026319115422666073, 0.00287947291508317, 0.003127034055069089, 0.003374595195055008, 0.003622156335040927]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 8.0, 4.0, 16.0, 18.0, 13.0, 21.0, 21.0, 26.0, 22.0, 36.0, 27.0, 32.0, 27.0, 43.0, 33.0, 44.0, 42.0, 35.0, 33.0, 51.0, 47.0, 37.0, 36.0, 37.0, 36.0, 26.0, 28.0, 28.0, 31.0, 17.0, 19.0, 17.0, 16.0, 11.0, 7.0, 7.0, 7.0, 10.0, 8.0, 2.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0014564990997314453, -0.0014072414487600327, -0.00135798379778862, -0.0013087261468172073, -0.0012594684958457947, -0.001210210844874382, -0.0011609531939029694, -0.0011116955429315567, -0.001062437891960144, -0.0010131802409887314, -0.0009639225900173187, -0.0009146649390459061, -0.0008654072880744934, -0.0008161496371030807, -0.0007668919861316681, -0.0007176343351602554, -0.0006683766841888428, -0.0006191190332174301, -0.0005698613822460175, -0.0005206037312746048, -0.00047134608030319214, -0.0004220884293317795, -0.0003728307783603668, -0.00032357312738895416, -0.0002743154764175415, -0.00022505782544612885, -0.0001758001744747162, -0.00012654252350330353, -7.728487253189087e-05, -2.802722156047821e-05, 2.1230429410934448e-05, 7.048808038234711e-05, 0.00011974573135375977, 0.00016900338232517242, 0.00021826103329658508, 0.00026751868426799774, 0.0003167763352394104, 0.00036603398621082306, 0.0004152916371822357, 0.0004645492881536484, 0.000513806939125061, 0.0005630645900964737, 0.0006123222410678864, 0.000661579892039299, 0.0007108375430107117, 0.0007600951939821243, 0.000809352844953537, 0.0008586104959249496, 0.0009078681468963623, 0.000957125797867775, 0.0010063834488391876, 0.0010556410998106003, 0.001104898750782013, 0.0011541564017534256, 0.0012034140527248383, 0.001252671703696251, 0.0013019293546676636, 0.0013511870056390762, 0.001400444656610489, 0.0014497023075819016, 0.0014989599585533142, 0.0015482176095247269, 0.0015974752604961395, 0.0016467329114675522, 0.0016959905624389648]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 7.0, 9.0, 3.0, 14.0, 11.0, 16.0, 14.0, 17.0, 25.0, 10.0, 21.0, 23.0, 33.0, 33.0, 33.0, 26.0, 28.0, 31.0, 45.0, 36.0, 35.0, 42.0, 39.0, 36.0, 40.0, 34.0, 34.0, 44.0, 20.0, 29.0, 35.0, 26.0, 22.0, 20.0, 17.0, 20.0, 18.0, 11.0, 9.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.33807373046875, -4.1995849609375, -4.06109619140625, -3.922607421875, -3.78411865234375, -3.6456298828125, -3.50714111328125, -3.36865234375, -3.23016357421875, -3.0916748046875, -2.95318603515625, -2.814697265625, -2.67620849609375, -2.5377197265625, -2.39923095703125, -2.2607421875, -2.12225341796875, -1.9837646484375, -1.84527587890625, -1.706787109375, -1.56829833984375, -1.4298095703125, -1.29132080078125, -1.15283203125, -1.01434326171875, -0.8758544921875, -0.73736572265625, -0.598876953125, -0.46038818359375, -0.3218994140625, -0.18341064453125, -0.044921875, 0.09356689453125, 0.2320556640625, 0.37054443359375, 0.509033203125, 0.64752197265625, 0.7860107421875, 0.92449951171875, 1.06298828125, 1.20147705078125, 1.3399658203125, 1.47845458984375, 1.616943359375, 1.75543212890625, 1.8939208984375, 2.03240966796875, 2.1708984375, 2.30938720703125, 2.4478759765625, 2.58636474609375, 2.724853515625, 2.86334228515625, 3.0018310546875, 3.14031982421875, 3.27880859375, 3.41729736328125, 3.5557861328125, 3.69427490234375, 3.832763671875, 3.97125244140625, 4.1097412109375, 4.24822998046875, 4.38671875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 9.0, 17.0, 21.0, 32.0, 42.0, 73.0, 146.0, 194.0, 299.0, 454.0, 654.0, 1106.0, 1677.0, 2689.0, 4275.0, 7199.0, 12404.0, 22600.0, 42509.0, 90234.0, 231985.0, 351544.0, 144354.0, 61709.0, 30555.0, 17060.0, 9698.0, 5614.0, 3417.0, 2161.0, 1378.0, 850.0, 555.0, 349.0, 220.0, 150.0, 102.0, 63.0, 61.0, 29.0, 27.0, 17.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.26171875, -3.160614013671875, -3.05950927734375, -2.958404541015625, -2.8572998046875, -2.756195068359375, -2.65509033203125, -2.553985595703125, -2.452880859375, -2.351776123046875, -2.25067138671875, -2.149566650390625, -2.0484619140625, -1.947357177734375, -1.84625244140625, -1.745147705078125, -1.64404296875, -1.542938232421875, -1.44183349609375, -1.340728759765625, -1.2396240234375, -1.138519287109375, -1.03741455078125, -0.936309814453125, -0.835205078125, -0.734100341796875, -0.63299560546875, -0.531890869140625, -0.4307861328125, -0.329681396484375, -0.22857666015625, -0.127471923828125, -0.0263671875, 0.074737548828125, 0.17584228515625, 0.276947021484375, 0.3780517578125, 0.479156494140625, 0.58026123046875, 0.681365966796875, 0.782470703125, 0.883575439453125, 0.98468017578125, 1.085784912109375, 1.1868896484375, 1.287994384765625, 1.38909912109375, 1.490203857421875, 1.59130859375, 1.692413330078125, 1.79351806640625, 1.894622802734375, 1.9957275390625, 2.096832275390625, 2.19793701171875, 2.299041748046875, 2.400146484375, 2.501251220703125, 2.60235595703125, 2.703460693359375, 2.8045654296875, 2.905670166015625, 3.00677490234375, 3.107879638671875, 3.208984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 13.0, 10.0, 18.0, 32.0, 23.0, 29.0, 32.0, 38.0, 38.0, 42.0, 71.0, 90.0, 94.0, 360.0, 1535.0, 130.0, 84.0, 58.0, 61.0, 53.0, 46.0, 25.0, 28.0, 29.0, 25.0, 13.0, 12.0, 12.0, 15.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.46875, -20.820068359375, -20.17138671875, -19.522705078125, -18.8740234375, -18.225341796875, -17.57666015625, -16.927978515625, -16.279296875, -15.630615234375, -14.98193359375, -14.333251953125, -13.6845703125, -13.035888671875, -12.38720703125, -11.738525390625, -11.08984375, -10.441162109375, -9.79248046875, -9.143798828125, -8.4951171875, -7.846435546875, -7.19775390625, -6.549072265625, -5.900390625, -5.251708984375, -4.60302734375, -3.954345703125, -3.3056640625, -2.656982421875, -2.00830078125, -1.359619140625, -0.7109375, -0.062255859375, 0.58642578125, 1.235107421875, 1.8837890625, 2.532470703125, 3.18115234375, 3.829833984375, 4.478515625, 5.127197265625, 5.77587890625, 6.424560546875, 7.0732421875, 7.721923828125, 8.37060546875, 9.019287109375, 9.66796875, 10.316650390625, 10.96533203125, 11.614013671875, 12.2626953125, 12.911376953125, 13.56005859375, 14.208740234375, 14.857421875, 15.506103515625, 16.15478515625, 16.803466796875, 17.4521484375, 18.100830078125, 18.74951171875, 19.398193359375, 20.046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 11.0, 11.0, 24.0, 24.0, 53.0, 86.0, 124.0, 250.0, 538.0, 3185.0, 3102626.0, 37066.0, 931.0, 312.0, 155.0, 122.0, 49.0, 40.0, 32.0, 15.0, 13.0, 13.0, 3.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.03125, -57.50146484375, -54.9716796875, -52.44189453125, -49.912109375, -47.38232421875, -44.8525390625, -42.32275390625, -39.79296875, -37.26318359375, -34.7333984375, -32.20361328125, -29.673828125, -27.14404296875, -24.6142578125, -22.08447265625, -19.5546875, -17.02490234375, -14.4951171875, -11.96533203125, -9.435546875, -6.90576171875, -4.3759765625, -1.84619140625, 0.68359375, 3.21337890625, 5.7431640625, 8.27294921875, 10.802734375, 13.33251953125, 15.8623046875, 18.39208984375, 20.921875, 23.45166015625, 25.9814453125, 28.51123046875, 31.041015625, 33.57080078125, 36.1005859375, 38.63037109375, 41.16015625, 43.68994140625, 46.2197265625, 48.74951171875, 51.279296875, 53.80908203125, 56.3388671875, 58.86865234375, 61.3984375, 63.92822265625, 66.4580078125, 68.98779296875, 71.517578125, 74.04736328125, 76.5771484375, 79.10693359375, 81.63671875, 84.16650390625, 86.6962890625, 89.22607421875, 91.755859375, 94.28564453125, 96.8154296875, 99.34521484375, 101.875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 29.0, 330.0, 581.0, 73.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.201271057128906, -27.761735916137695, -23.322200775146484, -18.88266372680664, -14.44312858581543, -10.003593444824219, -5.564056396484375, -1.124521255493164, 3.315013885498047, 7.754549503326416, 12.194085121154785, 16.633621215820312, 21.073156356811523, 25.512691497802734, 29.952228546142578, 34.391761779785156, 38.831298828125, 43.270835876464844, 47.71036911010742, 52.149906158447266, 56.589439392089844, 61.02897644042969, 65.46851348876953, 69.90805053710938, 74.34757995605469, 78.78711700439453, 83.22665405273438, 87.66618347167969, 92.10572052001953, 96.54525756835938, 100.98479461669922, 105.42433166503906, 109.86386108398438, 114.30339813232422, 118.74293518066406, 123.18246459960938, 127.62200164794922, 132.06153869628906, 136.50106811523438, 140.94061279296875, 145.38014221191406, 149.81967163085938, 154.25921630859375, 158.69874572753906, 163.13829040527344, 167.57781982421875, 172.01736450195312, 176.45689392089844, 180.89642333984375, 185.33595275878906, 189.77549743652344, 194.21502685546875, 198.65457153320312, 203.09410095214844, 207.53363037109375, 211.97317504882812, 216.4127197265625, 220.8522491455078, 225.2917938232422, 229.7313232421875, 234.17086791992188, 238.6103973388672, 243.0499267578125, 247.48947143554688, 251.9290008544922]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 12.0, 22.0, 18.0, 19.0, 22.0, 22.0, 35.0, 34.0, 45.0, 42.0, 52.0, 52.0, 60.0, 55.0, 45.0, 66.0, 47.0, 43.0, 31.0, 33.0, 33.0, 36.0, 29.0, 27.0, 22.0, 16.0, 17.0, 20.0, 6.0, 10.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-67.90605163574219, -66.08020782470703, -64.25436401367188, -62.42851638793945, -60.6026725769043, -58.77682876586914, -56.95098114013672, -55.12513732910156, -53.299293518066406, -51.47344970703125, -49.647605895996094, -47.82175827026367, -45.995914459228516, -44.17007064819336, -42.34422302246094, -40.51837921142578, -38.692535400390625, -36.86669158935547, -35.04084777832031, -33.21500015258789, -31.389156341552734, -29.563312530517578, -27.73746681213379, -25.91162109375, -24.085777282714844, -22.259933471679688, -20.4340877532959, -18.60824203491211, -16.782398223876953, -14.95655345916748, -13.130708694458008, -11.304863929748535, -9.479019165039062, -7.65317440032959, -5.827329635620117, -4.0014848709106445, -2.175640106201172, -0.3497953414916992, 1.4760494232177734, 3.301894187927246, 5.127738952636719, 6.953583717346191, 8.779428482055664, 10.605273246765137, 12.43111801147461, 14.256962776184082, 16.082807540893555, 17.908653259277344, 19.7344970703125, 21.560340881347656, 23.386186599731445, 25.212032318115234, 27.03787612915039, 28.863719940185547, 30.689565658569336, 32.515411376953125, 34.34125518798828, 36.16709899902344, 37.992942810058594, 39.818790435791016, 41.64463424682617, 43.47047805786133, 45.29632568359375, 47.122169494628906, 48.94801330566406]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 6.0, 3.0, 6.0, 14.0, 10.0, 16.0, 11.0, 15.0, 28.0, 21.0, 16.0, 23.0, 28.0, 29.0, 24.0, 36.0, 31.0, 35.0, 38.0, 35.0, 36.0, 43.0, 43.0, 29.0, 34.0, 38.0, 34.0, 40.0, 35.0, 29.0, 26.0, 25.0, 19.0, 23.0, 21.0, 19.0, 16.0, 15.0, 11.0, 3.0, 9.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.78125, -4.6339111328125, -4.486572265625, -4.3392333984375, -4.19189453125, -4.0445556640625, -3.897216796875, -3.7498779296875, -3.6025390625, -3.4552001953125, -3.307861328125, -3.1605224609375, -3.01318359375, -2.8658447265625, -2.718505859375, -2.5711669921875, -2.423828125, -2.2764892578125, -2.129150390625, -1.9818115234375, -1.83447265625, -1.6871337890625, -1.539794921875, -1.3924560546875, -1.2451171875, -1.0977783203125, -0.950439453125, -0.8031005859375, -0.65576171875, -0.5084228515625, -0.361083984375, -0.2137451171875, -0.06640625, 0.0809326171875, 0.228271484375, 0.3756103515625, 0.52294921875, 0.6702880859375, 0.817626953125, 0.9649658203125, 1.1123046875, 1.2596435546875, 1.406982421875, 1.5543212890625, 1.70166015625, 1.8489990234375, 1.996337890625, 2.1436767578125, 2.291015625, 2.4383544921875, 2.585693359375, 2.7330322265625, 2.88037109375, 3.0277099609375, 3.175048828125, 3.3223876953125, 3.4697265625, 3.6170654296875, 3.764404296875, 3.9117431640625, 4.05908203125, 4.2064208984375, 4.353759765625, 4.5010986328125, 4.6484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 8.0, 6.0, 12.0, 14.0, 23.0, 24.0, 45.0, 44.0, 61.0, 80.0, 115.0, 164.0, 264.0, 443.0, 758.0, 1625.0, 3925.0, 10984.0, 33767.0, 131301.0, 632937.0, 1739036.0, 1237334.0, 303725.0, 66714.0, 19009.0, 6655.0, 2512.0, 1119.0, 527.0, 310.0, 203.0, 134.0, 102.0, 60.0, 61.0, 41.0, 29.0, 23.0, 19.0, 14.0, 13.0, 9.0, 5.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0], "bins": [-8.796875, -8.5509033203125, -8.304931640625, -8.0589599609375, -7.81298828125, -7.5670166015625, -7.321044921875, -7.0750732421875, -6.8291015625, -6.5831298828125, -6.337158203125, -6.0911865234375, -5.84521484375, -5.5992431640625, -5.353271484375, -5.1072998046875, -4.861328125, -4.6153564453125, -4.369384765625, -4.1234130859375, -3.87744140625, -3.6314697265625, -3.385498046875, -3.1395263671875, -2.8935546875, -2.6475830078125, -2.401611328125, -2.1556396484375, -1.90966796875, -1.6636962890625, -1.417724609375, -1.1717529296875, -0.92578125, -0.6798095703125, -0.433837890625, -0.1878662109375, 0.05810546875, 0.3040771484375, 0.550048828125, 0.7960205078125, 1.0419921875, 1.2879638671875, 1.533935546875, 1.7799072265625, 2.02587890625, 2.2718505859375, 2.517822265625, 2.7637939453125, 3.009765625, 3.2557373046875, 3.501708984375, 3.7476806640625, 3.99365234375, 4.2396240234375, 4.485595703125, 4.7315673828125, 4.9775390625, 5.2235107421875, 5.469482421875, 5.7154541015625, 5.96142578125, 6.2073974609375, 6.453369140625, 6.6993408203125, 6.9453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 12.0, 26.0, 40.0, 87.0, 135.0, 231.0, 377.0, 624.0, 810.0, 653.0, 421.0, 276.0, 141.0, 99.0, 60.0, 27.0, 26.0, 10.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.25, -30.5789794921875, -29.907958984375, -29.2369384765625, -28.56591796875, -27.8948974609375, -27.223876953125, -26.5528564453125, -25.8818359375, -25.2108154296875, -24.539794921875, -23.8687744140625, -23.19775390625, -22.5267333984375, -21.855712890625, -21.1846923828125, -20.513671875, -19.8426513671875, -19.171630859375, -18.5006103515625, -17.82958984375, -17.1585693359375, -16.487548828125, -15.8165283203125, -15.1455078125, -14.4744873046875, -13.803466796875, -13.1324462890625, -12.46142578125, -11.7904052734375, -11.119384765625, -10.4483642578125, -9.77734375, -9.1063232421875, -8.435302734375, -7.7642822265625, -7.09326171875, -6.4222412109375, -5.751220703125, -5.0802001953125, -4.4091796875, -3.7381591796875, -3.067138671875, -2.3961181640625, -1.72509765625, -1.0540771484375, -0.383056640625, 0.2879638671875, 0.958984375, 1.6300048828125, 2.301025390625, 2.9720458984375, 3.64306640625, 4.3140869140625, 4.985107421875, 5.6561279296875, 6.3271484375, 6.9981689453125, 7.669189453125, 8.3402099609375, 9.01123046875, 9.6822509765625, 10.353271484375, 11.0242919921875, 11.6953125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 16.0, 15.0, 27.0, 39.0, 52.0, 84.0, 145.0, 211.0, 369.0, 764.0, 4324.0, 339371.0, 3807670.0, 38388.0, 1595.0, 467.0, 259.0, 168.0, 104.0, 63.0, 48.0, 25.0, 22.0, 14.0, 12.0, 11.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -30.64599609375, -29.1357421875, -27.62548828125, -26.115234375, -24.60498046875, -23.0947265625, -21.58447265625, -20.07421875, -18.56396484375, -17.0537109375, -15.54345703125, -14.033203125, -12.52294921875, -11.0126953125, -9.50244140625, -7.9921875, -6.48193359375, -4.9716796875, -3.46142578125, -1.951171875, -0.44091796875, 1.0693359375, 2.57958984375, 4.08984375, 5.60009765625, 7.1103515625, 8.62060546875, 10.130859375, 11.64111328125, 13.1513671875, 14.66162109375, 16.171875, 17.68212890625, 19.1923828125, 20.70263671875, 22.212890625, 23.72314453125, 25.2333984375, 26.74365234375, 28.25390625, 29.76416015625, 31.2744140625, 32.78466796875, 34.294921875, 35.80517578125, 37.3154296875, 38.82568359375, 40.3359375, 41.84619140625, 43.3564453125, 44.86669921875, 46.376953125, 47.88720703125, 49.3974609375, 50.90771484375, 52.41796875, 53.92822265625, 55.4384765625, 56.94873046875, 58.458984375, 59.96923828125, 61.4794921875, 62.98974609375, 64.5]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 45.0, 83.0, 157.0, 246.0, 204.0, 164.0, 60.0, 34.0, 7.0, 4.0, 3.0, 0.0, 1.0], "bins": [-206.35142517089844, -202.59034729003906, -198.82925415039062, -195.06817626953125, -191.30709838867188, -187.54600524902344, -183.78492736816406, -180.0238494873047, -176.26275634765625, -172.50167846679688, -168.74058532714844, -164.97950744628906, -161.2184295654297, -157.45733642578125, -153.69625854492188, -149.9351806640625, -146.17410278320312, -142.41302490234375, -138.6519317626953, -134.89085388183594, -131.12977600097656, -127.36869049072266, -123.60760498046875, -119.84652709960938, -116.08543395996094, -112.32434844970703, -108.56327056884766, -104.80218505859375, -101.04109954833984, -97.28002166748047, -93.51893615722656, -89.75785827636719, -85.99677276611328, -82.23568725585938, -78.474609375, -74.7135238647461, -70.95243835449219, -67.19136047363281, -63.430274963378906, -59.669193267822266, -55.908111572265625, -52.147029876708984, -48.38594436645508, -44.62486267089844, -40.8637809753418, -37.102699279785156, -33.34161376953125, -29.58053207397461, -25.819446563720703, -22.05836296081543, -18.29728126525879, -14.536197662353516, -10.775115013122559, -7.014032363891602, -3.252948760986328, 0.5081329345703125, 4.269216537475586, 8.030299186706543, 11.7913818359375, 15.552465438842773, 19.313549041748047, 23.074630737304688, 26.83571434020996, 30.5967960357666, 34.357879638671875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 0.0, 3.0, 4.0, 3.0, 7.0, 11.0, 4.0, 7.0, 18.0, 20.0, 14.0, 18.0, 35.0, 17.0, 31.0, 35.0, 29.0, 37.0, 38.0, 41.0, 45.0, 32.0, 43.0, 36.0, 30.0, 42.0, 52.0, 38.0, 34.0, 28.0, 32.0, 21.0, 23.0, 24.0, 21.0, 24.0, 21.0, 14.0, 13.0, 10.0, 12.0, 6.0, 6.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.032928466796875, -39.76377487182617, -38.4946174621582, -37.2254638671875, -35.95630645751953, -34.68715286254883, -33.417999267578125, -32.148841857910156, -30.879688262939453, -29.610532760620117, -28.34137725830078, -27.072223663330078, -25.803068161010742, -24.533912658691406, -23.26475715637207, -21.995601654052734, -20.7264461517334, -19.457290649414062, -18.188135147094727, -16.91897964477539, -15.649826049804688, -14.380670547485352, -13.111515045166016, -11.842360496520996, -10.57320499420166, -9.304049491882324, -8.034894943237305, -6.765739440917969, -5.496584415435791, -4.227429389953613, -2.9582738876342773, -1.6891193389892578, -0.4199638366699219, 0.8491913080215454, 2.1183464527130127, 3.3875017166137695, 4.656656742095947, 5.925811767578125, 7.194967269897461, 8.46412181854248, 9.733277320861816, 11.002432823181152, 12.271587371826172, 13.540742874145508, 14.809898376464844, 16.079051971435547, 17.348209381103516, 18.61736297607422, 19.886518478393555, 21.15567398071289, 22.424829483032227, 23.693984985351562, 24.963138580322266, 26.2322940826416, 27.501449584960938, 28.77060317993164, 30.03976058959961, 31.308916091918945, 32.57807159423828, 33.847225189208984, 35.11638259887695, 36.385536193847656, 37.654693603515625, 38.92384719848633, 40.19300079345703]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 10.0, 14.0, 9.0, 23.0, 14.0, 26.0, 29.0, 19.0, 23.0, 25.0, 29.0, 34.0, 36.0, 31.0, 46.0, 37.0, 43.0, 45.0, 34.0, 35.0, 34.0, 40.0, 36.0, 38.0, 36.0, 25.0, 29.0, 26.0, 20.0, 22.0, 23.0, 18.0, 10.0, 6.0, 10.0, 8.0, 4.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.56640625, -5.4140625, -5.26171875, -5.109375, -4.95703125, -4.8046875, -4.65234375, -4.5, -4.34765625, -4.1953125, -4.04296875, -3.890625, -3.73828125, -3.5859375, -3.43359375, -3.28125, -3.12890625, -2.9765625, -2.82421875, -2.671875, -2.51953125, -2.3671875, -2.21484375, -2.0625, -1.91015625, -1.7578125, -1.60546875, -1.453125, -1.30078125, -1.1484375, -0.99609375, -0.84375, -0.69140625, -0.5390625, -0.38671875, -0.234375, -0.08203125, 0.0703125, 0.22265625, 0.375, 0.52734375, 0.6796875, 0.83203125, 0.984375, 1.13671875, 1.2890625, 1.44140625, 1.59375, 1.74609375, 1.8984375, 2.05078125, 2.203125, 2.35546875, 2.5078125, 2.66015625, 2.8125, 2.96484375, 3.1171875, 3.26953125, 3.421875, 3.57421875, 3.7265625, 3.87890625, 4.03125, 4.18359375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 19.0, 12.0, 27.0, 36.0, 58.0, 86.0, 133.0, 179.0, 284.0, 397.0, 525.0, 721.0, 1086.0, 1457.0, 1975.0, 2688.0, 3865.0, 5195.0, 7367.0, 10664.0, 15310.0, 21627.0, 31565.0, 44867.0, 63659.0, 88710.0, 117853.0, 138522.0, 129624.0, 103821.0, 76489.0, 53813.0, 37525.0, 26218.0, 18315.0, 12669.0, 8981.0, 6366.0, 4556.0, 3215.0, 2277.0, 1658.0, 1174.0, 900.0, 647.0, 442.0, 297.0, 228.0, 165.0, 96.0, 49.0, 64.0, 27.0, 23.0, 10.0, 11.0, 6.0, 6.0, 0.0, 2.0, 2.0], "bins": [-0.3740234375, -0.3618621826171875, -0.349700927734375, -0.3375396728515625, -0.32537841796875, -0.3132171630859375, -0.301055908203125, -0.2888946533203125, -0.2767333984375, -0.2645721435546875, -0.252410888671875, -0.2402496337890625, -0.22808837890625, -0.2159271240234375, -0.203765869140625, -0.1916046142578125, -0.179443359375, -0.1672821044921875, -0.155120849609375, -0.1429595947265625, -0.13079833984375, -0.1186370849609375, -0.106475830078125, -0.0943145751953125, -0.0821533203125, -0.0699920654296875, -0.057830810546875, -0.0456695556640625, -0.03350830078125, -0.0213470458984375, -0.009185791015625, 0.0029754638671875, 0.01513671875, 0.0272979736328125, 0.039459228515625, 0.0516204833984375, 0.06378173828125, 0.0759429931640625, 0.088104248046875, 0.1002655029296875, 0.1124267578125, 0.1245880126953125, 0.136749267578125, 0.1489105224609375, 0.16107177734375, 0.1732330322265625, 0.185394287109375, 0.1975555419921875, 0.209716796875, 0.2218780517578125, 0.234039306640625, 0.2462005615234375, 0.25836181640625, 0.2705230712890625, 0.282684326171875, 0.2948455810546875, 0.3070068359375, 0.3191680908203125, 0.331329345703125, 0.3434906005859375, 0.35565185546875, 0.3678131103515625, 0.379974365234375, 0.3921356201171875, 0.404296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 6.0, 15.0, 11.0, 23.0, 17.0, 20.0, 24.0, 31.0, 31.0, 29.0, 27.0, 21.0, 34.0, 41.0, 39.0, 37.0, 29.0, 1066.0, 39.0, 32.0, 54.0, 37.0, 37.0, 48.0, 33.0, 20.0, 28.0, 29.0, 27.0, 15.0, 20.0, 20.0, 11.0, 9.0, 9.0, 13.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-3.373046875, -3.272674560546875, -3.17230224609375, -3.071929931640625, -2.9715576171875, -2.871185302734375, -2.77081298828125, -2.670440673828125, -2.570068359375, -2.469696044921875, -2.36932373046875, -2.268951416015625, -2.1685791015625, -2.068206787109375, -1.96783447265625, -1.867462158203125, -1.76708984375, -1.666717529296875, -1.56634521484375, -1.465972900390625, -1.3656005859375, -1.265228271484375, -1.16485595703125, -1.064483642578125, -0.964111328125, -0.863739013671875, -0.76336669921875, -0.662994384765625, -0.5626220703125, -0.462249755859375, -0.36187744140625, -0.261505126953125, -0.1611328125, -0.060760498046875, 0.03961181640625, 0.139984130859375, 0.2403564453125, 0.340728759765625, 0.44110107421875, 0.541473388671875, 0.641845703125, 0.742218017578125, 0.84259033203125, 0.942962646484375, 1.0433349609375, 1.143707275390625, 1.24407958984375, 1.344451904296875, 1.44482421875, 1.545196533203125, 1.64556884765625, 1.745941162109375, 1.8463134765625, 1.946685791015625, 2.04705810546875, 2.147430419921875, 2.247802734375, 2.348175048828125, 2.44854736328125, 2.548919677734375, 2.6492919921875, 2.749664306640625, 2.85003662109375, 2.950408935546875, 3.05078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 13.0, 15.0, 25.0, 38.0, 82.0, 100.0, 114.0, 232.0, 305.0, 504.0, 763.0, 1072.0, 1756.0, 2502.0, 3884.0, 6044.0, 9121.0, 14090.0, 22107.0, 33491.0, 49602.0, 71837.0, 97632.0, 123333.0, 1184739.0, 128277.0, 104852.0, 78440.0, 55073.0, 36695.0, 24860.0, 15846.0, 10350.0, 6627.0, 4390.0, 2824.0, 1827.0, 1204.0, 821.0, 539.0, 392.0, 246.0, 157.0, 105.0, 78.0, 45.0, 35.0, 25.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3146781921386719, -0.30440521240234375, -0.2941322326660156, -0.2838592529296875, -0.2735862731933594, -0.26331329345703125, -0.2530403137207031, -0.242767333984375, -0.23249435424804688, -0.22222137451171875, -0.21194839477539062, -0.2016754150390625, -0.19140243530273438, -0.18112945556640625, -0.17085647583007812, -0.16058349609375, -0.15031051635742188, -0.14003753662109375, -0.12976455688476562, -0.1194915771484375, -0.10921859741210938, -0.09894561767578125, -0.08867263793945312, -0.078399658203125, -0.06812667846679688, -0.05785369873046875, -0.047580718994140625, -0.0373077392578125, -0.027034759521484375, -0.01676177978515625, -0.006488800048828125, 0.0037841796875, 0.014057159423828125, 0.02433013916015625, 0.034603118896484375, 0.0448760986328125, 0.055149078369140625, 0.06542205810546875, 0.07569503784179688, 0.085968017578125, 0.09624099731445312, 0.10651397705078125, 0.11678695678710938, 0.1270599365234375, 0.13733291625976562, 0.14760589599609375, 0.15787887573242188, 0.16815185546875, 0.17842483520507812, 0.18869781494140625, 0.19897079467773438, 0.2092437744140625, 0.21951675415039062, 0.22978973388671875, 0.24006271362304688, 0.250335693359375, 0.2606086730957031, 0.27088165283203125, 0.2811546325683594, 0.2914276123046875, 0.3017005920410156, 0.31197357177734375, 0.3222465515136719, 0.33251953125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 3.0, 11.0, 9.0, 12.0, 12.0, 26.0, 9.0, 19.0, 31.0, 33.0, 48.0, 43.0, 48.0, 69.0, 65.0, 40.0, 60.0, 61.0, 71.0, 43.0, 43.0, 57.0, 36.0, 26.0, 26.0, 14.0, 19.0, 9.0, 9.0, 14.0, 4.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002086639404296875, -0.0020099878311157227, -0.0019333362579345703, -0.001856684684753418, -0.0017800331115722656, -0.0017033815383911133, -0.001626729965209961, -0.0015500783920288086, -0.0014734268188476562, -0.001396775245666504, -0.0013201236724853516, -0.0012434720993041992, -0.0011668205261230469, -0.0010901689529418945, -0.0010135173797607422, -0.0009368658065795898, -0.0008602142333984375, -0.0007835626602172852, -0.0007069110870361328, -0.0006302595138549805, -0.0005536079406738281, -0.0004769563674926758, -0.00040030479431152344, -0.0003236532211303711, -0.00024700164794921875, -0.0001703500747680664, -9.369850158691406e-05, -1.704692840576172e-05, 5.9604644775390625e-05, 0.00013625621795654297, 0.0002129077911376953, 0.00028955936431884766, 0.0003662109375, 0.00044286251068115234, 0.0005195140838623047, 0.000596165657043457, 0.0006728172302246094, 0.0007494688034057617, 0.0008261203765869141, 0.0009027719497680664, 0.0009794235229492188, 0.001056075096130371, 0.0011327266693115234, 0.0012093782424926758, 0.0012860298156738281, 0.0013626813888549805, 0.0014393329620361328, 0.0015159845352172852, 0.0015926361083984375, 0.0016692876815795898, 0.0017459392547607422, 0.0018225908279418945, 0.0018992424011230469, 0.0019758939743041992, 0.0020525455474853516, 0.002129197120666504, 0.0022058486938476562, 0.0022825002670288086, 0.002359151840209961, 0.0024358034133911133, 0.0025124549865722656, 0.002589106559753418, 0.0026657581329345703, 0.0027424097061157227, 0.002819061279296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 4.0, 7.0, 4.0, 12.0, 16.0, 22.0, 24.0, 30.0, 51.0, 68.0, 127.0, 221.0, 494.0, 2010.0, 687397.0, 355523.0, 1538.0, 419.0, 201.0, 118.0, 67.0, 54.0, 40.0, 16.0, 20.0, 15.0, 10.0, 14.0, 4.0, 12.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06657648086547852, -0.06467151641845703, -0.06276655197143555, -0.06086158752441406, -0.05895662307739258, -0.057051658630371094, -0.05514669418334961, -0.053241729736328125, -0.05133676528930664, -0.049431800842285156, -0.04752683639526367, -0.04562187194824219, -0.0437169075012207, -0.04181194305419922, -0.039906978607177734, -0.03800201416015625, -0.036097049713134766, -0.03419208526611328, -0.0322871208190918, -0.030382156372070312, -0.028477191925048828, -0.026572227478027344, -0.02466726303100586, -0.022762298583984375, -0.02085733413696289, -0.018952369689941406, -0.017047405242919922, -0.015142440795898438, -0.013237476348876953, -0.011332511901855469, -0.009427547454833984, -0.0075225830078125, -0.005617618560791016, -0.0037126541137695312, -0.0018076896667480469, 9.72747802734375e-05, 0.002002239227294922, 0.003907203674316406, 0.005812168121337891, 0.007717132568359375, 0.00962209701538086, 0.011527061462402344, 0.013432025909423828, 0.015336990356445312, 0.017241954803466797, 0.01914691925048828, 0.021051883697509766, 0.02295684814453125, 0.024861812591552734, 0.02676677703857422, 0.028671741485595703, 0.030576705932617188, 0.03248167037963867, 0.034386634826660156, 0.03629159927368164, 0.038196563720703125, 0.04010152816772461, 0.042006492614746094, 0.04391145706176758, 0.04581642150878906, 0.04772138595581055, 0.04962635040283203, 0.051531314849853516, 0.053436279296875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 8.0, 214.0, 663.0, 128.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02327081374824047, -0.022850975394248962, -0.022431137040257454, -0.022011298686265945, -0.021591458469629288, -0.02117162011563778, -0.02075178176164627, -0.020331943407654762, -0.019912105053663254, -0.019492266699671745, -0.019072428345680237, -0.01865258999168873, -0.01823274977505207, -0.017812911421060562, -0.017393073067069054, -0.016973234713077545, -0.016553396359086037, -0.016133558005094528, -0.01571371965110302, -0.015293880365788937, -0.014874042011797428, -0.014454202726483345, -0.014034364372491837, -0.013614526018500328, -0.013194686733186245, -0.012774848379194736, -0.012355009093880653, -0.011935170739889145, -0.011515332385897636, -0.011095494031906128, -0.010675654746592045, -0.010255816392600536, -0.009835978038609028, -0.00941613968461752, -0.008996300399303436, -0.008576462045311928, -0.00815662369132042, -0.0077367848716676235, -0.007316946052014828, -0.006897107698023319, -0.0064772688783705235, -0.006057430058717728, -0.005637591704726219, -0.005217752885073423, -0.004797914531081915, -0.004378075711429119, -0.003958237357437611, -0.003538398537784815, -0.0031185599509626627, -0.0026987213641405106, -0.0022788827773183584, -0.0018590440740808845, -0.0014392054872587323, -0.0010193667840212584, -0.0005995281971991062, -0.00017968961037695408, 0.00024014897644519806, 0.0006599875632673502, 0.0010798261500895023, 0.0014996648533269763, 0.0019195034401491284, 0.0023393421433866024, 0.0027591807302087545, 0.0031790193170309067, 0.003598857903853059]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 15.0, 20.0, 17.0, 14.0, 22.0, 21.0, 23.0, 34.0, 37.0, 43.0, 52.0, 54.0, 60.0, 68.0, 54.0, 53.0, 47.0, 50.0, 36.0, 48.0, 42.0, 26.0, 30.0, 31.0, 19.0, 20.0, 15.0, 13.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001281440258026123, -0.001228530891239643, -0.0011756215244531631, -0.0011227121576666832, -0.0010698027908802032, -0.0010168934240937233, -0.0009639840573072433, -0.0009110746905207634, -0.0008581653237342834, -0.0008052559569478035, -0.0007523465901613235, -0.0006994372233748436, -0.0006465278565883636, -0.0005936184898018837, -0.0005407091230154037, -0.0004877997562289238, -0.00043489038944244385, -0.0003819810226559639, -0.00032907165586948395, -0.000276162289083004, -0.00022325292229652405, -0.0001703435555100441, -0.00011743418872356415, -6.45248219370842e-05, -1.1615455150604248e-05, 4.12939116358757e-05, 9.420327842235565e-05, 0.0001471126452088356, 0.00020002201199531555, 0.0002529313787817955, 0.00030584074556827545, 0.0003587501123547554, 0.00041165947914123535, 0.0004645688459277153, 0.0005174782127141953, 0.0005703875795006752, 0.0006232969462871552, 0.0006762063130736351, 0.000729115679860115, 0.000782025046646595, 0.000834934413433075, 0.0008878437802195549, 0.0009407531470060349, 0.0009936625137925148, 0.0010465718805789948, 0.0010994812473654747, 0.0011523906141519547, 0.0012052999809384346, 0.0012582093477249146, 0.0013111187145113945, 0.0013640280812978745, 0.0014169374480843544, 0.0014698468148708344, 0.0015227561816573143, 0.0015756655484437943, 0.0016285749152302742, 0.0016814842820167542, 0.001734393648803234, 0.001787303015589714, 0.001840212382376194, 0.001893121749162674, 0.001946031115949154, 0.001998940482735634, 0.002051849849522114, 0.0021047592163085938]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 10.0, 14.0, 9.0, 23.0, 14.0, 26.0, 29.0, 19.0, 23.0, 25.0, 29.0, 34.0, 36.0, 31.0, 46.0, 37.0, 43.0, 45.0, 34.0, 35.0, 34.0, 40.0, 36.0, 38.0, 36.0, 25.0, 29.0, 26.0, 20.0, 22.0, 23.0, 18.0, 10.0, 6.0, 10.0, 8.0, 4.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.56640625, -5.4140625, -5.26171875, -5.109375, -4.95703125, -4.8046875, -4.65234375, -4.5, -4.34765625, -4.1953125, -4.04296875, -3.890625, -3.73828125, -3.5859375, -3.43359375, -3.28125, -3.12890625, -2.9765625, -2.82421875, -2.671875, -2.51953125, -2.3671875, -2.21484375, -2.0625, -1.91015625, -1.7578125, -1.60546875, -1.453125, -1.30078125, -1.1484375, -0.99609375, -0.84375, -0.69140625, -0.5390625, -0.38671875, -0.234375, -0.08203125, 0.0703125, 0.22265625, 0.375, 0.52734375, 0.6796875, 0.83203125, 0.984375, 1.13671875, 1.2890625, 1.44140625, 1.59375, 1.74609375, 1.8984375, 2.05078125, 2.203125, 2.35546875, 2.5078125, 2.66015625, 2.8125, 2.96484375, 3.1171875, 3.26953125, 3.421875, 3.57421875, 3.7265625, 3.87890625, 4.03125, 4.18359375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 20.0, 29.0, 41.0, 55.0, 89.0, 171.0, 267.0, 459.0, 698.0, 1226.0, 2202.0, 3795.0, 7164.0, 13133.0, 24049.0, 46234.0, 90562.0, 201105.0, 314889.0, 173651.0, 80086.0, 40734.0, 21721.0, 11750.0, 6196.0, 3420.0, 1934.0, 1069.0, 663.0, 413.0, 260.0, 162.0, 111.0, 71.0, 35.0, 27.0, 16.0, 12.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.421875, -4.2969970703125, -4.172119140625, -4.0472412109375, -3.92236328125, -3.7974853515625, -3.672607421875, -3.5477294921875, -3.4228515625, -3.2979736328125, -3.173095703125, -3.0482177734375, -2.92333984375, -2.7984619140625, -2.673583984375, -2.5487060546875, -2.423828125, -2.2989501953125, -2.174072265625, -2.0491943359375, -1.92431640625, -1.7994384765625, -1.674560546875, -1.5496826171875, -1.4248046875, -1.2999267578125, -1.175048828125, -1.0501708984375, -0.92529296875, -0.8004150390625, -0.675537109375, -0.5506591796875, -0.42578125, -0.3009033203125, -0.176025390625, -0.0511474609375, 0.07373046875, 0.1986083984375, 0.323486328125, 0.4483642578125, 0.5732421875, 0.6981201171875, 0.822998046875, 0.9478759765625, 1.07275390625, 1.1976318359375, 1.322509765625, 1.4473876953125, 1.572265625, 1.6971435546875, 1.822021484375, 1.9468994140625, 2.07177734375, 2.1966552734375, 2.321533203125, 2.4464111328125, 2.5712890625, 2.6961669921875, 2.821044921875, 2.9459228515625, 3.07080078125, 3.1956787109375, 3.320556640625, 3.4454345703125, 3.5703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 5.0, 9.0, 5.0, 4.0, 11.0, 13.0, 16.0, 12.0, 24.0, 33.0, 24.0, 33.0, 43.0, 36.0, 56.0, 39.0, 68.0, 107.0, 213.0, 1482.0, 254.0, 112.0, 70.0, 65.0, 42.0, 47.0, 36.0, 28.0, 30.0, 26.0, 27.0, 11.0, 5.0, 8.0, 11.0, 5.0, 10.0, 5.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0625, -18.440185546875, -17.81787109375, -17.195556640625, -16.5732421875, -15.950927734375, -15.32861328125, -14.706298828125, -14.083984375, -13.461669921875, -12.83935546875, -12.217041015625, -11.5947265625, -10.972412109375, -10.35009765625, -9.727783203125, -9.10546875, -8.483154296875, -7.86083984375, -7.238525390625, -6.6162109375, -5.993896484375, -5.37158203125, -4.749267578125, -4.126953125, -3.504638671875, -2.88232421875, -2.260009765625, -1.6376953125, -1.015380859375, -0.39306640625, 0.229248046875, 0.8515625, 1.473876953125, 2.09619140625, 2.718505859375, 3.3408203125, 3.963134765625, 4.58544921875, 5.207763671875, 5.830078125, 6.452392578125, 7.07470703125, 7.697021484375, 8.3193359375, 8.941650390625, 9.56396484375, 10.186279296875, 10.80859375, 11.430908203125, 12.05322265625, 12.675537109375, 13.2978515625, 13.920166015625, 14.54248046875, 15.164794921875, 15.787109375, 16.409423828125, 17.03173828125, 17.654052734375, 18.2763671875, 18.898681640625, 19.52099609375, 20.143310546875, 20.765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 13.0, 10.0, 15.0, 20.0, 17.0, 16.0, 16.0, 38.0, 49.0, 58.0, 83.0, 110.0, 152.0, 201.0, 339.0, 573.0, 2346.0, 44153.0, 3058762.0, 34678.0, 2271.0, 544.0, 321.0, 243.0, 159.0, 110.0, 90.0, 46.0, 61.0, 37.0, 37.0, 24.0, 25.0, 17.0, 14.0, 9.0, 7.0, 8.0, 1.0, 2.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-48.09375, -46.69873046875, -45.3037109375, -43.90869140625, -42.513671875, -41.11865234375, -39.7236328125, -38.32861328125, -36.93359375, -35.53857421875, -34.1435546875, -32.74853515625, -31.353515625, -29.95849609375, -28.5634765625, -27.16845703125, -25.7734375, -24.37841796875, -22.9833984375, -21.58837890625, -20.193359375, -18.79833984375, -17.4033203125, -16.00830078125, -14.61328125, -13.21826171875, -11.8232421875, -10.42822265625, -9.033203125, -7.63818359375, -6.2431640625, -4.84814453125, -3.453125, -2.05810546875, -0.6630859375, 0.73193359375, 2.126953125, 3.52197265625, 4.9169921875, 6.31201171875, 7.70703125, 9.10205078125, 10.4970703125, 11.89208984375, 13.287109375, 14.68212890625, 16.0771484375, 17.47216796875, 18.8671875, 20.26220703125, 21.6572265625, 23.05224609375, 24.447265625, 25.84228515625, 27.2373046875, 28.63232421875, 30.02734375, 31.42236328125, 32.8173828125, 34.21240234375, 35.607421875, 37.00244140625, 38.3974609375, 39.79248046875, 41.1875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 11.0, 672.0, 333.0, 2.0], "bins": [-539.9373168945312, -531.2073974609375, -522.4774780273438, -513.74755859375, -505.0176696777344, -496.2877502441406, -487.557861328125, -478.82794189453125, -470.0980224609375, -461.36810302734375, -452.63818359375, -443.9082946777344, -435.1783752441406, -426.4484558105469, -417.71856689453125, -408.9886474609375, -400.25872802734375, -391.52880859375, -382.79888916015625, -374.0690002441406, -365.3390808105469, -356.6091613769531, -347.8792724609375, -339.14935302734375, -330.41943359375, -321.68951416015625, -312.9595947265625, -304.2297058105469, -295.4997863769531, -286.7698669433594, -278.03997802734375, -269.31005859375, -260.58013916015625, -251.8502197265625, -243.1203155517578, -234.39041137695312, -225.66049194335938, -216.93057250976562, -208.20066833496094, -199.47076416015625, -190.74082946777344, -182.01092529296875, -173.281005859375, -164.55108642578125, -155.82118225097656, -147.09127807617188, -138.36135864257812, -129.63143920898438, -120.90153503417969, -112.17162322998047, -103.44171142578125, -94.71179962158203, -85.98188781738281, -77.2519760131836, -68.52206420898438, -59.792152404785156, -51.06224060058594, -42.33232879638672, -33.6024169921875, -24.87250518798828, -16.142593383789062, -7.412681579589844, 1.317230224609375, 10.047142028808594, 18.777053833007812]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 10.0, 11.0, 6.0, 17.0, 13.0, 22.0, 23.0, 25.0, 24.0, 33.0, 31.0, 28.0, 31.0, 25.0, 34.0, 42.0, 45.0, 42.0, 42.0, 28.0, 43.0, 30.0, 35.0, 30.0, 28.0, 39.0, 28.0, 27.0, 21.0, 25.0, 22.0, 15.0, 18.0, 14.0, 8.0, 15.0, 11.0, 7.0, 6.0, 9.0, 9.0, 1.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.5994987487793, -41.27033233642578, -39.94116973876953, -38.612003326416016, -37.282840728759766, -35.95367431640625, -34.62451171875, -33.295345306396484, -31.9661808013916, -30.63701629638672, -29.307851791381836, -27.978687286376953, -26.649520874023438, -25.320358276367188, -23.991191864013672, -22.66202735900879, -21.332862854003906, -20.003698348999023, -18.67453384399414, -17.345369338989258, -16.016204833984375, -14.687039375305176, -13.357873916625977, -12.028709411621094, -10.699544906616211, -9.370380401611328, -8.041215896606445, -6.712050437927246, -5.382885932922363, -4.0537214279174805, -2.7245564460754395, -1.3953914642333984, -0.06622314453125, 1.262941598892212, 2.592106342315674, 3.9212710857391357, 5.250435829162598, 6.5796003341674805, 7.9087653160095215, 9.237930297851562, 10.567094802856445, 11.896259307861328, 13.225423812866211, 14.55458927154541, 15.883753776550293, 17.21291732788086, 18.542083740234375, 19.871248245239258, 21.20041275024414, 22.529577255249023, 23.858741760253906, 25.18790626525879, 26.517070770263672, 27.846237182617188, 29.17540168762207, 30.504566192626953, 31.833730697631836, 33.16289520263672, 34.492061614990234, 35.821224212646484, 37.150390625, 38.47955322265625, 39.808719635009766, 41.13788604736328, 42.46704864501953]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 10.0, 7.0, 8.0, 16.0, 19.0, 10.0, 17.0, 23.0, 21.0, 32.0, 24.0, 18.0, 27.0, 40.0, 29.0, 36.0, 42.0, 40.0, 45.0, 36.0, 30.0, 37.0, 34.0, 39.0, 36.0, 34.0, 32.0, 20.0, 31.0, 22.0, 24.0, 28.0, 21.0, 19.0, 13.0, 16.0, 10.0, 5.0, 9.0, 7.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0], "bins": [-5.71875, -5.56329345703125, -5.4078369140625, -5.25238037109375, -5.096923828125, -4.94146728515625, -4.7860107421875, -4.63055419921875, -4.47509765625, -4.31964111328125, -4.1641845703125, -4.00872802734375, -3.853271484375, -3.69781494140625, -3.5423583984375, -3.38690185546875, -3.2314453125, -3.07598876953125, -2.9205322265625, -2.76507568359375, -2.609619140625, -2.45416259765625, -2.2987060546875, -2.14324951171875, -1.98779296875, -1.83233642578125, -1.6768798828125, -1.52142333984375, -1.365966796875, -1.21051025390625, -1.0550537109375, -0.89959716796875, -0.744140625, -0.58868408203125, -0.4332275390625, -0.27777099609375, -0.122314453125, 0.03314208984375, 0.1885986328125, 0.34405517578125, 0.49951171875, 0.65496826171875, 0.8104248046875, 0.96588134765625, 1.121337890625, 1.27679443359375, 1.4322509765625, 1.58770751953125, 1.7431640625, 1.89862060546875, 2.0540771484375, 2.20953369140625, 2.364990234375, 2.52044677734375, 2.6759033203125, 2.83135986328125, 2.98681640625, 3.14227294921875, 3.2977294921875, 3.45318603515625, 3.608642578125, 3.76409912109375, 3.9195556640625, 4.07501220703125, 4.23046875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 10.0, 7.0, 9.0, 15.0, 16.0, 19.0, 29.0, 23.0, 32.0, 27.0, 41.0, 48.0, 79.0, 206.0, 733.0, 3477.0, 34246.0, 1073177.0, 2930158.0, 141337.0, 8493.0, 1328.0, 303.0, 123.0, 51.0, 42.0, 30.0, 30.0, 25.0, 29.0, 17.0, 19.0, 20.0, 13.0, 13.0, 5.0, 7.0, 7.0, 4.0, 2.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0], "bins": [-22.90625, -22.27392578125, -21.6416015625, -21.00927734375, -20.376953125, -19.74462890625, -19.1123046875, -18.47998046875, -17.84765625, -17.21533203125, -16.5830078125, -15.95068359375, -15.318359375, -14.68603515625, -14.0537109375, -13.42138671875, -12.7890625, -12.15673828125, -11.5244140625, -10.89208984375, -10.259765625, -9.62744140625, -8.9951171875, -8.36279296875, -7.73046875, -7.09814453125, -6.4658203125, -5.83349609375, -5.201171875, -4.56884765625, -3.9365234375, -3.30419921875, -2.671875, -2.03955078125, -1.4072265625, -0.77490234375, -0.142578125, 0.48974609375, 1.1220703125, 1.75439453125, 2.38671875, 3.01904296875, 3.6513671875, 4.28369140625, 4.916015625, 5.54833984375, 6.1806640625, 6.81298828125, 7.4453125, 8.07763671875, 8.7099609375, 9.34228515625, 9.974609375, 10.60693359375, 11.2392578125, 11.87158203125, 12.50390625, 13.13623046875, 13.7685546875, 14.40087890625, 15.033203125, 15.66552734375, 16.2978515625, 16.93017578125, 17.5625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 20.0, 18.0, 25.0, 29.0, 47.0, 64.0, 87.0, 108.0, 142.0, 178.0, 277.0, 337.0, 391.0, 424.0, 424.0, 373.0, 287.0, 209.0, 156.0, 122.0, 79.0, 78.0, 46.0, 34.0, 26.0, 19.0, 13.0, 17.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-14.4296875, -14.05615234375, -13.6826171875, -13.30908203125, -12.935546875, -12.56201171875, -12.1884765625, -11.81494140625, -11.44140625, -11.06787109375, -10.6943359375, -10.32080078125, -9.947265625, -9.57373046875, -9.2001953125, -8.82666015625, -8.453125, -8.07958984375, -7.7060546875, -7.33251953125, -6.958984375, -6.58544921875, -6.2119140625, -5.83837890625, -5.46484375, -5.09130859375, -4.7177734375, -4.34423828125, -3.970703125, -3.59716796875, -3.2236328125, -2.85009765625, -2.4765625, -2.10302734375, -1.7294921875, -1.35595703125, -0.982421875, -0.60888671875, -0.2353515625, 0.13818359375, 0.51171875, 0.88525390625, 1.2587890625, 1.63232421875, 2.005859375, 2.37939453125, 2.7529296875, 3.12646484375, 3.5, 3.87353515625, 4.2470703125, 4.62060546875, 4.994140625, 5.36767578125, 5.7412109375, 6.11474609375, 6.48828125, 6.86181640625, 7.2353515625, 7.60888671875, 7.982421875, 8.35595703125, 8.7294921875, 9.10302734375, 9.4765625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 10.0, 18.0, 23.0, 25.0, 50.0, 53.0, 95.0, 145.0, 210.0, 388.0, 1109.0, 12431.0, 2200016.0, 1966275.0, 11257.0, 1021.0, 403.0, 252.0, 153.0, 107.0, 74.0, 42.0, 40.0, 22.0, 15.0, 12.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.3125, -56.81689453125, -55.3212890625, -53.82568359375, -52.330078125, -50.83447265625, -49.3388671875, -47.84326171875, -46.34765625, -44.85205078125, -43.3564453125, -41.86083984375, -40.365234375, -38.86962890625, -37.3740234375, -35.87841796875, -34.3828125, -32.88720703125, -31.3916015625, -29.89599609375, -28.400390625, -26.90478515625, -25.4091796875, -23.91357421875, -22.41796875, -20.92236328125, -19.4267578125, -17.93115234375, -16.435546875, -14.93994140625, -13.4443359375, -11.94873046875, -10.453125, -8.95751953125, -7.4619140625, -5.96630859375, -4.470703125, -2.97509765625, -1.4794921875, 0.01611328125, 1.51171875, 3.00732421875, 4.5029296875, 5.99853515625, 7.494140625, 8.98974609375, 10.4853515625, 11.98095703125, 13.4765625, 14.97216796875, 16.4677734375, 17.96337890625, 19.458984375, 20.95458984375, 22.4501953125, 23.94580078125, 25.44140625, 26.93701171875, 28.4326171875, 29.92822265625, 31.423828125, 32.91943359375, 34.4150390625, 35.91064453125, 37.40625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 83.0, 215.0, 347.0, 246.0, 95.0, 19.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.125, -86.58455657958984, -81.04411315917969, -75.50366973876953, -69.96322631835938, -64.42278289794922, -58.88234329223633, -53.34189987182617, -47.801456451416016, -42.26101303100586, -36.7205696105957, -31.18012809753418, -25.639684677124023, -20.099241256713867, -14.558799743652344, -9.018356323242188, -3.4779129028320312, 2.062530040740967, 7.602972984313965, 13.143415451049805, 18.68385887145996, 24.224302291870117, 29.76474380493164, 35.3051872253418, 40.84563064575195, 46.38607406616211, 51.926517486572266, 57.466957092285156, 63.00740051269531, 68.54784393310547, 74.08828735351562, 79.62873077392578, 85.16917419433594, 90.7096176147461, 96.25006103515625, 101.7905044555664, 107.33094787597656, 112.87139129638672, 118.41183471679688, 123.9522705078125, 129.4927215576172, 135.0331573486328, 140.5736083984375, 146.11404418945312, 151.6544952392578, 157.19493103027344, 162.73538208007812, 168.27581787109375, 173.81625366210938, 179.356689453125, 184.8971405029297, 190.4375762939453, 195.97802734375, 201.51846313476562, 207.0589141845703, 212.59934997558594, 218.13980102539062, 223.68023681640625, 229.22068786621094, 234.76112365722656, 240.30157470703125, 245.84201049804688, 251.38246154785156, 256.92291259765625, 262.4633483886719]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 5.0, 8.0, 12.0, 10.0, 32.0, 25.0, 21.0, 19.0, 25.0, 19.0, 34.0, 31.0, 42.0, 31.0, 44.0, 37.0, 31.0, 43.0, 48.0, 44.0, 34.0, 41.0, 46.0, 44.0, 26.0, 39.0, 20.0, 33.0, 26.0, 21.0, 21.0, 12.0, 14.0, 8.0, 8.0, 12.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-45.05827331542969, -43.780174255371094, -42.502071380615234, -41.22397232055664, -39.94586944580078, -38.66777038574219, -37.38966751098633, -36.111568450927734, -34.833465576171875, -33.55536651611328, -32.27726364135742, -30.999162673950195, -29.72106170654297, -28.442962646484375, -27.16486167907715, -25.886760711669922, -24.608661651611328, -23.3305606842041, -22.052459716796875, -20.77435874938965, -19.496257781982422, -18.218158721923828, -16.9400577545166, -15.661956787109375, -14.383855819702148, -13.105754852294922, -11.827653884887695, -10.549553871154785, -9.271452903747559, -7.993351936340332, -6.715251445770264, -5.437150955200195, -4.159049987792969, -2.8809492588043213, -1.6028485298156738, -0.32474780082702637, 0.9533529281616211, 2.2314538955688477, 3.509554386138916, 4.787654876708984, 6.065755844116211, 7.3438568115234375, 8.621957778930664, 9.900057792663574, 11.1781587600708, 12.456259727478027, 13.734359741210938, 15.012460708618164, 16.29056167602539, 17.568662643432617, 18.846763610839844, 20.12486457824707, 21.402965545654297, 22.68106460571289, 23.959165573120117, 25.237266540527344, 26.51536750793457, 27.793468475341797, 29.071569442749023, 30.34967041015625, 31.627769470214844, 32.9058723449707, 34.1839714050293, 35.462074279785156, 36.74017333984375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 15.0, 17.0, 15.0, 15.0, 19.0, 21.0, 17.0, 29.0, 31.0, 40.0, 46.0, 40.0, 52.0, 41.0, 41.0, 42.0, 39.0, 33.0, 42.0, 42.0, 30.0, 37.0, 35.0, 27.0, 29.0, 20.0, 22.0, 23.0, 14.0, 15.0, 21.0, 5.0, 3.0, 10.0, 9.0, 11.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.93377685546875, -4.7738037109375, -4.61383056640625, -4.453857421875, -4.29388427734375, -4.1339111328125, -3.97393798828125, -3.81396484375, -3.65399169921875, -3.4940185546875, -3.33404541015625, -3.174072265625, -3.01409912109375, -2.8541259765625, -2.69415283203125, -2.5341796875, -2.37420654296875, -2.2142333984375, -2.05426025390625, -1.894287109375, -1.73431396484375, -1.5743408203125, -1.41436767578125, -1.25439453125, -1.09442138671875, -0.9344482421875, -0.77447509765625, -0.614501953125, -0.45452880859375, -0.2945556640625, -0.13458251953125, 0.025390625, 0.18536376953125, 0.3453369140625, 0.50531005859375, 0.665283203125, 0.82525634765625, 0.9852294921875, 1.14520263671875, 1.30517578125, 1.46514892578125, 1.6251220703125, 1.78509521484375, 1.945068359375, 2.10504150390625, 2.2650146484375, 2.42498779296875, 2.5849609375, 2.74493408203125, 2.9049072265625, 3.06488037109375, 3.224853515625, 3.38482666015625, 3.5447998046875, 3.70477294921875, 3.86474609375, 4.02471923828125, 4.1846923828125, 4.34466552734375, 4.504638671875, 4.66461181640625, 4.8245849609375, 4.98455810546875, 5.14453125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 12.0, 22.0, 22.0, 45.0, 58.0, 95.0, 132.0, 186.0, 282.0, 441.0, 599.0, 894.0, 1312.0, 1974.0, 2814.0, 4283.0, 6352.0, 9569.0, 14363.0, 22001.0, 33830.0, 52429.0, 80599.0, 118215.0, 154809.0, 159856.0, 127054.0, 88594.0, 58200.0, 37331.0, 24293.0, 15752.0, 10530.0, 7081.0, 4728.0, 3233.0, 2170.0, 1409.0, 965.0, 633.0, 437.0, 302.0, 218.0, 137.0, 84.0, 58.0, 51.0, 35.0, 14.0, 16.0, 11.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4406890869140625, -0.426055908203125, -0.4114227294921875, -0.39678955078125, -0.3821563720703125, -0.367523193359375, -0.3528900146484375, -0.3382568359375, -0.3236236572265625, -0.308990478515625, -0.2943572998046875, -0.27972412109375, -0.2650909423828125, -0.250457763671875, -0.2358245849609375, -0.22119140625, -0.2065582275390625, -0.191925048828125, -0.1772918701171875, -0.16265869140625, -0.1480255126953125, -0.133392333984375, -0.1187591552734375, -0.1041259765625, -0.0894927978515625, -0.074859619140625, -0.0602264404296875, -0.04559326171875, -0.0309600830078125, -0.016326904296875, -0.0016937255859375, 0.012939453125, 0.0275726318359375, 0.042205810546875, 0.0568389892578125, 0.07147216796875, 0.0861053466796875, 0.100738525390625, 0.1153717041015625, 0.1300048828125, 0.1446380615234375, 0.159271240234375, 0.1739044189453125, 0.18853759765625, 0.2031707763671875, 0.217803955078125, 0.2324371337890625, 0.2470703125, 0.2617034912109375, 0.276336669921875, 0.2909698486328125, 0.30560302734375, 0.3202362060546875, 0.334869384765625, 0.3495025634765625, 0.3641357421875, 0.3787689208984375, 0.393402099609375, 0.4080352783203125, 0.42266845703125, 0.4373016357421875, 0.451934814453125, 0.4665679931640625, 0.481201171875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 8.0, 9.0, 10.0, 15.0, 14.0, 24.0, 22.0, 17.0, 20.0, 28.0, 32.0, 38.0, 35.0, 41.0, 49.0, 40.0, 40.0, 1078.0, 63.0, 41.0, 41.0, 38.0, 35.0, 41.0, 37.0, 21.0, 30.0, 28.0, 25.0, 14.0, 13.0, 16.0, 15.0, 7.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.7734375, -3.66546630859375, -3.5574951171875, -3.44952392578125, -3.341552734375, -3.23358154296875, -3.1256103515625, -3.01763916015625, -2.90966796875, -2.80169677734375, -2.6937255859375, -2.58575439453125, -2.477783203125, -2.36981201171875, -2.2618408203125, -2.15386962890625, -2.0458984375, -1.93792724609375, -1.8299560546875, -1.72198486328125, -1.614013671875, -1.50604248046875, -1.3980712890625, -1.29010009765625, -1.18212890625, -1.07415771484375, -0.9661865234375, -0.85821533203125, -0.750244140625, -0.64227294921875, -0.5343017578125, -0.42633056640625, -0.318359375, -0.21038818359375, -0.1024169921875, 0.00555419921875, 0.113525390625, 0.22149658203125, 0.3294677734375, 0.43743896484375, 0.54541015625, 0.65338134765625, 0.7613525390625, 0.86932373046875, 0.977294921875, 1.08526611328125, 1.1932373046875, 1.30120849609375, 1.4091796875, 1.51715087890625, 1.6251220703125, 1.73309326171875, 1.841064453125, 1.94903564453125, 2.0570068359375, 2.16497802734375, 2.27294921875, 2.38092041015625, 2.4888916015625, 2.59686279296875, 2.704833984375, 2.81280517578125, 2.9207763671875, 3.02874755859375, 3.13671875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 10.0, 16.0, 20.0, 18.0, 32.0, 55.0, 69.0, 108.0, 149.0, 233.0, 337.0, 484.0, 697.0, 1013.0, 1598.0, 2285.0, 3296.0, 4902.0, 7429.0, 11086.0, 16735.0, 25409.0, 37838.0, 55665.0, 79037.0, 106784.0, 130346.0, 1185017.0, 120719.0, 94473.0, 68376.0, 47402.0, 31852.0, 21322.0, 14141.0, 9182.0, 6120.0, 4103.0, 2847.0, 1829.0, 1290.0, 841.0, 627.0, 433.0, 291.0, 219.0, 133.0, 95.0, 55.0, 48.0, 27.0, 16.0, 12.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.325439453125, -0.3150367736816406, -0.30463409423828125, -0.2942314147949219, -0.2838287353515625, -0.2734260559082031, -0.26302337646484375, -0.2526206970214844, -0.242218017578125, -0.23181533813476562, -0.22141265869140625, -0.21100997924804688, -0.2006072998046875, -0.19020462036132812, -0.17980194091796875, -0.16939926147460938, -0.15899658203125, -0.14859390258789062, -0.13819122314453125, -0.12778854370117188, -0.1173858642578125, -0.10698318481445312, -0.09658050537109375, -0.08617782592773438, -0.075775146484375, -0.06537246704101562, -0.05496978759765625, -0.044567108154296875, -0.0341644287109375, -0.023761749267578125, -0.01335906982421875, -0.002956390380859375, 0.0074462890625, 0.017848968505859375, 0.02825164794921875, 0.038654327392578125, 0.0490570068359375, 0.059459686279296875, 0.06986236572265625, 0.08026504516601562, 0.090667724609375, 0.10107040405273438, 0.11147308349609375, 0.12187576293945312, 0.1322784423828125, 0.14268112182617188, 0.15308380126953125, 0.16348648071289062, 0.17388916015625, 0.18429183959960938, 0.19469451904296875, 0.20509719848632812, 0.2154998779296875, 0.22590255737304688, 0.23630523681640625, 0.24670791625976562, 0.257110595703125, 0.2675132751464844, 0.27791595458984375, 0.2883186340332031, 0.2987213134765625, 0.3091239929199219, 0.31952667236328125, 0.3299293518066406, 0.34033203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 5.0, 11.0, 9.0, 10.0, 16.0, 14.0, 13.0, 23.0, 27.0, 27.0, 33.0, 39.0, 35.0, 39.0, 42.0, 57.0, 56.0, 55.0, 52.0, 44.0, 55.0, 45.0, 29.0, 40.0, 30.0, 26.0, 25.0, 17.0, 19.0, 18.0, 22.0, 14.0, 13.0, 10.0, 6.0, 1.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001712799072265625, -0.0016520321369171143, -0.0015912652015686035, -0.0015304982662200928, -0.001469731330871582, -0.0014089643955230713, -0.0013481974601745605, -0.0012874305248260498, -0.001226663589477539, -0.0011658966541290283, -0.0011051297187805176, -0.0010443627834320068, -0.000983595848083496, -0.0009228289127349854, -0.0008620619773864746, -0.0008012950420379639, -0.0007405281066894531, -0.0006797611713409424, -0.0006189942359924316, -0.0005582273006439209, -0.0004974603652954102, -0.0004366934299468994, -0.00037592649459838867, -0.00031515955924987793, -0.0002543926239013672, -0.00019362568855285645, -0.0001328587532043457, -7.209181785583496e-05, -1.1324882507324219e-05, 4.9442052841186523e-05, 0.00011020898818969727, 0.000170975923538208, 0.00023174285888671875, 0.0002925097942352295, 0.00035327672958374023, 0.000414043664932251, 0.0004748106002807617, 0.0005355775356292725, 0.0005963444709777832, 0.0006571114063262939, 0.0007178783416748047, 0.0007786452770233154, 0.0008394122123718262, 0.0009001791477203369, 0.0009609460830688477, 0.0010217130184173584, 0.0010824799537658691, 0.0011432468891143799, 0.0012040138244628906, 0.0012647807598114014, 0.0013255476951599121, 0.0013863146305084229, 0.0014470815658569336, 0.0015078485012054443, 0.001568615436553955, 0.0016293823719024658, 0.0016901493072509766, 0.0017509162425994873, 0.001811683177947998, 0.0018724501132965088, 0.0019332170486450195, 0.0019939839839935303, 0.002054750919342041, 0.0021155178546905518, 0.0021762847900390625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 5.0, 10.0, 7.0, 11.0, 15.0, 13.0, 15.0, 28.0, 26.0, 35.0, 49.0, 66.0, 78.0, 115.0, 145.0, 234.0, 496.0, 1578.0, 27777.0, 903821.0, 109097.0, 3274.0, 675.0, 333.0, 161.0, 105.0, 80.0, 55.0, 35.0, 33.0, 30.0, 23.0, 28.0, 17.0, 12.0, 10.0, 11.0, 10.0, 4.0, 7.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.038909912109375, -0.037754058837890625, -0.03659820556640625, -0.035442352294921875, -0.0342864990234375, -0.033130645751953125, -0.03197479248046875, -0.030818939208984375, -0.0296630859375, -0.028507232666015625, -0.02735137939453125, -0.026195526123046875, -0.0250396728515625, -0.023883819580078125, -0.02272796630859375, -0.021572113037109375, -0.020416259765625, -0.019260406494140625, -0.01810455322265625, -0.016948699951171875, -0.0157928466796875, -0.014636993408203125, -0.01348114013671875, -0.012325286865234375, -0.01116943359375, -0.010013580322265625, -0.00885772705078125, -0.007701873779296875, -0.0065460205078125, -0.005390167236328125, -0.00423431396484375, -0.003078460693359375, -0.001922607421875, -0.000766754150390625, 0.00038909912109375, 0.001544952392578125, 0.0027008056640625, 0.003856658935546875, 0.00501251220703125, 0.006168365478515625, 0.00732421875, 0.008480072021484375, 0.00963592529296875, 0.010791778564453125, 0.0119476318359375, 0.013103485107421875, 0.01425933837890625, 0.015415191650390625, 0.016571044921875, 0.017726898193359375, 0.01888275146484375, 0.020038604736328125, 0.0211944580078125, 0.022350311279296875, 0.02350616455078125, 0.024662017822265625, 0.02581787109375, 0.026973724365234375, 0.02812957763671875, 0.029285430908203125, 0.0304412841796875, 0.031597137451171875, 0.03275299072265625, 0.033908843994140625, 0.035064697265625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 25.0, 125.0, 469.0, 326.0, 49.0, 19.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001179486745968461, -0.0008728373213671148, -0.0005661878967657685, -0.0002595384721644223, 4.711095243692398e-05, 0.0003537603188306093, 0.0006604098016396165, 0.0009670592844486237, 0.001273708650842309, 0.0015803580172359943, 0.0018870075000450015, 0.0021936569828540087, 0.002500306349247694, 0.0028069557156413794, 0.0031136050820350647, 0.0034202546812593937, 0.003726904047653079, 0.004033553414046764, 0.004340203013271093, 0.004646852146834135, 0.004953501746058464, 0.005260150879621506, 0.005566800478845835, 0.005873450078070164, 0.006180099211633205, 0.006486748810857534, 0.006793397944420576, 0.007100047543644905, 0.007406696677207947, 0.007713346276432276, 0.008019995875656605, 0.008326645009219646, 0.008633295074105263, 0.008939944207668304, 0.00924659427255392, 0.009553243406116962, 0.009859892539680004, 0.01016654260456562, 0.010473191738128662, 0.010779840871691704, 0.011086490005254745, 0.011393139138817787, 0.011699789203703403, 0.012006438337266445, 0.012313087470829487, 0.012619737535715103, 0.012926386669278145, 0.013233035802841187, 0.013539685867726803, 0.013846335001289845, 0.01415298506617546, 0.014459634199738503, 0.014766283333301544, 0.015072932466864586, 0.015379582531750202, 0.01568623259663582, 0.01599288173019886, 0.016299530863761902, 0.016606179997324944, 0.016912829130887985, 0.017219480127096176, 0.017526129260659218, 0.01783277839422226, 0.0181394275277853, 0.018446076661348343]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 8.0, 4.0, 2.0, 11.0, 8.0, 12.0, 7.0, 6.0, 9.0, 19.0, 14.0, 21.0, 29.0, 30.0, 34.0, 34.0, 46.0, 39.0, 34.0, 35.0, 31.0, 37.0, 37.0, 31.0, 42.0, 26.0, 29.0, 50.0, 49.0, 28.0, 23.0, 22.0, 27.0, 36.0, 18.0, 13.0, 17.0, 17.0, 15.0, 9.0, 10.0, 4.0, 7.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0], "bins": [-0.0011725425720214844, -0.001139884814620018, -0.0011072270572185516, -0.0010745692998170853, -0.001041911542415619, -0.0010092537850141525, -0.0009765960276126862, -0.0009439382702112198, -0.0009112805128097534, -0.000878622755408287, -0.0008459649980068207, -0.0008133072406053543, -0.0007806494832038879, -0.0007479917258024216, -0.0007153339684009552, -0.0006826762109994888, -0.0006500184535980225, -0.0006173606961965561, -0.0005847029387950897, -0.0005520451813936234, -0.000519387423992157, -0.0004867296665906906, -0.00045407190918922424, -0.0004214141517877579, -0.0003887563943862915, -0.00035609863698482513, -0.00032344087958335876, -0.0002907831221818924, -0.000258125364780426, -0.00022546760737895966, -0.00019280984997749329, -0.00016015209257602692, -0.00012749433517456055, -9.483657777309418e-05, -6.217882037162781e-05, -2.9521062970161438e-05, 3.1366944313049316e-06, 3.57944518327713e-05, 6.845220923423767e-05, 0.00010110996663570404, 0.0001337677240371704, 0.00016642548143863678, 0.00019908323884010315, 0.00023174099624156952, 0.0002643987536430359, 0.00029705651104450226, 0.00032971426844596863, 0.000362372025847435, 0.00039502978324890137, 0.00042768754065036774, 0.0004603452980518341, 0.0004930030554533005, 0.0005256608128547668, 0.0005583185702562332, 0.0005909763276576996, 0.000623634085059166, 0.0006562918424606323, 0.0006889495998620987, 0.0007216073572635651, 0.0007542651146650314, 0.0007869228720664978, 0.0008195806294679642, 0.0008522383868694305, 0.0008848961442708969, 0.0009175539016723633]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 15.0, 17.0, 15.0, 15.0, 19.0, 21.0, 17.0, 29.0, 31.0, 40.0, 46.0, 40.0, 52.0, 41.0, 41.0, 42.0, 39.0, 33.0, 42.0, 42.0, 30.0, 37.0, 35.0, 27.0, 28.0, 21.0, 22.0, 23.0, 14.0, 15.0, 21.0, 5.0, 3.0, 10.0, 9.0, 11.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.93377685546875, -4.7738037109375, -4.61383056640625, -4.453857421875, -4.29388427734375, -4.1339111328125, -3.97393798828125, -3.81396484375, -3.65399169921875, -3.4940185546875, -3.33404541015625, -3.174072265625, -3.01409912109375, -2.8541259765625, -2.69415283203125, -2.5341796875, -2.37420654296875, -2.2142333984375, -2.05426025390625, -1.894287109375, -1.73431396484375, -1.5743408203125, -1.41436767578125, -1.25439453125, -1.09442138671875, -0.9344482421875, -0.77447509765625, -0.614501953125, -0.45452880859375, -0.2945556640625, -0.13458251953125, 0.025390625, 0.18536376953125, 0.3453369140625, 0.50531005859375, 0.665283203125, 0.82525634765625, 0.9852294921875, 1.14520263671875, 1.30517578125, 1.46514892578125, 1.6251220703125, 1.78509521484375, 1.945068359375, 2.10504150390625, 2.2650146484375, 2.42498779296875, 2.5849609375, 2.74493408203125, 2.9049072265625, 3.06488037109375, 3.224853515625, 3.38482666015625, 3.5447998046875, 3.70477294921875, 3.86474609375, 4.02471923828125, 4.1846923828125, 4.34466552734375, 4.504638671875, 4.66461181640625, 4.8245849609375, 4.98455810546875, 5.14453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 7.0, 11.0, 9.0, 19.0, 40.0, 47.0, 69.0, 91.0, 169.0, 219.0, 417.0, 628.0, 1111.0, 1930.0, 3732.0, 7020.0, 14479.0, 30554.0, 69540.0, 165415.0, 387310.0, 207503.0, 85575.0, 37446.0, 17192.0, 8205.0, 4208.0, 2279.0, 1280.0, 783.0, 459.0, 294.0, 172.0, 118.0, 76.0, 54.0, 23.0, 28.0, 12.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.7435302734375, -4.588623046875, -4.4337158203125, -4.27880859375, -4.1239013671875, -3.968994140625, -3.8140869140625, -3.6591796875, -3.5042724609375, -3.349365234375, -3.1944580078125, -3.03955078125, -2.8846435546875, -2.729736328125, -2.5748291015625, -2.419921875, -2.2650146484375, -2.110107421875, -1.9552001953125, -1.80029296875, -1.6453857421875, -1.490478515625, -1.3355712890625, -1.1806640625, -1.0257568359375, -0.870849609375, -0.7159423828125, -0.56103515625, -0.4061279296875, -0.251220703125, -0.0963134765625, 0.05859375, 0.2135009765625, 0.368408203125, 0.5233154296875, 0.67822265625, 0.8331298828125, 0.988037109375, 1.1429443359375, 1.2978515625, 1.4527587890625, 1.607666015625, 1.7625732421875, 1.91748046875, 2.0723876953125, 2.227294921875, 2.3822021484375, 2.537109375, 2.6920166015625, 2.846923828125, 3.0018310546875, 3.15673828125, 3.3116455078125, 3.466552734375, 3.6214599609375, 3.7763671875, 3.9312744140625, 4.086181640625, 4.2410888671875, 4.39599609375, 4.5509033203125, 4.705810546875, 4.8607177734375, 5.015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 15.0, 13.0, 11.0, 15.0, 13.0, 22.0, 23.0, 18.0, 27.0, 31.0, 43.0, 47.0, 50.0, 48.0, 57.0, 98.0, 247.0, 1503.0, 201.0, 107.0, 65.0, 34.0, 42.0, 42.0, 38.0, 34.0, 29.0, 23.0, 22.0, 24.0, 24.0, 14.0, 4.0, 8.0, 7.0, 7.0, 10.0, 8.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.764404296875, -17.21630859375, -16.668212890625, -16.1201171875, -15.572021484375, -15.02392578125, -14.475830078125, -13.927734375, -13.379638671875, -12.83154296875, -12.283447265625, -11.7353515625, -11.187255859375, -10.63916015625, -10.091064453125, -9.54296875, -8.994873046875, -8.44677734375, -7.898681640625, -7.3505859375, -6.802490234375, -6.25439453125, -5.706298828125, -5.158203125, -4.610107421875, -4.06201171875, -3.513916015625, -2.9658203125, -2.417724609375, -1.86962890625, -1.321533203125, -0.7734375, -0.225341796875, 0.32275390625, 0.870849609375, 1.4189453125, 1.967041015625, 2.51513671875, 3.063232421875, 3.611328125, 4.159423828125, 4.70751953125, 5.255615234375, 5.8037109375, 6.351806640625, 6.89990234375, 7.447998046875, 7.99609375, 8.544189453125, 9.09228515625, 9.640380859375, 10.1884765625, 10.736572265625, 11.28466796875, 11.832763671875, 12.380859375, 12.928955078125, 13.47705078125, 14.025146484375, 14.5732421875, 15.121337890625, 15.66943359375, 16.217529296875, 16.765625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 17.0, 30.0, 39.0, 67.0, 105.0, 149.0, 349.0, 745.0, 15097.0, 3124529.0, 3383.0, 572.0, 271.0, 117.0, 78.0, 63.0, 38.0, 20.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.75, -86.8876953125, -84.025390625, -81.1630859375, -78.30078125, -75.4384765625, -72.576171875, -69.7138671875, -66.8515625, -63.9892578125, -61.126953125, -58.2646484375, -55.40234375, -52.5400390625, -49.677734375, -46.8154296875, -43.953125, -41.0908203125, -38.228515625, -35.3662109375, -32.50390625, -29.6416015625, -26.779296875, -23.9169921875, -21.0546875, -18.1923828125, -15.330078125, -12.4677734375, -9.60546875, -6.7431640625, -3.880859375, -1.0185546875, 1.84375, 4.7060546875, 7.568359375, 10.4306640625, 13.29296875, 16.1552734375, 19.017578125, 21.8798828125, 24.7421875, 27.6044921875, 30.466796875, 33.3291015625, 36.19140625, 39.0537109375, 41.916015625, 44.7783203125, 47.640625, 50.5029296875, 53.365234375, 56.2275390625, 59.08984375, 61.9521484375, 64.814453125, 67.6767578125, 70.5390625, 73.4013671875, 76.263671875, 79.1259765625, 81.98828125, 84.8505859375, 87.712890625, 90.5751953125, 93.4375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 16.0, 189.0, 509.0, 268.0, 27.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-178.96446228027344, -175.49362182617188, -172.0227813720703, -168.5519561767578, -165.08111572265625, -161.6102752685547, -158.13943481445312, -154.66860961914062, -151.19776916503906, -147.7269287109375, -144.25608825683594, -140.78526306152344, -137.31442260742188, -133.8435821533203, -130.37274169921875, -126.90190887451172, -123.43106842041016, -119.9602279663086, -116.48939514160156, -113.0185546875, -109.54772186279297, -106.0768814086914, -102.60604858398438, -99.13520812988281, -95.66436767578125, -92.19352722167969, -88.72269439697266, -85.2518539428711, -81.78102111816406, -78.3101806640625, -74.83934020996094, -71.3685073852539, -67.89767456054688, -64.42683410644531, -60.95600128173828, -57.48516082763672, -54.01432800292969, -50.543487548828125, -47.07265090942383, -43.60181427001953, -40.130977630615234, -36.66014099121094, -33.18930435180664, -29.71846580505371, -26.247629165649414, -22.776792526245117, -19.305953979492188, -15.83511734008789, -12.364280700683594, -8.893444061279297, -5.422606468200684, -1.9517688751220703, 1.5190677642822266, 4.989904403686523, 8.460742950439453, 11.93157958984375, 15.402416229248047, 18.873252868652344, 22.34408950805664, 25.81492805480957, 29.285764694213867, 32.75659942626953, 36.227439880371094, 39.69827651977539, 43.16911315917969]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 5.0, 10.0, 5.0, 7.0, 13.0, 12.0, 18.0, 15.0, 22.0, 23.0, 17.0, 27.0, 22.0, 30.0, 39.0, 30.0, 35.0, 45.0, 46.0, 36.0, 36.0, 36.0, 49.0, 39.0, 34.0, 39.0, 39.0, 33.0, 25.0, 26.0, 23.0, 25.0, 23.0, 21.0, 26.0, 16.0, 11.0, 8.0, 11.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.80858612060547, -44.289833068847656, -42.77108383178711, -41.2523307800293, -39.73358154296875, -38.21482849121094, -36.696075439453125, -35.17732238769531, -33.658573150634766, -32.13982009887695, -30.621070861816406, -29.102317810058594, -27.583566665649414, -26.064815521240234, -24.546062469482422, -23.027311325073242, -21.508560180664062, -19.989809036254883, -18.471057891845703, -16.95230484008789, -15.433553695678711, -13.914802551269531, -12.396050453186035, -10.877298355102539, -9.35854721069336, -7.8397955894470215, -6.321043968200684, -4.802292346954346, -3.283540725708008, -1.76478910446167, -0.24603748321533203, 1.272714614868164, 2.7914657592773438, 4.310217380523682, 5.8289690017700195, 7.347720623016357, 8.866472244262695, 10.385223388671875, 11.903975486755371, 13.422727584838867, 14.941478729248047, 16.460229873657227, 17.978981018066406, 19.49773406982422, 21.0164852142334, 22.535236358642578, 24.05398941040039, 25.57274055480957, 27.09149169921875, 28.61024284362793, 30.12899398803711, 31.647747039794922, 33.16649627685547, 34.68524932861328, 36.204002380371094, 37.722755432128906, 39.24150466918945, 40.760257720947266, 42.27900695800781, 43.797760009765625, 45.31651306152344, 46.835262298583984, 48.3540153503418, 49.872764587402344, 51.391517639160156]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 6.0, 2.0, 4.0, 7.0, 12.0, 14.0, 9.0, 17.0, 20.0, 17.0, 18.0, 23.0, 29.0, 27.0, 46.0, 48.0, 40.0, 49.0, 48.0, 36.0, 42.0, 42.0, 38.0, 32.0, 41.0, 41.0, 34.0, 38.0, 36.0, 25.0, 22.0, 20.0, 12.0, 23.0, 13.0, 10.0, 8.0, 9.0, 12.0, 7.0, 8.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.0543212890625, -4.878173828125, -4.7020263671875, -4.52587890625, -4.3497314453125, -4.173583984375, -3.9974365234375, -3.8212890625, -3.6451416015625, -3.468994140625, -3.2928466796875, -3.11669921875, -2.9405517578125, -2.764404296875, -2.5882568359375, -2.412109375, -2.2359619140625, -2.059814453125, -1.8836669921875, -1.70751953125, -1.5313720703125, -1.355224609375, -1.1790771484375, -1.0029296875, -0.8267822265625, -0.650634765625, -0.4744873046875, -0.29833984375, -0.1221923828125, 0.053955078125, 0.2301025390625, 0.40625, 0.5823974609375, 0.758544921875, 0.9346923828125, 1.11083984375, 1.2869873046875, 1.463134765625, 1.6392822265625, 1.8154296875, 1.9915771484375, 2.167724609375, 2.3438720703125, 2.52001953125, 2.6961669921875, 2.872314453125, 3.0484619140625, 3.224609375, 3.4007568359375, 3.576904296875, 3.7530517578125, 3.92919921875, 4.1053466796875, 4.281494140625, 4.4576416015625, 4.6337890625, 4.8099365234375, 4.986083984375, 5.1622314453125, 5.33837890625, 5.5145263671875, 5.690673828125, 5.8668212890625, 6.04296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 8.0, 6.0, 7.0, 10.0, 13.0, 12.0, 17.0, 15.0, 26.0, 37.0, 34.0, 47.0, 89.0, 168.0, 422.0, 1536.0, 8510.0, 118054.0, 2501779.0, 1501111.0, 55483.0, 5114.0, 1019.0, 309.0, 139.0, 73.0, 60.0, 37.0, 20.0, 22.0, 15.0, 15.0, 17.0, 5.0, 13.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.0771484375, -17.451171875, -16.8251953125, -16.19921875, -15.5732421875, -14.947265625, -14.3212890625, -13.6953125, -13.0693359375, -12.443359375, -11.8173828125, -11.19140625, -10.5654296875, -9.939453125, -9.3134765625, -8.6875, -8.0615234375, -7.435546875, -6.8095703125, -6.18359375, -5.5576171875, -4.931640625, -4.3056640625, -3.6796875, -3.0537109375, -2.427734375, -1.8017578125, -1.17578125, -0.5498046875, 0.076171875, 0.7021484375, 1.328125, 1.9541015625, 2.580078125, 3.2060546875, 3.83203125, 4.4580078125, 5.083984375, 5.7099609375, 6.3359375, 6.9619140625, 7.587890625, 8.2138671875, 8.83984375, 9.4658203125, 10.091796875, 10.7177734375, 11.34375, 11.9697265625, 12.595703125, 13.2216796875, 13.84765625, 14.4736328125, 15.099609375, 15.7255859375, 16.3515625, 16.9775390625, 17.603515625, 18.2294921875, 18.85546875, 19.4814453125, 20.107421875, 20.7333984375, 21.359375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 13.0, 9.0, 11.0, 11.0, 20.0, 26.0, 26.0, 30.0, 53.0, 57.0, 79.0, 77.0, 110.0, 157.0, 183.0, 231.0, 329.0, 347.0, 347.0, 374.0, 326.0, 255.0, 214.0, 158.0, 141.0, 102.0, 80.0, 64.0, 48.0, 35.0, 35.0, 25.0, 19.0, 19.0, 10.0, 10.0, 11.0, 5.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.8515625, -10.5308837890625, -10.210205078125, -9.8895263671875, -9.56884765625, -9.2481689453125, -8.927490234375, -8.6068115234375, -8.2861328125, -7.9654541015625, -7.644775390625, -7.3240966796875, -7.00341796875, -6.6827392578125, -6.362060546875, -6.0413818359375, -5.720703125, -5.4000244140625, -5.079345703125, -4.7586669921875, -4.43798828125, -4.1173095703125, -3.796630859375, -3.4759521484375, -3.1552734375, -2.8345947265625, -2.513916015625, -2.1932373046875, -1.87255859375, -1.5518798828125, -1.231201171875, -0.9105224609375, -0.58984375, -0.2691650390625, 0.051513671875, 0.3721923828125, 0.69287109375, 1.0135498046875, 1.334228515625, 1.6549072265625, 1.9755859375, 2.2962646484375, 2.616943359375, 2.9376220703125, 3.25830078125, 3.5789794921875, 3.899658203125, 4.2203369140625, 4.541015625, 4.8616943359375, 5.182373046875, 5.5030517578125, 5.82373046875, 6.1444091796875, 6.465087890625, 6.7857666015625, 7.1064453125, 7.4271240234375, 7.747802734375, 8.0684814453125, 8.38916015625, 8.7098388671875, 9.030517578125, 9.3511962890625, 9.671875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 9.0, 8.0, 12.0, 23.0, 16.0, 26.0, 28.0, 38.0, 32.0, 61.0, 65.0, 79.0, 125.0, 143.0, 134.0, 195.0, 298.0, 576.0, 2113.0, 29055.0, 1862660.0, 2259695.0, 34495.0, 2412.0, 583.0, 324.0, 225.0, 165.0, 136.0, 116.0, 68.0, 73.0, 57.0, 60.0, 33.0, 32.0, 23.0, 23.0, 14.0, 9.0, 4.0, 7.0, 9.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.29052734375, -32.1435546875, -30.99658203125, -29.849609375, -28.70263671875, -27.5556640625, -26.40869140625, -25.26171875, -24.11474609375, -22.9677734375, -21.82080078125, -20.673828125, -19.52685546875, -18.3798828125, -17.23291015625, -16.0859375, -14.93896484375, -13.7919921875, -12.64501953125, -11.498046875, -10.35107421875, -9.2041015625, -8.05712890625, -6.91015625, -5.76318359375, -4.6162109375, -3.46923828125, -2.322265625, -1.17529296875, -0.0283203125, 1.11865234375, 2.265625, 3.41259765625, 4.5595703125, 5.70654296875, 6.853515625, 8.00048828125, 9.1474609375, 10.29443359375, 11.44140625, 12.58837890625, 13.7353515625, 14.88232421875, 16.029296875, 17.17626953125, 18.3232421875, 19.47021484375, 20.6171875, 21.76416015625, 22.9111328125, 24.05810546875, 25.205078125, 26.35205078125, 27.4990234375, 28.64599609375, 29.79296875, 30.93994140625, 32.0869140625, 33.23388671875, 34.380859375, 35.52783203125, 36.6748046875, 37.82177734375, 38.96875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 382.0, 568.0, 53.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-500.4175720214844, -488.2671813964844, -476.11676025390625, -463.96636962890625, -451.81597900390625, -439.66558837890625, -427.5151672363281, -415.3647766113281, -403.21435546875, -391.06396484375, -378.9135437011719, -366.7631530761719, -354.6127624511719, -342.46234130859375, -330.31195068359375, -318.16156005859375, -306.01116943359375, -293.86077880859375, -281.7103576660156, -269.5599670410156, -257.4095764160156, -245.25917053222656, -233.1087646484375, -220.9583740234375, -208.80796813964844, -196.65756225585938, -184.50717163085938, -172.3567657470703, -160.20635986328125, -148.05596923828125, -135.9055633544922, -123.75516510009766, -111.60479736328125, -99.45439910888672, -87.30400085449219, -75.15359497070312, -63.003196716308594, -50.85279846191406, -38.702392578125, -26.55199432373047, -14.401596069335938, -2.2511959075927734, 9.89920425415039, 22.049606323242188, 34.20000457763672, 46.35040283203125, 58.50080871582031, 70.65120697021484, 82.80160522460938, 94.9520034790039, 107.10240173339844, 119.2528076171875, 131.4031982421875, 143.55360412597656, 155.70401000976562, 167.85440063476562, 180.0048065185547, 192.15521240234375, 204.30560302734375, 216.4560089111328, 228.60641479492188, 240.75680541992188, 252.90721130371094, 265.0576171875, 277.2080078125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 2.0, 7.0, 9.0, 9.0, 15.0, 14.0, 14.0, 21.0, 23.0, 13.0, 20.0, 25.0, 33.0, 32.0, 45.0, 32.0, 36.0, 46.0, 32.0, 37.0, 41.0, 37.0, 40.0, 30.0, 40.0, 22.0, 32.0, 35.0, 32.0, 37.0, 21.0, 14.0, 30.0, 17.0, 19.0, 15.0, 18.0, 5.0, 7.0, 6.0, 3.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-40.8155517578125, -39.58872985839844, -38.36191177368164, -37.13508987426758, -35.90827178955078, -34.68144989013672, -33.454627990722656, -32.22780990600586, -31.000988006591797, -29.774168014526367, -28.547348022460938, -27.320526123046875, -26.093706130981445, -24.866886138916016, -23.640066146850586, -22.413246154785156, -21.186426162719727, -19.959606170654297, -18.732786178588867, -17.505966186523438, -16.279144287109375, -15.052324295043945, -13.825504302978516, -12.59868335723877, -11.37186336517334, -10.14504337310791, -8.918222427368164, -7.691402435302734, -6.4645819664001465, -5.237761497497559, -4.010941505432129, -2.784120559692383, -1.5573005676269531, -0.3304802179336548, 0.8963401317596436, 2.1231603622436523, 3.3499808311462402, 4.576801300048828, 5.803621292114258, 7.030442237854004, 8.257262229919434, 9.484082221984863, 10.71090316772461, 11.937723159790039, 13.164543151855469, 14.391364097595215, 15.618184089660645, 16.84500503540039, 18.07182502746582, 19.29864501953125, 20.52546501159668, 21.75228500366211, 22.979106903076172, 24.2059268951416, 25.43274688720703, 26.659568786621094, 27.88638687133789, 29.11320686340332, 30.34002685546875, 31.566848754882812, 32.79366683959961, 34.02048873901367, 35.24730682373047, 36.47412872314453, 37.700950622558594]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 2.0, 8.0, 14.0, 17.0, 17.0, 16.0, 20.0, 19.0, 24.0, 32.0, 40.0, 35.0, 41.0, 41.0, 56.0, 37.0, 37.0, 45.0, 44.0, 40.0, 40.0, 40.0, 39.0, 35.0, 36.0, 29.0, 23.0, 30.0, 19.0, 19.0, 13.0, 13.0, 10.0, 8.0, 11.0, 10.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.159423828125, -4.97900390625, -4.798583984375, -4.6181640625, -4.437744140625, -4.25732421875, -4.076904296875, -3.896484375, -3.716064453125, -3.53564453125, -3.355224609375, -3.1748046875, -2.994384765625, -2.81396484375, -2.633544921875, -2.453125, -2.272705078125, -2.09228515625, -1.911865234375, -1.7314453125, -1.551025390625, -1.37060546875, -1.190185546875, -1.009765625, -0.829345703125, -0.64892578125, -0.468505859375, -0.2880859375, -0.107666015625, 0.07275390625, 0.253173828125, 0.43359375, 0.614013671875, 0.79443359375, 0.974853515625, 1.1552734375, 1.335693359375, 1.51611328125, 1.696533203125, 1.876953125, 2.057373046875, 2.23779296875, 2.418212890625, 2.5986328125, 2.779052734375, 2.95947265625, 3.139892578125, 3.3203125, 3.500732421875, 3.68115234375, 3.861572265625, 4.0419921875, 4.222412109375, 4.40283203125, 4.583251953125, 4.763671875, 4.944091796875, 5.12451171875, 5.304931640625, 5.4853515625, 5.665771484375, 5.84619140625, 6.026611328125, 6.20703125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 8.0, 15.0, 21.0, 20.0, 44.0, 60.0, 89.0, 133.0, 212.0, 335.0, 528.0, 840.0, 1386.0, 2320.0, 3825.0, 6528.0, 11047.0, 19552.0, 34927.0, 62997.0, 109663.0, 172308.0, 210599.0, 167278.0, 105500.0, 59815.0, 33388.0, 18825.0, 10617.0, 6214.0, 3632.0, 2276.0, 1285.0, 853.0, 503.0, 313.0, 202.0, 127.0, 97.0, 45.0, 53.0, 28.0, 21.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6502304077148438, -0.6295623779296875, -0.6088943481445312, -0.588226318359375, -0.5675582885742188, -0.5468902587890625, -0.5262222290039062, -0.50555419921875, -0.48488616943359375, -0.4642181396484375, -0.44355010986328125, -0.422882080078125, -0.40221405029296875, -0.3815460205078125, -0.36087799072265625, -0.3402099609375, -0.31954193115234375, -0.2988739013671875, -0.27820587158203125, -0.257537841796875, -0.23686981201171875, -0.2162017822265625, -0.19553375244140625, -0.17486572265625, -0.15419769287109375, -0.1335296630859375, -0.11286163330078125, -0.092193603515625, -0.07152557373046875, -0.0508575439453125, -0.03018951416015625, -0.009521484375, 0.01114654541015625, 0.0318145751953125, 0.05248260498046875, 0.073150634765625, 0.09381866455078125, 0.1144866943359375, 0.13515472412109375, 0.15582275390625, 0.17649078369140625, 0.1971588134765625, 0.21782684326171875, 0.238494873046875, 0.25916290283203125, 0.2798309326171875, 0.30049896240234375, 0.3211669921875, 0.34183502197265625, 0.3625030517578125, 0.38317108154296875, 0.403839111328125, 0.42450714111328125, 0.4451751708984375, 0.46584320068359375, 0.48651123046875, 0.5071792602539062, 0.5278472900390625, 0.5485153198242188, 0.569183349609375, 0.5898513793945312, 0.6105194091796875, 0.6311874389648438, 0.65185546875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 14.0, 5.0, 14.0, 17.0, 20.0, 18.0, 16.0, 24.0, 22.0, 26.0, 40.0, 32.0, 45.0, 38.0, 27.0, 30.0, 39.0, 26.0, 1054.0, 59.0, 37.0, 41.0, 38.0, 34.0, 26.0, 27.0, 25.0, 25.0, 25.0, 23.0, 21.0, 13.0, 15.0, 19.0, 10.0, 12.0, 10.0, 5.0, 10.0, 3.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.17926025390625, -3.0772705078125, -2.97528076171875, -2.873291015625, -2.77130126953125, -2.6693115234375, -2.56732177734375, -2.46533203125, -2.36334228515625, -2.2613525390625, -2.15936279296875, -2.057373046875, -1.95538330078125, -1.8533935546875, -1.75140380859375, -1.6494140625, -1.54742431640625, -1.4454345703125, -1.34344482421875, -1.241455078125, -1.13946533203125, -1.0374755859375, -0.93548583984375, -0.83349609375, -0.73150634765625, -0.6295166015625, -0.52752685546875, -0.425537109375, -0.32354736328125, -0.2215576171875, -0.11956787109375, -0.017578125, 0.08441162109375, 0.1864013671875, 0.28839111328125, 0.390380859375, 0.49237060546875, 0.5943603515625, 0.69635009765625, 0.79833984375, 0.90032958984375, 1.0023193359375, 1.10430908203125, 1.206298828125, 1.30828857421875, 1.4102783203125, 1.51226806640625, 1.6142578125, 1.71624755859375, 1.8182373046875, 1.92022705078125, 2.022216796875, 2.12420654296875, 2.2261962890625, 2.32818603515625, 2.43017578125, 2.53216552734375, 2.6341552734375, 2.73614501953125, 2.838134765625, 2.94012451171875, 3.0421142578125, 3.14410400390625, 3.24609375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 8.0, 7.0, 17.0, 28.0, 42.0, 60.0, 108.0, 147.0, 249.0, 385.0, 626.0, 927.0, 1414.0, 2022.0, 3290.0, 4996.0, 7870.0, 12093.0, 18638.0, 28398.0, 42453.0, 62092.0, 88028.0, 116566.0, 877516.0, 443902.0, 115653.0, 86719.0, 61873.0, 41639.0, 27715.0, 18119.0, 11743.0, 7771.0, 4858.0, 3282.0, 2061.0, 1362.0, 853.0, 587.0, 378.0, 229.0, 157.0, 84.0, 62.0, 46.0, 27.0, 14.0, 14.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31884765625, -0.3074531555175781, -0.29605865478515625, -0.2846641540527344, -0.2732696533203125, -0.2618751525878906, -0.25048065185546875, -0.23908615112304688, -0.227691650390625, -0.21629714965820312, -0.20490264892578125, -0.19350814819335938, -0.1821136474609375, -0.17071914672851562, -0.15932464599609375, -0.14793014526367188, -0.13653564453125, -0.12514114379882812, -0.11374664306640625, -0.10235214233398438, -0.0909576416015625, -0.07956314086914062, -0.06816864013671875, -0.056774139404296875, -0.045379638671875, -0.033985137939453125, -0.02259063720703125, -0.011196136474609375, 0.0001983642578125, 0.011592864990234375, 0.02298736572265625, 0.034381866455078125, 0.0457763671875, 0.057170867919921875, 0.06856536865234375, 0.07995986938476562, 0.0913543701171875, 0.10274887084960938, 0.11414337158203125, 0.12553787231445312, 0.136932373046875, 0.14832687377929688, 0.15972137451171875, 0.17111587524414062, 0.1825103759765625, 0.19390487670898438, 0.20529937744140625, 0.21669387817382812, 0.22808837890625, 0.23948287963867188, 0.25087738037109375, 0.2622718811035156, 0.2736663818359375, 0.2850608825683594, 0.29645538330078125, 0.3078498840332031, 0.319244384765625, 0.3306388854980469, 0.34203338623046875, 0.3534278869628906, 0.3648223876953125, 0.3762168884277344, 0.38761138916015625, 0.3990058898925781, 0.410400390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 20.0, 7.0, 7.0, 26.0, 17.0, 26.0, 41.0, 53.0, 49.0, 55.0, 67.0, 79.0, 81.0, 81.0, 61.0, 58.0, 39.0, 55.0, 34.0, 30.0, 22.0, 16.0, 14.0, 7.0, 6.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027828216552734375, -0.0026868879795074463, -0.002590954303741455, -0.002495020627975464, -0.0023990869522094727, -0.0023031532764434814, -0.0022072196006774902, -0.002111285924911499, -0.002015352249145508, -0.0019194185733795166, -0.0018234848976135254, -0.0017275512218475342, -0.001631617546081543, -0.0015356838703155518, -0.0014397501945495605, -0.0013438165187835693, -0.0012478828430175781, -0.001151949167251587, -0.0010560154914855957, -0.0009600818157196045, -0.0008641481399536133, -0.0007682144641876221, -0.0006722807884216309, -0.0005763471126556396, -0.00048041343688964844, -0.0003844797611236572, -0.000288546085357666, -0.0001926124095916748, -9.66787338256836e-05, -7.450580596923828e-07, 9.518861770629883e-05, 0.00019112229347229004, 0.00028705596923828125, 0.00038298964500427246, 0.00047892332077026367, 0.0005748569965362549, 0.0006707906723022461, 0.0007667243480682373, 0.0008626580238342285, 0.0009585916996002197, 0.001054525375366211, 0.0011504590511322021, 0.0012463927268981934, 0.0013423264026641846, 0.0014382600784301758, 0.001534193754196167, 0.0016301274299621582, 0.0017260611057281494, 0.0018219947814941406, 0.0019179284572601318, 0.002013862133026123, 0.0021097958087921143, 0.0022057294845581055, 0.0023016631603240967, 0.002397596836090088, 0.002493530511856079, 0.0025894641876220703, 0.0026853978633880615, 0.0027813315391540527, 0.002877265214920044, 0.002973198890686035, 0.0030691325664520264, 0.0031650662422180176, 0.003260999917984009, 0.00335693359375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 11.0, 13.0, 16.0, 26.0, 29.0, 43.0, 61.0, 76.0, 106.0, 193.0, 434.0, 1945.0, 554878.0, 487841.0, 1901.0, 420.0, 173.0, 104.0, 76.0, 54.0, 27.0, 22.0, 12.0, 19.0, 11.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.072509765625, -0.07043743133544922, -0.06836509704589844, -0.06629276275634766, -0.06422042846679688, -0.062148094177246094, -0.06007575988769531, -0.05800342559814453, -0.05593109130859375, -0.05385875701904297, -0.05178642272949219, -0.049714088439941406, -0.047641754150390625, -0.045569419860839844, -0.04349708557128906, -0.04142475128173828, -0.0393524169921875, -0.03728008270263672, -0.03520774841308594, -0.033135414123535156, -0.031063079833984375, -0.028990745544433594, -0.026918411254882812, -0.02484607696533203, -0.02277374267578125, -0.02070140838623047, -0.018629074096679688, -0.016556739807128906, -0.014484405517578125, -0.012412071228027344, -0.010339736938476562, -0.008267402648925781, -0.006195068359375, -0.004122734069824219, -0.0020503997802734375, 2.193450927734375e-05, 0.002094268798828125, 0.004166603088378906, 0.0062389373779296875, 0.008311271667480469, 0.01038360595703125, 0.012455940246582031, 0.014528274536132812, 0.016600608825683594, 0.018672943115234375, 0.020745277404785156, 0.022817611694335938, 0.02488994598388672, 0.0269622802734375, 0.02903461456298828, 0.031106948852539062, 0.033179283142089844, 0.035251617431640625, 0.037323951721191406, 0.03939628601074219, 0.04146862030029297, 0.04354095458984375, 0.04561328887939453, 0.04768562316894531, 0.049757957458496094, 0.051830291748046875, 0.053902626037597656, 0.05597496032714844, 0.05804729461669922, 0.06011962890625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 16.0, 53.0, 187.0, 333.0, 257.0, 111.0, 35.0, 10.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001603191951289773, -0.0013987160054966807, -0.0011942400597035885, -0.000989764230325818, -0.0007852882845327258, -0.0005808123387396336, -0.00037633650936186314, -0.00017186056356877089, 3.2615382224321365e-05, 0.00023709129891358316, 0.00044156721560284495, 0.0006460431031882763, 0.0008505190489813685, 0.0010549949947744608, 0.0012594708241522312, 0.0014639467699453235, 0.0016684227157384157, 0.001872898661531508, 0.0020773746073246002, 0.0022818504367023706, 0.002486326266080141, 0.002690802328288555, 0.0028952781576663256, 0.003099753987044096, 0.00330423004925251, 0.0035087058786302805, 0.0037131819408386946, 0.003917657770216465, 0.004122133832424879, 0.004326609894633293, 0.00453108549118042, 0.004735561553388834, 0.004940037615597248, 0.005144513677805662, 0.005348989274352789, 0.005553465336561203, 0.005757941398769617, 0.005962417460978031, 0.006166893057525158, 0.006371369119733572, 0.006575845181941986, 0.0067803212441504, 0.006984796840697527, 0.007189272902905941, 0.007393748965114355, 0.007598225027322769, 0.007802700623869896, 0.008007176220417023, 0.00821165181696415, 0.008416127413511276, 0.008620603941380978, 0.008825079537928104, 0.009029555134475231, 0.009234031662344933, 0.00943850725889206, 0.009642982855439186, 0.009847459383308887, 0.010051934979856014, 0.010256411507725716, 0.010460887104272842, 0.01066536270081997, 0.01086983922868967, 0.011074314825236797, 0.011278790421783924, 0.011483266949653625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 5.0, 8.0, 7.0, 8.0, 11.0, 14.0, 17.0, 22.0, 37.0, 26.0, 23.0, 27.0, 35.0, 48.0, 49.0, 51.0, 60.0, 52.0, 53.0, 57.0, 57.0, 39.0, 43.0, 39.0, 36.0, 40.0, 20.0, 29.0, 13.0, 13.0, 18.0, 8.0, 8.0, 7.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.002217233180999756, -0.0021609943360090256, -0.0021047554910182953, -0.002048516646027565, -0.0019922778010368347, -0.0019360389560461044, -0.0018798001110553741, -0.0018235612660646439, -0.0017673224210739136, -0.0017110835760831833, -0.001654844731092453, -0.0015986058861017227, -0.0015423670411109924, -0.0014861281961202621, -0.0014298893511295319, -0.0013736505061388016, -0.0013174116611480713, -0.001261172816157341, -0.0012049339711666107, -0.0011486951261758804, -0.0010924562811851501, -0.0010362174361944199, -0.0009799785912036896, -0.0009237397462129593, -0.000867500901222229, -0.0008112620562314987, -0.0007550232112407684, -0.0006987843662500381, -0.0006425455212593079, -0.0005863066762685776, -0.0005300678312778473, -0.000473828986287117, -0.0004175901412963867, -0.00036135129630565643, -0.00030511245131492615, -0.00024887360632419586, -0.00019263476133346558, -0.0001363959163427353, -8.0157071352005e-05, -2.391822636127472e-05, 3.2320618629455566e-05, 8.855946362018585e-05, 0.00014479830861091614, 0.00020103715360164642, 0.0002572759985923767, 0.000313514843583107, 0.0003697536885738373, 0.00042599253356456757, 0.00048223137855529785, 0.0005384702235460281, 0.0005947090685367584, 0.0006509479135274887, 0.000707186758518219, 0.0007634256035089493, 0.0008196644484996796, 0.0008759032934904099, 0.0009321421384811401, 0.0009883809834718704, 0.0010446198284626007, 0.001100858673453331, 0.0011570975184440613, 0.0012133363634347916, 0.0012695752084255219, 0.0013258140534162521, 0.0013820528984069824]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 2.0, 8.0, 14.0, 17.0, 17.0, 16.0, 20.0, 19.0, 24.0, 32.0, 40.0, 35.0, 41.0, 41.0, 56.0, 37.0, 37.0, 45.0, 44.0, 40.0, 40.0, 40.0, 39.0, 35.0, 36.0, 29.0, 23.0, 30.0, 19.0, 19.0, 13.0, 13.0, 10.0, 8.0, 11.0, 10.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.159423828125, -4.97900390625, -4.798583984375, -4.6181640625, -4.437744140625, -4.25732421875, -4.076904296875, -3.896484375, -3.716064453125, -3.53564453125, -3.355224609375, -3.1748046875, -2.994384765625, -2.81396484375, -2.633544921875, -2.453125, -2.272705078125, -2.09228515625, -1.911865234375, -1.7314453125, -1.551025390625, -1.37060546875, -1.190185546875, -1.009765625, -0.829345703125, -0.64892578125, -0.468505859375, -0.2880859375, -0.107666015625, 0.07275390625, 0.253173828125, 0.43359375, 0.614013671875, 0.79443359375, 0.974853515625, 1.1552734375, 1.335693359375, 1.51611328125, 1.696533203125, 1.876953125, 2.057373046875, 2.23779296875, 2.418212890625, 2.5986328125, 2.779052734375, 2.95947265625, 3.139892578125, 3.3203125, 3.500732421875, 3.68115234375, 3.861572265625, 4.0419921875, 4.222412109375, 4.40283203125, 4.583251953125, 4.763671875, 4.944091796875, 5.12451171875, 5.304931640625, 5.4853515625, 5.665771484375, 5.84619140625, 6.026611328125, 6.20703125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 15.0, 20.0, 22.0, 35.0, 52.0, 102.0, 154.0, 211.0, 393.0, 586.0, 1052.0, 1878.0, 3480.0, 6715.0, 13717.0, 30765.0, 80686.0, 254838.0, 423713.0, 141292.0, 48415.0, 20131.0, 9552.0, 4809.0, 2470.0, 1419.0, 777.0, 444.0, 265.0, 183.0, 130.0, 93.0, 61.0, 31.0, 16.0, 11.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.99505615234375, -4.8182373046875, -4.64141845703125, -4.464599609375, -4.28778076171875, -4.1109619140625, -3.93414306640625, -3.75732421875, -3.58050537109375, -3.4036865234375, -3.22686767578125, -3.050048828125, -2.87322998046875, -2.6964111328125, -2.51959228515625, -2.3427734375, -2.16595458984375, -1.9891357421875, -1.81231689453125, -1.635498046875, -1.45867919921875, -1.2818603515625, -1.10504150390625, -0.92822265625, -0.75140380859375, -0.5745849609375, -0.39776611328125, -0.220947265625, -0.04412841796875, 0.1326904296875, 0.30950927734375, 0.486328125, 0.66314697265625, 0.8399658203125, 1.01678466796875, 1.193603515625, 1.37042236328125, 1.5472412109375, 1.72406005859375, 1.90087890625, 2.07769775390625, 2.2545166015625, 2.43133544921875, 2.608154296875, 2.78497314453125, 2.9617919921875, 3.13861083984375, 3.3154296875, 3.49224853515625, 3.6690673828125, 3.84588623046875, 4.022705078125, 4.19952392578125, 4.3763427734375, 4.55316162109375, 4.72998046875, 4.90679931640625, 5.0836181640625, 5.26043701171875, 5.437255859375, 5.61407470703125, 5.7908935546875, 5.96771240234375, 6.14453125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 0.0, 10.0, 6.0, 12.0, 10.0, 9.0, 19.0, 16.0, 25.0, 23.0, 28.0, 41.0, 37.0, 37.0, 70.0, 58.0, 108.0, 257.0, 1546.0, 234.0, 107.0, 69.0, 58.0, 45.0, 36.0, 34.0, 28.0, 25.0, 18.0, 17.0, 14.0, 15.0, 10.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.59375, -24.9091796875, -24.224609375, -23.5400390625, -22.85546875, -22.1708984375, -21.486328125, -20.8017578125, -20.1171875, -19.4326171875, -18.748046875, -18.0634765625, -17.37890625, -16.6943359375, -16.009765625, -15.3251953125, -14.640625, -13.9560546875, -13.271484375, -12.5869140625, -11.90234375, -11.2177734375, -10.533203125, -9.8486328125, -9.1640625, -8.4794921875, -7.794921875, -7.1103515625, -6.42578125, -5.7412109375, -5.056640625, -4.3720703125, -3.6875, -3.0029296875, -2.318359375, -1.6337890625, -0.94921875, -0.2646484375, 0.419921875, 1.1044921875, 1.7890625, 2.4736328125, 3.158203125, 3.8427734375, 4.52734375, 5.2119140625, 5.896484375, 6.5810546875, 7.265625, 7.9501953125, 8.634765625, 9.3193359375, 10.00390625, 10.6884765625, 11.373046875, 12.0576171875, 12.7421875, 13.4267578125, 14.111328125, 14.7958984375, 15.48046875, 16.1650390625, 16.849609375, 17.5341796875, 18.21875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 5.0, 17.0, 15.0, 24.0, 24.0, 47.0, 68.0, 103.0, 175.0, 307.0, 534.0, 1955.0, 3032211.0, 108013.0, 1024.0, 462.0, 251.0, 157.0, 110.0, 63.0, 44.0, 25.0, 28.0, 9.0, 8.0, 5.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.125, -73.57421875, -71.0234375, -68.47265625, -65.921875, -63.37109375, -60.8203125, -58.26953125, -55.71875, -53.16796875, -50.6171875, -48.06640625, -45.515625, -42.96484375, -40.4140625, -37.86328125, -35.3125, -32.76171875, -30.2109375, -27.66015625, -25.109375, -22.55859375, -20.0078125, -17.45703125, -14.90625, -12.35546875, -9.8046875, -7.25390625, -4.703125, -2.15234375, 0.3984375, 2.94921875, 5.5, 8.05078125, 10.6015625, 13.15234375, 15.703125, 18.25390625, 20.8046875, 23.35546875, 25.90625, 28.45703125, 31.0078125, 33.55859375, 36.109375, 38.66015625, 41.2109375, 43.76171875, 46.3125, 48.86328125, 51.4140625, 53.96484375, 56.515625, 59.06640625, 61.6171875, 64.16796875, 66.71875, 69.26953125, 71.8203125, 74.37109375, 76.921875, 79.47265625, 82.0234375, 84.57421875, 87.125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 199.0, 744.0, 71.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-345.2974853515625, -339.2752990722656, -333.2530822753906, -327.23089599609375, -321.20867919921875, -315.1864929199219, -309.164306640625, -303.14208984375, -297.1199035644531, -291.09771728515625, -285.07550048828125, -279.0533142089844, -273.0310974121094, -267.0089111328125, -260.9866943359375, -254.96450805664062, -248.94229125976562, -242.9200897216797, -236.89788818359375, -230.87570190429688, -224.85350036621094, -218.831298828125, -212.80909729003906, -206.78689575195312, -200.76470947265625, -194.7425079345703, -188.72030639648438, -182.6981201171875, -176.67591857910156, -170.65371704101562, -164.6315155029297, -158.60931396484375, -152.58712768554688, -146.56492614746094, -140.542724609375, -134.52053833007812, -128.4983367919922, -122.47613525390625, -116.45393371582031, -110.43173217773438, -104.40953063964844, -98.3873291015625, -92.3651351928711, -86.34293365478516, -80.32073211669922, -74.29853820800781, -68.27633666992188, -62.25413513183594, -56.23193359375, -50.20973587036133, -44.18753433227539, -38.16533660888672, -32.14313507080078, -26.12093734741211, -20.098739624023438, -14.0765380859375, -8.054340362548828, -2.0321412086486816, 3.990057945251465, 10.012256622314453, 16.034456253051758, 22.056655883789062, 28.078853607177734, 34.10105514526367, 40.123252868652344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 21.0, 16.0, 21.0, 19.0, 22.0, 29.0, 37.0, 28.0, 38.0, 32.0, 39.0, 31.0, 42.0, 32.0, 39.0, 48.0, 47.0, 36.0, 36.0, 28.0, 41.0, 27.0, 35.0, 25.0, 18.0, 32.0, 22.0, 18.0, 15.0, 19.0, 17.0, 10.0, 11.0, 5.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.002620697021484, -44.465362548828125, -42.92810821533203, -41.39085006713867, -39.85359191894531, -38.31633377075195, -36.779075622558594, -35.2418212890625, -33.70456314086914, -32.16730499267578, -30.630048751831055, -29.092792510986328, -27.55553436279297, -26.01827621459961, -24.481019973754883, -22.943763732910156, -21.406505584716797, -19.869247436523438, -18.33199119567871, -16.794734954833984, -15.257476806640625, -13.720219612121582, -12.182962417602539, -10.645705223083496, -9.108448028564453, -7.57119083404541, -6.033933639526367, -4.496676445007324, -2.9594192504882812, -1.4221620559692383, 0.11509513854980469, 1.6523523330688477, 3.1896133422851562, 4.726870536804199, 6.264127731323242, 7.801384925842285, 9.338642120361328, 10.875899314880371, 12.413156509399414, 13.950413703918457, 15.4876708984375, 17.02492904663086, 18.562185287475586, 20.099441528320312, 21.636699676513672, 23.17395782470703, 24.711214065551758, 26.248470306396484, 27.785728454589844, 29.322986602783203, 30.86024284362793, 32.397499084472656, 33.934757232666016, 35.472015380859375, 37.00926971435547, 38.54652786254883, 40.08378601074219, 41.62104415893555, 43.158302307128906, 44.695556640625, 46.23281478881836, 47.77007293701172, 49.30732727050781, 50.84458541870117, 52.38184356689453]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 4.0, 9.0, 15.0, 7.0, 19.0, 16.0, 18.0, 20.0, 19.0, 17.0, 31.0, 39.0, 46.0, 45.0, 45.0, 41.0, 35.0, 42.0, 46.0, 40.0, 37.0, 45.0, 30.0, 35.0, 41.0, 31.0, 33.0, 32.0, 21.0, 20.0, 22.0, 14.0, 11.0, 9.0, 10.0, 5.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.17779541015625, -4.9884033203125, -4.79901123046875, -4.609619140625, -4.42022705078125, -4.2308349609375, -4.04144287109375, -3.85205078125, -3.66265869140625, -3.4732666015625, -3.28387451171875, -3.094482421875, -2.90509033203125, -2.7156982421875, -2.52630615234375, -2.3369140625, -2.14752197265625, -1.9581298828125, -1.76873779296875, -1.579345703125, -1.38995361328125, -1.2005615234375, -1.01116943359375, -0.82177734375, -0.63238525390625, -0.4429931640625, -0.25360107421875, -0.064208984375, 0.12518310546875, 0.3145751953125, 0.50396728515625, 0.693359375, 0.88275146484375, 1.0721435546875, 1.26153564453125, 1.450927734375, 1.64031982421875, 1.8297119140625, 2.01910400390625, 2.20849609375, 2.39788818359375, 2.5872802734375, 2.77667236328125, 2.966064453125, 3.15545654296875, 3.3448486328125, 3.53424072265625, 3.7236328125, 3.91302490234375, 4.1024169921875, 4.29180908203125, 4.481201171875, 4.67059326171875, 4.8599853515625, 5.04937744140625, 5.23876953125, 5.42816162109375, 5.6175537109375, 5.80694580078125, 5.996337890625, 6.18572998046875, 6.3751220703125, 6.56451416015625, 6.75390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 7.0, 8.0, 11.0, 12.0, 14.0, 28.0, 19.0, 29.0, 52.0, 82.0, 129.0, 183.0, 390.0, 872.0, 2853.0, 14120.0, 135912.0, 1747612.0, 2082852.0, 185965.0, 17739.0, 3355.0, 919.0, 436.0, 223.0, 147.0, 75.0, 56.0, 42.0, 22.0, 19.0, 16.0, 16.0, 17.0, 11.0, 6.0, 4.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7578125, -12.2681884765625, -11.778564453125, -11.2889404296875, -10.79931640625, -10.3096923828125, -9.820068359375, -9.3304443359375, -8.8408203125, -8.3511962890625, -7.861572265625, -7.3719482421875, -6.88232421875, -6.3927001953125, -5.903076171875, -5.4134521484375, -4.923828125, -4.4342041015625, -3.944580078125, -3.4549560546875, -2.96533203125, -2.4757080078125, -1.986083984375, -1.4964599609375, -1.0068359375, -0.5172119140625, -0.027587890625, 0.4620361328125, 0.95166015625, 1.4412841796875, 1.930908203125, 2.4205322265625, 2.91015625, 3.3997802734375, 3.889404296875, 4.3790283203125, 4.86865234375, 5.3582763671875, 5.847900390625, 6.3375244140625, 6.8271484375, 7.3167724609375, 7.806396484375, 8.2960205078125, 8.78564453125, 9.2752685546875, 9.764892578125, 10.2545166015625, 10.744140625, 11.2337646484375, 11.723388671875, 12.2130126953125, 12.70263671875, 13.1922607421875, 13.681884765625, 14.1715087890625, 14.6611328125, 15.1507568359375, 15.640380859375, 16.1300048828125, 16.61962890625, 17.1092529296875, 17.598876953125, 18.0885009765625, 18.578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 16.0, 21.0, 33.0, 50.0, 59.0, 97.0, 124.0, 223.0, 352.0, 534.0, 566.0, 559.0, 461.0, 318.0, 222.0, 127.0, 109.0, 49.0, 50.0, 28.0, 19.0, 20.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.40625, -20.86865234375, -20.3310546875, -19.79345703125, -19.255859375, -18.71826171875, -18.1806640625, -17.64306640625, -17.10546875, -16.56787109375, -16.0302734375, -15.49267578125, -14.955078125, -14.41748046875, -13.8798828125, -13.34228515625, -12.8046875, -12.26708984375, -11.7294921875, -11.19189453125, -10.654296875, -10.11669921875, -9.5791015625, -9.04150390625, -8.50390625, -7.96630859375, -7.4287109375, -6.89111328125, -6.353515625, -5.81591796875, -5.2783203125, -4.74072265625, -4.203125, -3.66552734375, -3.1279296875, -2.59033203125, -2.052734375, -1.51513671875, -0.9775390625, -0.43994140625, 0.09765625, 0.63525390625, 1.1728515625, 1.71044921875, 2.248046875, 2.78564453125, 3.3232421875, 3.86083984375, 4.3984375, 4.93603515625, 5.4736328125, 6.01123046875, 6.548828125, 7.08642578125, 7.6240234375, 8.16162109375, 8.69921875, 9.23681640625, 9.7744140625, 10.31201171875, 10.849609375, 11.38720703125, 11.9248046875, 12.46240234375, 13.0]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 13.0, 17.0, 18.0, 35.0, 40.0, 73.0, 102.0, 129.0, 244.0, 328.0, 603.0, 2183.0, 372815.0, 3805280.0, 10419.0, 838.0, 386.0, 240.0, 162.0, 112.0, 89.0, 60.0, 37.0, 23.0, 14.0, 8.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.53125, -44.52685546875, -42.5224609375, -40.51806640625, -38.513671875, -36.50927734375, -34.5048828125, -32.50048828125, -30.49609375, -28.49169921875, -26.4873046875, -24.48291015625, -22.478515625, -20.47412109375, -18.4697265625, -16.46533203125, -14.4609375, -12.45654296875, -10.4521484375, -8.44775390625, -6.443359375, -4.43896484375, -2.4345703125, -0.43017578125, 1.57421875, 3.57861328125, 5.5830078125, 7.58740234375, 9.591796875, 11.59619140625, 13.6005859375, 15.60498046875, 17.609375, 19.61376953125, 21.6181640625, 23.62255859375, 25.626953125, 27.63134765625, 29.6357421875, 31.64013671875, 33.64453125, 35.64892578125, 37.6533203125, 39.65771484375, 41.662109375, 43.66650390625, 45.6708984375, 47.67529296875, 49.6796875, 51.68408203125, 53.6884765625, 55.69287109375, 57.697265625, 59.70166015625, 61.7060546875, 63.71044921875, 65.71484375, 67.71923828125, 69.7236328125, 71.72802734375, 73.732421875, 75.73681640625, 77.7412109375, 79.74560546875, 81.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 13.0, 40.0, 59.0, 98.0, 120.0, 156.0, 175.0, 129.0, 82.0, 57.0, 36.0, 19.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-93.42448425292969, -91.0718002319336, -88.71910858154297, -86.36642456054688, -84.01374053955078, -81.66105651855469, -79.30836486816406, -76.95568084716797, -74.60299682617188, -72.25031280517578, -69.89762115478516, -67.54493713378906, -65.19225311279297, -62.83956527709961, -60.48687744140625, -58.134193420410156, -55.7815055847168, -53.42881774902344, -51.076133728027344, -48.723445892333984, -46.37076187133789, -44.01807403564453, -41.66539001464844, -39.31270217895508, -36.96001434326172, -34.60732650756836, -32.254642486572266, -29.901954650878906, -27.549270629882812, -25.196582794189453, -22.843896865844727, -20.4912109375, -18.138526916503906, -15.78584098815918, -13.433155059814453, -11.08046817779541, -8.727782249450684, -6.375096321105957, -4.022409439086914, -1.6697235107421875, 0.6829624176025391, 3.0356485843658447, 5.38833475112915, 7.741021156311035, 10.093707084655762, 12.446393013000488, 14.799079895019531, 17.151765823364258, 19.504451751708984, 21.85713768005371, 24.209823608398438, 26.562511444091797, 28.91519546508789, 31.26788330078125, 33.620567321777344, 35.9732551574707, 38.32594299316406, 40.67863082885742, 43.031314849853516, 45.384002685546875, 47.73668670654297, 50.08937454223633, 52.44206237792969, 54.79474639892578, 57.147430419921875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 1.0, 6.0, 3.0, 10.0, 6.0, 8.0, 11.0, 9.0, 20.0, 10.0, 20.0, 17.0, 22.0, 27.0, 23.0, 32.0, 37.0, 35.0, 38.0, 40.0, 40.0, 35.0, 45.0, 38.0, 36.0, 35.0, 47.0, 29.0, 38.0, 39.0, 36.0, 27.0, 26.0, 23.0, 21.0, 17.0, 16.0, 18.0, 9.0, 13.0, 6.0, 8.0, 6.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.076873779296875, -40.76036071777344, -39.44384765625, -38.12733459472656, -36.810821533203125, -35.49431228637695, -34.177799224853516, -32.86128616333008, -31.54477310180664, -30.228260040283203, -28.911746978759766, -27.59523582458496, -26.278722763061523, -24.962209701538086, -23.64569854736328, -22.329185485839844, -21.012672424316406, -19.69615936279297, -18.37964630126953, -17.063135147094727, -15.746622085571289, -14.430109024047852, -13.11359691619873, -11.79708480834961, -10.480571746826172, -9.164058685302734, -7.847546577453613, -6.531033992767334, -5.214521408081055, -3.8980088233947754, -2.581496238708496, -1.264984130859375, 0.0515289306640625, 1.3680415153503418, 2.684554100036621, 4.0010666847229, 5.31757926940918, 6.634091854095459, 7.950604438781738, 9.26711654663086, 10.583629608154297, 11.900142669677734, 13.216654777526855, 14.533166885375977, 15.849679946899414, 17.16619300842285, 18.482704162597656, 19.799217224121094, 21.11573028564453, 22.43224334716797, 23.748756408691406, 25.06526756286621, 26.38178062438965, 27.698293685913086, 29.01480484008789, 30.331317901611328, 31.647830963134766, 32.9643440246582, 34.28085708618164, 35.59737014770508, 36.91387939453125, 38.23039245605469, 39.546905517578125, 40.86341857910156, 42.179931640625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 11.0, 11.0, 19.0, 13.0, 13.0, 32.0, 18.0, 24.0, 22.0, 29.0, 25.0, 35.0, 43.0, 37.0, 35.0, 50.0, 37.0, 46.0, 44.0, 33.0, 45.0, 22.0, 31.0, 29.0, 32.0, 33.0, 30.0, 30.0, 15.0, 19.0, 17.0, 18.0, 15.0, 11.0, 6.0, 5.0, 9.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.43359375, -5.26470947265625, -5.0958251953125, -4.92694091796875, -4.758056640625, -4.58917236328125, -4.4202880859375, -4.25140380859375, -4.08251953125, -3.91363525390625, -3.7447509765625, -3.57586669921875, -3.406982421875, -3.23809814453125, -3.0692138671875, -2.90032958984375, -2.7314453125, -2.56256103515625, -2.3936767578125, -2.22479248046875, -2.055908203125, -1.88702392578125, -1.7181396484375, -1.54925537109375, -1.38037109375, -1.21148681640625, -1.0426025390625, -0.87371826171875, -0.704833984375, -0.53594970703125, -0.3670654296875, -0.19818115234375, -0.029296875, 0.13958740234375, 0.3084716796875, 0.47735595703125, 0.646240234375, 0.81512451171875, 0.9840087890625, 1.15289306640625, 1.32177734375, 1.49066162109375, 1.6595458984375, 1.82843017578125, 1.997314453125, 2.16619873046875, 2.3350830078125, 2.50396728515625, 2.6728515625, 2.84173583984375, 3.0106201171875, 3.17950439453125, 3.348388671875, 3.51727294921875, 3.6861572265625, 3.85504150390625, 4.02392578125, 4.19281005859375, 4.3616943359375, 4.53057861328125, 4.699462890625, 4.86834716796875, 5.0372314453125, 5.20611572265625, 5.375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 10.0, 13.0, 27.0, 42.0, 52.0, 83.0, 109.0, 125.0, 228.0, 363.0, 538.0, 728.0, 1166.0, 1895.0, 2968.0, 4621.0, 7268.0, 11448.0, 18275.0, 29799.0, 48158.0, 77136.0, 118020.0, 159589.0, 172111.0, 139049.0, 95036.0, 60139.0, 37151.0, 23030.0, 14302.0, 8997.0, 5684.0, 3611.0, 2358.0, 1544.0, 931.0, 622.0, 435.0, 305.0, 184.0, 119.0, 83.0, 60.0, 41.0, 30.0, 22.0, 15.0, 12.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5712890625, -0.5541000366210938, -0.5369110107421875, -0.5197219848632812, -0.502532958984375, -0.48534393310546875, -0.4681549072265625, -0.45096588134765625, -0.43377685546875, -0.41658782958984375, -0.3993988037109375, -0.38220977783203125, -0.365020751953125, -0.34783172607421875, -0.3306427001953125, -0.31345367431640625, -0.2962646484375, -0.27907562255859375, -0.2618865966796875, -0.24469757080078125, -0.227508544921875, -0.21031951904296875, -0.1931304931640625, -0.17594146728515625, -0.15875244140625, -0.14156341552734375, -0.1243743896484375, -0.10718536376953125, -0.089996337890625, -0.07280731201171875, -0.0556182861328125, -0.03842926025390625, -0.021240234375, -0.00405120849609375, 0.0131378173828125, 0.03032684326171875, 0.047515869140625, 0.06470489501953125, 0.0818939208984375, 0.09908294677734375, 0.11627197265625, 0.13346099853515625, 0.1506500244140625, 0.16783905029296875, 0.185028076171875, 0.20221710205078125, 0.2194061279296875, 0.23659515380859375, 0.2537841796875, 0.27097320556640625, 0.2881622314453125, 0.30535125732421875, 0.322540283203125, 0.33972930908203125, 0.3569183349609375, 0.37410736083984375, 0.39129638671875, 0.40848541259765625, 0.4256744384765625, 0.44286346435546875, 0.460052490234375, 0.47724151611328125, 0.4944305419921875, 0.5116195678710938, 0.52880859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 11.0, 15.0, 12.0, 18.0, 22.0, 17.0, 25.0, 35.0, 35.0, 31.0, 42.0, 39.0, 44.0, 36.0, 36.0, 45.0, 1057.0, 43.0, 39.0, 42.0, 44.0, 43.0, 31.0, 30.0, 22.0, 26.0, 20.0, 20.0, 21.0, 18.0, 14.0, 8.0, 9.0, 11.0, 8.0, 5.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.555511474609375, -3.44110107421875, -3.326690673828125, -3.2122802734375, -3.097869873046875, -2.98345947265625, -2.869049072265625, -2.754638671875, -2.640228271484375, -2.52581787109375, -2.411407470703125, -2.2969970703125, -2.182586669921875, -2.06817626953125, -1.953765869140625, -1.83935546875, -1.724945068359375, -1.61053466796875, -1.496124267578125, -1.3817138671875, -1.267303466796875, -1.15289306640625, -1.038482666015625, -0.924072265625, -0.809661865234375, -0.69525146484375, -0.580841064453125, -0.4664306640625, -0.352020263671875, -0.23760986328125, -0.123199462890625, -0.0087890625, 0.105621337890625, 0.22003173828125, 0.334442138671875, 0.4488525390625, 0.563262939453125, 0.67767333984375, 0.792083740234375, 0.906494140625, 1.020904541015625, 1.13531494140625, 1.249725341796875, 1.3641357421875, 1.478546142578125, 1.59295654296875, 1.707366943359375, 1.82177734375, 1.936187744140625, 2.05059814453125, 2.165008544921875, 2.2794189453125, 2.393829345703125, 2.50823974609375, 2.622650146484375, 2.737060546875, 2.851470947265625, 2.96588134765625, 3.080291748046875, 3.1947021484375, 3.309112548828125, 3.42352294921875, 3.537933349609375, 3.65234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 6.0, 9.0, 9.0, 14.0, 21.0, 33.0, 47.0, 61.0, 99.0, 163.0, 193.0, 332.0, 504.0, 723.0, 1060.0, 1640.0, 2583.0, 4002.0, 6118.0, 9544.0, 14664.0, 23130.0, 35670.0, 53972.0, 78813.0, 109237.0, 135928.0, 1191802.0, 127457.0, 98125.0, 68871.0, 46557.0, 30373.0, 19593.0, 12634.0, 7973.0, 5345.0, 3352.0, 2156.0, 1480.0, 999.0, 595.0, 406.0, 275.0, 206.0, 122.0, 73.0, 58.0, 38.0, 24.0, 11.0, 12.0, 7.0, 11.0, 7.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.39794921875, -0.3856391906738281, -0.37332916259765625, -0.3610191345214844, -0.3487091064453125, -0.3363990783691406, -0.32408905029296875, -0.3117790222167969, -0.299468994140625, -0.2871589660644531, -0.27484893798828125, -0.2625389099121094, -0.2502288818359375, -0.23791885375976562, -0.22560882568359375, -0.21329879760742188, -0.20098876953125, -0.18867874145507812, -0.17636871337890625, -0.16405868530273438, -0.1517486572265625, -0.13943862915039062, -0.12712860107421875, -0.11481857299804688, -0.102508544921875, -0.09019851684570312, -0.07788848876953125, -0.06557846069335938, -0.0532684326171875, -0.040958404541015625, -0.02864837646484375, -0.016338348388671875, -0.0040283203125, 0.008281707763671875, 0.02059173583984375, 0.032901763916015625, 0.0452117919921875, 0.057521820068359375, 0.06983184814453125, 0.08214187622070312, 0.094451904296875, 0.10676193237304688, 0.11907196044921875, 0.13138198852539062, 0.1436920166015625, 0.15600204467773438, 0.16831207275390625, 0.18062210083007812, 0.19293212890625, 0.20524215698242188, 0.21755218505859375, 0.22986221313476562, 0.2421722412109375, 0.2544822692871094, 0.26679229736328125, 0.2791023254394531, 0.291412353515625, 0.3037223815917969, 0.31603240966796875, 0.3283424377441406, 0.3406524658203125, 0.3529624938964844, 0.36527252197265625, 0.3775825500488281, 0.389892578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 11.0, 13.0, 15.0, 19.0, 23.0, 23.0, 32.0, 24.0, 42.0, 55.0, 66.0, 75.0, 73.0, 77.0, 75.0, 62.0, 53.0, 51.0, 40.0, 26.0, 17.0, 20.0, 25.0, 17.0, 9.0, 9.0, 8.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.005336761474609375, -0.0051937103271484375, -0.0050506591796875, -0.0049076080322265625, -0.004764556884765625, -0.0046215057373046875, -0.00447845458984375, -0.0043354034423828125, -0.004192352294921875, -0.0040493011474609375, -0.00390625, -0.0037631988525390625, -0.003620147705078125, -0.0034770965576171875, -0.00333404541015625, -0.0031909942626953125, -0.003047943115234375, -0.0029048919677734375, -0.0027618408203125, -0.0026187896728515625, -0.002475738525390625, -0.0023326873779296875, -0.00218963623046875, -0.0020465850830078125, -0.001903533935546875, -0.0017604827880859375, -0.001617431640625, -0.0014743804931640625, -0.001331329345703125, -0.0011882781982421875, -0.00104522705078125, -0.0009021759033203125, -0.000759124755859375, -0.0006160736083984375, -0.0004730224609375, -0.0003299713134765625, -0.000186920166015625, -4.38690185546875e-05, 9.918212890625e-05, 0.0002422332763671875, 0.000385284423828125, 0.0005283355712890625, 0.00067138671875, 0.0008144378662109375, 0.000957489013671875, 0.0011005401611328125, 0.00124359130859375, 0.0013866424560546875, 0.001529693603515625, 0.0016727447509765625, 0.0018157958984375, 0.0019588470458984375, 0.002101898193359375, 0.0022449493408203125, 0.00238800048828125, 0.0025310516357421875, 0.002674102783203125, 0.0028171539306640625, 0.002960205078125, 0.0031032562255859375, 0.003246307373046875, 0.0033893585205078125, 0.00353240966796875, 0.0036754608154296875, 0.003818511962890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 14.0, 11.0, 8.0, 17.0, 19.0, 17.0, 30.0, 44.0, 62.0, 70.0, 118.0, 213.0, 592.0, 6382.0, 1035193.0, 4530.0, 574.0, 200.0, 127.0, 81.0, 65.0, 39.0, 21.0, 29.0, 20.0, 15.0, 12.0, 12.0, 4.0, 2.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0865478515625, -0.08339691162109375, -0.0802459716796875, -0.07709503173828125, -0.073944091796875, -0.07079315185546875, -0.0676422119140625, -0.06449127197265625, -0.06134033203125, -0.05818939208984375, -0.0550384521484375, -0.05188751220703125, -0.048736572265625, -0.04558563232421875, -0.0424346923828125, -0.03928375244140625, -0.0361328125, -0.03298187255859375, -0.0298309326171875, -0.02667999267578125, -0.023529052734375, -0.02037811279296875, -0.0172271728515625, -0.01407623291015625, -0.01092529296875, -0.00777435302734375, -0.0046234130859375, -0.00147247314453125, 0.001678466796875, 0.00482940673828125, 0.0079803466796875, 0.01113128662109375, 0.0142822265625, 0.01743316650390625, 0.0205841064453125, 0.02373504638671875, 0.026885986328125, 0.03003692626953125, 0.0331878662109375, 0.03633880615234375, 0.03948974609375, 0.04264068603515625, 0.0457916259765625, 0.04894256591796875, 0.052093505859375, 0.05524444580078125, 0.0583953857421875, 0.06154632568359375, 0.064697265625, 0.06784820556640625, 0.0709991455078125, 0.07415008544921875, 0.077301025390625, 0.08045196533203125, 0.0836029052734375, 0.08675384521484375, 0.08990478515625, 0.09305572509765625, 0.0962066650390625, 0.09935760498046875, 0.102508544921875, 0.10565948486328125, 0.1088104248046875, 0.11196136474609375, 0.1151123046875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 43.0, 840.0, 126.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022291839122772217, -0.0013804666232317686, -0.0005317492177709937, 0.0003169681876897812, 0.0011656854767352343, 0.0020144027657806873, 0.002863120287656784, 0.0037118373438715935, 0.00456055486574769, 0.005409272387623787, 0.006257989443838596, 0.007106706965714693, 0.00795542448759079, 0.0088041415438056, 0.009652858600020409, 0.010501576587557793, 0.011350293643772602, 0.012199010699987411, 0.013047728687524796, 0.013896445743739605, 0.014745162799954414, 0.015593880787491798, 0.016442596912384033, 0.017291314899921417, 0.0181400328874588, 0.018988750874996185, 0.01983746699988842, 0.020686184987425804, 0.021534902974963188, 0.022383619099855423, 0.023232337087392807, 0.02408105507493019, 0.024929771199822426, 0.02577848918735981, 0.026627205312252045, 0.02747592329978943, 0.028324641287326813, 0.029173357412219048, 0.03002207539975643, 0.030870791524648666, 0.03171950951218605, 0.032568227499723434, 0.03341694548726082, 0.034265659749507904, 0.03511437773704529, 0.03596309572458267, 0.036811813712120056, 0.03766053169965744, 0.038509249687194824, 0.03935796767473221, 0.04020668566226959, 0.041055403649806976, 0.04190411791205406, 0.042752835899591446, 0.04360155388712883, 0.044450271874666214, 0.0452989861369133, 0.046147704124450684, 0.04699642211198807, 0.04784514009952545, 0.04869385436177254, 0.04954257234930992, 0.050391290336847305, 0.05124000832438469, 0.05208872631192207]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 10.0, 7.0, 13.0, 15.0, 24.0, 23.0, 48.0, 51.0, 65.0, 59.0, 74.0, 73.0, 70.0, 75.0, 68.0, 71.0, 55.0, 56.0, 40.0, 32.0, 21.0, 20.0, 15.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00472414493560791, -0.004573778249323368, -0.004423411563038826, -0.004273044876754284, -0.004122678190469742, -0.0039723115041852, -0.0038219448179006577, -0.0036715781316161156, -0.0035212114453315735, -0.0033708447590470314, -0.0032204780727624893, -0.0030701113864779472, -0.002919744700193405, -0.002769378013908863, -0.002619011327624321, -0.002468644641339779, -0.002318277955055237, -0.0021679112687706947, -0.0020175445824861526, -0.0018671778962016106, -0.0017168112099170685, -0.0015664445236325264, -0.0014160778373479843, -0.0012657111510634422, -0.0011153444647789001, -0.0009649777784943581, -0.000814611092209816, -0.0006642444059252739, -0.0005138777196407318, -0.00036351103335618973, -0.00021314434707164764, -6.277766078710556e-05, 8.758902549743652e-05, 0.0002379557117819786, 0.0003883223980665207, 0.0005386890843510628, 0.0006890557706356049, 0.0008394224569201469, 0.000989789143204689, 0.0011401558294892311, 0.0012905225157737732, 0.0014408892020583153, 0.0015912558883428574, 0.0017416225746273994, 0.0018919892609119415, 0.0020423559471964836, 0.0021927226334810257, 0.0023430893197655678, 0.00249345600605011, 0.002643822692334652, 0.002794189378619194, 0.002944556064903736, 0.003094922751188278, 0.0032452894374728203, 0.0033956561237573624, 0.0035460228100419044, 0.0036963894963264465, 0.0038467561826109886, 0.003997122868895531, 0.004147489555180073, 0.004297856241464615, 0.004448222927749157, 0.004598589614033699, 0.004748956300318241, 0.004899322986602783]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 11.0, 11.0, 19.0, 13.0, 13.0, 32.0, 18.0, 24.0, 22.0, 28.0, 26.0, 35.0, 43.0, 37.0, 35.0, 50.0, 37.0, 46.0, 44.0, 33.0, 45.0, 22.0, 31.0, 29.0, 32.0, 33.0, 30.0, 30.0, 15.0, 19.0, 17.0, 18.0, 15.0, 11.0, 6.0, 5.0, 9.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.43359375, -5.26470947265625, -5.0958251953125, -4.92694091796875, -4.758056640625, -4.58917236328125, -4.4202880859375, -4.25140380859375, -4.08251953125, -3.91363525390625, -3.7447509765625, -3.57586669921875, -3.406982421875, -3.23809814453125, -3.0692138671875, -2.90032958984375, -2.7314453125, -2.56256103515625, -2.3936767578125, -2.22479248046875, -2.055908203125, -1.88702392578125, -1.7181396484375, -1.54925537109375, -1.38037109375, -1.21148681640625, -1.0426025390625, -0.87371826171875, -0.704833984375, -0.53594970703125, -0.3670654296875, -0.19818115234375, -0.029296875, 0.13958740234375, 0.3084716796875, 0.47735595703125, 0.646240234375, 0.81512451171875, 0.9840087890625, 1.15289306640625, 1.32177734375, 1.49066162109375, 1.6595458984375, 1.82843017578125, 1.997314453125, 2.16619873046875, 2.3350830078125, 2.50396728515625, 2.6728515625, 2.84173583984375, 3.0106201171875, 3.17950439453125, 3.348388671875, 3.51727294921875, 3.6861572265625, 3.85504150390625, 4.02392578125, 4.19281005859375, 4.3616943359375, 4.53057861328125, 4.699462890625, 4.86834716796875, 5.0372314453125, 5.20611572265625, 5.375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 11.0, 18.0, 16.0, 29.0, 42.0, 57.0, 68.0, 117.0, 205.0, 303.0, 537.0, 913.0, 2109.0, 4806.0, 12403.0, 36688.0, 118350.0, 431056.0, 307436.0, 88473.0, 27584.0, 9791.0, 3717.0, 1669.0, 883.0, 437.0, 296.0, 156.0, 112.0, 88.0, 51.0, 36.0, 24.0, 16.0, 14.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.07421875, -6.88238525390625, -6.6905517578125, -6.49871826171875, -6.306884765625, -6.11505126953125, -5.9232177734375, -5.73138427734375, -5.53955078125, -5.34771728515625, -5.1558837890625, -4.96405029296875, -4.772216796875, -4.58038330078125, -4.3885498046875, -4.19671630859375, -4.0048828125, -3.81304931640625, -3.6212158203125, -3.42938232421875, -3.237548828125, -3.04571533203125, -2.8538818359375, -2.66204833984375, -2.47021484375, -2.27838134765625, -2.0865478515625, -1.89471435546875, -1.702880859375, -1.51104736328125, -1.3192138671875, -1.12738037109375, -0.935546875, -0.74371337890625, -0.5518798828125, -0.36004638671875, -0.168212890625, 0.02362060546875, 0.2154541015625, 0.40728759765625, 0.59912109375, 0.79095458984375, 0.9827880859375, 1.17462158203125, 1.366455078125, 1.55828857421875, 1.7501220703125, 1.94195556640625, 2.1337890625, 2.32562255859375, 2.5174560546875, 2.70928955078125, 2.901123046875, 3.09295654296875, 3.2847900390625, 3.47662353515625, 3.66845703125, 3.86029052734375, 4.0521240234375, 4.24395751953125, 4.435791015625, 4.62762451171875, 4.8194580078125, 5.01129150390625, 5.203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 7.0, 10.0, 3.0, 12.0, 11.0, 10.0, 14.0, 21.0, 16.0, 26.0, 27.0, 27.0, 35.0, 30.0, 44.0, 38.0, 46.0, 70.0, 110.0, 308.0, 1505.0, 176.0, 73.0, 47.0, 46.0, 38.0, 32.0, 37.0, 27.0, 26.0, 21.0, 23.0, 23.0, 19.0, 14.0, 10.0, 9.0, 8.0, 5.0, 7.0, 8.0, 6.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.296875, -17.729248046875, -17.16162109375, -16.593994140625, -16.0263671875, -15.458740234375, -14.89111328125, -14.323486328125, -13.755859375, -13.188232421875, -12.62060546875, -12.052978515625, -11.4853515625, -10.917724609375, -10.35009765625, -9.782470703125, -9.21484375, -8.647216796875, -8.07958984375, -7.511962890625, -6.9443359375, -6.376708984375, -5.80908203125, -5.241455078125, -4.673828125, -4.106201171875, -3.53857421875, -2.970947265625, -2.4033203125, -1.835693359375, -1.26806640625, -0.700439453125, -0.1328125, 0.434814453125, 1.00244140625, 1.570068359375, 2.1376953125, 2.705322265625, 3.27294921875, 3.840576171875, 4.408203125, 4.975830078125, 5.54345703125, 6.111083984375, 6.6787109375, 7.246337890625, 7.81396484375, 8.381591796875, 8.94921875, 9.516845703125, 10.08447265625, 10.652099609375, 11.2197265625, 11.787353515625, 12.35498046875, 12.922607421875, 13.490234375, 14.057861328125, 14.62548828125, 15.193115234375, 15.7607421875, 16.328369140625, 16.89599609375, 17.463623046875, 18.03125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 13.0, 24.0, 31.0, 34.0, 65.0, 125.0, 183.0, 356.0, 545.0, 3392.0, 3112454.0, 26494.0, 946.0, 409.0, 235.0, 131.0, 95.0, 45.0, 36.0, 25.0, 11.0, 13.0, 6.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.0, -87.408203125, -84.81640625, -82.224609375, -79.6328125, -77.041015625, -74.44921875, -71.857421875, -69.265625, -66.673828125, -64.08203125, -61.490234375, -58.8984375, -56.306640625, -53.71484375, -51.123046875, -48.53125, -45.939453125, -43.34765625, -40.755859375, -38.1640625, -35.572265625, -32.98046875, -30.388671875, -27.796875, -25.205078125, -22.61328125, -20.021484375, -17.4296875, -14.837890625, -12.24609375, -9.654296875, -7.0625, -4.470703125, -1.87890625, 0.712890625, 3.3046875, 5.896484375, 8.48828125, 11.080078125, 13.671875, 16.263671875, 18.85546875, 21.447265625, 24.0390625, 26.630859375, 29.22265625, 31.814453125, 34.40625, 36.998046875, 39.58984375, 42.181640625, 44.7734375, 47.365234375, 49.95703125, 52.548828125, 55.140625, 57.732421875, 60.32421875, 62.916015625, 65.5078125, 68.099609375, 70.69140625, 73.283203125, 75.875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 20.0, 289.0, 541.0, 156.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.69527435302734, -100.67316436767578, -97.65105438232422, -94.62894439697266, -91.6068344116211, -88.58472442626953, -85.56261444091797, -82.5405044555664, -79.51839447021484, -76.49628448486328, -73.47417449951172, -70.45206451416016, -67.4299545288086, -64.40784454345703, -61.38573455810547, -58.363624572753906, -55.34151840209961, -52.31940841674805, -49.297298431396484, -46.27518844604492, -43.25307846069336, -40.2309684753418, -37.2088623046875, -34.18675231933594, -31.164640426635742, -28.14253044128418, -25.120420455932617, -22.098312377929688, -19.076202392578125, -16.054092407226562, -13.031982421875, -10.009872436523438, -6.987762451171875, -3.9656527042388916, -0.9435429573059082, 2.078566551208496, 5.100676536560059, 8.122786521911621, 11.144895553588867, 14.16700553894043, 17.189115524291992, 20.211225509643555, 23.233335494995117, 26.255443572998047, 29.27755355834961, 32.29966354370117, 35.321773529052734, 38.3438835144043, 41.36599349975586, 44.38810348510742, 47.410213470458984, 50.43232345581055, 53.45443344116211, 56.47654342651367, 59.49864959716797, 62.52075958251953, 65.5428695678711, 68.56497955322266, 71.58708953857422, 74.60919952392578, 77.63130950927734, 80.6534194946289, 83.67552947998047, 86.69763946533203, 89.7197494506836]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 9.0, 5.0, 8.0, 12.0, 12.0, 15.0, 9.0, 16.0, 31.0, 29.0, 30.0, 33.0, 36.0, 43.0, 42.0, 36.0, 32.0, 53.0, 48.0, 45.0, 42.0, 39.0, 41.0, 37.0, 30.0, 36.0, 25.0, 29.0, 26.0, 22.0, 27.0, 27.0, 11.0, 13.0, 6.0, 5.0, 5.0, 7.0, 3.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.810935974121094, -53.16584777832031, -51.52075958251953, -49.87567138671875, -48.23058319091797, -46.58549499511719, -44.94041061401367, -43.29532241821289, -41.65023422241211, -40.00514602661133, -38.36005783081055, -36.714969635009766, -35.06988525390625, -33.42479705810547, -31.779708862304688, -30.134620666503906, -28.489532470703125, -26.844444274902344, -25.199356079101562, -23.554269790649414, -21.909181594848633, -20.26409339904785, -18.619007110595703, -16.973918914794922, -15.32883071899414, -13.68374252319336, -12.038655281066895, -10.39356803894043, -8.748479843139648, -7.103391647338867, -5.458304405212402, -3.8132171630859375, -2.168132781982422, -0.5230450630187988, 1.1220426559448242, 2.7671303749084473, 4.41221809387207, 6.057306289672852, 7.702393531799316, 9.347480773925781, 10.992568969726562, 12.637657165527344, 14.282744407653809, 15.927831649780273, 17.572919845581055, 19.218008041381836, 20.863094329833984, 22.508182525634766, 24.153270721435547, 25.798358917236328, 27.44344711303711, 29.088533401489258, 30.73362159729004, 32.37870788574219, 34.02379608154297, 35.66888427734375, 37.31397247314453, 38.95906066894531, 40.604148864746094, 42.249237060546875, 43.894325256347656, 45.53941345214844, 47.18449783325195, 48.829586029052734, 50.474674224853516]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 10.0, 12.0, 19.0, 18.0, 10.0, 17.0, 26.0, 28.0, 18.0, 33.0, 22.0, 29.0, 46.0, 41.0, 45.0, 35.0, 53.0, 40.0, 51.0, 32.0, 40.0, 30.0, 36.0, 32.0, 35.0, 26.0, 29.0, 27.0, 18.0, 24.0, 14.0, 20.0, 9.0, 9.0, 12.0, 4.0, 5.0, 7.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.5487060546875, -5.366943359375, -5.1851806640625, -5.00341796875, -4.8216552734375, -4.639892578125, -4.4581298828125, -4.2763671875, -4.0946044921875, -3.912841796875, -3.7310791015625, -3.54931640625, -3.3675537109375, -3.185791015625, -3.0040283203125, -2.822265625, -2.6405029296875, -2.458740234375, -2.2769775390625, -2.09521484375, -1.9134521484375, -1.731689453125, -1.5499267578125, -1.3681640625, -1.1864013671875, -1.004638671875, -0.8228759765625, -0.64111328125, -0.4593505859375, -0.277587890625, -0.0958251953125, 0.0859375, 0.2677001953125, 0.449462890625, 0.6312255859375, 0.81298828125, 0.9947509765625, 1.176513671875, 1.3582763671875, 1.5400390625, 1.7218017578125, 1.903564453125, 2.0853271484375, 2.26708984375, 2.4488525390625, 2.630615234375, 2.8123779296875, 2.994140625, 3.1759033203125, 3.357666015625, 3.5394287109375, 3.72119140625, 3.9029541015625, 4.084716796875, 4.2664794921875, 4.4482421875, 4.6300048828125, 4.811767578125, 4.9935302734375, 5.17529296875, 5.3570556640625, 5.538818359375, 5.7205810546875, 5.90234375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 10.0, 9.0, 17.0, 14.0, 18.0, 35.0, 26.0, 40.0, 46.0, 62.0, 57.0, 105.0, 164.0, 226.0, 391.0, 918.0, 2774.0, 11556.0, 75819.0, 884145.0, 2596142.0, 558902.0, 50037.0, 8547.0, 2307.0, 766.0, 351.0, 229.0, 123.0, 86.0, 69.0, 66.0, 41.0, 32.0, 33.0, 16.0, 16.0, 15.0, 14.0, 13.0, 14.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.7281494140625, -13.276611328125, -12.8250732421875, -12.37353515625, -11.9219970703125, -11.470458984375, -11.0189208984375, -10.5673828125, -10.1158447265625, -9.664306640625, -9.2127685546875, -8.76123046875, -8.3096923828125, -7.858154296875, -7.4066162109375, -6.955078125, -6.5035400390625, -6.052001953125, -5.6004638671875, -5.14892578125, -4.6973876953125, -4.245849609375, -3.7943115234375, -3.3427734375, -2.8912353515625, -2.439697265625, -1.9881591796875, -1.53662109375, -1.0850830078125, -0.633544921875, -0.1820068359375, 0.26953125, 0.7210693359375, 1.172607421875, 1.6241455078125, 2.07568359375, 2.5272216796875, 2.978759765625, 3.4302978515625, 3.8818359375, 4.3333740234375, 4.784912109375, 5.2364501953125, 5.68798828125, 6.1395263671875, 6.591064453125, 7.0426025390625, 7.494140625, 7.9456787109375, 8.397216796875, 8.8487548828125, 9.30029296875, 9.7518310546875, 10.203369140625, 10.6549072265625, 11.1064453125, 11.5579833984375, 12.009521484375, 12.4610595703125, 12.91259765625, 13.3641357421875, 13.815673828125, 14.2672119140625, 14.71875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 7.0, 12.0, 23.0, 17.0, 20.0, 39.0, 41.0, 65.0, 67.0, 118.0, 130.0, 181.0, 234.0, 316.0, 397.0, 453.0, 409.0, 371.0, 289.0, 225.0, 160.0, 146.0, 83.0, 72.0, 44.0, 33.0, 25.0, 20.0, 14.0, 14.0, 6.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8125, -14.4306640625, -14.048828125, -13.6669921875, -13.28515625, -12.9033203125, -12.521484375, -12.1396484375, -11.7578125, -11.3759765625, -10.994140625, -10.6123046875, -10.23046875, -9.8486328125, -9.466796875, -9.0849609375, -8.703125, -8.3212890625, -7.939453125, -7.5576171875, -7.17578125, -6.7939453125, -6.412109375, -6.0302734375, -5.6484375, -5.2666015625, -4.884765625, -4.5029296875, -4.12109375, -3.7392578125, -3.357421875, -2.9755859375, -2.59375, -2.2119140625, -1.830078125, -1.4482421875, -1.06640625, -0.6845703125, -0.302734375, 0.0791015625, 0.4609375, 0.8427734375, 1.224609375, 1.6064453125, 1.98828125, 2.3701171875, 2.751953125, 3.1337890625, 3.515625, 3.8974609375, 4.279296875, 4.6611328125, 5.04296875, 5.4248046875, 5.806640625, 6.1884765625, 6.5703125, 6.9521484375, 7.333984375, 7.7158203125, 8.09765625, 8.4794921875, 8.861328125, 9.2431640625, 9.625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 16.0, 16.0, 18.0, 26.0, 34.0, 45.0, 60.0, 98.0, 140.0, 183.0, 229.0, 384.0, 719.0, 6231.0, 2482166.0, 1696963.0, 4995.0, 648.0, 351.0, 238.0, 193.0, 146.0, 102.0, 73.0, 61.0, 30.0, 34.0, 19.0, 17.0, 8.0, 12.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.625, -43.7216796875, -41.818359375, -39.9150390625, -38.01171875, -36.1083984375, -34.205078125, -32.3017578125, -30.3984375, -28.4951171875, -26.591796875, -24.6884765625, -22.78515625, -20.8818359375, -18.978515625, -17.0751953125, -15.171875, -13.2685546875, -11.365234375, -9.4619140625, -7.55859375, -5.6552734375, -3.751953125, -1.8486328125, 0.0546875, 1.9580078125, 3.861328125, 5.7646484375, 7.66796875, 9.5712890625, 11.474609375, 13.3779296875, 15.28125, 17.1845703125, 19.087890625, 20.9912109375, 22.89453125, 24.7978515625, 26.701171875, 28.6044921875, 30.5078125, 32.4111328125, 34.314453125, 36.2177734375, 38.12109375, 40.0244140625, 41.927734375, 43.8310546875, 45.734375, 47.6376953125, 49.541015625, 51.4443359375, 53.34765625, 55.2509765625, 57.154296875, 59.0576171875, 60.9609375, 62.8642578125, 64.767578125, 66.6708984375, 68.57421875, 70.4775390625, 72.380859375, 74.2841796875, 76.1875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 20.0, 115.0, 346.0, 360.0, 145.0, 21.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-309.4000244140625, -303.4617919921875, -297.5235900878906, -291.5853576660156, -285.64715576171875, -279.70892333984375, -273.77069091796875, -267.8324890136719, -261.8942565917969, -255.95603942871094, -250.017822265625, -244.07958984375, -238.14137268066406, -232.20315551757812, -226.26492309570312, -220.3267059326172, -214.38848876953125, -208.4502716064453, -202.51205444335938, -196.57382202148438, -190.63560485839844, -184.6973876953125, -178.7591552734375, -172.82093811035156, -166.88272094726562, -160.9445037841797, -155.00628662109375, -149.06805419921875, -143.1298370361328, -137.19161987304688, -131.25338745117188, -125.31517028808594, -119.376953125, -113.43873596191406, -107.5005111694336, -101.56228637695312, -95.62406921386719, -89.68585205078125, -83.74762725830078, -77.80940246582031, -71.87118530273438, -65.93296813964844, -59.99474334716797, -54.056522369384766, -48.11830139160156, -42.18008041381836, -36.241859436035156, -30.303638458251953, -24.36541748046875, -18.427196502685547, -12.488975524902344, -6.550754547119141, -0.6125335693359375, 5.325687408447266, 11.263908386230469, 17.202129364013672, 23.140350341796875, 29.078571319580078, 35.01679229736328, 40.955013275146484, 46.89323425292969, 52.83145523071289, 58.769676208496094, 64.70790100097656, 70.6461181640625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 2.0, 9.0, 4.0, 8.0, 10.0, 12.0, 16.0, 8.0, 20.0, 28.0, 27.0, 27.0, 23.0, 32.0, 33.0, 39.0, 33.0, 35.0, 45.0, 31.0, 41.0, 38.0, 41.0, 43.0, 40.0, 41.0, 39.0, 44.0, 32.0, 22.0, 24.0, 23.0, 16.0, 28.0, 10.0, 8.0, 15.0, 11.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.456787109375, -38.23329544067383, -37.009803771972656, -35.78630828857422, -34.56281661987305, -33.339324951171875, -32.1158332824707, -30.8923397064209, -29.668846130371094, -28.445354461669922, -27.221860885620117, -25.998369216918945, -24.77487564086914, -23.55138397216797, -22.327892303466797, -21.104398727416992, -19.88090705871582, -18.65741539001465, -17.433921813964844, -16.210430145263672, -14.986936569213867, -13.763444900512695, -12.539952278137207, -11.316459655761719, -10.09296703338623, -8.869474411010742, -7.645981788635254, -6.422489643096924, -5.1989970207214355, -3.9755043983459473, -2.752012252807617, -1.528519630432129, -0.3050270080566406, 0.9184654951095581, 2.141957998275757, 3.365450382232666, 4.588943004608154, 5.812435626983643, 7.035927772521973, 8.259420394897461, 9.48291301727295, 10.706405639648438, 11.929898262023926, 13.153390884399414, 14.376882553100586, 15.60037612915039, 16.823867797851562, 18.047359466552734, 19.27085304260254, 20.49434471130371, 21.717838287353516, 22.941329956054688, 24.164823532104492, 25.388315200805664, 26.61180877685547, 27.83530044555664, 29.058792114257812, 30.282283782958984, 31.50577735900879, 32.729270935058594, 33.952762603759766, 35.17625427246094, 36.39974594116211, 37.62323760986328, 38.84673309326172]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 16.0, 11.0, 13.0, 17.0, 19.0, 19.0, 21.0, 27.0, 27.0, 24.0, 33.0, 36.0, 29.0, 40.0, 41.0, 41.0, 47.0, 47.0, 32.0, 39.0, 37.0, 38.0, 43.0, 43.0, 33.0, 23.0, 41.0, 26.0, 17.0, 13.0, 20.0, 19.0, 13.0, 11.0, 8.0, 5.0, 4.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0], "bins": [-6.59765625, -6.4124755859375, -6.227294921875, -6.0421142578125, -5.85693359375, -5.6717529296875, -5.486572265625, -5.3013916015625, -5.1162109375, -4.9310302734375, -4.745849609375, -4.5606689453125, -4.37548828125, -4.1903076171875, -4.005126953125, -3.8199462890625, -3.634765625, -3.4495849609375, -3.264404296875, -3.0792236328125, -2.89404296875, -2.7088623046875, -2.523681640625, -2.3385009765625, -2.1533203125, -1.9681396484375, -1.782958984375, -1.5977783203125, -1.41259765625, -1.2274169921875, -1.042236328125, -0.8570556640625, -0.671875, -0.4866943359375, -0.301513671875, -0.1163330078125, 0.06884765625, 0.2540283203125, 0.439208984375, 0.6243896484375, 0.8095703125, 0.9947509765625, 1.179931640625, 1.3651123046875, 1.55029296875, 1.7354736328125, 1.920654296875, 2.1058349609375, 2.291015625, 2.4761962890625, 2.661376953125, 2.8465576171875, 3.03173828125, 3.2169189453125, 3.402099609375, 3.5872802734375, 3.7724609375, 3.9576416015625, 4.142822265625, 4.3280029296875, 4.51318359375, 4.6983642578125, 4.883544921875, 5.0687255859375, 5.25390625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 29.0, 39.0, 43.0, 68.0, 95.0, 151.0, 176.0, 340.0, 448.0, 699.0, 1042.0, 1685.0, 2554.0, 4182.0, 6562.0, 10062.0, 16034.0, 26132.0, 41031.0, 65697.0, 101046.0, 144413.0, 173384.0, 151292.0, 108347.0, 70788.0, 45028.0, 28331.0, 17792.0, 11304.0, 6944.0, 4547.0, 2959.0, 1862.0, 1142.0, 739.0, 497.0, 342.0, 220.0, 143.0, 91.0, 76.0, 50.0, 34.0, 23.0, 17.0, 16.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5513153076171875, -0.533294677734375, -0.5152740478515625, -0.49725341796875, -0.4792327880859375, -0.461212158203125, -0.4431915283203125, -0.4251708984375, -0.4071502685546875, -0.389129638671875, -0.3711090087890625, -0.35308837890625, -0.3350677490234375, -0.317047119140625, -0.2990264892578125, -0.281005859375, -0.2629852294921875, -0.244964599609375, -0.2269439697265625, -0.20892333984375, -0.1909027099609375, -0.172882080078125, -0.1548614501953125, -0.1368408203125, -0.1188201904296875, -0.100799560546875, -0.0827789306640625, -0.06475830078125, -0.0467376708984375, -0.028717041015625, -0.0106964111328125, 0.00732421875, 0.0253448486328125, 0.043365478515625, 0.0613861083984375, 0.07940673828125, 0.0974273681640625, 0.115447998046875, 0.1334686279296875, 0.1514892578125, 0.1695098876953125, 0.187530517578125, 0.2055511474609375, 0.22357177734375, 0.2415924072265625, 0.259613037109375, 0.2776336669921875, 0.295654296875, 0.3136749267578125, 0.331695556640625, 0.3497161865234375, 0.36773681640625, 0.3857574462890625, 0.403778076171875, 0.4217987060546875, 0.4398193359375, 0.4578399658203125, 0.475860595703125, 0.4938812255859375, 0.51190185546875, 0.5299224853515625, 0.547943115234375, 0.5659637451171875, 0.583984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 16.0, 9.0, 15.0, 22.0, 15.0, 18.0, 26.0, 25.0, 25.0, 36.0, 40.0, 27.0, 40.0, 38.0, 41.0, 35.0, 1058.0, 51.0, 40.0, 44.0, 46.0, 22.0, 41.0, 26.0, 33.0, 19.0, 21.0, 24.0, 26.0, 18.0, 17.0, 16.0, 10.0, 12.0, 8.0, 7.0, 2.0, 6.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8515625, -3.7366943359375, -3.621826171875, -3.5069580078125, -3.39208984375, -3.2772216796875, -3.162353515625, -3.0474853515625, -2.9326171875, -2.8177490234375, -2.702880859375, -2.5880126953125, -2.47314453125, -2.3582763671875, -2.243408203125, -2.1285400390625, -2.013671875, -1.8988037109375, -1.783935546875, -1.6690673828125, -1.55419921875, -1.4393310546875, -1.324462890625, -1.2095947265625, -1.0947265625, -0.9798583984375, -0.864990234375, -0.7501220703125, -0.63525390625, -0.5203857421875, -0.405517578125, -0.2906494140625, -0.17578125, -0.0609130859375, 0.053955078125, 0.1688232421875, 0.28369140625, 0.3985595703125, 0.513427734375, 0.6282958984375, 0.7431640625, 0.8580322265625, 0.972900390625, 1.0877685546875, 1.20263671875, 1.3175048828125, 1.432373046875, 1.5472412109375, 1.662109375, 1.7769775390625, 1.891845703125, 2.0067138671875, 2.12158203125, 2.2364501953125, 2.351318359375, 2.4661865234375, 2.5810546875, 2.6959228515625, 2.810791015625, 2.9256591796875, 3.04052734375, 3.1553955078125, 3.270263671875, 3.3851318359375, 3.5]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 20.0, 20.0, 35.0, 45.0, 56.0, 103.0, 159.0, 232.0, 384.0, 538.0, 807.0, 1168.0, 1689.0, 2708.0, 4185.0, 6203.0, 9434.0, 14539.0, 22104.0, 34354.0, 51468.0, 75753.0, 104570.0, 131254.0, 1190740.0, 128516.0, 101328.0, 72132.0, 49212.0, 32546.0, 21167.0, 13452.0, 8910.0, 5843.0, 3789.0, 2510.0, 1685.0, 1123.0, 786.0, 543.0, 359.0, 234.0, 152.0, 107.0, 70.0, 36.0, 20.0, 16.0, 8.0, 6.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3846397399902344, -0.37157440185546875, -0.3585090637207031, -0.3454437255859375, -0.3323783874511719, -0.31931304931640625, -0.3062477111816406, -0.293182373046875, -0.2801170349121094, -0.26705169677734375, -0.2539863586425781, -0.2409210205078125, -0.22785568237304688, -0.21479034423828125, -0.20172500610351562, -0.18865966796875, -0.17559432983398438, -0.16252899169921875, -0.14946365356445312, -0.1363983154296875, -0.12333297729492188, -0.11026763916015625, -0.09720230102539062, -0.084136962890625, -0.07107162475585938, -0.05800628662109375, -0.044940948486328125, -0.0318756103515625, -0.018810272216796875, -0.00574493408203125, 0.007320404052734375, 0.0203857421875, 0.033451080322265625, 0.04651641845703125, 0.059581756591796875, 0.0726470947265625, 0.08571243286132812, 0.09877777099609375, 0.11184310913085938, 0.124908447265625, 0.13797378540039062, 0.15103912353515625, 0.16410446166992188, 0.1771697998046875, 0.19023513793945312, 0.20330047607421875, 0.21636581420898438, 0.22943115234375, 0.24249649047851562, 0.25556182861328125, 0.2686271667480469, 0.2816925048828125, 0.2947578430175781, 0.30782318115234375, 0.3208885192871094, 0.333953857421875, 0.3470191955566406, 0.36008453369140625, 0.3731498718261719, 0.3862152099609375, 0.3992805480957031, 0.41234588623046875, 0.4254112243652344, 0.4384765625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 2.0, 7.0, 10.0, 10.0, 9.0, 22.0, 25.0, 22.0, 37.0, 34.0, 56.0, 74.0, 83.0, 73.0, 77.0, 68.0, 62.0, 63.0, 55.0, 31.0, 31.0, 28.0, 19.0, 11.0, 18.0, 5.0, 13.0, 10.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037250518798828125, -0.0036031901836395264, -0.0034813284873962402, -0.003359466791152954, -0.003237605094909668, -0.003115743398666382, -0.0029938817024230957, -0.0028720200061798096, -0.0027501583099365234, -0.0026282966136932373, -0.002506434917449951, -0.002384573221206665, -0.002262711524963379, -0.0021408498287200928, -0.0020189881324768066, -0.0018971264362335205, -0.0017752647399902344, -0.0016534030437469482, -0.0015315413475036621, -0.001409679651260376, -0.0012878179550170898, -0.0011659562587738037, -0.0010440945625305176, -0.0009222328662872314, -0.0008003711700439453, -0.0006785094738006592, -0.000556647777557373, -0.0004347860813140869, -0.0003129243850708008, -0.00019106268882751465, -6.920099258422852e-05, 5.266070365905762e-05, 0.00017452239990234375, 0.0002963840961456299, 0.000418245792388916, 0.0005401074886322021, 0.0006619691848754883, 0.0007838308811187744, 0.0009056925773620605, 0.0010275542736053467, 0.0011494159698486328, 0.001271277666091919, 0.001393139362335205, 0.0015150010585784912, 0.0016368627548217773, 0.0017587244510650635, 0.0018805861473083496, 0.0020024478435516357, 0.002124309539794922, 0.002246171236038208, 0.002368032932281494, 0.0024898946285247803, 0.0026117563247680664, 0.0027336180210113525, 0.0028554797172546387, 0.002977341413497925, 0.003099203109741211, 0.003221064805984497, 0.003342926502227783, 0.0034647881984710693, 0.0035866498947143555, 0.0037085115909576416, 0.0038303732872009277, 0.003952234983444214, 0.0040740966796875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 13.0, 15.0, 12.0, 22.0, 17.0, 31.0, 51.0, 65.0, 69.0, 130.0, 236.0, 522.0, 5768.0, 1024990.0, 15111.0, 674.0, 288.0, 161.0, 96.0, 52.0, 46.0, 38.0, 30.0, 21.0, 16.0, 10.0, 8.0, 4.0, 11.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08984375, -0.08716869354248047, -0.08449363708496094, -0.0818185806274414, -0.07914352416992188, -0.07646846771240234, -0.07379341125488281, -0.07111835479736328, -0.06844329833984375, -0.06576824188232422, -0.06309318542480469, -0.060418128967285156, -0.057743072509765625, -0.055068016052246094, -0.05239295959472656, -0.04971790313720703, -0.0470428466796875, -0.04436779022216797, -0.04169273376464844, -0.039017677307128906, -0.036342620849609375, -0.033667564392089844, -0.030992507934570312, -0.02831745147705078, -0.02564239501953125, -0.02296733856201172, -0.020292282104492188, -0.017617225646972656, -0.014942169189453125, -0.012267112731933594, -0.009592056274414062, -0.006916999816894531, -0.004241943359375, -0.0015668869018554688, 0.0011081695556640625, 0.0037832260131835938, 0.006458282470703125, 0.009133338928222656, 0.011808395385742188, 0.014483451843261719, 0.01715850830078125, 0.01983356475830078, 0.022508621215820312, 0.025183677673339844, 0.027858734130859375, 0.030533790588378906, 0.03320884704589844, 0.03588390350341797, 0.0385589599609375, 0.04123401641845703, 0.04390907287597656, 0.046584129333496094, 0.049259185791015625, 0.051934242248535156, 0.05460929870605469, 0.05728435516357422, 0.05995941162109375, 0.06263446807861328, 0.06530952453613281, 0.06798458099365234, 0.07065963745117188, 0.0733346939086914, 0.07600975036621094, 0.07868480682373047, 0.08135986328125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [71.0, 879.0, 67.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001219928846694529, -0.00038170168409124017, 0.0004565254785120487, 0.0012947526993229985, 0.0021329796873033047, 0.00297120725736022, 0.003809434361755848, 0.004647661466151476, 0.005485888570547104, 0.006324115674942732, 0.00716234277933836, 0.008000570349395275, 0.008838796988129616, 0.009677024558186531, 0.010515252128243446, 0.011353478766977787, 0.012191705405712128, 0.013029932975769043, 0.013868159614503384, 0.014706387184560299, 0.01554461382329464, 0.016382841393351555, 0.01722106896340847, 0.018059294670820236, 0.01889752224087715, 0.019735749810934067, 0.020573977380990982, 0.021412203088402748, 0.022250430658459663, 0.02308865822851658, 0.023926885798573494, 0.02476511150598526, 0.025603340938687325, 0.02644156850874424, 0.027279796078801155, 0.02811802178621292, 0.028956249356269836, 0.02979447692632675, 0.030632704496383667, 0.03147093206644058, 0.0323091596364975, 0.03314738720655441, 0.03398561477661133, 0.03482384234666824, 0.03566206991672516, 0.036500297486782074, 0.03733852133154869, 0.038176748901605606, 0.03901497647166252, 0.03985320404171944, 0.04069143161177635, 0.04152965918183327, 0.04236788675189018, 0.0432061105966568, 0.044044338166713715, 0.04488256573677063, 0.045720793306827545, 0.04655902087688446, 0.047397248446941376, 0.04823547601699829, 0.049073703587055206, 0.04991193115711212, 0.05075015500187874, 0.051588382571935654, 0.05242661014199257]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 9.0, 9.0, 16.0, 24.0, 30.0, 32.0, 29.0, 37.0, 44.0, 57.0, 67.0, 60.0, 76.0, 60.0, 68.0, 45.0, 45.0, 61.0, 45.0, 52.0, 30.0, 25.0, 17.0, 12.0, 14.0, 11.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036977529525756836, -0.003597537986934185, -0.0034973230212926865, -0.003397108055651188, -0.0032968930900096893, -0.0031966781243681908, -0.003096463158726692, -0.0029962481930851936, -0.002896033227443695, -0.0027958182618021965, -0.002695603296160698, -0.0025953883305191994, -0.002495173364877701, -0.0023949583992362022, -0.0022947434335947037, -0.002194528467953205, -0.0020943135023117065, -0.001994098536670208, -0.0018938835710287094, -0.0017936686053872108, -0.0016934536397457123, -0.0015932386741042137, -0.0014930237084627151, -0.0013928087428212166, -0.001292593777179718, -0.0011923788115382195, -0.0010921638458967209, -0.0009919488802552223, -0.0008917339146137238, -0.0007915189489722252, -0.0006913039833307266, -0.0005910890176892281, -0.0004908740520477295, -0.0003906590864062309, -0.00029044412076473236, -0.0001902291551232338, -9.001418948173523e-05, 1.0200776159763336e-05, 0.0001104157418012619, 0.00021063070744276047, 0.00031084567308425903, 0.0004110606387257576, 0.0005112756043672562, 0.0006114905700087547, 0.0007117055356502533, 0.0008119205012917519, 0.0009121354669332504, 0.001012350432574749, 0.0011125653982162476, 0.0012127803638577461, 0.0013129953294992447, 0.0014132102951407433, 0.0015134252607822418, 0.0016136402264237404, 0.001713855192065239, 0.0018140701577067375, 0.001914285123348236, 0.0020145000889897346, 0.002114715054631233, 0.0022149300202727318, 0.0023151449859142303, 0.002415359951555729, 0.0025155749171972275, 0.002615789882838726, 0.0027160048484802246]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 16.0, 11.0, 13.0, 17.0, 19.0, 18.0, 22.0, 27.0, 27.0, 24.0, 34.0, 35.0, 29.0, 40.0, 41.0, 41.0, 47.0, 47.0, 32.0, 39.0, 37.0, 38.0, 43.0, 43.0, 33.0, 23.0, 41.0, 26.0, 17.0, 13.0, 20.0, 19.0, 13.0, 11.0, 8.0, 5.0, 4.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0], "bins": [-6.59765625, -6.4124755859375, -6.227294921875, -6.0421142578125, -5.85693359375, -5.6717529296875, -5.486572265625, -5.3013916015625, -5.1162109375, -4.9310302734375, -4.745849609375, -4.5606689453125, -4.37548828125, -4.1903076171875, -4.005126953125, -3.8199462890625, -3.634765625, -3.4495849609375, -3.264404296875, -3.0792236328125, -2.89404296875, -2.7088623046875, -2.523681640625, -2.3385009765625, -2.1533203125, -1.9681396484375, -1.782958984375, -1.5977783203125, -1.41259765625, -1.2274169921875, -1.042236328125, -0.8570556640625, -0.671875, -0.4866943359375, -0.301513671875, -0.1163330078125, 0.06884765625, 0.2540283203125, 0.439208984375, 0.6243896484375, 0.8095703125, 0.9947509765625, 1.179931640625, 1.3651123046875, 1.55029296875, 1.7354736328125, 1.920654296875, 2.1058349609375, 2.291015625, 2.4761962890625, 2.661376953125, 2.8465576171875, 3.03173828125, 3.2169189453125, 3.402099609375, 3.5872802734375, 3.7724609375, 3.9576416015625, 4.142822265625, 4.3280029296875, 4.51318359375, 4.6983642578125, 4.883544921875, 5.0687255859375, 5.25390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 13.0, 17.0, 32.0, 48.0, 73.0, 134.0, 206.0, 362.0, 637.0, 1120.0, 2195.0, 4443.0, 9505.0, 20660.0, 48966.0, 124286.0, 348908.0, 299073.0, 109153.0, 43303.0, 18423.0, 8526.0, 3999.0, 1971.0, 1071.0, 590.0, 324.0, 165.0, 113.0, 71.0, 54.0, 28.0, 26.0, 14.0, 11.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.3125, -5.1407470703125, -4.968994140625, -4.7972412109375, -4.62548828125, -4.4537353515625, -4.281982421875, -4.1102294921875, -3.9384765625, -3.7667236328125, -3.594970703125, -3.4232177734375, -3.25146484375, -3.0797119140625, -2.907958984375, -2.7362060546875, -2.564453125, -2.3927001953125, -2.220947265625, -2.0491943359375, -1.87744140625, -1.7056884765625, -1.533935546875, -1.3621826171875, -1.1904296875, -1.0186767578125, -0.846923828125, -0.6751708984375, -0.50341796875, -0.3316650390625, -0.159912109375, 0.0118408203125, 0.18359375, 0.3553466796875, 0.527099609375, 0.6988525390625, 0.87060546875, 1.0423583984375, 1.214111328125, 1.3858642578125, 1.5576171875, 1.7293701171875, 1.901123046875, 2.0728759765625, 2.24462890625, 2.4163818359375, 2.588134765625, 2.7598876953125, 2.931640625, 3.1033935546875, 3.275146484375, 3.4468994140625, 3.61865234375, 3.7904052734375, 3.962158203125, 4.1339111328125, 4.3056640625, 4.4774169921875, 4.649169921875, 4.8209228515625, 4.99267578125, 5.1644287109375, 5.336181640625, 5.5079345703125, 5.6796875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 11.0, 12.0, 11.0, 15.0, 17.0, 20.0, 21.0, 21.0, 24.0, 26.0, 50.0, 52.0, 41.0, 41.0, 66.0, 100.0, 235.0, 1461.0, 253.0, 101.0, 69.0, 37.0, 27.0, 44.0, 33.0, 30.0, 25.0, 26.0, 16.0, 18.0, 17.0, 20.0, 13.0, 14.0, 16.0, 10.0, 4.0, 6.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 5.0], "bins": [-20.921875, -20.349609375, -19.77734375, -19.205078125, -18.6328125, -18.060546875, -17.48828125, -16.916015625, -16.34375, -15.771484375, -15.19921875, -14.626953125, -14.0546875, -13.482421875, -12.91015625, -12.337890625, -11.765625, -11.193359375, -10.62109375, -10.048828125, -9.4765625, -8.904296875, -8.33203125, -7.759765625, -7.1875, -6.615234375, -6.04296875, -5.470703125, -4.8984375, -4.326171875, -3.75390625, -3.181640625, -2.609375, -2.037109375, -1.46484375, -0.892578125, -0.3203125, 0.251953125, 0.82421875, 1.396484375, 1.96875, 2.541015625, 3.11328125, 3.685546875, 4.2578125, 4.830078125, 5.40234375, 5.974609375, 6.546875, 7.119140625, 7.69140625, 8.263671875, 8.8359375, 9.408203125, 9.98046875, 10.552734375, 11.125, 11.697265625, 12.26953125, 12.841796875, 13.4140625, 13.986328125, 14.55859375, 15.130859375, 15.703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 10.0, 10.0, 7.0, 15.0, 18.0, 34.0, 39.0, 40.0, 49.0, 69.0, 108.0, 154.0, 226.0, 299.0, 583.0, 2828.0, 447872.0, 2686451.0, 4881.0, 759.0, 381.0, 238.0, 165.0, 117.0, 73.0, 61.0, 59.0, 32.0, 27.0, 23.0, 13.0, 12.0, 13.0, 8.0, 5.0, 7.0, 3.0, 1.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.84375, -54.10400390625, -52.3642578125, -50.62451171875, -48.884765625, -47.14501953125, -45.4052734375, -43.66552734375, -41.92578125, -40.18603515625, -38.4462890625, -36.70654296875, -34.966796875, -33.22705078125, -31.4873046875, -29.74755859375, -28.0078125, -26.26806640625, -24.5283203125, -22.78857421875, -21.048828125, -19.30908203125, -17.5693359375, -15.82958984375, -14.08984375, -12.35009765625, -10.6103515625, -8.87060546875, -7.130859375, -5.39111328125, -3.6513671875, -1.91162109375, -0.171875, 1.56787109375, 3.3076171875, 5.04736328125, 6.787109375, 8.52685546875, 10.2666015625, 12.00634765625, 13.74609375, 15.48583984375, 17.2255859375, 18.96533203125, 20.705078125, 22.44482421875, 24.1845703125, 25.92431640625, 27.6640625, 29.40380859375, 31.1435546875, 32.88330078125, 34.623046875, 36.36279296875, 38.1025390625, 39.84228515625, 41.58203125, 43.32177734375, 45.0615234375, 46.80126953125, 48.541015625, 50.28076171875, 52.0205078125, 53.76025390625, 55.5]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 103.0, 784.0, 127.0, 1.0, 0.0, 2.0], "bins": [-326.47576904296875, -320.9872131347656, -315.4986877441406, -310.0101318359375, -304.5215759277344, -299.03302001953125, -293.54449462890625, -288.0559387207031, -282.5673828125, -277.0788269042969, -271.5903015136719, -266.10174560546875, -260.6131896972656, -255.12464904785156, -249.6361083984375, -244.14755249023438, -238.65902709960938, -233.1704864501953, -227.6819305419922, -222.19338989257812, -216.704833984375, -211.21629333496094, -205.72775268554688, -200.23919677734375, -194.75064086914062, -189.26210021972656, -183.77354431152344, -178.28500366210938, -172.79644775390625, -167.3079071044922, -161.81936645507812, -156.330810546875, -150.84228515625, -145.35374450683594, -139.8651885986328, -134.37664794921875, -128.88809204101562, -123.39955139160156, -117.91100311279297, -112.42245483398438, -106.93390655517578, -101.44535827636719, -95.9568099975586, -90.46826171875, -84.97972106933594, -79.49117279052734, -74.00262451171875, -68.51408386230469, -63.025535583496094, -57.5369873046875, -52.04844284057617, -46.55989456176758, -41.07135009765625, -35.582801818847656, -30.094253540039062, -24.605709075927734, -19.117158889770508, -13.628612518310547, -8.14006519317627, -2.651517868041992, 2.8370285034179688, 8.32557487487793, 13.814123153686523, 19.30266761779785, 24.791215896606445]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 3.0, 3.0, 8.0, 13.0, 15.0, 14.0, 15.0, 12.0, 21.0, 11.0, 26.0, 23.0, 33.0, 30.0, 41.0, 38.0, 47.0, 46.0, 37.0, 38.0, 38.0, 49.0, 40.0, 41.0, 35.0, 43.0, 32.0, 44.0, 27.0, 32.0, 10.0, 22.0, 22.0, 19.0, 11.0, 12.0, 8.0, 2.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.37596893310547, -43.847267150878906, -42.318565368652344, -40.78986358642578, -39.26116180419922, -37.73246383666992, -36.20376205444336, -34.6750602722168, -33.146358489990234, -31.617656707763672, -30.08895492553711, -28.56025505065918, -27.031553268432617, -25.502851486206055, -23.974151611328125, -22.445449829101562, -20.916748046875, -19.388046264648438, -17.859344482421875, -16.330644607543945, -14.801942825317383, -13.27324104309082, -11.744540214538574, -10.215839385986328, -8.687137603759766, -7.158436298370361, -5.629734992980957, -4.101033687591553, -2.5723323822021484, -1.0436310768127441, 0.48507022857666016, 2.0137710571289062, 3.5424766540527344, 5.071177959442139, 6.599879264831543, 8.128580093383789, 9.657281875610352, 11.185983657836914, 12.71468448638916, 14.243385314941406, 15.772087097167969, 17.30078887939453, 18.829490661621094, 20.358190536499023, 21.886892318725586, 23.41559410095215, 24.944293975830078, 26.47299575805664, 28.001697540283203, 29.530399322509766, 31.059101104736328, 32.58780288696289, 34.11650085449219, 35.64520263671875, 37.17390441894531, 38.702606201171875, 40.23130798339844, 41.760009765625, 43.28871154785156, 44.817413330078125, 46.34611511230469, 47.874813079833984, 49.40351486206055, 50.93221664428711, 52.46091842651367]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 4.0, 9.0, 14.0, 12.0, 15.0, 14.0, 24.0, 22.0, 16.0, 27.0, 36.0, 35.0, 33.0, 35.0, 31.0, 46.0, 33.0, 54.0, 38.0, 35.0, 47.0, 41.0, 31.0, 39.0, 40.0, 32.0, 33.0, 26.0, 24.0, 21.0, 27.0, 10.0, 18.0, 9.0, 15.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.23828125, -6.04193115234375, -5.8455810546875, -5.64923095703125, -5.452880859375, -5.25653076171875, -5.0601806640625, -4.86383056640625, -4.66748046875, -4.47113037109375, -4.2747802734375, -4.07843017578125, -3.882080078125, -3.68572998046875, -3.4893798828125, -3.29302978515625, -3.0966796875, -2.90032958984375, -2.7039794921875, -2.50762939453125, -2.311279296875, -2.11492919921875, -1.9185791015625, -1.72222900390625, -1.52587890625, -1.32952880859375, -1.1331787109375, -0.93682861328125, -0.740478515625, -0.54412841796875, -0.3477783203125, -0.15142822265625, 0.044921875, 0.24127197265625, 0.4376220703125, 0.63397216796875, 0.830322265625, 1.02667236328125, 1.2230224609375, 1.41937255859375, 1.61572265625, 1.81207275390625, 2.0084228515625, 2.20477294921875, 2.401123046875, 2.59747314453125, 2.7938232421875, 2.99017333984375, 3.1865234375, 3.38287353515625, 3.5792236328125, 3.77557373046875, 3.971923828125, 4.16827392578125, 4.3646240234375, 4.56097412109375, 4.75732421875, 4.95367431640625, 5.1500244140625, 5.34637451171875, 5.542724609375, 5.73907470703125, 5.9354248046875, 6.13177490234375, 6.328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 2.0, 7.0, 12.0, 13.0, 13.0, 9.0, 12.0, 18.0, 20.0, 26.0, 38.0, 57.0, 60.0, 118.0, 198.0, 458.0, 1363.0, 5872.0, 45823.0, 1085378.0, 2854394.0, 182657.0, 13740.0, 2528.0, 713.0, 281.0, 134.0, 87.0, 50.0, 40.0, 29.0, 28.0, 13.0, 20.0, 19.0, 10.0, 8.0, 8.0, 1.0, 6.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.783203125, -19.12890625, -18.474609375, -17.8203125, -17.166015625, -16.51171875, -15.857421875, -15.203125, -14.548828125, -13.89453125, -13.240234375, -12.5859375, -11.931640625, -11.27734375, -10.623046875, -9.96875, -9.314453125, -8.66015625, -8.005859375, -7.3515625, -6.697265625, -6.04296875, -5.388671875, -4.734375, -4.080078125, -3.42578125, -2.771484375, -2.1171875, -1.462890625, -0.80859375, -0.154296875, 0.5, 1.154296875, 1.80859375, 2.462890625, 3.1171875, 3.771484375, 4.42578125, 5.080078125, 5.734375, 6.388671875, 7.04296875, 7.697265625, 8.3515625, 9.005859375, 9.66015625, 10.314453125, 10.96875, 11.623046875, 12.27734375, 12.931640625, 13.5859375, 14.240234375, 14.89453125, 15.548828125, 16.203125, 16.857421875, 17.51171875, 18.166015625, 18.8203125, 19.474609375, 20.12890625, 20.783203125, 21.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 10.0, 16.0, 19.0, 23.0, 46.0, 67.0, 65.0, 107.0, 124.0, 135.0, 212.0, 311.0, 417.0, 475.0, 503.0, 427.0, 304.0, 212.0, 168.0, 125.0, 81.0, 65.0, 33.0, 30.0, 16.0, 20.0, 15.0, 14.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.046875, -15.6126708984375, -15.178466796875, -14.7442626953125, -14.31005859375, -13.8758544921875, -13.441650390625, -13.0074462890625, -12.5732421875, -12.1390380859375, -11.704833984375, -11.2706298828125, -10.83642578125, -10.4022216796875, -9.968017578125, -9.5338134765625, -9.099609375, -8.6654052734375, -8.231201171875, -7.7969970703125, -7.36279296875, -6.9285888671875, -6.494384765625, -6.0601806640625, -5.6259765625, -5.1917724609375, -4.757568359375, -4.3233642578125, -3.88916015625, -3.4549560546875, -3.020751953125, -2.5865478515625, -2.15234375, -1.7181396484375, -1.283935546875, -0.8497314453125, -0.41552734375, 0.0186767578125, 0.452880859375, 0.8870849609375, 1.3212890625, 1.7554931640625, 2.189697265625, 2.6239013671875, 3.05810546875, 3.4923095703125, 3.926513671875, 4.3607177734375, 4.794921875, 5.2291259765625, 5.663330078125, 6.0975341796875, 6.53173828125, 6.9659423828125, 7.400146484375, 7.8343505859375, 8.2685546875, 8.7027587890625, 9.136962890625, 9.5711669921875, 10.00537109375, 10.4395751953125, 10.873779296875, 11.3079833984375, 11.7421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 13.0, 17.0, 31.0, 22.0, 26.0, 42.0, 62.0, 102.0, 152.0, 211.0, 247.0, 367.0, 846.0, 19431.0, 4001614.0, 167875.0, 1617.0, 464.0, 278.0, 206.0, 197.0, 126.0, 99.0, 74.0, 44.0, 36.0, 22.0, 16.0, 13.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.21875, -53.14892578125, -51.0791015625, -49.00927734375, -46.939453125, -44.86962890625, -42.7998046875, -40.72998046875, -38.66015625, -36.59033203125, -34.5205078125, -32.45068359375, -30.380859375, -28.31103515625, -26.2412109375, -24.17138671875, -22.1015625, -20.03173828125, -17.9619140625, -15.89208984375, -13.822265625, -11.75244140625, -9.6826171875, -7.61279296875, -5.54296875, -3.47314453125, -1.4033203125, 0.66650390625, 2.736328125, 4.80615234375, 6.8759765625, 8.94580078125, 11.015625, 13.08544921875, 15.1552734375, 17.22509765625, 19.294921875, 21.36474609375, 23.4345703125, 25.50439453125, 27.57421875, 29.64404296875, 31.7138671875, 33.78369140625, 35.853515625, 37.92333984375, 39.9931640625, 42.06298828125, 44.1328125, 46.20263671875, 48.2724609375, 50.34228515625, 52.412109375, 54.48193359375, 56.5517578125, 58.62158203125, 60.69140625, 62.76123046875, 64.8310546875, 66.90087890625, 68.970703125, 71.04052734375, 73.1103515625, 75.18017578125, 77.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 103.0, 387.0, 379.0, 121.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.4558410644531, -293.9368591308594, -287.4178466796875, -280.89886474609375, -274.3798828125, -267.86090087890625, -261.3418884277344, -254.82290649414062, -248.3039093017578, -241.784912109375, -235.26593017578125, -228.74693298339844, -222.22793579101562, -215.70895385742188, -209.18995666503906, -202.67095947265625, -196.1519775390625, -189.6329803466797, -183.11399841308594, -176.59500122070312, -170.07601928710938, -163.55702209472656, -157.03802490234375, -150.51904296875, -144.0000457763672, -137.48104858398438, -130.96206665039062, -124.44306945800781, -117.92407989501953, -111.40509033203125, -104.88609313964844, -98.36710357666016, -91.84811401367188, -85.3291244506836, -78.81013488769531, -72.2911376953125, -65.77214813232422, -59.25315856933594, -52.73416519165039, -46.215171813964844, -39.69618225097656, -33.17719268798828, -26.658199310302734, -20.13920783996582, -13.620216369628906, -7.101226806640625, -0.5822334289550781, 5.936759948730469, 12.45574951171875, 18.974740982055664, 25.493732452392578, 32.012725830078125, 38.531715393066406, 45.05070495605469, 51.569698333740234, 58.08869171142578, 64.60768127441406, 71.12667083740234, 77.64566040039062, 84.16465759277344, 90.68364715576172, 97.20263671875, 103.72163391113281, 110.2406234741211, 116.75961303710938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 11.0, 10.0, 10.0, 18.0, 24.0, 21.0, 29.0, 30.0, 44.0, 38.0, 33.0, 28.0, 38.0, 36.0, 39.0, 42.0, 46.0, 37.0, 34.0, 33.0, 35.0, 34.0, 47.0, 31.0, 33.0, 27.0, 25.0, 28.0, 21.0, 14.0, 13.0, 13.0, 13.0, 8.0, 6.0, 16.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-45.386871337890625, -44.06365966796875, -42.74044418334961, -41.41722869873047, -40.094017028808594, -38.77080535888672, -37.44758987426758, -36.12437438964844, -34.80116271972656, -33.47795104980469, -32.15473556518555, -30.83152198791504, -29.50830841064453, -28.185094833374023, -26.861881256103516, -25.538667678833008, -24.2154541015625, -22.892240524291992, -21.569026947021484, -20.245813369750977, -18.92259979248047, -17.59938621520996, -16.276172637939453, -14.952959060668945, -13.629745483398438, -12.30653190612793, -10.983318328857422, -9.660104751586914, -8.336891174316406, -7.013677597045898, -5.690464019775391, -4.367250442504883, -3.044036865234375, -1.7208232879638672, -0.3976097106933594, 0.9256038665771484, 2.2488174438476562, 3.572031021118164, 4.895244598388672, 6.21845817565918, 7.5416717529296875, 8.864885330200195, 10.188098907470703, 11.511312484741211, 12.834526062011719, 14.157739639282227, 15.480953216552734, 16.804166793823242, 18.12738037109375, 19.450593948364258, 20.773807525634766, 22.097021102905273, 23.42023468017578, 24.74344825744629, 26.066661834716797, 27.389875411987305, 28.713088989257812, 30.03630256652832, 31.359516143798828, 32.68273162841797, 34.005943298339844, 35.32915496826172, 36.65237045288086, 37.9755859375, 39.298797607421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 10.0, 7.0, 13.0, 15.0, 14.0, 20.0, 23.0, 28.0, 37.0, 27.0, 40.0, 35.0, 24.0, 42.0, 41.0, 30.0, 48.0, 40.0, 42.0, 56.0, 50.0, 40.0, 38.0, 36.0, 34.0, 29.0, 37.0, 24.0, 18.0, 16.0, 12.0, 16.0, 13.0, 9.0, 6.0, 6.0, 5.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.33984375, -6.131103515625, -5.92236328125, -5.713623046875, -5.5048828125, -5.296142578125, -5.08740234375, -4.878662109375, -4.669921875, -4.461181640625, -4.25244140625, -4.043701171875, -3.8349609375, -3.626220703125, -3.41748046875, -3.208740234375, -3.0, -2.791259765625, -2.58251953125, -2.373779296875, -2.1650390625, -1.956298828125, -1.74755859375, -1.538818359375, -1.330078125, -1.121337890625, -0.91259765625, -0.703857421875, -0.4951171875, -0.286376953125, -0.07763671875, 0.131103515625, 0.33984375, 0.548583984375, 0.75732421875, 0.966064453125, 1.1748046875, 1.383544921875, 1.59228515625, 1.801025390625, 2.009765625, 2.218505859375, 2.42724609375, 2.635986328125, 2.8447265625, 3.053466796875, 3.26220703125, 3.470947265625, 3.6796875, 3.888427734375, 4.09716796875, 4.305908203125, 4.5146484375, 4.723388671875, 4.93212890625, 5.140869140625, 5.349609375, 5.558349609375, 5.76708984375, 5.975830078125, 6.1845703125, 6.393310546875, 6.60205078125, 6.810791015625, 7.01953125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 10.0, 27.0, 31.0, 35.0, 69.0, 120.0, 184.0, 260.0, 428.0, 591.0, 969.0, 1465.0, 2432.0, 3778.0, 6205.0, 10201.0, 16611.0, 27363.0, 45864.0, 74443.0, 118052.0, 168866.0, 184317.0, 142999.0, 94501.0, 58315.0, 35358.0, 21050.0, 13020.0, 7873.0, 4780.0, 3038.0, 1870.0, 1250.0, 745.0, 461.0, 328.0, 218.0, 140.0, 84.0, 60.0, 36.0, 31.0, 24.0, 16.0, 7.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.658203125, -0.6384048461914062, -0.6186065673828125, -0.5988082885742188, -0.579010009765625, -0.5592117309570312, -0.5394134521484375, -0.5196151733398438, -0.49981689453125, -0.48001861572265625, -0.4602203369140625, -0.44042205810546875, -0.420623779296875, -0.40082550048828125, -0.3810272216796875, -0.36122894287109375, -0.3414306640625, -0.32163238525390625, -0.3018341064453125, -0.28203582763671875, -0.262237548828125, -0.24243927001953125, -0.2226409912109375, -0.20284271240234375, -0.18304443359375, -0.16324615478515625, -0.1434478759765625, -0.12364959716796875, -0.103851318359375, -0.08405303955078125, -0.0642547607421875, -0.04445648193359375, -0.024658203125, -0.00485992431640625, 0.0149383544921875, 0.03473663330078125, 0.054534912109375, 0.07433319091796875, 0.0941314697265625, 0.11392974853515625, 0.13372802734375, 0.15352630615234375, 0.1733245849609375, 0.19312286376953125, 0.212921142578125, 0.23271942138671875, 0.2525177001953125, 0.27231597900390625, 0.2921142578125, 0.31191253662109375, 0.3317108154296875, 0.35150909423828125, 0.371307373046875, 0.39110565185546875, 0.4109039306640625, 0.43070220947265625, 0.45050048828125, 0.47029876708984375, 0.4900970458984375, 0.5098953247070312, 0.529693603515625, 0.5494918823242188, 0.5692901611328125, 0.5890884399414062, 0.60888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 4.0, 11.0, 7.0, 12.0, 12.0, 20.0, 25.0, 27.0, 28.0, 24.0, 34.0, 38.0, 34.0, 30.0, 25.0, 51.0, 47.0, 49.0, 1063.0, 35.0, 47.0, 41.0, 27.0, 41.0, 38.0, 37.0, 22.0, 32.0, 28.0, 7.0, 15.0, 19.0, 11.0, 19.0, 10.0, 5.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.82421875, -3.700927734375, -3.57763671875, -3.454345703125, -3.3310546875, -3.207763671875, -3.08447265625, -2.961181640625, -2.837890625, -2.714599609375, -2.59130859375, -2.468017578125, -2.3447265625, -2.221435546875, -2.09814453125, -1.974853515625, -1.8515625, -1.728271484375, -1.60498046875, -1.481689453125, -1.3583984375, -1.235107421875, -1.11181640625, -0.988525390625, -0.865234375, -0.741943359375, -0.61865234375, -0.495361328125, -0.3720703125, -0.248779296875, -0.12548828125, -0.002197265625, 0.12109375, 0.244384765625, 0.36767578125, 0.490966796875, 0.6142578125, 0.737548828125, 0.86083984375, 0.984130859375, 1.107421875, 1.230712890625, 1.35400390625, 1.477294921875, 1.6005859375, 1.723876953125, 1.84716796875, 1.970458984375, 2.09375, 2.217041015625, 2.34033203125, 2.463623046875, 2.5869140625, 2.710205078125, 2.83349609375, 2.956787109375, 3.080078125, 3.203369140625, 3.32666015625, 3.449951171875, 3.5732421875, 3.696533203125, 3.81982421875, 3.943115234375, 4.06640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 8.0, 9.0, 26.0, 22.0, 36.0, 55.0, 91.0, 159.0, 201.0, 274.0, 502.0, 746.0, 1006.0, 1513.0, 2313.0, 3333.0, 4921.0, 7543.0, 11356.0, 17515.0, 26108.0, 39365.0, 58054.0, 81631.0, 107198.0, 131506.0, 1179433.0, 119300.0, 93625.0, 68268.0, 46755.0, 31876.0, 20788.0, 13914.0, 9152.0, 6081.0, 4077.0, 2738.0, 1869.0, 1218.0, 824.0, 615.0, 390.0, 270.0, 168.0, 117.0, 59.0, 41.0, 26.0, 16.0, 15.0, 2.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.3614654541015625, -0.348663330078125, -0.3358612060546875, -0.32305908203125, -0.3102569580078125, -0.297454833984375, -0.2846527099609375, -0.2718505859375, -0.2590484619140625, -0.246246337890625, -0.2334442138671875, -0.22064208984375, -0.2078399658203125, -0.195037841796875, -0.1822357177734375, -0.16943359375, -0.1566314697265625, -0.143829345703125, -0.1310272216796875, -0.11822509765625, -0.1054229736328125, -0.092620849609375, -0.0798187255859375, -0.0670166015625, -0.0542144775390625, -0.041412353515625, -0.0286102294921875, -0.01580810546875, -0.0030059814453125, 0.009796142578125, 0.0225982666015625, 0.035400390625, 0.0482025146484375, 0.061004638671875, 0.0738067626953125, 0.08660888671875, 0.0994110107421875, 0.112213134765625, 0.1250152587890625, 0.1378173828125, 0.1506195068359375, 0.163421630859375, 0.1762237548828125, 0.18902587890625, 0.2018280029296875, 0.214630126953125, 0.2274322509765625, 0.240234375, 0.2530364990234375, 0.265838623046875, 0.2786407470703125, 0.29144287109375, 0.3042449951171875, 0.317047119140625, 0.3298492431640625, 0.3426513671875, 0.3554534912109375, 0.368255615234375, 0.3810577392578125, 0.39385986328125, 0.4066619873046875, 0.419464111328125, 0.4322662353515625, 0.445068359375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 7.0, 19.0, 16.0, 11.0, 31.0, 34.0, 39.0, 31.0, 42.0, 54.0, 50.0, 64.0, 52.0, 78.0, 61.0, 60.0, 55.0, 57.0, 31.0, 31.0, 27.0, 27.0, 21.0, 13.0, 10.0, 17.0, 11.0, 4.0, 8.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004526108503341675, -0.004394471645355225, -0.004262834787368774, -0.004131197929382324, -0.003999561071395874, -0.003867924213409424, -0.0037362873554229736, -0.0036046504974365234, -0.0034730136394500732, -0.003341376781463623, -0.003209739923477173, -0.0030781030654907227, -0.0029464662075042725, -0.0028148293495178223, -0.002683192491531372, -0.002551555633544922, -0.0024199187755584717, -0.0022882819175720215, -0.0021566450595855713, -0.002025008201599121, -0.001893371343612671, -0.0017617344856262207, -0.0016300976276397705, -0.0014984607696533203, -0.0013668239116668701, -0.00123518705368042, -0.0011035501956939697, -0.0009719133377075195, -0.0008402764797210693, -0.0007086396217346191, -0.0005770027637481689, -0.00044536590576171875, -0.00031372904777526855, -0.00018209218978881836, -5.0455331802368164e-05, 8.118152618408203e-05, 0.00021281838417053223, 0.0003444552421569824, 0.0004760921001434326, 0.0006077289581298828, 0.000739365816116333, 0.0008710026741027832, 0.0010026395320892334, 0.0011342763900756836, 0.0012659132480621338, 0.001397550106048584, 0.0015291869640350342, 0.0016608238220214844, 0.0017924606800079346, 0.0019240975379943848, 0.002055734395980835, 0.002187371253967285, 0.0023190081119537354, 0.0024506449699401855, 0.0025822818279266357, 0.002713918685913086, 0.002845555543899536, 0.0029771924018859863, 0.0031088292598724365, 0.0032404661178588867, 0.003372102975845337, 0.003503739833831787, 0.0036353766918182373, 0.0037670135498046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 13.0, 3.0, 17.0, 14.0, 18.0, 13.0, 32.0, 34.0, 34.0, 54.0, 77.0, 95.0, 159.0, 262.0, 688.0, 16167.0, 1021004.0, 8435.0, 565.0, 276.0, 144.0, 111.0, 65.0, 50.0, 48.0, 38.0, 33.0, 23.0, 16.0, 14.0, 6.0, 13.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07415771484375, -0.07135295867919922, -0.06854820251464844, -0.06574344635009766, -0.06293869018554688, -0.060133934020996094, -0.05732917785644531, -0.05452442169189453, -0.05171966552734375, -0.04891490936279297, -0.04611015319824219, -0.043305397033691406, -0.040500640869140625, -0.037695884704589844, -0.03489112854003906, -0.03208637237548828, -0.0292816162109375, -0.02647686004638672, -0.023672103881835938, -0.020867347717285156, -0.018062591552734375, -0.015257835388183594, -0.012453079223632812, -0.009648323059082031, -0.00684356689453125, -0.004038810729980469, -0.0012340545654296875, 0.0015707015991210938, 0.004375457763671875, 0.007180213928222656, 0.009984970092773438, 0.012789726257324219, 0.015594482421875, 0.01839923858642578, 0.021203994750976562, 0.024008750915527344, 0.026813507080078125, 0.029618263244628906, 0.03242301940917969, 0.03522777557373047, 0.03803253173828125, 0.04083728790283203, 0.04364204406738281, 0.046446800231933594, 0.049251556396484375, 0.052056312561035156, 0.05486106872558594, 0.05766582489013672, 0.0604705810546875, 0.06327533721923828, 0.06608009338378906, 0.06888484954833984, 0.07168960571289062, 0.0744943618774414, 0.07729911804199219, 0.08010387420654297, 0.08290863037109375, 0.08571338653564453, 0.08851814270019531, 0.0913228988647461, 0.09412765502929688, 0.09693241119384766, 0.09973716735839844, 0.10254192352294922, 0.1053466796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 10.0, 892.0, 110.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033840483520179987, -0.002118284348398447, -0.000852520577609539, 0.0004132434260100126, 0.0016790071967989206, 0.0029447709675878286, 0.004210535436868668, 0.005476298741996288, 0.006742062978446484, 0.008007827214896679, 0.0092735905200243, 0.010539354756474495, 0.01180511899292469, 0.013070882298052311, 0.014336646534502506, 0.015602409839630127, 0.016868174076080322, 0.018133938312530518, 0.019399702548980713, 0.020665466785430908, 0.021931229159235954, 0.02319699339568615, 0.024462757632136345, 0.02572852000594139, 0.026994284242391586, 0.02826004847884178, 0.029525812715291977, 0.030791576951742172, 0.03205734118819237, 0.033323101699352264, 0.03458886593580246, 0.035854630172252655, 0.03712039813399315, 0.038386162370443344, 0.03965192660689354, 0.040917690843343735, 0.04218345507979393, 0.04344921559095383, 0.04471497982740402, 0.04598074406385422, 0.04724650830030441, 0.04851227253675461, 0.0497780367732048, 0.051043801009655, 0.052309565246105194, 0.05357532948255539, 0.054841093719005585, 0.05610685423016548, 0.057372622191905975, 0.05863838642835617, 0.059904150664806366, 0.06116991490125656, 0.06243567913770676, 0.06370144337415695, 0.06496720761060715, 0.06623297184705734, 0.06749872863292694, 0.06876449286937714, 0.07003025710582733, 0.07129602134227753, 0.07256178557872772, 0.07382754981517792, 0.07509331405162811, 0.07635907828807831, 0.0776248425245285]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 1.0, 5.0, 5.0, 5.0, 7.0, 17.0, 17.0, 12.0, 30.0, 39.0, 33.0, 48.0, 50.0, 48.0, 49.0, 56.0, 68.0, 55.0, 66.0, 60.0, 52.0, 49.0, 45.0, 31.0, 42.0, 28.0, 28.0, 18.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004139840602874756, -0.004024936817586422, -0.003910033032298088, -0.003795129247009754, -0.0036802254617214203, -0.0035653216764330864, -0.0034504178911447525, -0.0033355141058564186, -0.0032206103205680847, -0.003105706535279751, -0.002990802749991417, -0.002875898964703083, -0.002760995179414749, -0.0026460913941264153, -0.0025311876088380814, -0.0024162838235497475, -0.0023013800382614136, -0.0021864762529730797, -0.002071572467684746, -0.001956668682396412, -0.001841764897108078, -0.0017268611118197441, -0.0016119573265314102, -0.0014970535412430763, -0.0013821497559547424, -0.0012672459706664085, -0.0011523421853780746, -0.0010374384000897408, -0.0009225346148014069, -0.000807630829513073, -0.0006927270442247391, -0.0005778232589364052, -0.0004629194736480713, -0.0003480156883597374, -0.0002331119030714035, -0.00011820811778306961, -3.3043324947357178e-06, 0.00011159945279359818, 0.00022650323808193207, 0.00034140702337026596, 0.00045631080865859985, 0.0005712145939469337, 0.0006861183792352676, 0.0008010221645236015, 0.0009159259498119354, 0.0010308297351002693, 0.0011457335203886032, 0.001260637305676937, 0.001375541090965271, 0.0014904448762536049, 0.0016053486615419388, 0.0017202524468302727, 0.0018351562321186066, 0.0019500600174069405, 0.0020649638026952744, 0.0021798675879836082, 0.002294771373271942, 0.002409675158560276, 0.00252457894384861, 0.002639482729136944, 0.0027543865144252777, 0.0028692902997136116, 0.0029841940850019455, 0.0030990978702902794, 0.0032140016555786133]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 10.0, 7.0, 13.0, 15.0, 14.0, 20.0, 23.0, 28.0, 37.0, 27.0, 40.0, 35.0, 24.0, 42.0, 41.0, 30.0, 47.0, 41.0, 42.0, 56.0, 50.0, 40.0, 38.0, 36.0, 34.0, 29.0, 37.0, 24.0, 18.0, 16.0, 12.0, 16.0, 13.0, 9.0, 6.0, 6.0, 5.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.33984375, -6.131103515625, -5.92236328125, -5.713623046875, -5.5048828125, -5.296142578125, -5.08740234375, -4.878662109375, -4.669921875, -4.461181640625, -4.25244140625, -4.043701171875, -3.8349609375, -3.626220703125, -3.41748046875, -3.208740234375, -3.0, -2.791259765625, -2.58251953125, -2.373779296875, -2.1650390625, -1.956298828125, -1.74755859375, -1.538818359375, -1.330078125, -1.121337890625, -0.91259765625, -0.703857421875, -0.4951171875, -0.286376953125, -0.07763671875, 0.131103515625, 0.33984375, 0.548583984375, 0.75732421875, 0.966064453125, 1.1748046875, 1.383544921875, 1.59228515625, 1.801025390625, 2.009765625, 2.218505859375, 2.42724609375, 2.635986328125, 2.8447265625, 3.053466796875, 3.26220703125, 3.470947265625, 3.6796875, 3.888427734375, 4.09716796875, 4.305908203125, 4.5146484375, 4.723388671875, 4.93212890625, 5.140869140625, 5.349609375, 5.558349609375, 5.76708984375, 5.975830078125, 6.1845703125, 6.393310546875, 6.60205078125, 6.810791015625, 7.01953125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 13.0, 13.0, 16.0, 22.0, 30.0, 36.0, 59.0, 74.0, 93.0, 120.0, 211.0, 305.0, 642.0, 1360.0, 3251.0, 8775.0, 24009.0, 69591.0, 222593.0, 481514.0, 155921.0, 50551.0, 17758.0, 6541.0, 2587.0, 1041.0, 546.0, 289.0, 158.0, 117.0, 71.0, 50.0, 47.0, 35.0, 26.0, 17.0, 15.0, 8.0, 8.0, 5.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.037109375, -5.81640625, -5.595703125, -5.375, -5.154296875, -4.93359375, -4.712890625, -4.4921875, -4.271484375, -4.05078125, -3.830078125, -3.609375, -3.388671875, -3.16796875, -2.947265625, -2.7265625, -2.505859375, -2.28515625, -2.064453125, -1.84375, -1.623046875, -1.40234375, -1.181640625, -0.9609375, -0.740234375, -0.51953125, -0.298828125, -0.078125, 0.142578125, 0.36328125, 0.583984375, 0.8046875, 1.025390625, 1.24609375, 1.466796875, 1.6875, 1.908203125, 2.12890625, 2.349609375, 2.5703125, 2.791015625, 3.01171875, 3.232421875, 3.453125, 3.673828125, 3.89453125, 4.115234375, 4.3359375, 4.556640625, 4.77734375, 4.998046875, 5.21875, 5.439453125, 5.66015625, 5.880859375, 6.1015625, 6.322265625, 6.54296875, 6.763671875, 6.984375, 7.205078125, 7.42578125, 7.646484375, 7.8671875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 5.0, 4.0, 1.0, 5.0, 6.0, 5.0, 9.0, 15.0, 18.0, 15.0, 19.0, 31.0, 34.0, 32.0, 39.0, 41.0, 47.0, 63.0, 66.0, 157.0, 1621.0, 296.0, 118.0, 57.0, 41.0, 56.0, 42.0, 30.0, 38.0, 21.0, 31.0, 15.0, 16.0, 13.0, 12.0, 11.0, 4.0, 9.0, 2.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.046875, -25.2978515625, -24.548828125, -23.7998046875, -23.05078125, -22.3017578125, -21.552734375, -20.8037109375, -20.0546875, -19.3056640625, -18.556640625, -17.8076171875, -17.05859375, -16.3095703125, -15.560546875, -14.8115234375, -14.0625, -13.3134765625, -12.564453125, -11.8154296875, -11.06640625, -10.3173828125, -9.568359375, -8.8193359375, -8.0703125, -7.3212890625, -6.572265625, -5.8232421875, -5.07421875, -4.3251953125, -3.576171875, -2.8271484375, -2.078125, -1.3291015625, -0.580078125, 0.1689453125, 0.91796875, 1.6669921875, 2.416015625, 3.1650390625, 3.9140625, 4.6630859375, 5.412109375, 6.1611328125, 6.91015625, 7.6591796875, 8.408203125, 9.1572265625, 9.90625, 10.6552734375, 11.404296875, 12.1533203125, 12.90234375, 13.6513671875, 14.400390625, 15.1494140625, 15.8984375, 16.6474609375, 17.396484375, 18.1455078125, 18.89453125, 19.6435546875, 20.392578125, 21.1416015625, 21.890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 17.0, 15.0, 14.0, 19.0, 16.0, 38.0, 38.0, 49.0, 66.0, 87.0, 131.0, 200.0, 353.0, 681.0, 1884.0, 48743.0, 3080383.0, 10106.0, 1299.0, 587.0, 298.0, 174.0, 120.0, 90.0, 71.0, 52.0, 37.0, 29.0, 26.0, 11.0, 12.0, 11.0, 8.0, 4.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.84375, -60.04345703125, -58.2431640625, -56.44287109375, -54.642578125, -52.84228515625, -51.0419921875, -49.24169921875, -47.44140625, -45.64111328125, -43.8408203125, -42.04052734375, -40.240234375, -38.43994140625, -36.6396484375, -34.83935546875, -33.0390625, -31.23876953125, -29.4384765625, -27.63818359375, -25.837890625, -24.03759765625, -22.2373046875, -20.43701171875, -18.63671875, -16.83642578125, -15.0361328125, -13.23583984375, -11.435546875, -9.63525390625, -7.8349609375, -6.03466796875, -4.234375, -2.43408203125, -0.6337890625, 1.16650390625, 2.966796875, 4.76708984375, 6.5673828125, 8.36767578125, 10.16796875, 11.96826171875, 13.7685546875, 15.56884765625, 17.369140625, 19.16943359375, 20.9697265625, 22.77001953125, 24.5703125, 26.37060546875, 28.1708984375, 29.97119140625, 31.771484375, 33.57177734375, 35.3720703125, 37.17236328125, 38.97265625, 40.77294921875, 42.5732421875, 44.37353515625, 46.173828125, 47.97412109375, 49.7744140625, 51.57470703125, 53.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 27.0, 89.0, 199.0, 290.0, 211.0, 131.0, 43.0, 12.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.803340911865234, -27.34074592590332, -25.878150939941406, -24.41555404663086, -22.952960968017578, -21.49036407470703, -20.027769088745117, -18.565174102783203, -17.10257911682129, -15.639984130859375, -14.177389144897461, -12.71479320526123, -11.252198219299316, -9.789603233337402, -8.327007293701172, -6.864412307739258, -5.401817321777344, -3.9392220973968506, -2.4766268730163574, -1.0140314102172852, 0.4485635757446289, 1.911158561706543, 3.3737545013427734, 4.8363494873046875, 6.298944473266602, 7.761539459228516, 9.22413444519043, 10.68673038482666, 12.149325370788574, 13.611920356750488, 15.074516296386719, 16.537111282348633, 17.99970245361328, 19.462297439575195, 20.92489242553711, 22.387489318847656, 23.850082397460938, 25.312679290771484, 26.7752742767334, 28.237869262695312, 29.700464248657227, 31.16305923461914, 32.62565612792969, 34.08824920654297, 35.550846099853516, 37.0134391784668, 38.476036071777344, 39.938629150390625, 41.40122604370117, 42.86382293701172, 44.326416015625, 45.78901290893555, 47.25160598754883, 48.714202880859375, 50.176795959472656, 51.6393928527832, 53.10198974609375, 54.5645866394043, 56.02717971801758, 57.489776611328125, 58.952369689941406, 60.41496658325195, 61.8775634765625, 63.34015655517578, 64.80274963378906]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 7.0, 3.0, 2.0, 4.0, 5.0, 4.0, 12.0, 9.0, 15.0, 18.0, 17.0, 17.0, 20.0, 19.0, 20.0, 32.0, 32.0, 24.0, 39.0, 28.0, 31.0, 37.0, 30.0, 50.0, 49.0, 52.0, 45.0, 29.0, 34.0, 46.0, 32.0, 44.0, 21.0, 25.0, 25.0, 14.0, 20.0, 17.0, 11.0, 10.0, 7.0, 11.0, 7.0, 7.0, 7.0, 6.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.92815017700195, -51.248390197753906, -49.568626403808594, -47.88886642456055, -46.209102630615234, -44.52934265136719, -42.849578857421875, -41.16981887817383, -39.49005889892578, -37.810298919677734, -36.13053512573242, -34.450775146484375, -32.77101135253906, -31.091251373291016, -29.411489486694336, -27.731727600097656, -26.051963806152344, -24.372201919555664, -22.692440032958984, -21.012680053710938, -19.332916259765625, -17.653156280517578, -15.973394393920898, -14.293632507324219, -12.613870620727539, -10.93410873413086, -9.25434684753418, -7.574585914611816, -5.894824028015137, -4.215062141418457, -2.5353012084960938, -0.8555393218994141, 0.82421875, 2.5039803981781006, 4.183742046356201, 5.863503456115723, 7.543265342712402, 9.223027229309082, 10.902788162231445, 12.582550048828125, 14.262311935424805, 15.942073822021484, 17.621835708618164, 19.301597595214844, 20.98135757446289, 22.661121368408203, 24.34088134765625, 26.02064323425293, 27.70040512084961, 29.38016700744629, 31.05992889404297, 32.739688873291016, 34.41945266723633, 36.099212646484375, 37.77897644042969, 39.458736419677734, 41.13849639892578, 42.81825637817383, 44.49802017211914, 46.17778015136719, 47.8575439453125, 49.53730392456055, 51.217063903808594, 52.896827697753906, 54.57659149169922]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 6.0, 4.0, 5.0, 5.0, 17.0, 11.0, 24.0, 10.0, 19.0, 22.0, 28.0, 24.0, 30.0, 37.0, 30.0, 33.0, 32.0, 40.0, 38.0, 42.0, 54.0, 32.0, 56.0, 53.0, 45.0, 39.0, 30.0, 32.0, 27.0, 30.0, 32.0, 20.0, 19.0, 13.0, 16.0, 10.0, 6.0, 11.0, 10.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.515625, -6.29534912109375, -6.0750732421875, -5.85479736328125, -5.634521484375, -5.41424560546875, -5.1939697265625, -4.97369384765625, -4.75341796875, -4.53314208984375, -4.3128662109375, -4.09259033203125, -3.872314453125, -3.65203857421875, -3.4317626953125, -3.21148681640625, -2.9912109375, -2.77093505859375, -2.5506591796875, -2.33038330078125, -2.110107421875, -1.88983154296875, -1.6695556640625, -1.44927978515625, -1.22900390625, -1.00872802734375, -0.7884521484375, -0.56817626953125, -0.347900390625, -0.12762451171875, 0.0926513671875, 0.31292724609375, 0.533203125, 0.75347900390625, 0.9737548828125, 1.19403076171875, 1.414306640625, 1.63458251953125, 1.8548583984375, 2.07513427734375, 2.29541015625, 2.51568603515625, 2.7359619140625, 2.95623779296875, 3.176513671875, 3.39678955078125, 3.6170654296875, 3.83734130859375, 4.0576171875, 4.27789306640625, 4.4981689453125, 4.71844482421875, 4.938720703125, 5.15899658203125, 5.3792724609375, 5.59954833984375, 5.81982421875, 6.04010009765625, 6.2603759765625, 6.48065185546875, 6.700927734375, 6.92120361328125, 7.1414794921875, 7.36175537109375, 7.58203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 5.0, 6.0, 10.0, 11.0, 12.0, 13.0, 25.0, 19.0, 33.0, 37.0, 51.0, 77.0, 106.0, 187.0, 321.0, 888.0, 4285.0, 49407.0, 1724629.0, 2333356.0, 73361.0, 5481.0, 1024.0, 350.0, 148.0, 115.0, 79.0, 58.0, 33.0, 31.0, 24.0, 20.0, 15.0, 9.0, 14.0, 11.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.3125, -22.58544921875, -21.8583984375, -21.13134765625, -20.404296875, -19.67724609375, -18.9501953125, -18.22314453125, -17.49609375, -16.76904296875, -16.0419921875, -15.31494140625, -14.587890625, -13.86083984375, -13.1337890625, -12.40673828125, -11.6796875, -10.95263671875, -10.2255859375, -9.49853515625, -8.771484375, -8.04443359375, -7.3173828125, -6.59033203125, -5.86328125, -5.13623046875, -4.4091796875, -3.68212890625, -2.955078125, -2.22802734375, -1.5009765625, -0.77392578125, -0.046875, 0.68017578125, 1.4072265625, 2.13427734375, 2.861328125, 3.58837890625, 4.3154296875, 5.04248046875, 5.76953125, 6.49658203125, 7.2236328125, 7.95068359375, 8.677734375, 9.40478515625, 10.1318359375, 10.85888671875, 11.5859375, 12.31298828125, 13.0400390625, 13.76708984375, 14.494140625, 15.22119140625, 15.9482421875, 16.67529296875, 17.40234375, 18.12939453125, 18.8564453125, 19.58349609375, 20.310546875, 21.03759765625, 21.7646484375, 22.49169921875, 23.21875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 10.0, 16.0, 25.0, 30.0, 41.0, 67.0, 76.0, 144.0, 163.0, 264.0, 362.0, 492.0, 547.0, 532.0, 360.0, 258.0, 213.0, 138.0, 109.0, 52.0, 38.0, 35.0, 24.0, 17.0, 16.0, 10.0, 4.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.4833984375, -12.013671875, -11.5439453125, -11.07421875, -10.6044921875, -10.134765625, -9.6650390625, -9.1953125, -8.7255859375, -8.255859375, -7.7861328125, -7.31640625, -6.8466796875, -6.376953125, -5.9072265625, -5.4375, -4.9677734375, -4.498046875, -4.0283203125, -3.55859375, -3.0888671875, -2.619140625, -2.1494140625, -1.6796875, -1.2099609375, -0.740234375, -0.2705078125, 0.19921875, 0.6689453125, 1.138671875, 1.6083984375, 2.078125, 2.5478515625, 3.017578125, 3.4873046875, 3.95703125, 4.4267578125, 4.896484375, 5.3662109375, 5.8359375, 6.3056640625, 6.775390625, 7.2451171875, 7.71484375, 8.1845703125, 8.654296875, 9.1240234375, 9.59375, 10.0634765625, 10.533203125, 11.0029296875, 11.47265625, 11.9423828125, 12.412109375, 12.8818359375, 13.3515625, 13.8212890625, 14.291015625, 14.7607421875, 15.23046875, 15.7001953125, 16.169921875, 16.6396484375, 17.109375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 13.0, 9.0, 23.0, 20.0, 47.0, 35.0, 72.0, 87.0, 143.0, 197.0, 291.0, 406.0, 1017.0, 51073.0, 4113891.0, 24742.0, 844.0, 430.0, 274.0, 220.0, 127.0, 95.0, 69.0, 45.0, 30.0, 25.0, 15.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-89.4375, -86.9833984375, -84.529296875, -82.0751953125, -79.62109375, -77.1669921875, -74.712890625, -72.2587890625, -69.8046875, -67.3505859375, -64.896484375, -62.4423828125, -59.98828125, -57.5341796875, -55.080078125, -52.6259765625, -50.171875, -47.7177734375, -45.263671875, -42.8095703125, -40.35546875, -37.9013671875, -35.447265625, -32.9931640625, -30.5390625, -28.0849609375, -25.630859375, -23.1767578125, -20.72265625, -18.2685546875, -15.814453125, -13.3603515625, -10.90625, -8.4521484375, -5.998046875, -3.5439453125, -1.08984375, 1.3642578125, 3.818359375, 6.2724609375, 8.7265625, 11.1806640625, 13.634765625, 16.0888671875, 18.54296875, 20.9970703125, 23.451171875, 25.9052734375, 28.359375, 30.8134765625, 33.267578125, 35.7216796875, 38.17578125, 40.6298828125, 43.083984375, 45.5380859375, 47.9921875, 50.4462890625, 52.900390625, 55.3544921875, 57.80859375, 60.2626953125, 62.716796875, 65.1708984375, 67.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 15.0, 17.0, 22.0, 47.0, 82.0, 125.0, 139.0, 133.0, 149.0, 108.0, 74.0, 43.0, 26.0, 14.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.05316162109375, -57.044376373291016, -55.03559494018555, -53.02680969238281, -51.018028259277344, -49.00924301147461, -47.000457763671875, -44.991676330566406, -42.98289489746094, -40.9741096496582, -38.965328216552734, -36.95654296875, -34.94776153564453, -32.9389762878418, -30.930192947387695, -28.921409606933594, -26.91262435913086, -24.903841018676758, -22.895057678222656, -20.886272430419922, -18.877490997314453, -16.86870574951172, -14.859922409057617, -12.851139068603516, -10.842355728149414, -8.833572387695312, -6.824788570404053, -4.816004753112793, -2.8072214126586914, -0.7984380722045898, 1.2103462219238281, 3.2191295623779297, 5.227912902832031, 7.236696243286133, 9.245479583740234, 11.254263877868652, 13.263047218322754, 15.271830558776855, 17.280614852905273, 19.289398193359375, 21.298181533813477, 23.306964874267578, 25.31574821472168, 27.32453155517578, 29.333316802978516, 31.342098236083984, 33.35088348388672, 35.35966491699219, 37.36845016479492, 39.377235412597656, 41.386016845703125, 43.39480209350586, 45.40358352661133, 47.41236877441406, 49.42115020751953, 51.429935455322266, 53.438720703125, 55.447505950927734, 57.4562873840332, 59.46507263183594, 61.473854064941406, 63.48263931274414, 65.49142456054688, 67.50020599365234, 69.50898742675781]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 17.0, 13.0, 14.0, 8.0, 12.0, 19.0, 22.0, 28.0, 32.0, 23.0, 36.0, 33.0, 32.0, 47.0, 34.0, 27.0, 33.0, 36.0, 31.0, 39.0, 40.0, 28.0, 41.0, 42.0, 27.0, 28.0, 31.0, 28.0, 27.0, 21.0, 16.0, 17.0, 13.0, 10.0, 5.0, 14.0, 8.0, 13.0, 8.0, 10.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.251251220703125, -37.02933120727539, -35.807411193847656, -34.58549499511719, -33.36357498168945, -32.14165496826172, -30.919736862182617, -29.697818756103516, -28.47589874267578, -27.253978729248047, -26.032060623168945, -24.810142517089844, -23.58822250366211, -22.366302490234375, -21.144384384155273, -19.922466278076172, -18.700546264648438, -17.478626251220703, -16.2567081451416, -15.034789085388184, -13.812870025634766, -12.590950965881348, -11.36903190612793, -10.147112846374512, -8.925193786621094, -7.703274726867676, -6.481355667114258, -5.25943660736084, -4.037517547607422, -2.815598487854004, -1.593679428100586, -0.37176036834716797, 0.85015869140625, 2.072077751159668, 3.293996810913086, 4.515915870666504, 5.737834930419922, 6.95975399017334, 8.181673049926758, 9.403592109680176, 10.625511169433594, 11.847430229187012, 13.06934928894043, 14.291268348693848, 15.513187408447266, 16.735107421875, 17.9570255279541, 19.178943634033203, 20.400863647460938, 21.622783660888672, 22.844701766967773, 24.066619873046875, 25.28853988647461, 26.510459899902344, 27.732378005981445, 28.954296112060547, 30.17621612548828, 31.398136138916016, 32.62005615234375, 33.84197235107422, 35.06389236450195, 36.28581237792969, 37.507728576660156, 38.72964859008789, 39.951568603515625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 4.0, 11.0, 11.0, 17.0, 9.0, 18.0, 26.0, 30.0, 27.0, 20.0, 23.0, 34.0, 41.0, 31.0, 34.0, 33.0, 37.0, 48.0, 44.0, 38.0, 45.0, 46.0, 27.0, 31.0, 30.0, 29.0, 39.0, 29.0, 28.0, 25.0, 24.0, 11.0, 16.0, 17.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.234375, -6.02325439453125, -5.8121337890625, -5.60101318359375, -5.389892578125, -5.17877197265625, -4.9676513671875, -4.75653076171875, -4.54541015625, -4.33428955078125, -4.1231689453125, -3.91204833984375, -3.700927734375, -3.48980712890625, -3.2786865234375, -3.06756591796875, -2.8564453125, -2.64532470703125, -2.4342041015625, -2.22308349609375, -2.011962890625, -1.80084228515625, -1.5897216796875, -1.37860107421875, -1.16748046875, -0.95635986328125, -0.7452392578125, -0.53411865234375, -0.322998046875, -0.11187744140625, 0.0992431640625, 0.31036376953125, 0.521484375, 0.73260498046875, 0.9437255859375, 1.15484619140625, 1.365966796875, 1.57708740234375, 1.7882080078125, 1.99932861328125, 2.21044921875, 2.42156982421875, 2.6326904296875, 2.84381103515625, 3.054931640625, 3.26605224609375, 3.4771728515625, 3.68829345703125, 3.8994140625, 4.11053466796875, 4.3216552734375, 4.53277587890625, 4.743896484375, 4.95501708984375, 5.1661376953125, 5.37725830078125, 5.58837890625, 5.79949951171875, 6.0106201171875, 6.22174072265625, 6.432861328125, 6.64398193359375, 6.8551025390625, 7.06622314453125, 7.27734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 11.0, 15.0, 22.0, 28.0, 45.0, 82.0, 128.0, 189.0, 335.0, 539.0, 986.0, 1653.0, 2899.0, 5041.0, 8831.0, 15892.0, 28667.0, 52982.0, 99218.0, 171983.0, 229198.0, 187151.0, 110648.0, 59523.0, 31914.0, 17429.0, 9827.0, 5558.0, 3258.0, 1830.0, 1105.0, 639.0, 350.0, 223.0, 108.0, 86.0, 47.0, 27.0, 29.0, 12.0, 15.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.935546875, -0.9085006713867188, -0.8814544677734375, -0.8544082641601562, -0.827362060546875, -0.8003158569335938, -0.7732696533203125, -0.7462234497070312, -0.71917724609375, -0.6921310424804688, -0.6650848388671875, -0.6380386352539062, -0.610992431640625, -0.5839462280273438, -0.5569000244140625, -0.5298538208007812, -0.5028076171875, -0.47576141357421875, -0.4487152099609375, -0.42166900634765625, -0.394622802734375, -0.36757659912109375, -0.3405303955078125, -0.31348419189453125, -0.28643798828125, -0.25939178466796875, -0.2323455810546875, -0.20529937744140625, -0.178253173828125, -0.15120697021484375, -0.1241607666015625, -0.09711456298828125, -0.070068359375, -0.04302215576171875, -0.0159759521484375, 0.01107025146484375, 0.038116455078125, 0.06516265869140625, 0.0922088623046875, 0.11925506591796875, 0.14630126953125, 0.17334747314453125, 0.2003936767578125, 0.22743988037109375, 0.254486083984375, 0.28153228759765625, 0.3085784912109375, 0.33562469482421875, 0.3626708984375, 0.38971710205078125, 0.4167633056640625, 0.44380950927734375, 0.470855712890625, 0.49790191650390625, 0.5249481201171875, 0.5519943237304688, 0.57904052734375, 0.6060867309570312, 0.6331329345703125, 0.6601791381835938, 0.687225341796875, 0.7142715454101562, 0.7413177490234375, 0.7683639526367188, 0.79541015625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 4.0, 8.0, 10.0, 10.0, 16.0, 12.0, 24.0, 14.0, 20.0, 21.0, 23.0, 22.0, 28.0, 33.0, 35.0, 38.0, 32.0, 30.0, 35.0, 43.0, 1070.0, 45.0, 38.0, 30.0, 32.0, 33.0, 35.0, 35.0, 32.0, 31.0, 25.0, 18.0, 28.0, 24.0, 14.0, 14.0, 8.0, 8.0, 9.0, 8.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.89453125, -4.76123046875, -4.6279296875, -4.49462890625, -4.361328125, -4.22802734375, -4.0947265625, -3.96142578125, -3.828125, -3.69482421875, -3.5615234375, -3.42822265625, -3.294921875, -3.16162109375, -3.0283203125, -2.89501953125, -2.76171875, -2.62841796875, -2.4951171875, -2.36181640625, -2.228515625, -2.09521484375, -1.9619140625, -1.82861328125, -1.6953125, -1.56201171875, -1.4287109375, -1.29541015625, -1.162109375, -1.02880859375, -0.8955078125, -0.76220703125, -0.62890625, -0.49560546875, -0.3623046875, -0.22900390625, -0.095703125, 0.03759765625, 0.1708984375, 0.30419921875, 0.4375, 0.57080078125, 0.7041015625, 0.83740234375, 0.970703125, 1.10400390625, 1.2373046875, 1.37060546875, 1.50390625, 1.63720703125, 1.7705078125, 1.90380859375, 2.037109375, 2.17041015625, 2.3037109375, 2.43701171875, 2.5703125, 2.70361328125, 2.8369140625, 2.97021484375, 3.103515625, 3.23681640625, 3.3701171875, 3.50341796875, 3.63671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 6.0, 7.0, 15.0, 18.0, 39.0, 44.0, 65.0, 111.0, 131.0, 220.0, 318.0, 460.0, 616.0, 1020.0, 1363.0, 2043.0, 2954.0, 4346.0, 6225.0, 9466.0, 13838.0, 20542.0, 30493.0, 44887.0, 63640.0, 87730.0, 112104.0, 989791.0, 314533.0, 109501.0, 84833.0, 62118.0, 43142.0, 29349.0, 20013.0, 13196.0, 8850.0, 6044.0, 4159.0, 2775.0, 1913.0, 1347.0, 892.0, 626.0, 448.0, 303.0, 198.0, 138.0, 101.0, 52.0, 48.0, 25.0, 13.0, 6.0, 14.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.42041015625, -0.406829833984375, -0.39324951171875, -0.379669189453125, -0.3660888671875, -0.352508544921875, -0.33892822265625, -0.325347900390625, -0.311767578125, -0.298187255859375, -0.28460693359375, -0.271026611328125, -0.2574462890625, -0.243865966796875, -0.23028564453125, -0.216705322265625, -0.203125, -0.189544677734375, -0.17596435546875, -0.162384033203125, -0.1488037109375, -0.135223388671875, -0.12164306640625, -0.108062744140625, -0.094482421875, -0.080902099609375, -0.06732177734375, -0.053741455078125, -0.0401611328125, -0.026580810546875, -0.01300048828125, 0.000579833984375, 0.01416015625, 0.027740478515625, 0.04132080078125, 0.054901123046875, 0.0684814453125, 0.082061767578125, 0.09564208984375, 0.109222412109375, 0.122802734375, 0.136383056640625, 0.14996337890625, 0.163543701171875, 0.1771240234375, 0.190704345703125, 0.20428466796875, 0.217864990234375, 0.2314453125, 0.245025634765625, 0.25860595703125, 0.272186279296875, 0.2857666015625, 0.299346923828125, 0.31292724609375, 0.326507568359375, 0.340087890625, 0.353668212890625, 0.36724853515625, 0.380828857421875, 0.3944091796875, 0.407989501953125, 0.42156982421875, 0.435150146484375, 0.44873046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 11.0, 9.0, 16.0, 24.0, 29.0, 34.0, 34.0, 59.0, 88.0, 74.0, 102.0, 82.0, 106.0, 66.0, 46.0, 43.0, 28.0, 29.0, 14.0, 9.0, 21.0, 14.0, 11.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.008966803550720215, -0.00870966911315918, -0.008452534675598145, -0.00819540023803711, -0.007938265800476074, -0.007681131362915039, -0.007423996925354004, -0.007166862487792969, -0.006909728050231934, -0.0066525936126708984, -0.006395459175109863, -0.006138324737548828, -0.005881190299987793, -0.005624055862426758, -0.005366921424865723, -0.0051097869873046875, -0.004852652549743652, -0.004595518112182617, -0.004338383674621582, -0.004081249237060547, -0.0038241147994995117, -0.0035669803619384766, -0.0033098459243774414, -0.0030527114868164062, -0.002795577049255371, -0.002538442611694336, -0.0022813081741333008, -0.0020241737365722656, -0.0017670392990112305, -0.0015099048614501953, -0.0012527704238891602, -0.000995635986328125, -0.0007385015487670898, -0.0004813671112060547, -0.00022423267364501953, 3.2901763916015625e-05, 0.0002900362014770508, 0.0005471706390380859, 0.0008043050765991211, 0.0010614395141601562, 0.0013185739517211914, 0.0015757083892822266, 0.0018328428268432617, 0.002089977264404297, 0.002347111701965332, 0.002604246139526367, 0.0028613805770874023, 0.0031185150146484375, 0.0033756494522094727, 0.003632783889770508, 0.003889918327331543, 0.004147052764892578, 0.004404187202453613, 0.0046613216400146484, 0.004918456077575684, 0.005175590515136719, 0.005432724952697754, 0.005689859390258789, 0.005946993827819824, 0.006204128265380859, 0.0064612627029418945, 0.00671839714050293, 0.006975531578063965, 0.007232666015625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 4.0, 8.0, 12.0, 19.0, 28.0, 22.0, 35.0, 43.0, 58.0, 86.0, 128.0, 276.0, 733.0, 73865.0, 971411.0, 1009.0, 306.0, 162.0, 89.0, 62.0, 53.0, 31.0, 27.0, 25.0, 13.0, 9.0, 8.0, 9.0, 2.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.15081214904785156, -0.14525222778320312, -0.1396923065185547, -0.13413238525390625, -0.1285724639892578, -0.12301254272460938, -0.11745262145996094, -0.1118927001953125, -0.10633277893066406, -0.10077285766601562, -0.09521293640136719, -0.08965301513671875, -0.08409309387207031, -0.07853317260742188, -0.07297325134277344, -0.067413330078125, -0.06185340881347656, -0.056293487548828125, -0.05073356628417969, -0.04517364501953125, -0.03961372375488281, -0.034053802490234375, -0.028493881225585938, -0.0229339599609375, -0.017374038696289062, -0.011814117431640625, -0.0062541961669921875, -0.00069427490234375, 0.0048656463623046875, 0.010425567626953125, 0.015985488891601562, 0.02154541015625, 0.027105331420898438, 0.032665252685546875, 0.03822517395019531, 0.04378509521484375, 0.04934501647949219, 0.054904937744140625, 0.06046485900878906, 0.0660247802734375, 0.07158470153808594, 0.07714462280273438, 0.08270454406738281, 0.08826446533203125, 0.09382438659667969, 0.09938430786132812, 0.10494422912597656, 0.110504150390625, 0.11606407165527344, 0.12162399291992188, 0.1271839141845703, 0.13274383544921875, 0.1383037567138672, 0.14386367797851562, 0.14942359924316406, 0.1549835205078125, 0.16054344177246094, 0.16610336303710938, 0.1716632843017578, 0.17722320556640625, 0.1827831268310547, 0.18834304809570312, 0.19390296936035156, 0.199462890625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 440.0, 571.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007699718698859215, -0.0061701624654233456, -0.004640606231987476, -0.003111049998551607, -0.001581493765115738, -5.19375316798687e-05, 0.0014776187017560005, 0.003007175400853157, 0.004536731168627739, 0.006066287402063608, 0.007595843635499477, 0.009125400334596634, 0.010654956102371216, 0.012184511870145798, 0.013714068569242954, 0.01524362526834011, 0.016773181036114693, 0.018302736803889275, 0.019832294434309006, 0.021361850202083588, 0.02289140596985817, 0.02442096173763275, 0.025950517505407333, 0.027480075135827065, 0.029009630903601646, 0.03053918667137623, 0.03206874430179596, 0.03359830006957054, 0.03512785583734512, 0.036657411605119705, 0.03818696737289429, 0.03971652686595917, 0.04124607890844345, 0.04277563467621803, 0.044305190443992615, 0.0458347462117672, 0.04736430197954178, 0.04889386147260666, 0.05042341724038124, 0.05195297300815582, 0.053482528775930405, 0.05501208454370499, 0.05654164031147957, 0.05807119607925415, 0.05960075557231903, 0.06113031134009361, 0.0626598671078682, 0.06418941915035248, 0.06571897864341736, 0.06724853813648224, 0.06877809017896652, 0.0703076496720314, 0.07183720171451569, 0.07336676120758057, 0.07489631325006485, 0.07642587274312973, 0.07795542478561401, 0.0794849842786789, 0.08101453632116318, 0.08254409581422806, 0.08407364785671234, 0.08560320734977722, 0.0871327593922615, 0.08866231888532639, 0.09019187837839127]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 15.0, 12.0, 13.0, 20.0, 36.0, 29.0, 38.0, 46.0, 36.0, 62.0, 42.0, 60.0, 58.0, 67.0, 62.0, 73.0, 54.0, 51.0, 44.0, 38.0, 36.0, 26.0, 18.0, 19.0, 14.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00683361291885376, -0.006640167906880379, -0.006446722894906998, -0.006253277882933617, -0.006059832870960236, -0.0058663878589868546, -0.0056729428470134735, -0.0054794978350400925, -0.005286052823066711, -0.00509260781109333, -0.004899162799119949, -0.004705717787146568, -0.004512272775173187, -0.004318827763199806, -0.004125382751226425, -0.003931937739253044, -0.003738492727279663, -0.003545047715306282, -0.003351602703332901, -0.00315815769135952, -0.002964712679386139, -0.002771267667412758, -0.002577822655439377, -0.002384377643465996, -0.0021909326314926147, -0.0019974876195192337, -0.0018040426075458527, -0.0016105975955724716, -0.0014171525835990906, -0.0012237075716257095, -0.0010302625596523285, -0.0008368175476789474, -0.0006433725357055664, -0.00044992752373218536, -0.0002564825117588043, -6.303749978542328e-05, 0.00013040751218795776, 0.0003238525241613388, 0.0005172975361347198, 0.0007107425481081009, 0.0009041875600814819, 0.001097632572054863, 0.001291077584028244, 0.001484522596001625, 0.001677967607975006, 0.0018714126199483871, 0.002064857631921768, 0.0022583026438951492, 0.0024517476558685303, 0.0026451926678419113, 0.0028386376798152924, 0.0030320826917886734, 0.0032255277037620544, 0.0034189727157354355, 0.0036124177277088165, 0.0038058627396821976, 0.003999307751655579, 0.00419275276362896, 0.004386197775602341, 0.004579642787575722, 0.004773087799549103, 0.004966532811522484, 0.005159977823495865, 0.005353422835469246, 0.005546867847442627]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 4.0, 11.0, 11.0, 17.0, 9.0, 18.0, 26.0, 30.0, 27.0, 20.0, 23.0, 34.0, 41.0, 31.0, 34.0, 33.0, 37.0, 48.0, 44.0, 39.0, 44.0, 46.0, 27.0, 31.0, 30.0, 29.0, 39.0, 29.0, 28.0, 25.0, 24.0, 11.0, 16.0, 17.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.234375, -6.02325439453125, -5.8121337890625, -5.60101318359375, -5.389892578125, -5.17877197265625, -4.9676513671875, -4.75653076171875, -4.54541015625, -4.33428955078125, -4.1231689453125, -3.91204833984375, -3.700927734375, -3.48980712890625, -3.2786865234375, -3.06756591796875, -2.8564453125, -2.64532470703125, -2.4342041015625, -2.22308349609375, -2.011962890625, -1.80084228515625, -1.5897216796875, -1.37860107421875, -1.16748046875, -0.95635986328125, -0.7452392578125, -0.53411865234375, -0.322998046875, -0.11187744140625, 0.0992431640625, 0.31036376953125, 0.521484375, 0.73260498046875, 0.9437255859375, 1.15484619140625, 1.365966796875, 1.57708740234375, 1.7882080078125, 1.99932861328125, 2.21044921875, 2.42156982421875, 2.6326904296875, 2.84381103515625, 3.054931640625, 3.26605224609375, 3.4771728515625, 3.68829345703125, 3.8994140625, 4.11053466796875, 4.3216552734375, 4.53277587890625, 4.743896484375, 4.95501708984375, 5.1661376953125, 5.37725830078125, 5.58837890625, 5.79949951171875, 6.0106201171875, 6.22174072265625, 6.432861328125, 6.64398193359375, 6.8551025390625, 7.06622314453125, 7.27734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 11.0, 8.0, 7.0, 12.0, 17.0, 13.0, 26.0, 36.0, 41.0, 57.0, 70.0, 76.0, 99.0, 185.0, 223.0, 353.0, 721.0, 1722.0, 6081.0, 30020.0, 232816.0, 679922.0, 77375.0, 12928.0, 3125.0, 1059.0, 477.0, 293.0, 218.0, 151.0, 90.0, 79.0, 49.0, 50.0, 34.0, 19.0, 25.0, 13.0, 10.0, 9.0, 11.0, 4.0, 5.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.2578125, -10.8729248046875, -10.488037109375, -10.1031494140625, -9.71826171875, -9.3333740234375, -8.948486328125, -8.5635986328125, -8.1787109375, -7.7938232421875, -7.408935546875, -7.0240478515625, -6.63916015625, -6.2542724609375, -5.869384765625, -5.4844970703125, -5.099609375, -4.7147216796875, -4.329833984375, -3.9449462890625, -3.56005859375, -3.1751708984375, -2.790283203125, -2.4053955078125, -2.0205078125, -1.6356201171875, -1.250732421875, -0.8658447265625, -0.48095703125, -0.0960693359375, 0.288818359375, 0.6737060546875, 1.05859375, 1.4434814453125, 1.828369140625, 2.2132568359375, 2.59814453125, 2.9830322265625, 3.367919921875, 3.7528076171875, 4.1376953125, 4.5225830078125, 4.907470703125, 5.2923583984375, 5.67724609375, 6.0621337890625, 6.447021484375, 6.8319091796875, 7.216796875, 7.6016845703125, 7.986572265625, 8.3714599609375, 8.75634765625, 9.1412353515625, 9.526123046875, 9.9110107421875, 10.2958984375, 10.6807861328125, 11.065673828125, 11.4505615234375, 11.83544921875, 12.2203369140625, 12.605224609375, 12.9901123046875, 13.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 15.0, 11.0, 20.0, 25.0, 20.0, 30.0, 38.0, 52.0, 51.0, 50.0, 81.0, 125.0, 1528.0, 422.0, 92.0, 72.0, 48.0, 27.0, 38.0, 49.0, 26.0, 35.0, 31.0, 26.0, 17.0, 16.0, 13.0, 6.0, 9.0, 9.0, 7.0, 9.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.078125, -23.247314453125, -22.41650390625, -21.585693359375, -20.7548828125, -19.924072265625, -19.09326171875, -18.262451171875, -17.431640625, -16.600830078125, -15.77001953125, -14.939208984375, -14.1083984375, -13.277587890625, -12.44677734375, -11.615966796875, -10.78515625, -9.954345703125, -9.12353515625, -8.292724609375, -7.4619140625, -6.631103515625, -5.80029296875, -4.969482421875, -4.138671875, -3.307861328125, -2.47705078125, -1.646240234375, -0.8154296875, 0.015380859375, 0.84619140625, 1.677001953125, 2.5078125, 3.338623046875, 4.16943359375, 5.000244140625, 5.8310546875, 6.661865234375, 7.49267578125, 8.323486328125, 9.154296875, 9.985107421875, 10.81591796875, 11.646728515625, 12.4775390625, 13.308349609375, 14.13916015625, 14.969970703125, 15.80078125, 16.631591796875, 17.46240234375, 18.293212890625, 19.1240234375, 19.954833984375, 20.78564453125, 21.616455078125, 22.447265625, 23.278076171875, 24.10888671875, 24.939697265625, 25.7705078125, 26.601318359375, 27.43212890625, 28.262939453125, 29.09375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 9.0, 6.0, 10.0, 13.0, 18.0, 19.0, 33.0, 33.0, 48.0, 50.0, 73.0, 78.0, 132.0, 249.0, 467.0, 1950.0, 2665048.0, 474781.0, 1526.0, 434.0, 215.0, 131.0, 92.0, 64.0, 39.0, 30.0, 23.0, 26.0, 13.0, 18.0, 11.0, 9.0, 11.0, 9.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-86.0, -83.5390625, -81.078125, -78.6171875, -76.15625, -73.6953125, -71.234375, -68.7734375, -66.3125, -63.8515625, -61.390625, -58.9296875, -56.46875, -54.0078125, -51.546875, -49.0859375, -46.625, -44.1640625, -41.703125, -39.2421875, -36.78125, -34.3203125, -31.859375, -29.3984375, -26.9375, -24.4765625, -22.015625, -19.5546875, -17.09375, -14.6328125, -12.171875, -9.7109375, -7.25, -4.7890625, -2.328125, 0.1328125, 2.59375, 5.0546875, 7.515625, 9.9765625, 12.4375, 14.8984375, 17.359375, 19.8203125, 22.28125, 24.7421875, 27.203125, 29.6640625, 32.125, 34.5859375, 37.046875, 39.5078125, 41.96875, 44.4296875, 46.890625, 49.3515625, 51.8125, 54.2734375, 56.734375, 59.1953125, 61.65625, 64.1171875, 66.578125, 69.0390625, 71.5]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 72.0, 867.0, 77.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.89897155761719, -93.84879302978516, -87.79861450195312, -81.7484359741211, -75.69825744628906, -69.64807891845703, -63.597900390625, -57.54772186279297, -51.49754333496094, -45.447364807128906, -39.397186279296875, -33.347007751464844, -27.296829223632812, -21.24665069580078, -15.19647216796875, -9.146293640136719, -3.0961151123046875, 2.9540634155273438, 9.004241943359375, 15.054420471191406, 21.104598999023438, 27.15477752685547, 33.2049560546875, 39.25513458251953, 45.30531311035156, 51.355491638183594, 57.405670166015625, 63.455848693847656, 69.50602722167969, 75.55620574951172, 81.60638427734375, 87.65656280517578, 93.70675659179688, 99.7569351196289, 105.80711364746094, 111.85729217529297, 117.907470703125, 123.95764923095703, 130.00782775878906, 136.05801391601562, 142.10818481445312, 148.15835571289062, 154.2085418701172, 160.25872802734375, 166.30889892578125, 172.35906982421875, 178.4092559814453, 184.45944213867188, 190.50961303710938, 196.55978393554688, 202.60997009277344, 208.66015625, 214.7103271484375, 220.760498046875, 226.81068420410156, 232.86087036132812, 238.91104125976562, 244.96121215820312, 251.0113983154297, 257.06158447265625, 263.11175537109375, 269.16192626953125, 275.21209716796875, 281.2622985839844, 287.3124694824219]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 4.0, 3.0, 4.0, 8.0, 8.0, 7.0, 14.0, 9.0, 14.0, 19.0, 18.0, 14.0, 24.0, 24.0, 20.0, 31.0, 35.0, 33.0, 32.0, 42.0, 45.0, 45.0, 41.0, 48.0, 41.0, 37.0, 36.0, 34.0, 42.0, 31.0, 32.0, 33.0, 28.0, 21.0, 19.0, 17.0, 12.0, 11.0, 18.0, 13.0, 7.0, 3.0, 5.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.26817321777344, -67.18627166748047, -65.1043701171875, -63.022464752197266, -60.94055938720703, -58.85865783691406, -56.776756286621094, -54.69485092163086, -52.612945556640625, -50.531044006347656, -48.44913864135742, -46.36723709106445, -44.28533172607422, -42.20343017578125, -40.12152862548828, -38.03962326049805, -35.95772171020508, -33.87582015991211, -31.793914794921875, -29.712013244628906, -27.630107879638672, -25.548206329345703, -23.4663028717041, -21.3843994140625, -19.3024959564209, -17.220592498779297, -15.138689041137695, -13.05678653717041, -10.974883079528809, -8.892979621887207, -6.811077117919922, -4.72917366027832, -2.6472702026367188, -0.5653669834136963, 1.5165362358093262, 3.5984392166137695, 5.680342674255371, 7.762246131896973, 9.844148635864258, 11.92605209350586, 14.007955551147461, 16.089859008789062, 18.171762466430664, 20.253665924072266, 22.335567474365234, 24.41747283935547, 26.499374389648438, 28.58127784729004, 30.66318130493164, 32.74508285522461, 34.826988220214844, 36.90888977050781, 38.99079513549805, 41.072696685791016, 43.15460205078125, 45.23650360107422, 47.31840515136719, 49.400306701660156, 51.48221206665039, 53.56411361694336, 55.646018981933594, 57.72792053222656, 59.80982208251953, 61.891727447509766, 63.9736328125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 6.0, 6.0, 11.0, 13.0, 12.0, 12.0, 10.0, 20.0, 18.0, 23.0, 29.0, 28.0, 23.0, 26.0, 31.0, 43.0, 32.0, 32.0, 38.0, 38.0, 44.0, 43.0, 38.0, 34.0, 34.0, 37.0, 25.0, 29.0, 41.0, 34.0, 27.0, 23.0, 26.0, 19.0, 12.0, 11.0, 6.0, 15.0, 12.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.08984375, -5.8709716796875, -5.652099609375, -5.4332275390625, -5.21435546875, -4.9954833984375, -4.776611328125, -4.5577392578125, -4.3388671875, -4.1199951171875, -3.901123046875, -3.6822509765625, -3.46337890625, -3.2445068359375, -3.025634765625, -2.8067626953125, -2.587890625, -2.3690185546875, -2.150146484375, -1.9312744140625, -1.71240234375, -1.4935302734375, -1.274658203125, -1.0557861328125, -0.8369140625, -0.6180419921875, -0.399169921875, -0.1802978515625, 0.03857421875, 0.2574462890625, 0.476318359375, 0.6951904296875, 0.9140625, 1.1329345703125, 1.351806640625, 1.5706787109375, 1.78955078125, 2.0084228515625, 2.227294921875, 2.4461669921875, 2.6650390625, 2.8839111328125, 3.102783203125, 3.3216552734375, 3.54052734375, 3.7593994140625, 3.978271484375, 4.1971435546875, 4.416015625, 4.6348876953125, 4.853759765625, 5.0726318359375, 5.29150390625, 5.5103759765625, 5.729248046875, 5.9481201171875, 6.1669921875, 6.3858642578125, 6.604736328125, 6.8236083984375, 7.04248046875, 7.2613525390625, 7.480224609375, 7.6990966796875, 7.91796875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 8.0, 12.0, 7.0, 18.0, 15.0, 22.0, 22.0, 31.0, 54.0, 78.0, 104.0, 171.0, 263.0, 571.0, 1208.0, 2745.0, 7447.0, 24763.0, 105675.0, 484855.0, 1467828.0, 1458387.0, 499599.0, 103311.0, 24507.0, 7391.0, 2685.0, 1104.0, 601.0, 296.0, 157.0, 90.0, 66.0, 38.0, 25.0, 20.0, 26.0, 17.0, 12.0, 5.0, 5.0, 9.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.828125, -9.5111083984375, -9.194091796875, -8.8770751953125, -8.56005859375, -8.2430419921875, -7.926025390625, -7.6090087890625, -7.2919921875, -6.9749755859375, -6.657958984375, -6.3409423828125, -6.02392578125, -5.7069091796875, -5.389892578125, -5.0728759765625, -4.755859375, -4.4388427734375, -4.121826171875, -3.8048095703125, -3.48779296875, -3.1707763671875, -2.853759765625, -2.5367431640625, -2.2197265625, -1.9027099609375, -1.585693359375, -1.2686767578125, -0.95166015625, -0.6346435546875, -0.317626953125, -0.0006103515625, 0.31640625, 0.6334228515625, 0.950439453125, 1.2674560546875, 1.58447265625, 1.9014892578125, 2.218505859375, 2.5355224609375, 2.8525390625, 3.1695556640625, 3.486572265625, 3.8035888671875, 4.12060546875, 4.4376220703125, 4.754638671875, 5.0716552734375, 5.388671875, 5.7056884765625, 6.022705078125, 6.3397216796875, 6.65673828125, 6.9737548828125, 7.290771484375, 7.6077880859375, 7.9248046875, 8.2418212890625, 8.558837890625, 8.8758544921875, 9.19287109375, 9.5098876953125, 9.826904296875, 10.1439208984375, 10.4609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 13.0, 8.0, 20.0, 49.0, 60.0, 110.0, 166.0, 277.0, 422.0, 639.0, 727.0, 567.0, 375.0, 234.0, 154.0, 92.0, 57.0, 40.0, 26.0, 15.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.56494140625, -18.8486328125, -18.13232421875, -17.416015625, -16.69970703125, -15.9833984375, -15.26708984375, -14.55078125, -13.83447265625, -13.1181640625, -12.40185546875, -11.685546875, -10.96923828125, -10.2529296875, -9.53662109375, -8.8203125, -8.10400390625, -7.3876953125, -6.67138671875, -5.955078125, -5.23876953125, -4.5224609375, -3.80615234375, -3.08984375, -2.37353515625, -1.6572265625, -0.94091796875, -0.224609375, 0.49169921875, 1.2080078125, 1.92431640625, 2.640625, 3.35693359375, 4.0732421875, 4.78955078125, 5.505859375, 6.22216796875, 6.9384765625, 7.65478515625, 8.37109375, 9.08740234375, 9.8037109375, 10.52001953125, 11.236328125, 11.95263671875, 12.6689453125, 13.38525390625, 14.1015625, 14.81787109375, 15.5341796875, 16.25048828125, 16.966796875, 17.68310546875, 18.3994140625, 19.11572265625, 19.83203125, 20.54833984375, 21.2646484375, 21.98095703125, 22.697265625, 23.41357421875, 24.1298828125, 24.84619140625, 25.5625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 8.0, 23.0, 32.0, 44.0, 60.0, 107.0, 204.0, 275.0, 482.0, 988.0, 6675.0, 3760234.0, 420681.0, 2720.0, 769.0, 398.0, 231.0, 118.0, 94.0, 63.0, 22.0, 15.0, 11.0, 11.0, 10.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.3125, -84.8056640625, -82.298828125, -79.7919921875, -77.28515625, -74.7783203125, -72.271484375, -69.7646484375, -67.2578125, -64.7509765625, -62.244140625, -59.7373046875, -57.23046875, -54.7236328125, -52.216796875, -49.7099609375, -47.203125, -44.6962890625, -42.189453125, -39.6826171875, -37.17578125, -34.6689453125, -32.162109375, -29.6552734375, -27.1484375, -24.6416015625, -22.134765625, -19.6279296875, -17.12109375, -14.6142578125, -12.107421875, -9.6005859375, -7.09375, -4.5869140625, -2.080078125, 0.4267578125, 2.93359375, 5.4404296875, 7.947265625, 10.4541015625, 12.9609375, 15.4677734375, 17.974609375, 20.4814453125, 22.98828125, 25.4951171875, 28.001953125, 30.5087890625, 33.015625, 35.5224609375, 38.029296875, 40.5361328125, 43.04296875, 45.5498046875, 48.056640625, 50.5634765625, 53.0703125, 55.5771484375, 58.083984375, 60.5908203125, 63.09765625, 65.6044921875, 68.111328125, 70.6181640625, 73.125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 28.0, 86.0, 202.0, 256.0, 223.0, 133.0, 51.0, 21.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.90630340576172, -116.95026397705078, -112.99422454833984, -109.03819274902344, -105.0821533203125, -101.12611389160156, -97.17007446289062, -93.21403503417969, -89.25799560546875, -85.30195617675781, -81.34591674804688, -77.38987731933594, -73.43384552001953, -69.4778060913086, -65.52176666259766, -61.56572723388672, -57.60969543457031, -53.653656005859375, -49.6976203918457, -45.741580963134766, -41.785545349121094, -37.829505920410156, -33.87346649169922, -29.917428970336914, -25.96139144897461, -22.005353927612305, -18.04931640625, -14.093276977539062, -10.137239456176758, -6.181201934814453, -2.2251625061035156, 1.730875015258789, 5.6869049072265625, 9.642942428588867, 13.598980903625488, 17.55501937866211, 21.511056900024414, 25.46709442138672, 29.423133850097656, 33.379173278808594, 37.335208892822266, 41.2912483215332, 45.247283935546875, 49.20332336425781, 53.15936279296875, 57.11539840698242, 61.07143783569336, 65.02747344970703, 68.98351287841797, 72.9395523071289, 76.89559173583984, 80.85162353515625, 84.80766296386719, 88.76370239257812, 92.71974182128906, 96.67578125, 100.63182067871094, 104.58786010742188, 108.54389953613281, 112.49993896484375, 116.45597076416016, 120.4120101928711, 124.36804962158203, 128.32408142089844, 132.28012084960938]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 10.0, 9.0, 12.0, 7.0, 8.0, 13.0, 13.0, 15.0, 20.0, 32.0, 24.0, 27.0, 31.0, 41.0, 43.0, 38.0, 47.0, 48.0, 37.0, 30.0, 45.0, 42.0, 30.0, 51.0, 45.0, 27.0, 37.0, 31.0, 27.0, 32.0, 24.0, 13.0, 22.0, 17.0, 9.0, 11.0, 6.0, 7.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.512664794921875, -49.87195587158203, -48.23124694824219, -46.590538024902344, -44.9498291015625, -43.309120178222656, -41.66840744018555, -40.0276985168457, -38.38698959350586, -36.746280670166016, -35.10557174682617, -33.46486282348633, -31.82415199279785, -30.183443069458008, -28.54273223876953, -26.902023315429688, -25.261314392089844, -23.62060546875, -21.979896545410156, -20.33918571472168, -18.698476791381836, -17.057767868041992, -15.417057991027832, -13.776348114013672, -12.135639190673828, -10.494930267333984, -8.854220390319824, -7.213510990142822, -5.57280158996582, -3.9320926666259766, -2.2913827896118164, -0.6506729125976562, 0.9900360107421875, 2.6307454109191895, 4.271454811096191, 5.912164211273193, 7.552873611450195, 9.193582534790039, 10.8342924118042, 12.47500228881836, 14.115711212158203, 15.756420135498047, 17.39712905883789, 19.037839889526367, 20.67854881286621, 22.319257736206055, 23.95996856689453, 25.600677490234375, 27.24138641357422, 28.882095336914062, 30.522804260253906, 32.16351318359375, 33.804222106933594, 35.44493103027344, 37.08564376831055, 38.72635269165039, 40.367061614990234, 42.00777053833008, 43.64847946166992, 45.289188385009766, 46.929901123046875, 48.57061004638672, 50.21131896972656, 51.852027893066406, 53.49273681640625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 8.0, 6.0, 7.0, 10.0, 20.0, 20.0, 21.0, 17.0, 11.0, 23.0, 26.0, 27.0, 32.0, 35.0, 35.0, 32.0, 40.0, 46.0, 44.0, 39.0, 38.0, 32.0, 40.0, 38.0, 42.0, 36.0, 41.0, 28.0, 33.0, 18.0, 24.0, 19.0, 21.0, 19.0, 18.0, 4.0, 13.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.13671875, -5.90838623046875, -5.6800537109375, -5.45172119140625, -5.223388671875, -4.99505615234375, -4.7667236328125, -4.53839111328125, -4.31005859375, -4.08172607421875, -3.8533935546875, -3.62506103515625, -3.396728515625, -3.16839599609375, -2.9400634765625, -2.71173095703125, -2.4833984375, -2.25506591796875, -2.0267333984375, -1.79840087890625, -1.570068359375, -1.34173583984375, -1.1134033203125, -0.88507080078125, -0.65673828125, -0.42840576171875, -0.2000732421875, 0.02825927734375, 0.256591796875, 0.48492431640625, 0.7132568359375, 0.94158935546875, 1.169921875, 1.39825439453125, 1.6265869140625, 1.85491943359375, 2.083251953125, 2.31158447265625, 2.5399169921875, 2.76824951171875, 2.99658203125, 3.22491455078125, 3.4532470703125, 3.68157958984375, 3.909912109375, 4.13824462890625, 4.3665771484375, 4.59490966796875, 4.8232421875, 5.05157470703125, 5.2799072265625, 5.50823974609375, 5.736572265625, 5.96490478515625, 6.1932373046875, 6.42156982421875, 6.64990234375, 6.87823486328125, 7.1065673828125, 7.33489990234375, 7.563232421875, 7.79156494140625, 8.0198974609375, 8.24822998046875, 8.4765625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 11.0, 12.0, 15.0, 30.0, 34.0, 68.0, 101.0, 164.0, 303.0, 458.0, 760.0, 1201.0, 2011.0, 3222.0, 5332.0, 8691.0, 15138.0, 26001.0, 44037.0, 75998.0, 126663.0, 187142.0, 198706.0, 141934.0, 87046.0, 51098.0, 29505.0, 17165.0, 10238.0, 6089.0, 3595.0, 2211.0, 1358.0, 851.0, 508.0, 307.0, 210.0, 136.0, 76.0, 56.0, 25.0, 19.0, 19.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8720703125, -0.8472442626953125, -0.822418212890625, -0.7975921630859375, -0.77276611328125, -0.7479400634765625, -0.723114013671875, -0.6982879638671875, -0.6734619140625, -0.6486358642578125, -0.623809814453125, -0.5989837646484375, -0.57415771484375, -0.5493316650390625, -0.524505615234375, -0.4996795654296875, -0.474853515625, -0.4500274658203125, -0.425201416015625, -0.4003753662109375, -0.37554931640625, -0.3507232666015625, -0.325897216796875, -0.3010711669921875, -0.2762451171875, -0.2514190673828125, -0.226593017578125, -0.2017669677734375, -0.17694091796875, -0.1521148681640625, -0.127288818359375, -0.1024627685546875, -0.07763671875, -0.0528106689453125, -0.027984619140625, -0.0031585693359375, 0.02166748046875, 0.0464935302734375, 0.071319580078125, 0.0961456298828125, 0.1209716796875, 0.1457977294921875, 0.170623779296875, 0.1954498291015625, 0.22027587890625, 0.2451019287109375, 0.269927978515625, 0.2947540283203125, 0.319580078125, 0.3444061279296875, 0.369232177734375, 0.3940582275390625, 0.41888427734375, 0.4437103271484375, 0.468536376953125, 0.4933624267578125, 0.5181884765625, 0.5430145263671875, 0.567840576171875, 0.5926666259765625, 0.61749267578125, 0.6423187255859375, 0.667144775390625, 0.6919708251953125, 0.716796875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 7.0, 12.0, 13.0, 12.0, 10.0, 28.0, 19.0, 20.0, 31.0, 27.0, 27.0, 41.0, 44.0, 37.0, 35.0, 44.0, 44.0, 1073.0, 43.0, 57.0, 30.0, 30.0, 41.0, 43.0, 36.0, 28.0, 25.0, 30.0, 22.0, 15.0, 19.0, 14.0, 7.0, 15.0, 4.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.953125, -4.79949951171875, -4.6458740234375, -4.49224853515625, -4.338623046875, -4.18499755859375, -4.0313720703125, -3.87774658203125, -3.72412109375, -3.57049560546875, -3.4168701171875, -3.26324462890625, -3.109619140625, -2.95599365234375, -2.8023681640625, -2.64874267578125, -2.4951171875, -2.34149169921875, -2.1878662109375, -2.03424072265625, -1.880615234375, -1.72698974609375, -1.5733642578125, -1.41973876953125, -1.26611328125, -1.11248779296875, -0.9588623046875, -0.80523681640625, -0.651611328125, -0.49798583984375, -0.3443603515625, -0.19073486328125, -0.037109375, 0.11651611328125, 0.2701416015625, 0.42376708984375, 0.577392578125, 0.73101806640625, 0.8846435546875, 1.03826904296875, 1.19189453125, 1.34552001953125, 1.4991455078125, 1.65277099609375, 1.806396484375, 1.96002197265625, 2.1136474609375, 2.26727294921875, 2.4208984375, 2.57452392578125, 2.7281494140625, 2.88177490234375, 3.035400390625, 3.18902587890625, 3.3426513671875, 3.49627685546875, 3.64990234375, 3.80352783203125, 3.9571533203125, 4.11077880859375, 4.264404296875, 4.41802978515625, 4.5716552734375, 4.72528076171875, 4.87890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 8.0, 9.0, 9.0, 28.0, 39.0, 41.0, 64.0, 78.0, 125.0, 164.0, 246.0, 342.0, 482.0, 774.0, 1040.0, 1595.0, 2359.0, 3485.0, 5163.0, 7956.0, 12193.0, 18527.0, 28450.0, 43003.0, 64104.0, 91842.0, 120987.0, 1153575.0, 173834.0, 113341.0, 83088.0, 57584.0, 38967.0, 25373.0, 16413.0, 10727.0, 6952.0, 4547.0, 3037.0, 2082.0, 1438.0, 949.0, 659.0, 475.0, 326.0, 178.0, 152.0, 113.0, 70.0, 53.0, 26.0, 25.0, 18.0, 15.0, 6.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.505859375, -0.4904632568359375, -0.475067138671875, -0.4596710205078125, -0.44427490234375, -0.4288787841796875, -0.413482666015625, -0.3980865478515625, -0.3826904296875, -0.3672943115234375, -0.351898193359375, -0.3365020751953125, -0.32110595703125, -0.3057098388671875, -0.290313720703125, -0.2749176025390625, -0.259521484375, -0.2441253662109375, -0.228729248046875, -0.2133331298828125, -0.19793701171875, -0.1825408935546875, -0.167144775390625, -0.1517486572265625, -0.1363525390625, -0.1209564208984375, -0.105560302734375, -0.0901641845703125, -0.07476806640625, -0.0593719482421875, -0.043975830078125, -0.0285797119140625, -0.01318359375, 0.0022125244140625, 0.017608642578125, 0.0330047607421875, 0.04840087890625, 0.0637969970703125, 0.079193115234375, 0.0945892333984375, 0.1099853515625, 0.1253814697265625, 0.140777587890625, 0.1561737060546875, 0.17156982421875, 0.1869659423828125, 0.202362060546875, 0.2177581787109375, 0.233154296875, 0.2485504150390625, 0.263946533203125, 0.2793426513671875, 0.29473876953125, 0.3101348876953125, 0.325531005859375, 0.3409271240234375, 0.3563232421875, 0.3717193603515625, 0.387115478515625, 0.4025115966796875, 0.41790771484375, 0.4333038330078125, 0.448699951171875, 0.4640960693359375, 0.4794921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 8.0, 5.0, 5.0, 8.0, 10.0, 20.0, 21.0, 21.0, 23.0, 18.0, 36.0, 34.0, 51.0, 51.0, 39.0, 53.0, 64.0, 54.0, 67.0, 50.0, 46.0, 43.0, 46.0, 27.0, 35.0, 25.0, 18.0, 15.0, 19.0, 12.0, 12.0, 9.0, 9.0, 9.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00539398193359375, -0.005188345909118652, -0.004982709884643555, -0.004777073860168457, -0.004571437835693359, -0.004365801811218262, -0.004160165786743164, -0.003954529762268066, -0.0037488937377929688, -0.003543257713317871, -0.0033376216888427734, -0.0031319856643676758, -0.002926349639892578, -0.0027207136154174805, -0.002515077590942383, -0.002309441566467285, -0.0021038055419921875, -0.0018981695175170898, -0.0016925334930419922, -0.0014868974685668945, -0.0012812614440917969, -0.0010756254196166992, -0.0008699893951416016, -0.0006643533706665039, -0.00045871734619140625, -0.0002530813217163086, -4.744529724121094e-05, 0.00015819072723388672, 0.0003638267517089844, 0.000569462776184082, 0.0007750988006591797, 0.0009807348251342773, 0.001186370849609375, 0.0013920068740844727, 0.0015976428985595703, 0.001803278923034668, 0.0020089149475097656, 0.0022145509719848633, 0.002420186996459961, 0.0026258230209350586, 0.0028314590454101562, 0.003037095069885254, 0.0032427310943603516, 0.0034483671188354492, 0.003654003143310547, 0.0038596391677856445, 0.004065275192260742, 0.00427091121673584, 0.0044765472412109375, 0.004682183265686035, 0.004887819290161133, 0.0050934553146362305, 0.005299091339111328, 0.005504727363586426, 0.0057103633880615234, 0.005915999412536621, 0.006121635437011719, 0.006327271461486816, 0.006532907485961914, 0.006738543510437012, 0.006944179534912109, 0.007149815559387207, 0.007355451583862305, 0.007561087608337402, 0.0077667236328125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 15.0, 12.0, 7.0, 17.0, 19.0, 18.0, 29.0, 25.0, 32.0, 46.0, 62.0, 62.0, 125.0, 141.0, 286.0, 533.0, 2994.0, 1032376.0, 10098.0, 670.0, 303.0, 191.0, 98.0, 78.0, 60.0, 47.0, 38.0, 41.0, 21.0, 25.0, 17.0, 12.0, 5.0, 5.0, 5.0, 8.0, 13.0, 1.0, 2.0, 6.0, 1.0, 0.0, 2.0], "bins": [-0.1728515625, -0.16837406158447266, -0.1638965606689453, -0.15941905975341797, -0.15494155883789062, -0.15046405792236328, -0.14598655700683594, -0.1415090560913086, -0.13703155517578125, -0.1325540542602539, -0.12807655334472656, -0.12359905242919922, -0.11912155151367188, -0.11464405059814453, -0.11016654968261719, -0.10568904876708984, -0.1012115478515625, -0.09673404693603516, -0.09225654602050781, -0.08777904510498047, -0.08330154418945312, -0.07882404327392578, -0.07434654235839844, -0.0698690414428711, -0.06539154052734375, -0.060914039611816406, -0.05643653869628906, -0.05195903778076172, -0.047481536865234375, -0.04300403594970703, -0.03852653503417969, -0.034049034118652344, -0.029571533203125, -0.025094032287597656, -0.020616531372070312, -0.01613903045654297, -0.011661529541015625, -0.007184028625488281, -0.0027065277099609375, 0.0017709732055664062, 0.00624847412109375, 0.010725975036621094, 0.015203475952148438, 0.01968097686767578, 0.024158477783203125, 0.02863597869873047, 0.03311347961425781, 0.037590980529785156, 0.0420684814453125, 0.046545982360839844, 0.05102348327636719, 0.05550098419189453, 0.059978485107421875, 0.06445598602294922, 0.06893348693847656, 0.0734109878540039, 0.07788848876953125, 0.0823659896850586, 0.08684349060058594, 0.09132099151611328, 0.09579849243164062, 0.10027599334716797, 0.10475349426269531, 0.10923099517822266, 0.11370849609375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 774.0, 236.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008752589114010334, -0.0069612362422049046, -0.005169883370399475, -0.003378530964255333, -0.0015871780924499035, 0.00020417477935552597, 0.001995527185499668, 0.003786880522966385, 0.005578232929110527, 0.0073695858009159565, 0.009160938672721386, 0.010952291078865528, 0.012743644416332245, 0.014534996822476387, 0.01632634922862053, 0.01811770349740982, 0.019909054040908813, 0.021700406447052956, 0.023491758853197098, 0.02528311312198639, 0.02707446552813053, 0.028865817934274673, 0.030657170340418816, 0.03244852274656296, 0.03423987701535225, 0.03603123128414154, 0.03782258182764053, 0.039613936096429825, 0.04140528663992882, 0.04319664090871811, 0.0449879914522171, 0.04677934572100639, 0.048570696264505386, 0.05036205053329468, 0.05215340107679367, 0.05394475534558296, 0.055736105889081955, 0.057527460157871246, 0.05931881070137024, 0.06111016497015953, 0.06290151923894882, 0.06469286978244781, 0.0664842277765274, 0.0682755783200264, 0.07006692886352539, 0.07185828685760498, 0.07364963740110397, 0.07544098794460297, 0.07723233848810196, 0.07902368903160095, 0.08081504702568054, 0.08260639756917953, 0.08439774811267853, 0.08618910610675812, 0.08798045665025711, 0.0897718071937561, 0.0915631651878357, 0.09335451573133469, 0.09514587372541428, 0.09693722426891327, 0.09872857481241226, 0.10051992535591125, 0.10231128334999084, 0.10410263389348984, 0.10589398443698883]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 10.0, 17.0, 25.0, 27.0, 51.0, 34.0, 58.0, 45.0, 51.0, 51.0, 73.0, 52.0, 63.0, 53.0, 52.0, 47.0, 51.0, 41.0, 34.0, 31.0, 29.0, 23.0, 22.0, 10.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00812751054763794, -0.007922119460999966, -0.007716728374361992, -0.007511337287724018, -0.007305946201086044, -0.0071005551144480705, -0.006895164027810097, -0.006689772941172123, -0.006484381854534149, -0.006278990767896175, -0.006073599681258202, -0.005868208594620228, -0.005662817507982254, -0.00545742642134428, -0.0052520353347063065, -0.005046644248068333, -0.004841253161430359, -0.004635862074792385, -0.004430470988154411, -0.0042250799015164375, -0.004019688814878464, -0.00381429772824049, -0.003608906641602516, -0.0034035155549645424, -0.0031981244683265686, -0.002992733381688595, -0.002787342295050621, -0.0025819512084126472, -0.0023765601217746735, -0.0021711690351366997, -0.001965777948498726, -0.001760386861860752, -0.0015549957752227783, -0.0013496046885848045, -0.0011442136019468307, -0.000938822515308857, -0.0007334314286708832, -0.0005280403420329094, -0.0003226492553949356, -0.00011725816875696182, 8.813291788101196e-05, 0.00029352400451898575, 0.0004989150911569595, 0.0007043061777949333, 0.0009096972644329071, 0.0011150883510708809, 0.0013204794377088547, 0.0015258705243468285, 0.0017312616109848022, 0.001936652697622776, 0.00214204378426075, 0.0023474348708987236, 0.0025528259575366974, 0.002758217044174671, 0.002963608130812645, 0.0031689992174506187, 0.0033743903040885925, 0.0035797813907265663, 0.00378517247736454, 0.003990563564002514, 0.004195954650640488, 0.0044013457372784615, 0.004606736823916435, 0.004812127910554409, 0.005017518997192383]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 8.0, 6.0, 7.0, 10.0, 20.0, 20.0, 21.0, 17.0, 11.0, 23.0, 26.0, 27.0, 32.0, 35.0, 35.0, 32.0, 40.0, 46.0, 44.0, 39.0, 38.0, 32.0, 40.0, 38.0, 42.0, 37.0, 40.0, 28.0, 33.0, 18.0, 24.0, 19.0, 21.0, 19.0, 18.0, 4.0, 13.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.13671875, -5.90838623046875, -5.6800537109375, -5.45172119140625, -5.223388671875, -4.99505615234375, -4.7667236328125, -4.53839111328125, -4.31005859375, -4.08172607421875, -3.8533935546875, -3.62506103515625, -3.396728515625, -3.16839599609375, -2.9400634765625, -2.71173095703125, -2.4833984375, -2.25506591796875, -2.0267333984375, -1.79840087890625, -1.570068359375, -1.34173583984375, -1.1134033203125, -0.88507080078125, -0.65673828125, -0.42840576171875, -0.2000732421875, 0.02825927734375, 0.256591796875, 0.48492431640625, 0.7132568359375, 0.94158935546875, 1.169921875, 1.39825439453125, 1.6265869140625, 1.85491943359375, 2.083251953125, 2.31158447265625, 2.5399169921875, 2.76824951171875, 2.99658203125, 3.22491455078125, 3.4532470703125, 3.68157958984375, 3.909912109375, 4.13824462890625, 4.3665771484375, 4.59490966796875, 4.8232421875, 5.05157470703125, 5.2799072265625, 5.50823974609375, 5.736572265625, 5.96490478515625, 6.1932373046875, 6.42156982421875, 6.64990234375, 6.87823486328125, 7.1065673828125, 7.33489990234375, 7.563232421875, 7.79156494140625, 8.0198974609375, 8.24822998046875, 8.4765625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 8.0, 1.0, 5.0, 4.0, 5.0, 9.0, 15.0, 19.0, 29.0, 24.0, 46.0, 49.0, 109.0, 153.0, 275.0, 465.0, 842.0, 1673.0, 2965.0, 6042.0, 11762.0, 24548.0, 54106.0, 141089.0, 377181.0, 262815.0, 90002.0, 38020.0, 17879.0, 8728.0, 4595.0, 2345.0, 1160.0, 673.0, 346.0, 187.0, 123.0, 82.0, 43.0, 43.0, 32.0, 21.0, 9.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.046875, -5.8292236328125, -5.611572265625, -5.3939208984375, -5.17626953125, -4.9586181640625, -4.740966796875, -4.5233154296875, -4.3056640625, -4.0880126953125, -3.870361328125, -3.6527099609375, -3.43505859375, -3.2174072265625, -2.999755859375, -2.7821044921875, -2.564453125, -2.3468017578125, -2.129150390625, -1.9114990234375, -1.69384765625, -1.4761962890625, -1.258544921875, -1.0408935546875, -0.8232421875, -0.6055908203125, -0.387939453125, -0.1702880859375, 0.04736328125, 0.2650146484375, 0.482666015625, 0.7003173828125, 0.91796875, 1.1356201171875, 1.353271484375, 1.5709228515625, 1.78857421875, 2.0062255859375, 2.223876953125, 2.4415283203125, 2.6591796875, 2.8768310546875, 3.094482421875, 3.3121337890625, 3.52978515625, 3.7474365234375, 3.965087890625, 4.1827392578125, 4.400390625, 4.6180419921875, 4.835693359375, 5.0533447265625, 5.27099609375, 5.4886474609375, 5.706298828125, 5.9239501953125, 6.1416015625, 6.3592529296875, 6.576904296875, 6.7945556640625, 7.01220703125, 7.2298583984375, 7.447509765625, 7.6651611328125, 7.8828125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 10.0, 7.0, 7.0, 12.0, 11.0, 8.0, 23.0, 24.0, 19.0, 30.0, 18.0, 33.0, 34.0, 38.0, 49.0, 52.0, 72.0, 149.0, 403.0, 1424.0, 141.0, 76.0, 51.0, 42.0, 42.0, 41.0, 33.0, 20.0, 27.0, 23.0, 18.0, 13.0, 15.0, 9.0, 14.0, 8.0, 9.0, 3.0, 11.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.984375, -26.21484375, -25.4453125, -24.67578125, -23.90625, -23.13671875, -22.3671875, -21.59765625, -20.828125, -20.05859375, -19.2890625, -18.51953125, -17.75, -16.98046875, -16.2109375, -15.44140625, -14.671875, -13.90234375, -13.1328125, -12.36328125, -11.59375, -10.82421875, -10.0546875, -9.28515625, -8.515625, -7.74609375, -6.9765625, -6.20703125, -5.4375, -4.66796875, -3.8984375, -3.12890625, -2.359375, -1.58984375, -0.8203125, -0.05078125, 0.71875, 1.48828125, 2.2578125, 3.02734375, 3.796875, 4.56640625, 5.3359375, 6.10546875, 6.875, 7.64453125, 8.4140625, 9.18359375, 9.953125, 10.72265625, 11.4921875, 12.26171875, 13.03125, 13.80078125, 14.5703125, 15.33984375, 16.109375, 16.87890625, 17.6484375, 18.41796875, 19.1875, 19.95703125, 20.7265625, 21.49609375, 22.265625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 7.0, 11.0, 8.0, 11.0, 11.0, 27.0, 28.0, 38.0, 63.0, 70.0, 90.0, 120.0, 191.0, 298.0, 512.0, 1921.0, 47753.0, 3039474.0, 51449.0, 2078.0, 547.0, 294.0, 163.0, 132.0, 91.0, 80.0, 55.0, 41.0, 32.0, 17.0, 17.0, 16.0, 16.0, 12.0, 14.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.80712890625, -42.2705078125, -40.73388671875, -39.197265625, -37.66064453125, -36.1240234375, -34.58740234375, -33.05078125, -31.51416015625, -29.9775390625, -28.44091796875, -26.904296875, -25.36767578125, -23.8310546875, -22.29443359375, -20.7578125, -19.22119140625, -17.6845703125, -16.14794921875, -14.611328125, -13.07470703125, -11.5380859375, -10.00146484375, -8.46484375, -6.92822265625, -5.3916015625, -3.85498046875, -2.318359375, -0.78173828125, 0.7548828125, 2.29150390625, 3.828125, 5.36474609375, 6.9013671875, 8.43798828125, 9.974609375, 11.51123046875, 13.0478515625, 14.58447265625, 16.12109375, 17.65771484375, 19.1943359375, 20.73095703125, 22.267578125, 23.80419921875, 25.3408203125, 26.87744140625, 28.4140625, 29.95068359375, 31.4873046875, 33.02392578125, 34.560546875, 36.09716796875, 37.6337890625, 39.17041015625, 40.70703125, 42.24365234375, 43.7802734375, 45.31689453125, 46.853515625, 48.39013671875, 49.9267578125, 51.46337890625, 53.0]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 162.0, 632.0, 208.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.86866760253906, -232.40467834472656, -226.94068908691406, -221.47669982910156, -216.01271057128906, -210.54872131347656, -205.08474731445312, -199.62075805664062, -194.15676879882812, -188.69277954101562, -183.22879028320312, -177.76480102539062, -172.30081176757812, -166.83682250976562, -161.37283325195312, -155.90884399414062, -150.44485473632812, -144.98086547851562, -139.51687622070312, -134.05288696289062, -128.58889770507812, -123.12490844726562, -117.66092681884766, -112.19693756103516, -106.73294830322266, -101.26895904541016, -95.80496978759766, -90.34098815917969, -84.87699890136719, -79.41300964355469, -73.94902038574219, -68.48503112792969, -63.021034240722656, -57.557044982910156, -52.093055725097656, -46.62907028198242, -41.16508102416992, -35.70109176635742, -30.237106323242188, -24.773117065429688, -19.309127807617188, -13.845139503479004, -8.38115119934082, -2.917163848876953, 2.546825408935547, 8.010814666748047, 13.474800109863281, 18.93878936767578, 24.40277862548828, 29.86676788330078, 35.33075714111328, 40.794742584228516, 46.258731842041016, 51.722721099853516, 57.18670654296875, 62.65069580078125, 68.11468505859375, 73.57867431640625, 79.04266357421875, 84.50665283203125, 89.97064208984375, 95.43463134765625, 100.89861297607422, 106.36260223388672, 111.82659149169922]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 11.0, 15.0, 22.0, 17.0, 17.0, 29.0, 22.0, 32.0, 27.0, 29.0, 33.0, 41.0, 41.0, 56.0, 39.0, 39.0, 56.0, 50.0, 49.0, 41.0, 35.0, 40.0, 32.0, 40.0, 26.0, 19.0, 16.0, 22.0, 14.0, 10.0, 17.0, 16.0, 7.0, 9.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-76.28996276855469, -74.11717987060547, -71.94440460205078, -69.77162170410156, -67.59883880615234, -65.42605590820312, -63.25328063964844, -61.08049774169922, -58.907718658447266, -56.73493957519531, -54.562156677246094, -52.38937759399414, -50.21659851074219, -48.04381561279297, -45.871036529541016, -43.69825744628906, -41.525474548339844, -39.35269546508789, -37.17991256713867, -35.00713348388672, -32.8343505859375, -30.661571502685547, -28.488792419433594, -26.316011428833008, -24.143230438232422, -21.970449447631836, -19.79766845703125, -17.624889373779297, -15.452108383178711, -13.279327392578125, -11.106547355651855, -8.933767318725586, -6.760993957519531, -4.5882134437561035, -2.415432929992676, -0.24265241622924805, 1.9301280975341797, 4.102909088134766, 6.275689125061035, 8.448469161987305, 10.62125015258789, 12.794031143188477, 14.966811180114746, 17.139591217041016, 19.3123722076416, 21.485153198242188, 23.65793228149414, 25.830713272094727, 28.003494262695312, 30.1762752532959, 32.349056243896484, 34.52183532714844, 36.694618225097656, 38.86739730834961, 41.04017639160156, 43.21295928955078, 45.385738372802734, 47.55851745605469, 49.731300354003906, 51.90407943725586, 54.07685852050781, 56.24964141845703, 58.422420501708984, 60.59519958496094, 62.767982482910156]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 11.0, 16.0, 17.0, 14.0, 18.0, 23.0, 24.0, 19.0, 31.0, 26.0, 35.0, 38.0, 44.0, 44.0, 38.0, 53.0, 33.0, 37.0, 41.0, 41.0, 44.0, 45.0, 45.0, 40.0, 29.0, 18.0, 21.0, 23.0, 17.0, 14.0, 18.0, 14.0, 8.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -6.97979736328125, -6.7291259765625, -6.47845458984375, -6.227783203125, -5.97711181640625, -5.7264404296875, -5.47576904296875, -5.22509765625, -4.97442626953125, -4.7237548828125, -4.47308349609375, -4.222412109375, -3.97174072265625, -3.7210693359375, -3.47039794921875, -3.2197265625, -2.96905517578125, -2.7183837890625, -2.46771240234375, -2.217041015625, -1.96636962890625, -1.7156982421875, -1.46502685546875, -1.21435546875, -0.96368408203125, -0.7130126953125, -0.46234130859375, -0.211669921875, 0.03900146484375, 0.2896728515625, 0.54034423828125, 0.791015625, 1.04168701171875, 1.2923583984375, 1.54302978515625, 1.793701171875, 2.04437255859375, 2.2950439453125, 2.54571533203125, 2.79638671875, 3.04705810546875, 3.2977294921875, 3.54840087890625, 3.799072265625, 4.04974365234375, 4.3004150390625, 4.55108642578125, 4.8017578125, 5.05242919921875, 5.3031005859375, 5.55377197265625, 5.804443359375, 6.05511474609375, 6.3057861328125, 6.55645751953125, 6.80712890625, 7.05780029296875, 7.3084716796875, 7.55914306640625, 7.809814453125, 8.06048583984375, 8.3111572265625, 8.56182861328125, 8.8125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 12.0, 5.0, 7.0, 11.0, 18.0, 18.0, 26.0, 38.0, 34.0, 53.0, 70.0, 80.0, 118.0, 187.0, 690.0, 4473.0, 68207.0, 2397156.0, 1676961.0, 41505.0, 3398.0, 573.0, 196.0, 113.0, 63.0, 52.0, 49.0, 31.0, 33.0, 25.0, 17.0, 13.0, 17.0, 12.0, 10.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.266845703125, -21.43994140625, -20.613037109375, -19.7861328125, -18.959228515625, -18.13232421875, -17.305419921875, -16.478515625, -15.651611328125, -14.82470703125, -13.997802734375, -13.1708984375, -12.343994140625, -11.51708984375, -10.690185546875, -9.86328125, -9.036376953125, -8.20947265625, -7.382568359375, -6.5556640625, -5.728759765625, -4.90185546875, -4.074951171875, -3.248046875, -2.421142578125, -1.59423828125, -0.767333984375, 0.0595703125, 0.886474609375, 1.71337890625, 2.540283203125, 3.3671875, 4.194091796875, 5.02099609375, 5.847900390625, 6.6748046875, 7.501708984375, 8.32861328125, 9.155517578125, 9.982421875, 10.809326171875, 11.63623046875, 12.463134765625, 13.2900390625, 14.116943359375, 14.94384765625, 15.770751953125, 16.59765625, 17.424560546875, 18.25146484375, 19.078369140625, 19.9052734375, 20.732177734375, 21.55908203125, 22.385986328125, 23.212890625, 24.039794921875, 24.86669921875, 25.693603515625, 26.5205078125, 27.347412109375, 28.17431640625, 29.001220703125, 29.828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 12.0, 13.0, 17.0, 33.0, 40.0, 45.0, 53.0, 96.0, 104.0, 163.0, 240.0, 332.0, 449.0, 542.0, 433.0, 439.0, 298.0, 198.0, 161.0, 120.0, 75.0, 67.0, 36.0, 27.0, 21.0, 16.0, 8.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.609375, -17.1566162109375, -16.703857421875, -16.2510986328125, -15.79833984375, -15.3455810546875, -14.892822265625, -14.4400634765625, -13.9873046875, -13.5345458984375, -13.081787109375, -12.6290283203125, -12.17626953125, -11.7235107421875, -11.270751953125, -10.8179931640625, -10.365234375, -9.9124755859375, -9.459716796875, -9.0069580078125, -8.55419921875, -8.1014404296875, -7.648681640625, -7.1959228515625, -6.7431640625, -6.2904052734375, -5.837646484375, -5.3848876953125, -4.93212890625, -4.4793701171875, -4.026611328125, -3.5738525390625, -3.12109375, -2.6683349609375, -2.215576171875, -1.7628173828125, -1.31005859375, -0.8572998046875, -0.404541015625, 0.0482177734375, 0.5009765625, 0.9537353515625, 1.406494140625, 1.8592529296875, 2.31201171875, 2.7647705078125, 3.217529296875, 3.6702880859375, 4.123046875, 4.5758056640625, 5.028564453125, 5.4813232421875, 5.93408203125, 6.3868408203125, 6.839599609375, 7.2923583984375, 7.7451171875, 8.1978759765625, 8.650634765625, 9.1033935546875, 9.55615234375, 10.0089111328125, 10.461669921875, 10.9144287109375, 11.3671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 10.0, 12.0, 17.0, 27.0, 34.0, 54.0, 75.0, 101.0, 118.0, 161.0, 223.0, 329.0, 603.0, 2391.0, 52060.0, 3744109.0, 384818.0, 6715.0, 947.0, 428.0, 243.0, 192.0, 121.0, 119.0, 92.0, 67.0, 45.0, 43.0, 26.0, 25.0, 16.0, 11.0, 8.0, 13.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.4375, -41.8115234375, -40.185546875, -38.5595703125, -36.93359375, -35.3076171875, -33.681640625, -32.0556640625, -30.4296875, -28.8037109375, -27.177734375, -25.5517578125, -23.92578125, -22.2998046875, -20.673828125, -19.0478515625, -17.421875, -15.7958984375, -14.169921875, -12.5439453125, -10.91796875, -9.2919921875, -7.666015625, -6.0400390625, -4.4140625, -2.7880859375, -1.162109375, 0.4638671875, 2.08984375, 3.7158203125, 5.341796875, 6.9677734375, 8.59375, 10.2197265625, 11.845703125, 13.4716796875, 15.09765625, 16.7236328125, 18.349609375, 19.9755859375, 21.6015625, 23.2275390625, 24.853515625, 26.4794921875, 28.10546875, 29.7314453125, 31.357421875, 32.9833984375, 34.609375, 36.2353515625, 37.861328125, 39.4873046875, 41.11328125, 42.7392578125, 44.365234375, 45.9912109375, 47.6171875, 49.2431640625, 50.869140625, 52.4951171875, 54.12109375, 55.7470703125, 57.373046875, 58.9990234375, 60.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 13.0, 63.0, 220.0, 365.0, 252.0, 82.0, 12.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.92921447753906, -117.7292251586914, -112.52922821044922, -107.32923889160156, -102.12924194335938, -96.92925262451172, -91.72926330566406, -86.52926635742188, -81.32927703857422, -76.12928771972656, -70.92929077148438, -65.72930145263672, -60.5293083190918, -55.329315185546875, -50.12932586669922, -44.9293327331543, -39.729339599609375, -34.52934646606445, -29.329355239868164, -24.129364013671875, -18.929370880126953, -13.729377746582031, -8.529386520385742, -3.329395294189453, 1.8705978393554688, 7.070590019226074, 12.27058219909668, 17.47057342529297, 22.67056655883789, 27.870559692382812, 33.07054901123047, 38.27054214477539, 43.47052001953125, 48.67051315307617, 53.870506286621094, 59.07049560546875, 64.27049255371094, 69.4704818725586, 74.67047119140625, 79.87046813964844, 85.0704574584961, 90.27044677734375, 95.47044372558594, 100.6704330444336, 105.87042236328125, 111.07041931152344, 116.2704086303711, 121.47039794921875, 126.67039489746094, 131.87039184570312, 137.07037353515625, 142.27037048339844, 147.47036743164062, 152.67034912109375, 157.87034606933594, 163.07034301757812, 168.27032470703125, 173.47032165527344, 178.67030334472656, 183.87030029296875, 189.07029724121094, 194.27029418945312, 199.47027587890625, 204.67027282714844, 209.87026977539062]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 14.0, 13.0, 18.0, 15.0, 25.0, 17.0, 20.0, 29.0, 27.0, 39.0, 42.0, 35.0, 48.0, 31.0, 37.0, 48.0, 40.0, 46.0, 38.0, 42.0, 32.0, 58.0, 47.0, 23.0, 22.0, 17.0, 27.0, 17.0, 13.0, 20.0, 14.0, 14.0, 10.0, 5.0, 9.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.7757568359375, -39.295555114746094, -37.81535720825195, -36.33515930175781, -34.854957580566406, -33.374755859375, -31.89455795288086, -30.414358139038086, -28.934158325195312, -27.45395851135254, -25.973758697509766, -24.493558883666992, -23.01335906982422, -21.533159255981445, -20.052959442138672, -18.5727596282959, -17.092559814453125, -15.612360000610352, -14.132160186767578, -12.651960372924805, -11.171760559082031, -9.691560745239258, -8.211360931396484, -6.731161117553711, -5.2509613037109375, -3.770761489868164, -2.2905616760253906, -0.8103618621826172, 0.6698379516601562, 2.1500377655029297, 3.630237579345703, 5.110437393188477, 6.59063720703125, 8.070837020874023, 9.551036834716797, 11.03123664855957, 12.511436462402344, 13.991636276245117, 15.47183609008789, 16.952035903930664, 18.432235717773438, 19.91243553161621, 21.392635345458984, 22.872835159301758, 24.35303497314453, 25.833234786987305, 27.313434600830078, 28.79363441467285, 30.273834228515625, 31.7540340423584, 33.23423385620117, 34.71443176269531, 36.19463348388672, 37.674835205078125, 39.155033111572266, 40.635231018066406, 42.11543273925781, 43.59563446044922, 45.07583236694336, 46.5560302734375, 48.036231994628906, 49.51643371582031, 50.99663162231445, 52.476829528808594, 53.95703125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 13.0, 5.0, 9.0, 11.0, 9.0, 22.0, 18.0, 22.0, 23.0, 16.0, 28.0, 28.0, 26.0, 43.0, 36.0, 43.0, 31.0, 50.0, 50.0, 28.0, 44.0, 41.0, 32.0, 43.0, 28.0, 34.0, 34.0, 35.0, 18.0, 23.0, 10.0, 20.0, 19.0, 14.0, 19.0, 14.0, 10.0, 9.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.80859375, -6.57501220703125, -6.3414306640625, -6.10784912109375, -5.874267578125, -5.64068603515625, -5.4071044921875, -5.17352294921875, -4.93994140625, -4.70635986328125, -4.4727783203125, -4.23919677734375, -4.005615234375, -3.77203369140625, -3.5384521484375, -3.30487060546875, -3.0712890625, -2.83770751953125, -2.6041259765625, -2.37054443359375, -2.136962890625, -1.90338134765625, -1.6697998046875, -1.43621826171875, -1.20263671875, -0.96905517578125, -0.7354736328125, -0.50189208984375, -0.268310546875, -0.03472900390625, 0.1988525390625, 0.43243408203125, 0.666015625, 0.89959716796875, 1.1331787109375, 1.36676025390625, 1.600341796875, 1.83392333984375, 2.0675048828125, 2.30108642578125, 2.53466796875, 2.76824951171875, 3.0018310546875, 3.23541259765625, 3.468994140625, 3.70257568359375, 3.9361572265625, 4.16973876953125, 4.4033203125, 4.63690185546875, 4.8704833984375, 5.10406494140625, 5.337646484375, 5.57122802734375, 5.8048095703125, 6.03839111328125, 6.27197265625, 6.50555419921875, 6.7391357421875, 6.97271728515625, 7.206298828125, 7.43988037109375, 7.6734619140625, 7.90704345703125, 8.140625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 8.0, 12.0, 12.0, 26.0, 39.0, 66.0, 100.0, 164.0, 249.0, 382.0, 653.0, 1056.0, 1743.0, 2771.0, 4541.0, 7720.0, 12701.0, 21628.0, 36990.0, 63727.0, 107749.0, 165975.0, 202122.0, 162701.0, 105024.0, 62100.0, 35954.0, 21063.0, 12231.0, 7507.0, 4371.0, 2726.0, 1697.0, 1021.0, 683.0, 372.0, 275.0, 139.0, 95.0, 48.0, 40.0, 20.0, 20.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77734375, -0.7509689331054688, -0.7245941162109375, -0.6982192993164062, -0.671844482421875, -0.6454696655273438, -0.6190948486328125, -0.5927200317382812, -0.56634521484375, -0.5399703979492188, -0.5135955810546875, -0.48722076416015625, -0.460845947265625, -0.43447113037109375, -0.4080963134765625, -0.38172149658203125, -0.3553466796875, -0.32897186279296875, -0.3025970458984375, -0.27622222900390625, -0.249847412109375, -0.22347259521484375, -0.1970977783203125, -0.17072296142578125, -0.14434814453125, -0.11797332763671875, -0.0915985107421875, -0.06522369384765625, -0.038848876953125, -0.01247406005859375, 0.0139007568359375, 0.04027557373046875, 0.066650390625, 0.09302520751953125, 0.1194000244140625, 0.14577484130859375, 0.172149658203125, 0.19852447509765625, 0.2248992919921875, 0.25127410888671875, 0.27764892578125, 0.30402374267578125, 0.3303985595703125, 0.35677337646484375, 0.383148193359375, 0.40952301025390625, 0.4358978271484375, 0.46227264404296875, 0.4886474609375, 0.5150222778320312, 0.5413970947265625, 0.5677719116210938, 0.594146728515625, 0.6205215454101562, 0.6468963623046875, 0.6732711791992188, 0.69964599609375, 0.7260208129882812, 0.7523956298828125, 0.7787704467773438, 0.805145263671875, 0.8315200805664062, 0.8578948974609375, 0.8842697143554688, 0.91064453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 9.0, 11.0, 9.0, 17.0, 11.0, 15.0, 22.0, 20.0, 20.0, 25.0, 29.0, 31.0, 43.0, 36.0, 49.0, 41.0, 42.0, 33.0, 1063.0, 43.0, 34.0, 43.0, 47.0, 37.0, 36.0, 26.0, 34.0, 30.0, 19.0, 24.0, 15.0, 20.0, 12.0, 12.0, 9.0, 12.0, 9.0, 5.0, 10.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.640625, -4.48431396484375, -4.3280029296875, -4.17169189453125, -4.015380859375, -3.85906982421875, -3.7027587890625, -3.54644775390625, -3.39013671875, -3.23382568359375, -3.0775146484375, -2.92120361328125, -2.764892578125, -2.60858154296875, -2.4522705078125, -2.29595947265625, -2.1396484375, -1.98333740234375, -1.8270263671875, -1.67071533203125, -1.514404296875, -1.35809326171875, -1.2017822265625, -1.04547119140625, -0.88916015625, -0.73284912109375, -0.5765380859375, -0.42022705078125, -0.263916015625, -0.10760498046875, 0.0487060546875, 0.20501708984375, 0.361328125, 0.51763916015625, 0.6739501953125, 0.83026123046875, 0.986572265625, 1.14288330078125, 1.2991943359375, 1.45550537109375, 1.61181640625, 1.76812744140625, 1.9244384765625, 2.08074951171875, 2.237060546875, 2.39337158203125, 2.5496826171875, 2.70599365234375, 2.8623046875, 3.01861572265625, 3.1749267578125, 3.33123779296875, 3.487548828125, 3.64385986328125, 3.8001708984375, 3.95648193359375, 4.11279296875, 4.26910400390625, 4.4254150390625, 4.58172607421875, 4.738037109375, 4.89434814453125, 5.0506591796875, 5.20697021484375, 5.36328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 2.0, 4.0, 10.0, 17.0, 27.0, 31.0, 45.0, 71.0, 125.0, 183.0, 265.0, 350.0, 480.0, 752.0, 960.0, 1426.0, 1966.0, 2837.0, 3908.0, 5702.0, 8166.0, 11884.0, 17260.0, 25089.0, 36122.0, 50868.0, 70080.0, 93805.0, 116084.0, 1174150.0, 120827.0, 98075.0, 74792.0, 54020.0, 38652.0, 27285.0, 18483.0, 12721.0, 9052.0, 6269.0, 4177.0, 3008.0, 2084.0, 1463.0, 1097.0, 736.0, 524.0, 408.0, 263.0, 176.0, 131.0, 76.0, 50.0, 33.0, 27.0, 14.0, 12.0, 12.0, 3.0, 2.0, 2.0], "bins": [-0.471435546875, -0.45697021484375, -0.4425048828125, -0.42803955078125, -0.41357421875, -0.39910888671875, -0.3846435546875, -0.37017822265625, -0.355712890625, -0.34124755859375, -0.3267822265625, -0.31231689453125, -0.2978515625, -0.28338623046875, -0.2689208984375, -0.25445556640625, -0.239990234375, -0.22552490234375, -0.2110595703125, -0.19659423828125, -0.18212890625, -0.16766357421875, -0.1531982421875, -0.13873291015625, -0.124267578125, -0.10980224609375, -0.0953369140625, -0.08087158203125, -0.06640625, -0.05194091796875, -0.0374755859375, -0.02301025390625, -0.008544921875, 0.00592041015625, 0.0203857421875, 0.03485107421875, 0.04931640625, 0.06378173828125, 0.0782470703125, 0.09271240234375, 0.107177734375, 0.12164306640625, 0.1361083984375, 0.15057373046875, 0.1650390625, 0.17950439453125, 0.1939697265625, 0.20843505859375, 0.222900390625, 0.23736572265625, 0.2518310546875, 0.26629638671875, 0.28076171875, 0.29522705078125, 0.3096923828125, 0.32415771484375, 0.338623046875, 0.35308837890625, 0.3675537109375, 0.38201904296875, 0.396484375, 0.41094970703125, 0.4254150390625, 0.43988037109375, 0.454345703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 8.0, 10.0, 5.0, 8.0, 13.0, 12.0, 10.0, 17.0, 25.0, 13.0, 22.0, 24.0, 23.0, 37.0, 42.0, 63.0, 66.0, 77.0, 72.0, 67.0, 57.0, 55.0, 47.0, 33.0, 29.0, 24.0, 31.0, 16.0, 14.0, 13.0, 13.0, 6.0, 5.0, 7.0, 8.0, 5.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.006500244140625, -0.006311535835266113, -0.0061228275299072266, -0.00593411922454834, -0.005745410919189453, -0.005556702613830566, -0.00536799430847168, -0.005179286003112793, -0.004990577697753906, -0.0048018693923950195, -0.004613161087036133, -0.004424452781677246, -0.004235744476318359, -0.004047036170959473, -0.003858327865600586, -0.0036696195602416992, -0.0034809112548828125, -0.0032922029495239258, -0.003103494644165039, -0.0029147863388061523, -0.0027260780334472656, -0.002537369728088379, -0.002348661422729492, -0.0021599531173706055, -0.0019712448120117188, -0.001782536506652832, -0.0015938282012939453, -0.0014051198959350586, -0.0012164115905761719, -0.0010277032852172852, -0.0008389949798583984, -0.0006502866744995117, -0.000461578369140625, -0.0002728700637817383, -8.416175842285156e-05, 0.00010454654693603516, 0.0002932548522949219, 0.0004819631576538086, 0.0006706714630126953, 0.000859379768371582, 0.0010480880737304688, 0.0012367963790893555, 0.0014255046844482422, 0.001614212989807129, 0.0018029212951660156, 0.0019916296005249023, 0.002180337905883789, 0.0023690462112426758, 0.0025577545166015625, 0.0027464628219604492, 0.002935171127319336, 0.0031238794326782227, 0.0033125877380371094, 0.003501296043395996, 0.003690004348754883, 0.0038787126541137695, 0.004067420959472656, 0.004256129264831543, 0.00444483757019043, 0.004633545875549316, 0.004822254180908203, 0.00501096248626709, 0.0051996707916259766, 0.005388379096984863, 0.00557708740234375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 0.0, 3.0, 8.0, 9.0, 1.0, 11.0, 8.0, 9.0, 13.0, 22.0, 14.0, 17.0, 25.0, 38.0, 46.0, 59.0, 112.0, 141.0, 222.0, 454.0, 2040.0, 1023789.0, 19853.0, 725.0, 298.0, 182.0, 100.0, 75.0, 46.0, 36.0, 32.0, 34.0, 20.0, 24.0, 18.0, 13.0, 15.0, 10.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12158203125, -0.11734771728515625, -0.1131134033203125, -0.10887908935546875, -0.104644775390625, -0.10041046142578125, -0.0961761474609375, -0.09194183349609375, -0.08770751953125, -0.08347320556640625, -0.0792388916015625, -0.07500457763671875, -0.070770263671875, -0.06653594970703125, -0.0623016357421875, -0.05806732177734375, -0.0538330078125, -0.04959869384765625, -0.0453643798828125, -0.04113006591796875, -0.036895751953125, -0.03266143798828125, -0.0284271240234375, -0.02419281005859375, -0.01995849609375, -0.01572418212890625, -0.0114898681640625, -0.00725555419921875, -0.003021240234375, 0.00121307373046875, 0.0054473876953125, 0.00968170166015625, 0.013916015625, 0.01815032958984375, 0.0223846435546875, 0.02661895751953125, 0.030853271484375, 0.03508758544921875, 0.0393218994140625, 0.04355621337890625, 0.04779052734375, 0.05202484130859375, 0.0562591552734375, 0.06049346923828125, 0.064727783203125, 0.06896209716796875, 0.0731964111328125, 0.07743072509765625, 0.0816650390625, 0.08589935302734375, 0.0901336669921875, 0.09436798095703125, 0.098602294921875, 0.10283660888671875, 0.1070709228515625, 0.11130523681640625, 0.11553955078125, 0.11977386474609375, 0.1240081787109375, 0.12824249267578125, 0.132476806640625, 0.13671112060546875, 0.1409454345703125, 0.14517974853515625, 0.1494140625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 22.0, 376.0, 571.0, 39.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016687728464603424, -0.016023458912968636, -0.015359189361333847, -0.014694919809699059, -0.01403065025806427, -0.013366380706429482, -0.012702110223472118, -0.01203784067183733, -0.011373571120202541, -0.010709301568567753, -0.010045032016932964, -0.009380761533975601, -0.008716491982340813, -0.008052222430706024, -0.007387952879071236, -0.006723683327436447, -0.006059413775801659, -0.00539514422416687, -0.004730874672532082, -0.004066604655236006, -0.0034023351036012173, -0.0027380655519664288, -0.002073795534670353, -0.0014095259830355644, -0.0007452564314007759, -8.098676335066557e-05, 0.0005832829046994448, 0.001247552689164877, 0.0019118222407996655, 0.002576091792434454, 0.00324036180973053, 0.0039046313613653183, 0.004568900913000107, 0.005233170464634895, 0.005897440016269684, 0.00656171003356576, 0.007225979585200548, 0.00789024867117405, 0.008554519154131413, 0.009218788705766201, 0.00988305825740099, 0.010547327809035778, 0.011211597360670567, 0.01187586784362793, 0.012540137395262718, 0.013204406946897507, 0.013868676498532295, 0.014532946050167084, 0.015197215601801872, 0.01586148515343666, 0.01652575470507145, 0.017190024256706238, 0.017854293808341026, 0.018518563359975815, 0.019182834774255753, 0.019847102463245392, 0.02051137387752533, 0.021175643429160118, 0.021839912980794907, 0.022504182532429695, 0.023168452084064484, 0.023832721635699272, 0.02449699118733406, 0.025161262601614, 0.025825530290603638]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 8.0, 3.0, 6.0, 10.0, 12.0, 12.0, 10.0, 24.0, 17.0, 35.0, 18.0, 35.0, 33.0, 29.0, 32.0, 43.0, 51.0, 43.0, 43.0, 42.0, 40.0, 48.0, 50.0, 40.0, 45.0, 21.0, 37.0, 35.0, 29.0, 29.0, 19.0, 24.0, 13.0, 10.0, 16.0, 5.0, 7.0, 8.0, 10.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.004335641860961914, -0.004209012724459171, -0.0040823835879564285, -0.003955754451453686, -0.003829125314950943, -0.0037024961784482002, -0.0035758670419454575, -0.0034492379054427147, -0.003322608768939972, -0.003195979632437229, -0.0030693504959344864, -0.0029427213594317436, -0.002816092222929001, -0.002689463086426258, -0.0025628339499235153, -0.0024362048134207726, -0.00230957567691803, -0.002182946540415287, -0.0020563174039125443, -0.0019296882674098015, -0.0018030591309070587, -0.001676429994404316, -0.0015498008579015732, -0.0014231717213988304, -0.0012965425848960876, -0.0011699134483933449, -0.0010432843118906021, -0.0009166551753878593, -0.0007900260388851166, -0.0006633969023823738, -0.000536767765879631, -0.0004101386293768883, -0.0002835094928741455, -0.00015688035637140274, -3.0251219868659973e-05, 9.63779166340828e-05, 0.00022300705313682556, 0.00034963618963956833, 0.0004762653261423111, 0.0006028944626450539, 0.0007295235991477966, 0.0008561527356505394, 0.0009827818721532822, 0.001109411008656025, 0.0012360401451587677, 0.0013626692816615105, 0.0014892984181642532, 0.001615927554666996, 0.0017425566911697388, 0.0018691858276724815, 0.0019958149641752243, 0.002122444100677967, 0.00224907323718071, 0.0023757023736834526, 0.0025023315101861954, 0.002628960646688938, 0.002755589783191681, 0.0028822189196944237, 0.0030088480561971664, 0.003135477192699909, 0.003262106329202652, 0.0033887354657053947, 0.0035153646022081375, 0.0036419937387108803, 0.003768622875213623]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 13.0, 5.0, 9.0, 11.0, 9.0, 22.0, 18.0, 22.0, 24.0, 15.0, 28.0, 28.0, 26.0, 43.0, 36.0, 43.0, 31.0, 50.0, 50.0, 28.0, 44.0, 41.0, 32.0, 43.0, 28.0, 34.0, 34.0, 35.0, 18.0, 23.0, 10.0, 20.0, 19.0, 14.0, 19.0, 14.0, 10.0, 9.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.80859375, -6.57501220703125, -6.3414306640625, -6.10784912109375, -5.874267578125, -5.64068603515625, -5.4071044921875, -5.17352294921875, -4.93994140625, -4.70635986328125, -4.4727783203125, -4.23919677734375, -4.005615234375, -3.77203369140625, -3.5384521484375, -3.30487060546875, -3.0712890625, -2.83770751953125, -2.6041259765625, -2.37054443359375, -2.136962890625, -1.90338134765625, -1.6697998046875, -1.43621826171875, -1.20263671875, -0.96905517578125, -0.7354736328125, -0.50189208984375, -0.268310546875, -0.03472900390625, 0.1988525390625, 0.43243408203125, 0.666015625, 0.89959716796875, 1.1331787109375, 1.36676025390625, 1.600341796875, 1.83392333984375, 2.0675048828125, 2.30108642578125, 2.53466796875, 2.76824951171875, 3.0018310546875, 3.23541259765625, 3.468994140625, 3.70257568359375, 3.9361572265625, 4.16973876953125, 4.4033203125, 4.63690185546875, 4.8704833984375, 5.10406494140625, 5.337646484375, 5.57122802734375, 5.8048095703125, 6.03839111328125, 6.27197265625, 6.50555419921875, 6.7391357421875, 6.97271728515625, 7.206298828125, 7.43988037109375, 7.6734619140625, 7.90704345703125, 8.140625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 10.0, 13.0, 7.0, 13.0, 15.0, 18.0, 31.0, 40.0, 46.0, 69.0, 76.0, 117.0, 129.0, 216.0, 324.0, 602.0, 1903.0, 7765.0, 43275.0, 339219.0, 571974.0, 66852.0, 11277.0, 2527.0, 764.0, 363.0, 234.0, 173.0, 119.0, 76.0, 64.0, 34.0, 46.0, 38.0, 18.0, 29.0, 16.0, 14.0, 11.0, 10.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4453125, -12.9835205078125, -12.521728515625, -12.0599365234375, -11.59814453125, -11.1363525390625, -10.674560546875, -10.2127685546875, -9.7509765625, -9.2891845703125, -8.827392578125, -8.3656005859375, -7.90380859375, -7.4420166015625, -6.980224609375, -6.5184326171875, -6.056640625, -5.5948486328125, -5.133056640625, -4.6712646484375, -4.20947265625, -3.7476806640625, -3.285888671875, -2.8240966796875, -2.3623046875, -1.9005126953125, -1.438720703125, -0.9769287109375, -0.51513671875, -0.0533447265625, 0.408447265625, 0.8702392578125, 1.33203125, 1.7938232421875, 2.255615234375, 2.7174072265625, 3.17919921875, 3.6409912109375, 4.102783203125, 4.5645751953125, 5.0263671875, 5.4881591796875, 5.949951171875, 6.4117431640625, 6.87353515625, 7.3353271484375, 7.797119140625, 8.2589111328125, 8.720703125, 9.1824951171875, 9.644287109375, 10.1060791015625, 10.56787109375, 11.0296630859375, 11.491455078125, 11.9532470703125, 12.4150390625, 12.8768310546875, 13.338623046875, 13.8004150390625, 14.26220703125, 14.7239990234375, 15.185791015625, 15.6475830078125, 16.109375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 7.0, 6.0, 17.0, 5.0, 11.0, 9.0, 11.0, 16.0, 14.0, 20.0, 27.0, 26.0, 35.0, 39.0, 42.0, 52.0, 63.0, 104.0, 380.0, 1568.0, 142.0, 66.0, 61.0, 41.0, 37.0, 40.0, 23.0, 38.0, 25.0, 20.0, 17.0, 10.0, 13.0, 18.0, 13.0, 5.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-31.609375, -30.758056640625, -29.90673828125, -29.055419921875, -28.2041015625, -27.352783203125, -26.50146484375, -25.650146484375, -24.798828125, -23.947509765625, -23.09619140625, -22.244873046875, -21.3935546875, -20.542236328125, -19.69091796875, -18.839599609375, -17.98828125, -17.136962890625, -16.28564453125, -15.434326171875, -14.5830078125, -13.731689453125, -12.88037109375, -12.029052734375, -11.177734375, -10.326416015625, -9.47509765625, -8.623779296875, -7.7724609375, -6.921142578125, -6.06982421875, -5.218505859375, -4.3671875, -3.515869140625, -2.66455078125, -1.813232421875, -0.9619140625, -0.110595703125, 0.74072265625, 1.592041015625, 2.443359375, 3.294677734375, 4.14599609375, 4.997314453125, 5.8486328125, 6.699951171875, 7.55126953125, 8.402587890625, 9.25390625, 10.105224609375, 10.95654296875, 11.807861328125, 12.6591796875, 13.510498046875, 14.36181640625, 15.213134765625, 16.064453125, 16.915771484375, 17.76708984375, 18.618408203125, 19.4697265625, 20.321044921875, 21.17236328125, 22.023681640625, 22.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 3.0, 15.0, 17.0, 14.0, 17.0, 18.0, 24.0, 35.0, 41.0, 57.0, 83.0, 121.0, 168.0, 313.0, 689.0, 5600.0, 3004248.0, 131291.0, 1694.0, 472.0, 240.0, 121.0, 103.0, 75.0, 43.0, 43.0, 29.0, 18.0, 19.0, 7.0, 13.0, 13.0, 6.0, 13.0, 8.0, 6.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.125, -50.1787109375, -48.232421875, -46.2861328125, -44.33984375, -42.3935546875, -40.447265625, -38.5009765625, -36.5546875, -34.6083984375, -32.662109375, -30.7158203125, -28.76953125, -26.8232421875, -24.876953125, -22.9306640625, -20.984375, -19.0380859375, -17.091796875, -15.1455078125, -13.19921875, -11.2529296875, -9.306640625, -7.3603515625, -5.4140625, -3.4677734375, -1.521484375, 0.4248046875, 2.37109375, 4.3173828125, 6.263671875, 8.2099609375, 10.15625, 12.1025390625, 14.048828125, 15.9951171875, 17.94140625, 19.8876953125, 21.833984375, 23.7802734375, 25.7265625, 27.6728515625, 29.619140625, 31.5654296875, 33.51171875, 35.4580078125, 37.404296875, 39.3505859375, 41.296875, 43.2431640625, 45.189453125, 47.1357421875, 49.08203125, 51.0283203125, 52.974609375, 54.9208984375, 56.8671875, 58.8134765625, 60.759765625, 62.7060546875, 64.65234375, 66.5986328125, 68.544921875, 70.4912109375, 72.4375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 10.0, 62.0, 175.0, 317.0, 274.0, 129.0, 39.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.91346740722656, -95.90614318847656, -93.89881896972656, -91.8915023803711, -89.8841781616211, -87.8768539428711, -85.8695297241211, -83.8622055053711, -81.85488891601562, -79.84756469726562, -77.84024047851562, -75.83292388916016, -73.82559967041016, -71.81827545166016, -69.81095123291016, -67.80362701416016, -65.79630279541016, -63.788978576660156, -61.78165817260742, -59.77433395385742, -57.76701354980469, -55.75968933105469, -53.75236511230469, -51.74504089355469, -49.73772048950195, -47.73039627075195, -45.72307586669922, -43.71575164794922, -41.70842742919922, -39.701107025146484, -37.693782806396484, -35.68646240234375, -33.67913818359375, -31.671815872192383, -29.664493560791016, -27.657169342041016, -25.64984703063965, -23.64252471923828, -21.63520050048828, -19.627878189086914, -17.620555877685547, -15.61323356628418, -13.605910301208496, -11.598587036132812, -9.591264724731445, -7.583942413330078, -5.5766191482543945, -3.569295883178711, -1.5619735717773438, 0.44534921646118164, 2.452672004699707, 4.459994792938232, 6.467317581176758, 8.474639892578125, 10.481963157653809, 12.489286422729492, 14.49660873413086, 16.503931045532227, 18.511253356933594, 20.518577575683594, 22.52589988708496, 24.533222198486328, 26.540546417236328, 28.547868728637695, 30.555191040039062]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 11.0, 9.0, 21.0, 18.0, 16.0, 13.0, 22.0, 24.0, 27.0, 40.0, 42.0, 44.0, 50.0, 48.0, 58.0, 38.0, 47.0, 43.0, 46.0, 58.0, 38.0, 31.0, 29.0, 37.0, 22.0, 27.0, 26.0, 30.0, 11.0, 22.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.64433288574219, -74.42533111572266, -72.20632934570312, -69.98733520507812, -67.7683334350586, -65.54933166503906, -63.33032989501953, -61.111328125, -58.892330169677734, -56.6733283996582, -54.45433044433594, -52.235328674316406, -50.016326904296875, -47.79732894897461, -45.57832717895508, -43.35932922363281, -41.14032745361328, -38.92132568359375, -36.702327728271484, -34.48332595825195, -32.26432800292969, -30.045326232910156, -27.826324462890625, -25.607324600219727, -23.388324737548828, -21.16932487487793, -18.95032501220703, -16.7313232421875, -14.512323379516602, -12.293323516845703, -10.074322700500488, -7.855321884155273, -5.636322021484375, -3.4173216819763184, -1.1983213424682617, 1.020678997039795, 3.2396793365478516, 5.45867919921875, 7.677680015563965, 9.89668083190918, 12.115680694580078, 14.334680557250977, 16.553680419921875, 18.772682189941406, 20.991682052612305, 23.210681915283203, 25.429683685302734, 27.648683547973633, 29.86768341064453, 32.08668518066406, 34.30568313598633, 36.52468490600586, 38.743682861328125, 40.962684631347656, 43.18168640136719, 45.40068817138672, 47.619686126708984, 49.838687896728516, 52.05768585205078, 54.27668762207031, 56.495689392089844, 58.71468734741211, 60.93368911743164, 63.152687072753906, 65.37168884277344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 9.0, 12.0, 10.0, 8.0, 10.0, 12.0, 13.0, 12.0, 20.0, 25.0, 26.0, 23.0, 43.0, 25.0, 29.0, 20.0, 41.0, 35.0, 38.0, 35.0, 39.0, 31.0, 38.0, 48.0, 36.0, 34.0, 27.0, 42.0, 32.0, 28.0, 32.0, 25.0, 15.0, 15.0, 13.0, 16.0, 12.0, 17.0, 11.0, 10.0, 7.0, 7.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.49774169921875, -6.2650146484375, -6.03228759765625, -5.799560546875, -5.56683349609375, -5.3341064453125, -5.10137939453125, -4.86865234375, -4.63592529296875, -4.4031982421875, -4.17047119140625, -3.937744140625, -3.70501708984375, -3.4722900390625, -3.23956298828125, -3.0068359375, -2.77410888671875, -2.5413818359375, -2.30865478515625, -2.075927734375, -1.84320068359375, -1.6104736328125, -1.37774658203125, -1.14501953125, -0.91229248046875, -0.6795654296875, -0.44683837890625, -0.214111328125, 0.01861572265625, 0.2513427734375, 0.48406982421875, 0.716796875, 0.94952392578125, 1.1822509765625, 1.41497802734375, 1.647705078125, 1.88043212890625, 2.1131591796875, 2.34588623046875, 2.57861328125, 2.81134033203125, 3.0440673828125, 3.27679443359375, 3.509521484375, 3.74224853515625, 3.9749755859375, 4.20770263671875, 4.4404296875, 4.67315673828125, 4.9058837890625, 5.13861083984375, 5.371337890625, 5.60406494140625, 5.8367919921875, 6.06951904296875, 6.30224609375, 6.53497314453125, 6.7677001953125, 7.00042724609375, 7.233154296875, 7.46588134765625, 7.6986083984375, 7.93133544921875, 8.1640625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 7.0, 7.0, 13.0, 13.0, 13.0, 22.0, 12.0, 18.0, 30.0, 34.0, 40.0, 39.0, 61.0, 91.0, 151.0, 319.0, 727.0, 2099.0, 9446.0, 65711.0, 874990.0, 2698306.0, 492841.0, 40021.0, 6327.0, 1640.0, 524.0, 239.0, 148.0, 86.0, 52.0, 39.0, 31.0, 38.0, 21.0, 18.0, 16.0, 13.0, 11.0, 13.0, 11.0, 6.0, 5.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-18.375, -17.8076171875, -17.240234375, -16.6728515625, -16.10546875, -15.5380859375, -14.970703125, -14.4033203125, -13.8359375, -13.2685546875, -12.701171875, -12.1337890625, -11.56640625, -10.9990234375, -10.431640625, -9.8642578125, -9.296875, -8.7294921875, -8.162109375, -7.5947265625, -7.02734375, -6.4599609375, -5.892578125, -5.3251953125, -4.7578125, -4.1904296875, -3.623046875, -3.0556640625, -2.48828125, -1.9208984375, -1.353515625, -0.7861328125, -0.21875, 0.3486328125, 0.916015625, 1.4833984375, 2.05078125, 2.6181640625, 3.185546875, 3.7529296875, 4.3203125, 4.8876953125, 5.455078125, 6.0224609375, 6.58984375, 7.1572265625, 7.724609375, 8.2919921875, 8.859375, 9.4267578125, 9.994140625, 10.5615234375, 11.12890625, 11.6962890625, 12.263671875, 12.8310546875, 13.3984375, 13.9658203125, 14.533203125, 15.1005859375, 15.66796875, 16.2353515625, 16.802734375, 17.3701171875, 17.9375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 9.0, 12.0, 18.0, 20.0, 37.0, 47.0, 38.0, 79.0, 94.0, 130.0, 175.0, 237.0, 359.0, 413.0, 468.0, 480.0, 418.0, 275.0, 225.0, 157.0, 116.0, 54.0, 55.0, 39.0, 22.0, 21.0, 16.0, 13.0, 10.0, 10.0, 1.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7005615234375, -10.268310546875, -9.8360595703125, -9.40380859375, -8.9715576171875, -8.539306640625, -8.1070556640625, -7.6748046875, -7.2425537109375, -6.810302734375, -6.3780517578125, -5.94580078125, -5.5135498046875, -5.081298828125, -4.6490478515625, -4.216796875, -3.7845458984375, -3.352294921875, -2.9200439453125, -2.48779296875, -2.0555419921875, -1.623291015625, -1.1910400390625, -0.7587890625, -0.3265380859375, 0.105712890625, 0.5379638671875, 0.97021484375, 1.4024658203125, 1.834716796875, 2.2669677734375, 2.69921875, 3.1314697265625, 3.563720703125, 3.9959716796875, 4.42822265625, 4.8604736328125, 5.292724609375, 5.7249755859375, 6.1572265625, 6.5894775390625, 7.021728515625, 7.4539794921875, 7.88623046875, 8.3184814453125, 8.750732421875, 9.1829833984375, 9.615234375, 10.0474853515625, 10.479736328125, 10.9119873046875, 11.34423828125, 11.7764892578125, 12.208740234375, 12.6409912109375, 13.0732421875, 13.5054931640625, 13.937744140625, 14.3699951171875, 14.80224609375, 15.2344970703125, 15.666748046875, 16.0989990234375, 16.53125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 18.0, 29.0, 19.0, 27.0, 48.0, 69.0, 78.0, 91.0, 137.0, 215.0, 341.0, 677.0, 1923.0, 18995.0, 913111.0, 3200212.0, 52500.0, 3623.0, 868.0, 410.0, 243.0, 170.0, 133.0, 80.0, 68.0, 52.0, 35.0, 28.0, 14.0, 16.0, 11.0, 12.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -36.13818359375, -34.8076171875, -33.47705078125, -32.146484375, -30.81591796875, -29.4853515625, -28.15478515625, -26.82421875, -25.49365234375, -24.1630859375, -22.83251953125, -21.501953125, -20.17138671875, -18.8408203125, -17.51025390625, -16.1796875, -14.84912109375, -13.5185546875, -12.18798828125, -10.857421875, -9.52685546875, -8.1962890625, -6.86572265625, -5.53515625, -4.20458984375, -2.8740234375, -1.54345703125, -0.212890625, 1.11767578125, 2.4482421875, 3.77880859375, 5.109375, 6.43994140625, 7.7705078125, 9.10107421875, 10.431640625, 11.76220703125, 13.0927734375, 14.42333984375, 15.75390625, 17.08447265625, 18.4150390625, 19.74560546875, 21.076171875, 22.40673828125, 23.7373046875, 25.06787109375, 26.3984375, 27.72900390625, 29.0595703125, 30.39013671875, 31.720703125, 33.05126953125, 34.3818359375, 35.71240234375, 37.04296875, 38.37353515625, 39.7041015625, 41.03466796875, 42.365234375, 43.69580078125, 45.0263671875, 46.35693359375, 47.6875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 35.0, 97.0, 237.0, 310.0, 222.0, 82.0, 20.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.12657165527344, -185.76608276367188, -181.40557861328125, -177.0450897216797, -172.68460083007812, -168.32411193847656, -163.963623046875, -159.60311889648438, -155.2426300048828, -150.88214111328125, -146.52163696289062, -142.16114807128906, -137.8006591796875, -133.44017028808594, -129.07968139648438, -124.71917724609375, -120.35868835449219, -115.99819946289062, -111.63770294189453, -107.27720642089844, -102.91671752929688, -98.55622863769531, -94.19573211669922, -89.83523559570312, -85.47474670410156, -81.1142578125, -76.7537612915039, -72.39326477050781, -68.03277587890625, -63.67228317260742, -59.311790466308594, -54.951297760009766, -50.590797424316406, -46.23030471801758, -41.86981201171875, -37.50931930541992, -33.148826599121094, -28.788333892822266, -24.427841186523438, -20.06734848022461, -15.706855773925781, -11.346363067626953, -6.985870361328125, -2.625377655029297, 1.7351150512695312, 6.095607757568359, 10.456100463867188, 14.816593170166016, 19.177085876464844, 23.537578582763672, 27.8980712890625, 32.25856399536133, 36.619056701660156, 40.979549407958984, 45.34004211425781, 49.70053482055664, 54.06102752685547, 58.4215202331543, 62.782012939453125, 67.14250183105469, 71.50299835205078, 75.86349487304688, 80.22398376464844, 84.58447265625, 88.9449691772461]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 3.0, 8.0, 10.0, 12.0, 14.0, 13.0, 15.0, 31.0, 21.0, 30.0, 19.0, 36.0, 27.0, 49.0, 36.0, 46.0, 34.0, 31.0, 44.0, 45.0, 30.0, 47.0, 36.0, 44.0, 33.0, 40.0, 35.0, 31.0, 24.0, 24.0, 20.0, 15.0, 15.0, 17.0, 10.0, 11.0, 6.0, 6.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.854400634765625, -41.38603973388672, -39.91767883300781, -38.449317932128906, -36.98095703125, -35.51259231567383, -34.04423141479492, -32.575870513916016, -31.10750961303711, -29.639148712158203, -28.170787811279297, -26.702425003051758, -25.23406410217285, -23.765703201293945, -22.297340393066406, -20.8289794921875, -19.360618591308594, -17.892257690429688, -16.42389678955078, -14.955533981323242, -13.487173080444336, -12.01881217956543, -10.550450325012207, -9.082088470458984, -7.613727569580078, -6.145366191864014, -4.677004814147949, -3.2086434364318848, -1.7402820587158203, -0.27192068099975586, 1.1964406967163086, 2.6648025512695312, 4.1331634521484375, 5.601524829864502, 7.069886207580566, 8.538248062133789, 10.006608963012695, 11.474969863891602, 12.943331718444824, 14.411693572998047, 15.880054473876953, 17.34841537475586, 18.816776275634766, 20.285139083862305, 21.75349998474121, 23.221860885620117, 24.690223693847656, 26.158584594726562, 27.62694549560547, 29.095306396484375, 30.56366729736328, 32.03202819824219, 33.500389099121094, 34.968753814697266, 36.43711471557617, 37.90547561645508, 39.373836517333984, 40.84219741821289, 42.3105583190918, 43.7789192199707, 45.247283935546875, 46.71564483642578, 48.18400573730469, 49.652366638183594, 51.1207275390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 3.0, 8.0, 8.0, 11.0, 13.0, 18.0, 12.0, 11.0, 10.0, 20.0, 20.0, 22.0, 22.0, 23.0, 30.0, 27.0, 17.0, 24.0, 37.0, 33.0, 36.0, 30.0, 41.0, 40.0, 40.0, 30.0, 34.0, 37.0, 25.0, 35.0, 27.0, 28.0, 19.0, 17.0, 20.0, 23.0, 19.0, 21.0, 22.0, 20.0, 12.0, 9.0, 11.0, 5.0, 4.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.89453125, -6.67431640625, -6.4541015625, -6.23388671875, -6.013671875, -5.79345703125, -5.5732421875, -5.35302734375, -5.1328125, -4.91259765625, -4.6923828125, -4.47216796875, -4.251953125, -4.03173828125, -3.8115234375, -3.59130859375, -3.37109375, -3.15087890625, -2.9306640625, -2.71044921875, -2.490234375, -2.27001953125, -2.0498046875, -1.82958984375, -1.609375, -1.38916015625, -1.1689453125, -0.94873046875, -0.728515625, -0.50830078125, -0.2880859375, -0.06787109375, 0.15234375, 0.37255859375, 0.5927734375, 0.81298828125, 1.033203125, 1.25341796875, 1.4736328125, 1.69384765625, 1.9140625, 2.13427734375, 2.3544921875, 2.57470703125, 2.794921875, 3.01513671875, 3.2353515625, 3.45556640625, 3.67578125, 3.89599609375, 4.1162109375, 4.33642578125, 4.556640625, 4.77685546875, 4.9970703125, 5.21728515625, 5.4375, 5.65771484375, 5.8779296875, 6.09814453125, 6.318359375, 6.53857421875, 6.7587890625, 6.97900390625, 7.19921875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 14.0, 16.0, 26.0, 29.0, 70.0, 102.0, 136.0, 152.0, 260.0, 428.0, 590.0, 1039.0, 1560.0, 2530.0, 3849.0, 6299.0, 10396.0, 16999.0, 28476.0, 47172.0, 78194.0, 123597.0, 172034.0, 182285.0, 140064.0, 90825.0, 55851.0, 33224.0, 20093.0, 12349.0, 7341.0, 4585.0, 2821.0, 1751.0, 1166.0, 774.0, 454.0, 323.0, 212.0, 159.0, 113.0, 48.0, 50.0, 37.0, 12.0, 10.0, 6.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8154296875, -0.7892608642578125, -0.763092041015625, -0.7369232177734375, -0.71075439453125, -0.6845855712890625, -0.658416748046875, -0.6322479248046875, -0.6060791015625, -0.5799102783203125, -0.553741455078125, -0.5275726318359375, -0.50140380859375, -0.4752349853515625, -0.449066162109375, -0.4228973388671875, -0.396728515625, -0.3705596923828125, -0.344390869140625, -0.3182220458984375, -0.29205322265625, -0.2658843994140625, -0.239715576171875, -0.2135467529296875, -0.1873779296875, -0.1612091064453125, -0.135040283203125, -0.1088714599609375, -0.08270263671875, -0.0565338134765625, -0.030364990234375, -0.0041961669921875, 0.02197265625, 0.0481414794921875, 0.074310302734375, 0.1004791259765625, 0.12664794921875, 0.1528167724609375, 0.178985595703125, 0.2051544189453125, 0.2313232421875, 0.2574920654296875, 0.283660888671875, 0.3098297119140625, 0.33599853515625, 0.3621673583984375, 0.388336181640625, 0.4145050048828125, 0.440673828125, 0.4668426513671875, 0.493011474609375, 0.5191802978515625, 0.54534912109375, 0.5715179443359375, 0.597686767578125, 0.6238555908203125, 0.6500244140625, 0.6761932373046875, 0.702362060546875, 0.7285308837890625, 0.75469970703125, 0.7808685302734375, 0.807037353515625, 0.8332061767578125, 0.859375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 13.0, 16.0, 15.0, 22.0, 21.0, 27.0, 37.0, 37.0, 40.0, 38.0, 34.0, 35.0, 48.0, 48.0, 1080.0, 54.0, 40.0, 43.0, 43.0, 42.0, 39.0, 34.0, 27.0, 32.0, 32.0, 21.0, 24.0, 19.0, 16.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.60833740234375, -5.4119873046875, -5.21563720703125, -5.019287109375, -4.82293701171875, -4.6265869140625, -4.43023681640625, -4.23388671875, -4.03753662109375, -3.8411865234375, -3.64483642578125, -3.448486328125, -3.25213623046875, -3.0557861328125, -2.85943603515625, -2.6630859375, -2.46673583984375, -2.2703857421875, -2.07403564453125, -1.877685546875, -1.68133544921875, -1.4849853515625, -1.28863525390625, -1.09228515625, -0.89593505859375, -0.6995849609375, -0.50323486328125, -0.306884765625, -0.11053466796875, 0.0858154296875, 0.28216552734375, 0.478515625, 0.67486572265625, 0.8712158203125, 1.06756591796875, 1.263916015625, 1.46026611328125, 1.6566162109375, 1.85296630859375, 2.04931640625, 2.24566650390625, 2.4420166015625, 2.63836669921875, 2.834716796875, 3.03106689453125, 3.2274169921875, 3.42376708984375, 3.6201171875, 3.81646728515625, 4.0128173828125, 4.20916748046875, 4.405517578125, 4.60186767578125, 4.7982177734375, 4.99456787109375, 5.19091796875, 5.38726806640625, 5.5836181640625, 5.77996826171875, 5.976318359375, 6.17266845703125, 6.3690185546875, 6.56536865234375, 6.76171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 6.0, 11.0, 14.0, 28.0, 36.0, 51.0, 84.0, 135.0, 201.0, 282.0, 422.0, 630.0, 917.0, 1314.0, 1979.0, 2766.0, 4309.0, 6283.0, 9285.0, 14094.0, 21222.0, 31590.0, 46802.0, 67400.0, 93013.0, 118996.0, 1162956.0, 149220.0, 107157.0, 80543.0, 56921.0, 38983.0, 26495.0, 17401.0, 11635.0, 7664.0, 5286.0, 3571.0, 2350.0, 1585.0, 1189.0, 734.0, 494.0, 370.0, 235.0, 160.0, 102.0, 88.0, 44.0, 31.0, 19.0, 14.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.52685546875, -0.509735107421875, -0.49261474609375, -0.475494384765625, -0.4583740234375, -0.441253662109375, -0.42413330078125, -0.407012939453125, -0.389892578125, -0.372772216796875, -0.35565185546875, -0.338531494140625, -0.3214111328125, -0.304290771484375, -0.28717041015625, -0.270050048828125, -0.2529296875, -0.235809326171875, -0.21868896484375, -0.201568603515625, -0.1844482421875, -0.167327880859375, -0.15020751953125, -0.133087158203125, -0.115966796875, -0.098846435546875, -0.08172607421875, -0.064605712890625, -0.0474853515625, -0.030364990234375, -0.01324462890625, 0.003875732421875, 0.02099609375, 0.038116455078125, 0.05523681640625, 0.072357177734375, 0.0894775390625, 0.106597900390625, 0.12371826171875, 0.140838623046875, 0.157958984375, 0.175079345703125, 0.19219970703125, 0.209320068359375, 0.2264404296875, 0.243560791015625, 0.26068115234375, 0.277801513671875, 0.294921875, 0.312042236328125, 0.32916259765625, 0.346282958984375, 0.3634033203125, 0.380523681640625, 0.39764404296875, 0.414764404296875, 0.431884765625, 0.449005126953125, 0.46612548828125, 0.483245849609375, 0.5003662109375, 0.517486572265625, 0.53460693359375, 0.551727294921875, 0.56884765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 9.0, 7.0, 6.0, 6.0, 11.0, 10.0, 15.0, 15.0, 16.0, 34.0, 32.0, 54.0, 67.0, 81.0, 79.0, 85.0, 82.0, 90.0, 67.0, 40.0, 52.0, 32.0, 23.0, 20.0, 7.0, 11.0, 6.0, 8.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0113372802734375, -0.010990262031555176, -0.010643243789672852, -0.010296225547790527, -0.009949207305908203, -0.009602189064025879, -0.009255170822143555, -0.00890815258026123, -0.008561134338378906, -0.008214116096496582, -0.007867097854614258, -0.007520079612731934, -0.007173061370849609, -0.006826043128967285, -0.006479024887084961, -0.006132006645202637, -0.0057849884033203125, -0.005437970161437988, -0.005090951919555664, -0.00474393367767334, -0.004396915435791016, -0.004049897193908691, -0.003702878952026367, -0.003355860710144043, -0.0030088424682617188, -0.0026618242263793945, -0.0023148059844970703, -0.001967787742614746, -0.0016207695007324219, -0.0012737512588500977, -0.0009267330169677734, -0.0005797147750854492, -0.000232696533203125, 0.00011432170867919922, 0.00046133995056152344, 0.0008083581924438477, 0.0011553764343261719, 0.001502394676208496, 0.0018494129180908203, 0.0021964311599731445, 0.0025434494018554688, 0.002890467643737793, 0.003237485885620117, 0.0035845041275024414, 0.003931522369384766, 0.00427854061126709, 0.004625558853149414, 0.004972577095031738, 0.0053195953369140625, 0.005666613578796387, 0.006013631820678711, 0.006360650062561035, 0.006707668304443359, 0.007054686546325684, 0.007401704788208008, 0.007748723030090332, 0.008095741271972656, 0.00844275951385498, 0.008789777755737305, 0.009136795997619629, 0.009483814239501953, 0.009830832481384277, 0.010177850723266602, 0.010524868965148926, 0.01087188720703125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 9.0, 9.0, 10.0, 17.0, 20.0, 28.0, 39.0, 62.0, 117.0, 139.0, 246.0, 487.0, 3164.0, 1039810.0, 3079.0, 519.0, 256.0, 159.0, 92.0, 66.0, 36.0, 29.0, 23.0, 24.0, 15.0, 13.0, 15.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.227783203125, -0.220550537109375, -0.21331787109375, -0.206085205078125, -0.1988525390625, -0.191619873046875, -0.18438720703125, -0.177154541015625, -0.169921875, -0.162689208984375, -0.15545654296875, -0.148223876953125, -0.1409912109375, -0.133758544921875, -0.12652587890625, -0.119293212890625, -0.112060546875, -0.104827880859375, -0.09759521484375, -0.090362548828125, -0.0831298828125, -0.075897216796875, -0.06866455078125, -0.061431884765625, -0.05419921875, -0.046966552734375, -0.03973388671875, -0.032501220703125, -0.0252685546875, -0.018035888671875, -0.01080322265625, -0.003570556640625, 0.003662109375, 0.010894775390625, 0.01812744140625, 0.025360107421875, 0.0325927734375, 0.039825439453125, 0.04705810546875, 0.054290771484375, 0.0615234375, 0.068756103515625, 0.07598876953125, 0.083221435546875, 0.0904541015625, 0.097686767578125, 0.10491943359375, 0.112152099609375, 0.119384765625, 0.126617431640625, 0.13385009765625, 0.141082763671875, 0.1483154296875, 0.155548095703125, 0.16278076171875, 0.170013427734375, 0.17724609375, 0.184478759765625, 0.19171142578125, 0.198944091796875, 0.2061767578125, 0.213409423828125, 0.22064208984375, 0.227874755859375, 0.235107421875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 157.0, 850.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02097179926931858, -0.019102659076452255, -0.01723351702094078, -0.015364376828074455, -0.01349523663520813, -0.011626096442341805, -0.009756955318152905, -0.007887814193964005, -0.006018674001097679, -0.0041495333425700665, -0.0022803926840424538, -0.0004112520255148411, 0.0014578886330127716, 0.003327028825879097, 0.005196169950067997, 0.007065311074256897, 0.008934451267123222, 0.010803591459989548, 0.012672732584178448, 0.014541873708367348, 0.016411013901233673, 0.0182801540941, 0.020149294286966324, 0.0220184363424778, 0.023887576535344124, 0.02575671672821045, 0.027625858783721924, 0.02949499897658825, 0.031364139169454575, 0.03323327749967575, 0.035102419555187225, 0.0369715616106987, 0.038840703666210175, 0.04070984572172165, 0.042578984051942825, 0.0444481261074543, 0.046317264437675476, 0.04818640649318695, 0.050055548548698425, 0.0519246906042099, 0.053793828934431076, 0.05566297098994255, 0.05753210932016373, 0.0594012513756752, 0.061270393431186676, 0.06313952803611755, 0.06500867009162903, 0.0668778121471405, 0.06874695420265198, 0.07061609625816345, 0.07248523831367493, 0.0743543729186058, 0.07622351497411728, 0.07809265702962875, 0.07996179908514023, 0.0818309411406517, 0.08370007574558258, 0.08556921780109406, 0.08743835985660553, 0.08930749446153641, 0.09117663651704788, 0.09304577857255936, 0.09491492062807083, 0.0967840626835823, 0.09865320473909378]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 10.0, 10.0, 9.0, 21.0, 22.0, 29.0, 25.0, 31.0, 34.0, 39.0, 34.0, 46.0, 47.0, 42.0, 43.0, 45.0, 55.0, 51.0, 42.0, 52.0, 40.0, 35.0, 26.0, 29.0, 26.0, 25.0, 25.0, 16.0, 15.0, 17.0, 11.0, 13.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006829380989074707, -0.006621931679546833, -0.006414482370018959, -0.006207033060491085, -0.005999583750963211, -0.005792134441435337, -0.005584685131907463, -0.005377235822379589, -0.005169786512851715, -0.004962337203323841, -0.004754887893795967, -0.004547438584268093, -0.004339989274740219, -0.004132539965212345, -0.003925090655684471, -0.003717641346156597, -0.003510192036628723, -0.003302742727100849, -0.003095293417572975, -0.002887844108045101, -0.002680394798517227, -0.002472945488989353, -0.002265496179461479, -0.002058046869933605, -0.0018505975604057312, -0.0016431482508778572, -0.0014356989413499832, -0.0012282496318221092, -0.0010208003222942352, -0.0008133510127663612, -0.0006059017032384872, -0.00039845239371061325, -0.00019100308418273926, 1.6446225345134735e-05, 0.00022389553487300873, 0.0004313448444008827, 0.0006387941539287567, 0.0008462434634566307, 0.0010536927729845047, 0.0012611420825123787, 0.0014685913920402527, 0.0016760407015681267, 0.0018834900110960007, 0.0020909393206238747, 0.0022983886301517487, 0.0025058379396796227, 0.0027132872492074966, 0.0029207365587353706, 0.0031281858682632446, 0.0033356351777911186, 0.0035430844873189926, 0.0037505337968468666, 0.003957983106374741, 0.004165432415902615, 0.004372881725430489, 0.004580331034958363, 0.004787780344486237, 0.0049952296540141106, 0.0052026789635419846, 0.0054101282730698586, 0.0056175775825977325, 0.0058250268921256065, 0.0060324762016534805, 0.0062399255111813545, 0.0064473748207092285]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 3.0, 8.0, 8.0, 11.0, 13.0, 18.0, 12.0, 11.0, 10.0, 20.0, 19.0, 23.0, 22.0, 23.0, 30.0, 27.0, 17.0, 24.0, 37.0, 33.0, 36.0, 30.0, 41.0, 39.0, 41.0, 30.0, 34.0, 37.0, 25.0, 35.0, 27.0, 28.0, 19.0, 18.0, 19.0, 23.0, 19.0, 21.0, 22.0, 20.0, 12.0, 9.0, 11.0, 5.0, 5.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.89453125, -6.67431640625, -6.4541015625, -6.23388671875, -6.013671875, -5.79345703125, -5.5732421875, -5.35302734375, -5.1328125, -4.91259765625, -4.6923828125, -4.47216796875, -4.251953125, -4.03173828125, -3.8115234375, -3.59130859375, -3.37109375, -3.15087890625, -2.9306640625, -2.71044921875, -2.490234375, -2.27001953125, -2.0498046875, -1.82958984375, -1.609375, -1.38916015625, -1.1689453125, -0.94873046875, -0.728515625, -0.50830078125, -0.2880859375, -0.06787109375, 0.15234375, 0.37255859375, 0.5927734375, 0.81298828125, 1.033203125, 1.25341796875, 1.4736328125, 1.69384765625, 1.9140625, 2.13427734375, 2.3544921875, 2.57470703125, 2.794921875, 3.01513671875, 3.2353515625, 3.45556640625, 3.67578125, 3.89599609375, 4.1162109375, 4.33642578125, 4.556640625, 4.77685546875, 4.9970703125, 5.21728515625, 5.4375, 5.65771484375, 5.8779296875, 6.09814453125, 6.318359375, 6.53857421875, 6.7587890625, 6.97900390625, 7.19921875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 15.0, 10.0, 15.0, 33.0, 43.0, 34.0, 45.0, 48.0, 69.0, 84.0, 122.0, 149.0, 195.0, 272.0, 329.0, 430.0, 549.0, 993.0, 2406.0, 7159.0, 24815.0, 145303.0, 767302.0, 72391.0, 16029.0, 4826.0, 1740.0, 849.0, 511.0, 381.0, 292.0, 227.0, 187.0, 125.0, 137.0, 88.0, 74.0, 71.0, 44.0, 38.0, 19.0, 17.0, 19.0, 9.0, 11.0, 7.0, 9.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-17.375, -16.820556640625, -16.26611328125, -15.711669921875, -15.1572265625, -14.602783203125, -14.04833984375, -13.493896484375, -12.939453125, -12.385009765625, -11.83056640625, -11.276123046875, -10.7216796875, -10.167236328125, -9.61279296875, -9.058349609375, -8.50390625, -7.949462890625, -7.39501953125, -6.840576171875, -6.2861328125, -5.731689453125, -5.17724609375, -4.622802734375, -4.068359375, -3.513916015625, -2.95947265625, -2.405029296875, -1.8505859375, -1.296142578125, -0.74169921875, -0.187255859375, 0.3671875, 0.921630859375, 1.47607421875, 2.030517578125, 2.5849609375, 3.139404296875, 3.69384765625, 4.248291015625, 4.802734375, 5.357177734375, 5.91162109375, 6.466064453125, 7.0205078125, 7.574951171875, 8.12939453125, 8.683837890625, 9.23828125, 9.792724609375, 10.34716796875, 10.901611328125, 11.4560546875, 12.010498046875, 12.56494140625, 13.119384765625, 13.673828125, 14.228271484375, 14.78271484375, 15.337158203125, 15.8916015625, 16.446044921875, 17.00048828125, 17.554931640625, 18.109375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 11.0, 9.0, 5.0, 6.0, 7.0, 15.0, 20.0, 19.0, 20.0, 19.0, 16.0, 31.0, 31.0, 29.0, 32.0, 39.0, 39.0, 54.0, 51.0, 92.0, 340.0, 1546.0, 99.0, 77.0, 50.0, 53.0, 40.0, 43.0, 41.0, 37.0, 21.0, 33.0, 20.0, 22.0, 17.0, 16.0, 7.0, 5.0, 7.0, 4.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.203125, -24.442626953125, -23.68212890625, -22.921630859375, -22.1611328125, -21.400634765625, -20.64013671875, -19.879638671875, -19.119140625, -18.358642578125, -17.59814453125, -16.837646484375, -16.0771484375, -15.316650390625, -14.55615234375, -13.795654296875, -13.03515625, -12.274658203125, -11.51416015625, -10.753662109375, -9.9931640625, -9.232666015625, -8.47216796875, -7.711669921875, -6.951171875, -6.190673828125, -5.43017578125, -4.669677734375, -3.9091796875, -3.148681640625, -2.38818359375, -1.627685546875, -0.8671875, -0.106689453125, 0.65380859375, 1.414306640625, 2.1748046875, 2.935302734375, 3.69580078125, 4.456298828125, 5.216796875, 5.977294921875, 6.73779296875, 7.498291015625, 8.2587890625, 9.019287109375, 9.77978515625, 10.540283203125, 11.30078125, 12.061279296875, 12.82177734375, 13.582275390625, 14.3427734375, 15.103271484375, 15.86376953125, 16.624267578125, 17.384765625, 18.145263671875, 18.90576171875, 19.666259765625, 20.4267578125, 21.187255859375, 21.94775390625, 22.708251953125, 23.46875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 11.0, 9.0, 14.0, 16.0, 22.0, 34.0, 58.0, 47.0, 94.0, 113.0, 168.0, 320.0, 1040.0, 16020.0, 3113939.0, 11984.0, 894.0, 321.0, 172.0, 93.0, 68.0, 47.0, 45.0, 37.0, 31.0, 18.0, 14.0, 13.0, 15.0, 10.0, 8.0, 1.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.6875, -89.7421875, -86.796875, -83.8515625, -80.90625, -77.9609375, -75.015625, -72.0703125, -69.125, -66.1796875, -63.234375, -60.2890625, -57.34375, -54.3984375, -51.453125, -48.5078125, -45.5625, -42.6171875, -39.671875, -36.7265625, -33.78125, -30.8359375, -27.890625, -24.9453125, -22.0, -19.0546875, -16.109375, -13.1640625, -10.21875, -7.2734375, -4.328125, -1.3828125, 1.5625, 4.5078125, 7.453125, 10.3984375, 13.34375, 16.2890625, 19.234375, 22.1796875, 25.125, 28.0703125, 31.015625, 33.9609375, 36.90625, 39.8515625, 42.796875, 45.7421875, 48.6875, 51.6328125, 54.578125, 57.5234375, 60.46875, 63.4140625, 66.359375, 69.3046875, 72.25, 75.1953125, 78.140625, 81.0859375, 84.03125, 86.9765625, 89.921875, 92.8671875, 95.8125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 155.0, 733.0, 125.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.6582794189453, -137.4762725830078, -132.29428100585938, -127.11227416992188, -121.9302749633789, -116.74827575683594, -111.56626892089844, -106.38426971435547, -101.2022705078125, -96.02027130126953, -90.83827209472656, -85.65626525878906, -80.4742660522461, -75.29226684570312, -70.11026000976562, -64.92826080322266, -59.74626159667969, -54.56426239013672, -49.382259368896484, -44.20025634765625, -39.01825714111328, -33.83625793457031, -28.654254913330078, -23.472251892089844, -18.290252685546875, -13.108251571655273, -7.926250457763672, -2.7442493438720703, 2.4377517700195312, 7.619752883911133, 12.801753997802734, 17.98375701904297, 23.165756225585938, 28.34775733947754, 33.52975845336914, 38.711761474609375, 43.893760681152344, 49.07575988769531, 54.25776290893555, 59.43976593017578, 64.62176513671875, 69.80376434326172, 74.98576354980469, 80.16777038574219, 85.34976959228516, 90.53176879882812, 95.71377563476562, 100.8957748413086, 106.07777404785156, 111.25977325439453, 116.4417724609375, 121.623779296875, 126.80577850341797, 131.98777770996094, 137.16978454589844, 142.35177612304688, 147.53378295898438, 152.71578979492188, 157.8977813720703, 163.0797882080078, 168.26177978515625, 173.44378662109375, 178.62579345703125, 183.80780029296875, 188.9897918701172]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 9.0, 7.0, 10.0, 13.0, 8.0, 16.0, 28.0, 20.0, 17.0, 33.0, 25.0, 22.0, 36.0, 36.0, 42.0, 34.0, 40.0, 40.0, 52.0, 50.0, 39.0, 49.0, 33.0, 38.0, 31.0, 42.0, 24.0, 32.0, 19.0, 23.0, 19.0, 18.0, 11.0, 16.0, 13.0, 6.0, 9.0, 9.0, 9.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.78366088867188, -68.73002624511719, -66.67639923095703, -64.62276458740234, -62.56913757324219, -60.515506744384766, -58.461875915527344, -56.408241271972656, -54.3546142578125, -52.30098342895508, -50.247352600097656, -48.193721771240234, -46.14009094238281, -44.08646011352539, -42.03282928466797, -39.97919464111328, -37.92556381225586, -35.87193298339844, -33.818302154541016, -31.764671325683594, -29.711040496826172, -27.65740966796875, -25.603776931762695, -23.550146102905273, -21.49651527404785, -19.44288444519043, -17.389253616333008, -15.33562183380127, -13.281991004943848, -11.228360176086426, -9.174728393554688, -7.121097564697266, -5.067470550537109, -3.0138394832611084, -0.9602084159851074, 1.0934228897094727, 3.1470537185668945, 5.200684547424316, 7.254316329956055, 9.307947158813477, 11.361577987670898, 13.41520881652832, 15.468839645385742, 17.522472381591797, 19.57610321044922, 21.62973403930664, 23.683364868164062, 25.736995697021484, 27.790626525878906, 29.844257354736328, 31.89788818359375, 33.95151901245117, 36.005149841308594, 38.058780670166016, 40.11241149902344, 42.166046142578125, 44.21967315673828, 46.2733039855957, 48.326934814453125, 50.38056564331055, 52.43419647216797, 54.48782730102539, 56.54145812988281, 58.5950927734375, 60.64872360229492]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 7.0, 7.0, 8.0, 19.0, 17.0, 17.0, 17.0, 26.0, 22.0, 22.0, 20.0, 22.0, 22.0, 23.0, 30.0, 30.0, 29.0, 37.0, 31.0, 45.0, 40.0, 28.0, 44.0, 41.0, 27.0, 33.0, 35.0, 27.0, 28.0, 18.0, 24.0, 15.0, 31.0, 20.0, 11.0, 22.0, 7.0, 14.0, 14.0, 8.0, 12.0, 6.0, 7.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.484375, -7.253173828125, -7.02197265625, -6.790771484375, -6.5595703125, -6.328369140625, -6.09716796875, -5.865966796875, -5.634765625, -5.403564453125, -5.17236328125, -4.941162109375, -4.7099609375, -4.478759765625, -4.24755859375, -4.016357421875, -3.78515625, -3.553955078125, -3.32275390625, -3.091552734375, -2.8603515625, -2.629150390625, -2.39794921875, -2.166748046875, -1.935546875, -1.704345703125, -1.47314453125, -1.241943359375, -1.0107421875, -0.779541015625, -0.54833984375, -0.317138671875, -0.0859375, 0.145263671875, 0.37646484375, 0.607666015625, 0.8388671875, 1.070068359375, 1.30126953125, 1.532470703125, 1.763671875, 1.994873046875, 2.22607421875, 2.457275390625, 2.6884765625, 2.919677734375, 3.15087890625, 3.382080078125, 3.61328125, 3.844482421875, 4.07568359375, 4.306884765625, 4.5380859375, 4.769287109375, 5.00048828125, 5.231689453125, 5.462890625, 5.694091796875, 5.92529296875, 6.156494140625, 6.3876953125, 6.618896484375, 6.85009765625, 7.081298828125, 7.3125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 6.0, 10.0, 15.0, 19.0, 32.0, 17.0, 29.0, 46.0, 35.0, 65.0, 120.0, 138.0, 168.0, 224.0, 342.0, 573.0, 1087.0, 2266.0, 5985.0, 19477.0, 90458.0, 589102.0, 2034367.0, 1190433.0, 204976.0, 36791.0, 10195.0, 3519.0, 1503.0, 779.0, 437.0, 280.0, 185.0, 124.0, 94.0, 94.0, 61.0, 39.0, 39.0, 34.0, 18.0, 18.0, 11.0, 11.0, 8.0, 13.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.8515625, -13.42822265625, -13.0048828125, -12.58154296875, -12.158203125, -11.73486328125, -11.3115234375, -10.88818359375, -10.46484375, -10.04150390625, -9.6181640625, -9.19482421875, -8.771484375, -8.34814453125, -7.9248046875, -7.50146484375, -7.078125, -6.65478515625, -6.2314453125, -5.80810546875, -5.384765625, -4.96142578125, -4.5380859375, -4.11474609375, -3.69140625, -3.26806640625, -2.8447265625, -2.42138671875, -1.998046875, -1.57470703125, -1.1513671875, -0.72802734375, -0.3046875, 0.11865234375, 0.5419921875, 0.96533203125, 1.388671875, 1.81201171875, 2.2353515625, 2.65869140625, 3.08203125, 3.50537109375, 3.9287109375, 4.35205078125, 4.775390625, 5.19873046875, 5.6220703125, 6.04541015625, 6.46875, 6.89208984375, 7.3154296875, 7.73876953125, 8.162109375, 8.58544921875, 9.0087890625, 9.43212890625, 9.85546875, 10.27880859375, 10.7021484375, 11.12548828125, 11.548828125, 11.97216796875, 12.3955078125, 12.81884765625, 13.2421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 4.0, 2.0, 6.0, 18.0, 16.0, 12.0, 20.0, 22.0, 28.0, 52.0, 53.0, 85.0, 97.0, 121.0, 184.0, 249.0, 293.0, 372.0, 423.0, 414.0, 329.0, 266.0, 219.0, 163.0, 126.0, 114.0, 63.0, 68.0, 53.0, 51.0, 32.0, 24.0, 5.0, 16.0, 12.0, 7.0, 8.0, 6.0, 5.0, 4.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-10.2265625, -9.8712158203125, -9.515869140625, -9.1605224609375, -8.80517578125, -8.4498291015625, -8.094482421875, -7.7391357421875, -7.3837890625, -7.0284423828125, -6.673095703125, -6.3177490234375, -5.96240234375, -5.6070556640625, -5.251708984375, -4.8963623046875, -4.541015625, -4.1856689453125, -3.830322265625, -3.4749755859375, -3.11962890625, -2.7642822265625, -2.408935546875, -2.0535888671875, -1.6982421875, -1.3428955078125, -0.987548828125, -0.6322021484375, -0.27685546875, 0.0784912109375, 0.433837890625, 0.7891845703125, 1.14453125, 1.4998779296875, 1.855224609375, 2.2105712890625, 2.56591796875, 2.9212646484375, 3.276611328125, 3.6319580078125, 3.9873046875, 4.3426513671875, 4.697998046875, 5.0533447265625, 5.40869140625, 5.7640380859375, 6.119384765625, 6.4747314453125, 6.830078125, 7.1854248046875, 7.540771484375, 7.8961181640625, 8.25146484375, 8.6068115234375, 8.962158203125, 9.3175048828125, 9.6728515625, 10.0281982421875, 10.383544921875, 10.7388916015625, 11.09423828125, 11.4495849609375, 11.804931640625, 12.1602783203125, 12.515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 9.0, 10.0, 13.0, 11.0, 10.0, 27.0, 23.0, 25.0, 58.0, 62.0, 112.0, 130.0, 208.0, 290.0, 468.0, 1062.0, 3660.0, 27315.0, 597643.0, 3415959.0, 132682.0, 10737.0, 1956.0, 714.0, 340.0, 214.0, 149.0, 93.0, 95.0, 53.0, 42.0, 26.0, 21.0, 14.0, 13.0, 4.0, 10.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.49951171875, -37.3427734375, -36.18603515625, -35.029296875, -33.87255859375, -32.7158203125, -31.55908203125, -30.40234375, -29.24560546875, -28.0888671875, -26.93212890625, -25.775390625, -24.61865234375, -23.4619140625, -22.30517578125, -21.1484375, -19.99169921875, -18.8349609375, -17.67822265625, -16.521484375, -15.36474609375, -14.2080078125, -13.05126953125, -11.89453125, -10.73779296875, -9.5810546875, -8.42431640625, -7.267578125, -6.11083984375, -4.9541015625, -3.79736328125, -2.640625, -1.48388671875, -0.3271484375, 0.82958984375, 1.986328125, 3.14306640625, 4.2998046875, 5.45654296875, 6.61328125, 7.77001953125, 8.9267578125, 10.08349609375, 11.240234375, 12.39697265625, 13.5537109375, 14.71044921875, 15.8671875, 17.02392578125, 18.1806640625, 19.33740234375, 20.494140625, 21.65087890625, 22.8076171875, 23.96435546875, 25.12109375, 26.27783203125, 27.4345703125, 28.59130859375, 29.748046875, 30.90478515625, 32.0615234375, 33.21826171875, 34.375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 23.0, 965.0, 29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-614.2161865234375, -590.099609375, -565.9830322265625, -541.866455078125, -517.7498779296875, -493.63330078125, -469.5167541503906, -445.4001770019531, -421.2835998535156, -397.1670227050781, -373.0504455566406, -348.93389892578125, -324.81732177734375, -300.70074462890625, -276.58416748046875, -252.46759033203125, -228.35101318359375, -204.23443603515625, -180.11785888671875, -156.0012969970703, -131.8847198486328, -107.76814270019531, -83.65158081054688, -59.535003662109375, -35.418426513671875, -11.30185317993164, 12.814720153808594, 36.93128967285156, 61.04786682128906, 85.16444396972656, 109.281005859375, 133.3975830078125, 157.51422119140625, 181.63079833984375, 205.74737548828125, 229.8639373779297, 253.9805145263672, 278.09710693359375, 302.2136535644531, 326.3302307128906, 350.4468078613281, 374.5633850097656, 398.6799621582031, 422.7965087890625, 446.9130859375, 471.0296630859375, 495.146240234375, 519.2628173828125, 543.37939453125, 567.4959716796875, 591.612548828125, 615.7291259765625, 639.845703125, 663.9622802734375, 688.078857421875, 712.1954345703125, 736.31201171875, 760.4285888671875, 784.545166015625, 808.6617431640625, 832.7783203125, 856.8948974609375, 881.011474609375, 905.1280517578125, 929.2445678710938]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 14.0, 13.0, 10.0, 17.0, 16.0, 24.0, 17.0, 36.0, 31.0, 39.0, 27.0, 37.0, 32.0, 32.0, 48.0, 44.0, 41.0, 55.0, 40.0, 49.0, 43.0, 35.0, 28.0, 43.0, 28.0, 33.0, 26.0, 20.0, 16.0, 24.0, 17.0, 14.0, 9.0, 10.0, 7.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.998779296875, -47.50312805175781, -46.00748062133789, -44.5118293762207, -43.01618194580078, -41.520530700683594, -40.024879455566406, -38.52922821044922, -37.0335807800293, -35.53792953491211, -34.04228210449219, -32.546630859375, -31.050981521606445, -29.55533218383789, -28.059680938720703, -26.56403160095215, -25.068382263183594, -23.57273292541504, -22.077083587646484, -20.581432342529297, -19.085783004760742, -17.590133666992188, -16.094482421875, -14.598833084106445, -13.10318374633789, -11.607534408569336, -10.111884117126465, -8.616233825683594, -7.120584487915039, -5.624934673309326, -4.129284858703613, -2.633634567260742, -1.1379852294921875, 0.3576645851135254, 1.8533143997192383, 3.348964214324951, 4.844614028930664, 6.340263843536377, 7.83591365814209, 9.331563949584961, 10.827213287353516, 12.32286262512207, 13.818512916564941, 15.314163208007812, 16.809812545776367, 18.305461883544922, 19.80111312866211, 21.296762466430664, 22.79241180419922, 24.288061141967773, 25.783710479736328, 27.279361724853516, 28.77501106262207, 30.270660400390625, 31.766311645507812, 33.261962890625, 34.75761032104492, 36.25326156616211, 37.74890899658203, 39.24456024169922, 40.740211486816406, 42.23585891723633, 43.731510162353516, 45.22715759277344, 46.722808837890625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 5.0, 11.0, 12.0, 18.0, 14.0, 15.0, 23.0, 26.0, 21.0, 33.0, 31.0, 27.0, 42.0, 33.0, 39.0, 33.0, 37.0, 36.0, 51.0, 33.0, 48.0, 43.0, 41.0, 35.0, 24.0, 25.0, 28.0, 28.0, 33.0, 26.0, 21.0, 19.0, 13.0, 7.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9617919921875, -7.689208984375, -7.4166259765625, -7.14404296875, -6.8714599609375, -6.598876953125, -6.3262939453125, -6.0537109375, -5.7811279296875, -5.508544921875, -5.2359619140625, -4.96337890625, -4.6907958984375, -4.418212890625, -4.1456298828125, -3.873046875, -3.6004638671875, -3.327880859375, -3.0552978515625, -2.78271484375, -2.5101318359375, -2.237548828125, -1.9649658203125, -1.6923828125, -1.4197998046875, -1.147216796875, -0.8746337890625, -0.60205078125, -0.3294677734375, -0.056884765625, 0.2156982421875, 0.48828125, 0.7608642578125, 1.033447265625, 1.3060302734375, 1.57861328125, 1.8511962890625, 2.123779296875, 2.3963623046875, 2.6689453125, 2.9415283203125, 3.214111328125, 3.4866943359375, 3.75927734375, 4.0318603515625, 4.304443359375, 4.5770263671875, 4.849609375, 5.1221923828125, 5.394775390625, 5.6673583984375, 5.93994140625, 6.2125244140625, 6.485107421875, 6.7576904296875, 7.0302734375, 7.3028564453125, 7.575439453125, 7.8480224609375, 8.12060546875, 8.3931884765625, 8.665771484375, 8.9383544921875, 9.2109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 16.0, 22.0, 29.0, 59.0, 58.0, 119.0, 160.0, 226.0, 343.0, 462.0, 669.0, 1090.0, 1534.0, 2386.0, 3587.0, 5463.0, 8448.0, 13325.0, 20584.0, 32221.0, 50229.0, 76252.0, 112241.0, 150397.0, 163227.0, 133511.0, 94597.0, 62466.0, 40906.0, 26002.0, 16634.0, 10781.0, 6969.0, 4560.0, 2924.0, 2033.0, 1263.0, 917.0, 618.0, 400.0, 253.0, 172.0, 132.0, 88.0, 56.0, 50.0, 24.0, 19.0, 12.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73876953125, -0.7151412963867188, -0.6915130615234375, -0.6678848266601562, -0.644256591796875, -0.6206283569335938, -0.5970001220703125, -0.5733718872070312, -0.54974365234375, -0.5261154174804688, -0.5024871826171875, -0.47885894775390625, -0.455230712890625, -0.43160247802734375, -0.4079742431640625, -0.38434600830078125, -0.3607177734375, -0.33708953857421875, -0.3134613037109375, -0.28983306884765625, -0.266204833984375, -0.24257659912109375, -0.2189483642578125, -0.19532012939453125, -0.17169189453125, -0.14806365966796875, -0.1244354248046875, -0.10080718994140625, -0.077178955078125, -0.05355072021484375, -0.0299224853515625, -0.00629425048828125, 0.017333984375, 0.04096221923828125, 0.0645904541015625, 0.08821868896484375, 0.111846923828125, 0.13547515869140625, 0.1591033935546875, 0.18273162841796875, 0.20635986328125, 0.22998809814453125, 0.2536163330078125, 0.27724456787109375, 0.300872802734375, 0.32450103759765625, 0.3481292724609375, 0.37175750732421875, 0.3953857421875, 0.41901397705078125, 0.4426422119140625, 0.46627044677734375, 0.489898681640625, 0.5135269165039062, 0.5371551513671875, 0.5607833862304688, 0.58441162109375, 0.6080398559570312, 0.6316680908203125, 0.6552963256835938, 0.678924560546875, 0.7025527954101562, 0.7261810302734375, 0.7498092651367188, 0.7734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 8.0, 7.0, 8.0, 10.0, 8.0, 14.0, 12.0, 15.0, 19.0, 21.0, 17.0, 18.0, 28.0, 25.0, 33.0, 33.0, 34.0, 33.0, 36.0, 32.0, 41.0, 1063.0, 49.0, 39.0, 30.0, 43.0, 40.0, 33.0, 34.0, 32.0, 30.0, 26.0, 30.0, 24.0, 10.0, 12.0, 13.0, 11.0, 8.0, 8.0, 7.0, 7.0, 3.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.5078125, -5.33544921875, -5.1630859375, -4.99072265625, -4.818359375, -4.64599609375, -4.4736328125, -4.30126953125, -4.12890625, -3.95654296875, -3.7841796875, -3.61181640625, -3.439453125, -3.26708984375, -3.0947265625, -2.92236328125, -2.75, -2.57763671875, -2.4052734375, -2.23291015625, -2.060546875, -1.88818359375, -1.7158203125, -1.54345703125, -1.37109375, -1.19873046875, -1.0263671875, -0.85400390625, -0.681640625, -0.50927734375, -0.3369140625, -0.16455078125, 0.0078125, 0.18017578125, 0.3525390625, 0.52490234375, 0.697265625, 0.86962890625, 1.0419921875, 1.21435546875, 1.38671875, 1.55908203125, 1.7314453125, 1.90380859375, 2.076171875, 2.24853515625, 2.4208984375, 2.59326171875, 2.765625, 2.93798828125, 3.1103515625, 3.28271484375, 3.455078125, 3.62744140625, 3.7998046875, 3.97216796875, 4.14453125, 4.31689453125, 4.4892578125, 4.66162109375, 4.833984375, 5.00634765625, 5.1787109375, 5.35107421875, 5.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 23.0, 20.0, 37.0, 60.0, 85.0, 117.0, 191.0, 293.0, 447.0, 638.0, 927.0, 1304.0, 1961.0, 2843.0, 4116.0, 5890.0, 8579.0, 12715.0, 19126.0, 27649.0, 40673.0, 58829.0, 81655.0, 107203.0, 148987.0, 1156326.0, 114524.0, 90740.0, 65971.0, 45934.0, 31593.0, 21330.0, 14681.0, 9890.0, 6932.0, 4612.0, 3307.0, 2165.0, 1488.0, 1045.0, 730.0, 507.0, 319.0, 227.0, 148.0, 97.0, 69.0, 46.0, 32.0, 15.0, 9.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.537109375, -0.5198745727539062, -0.5026397705078125, -0.48540496826171875, -0.468170166015625, -0.45093536376953125, -0.4337005615234375, -0.41646575927734375, -0.39923095703125, -0.38199615478515625, -0.3647613525390625, -0.34752655029296875, -0.330291748046875, -0.31305694580078125, -0.2958221435546875, -0.27858734130859375, -0.2613525390625, -0.24411773681640625, -0.2268829345703125, -0.20964813232421875, -0.192413330078125, -0.17517852783203125, -0.1579437255859375, -0.14070892333984375, -0.12347412109375, -0.10623931884765625, -0.0890045166015625, -0.07176971435546875, -0.054534912109375, -0.03730010986328125, -0.0200653076171875, -0.00283050537109375, 0.014404296875, 0.03163909912109375, 0.0488739013671875, 0.06610870361328125, 0.083343505859375, 0.10057830810546875, 0.1178131103515625, 0.13504791259765625, 0.15228271484375, 0.16951751708984375, 0.1867523193359375, 0.20398712158203125, 0.221221923828125, 0.23845672607421875, 0.2556915283203125, 0.27292633056640625, 0.2901611328125, 0.30739593505859375, 0.3246307373046875, 0.34186553955078125, 0.359100341796875, 0.37633514404296875, 0.3935699462890625, 0.41080474853515625, 0.42803955078125, 0.44527435302734375, 0.4625091552734375, 0.47974395751953125, 0.496978759765625, 0.5142135620117188, 0.5314483642578125, 0.5486831665039062, 0.56591796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 8.0, 6.0, 15.0, 25.0, 32.0, 49.0, 63.0, 76.0, 87.0, 101.0, 95.0, 90.0, 64.0, 60.0, 47.0, 36.0, 28.0, 28.0, 19.0, 9.0, 5.0, 5.0, 3.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00931549072265625, -0.009016275405883789, -0.008717060089111328, -0.008417844772338867, -0.008118629455566406, -0.007819414138793945, -0.007520198822021484, -0.0072209835052490234, -0.0069217681884765625, -0.0066225528717041016, -0.006323337554931641, -0.00602412223815918, -0.005724906921386719, -0.005425691604614258, -0.005126476287841797, -0.004827260971069336, -0.004528045654296875, -0.004228830337524414, -0.003929615020751953, -0.003630399703979492, -0.0033311843872070312, -0.0030319690704345703, -0.0027327537536621094, -0.0024335384368896484, -0.0021343231201171875, -0.0018351078033447266, -0.0015358924865722656, -0.0012366771697998047, -0.0009374618530273438, -0.0006382465362548828, -0.0003390312194824219, -3.981590270996094e-05, 0.0002593994140625, 0.0005586147308349609, 0.0008578300476074219, 0.0011570453643798828, 0.0014562606811523438, 0.0017554759979248047, 0.0020546913146972656, 0.0023539066314697266, 0.0026531219482421875, 0.0029523372650146484, 0.0032515525817871094, 0.0035507678985595703, 0.0038499832153320312, 0.004149198532104492, 0.004448413848876953, 0.004747629165649414, 0.005046844482421875, 0.005346059799194336, 0.005645275115966797, 0.005944490432739258, 0.006243705749511719, 0.00654292106628418, 0.006842136383056641, 0.0071413516998291016, 0.0074405670166015625, 0.0077397823333740234, 0.008038997650146484, 0.008338212966918945, 0.008637428283691406, 0.008936643600463867, 0.009235858917236328, 0.009535074234008789, 0.00983428955078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 11.0, 14.0, 16.0, 32.0, 45.0, 56.0, 96.0, 116.0, 223.0, 428.0, 2202.0, 1039631.0, 4445.0, 513.0, 241.0, 156.0, 86.0, 62.0, 45.0, 22.0, 13.0, 12.0, 12.0, 16.0, 5.0, 5.0, 3.0, 4.0, 2.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.203857421875, -0.1977863311767578, -0.19171524047851562, -0.18564414978027344, -0.17957305908203125, -0.17350196838378906, -0.16743087768554688, -0.1613597869873047, -0.1552886962890625, -0.1492176055908203, -0.14314651489257812, -0.13707542419433594, -0.13100433349609375, -0.12493324279785156, -0.11886215209960938, -0.11279106140136719, -0.106719970703125, -0.10064888000488281, -0.09457778930664062, -0.08850669860839844, -0.08243560791015625, -0.07636451721191406, -0.07029342651367188, -0.06422233581542969, -0.0581512451171875, -0.05208015441894531, -0.046009063720703125, -0.03993797302246094, -0.03386688232421875, -0.027795791625976562, -0.021724700927734375, -0.015653610229492188, -0.00958251953125, -0.0035114288330078125, 0.002559661865234375, 0.008630752563476562, 0.01470184326171875, 0.020772933959960938, 0.026844024658203125, 0.03291511535644531, 0.0389862060546875, 0.04505729675292969, 0.051128387451171875, 0.05719947814941406, 0.06327056884765625, 0.06934165954589844, 0.07541275024414062, 0.08148384094238281, 0.087554931640625, 0.09362602233886719, 0.09969711303710938, 0.10576820373535156, 0.11183929443359375, 0.11791038513183594, 0.12398147583007812, 0.1300525665283203, 0.1361236572265625, 0.1421947479248047, 0.14826583862304688, 0.15433692932128906, 0.16040802001953125, 0.16647911071777344, 0.17255020141601562, 0.1786212921142578, 0.1846923828125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 904.0, 103.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027525294572114944, -0.0011728373356163502, 0.0004068547859787941, 0.0019865469075739384, 0.0035662390291690826, 0.005145931616425514, 0.006725623272359371, 0.008305314928293228, 0.00988500751554966, 0.011464700102806091, 0.013044391758739948, 0.014624083414673805, 0.016203776001930237, 0.01778346858918667, 0.0193631611764431, 0.020942851901054382, 0.022522544488310814, 0.024102237075567245, 0.025681927800178528, 0.02726162038743496, 0.02884131297469139, 0.030421005561947823, 0.032000698149204254, 0.033580388873815536, 0.03516007959842682, 0.0367397703230381, 0.03831946477293968, 0.039899155497550964, 0.041478849947452545, 0.04305854067206383, 0.04463823139667511, 0.04621792584657669, 0.04779762029647827, 0.049377311021089554, 0.050957005470991135, 0.05253669619560242, 0.054116390645504, 0.05569608137011528, 0.05727577209472656, 0.05885546654462814, 0.060435157269239426, 0.06201484799385071, 0.06359454244375229, 0.06517423689365387, 0.06675392389297485, 0.06833361834287643, 0.06991331279277802, 0.071492999792099, 0.07307269424200058, 0.07465238869190216, 0.07623207569122314, 0.07781177014112473, 0.0793914645910263, 0.08097115159034729, 0.08255084604024887, 0.08413054049015045, 0.08571022748947144, 0.08728992193937302, 0.088869608938694, 0.09044930338859558, 0.09202899783849716, 0.09360869228839874, 0.09518837928771973, 0.09676807373762131, 0.09834776818752289]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 7.0, 15.0, 21.0, 21.0, 26.0, 36.0, 31.0, 42.0, 35.0, 32.0, 31.0, 54.0, 46.0, 52.0, 62.0, 58.0, 67.0, 50.0, 38.0, 35.0, 33.0, 29.0, 37.0, 29.0, 21.0, 16.0, 15.0, 9.0, 9.0, 5.0, 6.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0068048834800720215, -0.006634333170950413, -0.006463782861828804, -0.006293232552707195, -0.0061226822435855865, -0.005952131934463978, -0.005781581625342369, -0.00561103131622076, -0.005440481007099152, -0.005269930697977543, -0.005099380388855934, -0.004928830079734325, -0.004758279770612717, -0.004587729461491108, -0.004417179152369499, -0.0042466288432478905, -0.004076078534126282, -0.003905528225004673, -0.0037349779158830643, -0.0035644276067614555, -0.003393877297639847, -0.003223326988518238, -0.0030527766793966293, -0.0028822263702750206, -0.002711676061153412, -0.002541125752031803, -0.0023705754429101944, -0.0022000251337885857, -0.002029474824666977, -0.0018589245155453682, -0.0016883742064237595, -0.0015178238973021507, -0.001347273588180542, -0.0011767232790589333, -0.0010061729699373245, -0.0008356226608157158, -0.0006650723516941071, -0.0004945220425724983, -0.0003239717334508896, -0.00015342142432928085, 1.712888479232788e-05, 0.00018767919391393661, 0.00035822950303554535, 0.0005287798121571541, 0.0006993301212787628, 0.0008698804304003716, 0.0010404307395219803, 0.001210981048643589, 0.0013815313577651978, 0.0015520816668868065, 0.0017226319760084152, 0.001893182285130024, 0.0020637325942516327, 0.0022342829033732414, 0.00240483321249485, 0.002575383521616459, 0.0027459338307380676, 0.0029164841398596764, 0.003087034448981285, 0.003257584758102894, 0.0034281350672245026, 0.0035986853763461113, 0.00376923568546772, 0.003939785994589329, 0.0041103363037109375]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 5.0, 11.0, 12.0, 18.0, 14.0, 15.0, 23.0, 26.0, 21.0, 33.0, 31.0, 27.0, 42.0, 33.0, 39.0, 33.0, 37.0, 36.0, 51.0, 33.0, 48.0, 43.0, 41.0, 35.0, 24.0, 25.0, 28.0, 28.0, 33.0, 26.0, 21.0, 19.0, 13.0, 7.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9617919921875, -7.689208984375, -7.4166259765625, -7.14404296875, -6.8714599609375, -6.598876953125, -6.3262939453125, -6.0537109375, -5.7811279296875, -5.508544921875, -5.2359619140625, -4.96337890625, -4.6907958984375, -4.418212890625, -4.1456298828125, -3.873046875, -3.6004638671875, -3.327880859375, -3.0552978515625, -2.78271484375, -2.5101318359375, -2.237548828125, -1.9649658203125, -1.6923828125, -1.4197998046875, -1.147216796875, -0.8746337890625, -0.60205078125, -0.3294677734375, -0.056884765625, 0.2156982421875, 0.48828125, 0.7608642578125, 1.033447265625, 1.3060302734375, 1.57861328125, 1.8511962890625, 2.123779296875, 2.3963623046875, 2.6689453125, 2.9415283203125, 3.214111328125, 3.4866943359375, 3.75927734375, 4.0318603515625, 4.304443359375, 4.5770263671875, 4.849609375, 5.1221923828125, 5.394775390625, 5.6673583984375, 5.93994140625, 6.2125244140625, 6.485107421875, 6.7576904296875, 7.0302734375, 7.3028564453125, 7.575439453125, 7.8480224609375, 8.12060546875, 8.3931884765625, 8.665771484375, 8.9383544921875, 9.2109375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 8.0, 9.0, 13.0, 17.0, 13.0, 25.0, 23.0, 45.0, 53.0, 55.0, 90.0, 142.0, 189.0, 250.0, 451.0, 815.0, 1560.0, 3119.0, 6812.0, 15647.0, 38604.0, 103737.0, 349520.0, 354060.0, 104694.0, 38973.0, 15802.0, 6799.0, 3197.0, 1580.0, 821.0, 496.0, 274.0, 174.0, 131.0, 93.0, 73.0, 42.0, 42.0, 26.0, 20.0, 20.0, 18.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.0518798828125, -9.705322265625, -9.3587646484375, -9.01220703125, -8.6656494140625, -8.319091796875, -7.9725341796875, -7.6259765625, -7.2794189453125, -6.932861328125, -6.5863037109375, -6.23974609375, -5.8931884765625, -5.546630859375, -5.2000732421875, -4.853515625, -4.5069580078125, -4.160400390625, -3.8138427734375, -3.46728515625, -3.1207275390625, -2.774169921875, -2.4276123046875, -2.0810546875, -1.7344970703125, -1.387939453125, -1.0413818359375, -0.69482421875, -0.3482666015625, -0.001708984375, 0.3448486328125, 0.69140625, 1.0379638671875, 1.384521484375, 1.7310791015625, 2.07763671875, 2.4241943359375, 2.770751953125, 3.1173095703125, 3.4638671875, 3.8104248046875, 4.156982421875, 4.5035400390625, 4.85009765625, 5.1966552734375, 5.543212890625, 5.8897705078125, 6.236328125, 6.5828857421875, 6.929443359375, 7.2760009765625, 7.62255859375, 7.9691162109375, 8.315673828125, 8.6622314453125, 9.0087890625, 9.3553466796875, 9.701904296875, 10.0484619140625, 10.39501953125, 10.7415771484375, 11.088134765625, 11.4346923828125, 11.78125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 4.0, 8.0, 5.0, 14.0, 8.0, 8.0, 16.0, 18.0, 26.0, 24.0, 26.0, 21.0, 35.0, 33.0, 32.0, 49.0, 67.0, 82.0, 149.0, 1509.0, 292.0, 113.0, 73.0, 66.0, 51.0, 45.0, 43.0, 22.0, 24.0, 36.0, 20.0, 19.0, 16.0, 14.0, 12.0, 18.0, 10.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-25.140625, -24.349853515625, -23.55908203125, -22.768310546875, -21.9775390625, -21.186767578125, -20.39599609375, -19.605224609375, -18.814453125, -18.023681640625, -17.23291015625, -16.442138671875, -15.6513671875, -14.860595703125, -14.06982421875, -13.279052734375, -12.48828125, -11.697509765625, -10.90673828125, -10.115966796875, -9.3251953125, -8.534423828125, -7.74365234375, -6.952880859375, -6.162109375, -5.371337890625, -4.58056640625, -3.789794921875, -2.9990234375, -2.208251953125, -1.41748046875, -0.626708984375, 0.1640625, 0.954833984375, 1.74560546875, 2.536376953125, 3.3271484375, 4.117919921875, 4.90869140625, 5.699462890625, 6.490234375, 7.281005859375, 8.07177734375, 8.862548828125, 9.6533203125, 10.444091796875, 11.23486328125, 12.025634765625, 12.81640625, 13.607177734375, 14.39794921875, 15.188720703125, 15.9794921875, 16.770263671875, 17.56103515625, 18.351806640625, 19.142578125, 19.933349609375, 20.72412109375, 21.514892578125, 22.3056640625, 23.096435546875, 23.88720703125, 24.677978515625, 25.46875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 10.0, 11.0, 12.0, 16.0, 24.0, 31.0, 46.0, 61.0, 83.0, 108.0, 181.0, 296.0, 537.0, 1778.0, 29276.0, 2739511.0, 363707.0, 7918.0, 913.0, 412.0, 219.0, 157.0, 107.0, 62.0, 61.0, 47.0, 24.0, 23.0, 22.0, 15.0, 3.0, 10.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-50.40625, -48.9580078125, -47.509765625, -46.0615234375, -44.61328125, -43.1650390625, -41.716796875, -40.2685546875, -38.8203125, -37.3720703125, -35.923828125, -34.4755859375, -33.02734375, -31.5791015625, -30.130859375, -28.6826171875, -27.234375, -25.7861328125, -24.337890625, -22.8896484375, -21.44140625, -19.9931640625, -18.544921875, -17.0966796875, -15.6484375, -14.2001953125, -12.751953125, -11.3037109375, -9.85546875, -8.4072265625, -6.958984375, -5.5107421875, -4.0625, -2.6142578125, -1.166015625, 0.2822265625, 1.73046875, 3.1787109375, 4.626953125, 6.0751953125, 7.5234375, 8.9716796875, 10.419921875, 11.8681640625, 13.31640625, 14.7646484375, 16.212890625, 17.6611328125, 19.109375, 20.5576171875, 22.005859375, 23.4541015625, 24.90234375, 26.3505859375, 27.798828125, 29.2470703125, 30.6953125, 32.1435546875, 33.591796875, 35.0400390625, 36.48828125, 37.9365234375, 39.384765625, 40.8330078125, 42.28125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 77.0, 701.0, 229.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.974557876586914, -19.619478225708008, -12.264399528503418, -4.909320831298828, 2.445758819580078, 9.800836563110352, 17.155916213989258, 24.510995864868164, 31.86607551574707, 39.221153259277344, 46.57623291015625, 53.931312561035156, 61.28639221191406, 68.64147186279297, 75.99655151367188, 83.35163116455078, 90.70671081542969, 98.0617904663086, 105.4168701171875, 112.7719497680664, 120.12702941894531, 127.48210144042969, 134.83718872070312, 142.1922607421875, 149.54734802246094, 156.9024200439453, 164.25750732421875, 171.61257934570312, 178.96766662597656, 186.32273864746094, 193.67782592773438, 201.03289794921875, 208.3879852294922, 215.74305725097656, 223.09814453125, 230.45321655273438, 237.8083038330078, 245.1633758544922, 252.51846313476562, 259.87353515625, 267.2286071777344, 274.58367919921875, 281.9387512207031, 289.2938537597656, 296.64892578125, 304.0039978027344, 311.35906982421875, 318.71417236328125, 326.0692443847656, 333.42431640625, 340.7793884277344, 348.1344909667969, 355.48956298828125, 362.8446350097656, 370.19970703125, 377.5548095703125, 384.9098815917969, 392.26495361328125, 399.6200256347656, 406.9751281738281, 414.3302001953125, 421.6852722167969, 429.04034423828125, 436.39544677734375, 443.7505187988281]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 6.0, 3.0, 5.0, 11.0, 20.0, 11.0, 15.0, 17.0, 22.0, 25.0, 27.0, 35.0, 34.0, 30.0, 39.0, 44.0, 51.0, 53.0, 37.0, 39.0, 49.0, 50.0, 42.0, 36.0, 26.0, 33.0, 35.0, 25.0, 25.0, 24.0, 20.0, 20.0, 16.0, 11.0, 8.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.38353729248047, -62.39617156982422, -60.40880584716797, -58.42144012451172, -56.43407440185547, -54.44670867919922, -52.45934295654297, -50.47197341918945, -48.4846076965332, -46.49724197387695, -44.5098762512207, -42.52251052856445, -40.5351448059082, -38.54777526855469, -36.56040954589844, -34.57304382324219, -32.58567810058594, -30.598312377929688, -28.610946655273438, -26.623580932617188, -24.636213302612305, -22.648847579956055, -20.661481857299805, -18.674114227294922, -16.686752319335938, -14.699386596679688, -12.712019920349121, -10.724654197692871, -8.737287521362305, -6.749921798706055, -4.762556076049805, -2.7751893997192383, -0.7878227233886719, 1.1995433568954468, 3.1869094371795654, 5.1742753982543945, 7.161641597747803, 9.149007797241211, 11.136373519897461, 13.123740196228027, 15.111105918884277, 17.098472595214844, 19.085838317871094, 21.073204040527344, 23.060569763183594, 25.047935485839844, 27.035301208496094, 29.022668838500977, 31.010034561157227, 32.99740219116211, 34.98476791381836, 36.97213363647461, 38.95949935913086, 40.94686508178711, 42.93423080444336, 44.92159652709961, 46.90896224975586, 48.89632797241211, 50.88369369506836, 52.87105941772461, 54.85842514038086, 56.845794677734375, 58.833160400390625, 60.820526123046875, 62.807891845703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 11.0, 10.0, 9.0, 17.0, 20.0, 9.0, 17.0, 23.0, 21.0, 26.0, 28.0, 37.0, 33.0, 25.0, 33.0, 38.0, 43.0, 41.0, 32.0, 42.0, 46.0, 35.0, 32.0, 31.0, 36.0, 28.0, 36.0, 25.0, 40.0, 26.0, 22.0, 18.0, 12.0, 14.0, 14.0, 11.0, 10.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.59375, -8.3255615234375, -8.057373046875, -7.7891845703125, -7.52099609375, -7.2528076171875, -6.984619140625, -6.7164306640625, -6.4482421875, -6.1800537109375, -5.911865234375, -5.6436767578125, -5.37548828125, -5.1072998046875, -4.839111328125, -4.5709228515625, -4.302734375, -4.0345458984375, -3.766357421875, -3.4981689453125, -3.22998046875, -2.9617919921875, -2.693603515625, -2.4254150390625, -2.1572265625, -1.8890380859375, -1.620849609375, -1.3526611328125, -1.08447265625, -0.8162841796875, -0.548095703125, -0.2799072265625, -0.01171875, 0.2564697265625, 0.524658203125, 0.7928466796875, 1.06103515625, 1.3292236328125, 1.597412109375, 1.8656005859375, 2.1337890625, 2.4019775390625, 2.670166015625, 2.9383544921875, 3.20654296875, 3.4747314453125, 3.742919921875, 4.0111083984375, 4.279296875, 4.5474853515625, 4.815673828125, 5.0838623046875, 5.35205078125, 5.6202392578125, 5.888427734375, 6.1566162109375, 6.4248046875, 6.6929931640625, 6.961181640625, 7.2293701171875, 7.49755859375, 7.7657470703125, 8.033935546875, 8.3021240234375, 8.5703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 12.0, 10.0, 18.0, 11.0, 19.0, 21.0, 25.0, 31.0, 42.0, 68.0, 112.0, 253.0, 637.0, 1635.0, 5503.0, 23650.0, 184926.0, 1634120.0, 2024148.0, 276098.0, 32335.0, 7007.0, 2093.0, 759.0, 308.0, 146.0, 78.0, 44.0, 43.0, 28.0, 23.0, 15.0, 13.0, 10.0, 8.0, 10.0, 5.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.7734375, -15.2310791015625, -14.688720703125, -14.1463623046875, -13.60400390625, -13.0616455078125, -12.519287109375, -11.9769287109375, -11.4345703125, -10.8922119140625, -10.349853515625, -9.8074951171875, -9.26513671875, -8.7227783203125, -8.180419921875, -7.6380615234375, -7.095703125, -6.5533447265625, -6.010986328125, -5.4686279296875, -4.92626953125, -4.3839111328125, -3.841552734375, -3.2991943359375, -2.7568359375, -2.2144775390625, -1.672119140625, -1.1297607421875, -0.58740234375, -0.0450439453125, 0.497314453125, 1.0396728515625, 1.58203125, 2.1243896484375, 2.666748046875, 3.2091064453125, 3.75146484375, 4.2938232421875, 4.836181640625, 5.3785400390625, 5.9208984375, 6.4632568359375, 7.005615234375, 7.5479736328125, 8.09033203125, 8.6326904296875, 9.175048828125, 9.7174072265625, 10.259765625, 10.8021240234375, 11.344482421875, 11.8868408203125, 12.42919921875, 12.9715576171875, 13.513916015625, 14.0562744140625, 14.5986328125, 15.1409912109375, 15.683349609375, 16.2257080078125, 16.76806640625, 17.3104248046875, 17.852783203125, 18.3951416015625, 18.9375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 9.0, 4.0, 8.0, 15.0, 13.0, 19.0, 28.0, 39.0, 39.0, 49.0, 68.0, 93.0, 161.0, 233.0, 293.0, 397.0, 524.0, 500.0, 452.0, 342.0, 214.0, 154.0, 111.0, 83.0, 55.0, 44.0, 34.0, 23.0, 21.0, 17.0, 7.0, 7.0, 7.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.2864990234375, -11.862060546875, -11.4376220703125, -11.01318359375, -10.5887451171875, -10.164306640625, -9.7398681640625, -9.3154296875, -8.8909912109375, -8.466552734375, -8.0421142578125, -7.61767578125, -7.1932373046875, -6.768798828125, -6.3443603515625, -5.919921875, -5.4954833984375, -5.071044921875, -4.6466064453125, -4.22216796875, -3.7977294921875, -3.373291015625, -2.9488525390625, -2.5244140625, -2.0999755859375, -1.675537109375, -1.2510986328125, -0.82666015625, -0.4022216796875, 0.022216796875, 0.4466552734375, 0.87109375, 1.2955322265625, 1.719970703125, 2.1444091796875, 2.56884765625, 2.9932861328125, 3.417724609375, 3.8421630859375, 4.2666015625, 4.6910400390625, 5.115478515625, 5.5399169921875, 5.96435546875, 6.3887939453125, 6.813232421875, 7.2376708984375, 7.662109375, 8.0865478515625, 8.510986328125, 8.9354248046875, 9.35986328125, 9.7843017578125, 10.208740234375, 10.6331787109375, 11.0576171875, 11.4820556640625, 11.906494140625, 12.3309326171875, 12.75537109375, 13.1798095703125, 13.604248046875, 14.0286865234375, 14.453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 12.0, 7.0, 21.0, 27.0, 30.0, 52.0, 71.0, 83.0, 133.0, 214.0, 397.0, 781.0, 1794.0, 4768.0, 16468.0, 66892.0, 387167.0, 2756361.0, 811114.0, 111511.0, 25033.0, 6777.0, 2335.0, 911.0, 471.0, 269.0, 156.0, 93.0, 87.0, 59.0, 27.0, 37.0, 33.0, 14.0, 15.0, 10.0, 8.0, 10.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-19.953125, -19.3603515625, -18.767578125, -18.1748046875, -17.58203125, -16.9892578125, -16.396484375, -15.8037109375, -15.2109375, -14.6181640625, -14.025390625, -13.4326171875, -12.83984375, -12.2470703125, -11.654296875, -11.0615234375, -10.46875, -9.8759765625, -9.283203125, -8.6904296875, -8.09765625, -7.5048828125, -6.912109375, -6.3193359375, -5.7265625, -5.1337890625, -4.541015625, -3.9482421875, -3.35546875, -2.7626953125, -2.169921875, -1.5771484375, -0.984375, -0.3916015625, 0.201171875, 0.7939453125, 1.38671875, 1.9794921875, 2.572265625, 3.1650390625, 3.7578125, 4.3505859375, 4.943359375, 5.5361328125, 6.12890625, 6.7216796875, 7.314453125, 7.9072265625, 8.5, 9.0927734375, 9.685546875, 10.2783203125, 10.87109375, 11.4638671875, 12.056640625, 12.6494140625, 13.2421875, 13.8349609375, 14.427734375, 15.0205078125, 15.61328125, 16.2060546875, 16.798828125, 17.3916015625, 17.984375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 12.0, 81.0, 237.0, 391.0, 227.0, 50.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.9368591308594, -255.65013122558594, -250.3634033203125, -245.07667541503906, -239.78994750976562, -234.50320434570312, -229.21649169921875, -223.92974853515625, -218.6430206298828, -213.35629272460938, -208.06956481933594, -202.7828369140625, -197.49610900878906, -192.20938110351562, -186.92263793945312, -181.6359100341797, -176.34918212890625, -171.0624542236328, -165.77572631835938, -160.48899841308594, -155.2022705078125, -149.91552734375, -144.62881469726562, -139.34207153320312, -134.05535888671875, -128.7686309814453, -123.48190307617188, -118.19517517089844, -112.90843963623047, -107.62171173095703, -102.3349838256836, -97.04824829101562, -91.76152038574219, -86.47479248046875, -81.18806457519531, -75.90133666992188, -70.6146011352539, -65.32787322998047, -60.04114532470703, -54.75441360473633, -49.46768569946289, -44.18095779418945, -38.89422607421875, -33.60749816894531, -28.320768356323242, -23.034038543701172, -17.747310638427734, -12.460578918457031, -7.173851013183594, -1.8871216773986816, 3.3996076583862305, 8.686336517333984, 13.973066329956055, 19.259796142578125, 24.546524047851562, 29.833255767822266, 35.1199836730957, 40.40671157836914, 45.693443298339844, 50.98017120361328, 56.26689910888672, 61.55363082885742, 66.84036254882812, 72.12709045410156, 77.413818359375]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 5.0, 6.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 21.0, 15.0, 12.0, 22.0, 27.0, 23.0, 27.0, 19.0, 25.0, 29.0, 36.0, 35.0, 37.0, 31.0, 37.0, 40.0, 30.0, 35.0, 34.0, 37.0, 27.0, 32.0, 27.0, 34.0, 31.0, 26.0, 17.0, 25.0, 20.0, 14.0, 21.0, 21.0, 16.0, 10.0, 9.0, 7.0, 7.0, 7.0, 2.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.501312255859375, -42.18320846557617, -40.86510467529297, -39.5469970703125, -38.2288932800293, -36.910789489746094, -35.592681884765625, -34.27457809448242, -32.95647430419922, -31.638370513916016, -30.32026481628418, -29.002159118652344, -27.68405532836914, -26.365951538085938, -25.0478458404541, -23.729740142822266, -22.411636352539062, -21.09353256225586, -19.775426864624023, -18.457321166992188, -17.139217376708984, -15.821112632751465, -14.503007888793945, -13.184903144836426, -11.866798400878906, -10.548693656921387, -9.230588912963867, -7.912484169006348, -6.594379425048828, -5.276274681091309, -3.958169937133789, -2.6400651931762695, -1.32196044921875, -0.0038557052612304688, 1.314249038696289, 2.6323537826538086, 3.950458526611328, 5.268563270568848, 6.586668014526367, 7.904772758483887, 9.222877502441406, 10.540982246398926, 11.859086990356445, 13.177191734313965, 14.495296478271484, 15.813401222229004, 17.131505966186523, 18.44961166381836, 19.767715454101562, 21.085819244384766, 22.4039249420166, 23.722030639648438, 25.04013442993164, 26.358238220214844, 27.67634391784668, 28.994449615478516, 30.31255340576172, 31.630657196044922, 32.948760986328125, 34.266868591308594, 35.5849723815918, 36.903076171875, 38.22118377685547, 39.53928756713867, 40.857391357421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 7.0, 9.0, 13.0, 12.0, 19.0, 9.0, 15.0, 21.0, 30.0, 33.0, 32.0, 34.0, 17.0, 33.0, 40.0, 45.0, 44.0, 46.0, 41.0, 39.0, 34.0, 36.0, 44.0, 42.0, 33.0, 32.0, 30.0, 28.0, 21.0, 17.0, 21.0, 16.0, 14.0, 9.0, 14.0, 15.0, 7.0, 6.0, 6.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-9.640625, -9.3541259765625, -9.067626953125, -8.7811279296875, -8.49462890625, -8.2081298828125, -7.921630859375, -7.6351318359375, -7.3486328125, -7.0621337890625, -6.775634765625, -6.4891357421875, -6.20263671875, -5.9161376953125, -5.629638671875, -5.3431396484375, -5.056640625, -4.7701416015625, -4.483642578125, -4.1971435546875, -3.91064453125, -3.6241455078125, -3.337646484375, -3.0511474609375, -2.7646484375, -2.4781494140625, -2.191650390625, -1.9051513671875, -1.61865234375, -1.3321533203125, -1.045654296875, -0.7591552734375, -0.47265625, -0.1861572265625, 0.100341796875, 0.3868408203125, 0.67333984375, 0.9598388671875, 1.246337890625, 1.5328369140625, 1.8193359375, 2.1058349609375, 2.392333984375, 2.6788330078125, 2.96533203125, 3.2518310546875, 3.538330078125, 3.8248291015625, 4.111328125, 4.3978271484375, 4.684326171875, 4.9708251953125, 5.25732421875, 5.5438232421875, 5.830322265625, 6.1168212890625, 6.4033203125, 6.6898193359375, 6.976318359375, 7.2628173828125, 7.54931640625, 7.8358154296875, 8.122314453125, 8.4088134765625, 8.6953125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 8.0, 13.0, 15.0, 27.0, 32.0, 48.0, 62.0, 96.0, 126.0, 182.0, 267.0, 396.0, 544.0, 823.0, 1161.0, 1693.0, 2598.0, 3832.0, 5906.0, 9005.0, 14186.0, 22884.0, 36169.0, 57353.0, 90229.0, 132910.0, 171448.0, 160812.0, 119508.0, 79207.0, 50011.0, 31046.0, 19824.0, 12402.0, 7993.0, 5232.0, 3408.0, 2214.0, 1495.0, 1048.0, 720.0, 477.0, 340.0, 263.0, 158.0, 113.0, 92.0, 47.0, 41.0, 29.0, 16.0, 12.0, 9.0, 11.0, 4.0, 4.0, 4.0], "bins": [-0.908203125, -0.8813705444335938, -0.8545379638671875, -0.8277053833007812, -0.800872802734375, -0.7740402221679688, -0.7472076416015625, -0.7203750610351562, -0.69354248046875, -0.6667098999023438, -0.6398773193359375, -0.6130447387695312, -0.586212158203125, -0.5593795776367188, -0.5325469970703125, -0.5057144165039062, -0.4788818359375, -0.45204925537109375, -0.4252166748046875, -0.39838409423828125, -0.371551513671875, -0.34471893310546875, -0.3178863525390625, -0.29105377197265625, -0.26422119140625, -0.23738861083984375, -0.2105560302734375, -0.18372344970703125, -0.156890869140625, -0.13005828857421875, -0.1032257080078125, -0.07639312744140625, -0.049560546875, -0.02272796630859375, 0.0041046142578125, 0.03093719482421875, 0.057769775390625, 0.08460235595703125, 0.1114349365234375, 0.13826751708984375, 0.16510009765625, 0.19193267822265625, 0.2187652587890625, 0.24559783935546875, 0.272430419921875, 0.29926300048828125, 0.3260955810546875, 0.35292816162109375, 0.3797607421875, 0.40659332275390625, 0.4334259033203125, 0.46025848388671875, 0.487091064453125, 0.5139236450195312, 0.5407562255859375, 0.5675888061523438, 0.59442138671875, 0.6212539672851562, 0.6480865478515625, 0.6749191284179688, 0.701751708984375, 0.7285842895507812, 0.7554168701171875, 0.7822494506835938, 0.80908203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 3.0, 9.0, 9.0, 14.0, 12.0, 19.0, 15.0, 28.0, 25.0, 22.0, 30.0, 33.0, 30.0, 26.0, 40.0, 36.0, 37.0, 55.0, 41.0, 1055.0, 30.0, 48.0, 44.0, 40.0, 35.0, 36.0, 41.0, 27.0, 27.0, 30.0, 23.0, 18.0, 19.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.05078125, -6.856689453125, -6.66259765625, -6.468505859375, -6.2744140625, -6.080322265625, -5.88623046875, -5.692138671875, -5.498046875, -5.303955078125, -5.10986328125, -4.915771484375, -4.7216796875, -4.527587890625, -4.33349609375, -4.139404296875, -3.9453125, -3.751220703125, -3.55712890625, -3.363037109375, -3.1689453125, -2.974853515625, -2.78076171875, -2.586669921875, -2.392578125, -2.198486328125, -2.00439453125, -1.810302734375, -1.6162109375, -1.422119140625, -1.22802734375, -1.033935546875, -0.83984375, -0.645751953125, -0.45166015625, -0.257568359375, -0.0634765625, 0.130615234375, 0.32470703125, 0.518798828125, 0.712890625, 0.906982421875, 1.10107421875, 1.295166015625, 1.4892578125, 1.683349609375, 1.87744140625, 2.071533203125, 2.265625, 2.459716796875, 2.65380859375, 2.847900390625, 3.0419921875, 3.236083984375, 3.43017578125, 3.624267578125, 3.818359375, 4.012451171875, 4.20654296875, 4.400634765625, 4.5947265625, 4.788818359375, 4.98291015625, 5.177001953125, 5.37109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 9.0, 12.0, 23.0, 41.0, 46.0, 86.0, 145.0, 175.0, 261.0, 364.0, 528.0, 808.0, 1210.0, 1618.0, 2448.0, 3620.0, 5149.0, 7744.0, 11363.0, 16883.0, 24934.0, 37289.0, 54810.0, 76905.0, 103780.0, 129580.0, 1180421.0, 121436.0, 95276.0, 69841.0, 48498.0, 33153.0, 22182.0, 14788.0, 10115.0, 6761.0, 4624.0, 3106.0, 2234.0, 1535.0, 1008.0, 740.0, 520.0, 358.0, 227.0, 161.0, 100.0, 69.0, 54.0, 42.0, 25.0, 12.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5505752563476562, -0.5318145751953125, -0.5130538940429688, -0.494293212890625, -0.47553253173828125, -0.4567718505859375, -0.43801116943359375, -0.41925048828125, -0.40048980712890625, -0.3817291259765625, -0.36296844482421875, -0.344207763671875, -0.32544708251953125, -0.3066864013671875, -0.28792572021484375, -0.2691650390625, -0.25040435791015625, -0.2316436767578125, -0.21288299560546875, -0.194122314453125, -0.17536163330078125, -0.1566009521484375, -0.13784027099609375, -0.11907958984375, -0.10031890869140625, -0.0815582275390625, -0.06279754638671875, -0.044036865234375, -0.02527618408203125, -0.0065155029296875, 0.01224517822265625, 0.031005859375, 0.04976654052734375, 0.0685272216796875, 0.08728790283203125, 0.106048583984375, 0.12480926513671875, 0.1435699462890625, 0.16233062744140625, 0.18109130859375, 0.19985198974609375, 0.2186126708984375, 0.23737335205078125, 0.256134033203125, 0.27489471435546875, 0.2936553955078125, 0.31241607666015625, 0.3311767578125, 0.34993743896484375, 0.3686981201171875, 0.38745880126953125, 0.406219482421875, 0.42498016357421875, 0.4437408447265625, 0.46250152587890625, 0.48126220703125, 0.5000228881835938, 0.5187835693359375, 0.5375442504882812, 0.556304931640625, 0.5750656127929688, 0.5938262939453125, 0.6125869750976562, 0.63134765625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 4.0, 4.0, 6.0, 18.0, 13.0, 33.0, 26.0, 30.0, 43.0, 38.0, 46.0, 54.0, 64.0, 79.0, 60.0, 73.0, 64.0, 45.0, 51.0, 46.0, 27.0, 25.0, 24.0, 25.0, 18.0, 13.0, 14.0, 5.0, 9.0, 9.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.01027679443359375, -0.010010778903961182, -0.009744763374328613, -0.009478747844696045, -0.009212732315063477, -0.008946716785430908, -0.00868070125579834, -0.008414685726165771, -0.008148670196533203, -0.007882654666900635, -0.007616639137268066, -0.007350623607635498, -0.00708460807800293, -0.006818592548370361, -0.006552577018737793, -0.006286561489105225, -0.006020545959472656, -0.005754530429840088, -0.0054885149002075195, -0.005222499370574951, -0.004956483840942383, -0.0046904683113098145, -0.004424452781677246, -0.004158437252044678, -0.0038924217224121094, -0.003626406192779541, -0.0033603906631469727, -0.0030943751335144043, -0.002828359603881836, -0.0025623440742492676, -0.0022963285446166992, -0.002030313014984131, -0.0017642974853515625, -0.0014982819557189941, -0.0012322664260864258, -0.0009662508964538574, -0.0007002353668212891, -0.0004342198371887207, -0.00016820430755615234, 9.781122207641602e-05, 0.0003638267517089844, 0.0006298422813415527, 0.0008958578109741211, 0.0011618733406066895, 0.0014278888702392578, 0.0016939043998718262, 0.0019599199295043945, 0.002225935459136963, 0.0024919509887695312, 0.0027579665184020996, 0.003023982048034668, 0.0032899975776672363, 0.0035560131072998047, 0.003822028636932373, 0.004088044166564941, 0.00435405969619751, 0.004620075225830078, 0.0048860907554626465, 0.005152106285095215, 0.005418121814727783, 0.0056841373443603516, 0.00595015287399292, 0.006216168403625488, 0.006482183933258057, 0.006748199462890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 10.0, 12.0, 10.0, 10.0, 16.0, 22.0, 25.0, 39.0, 45.0, 43.0, 65.0, 72.0, 153.0, 180.0, 372.0, 786.0, 38013.0, 1005782.0, 1539.0, 492.0, 246.0, 164.0, 94.0, 88.0, 55.0, 45.0, 49.0, 26.0, 19.0, 19.0, 14.0, 6.0, 9.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13220596313476562, -0.12696075439453125, -0.12171554565429688, -0.1164703369140625, -0.11122512817382812, -0.10597991943359375, -0.10073471069335938, -0.095489501953125, -0.09024429321289062, -0.08499908447265625, -0.07975387573242188, -0.0745086669921875, -0.06926345825195312, -0.06401824951171875, -0.058773040771484375, -0.05352783203125, -0.048282623291015625, -0.04303741455078125, -0.037792205810546875, -0.0325469970703125, -0.027301788330078125, -0.02205657958984375, -0.016811370849609375, -0.011566162109375, -0.006320953369140625, -0.00107574462890625, 0.004169464111328125, 0.0094146728515625, 0.014659881591796875, 0.01990509033203125, 0.025150299072265625, 0.0303955078125, 0.035640716552734375, 0.04088592529296875, 0.046131134033203125, 0.0513763427734375, 0.056621551513671875, 0.06186676025390625, 0.06711196899414062, 0.072357177734375, 0.07760238647460938, 0.08284759521484375, 0.08809280395507812, 0.0933380126953125, 0.09858322143554688, 0.10382843017578125, 0.10907363891601562, 0.11431884765625, 0.11956405639648438, 0.12480926513671875, 0.13005447387695312, 0.1352996826171875, 0.14054489135742188, 0.14579010009765625, 0.15103530883789062, 0.156280517578125, 0.16152572631835938, 0.16677093505859375, 0.17201614379882812, 0.1772613525390625, 0.18250656127929688, 0.18775177001953125, 0.19299697875976562, 0.1982421875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 928.0, 85.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13417647778987885, -0.13158658146858215, -0.12899667024612427, -0.12640677392482758, -0.12381686270236969, -0.121226966381073, -0.11863706260919571, -0.11604715883731842, -0.11345725506544113, -0.11086735129356384, -0.10827744752168655, -0.10568754374980927, -0.10309764742851257, -0.10050774365663528, -0.097917839884758, -0.0953279361128807, -0.09273803234100342, -0.09014812856912613, -0.08755822479724884, -0.08496832102537155, -0.08237841725349426, -0.07978852093219757, -0.07719861716032028, -0.074608713388443, -0.0720188096165657, -0.06942890584468842, -0.06683900207281113, -0.06424909830093384, -0.06165919825434685, -0.05906929448246956, -0.05647939443588257, -0.05388949066400528, -0.05129958316683769, -0.0487096793949604, -0.04611977934837341, -0.043529875576496124, -0.040939971804618835, -0.03835006803274155, -0.03576016426086426, -0.03317026421427727, -0.03058036044239998, -0.02799045667052269, -0.02540055476129055, -0.02281065285205841, -0.020220749080181122, -0.017630845308303833, -0.015040943399071693, -0.012451041489839554, -0.009861137717962265, -0.007271234877407551, -0.004681332036852837, -0.0020914291962981224, 0.0004984736442565918, 0.003088376484811306, 0.00567827932536602, 0.00826818123459816, 0.010858085006475449, 0.013447987847030163, 0.016037890687584877, 0.018627792596817017, 0.021217696368694305, 0.023807600140571594, 0.026397502049803734, 0.028987403959035873, 0.03157730773091316]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 9.0, 10.0, 22.0, 13.0, 31.0, 17.0, 32.0, 30.0, 36.0, 36.0, 51.0, 41.0, 49.0, 51.0, 50.0, 63.0, 45.0, 52.0, 54.0, 43.0, 47.0, 33.0, 30.0, 31.0, 22.0, 25.0, 11.0, 14.0, 15.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0054509639739990234, -0.0052637457847595215, -0.0050765275955200195, -0.004889309406280518, -0.004702091217041016, -0.004514873027801514, -0.004327654838562012, -0.00414043664932251, -0.003953218460083008, -0.003766000270843506, -0.003578782081604004, -0.003391563892364502, -0.003204345703125, -0.003017127513885498, -0.002829909324645996, -0.002642691135406494, -0.002455472946166992, -0.0022682547569274902, -0.0020810365676879883, -0.0018938183784484863, -0.0017066001892089844, -0.0015193819999694824, -0.0013321638107299805, -0.0011449456214904785, -0.0009577274322509766, -0.0007705092430114746, -0.0005832910537719727, -0.0003960728645324707, -0.00020885467529296875, -2.1636486053466797e-05, 0.00016558170318603516, 0.0003527998924255371, 0.0005400180816650391, 0.000727236270904541, 0.000914454460144043, 0.001101672649383545, 0.0012888908386230469, 0.0014761090278625488, 0.0016633272171020508, 0.0018505454063415527, 0.0020377635955810547, 0.0022249817848205566, 0.0024121999740600586, 0.0025994181632995605, 0.0027866363525390625, 0.0029738545417785645, 0.0031610727310180664, 0.0033482909202575684, 0.0035355091094970703, 0.0037227272987365723, 0.003909945487976074, 0.004097163677215576, 0.004284381866455078, 0.00447160005569458, 0.004658818244934082, 0.004846036434173584, 0.005033254623413086, 0.005220472812652588, 0.00540769100189209, 0.005594909191131592, 0.005782127380371094, 0.005969345569610596, 0.006156563758850098, 0.0063437819480896, 0.0065310001373291016]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 7.0, 9.0, 13.0, 12.0, 19.0, 9.0, 15.0, 21.0, 30.0, 33.0, 32.0, 34.0, 17.0, 32.0, 41.0, 45.0, 44.0, 46.0, 41.0, 39.0, 34.0, 36.0, 44.0, 42.0, 33.0, 32.0, 30.0, 28.0, 21.0, 17.0, 21.0, 16.0, 14.0, 9.0, 14.0, 15.0, 7.0, 6.0, 6.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-9.640625, -9.3541259765625, -9.067626953125, -8.7811279296875, -8.49462890625, -8.2081298828125, -7.921630859375, -7.6351318359375, -7.3486328125, -7.0621337890625, -6.775634765625, -6.4891357421875, -6.20263671875, -5.9161376953125, -5.629638671875, -5.3431396484375, -5.056640625, -4.7701416015625, -4.483642578125, -4.1971435546875, -3.91064453125, -3.6241455078125, -3.337646484375, -3.0511474609375, -2.7646484375, -2.4781494140625, -2.191650390625, -1.9051513671875, -1.61865234375, -1.3321533203125, -1.045654296875, -0.7591552734375, -0.47265625, -0.1861572265625, 0.100341796875, 0.3868408203125, 0.67333984375, 0.9598388671875, 1.246337890625, 1.5328369140625, 1.8193359375, 2.1058349609375, 2.392333984375, 2.6788330078125, 2.96533203125, 3.2518310546875, 3.538330078125, 3.8248291015625, 4.111328125, 4.3978271484375, 4.684326171875, 4.9708251953125, 5.25732421875, 5.5438232421875, 5.830322265625, 6.1168212890625, 6.4033203125, 6.6898193359375, 6.976318359375, 7.2628173828125, 7.54931640625, 7.8358154296875, 8.122314453125, 8.4088134765625, 8.6953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 12.0, 13.0, 25.0, 34.0, 39.0, 47.0, 69.0, 103.0, 128.0, 174.0, 238.0, 322.0, 482.0, 771.0, 1436.0, 2949.0, 6656.0, 17600.0, 51953.0, 180314.0, 500240.0, 196589.0, 55492.0, 18752.0, 7015.0, 3023.0, 1468.0, 811.0, 496.0, 346.0, 248.0, 190.0, 135.0, 98.0, 69.0, 45.0, 42.0, 38.0, 21.0, 21.0, 12.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.328125, -11.9371337890625, -11.546142578125, -11.1551513671875, -10.76416015625, -10.3731689453125, -9.982177734375, -9.5911865234375, -9.2001953125, -8.8092041015625, -8.418212890625, -8.0272216796875, -7.63623046875, -7.2452392578125, -6.854248046875, -6.4632568359375, -6.072265625, -5.6812744140625, -5.290283203125, -4.8992919921875, -4.50830078125, -4.1173095703125, -3.726318359375, -3.3353271484375, -2.9443359375, -2.5533447265625, -2.162353515625, -1.7713623046875, -1.38037109375, -0.9893798828125, -0.598388671875, -0.2073974609375, 0.18359375, 0.5745849609375, 0.965576171875, 1.3565673828125, 1.74755859375, 2.1385498046875, 2.529541015625, 2.9205322265625, 3.3115234375, 3.7025146484375, 4.093505859375, 4.4844970703125, 4.87548828125, 5.2664794921875, 5.657470703125, 6.0484619140625, 6.439453125, 6.8304443359375, 7.221435546875, 7.6124267578125, 8.00341796875, 8.3944091796875, 8.785400390625, 9.1763916015625, 9.5673828125, 9.9583740234375, 10.349365234375, 10.7403564453125, 11.13134765625, 11.5223388671875, 11.913330078125, 12.3043212890625, 12.6953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 12.0, 8.0, 8.0, 9.0, 14.0, 13.0, 19.0, 24.0, 26.0, 29.0, 42.0, 44.0, 49.0, 56.0, 57.0, 85.0, 139.0, 288.0, 1426.0, 169.0, 88.0, 62.0, 52.0, 41.0, 32.0, 39.0, 44.0, 25.0, 21.0, 19.0, 28.0, 9.0, 16.0, 14.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.703125, -24.90283203125, -24.1025390625, -23.30224609375, -22.501953125, -21.70166015625, -20.9013671875, -20.10107421875, -19.30078125, -18.50048828125, -17.7001953125, -16.89990234375, -16.099609375, -15.29931640625, -14.4990234375, -13.69873046875, -12.8984375, -12.09814453125, -11.2978515625, -10.49755859375, -9.697265625, -8.89697265625, -8.0966796875, -7.29638671875, -6.49609375, -5.69580078125, -4.8955078125, -4.09521484375, -3.294921875, -2.49462890625, -1.6943359375, -0.89404296875, -0.09375, 0.70654296875, 1.5068359375, 2.30712890625, 3.107421875, 3.90771484375, 4.7080078125, 5.50830078125, 6.30859375, 7.10888671875, 7.9091796875, 8.70947265625, 9.509765625, 10.31005859375, 11.1103515625, 11.91064453125, 12.7109375, 13.51123046875, 14.3115234375, 15.11181640625, 15.912109375, 16.71240234375, 17.5126953125, 18.31298828125, 19.11328125, 19.91357421875, 20.7138671875, 21.51416015625, 22.314453125, 23.11474609375, 23.9150390625, 24.71533203125, 25.515625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 11.0, 9.0, 12.0, 23.0, 20.0, 36.0, 41.0, 53.0, 73.0, 91.0, 133.0, 203.0, 293.0, 499.0, 1121.0, 9677.0, 707781.0, 2405458.0, 17042.0, 1466.0, 568.0, 307.0, 193.0, 156.0, 91.0, 71.0, 63.0, 31.0, 34.0, 22.0, 31.0, 17.0, 11.0, 11.0, 10.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.9375, -43.537109375, -42.13671875, -40.736328125, -39.3359375, -37.935546875, -36.53515625, -35.134765625, -33.734375, -32.333984375, -30.93359375, -29.533203125, -28.1328125, -26.732421875, -25.33203125, -23.931640625, -22.53125, -21.130859375, -19.73046875, -18.330078125, -16.9296875, -15.529296875, -14.12890625, -12.728515625, -11.328125, -9.927734375, -8.52734375, -7.126953125, -5.7265625, -4.326171875, -2.92578125, -1.525390625, -0.125, 1.275390625, 2.67578125, 4.076171875, 5.4765625, 6.876953125, 8.27734375, 9.677734375, 11.078125, 12.478515625, 13.87890625, 15.279296875, 16.6796875, 18.080078125, 19.48046875, 20.880859375, 22.28125, 23.681640625, 25.08203125, 26.482421875, 27.8828125, 29.283203125, 30.68359375, 32.083984375, 33.484375, 34.884765625, 36.28515625, 37.685546875, 39.0859375, 40.486328125, 41.88671875, 43.287109375, 44.6875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 984.0, 29.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-648.4768676757812, -631.6690063476562, -614.861083984375, -598.05322265625, -581.245361328125, -564.4374389648438, -547.6295776367188, -530.8217163085938, -514.0137939453125, -497.2059020996094, -480.3980407714844, -463.59014892578125, -446.7822570800781, -429.974365234375, -413.16650390625, -396.3586120605469, -379.5507507324219, -362.74285888671875, -345.93499755859375, -329.1271057128906, -312.3192138671875, -295.5113525390625, -278.7034606933594, -261.89556884765625, -245.0876922607422, -228.27981567382812, -211.471923828125, -194.66404724121094, -177.85617065429688, -161.04827880859375, -144.2404022216797, -127.4325180053711, -110.62460327148438, -93.81671905517578, -77.00883483886719, -60.200958251953125, -43.39307403564453, -26.585189819335938, -9.777313232421875, 7.030570983886719, 23.838455200195312, 40.646339416503906, 57.454219818115234, 74.26210021972656, 91.06998443603516, 107.87786865234375, 124.68574523925781, 141.49362182617188, 158.301513671875, 175.10939025878906, 191.9172821044922, 208.72515869140625, 225.53305053710938, 242.34092712402344, 259.1488037109375, 275.9566955566406, 292.76458740234375, 309.5724792480469, 326.3803405761719, 343.188232421875, 359.9961242675781, 376.80401611328125, 393.61187744140625, 410.4197692871094, 427.2276306152344]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 9.0, 11.0, 12.0, 8.0, 15.0, 24.0, 22.0, 27.0, 21.0, 27.0, 26.0, 34.0, 32.0, 34.0, 35.0, 36.0, 43.0, 40.0, 40.0, 32.0, 37.0, 38.0, 39.0, 39.0, 39.0, 28.0, 25.0, 26.0, 27.0, 27.0, 17.0, 12.0, 16.0, 18.0, 16.0, 12.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.15359115600586, -57.307254791259766, -55.46091842651367, -53.61458206176758, -51.768245697021484, -49.92190933227539, -48.0755729675293, -46.2292366027832, -44.38290023803711, -42.536563873291016, -40.69022750854492, -38.84389114379883, -36.997554779052734, -35.15121841430664, -33.30488204956055, -31.458545684814453, -29.61220932006836, -27.765872955322266, -25.919536590576172, -24.073200225830078, -22.226863861083984, -20.38052749633789, -18.534191131591797, -16.687854766845703, -14.84151840209961, -12.995182037353516, -11.148845672607422, -9.302509307861328, -7.456172943115234, -5.609836578369141, -3.763500213623047, -1.9171638488769531, -0.07082366943359375, 1.7755126953125, 3.6218490600585938, 5.4681854248046875, 7.314521789550781, 9.160858154296875, 11.007194519042969, 12.853530883789062, 14.699867248535156, 16.54620361328125, 18.392539978027344, 20.238876342773438, 22.08521270751953, 23.931549072265625, 25.77788543701172, 27.624221801757812, 29.470558166503906, 31.31689453125, 33.163230895996094, 35.00956726074219, 36.85590362548828, 38.702239990234375, 40.54857635498047, 42.39491271972656, 44.241249084472656, 46.08758544921875, 47.933921813964844, 49.78025817871094, 51.62659454345703, 53.472930908203125, 55.31926727294922, 57.16560363769531, 59.011940002441406]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 13.0, 6.0, 6.0, 9.0, 21.0, 17.0, 25.0, 18.0, 33.0, 30.0, 36.0, 36.0, 32.0, 37.0, 44.0, 51.0, 48.0, 31.0, 51.0, 39.0, 46.0, 51.0, 40.0, 34.0, 35.0, 24.0, 28.0, 14.0, 24.0, 10.0, 22.0, 9.0, 17.0, 19.0, 7.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.4375, -10.1185302734375, -9.799560546875, -9.4805908203125, -9.16162109375, -8.8426513671875, -8.523681640625, -8.2047119140625, -7.8857421875, -7.5667724609375, -7.247802734375, -6.9288330078125, -6.60986328125, -6.2908935546875, -5.971923828125, -5.6529541015625, -5.333984375, -5.0150146484375, -4.696044921875, -4.3770751953125, -4.05810546875, -3.7391357421875, -3.420166015625, -3.1011962890625, -2.7822265625, -2.4632568359375, -2.144287109375, -1.8253173828125, -1.50634765625, -1.1873779296875, -0.868408203125, -0.5494384765625, -0.23046875, 0.0885009765625, 0.407470703125, 0.7264404296875, 1.04541015625, 1.3643798828125, 1.683349609375, 2.0023193359375, 2.3212890625, 2.6402587890625, 2.959228515625, 3.2781982421875, 3.59716796875, 3.9161376953125, 4.235107421875, 4.5540771484375, 4.873046875, 5.1920166015625, 5.510986328125, 5.8299560546875, 6.14892578125, 6.4678955078125, 6.786865234375, 7.1058349609375, 7.4248046875, 7.7437744140625, 8.062744140625, 8.3817138671875, 8.70068359375, 9.0196533203125, 9.338623046875, 9.6575927734375, 9.9765625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 14.0, 15.0, 19.0, 22.0, 24.0, 38.0, 34.0, 52.0, 68.0, 93.0, 104.0, 198.0, 251.0, 312.0, 406.0, 1344.0, 4142324.0, 46846.0, 583.0, 404.0, 306.0, 208.0, 151.0, 116.0, 71.0, 51.0, 48.0, 44.0, 21.0, 26.0, 14.0, 12.0, 13.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-139.5, -134.814453125, -130.12890625, -125.443359375, -120.7578125, -116.072265625, -111.38671875, -106.701171875, -102.015625, -97.330078125, -92.64453125, -87.958984375, -83.2734375, -78.587890625, -73.90234375, -69.216796875, -64.53125, -59.845703125, -55.16015625, -50.474609375, -45.7890625, -41.103515625, -36.41796875, -31.732421875, -27.046875, -22.361328125, -17.67578125, -12.990234375, -8.3046875, -3.619140625, 1.06640625, 5.751953125, 10.4375, 15.123046875, 19.80859375, 24.494140625, 29.1796875, 33.865234375, 38.55078125, 43.236328125, 47.921875, 52.607421875, 57.29296875, 61.978515625, 66.6640625, 71.349609375, 76.03515625, 80.720703125, 85.40625, 90.091796875, 94.77734375, 99.462890625, 104.1484375, 108.833984375, 113.51953125, 118.205078125, 122.890625, 127.576171875, 132.26171875, 136.947265625, 141.6328125, 146.318359375, 151.00390625, 155.689453125, 160.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 13.0, 13.0, 12.0, 19.0, 32.0, 42.0, 55.0, 87.0, 73.0, 113.0, 216.0, 278.0, 423.0, 600.0, 642.0, 483.0, 295.0, 202.0, 118.0, 78.0, 53.0, 60.0, 43.0, 22.0, 18.0, 14.0, 11.0, 4.0, 12.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.40625, -17.909912109375, -17.41357421875, -16.917236328125, -16.4208984375, -15.924560546875, -15.42822265625, -14.931884765625, -14.435546875, -13.939208984375, -13.44287109375, -12.946533203125, -12.4501953125, -11.953857421875, -11.45751953125, -10.961181640625, -10.46484375, -9.968505859375, -9.47216796875, -8.975830078125, -8.4794921875, -7.983154296875, -7.48681640625, -6.990478515625, -6.494140625, -5.997802734375, -5.50146484375, -5.005126953125, -4.5087890625, -4.012451171875, -3.51611328125, -3.019775390625, -2.5234375, -2.027099609375, -1.53076171875, -1.034423828125, -0.5380859375, -0.041748046875, 0.45458984375, 0.950927734375, 1.447265625, 1.943603515625, 2.43994140625, 2.936279296875, 3.4326171875, 3.928955078125, 4.42529296875, 4.921630859375, 5.41796875, 5.914306640625, 6.41064453125, 6.906982421875, 7.4033203125, 7.899658203125, 8.39599609375, 8.892333984375, 9.388671875, 9.885009765625, 10.38134765625, 10.877685546875, 11.3740234375, 11.870361328125, 12.36669921875, 12.863037109375, 13.359375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 7.0, 7.0, 16.0, 9.0, 25.0, 22.0, 18.0, 31.0, 33.0, 35.0, 56.0, 97.0, 146.0, 412.0, 3403.0, 345265.0, 3829061.0, 14185.0, 806.0, 219.0, 96.0, 54.0, 42.0, 43.0, 37.0, 30.0, 19.0, 16.0, 15.0, 13.0, 14.0, 2.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.3125, -63.9609375, -61.609375, -59.2578125, -56.90625, -54.5546875, -52.203125, -49.8515625, -47.5, -45.1484375, -42.796875, -40.4453125, -38.09375, -35.7421875, -33.390625, -31.0390625, -28.6875, -26.3359375, -23.984375, -21.6328125, -19.28125, -16.9296875, -14.578125, -12.2265625, -9.875, -7.5234375, -5.171875, -2.8203125, -0.46875, 1.8828125, 4.234375, 6.5859375, 8.9375, 11.2890625, 13.640625, 15.9921875, 18.34375, 20.6953125, 23.046875, 25.3984375, 27.75, 30.1015625, 32.453125, 34.8046875, 37.15625, 39.5078125, 41.859375, 44.2109375, 46.5625, 48.9140625, 51.265625, 53.6171875, 55.96875, 58.3203125, 60.671875, 63.0234375, 65.375, 67.7265625, 70.078125, 72.4296875, 74.78125, 77.1328125, 79.484375, 81.8359375, 84.1875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 20.0, 103.0, 323.0, 366.0, 163.0, 31.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.02180862426758, -38.618289947509766, -33.21476745605469, -27.811248779296875, -22.407730102539062, -17.00421142578125, -11.600688934326172, -6.197170257568359, -0.7936515808105469, 4.609868049621582, 10.013387680053711, 15.416908264160156, 20.82042694091797, 26.22394561767578, 31.62746810913086, 37.03098678588867, 42.434505462646484, 47.8380241394043, 53.241546630859375, 58.64506530761719, 64.048583984375, 69.45210266113281, 74.85562133789062, 80.25914001464844, 85.66265869140625, 91.06617736816406, 96.46969604492188, 101.87321472167969, 107.2767333984375, 112.68025207519531, 118.08377838134766, 123.48729705810547, 128.89080810546875, 134.29432678222656, 139.69784545898438, 145.1013641357422, 150.5048828125, 155.9084014892578, 161.31192016601562, 166.7154541015625, 172.11895751953125, 177.52247619628906, 182.92599487304688, 188.3295135498047, 193.7330322265625, 199.1365509033203, 204.54006958007812, 209.943603515625, 215.3471221923828, 220.75064086914062, 226.15415954589844, 231.55767822265625, 236.96119689941406, 242.36471557617188, 247.76824951171875, 253.1717529296875, 258.5752868652344, 263.97882080078125, 269.38232421875, 274.7858581542969, 280.1893615722656, 285.5928955078125, 290.99639892578125, 296.3999328613281, 301.8034362792969]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 5.0, 7.0, 5.0, 10.0, 18.0, 10.0, 9.0, 17.0, 9.0, 20.0, 18.0, 28.0, 25.0, 25.0, 39.0, 27.0, 20.0, 42.0, 33.0, 41.0, 37.0, 42.0, 39.0, 47.0, 29.0, 40.0, 39.0, 48.0, 39.0, 29.0, 24.0, 28.0, 27.0, 15.0, 21.0, 13.0, 16.0, 13.0, 11.0, 11.0, 3.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-50.619972229003906, -49.09144592285156, -47.56291961669922, -46.034393310546875, -44.5058708190918, -42.97734451293945, -41.44881820678711, -39.920291900634766, -38.39176559448242, -36.86323928833008, -35.334712982177734, -33.806190490722656, -32.27766418457031, -30.74913787841797, -29.220611572265625, -27.69208526611328, -26.16356086730957, -24.635034561157227, -23.106510162353516, -21.577983856201172, -20.049457550048828, -18.520931243896484, -16.992406845092773, -15.46388053894043, -13.935355186462402, -12.406829833984375, -10.878303527832031, -9.349778175354004, -7.821252346038818, -6.292726516723633, -4.7642011642456055, -3.2356748580932617, -1.7071495056152344, -0.17862379550933838, 1.3499019145965576, 2.878427505493164, 4.40695333480835, 5.935479164123535, 7.4640045166015625, 8.992530822753906, 10.521056175231934, 12.049581527709961, 13.578107833862305, 15.106633186340332, 16.63515853881836, 18.163684844970703, 19.692211151123047, 21.22073745727539, 22.7492618560791, 24.277788162231445, 25.806312561035156, 27.3348388671875, 28.863365173339844, 30.391891479492188, 31.9204158782959, 33.448944091796875, 34.97746658325195, 36.5059928894043, 38.03451919555664, 39.56304168701172, 41.09156799316406, 42.620094299316406, 44.14862060546875, 45.677146911621094, 47.20567321777344]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 10.0, 4.0, 7.0, 11.0, 20.0, 20.0, 19.0, 26.0, 32.0, 17.0, 32.0, 35.0, 35.0, 34.0, 42.0, 36.0, 35.0, 38.0, 46.0, 47.0, 39.0, 43.0, 36.0, 39.0, 40.0, 36.0, 30.0, 35.0, 23.0, 25.0, 13.0, 12.0, 17.0, 12.0, 8.0, 13.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-10.8515625, -10.5557861328125, -10.260009765625, -9.9642333984375, -9.66845703125, -9.3726806640625, -9.076904296875, -8.7811279296875, -8.4853515625, -8.1895751953125, -7.893798828125, -7.5980224609375, -7.30224609375, -7.0064697265625, -6.710693359375, -6.4149169921875, -6.119140625, -5.8233642578125, -5.527587890625, -5.2318115234375, -4.93603515625, -4.6402587890625, -4.344482421875, -4.0487060546875, -3.7529296875, -3.4571533203125, -3.161376953125, -2.8656005859375, -2.56982421875, -2.2740478515625, -1.978271484375, -1.6824951171875, -1.38671875, -1.0909423828125, -0.795166015625, -0.4993896484375, -0.20361328125, 0.0921630859375, 0.387939453125, 0.6837158203125, 0.9794921875, 1.2752685546875, 1.571044921875, 1.8668212890625, 2.16259765625, 2.4583740234375, 2.754150390625, 3.0499267578125, 3.345703125, 3.6414794921875, 3.937255859375, 4.2330322265625, 4.52880859375, 4.8245849609375, 5.120361328125, 5.4161376953125, 5.7119140625, 6.0076904296875, 6.303466796875, 6.5992431640625, 6.89501953125, 7.1907958984375, 7.486572265625, 7.7823486328125, 8.078125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 7.0, 13.0, 23.0, 34.0, 57.0, 81.0, 80.0, 113.0, 194.0, 240.0, 366.0, 511.0, 773.0, 1080.0, 1661.0, 2382.0, 3647.0, 5427.0, 8495.0, 13281.0, 21614.0, 35392.0, 58901.0, 96049.0, 147396.0, 184347.0, 165266.0, 114990.0, 71502.0, 42815.0, 26122.0, 16136.0, 10058.0, 6500.0, 4209.0, 2749.0, 1896.0, 1234.0, 879.0, 575.0, 432.0, 315.0, 218.0, 146.0, 95.0, 71.0, 69.0, 38.0, 28.0, 11.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.90576171875, -0.8771820068359375, -0.848602294921875, -0.8200225830078125, -0.79144287109375, -0.7628631591796875, -0.734283447265625, -0.7057037353515625, -0.6771240234375, -0.6485443115234375, -0.619964599609375, -0.5913848876953125, -0.56280517578125, -0.5342254638671875, -0.505645751953125, -0.4770660400390625, -0.448486328125, -0.4199066162109375, -0.391326904296875, -0.3627471923828125, -0.33416748046875, -0.3055877685546875, -0.277008056640625, -0.2484283447265625, -0.2198486328125, -0.1912689208984375, -0.162689208984375, -0.1341094970703125, -0.10552978515625, -0.0769500732421875, -0.048370361328125, -0.0197906494140625, 0.0087890625, 0.0373687744140625, 0.065948486328125, 0.0945281982421875, 0.12310791015625, 0.1516876220703125, 0.180267333984375, 0.2088470458984375, 0.2374267578125, 0.2660064697265625, 0.294586181640625, 0.3231658935546875, 0.35174560546875, 0.3803253173828125, 0.408905029296875, 0.4374847412109375, 0.466064453125, 0.4946441650390625, 0.523223876953125, 0.5518035888671875, 0.58038330078125, 0.6089630126953125, 0.637542724609375, 0.6661224365234375, 0.6947021484375, 0.7232818603515625, 0.751861572265625, 0.7804412841796875, 0.80902099609375, 0.8376007080078125, 0.866180419921875, 0.8947601318359375, 0.92333984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 11.0, 9.0, 11.0, 8.0, 14.0, 23.0, 22.0, 20.0, 21.0, 22.0, 25.0, 23.0, 29.0, 23.0, 30.0, 32.0, 42.0, 37.0, 42.0, 37.0, 1061.0, 39.0, 48.0, 33.0, 36.0, 35.0, 21.0, 33.0, 23.0, 30.0, 27.0, 13.0, 22.0, 23.0, 10.0, 11.0, 16.0, 10.0, 8.0, 7.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0], "bins": [-6.03125, -5.8646240234375, -5.697998046875, -5.5313720703125, -5.36474609375, -5.1981201171875, -5.031494140625, -4.8648681640625, -4.6982421875, -4.5316162109375, -4.364990234375, -4.1983642578125, -4.03173828125, -3.8651123046875, -3.698486328125, -3.5318603515625, -3.365234375, -3.1986083984375, -3.031982421875, -2.8653564453125, -2.69873046875, -2.5321044921875, -2.365478515625, -2.1988525390625, -2.0322265625, -1.8656005859375, -1.698974609375, -1.5323486328125, -1.36572265625, -1.1990966796875, -1.032470703125, -0.8658447265625, -0.69921875, -0.5325927734375, -0.365966796875, -0.1993408203125, -0.03271484375, 0.1339111328125, 0.300537109375, 0.4671630859375, 0.6337890625, 0.8004150390625, 0.967041015625, 1.1336669921875, 1.30029296875, 1.4669189453125, 1.633544921875, 1.8001708984375, 1.966796875, 2.1334228515625, 2.300048828125, 2.4666748046875, 2.63330078125, 2.7999267578125, 2.966552734375, 3.1331787109375, 3.2998046875, 3.4664306640625, 3.633056640625, 3.7996826171875, 3.96630859375, 4.1329345703125, 4.299560546875, 4.4661865234375, 4.6328125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 15.0, 20.0, 46.0, 73.0, 101.0, 161.0, 231.0, 330.0, 506.0, 816.0, 1226.0, 1702.0, 2530.0, 3646.0, 5351.0, 8079.0, 11922.0, 17656.0, 26214.0, 38547.0, 56421.0, 79870.0, 108808.0, 162171.0, 1156782.0, 119616.0, 91541.0, 64828.0, 44824.0, 30426.0, 20444.0, 13731.0, 9215.0, 6178.0, 4155.0, 2964.0, 1954.0, 1306.0, 912.0, 609.0, 423.0, 264.0, 167.0, 102.0, 93.0, 57.0, 42.0, 17.0, 14.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.6005859375, -0.5819320678710938, -0.5632781982421875, -0.5446243286132812, -0.525970458984375, -0.5073165893554688, -0.4886627197265625, -0.47000885009765625, -0.45135498046875, -0.43270111083984375, -0.4140472412109375, -0.39539337158203125, -0.376739501953125, -0.35808563232421875, -0.3394317626953125, -0.32077789306640625, -0.3021240234375, -0.28347015380859375, -0.2648162841796875, -0.24616241455078125, -0.227508544921875, -0.20885467529296875, -0.1902008056640625, -0.17154693603515625, -0.15289306640625, -0.13423919677734375, -0.1155853271484375, -0.09693145751953125, -0.078277587890625, -0.05962371826171875, -0.0409698486328125, -0.02231597900390625, -0.003662109375, 0.01499176025390625, 0.0336456298828125, 0.05229949951171875, 0.070953369140625, 0.08960723876953125, 0.1082611083984375, 0.12691497802734375, 0.14556884765625, 0.16422271728515625, 0.1828765869140625, 0.20153045654296875, 0.220184326171875, 0.23883819580078125, 0.2574920654296875, 0.27614593505859375, 0.2947998046875, 0.31345367431640625, 0.3321075439453125, 0.35076141357421875, 0.369415283203125, 0.38806915283203125, 0.4067230224609375, 0.42537689208984375, 0.44403076171875, 0.46268463134765625, 0.4813385009765625, 0.49999237060546875, 0.518646240234375, 0.5373001098632812, 0.5559539794921875, 0.5746078491210938, 0.59326171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 12.0, 12.0, 12.0, 9.0, 17.0, 13.0, 25.0, 31.0, 28.0, 39.0, 45.0, 49.0, 61.0, 63.0, 75.0, 63.0, 77.0, 51.0, 63.0, 39.0, 40.0, 24.0, 24.0, 19.0, 12.0, 19.0, 11.0, 7.0, 7.0, 7.0, 7.0, 7.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0098419189453125, -0.009496450424194336, -0.009150981903076172, -0.008805513381958008, -0.008460044860839844, -0.00811457633972168, -0.007769107818603516, -0.0074236392974853516, -0.0070781707763671875, -0.0067327022552490234, -0.006387233734130859, -0.006041765213012695, -0.005696296691894531, -0.005350828170776367, -0.005005359649658203, -0.004659891128540039, -0.004314422607421875, -0.003968954086303711, -0.003623485565185547, -0.003278017044067383, -0.0029325485229492188, -0.0025870800018310547, -0.0022416114807128906, -0.0018961429595947266, -0.0015506744384765625, -0.0012052059173583984, -0.0008597373962402344, -0.0005142688751220703, -0.00016880035400390625, 0.0001766681671142578, 0.0005221366882324219, 0.0008676052093505859, 0.00121307373046875, 0.001558542251586914, 0.0019040107727050781, 0.002249479293823242, 0.0025949478149414062, 0.0029404163360595703, 0.0032858848571777344, 0.0036313533782958984, 0.0039768218994140625, 0.0043222904205322266, 0.004667758941650391, 0.005013227462768555, 0.005358695983886719, 0.005704164505004883, 0.006049633026123047, 0.006395101547241211, 0.006740570068359375, 0.007086038589477539, 0.007431507110595703, 0.007776975631713867, 0.008122444152832031, 0.008467912673950195, 0.00881338119506836, 0.009158849716186523, 0.009504318237304688, 0.009849786758422852, 0.010195255279541016, 0.01054072380065918, 0.010886192321777344, 0.011231660842895508, 0.011577129364013672, 0.011922597885131836, 0.01226806640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 7.0, 7.0, 15.0, 11.0, 16.0, 16.0, 27.0, 26.0, 28.0, 42.0, 47.0, 76.0, 104.0, 176.0, 260.0, 379.0, 739.0, 4403.0, 1034350.0, 5889.0, 737.0, 374.0, 230.0, 152.0, 101.0, 84.0, 48.0, 28.0, 38.0, 22.0, 24.0, 20.0, 19.0, 10.0, 12.0, 4.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.22265625, -0.21638870239257812, -0.21012115478515625, -0.20385360717773438, -0.1975860595703125, -0.19131851196289062, -0.18505096435546875, -0.17878341674804688, -0.172515869140625, -0.16624832153320312, -0.15998077392578125, -0.15371322631835938, -0.1474456787109375, -0.14117813110351562, -0.13491058349609375, -0.12864303588867188, -0.12237548828125, -0.11610794067382812, -0.10984039306640625, -0.10357284545898438, -0.0973052978515625, -0.09103775024414062, -0.08477020263671875, -0.07850265502929688, -0.072235107421875, -0.06596755981445312, -0.05970001220703125, -0.053432464599609375, -0.0471649169921875, -0.040897369384765625, -0.03462982177734375, -0.028362274169921875, -0.0220947265625, -0.015827178955078125, -0.00955963134765625, -0.003292083740234375, 0.0029754638671875, 0.009243011474609375, 0.01551055908203125, 0.021778106689453125, 0.028045654296875, 0.034313201904296875, 0.04058074951171875, 0.046848297119140625, 0.0531158447265625, 0.059383392333984375, 0.06565093994140625, 0.07191848754882812, 0.07818603515625, 0.08445358276367188, 0.09072113037109375, 0.09698867797851562, 0.1032562255859375, 0.10952377319335938, 0.11579132080078125, 0.12205886840820312, 0.128326416015625, 0.13459396362304688, 0.14086151123046875, 0.14712905883789062, 0.1533966064453125, 0.15966415405273438, 0.16593170166015625, 0.17219924926757812, 0.178466796875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 96.0, 915.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06217178329825401, -0.059098780155181885, -0.05602577328681946, -0.05295277014374733, -0.0498797670006752, -0.046806760132312775, -0.043733756989240646, -0.04066075384616852, -0.03758774697780609, -0.03451474383473396, -0.031441736966371536, -0.028368733823299408, -0.02529572881758213, -0.022222723811864853, -0.019149720668792725, -0.016076715663075447, -0.01300371065735817, -0.009930705651640892, -0.006857701577246189, -0.003784697502851486, -0.0007116924971342087, 0.002361312508583069, 0.005434315651655197, 0.008507320657372475, 0.011580325663089752, 0.01465333066880703, 0.017726335674524307, 0.020799338817596436, 0.023872343823313713, 0.02694534882903099, 0.03001835197210312, 0.033091358840465546, 0.036164358258247375, 0.039237361401319504, 0.04231036826968193, 0.04538337141275406, 0.048456378281116486, 0.051529381424188614, 0.05460238456726074, 0.05767539143562317, 0.0607483945786953, 0.06382139772176743, 0.06689440459012985, 0.06996740400791168, 0.07304041087627411, 0.07611341774463654, 0.07918642461299896, 0.08225942403078079, 0.08533243089914322, 0.08840543776750565, 0.09147843718528748, 0.0945514440536499, 0.09762445092201233, 0.10069745779037476, 0.10377045720815659, 0.10684346407651901, 0.10991646349430084, 0.11298947036266327, 0.1160624697804451, 0.11913547664880753, 0.12220848351716995, 0.12528148293495178, 0.1283544898033142, 0.13142749667167664, 0.13450050354003906]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 13.0, 20.0, 16.0, 18.0, 29.0, 41.0, 51.0, 64.0, 53.0, 52.0, 72.0, 80.0, 57.0, 64.0, 45.0, 54.0, 50.0, 52.0, 36.0, 39.0, 24.0, 19.0, 14.0, 9.0, 9.0, 10.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009626805782318115, -0.009287890046834946, -0.008948974311351776, -0.008610058575868607, -0.008271142840385437, -0.007932227104902267, -0.007593311369419098, -0.007254395633935928, -0.006915479898452759, -0.006576564162969589, -0.00623764842748642, -0.00589873269200325, -0.005559816956520081, -0.005220901221036911, -0.0048819854855537415, -0.004543069750070572, -0.004204154014587402, -0.003865238279104233, -0.0035263225436210632, -0.0031874068081378937, -0.002848491072654724, -0.0025095753371715546, -0.002170659601688385, -0.0018317438662052155, -0.001492828130722046, -0.0011539123952388763, -0.0008149966597557068, -0.00047608092427253723, -0.00013716518878936768, 0.00020175054669380188, 0.0005406662821769714, 0.000879582017660141, 0.0012184977531433105, 0.00155741348862648, 0.0018963292241096497, 0.002235244959592819, 0.0025741606950759888, 0.0029130764305591583, 0.003251992166042328, 0.0035909079015254974, 0.003929823637008667, 0.0042687393724918365, 0.004607655107975006, 0.004946570843458176, 0.005285486578941345, 0.005624402314424515, 0.005963318049907684, 0.006302233785390854, 0.0066411495208740234, 0.006980065256357193, 0.0073189809918403625, 0.007657896727323532, 0.007996812462806702, 0.008335728198289871, 0.00867464393377304, 0.00901355966925621, 0.00935247540473938, 0.00969139114022255, 0.010030306875705719, 0.010369222611188889, 0.010708138346672058, 0.011047054082155228, 0.011385969817638397, 0.011724885553121567, 0.012063801288604736]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 10.0, 4.0, 7.0, 11.0, 20.0, 20.0, 19.0, 26.0, 32.0, 17.0, 32.0, 35.0, 35.0, 34.0, 42.0, 36.0, 36.0, 37.0, 45.0, 48.0, 39.0, 43.0, 36.0, 39.0, 40.0, 36.0, 30.0, 35.0, 23.0, 25.0, 13.0, 12.0, 17.0, 12.0, 8.0, 13.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-10.8515625, -10.5557861328125, -10.260009765625, -9.9642333984375, -9.66845703125, -9.3726806640625, -9.076904296875, -8.7811279296875, -8.4853515625, -8.1895751953125, -7.893798828125, -7.5980224609375, -7.30224609375, -7.0064697265625, -6.710693359375, -6.4149169921875, -6.119140625, -5.8233642578125, -5.527587890625, -5.2318115234375, -4.93603515625, -4.6402587890625, -4.344482421875, -4.0487060546875, -3.7529296875, -3.4571533203125, -3.161376953125, -2.8656005859375, -2.56982421875, -2.2740478515625, -1.978271484375, -1.6824951171875, -1.38671875, -1.0909423828125, -0.795166015625, -0.4993896484375, -0.20361328125, 0.0921630859375, 0.387939453125, 0.6837158203125, 0.9794921875, 1.2752685546875, 1.571044921875, 1.8668212890625, 2.16259765625, 2.4583740234375, 2.754150390625, 3.0499267578125, 3.345703125, 3.6414794921875, 3.937255859375, 4.2330322265625, 4.52880859375, 4.8245849609375, 5.120361328125, 5.4161376953125, 5.7119140625, 6.0076904296875, 6.303466796875, 6.5992431640625, 6.89501953125, 7.1907958984375, 7.486572265625, 7.7823486328125, 8.078125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 11.0, 9.0, 15.0, 19.0, 40.0, 57.0, 74.0, 105.0, 134.0, 178.0, 274.0, 319.0, 503.0, 623.0, 882.0, 1259.0, 2226.0, 5832.0, 28294.0, 194362.0, 624232.0, 154853.0, 22875.0, 4946.0, 2030.0, 1210.0, 888.0, 638.0, 455.0, 354.0, 242.0, 156.0, 127.0, 81.0, 68.0, 54.0, 31.0, 25.0, 20.0, 11.0, 11.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.62890625, -18.0546875, -17.48046875, -16.90625, -16.33203125, -15.7578125, -15.18359375, -14.609375, -14.03515625, -13.4609375, -12.88671875, -12.3125, -11.73828125, -11.1640625, -10.58984375, -10.015625, -9.44140625, -8.8671875, -8.29296875, -7.71875, -7.14453125, -6.5703125, -5.99609375, -5.421875, -4.84765625, -4.2734375, -3.69921875, -3.125, -2.55078125, -1.9765625, -1.40234375, -0.828125, -0.25390625, 0.3203125, 0.89453125, 1.46875, 2.04296875, 2.6171875, 3.19140625, 3.765625, 4.33984375, 4.9140625, 5.48828125, 6.0625, 6.63671875, 7.2109375, 7.78515625, 8.359375, 8.93359375, 9.5078125, 10.08203125, 10.65625, 11.23046875, 11.8046875, 12.37890625, 12.953125, 13.52734375, 14.1015625, 14.67578125, 15.25, 15.82421875, 16.3984375, 16.97265625, 17.546875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 8.0, 4.0, 9.0, 7.0, 9.0, 13.0, 13.0, 21.0, 17.0, 25.0, 29.0, 33.0, 33.0, 33.0, 52.0, 56.0, 87.0, 103.0, 229.0, 1374.0, 283.0, 145.0, 82.0, 67.0, 43.0, 31.0, 29.0, 31.0, 30.0, 33.0, 17.0, 15.0, 17.0, 11.0, 12.0, 12.0, 12.0, 5.0, 6.0, 2.0, 1.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.398681640625, -18.67236328125, -17.946044921875, -17.2197265625, -16.493408203125, -15.76708984375, -15.040771484375, -14.314453125, -13.588134765625, -12.86181640625, -12.135498046875, -11.4091796875, -10.682861328125, -9.95654296875, -9.230224609375, -8.50390625, -7.777587890625, -7.05126953125, -6.324951171875, -5.5986328125, -4.872314453125, -4.14599609375, -3.419677734375, -2.693359375, -1.967041015625, -1.24072265625, -0.514404296875, 0.2119140625, 0.938232421875, 1.66455078125, 2.390869140625, 3.1171875, 3.843505859375, 4.56982421875, 5.296142578125, 6.0224609375, 6.748779296875, 7.47509765625, 8.201416015625, 8.927734375, 9.654052734375, 10.38037109375, 11.106689453125, 11.8330078125, 12.559326171875, 13.28564453125, 14.011962890625, 14.73828125, 15.464599609375, 16.19091796875, 16.917236328125, 17.6435546875, 18.369873046875, 19.09619140625, 19.822509765625, 20.548828125, 21.275146484375, 22.00146484375, 22.727783203125, 23.4541015625, 24.180419921875, 24.90673828125, 25.633056640625, 26.359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 9.0, 10.0, 4.0, 22.0, 14.0, 13.0, 23.0, 39.0, 51.0, 64.0, 75.0, 140.0, 213.0, 369.0, 708.0, 2029.0, 383184.0, 2754101.0, 2557.0, 846.0, 401.0, 257.0, 164.0, 89.0, 83.0, 52.0, 38.0, 30.0, 19.0, 17.0, 14.0, 8.0, 9.0, 4.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.5, -65.970703125, -63.44140625, -60.912109375, -58.3828125, -55.853515625, -53.32421875, -50.794921875, -48.265625, -45.736328125, -43.20703125, -40.677734375, -38.1484375, -35.619140625, -33.08984375, -30.560546875, -28.03125, -25.501953125, -22.97265625, -20.443359375, -17.9140625, -15.384765625, -12.85546875, -10.326171875, -7.796875, -5.267578125, -2.73828125, -0.208984375, 2.3203125, 4.849609375, 7.37890625, 9.908203125, 12.4375, 14.966796875, 17.49609375, 20.025390625, 22.5546875, 25.083984375, 27.61328125, 30.142578125, 32.671875, 35.201171875, 37.73046875, 40.259765625, 42.7890625, 45.318359375, 47.84765625, 50.376953125, 52.90625, 55.435546875, 57.96484375, 60.494140625, 63.0234375, 65.552734375, 68.08203125, 70.611328125, 73.140625, 75.669921875, 78.19921875, 80.728515625, 83.2578125, 85.787109375, 88.31640625, 90.845703125, 93.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 784.0, 221.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-315.14605712890625, -299.9920959472656, -284.838134765625, -269.6842041015625, -254.53024291992188, -239.37628173828125, -224.2223358154297, -209.06838989257812, -193.9144287109375, -178.76046752929688, -163.6065216064453, -148.45257568359375, -133.29861450195312, -118.14466094970703, -102.99070739746094, -87.83675384521484, -72.68280029296875, -57.528846740722656, -42.37489318847656, -27.22093963623047, -12.066986083984375, 3.0869674682617188, 18.240921020507812, 33.394874572753906, 48.548828125, 63.702781677246094, 78.85673522949219, 94.01068878173828, 109.16464233398438, 124.31859588623047, 139.47254943847656, 154.62649536132812, 169.78045654296875, 184.93441772460938, 200.08836364746094, 215.2423095703125, 230.39627075195312, 245.55023193359375, 260.70416259765625, 275.8581237792969, 291.0120849609375, 306.1660461425781, 321.32000732421875, 336.47393798828125, 351.6278991699219, 366.7818603515625, 381.935791015625, 397.0897521972656, 412.24371337890625, 427.3976745605469, 442.5516357421875, 457.70556640625, 472.8595275878906, 488.01348876953125, 503.16741943359375, 518.3214111328125, 533.475341796875, 548.6292724609375, 563.7832641601562, 578.9371948242188, 594.0911865234375, 609.2451171875, 624.3990478515625, 639.5530395507812, 654.7069702148438]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 11.0, 10.0, 16.0, 12.0, 16.0, 14.0, 25.0, 22.0, 18.0, 23.0, 37.0, 32.0, 38.0, 28.0, 27.0, 49.0, 38.0, 37.0, 34.0, 44.0, 37.0, 33.0, 52.0, 22.0, 28.0, 38.0, 30.0, 33.0, 20.0, 23.0, 21.0, 15.0, 16.0, 14.0, 10.0, 12.0, 7.0, 13.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-58.36372375488281, -56.542327880859375, -54.7209358215332, -52.899539947509766, -51.07814407348633, -49.256752014160156, -47.43535614013672, -45.61396026611328, -43.792564392089844, -41.971168518066406, -40.149776458740234, -38.3283805847168, -36.50698471069336, -34.68559265136719, -32.86419677734375, -31.042800903320312, -29.22140884399414, -27.400014877319336, -25.5786190032959, -23.757225036621094, -21.935829162597656, -20.11443519592285, -18.293041229248047, -16.47164535522461, -14.650251388549805, -12.828856468200684, -11.007461547851562, -9.186067581176758, -7.364672660827637, -5.543277740478516, -3.721883773803711, -1.9004888534545898, -0.07909393310546875, 1.7423007488250732, 3.5636954307556152, 5.385089874267578, 7.206484794616699, 9.02787971496582, 10.849273681640625, 12.670668601989746, 14.492063522338867, 16.313457489013672, 18.13485336303711, 19.956247329711914, 21.77764129638672, 23.599037170410156, 25.42043113708496, 27.241825103759766, 29.063220977783203, 30.884614944458008, 32.70600891113281, 34.52740478515625, 36.34880065917969, 38.170196533203125, 39.9915885925293, 41.812984466552734, 43.634376525878906, 45.455772399902344, 47.277164459228516, 49.09856033325195, 50.91995620727539, 52.74134826660156, 54.562744140625, 56.38414001464844, 58.205535888671875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 9.0, 20.0, 8.0, 18.0, 19.0, 21.0, 26.0, 27.0, 38.0, 32.0, 36.0, 42.0, 40.0, 26.0, 42.0, 41.0, 44.0, 35.0, 44.0, 42.0, 36.0, 40.0, 42.0, 26.0, 34.0, 28.0, 23.0, 21.0, 25.0, 11.0, 12.0, 11.0, 9.0, 7.0, 8.0, 9.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0], "bins": [-10.4375, -10.1422119140625, -9.846923828125, -9.5516357421875, -9.25634765625, -8.9610595703125, -8.665771484375, -8.3704833984375, -8.0751953125, -7.7799072265625, -7.484619140625, -7.1893310546875, -6.89404296875, -6.5987548828125, -6.303466796875, -6.0081787109375, -5.712890625, -5.4176025390625, -5.122314453125, -4.8270263671875, -4.53173828125, -4.2364501953125, -3.941162109375, -3.6458740234375, -3.3505859375, -3.0552978515625, -2.760009765625, -2.4647216796875, -2.16943359375, -1.8741455078125, -1.578857421875, -1.2835693359375, -0.98828125, -0.6929931640625, -0.397705078125, -0.1024169921875, 0.19287109375, 0.4881591796875, 0.783447265625, 1.0787353515625, 1.3740234375, 1.6693115234375, 1.964599609375, 2.2598876953125, 2.55517578125, 2.8504638671875, 3.145751953125, 3.4410400390625, 3.736328125, 4.0316162109375, 4.326904296875, 4.6221923828125, 4.91748046875, 5.2127685546875, 5.508056640625, 5.8033447265625, 6.0986328125, 6.3939208984375, 6.689208984375, 6.9844970703125, 7.27978515625, 7.5750732421875, 7.870361328125, 8.1656494140625, 8.4609375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 9.0, 13.0, 26.0, 24.0, 28.0, 31.0, 38.0, 52.0, 72.0, 99.0, 158.0, 222.0, 401.0, 738.0, 1805.0, 5246.0, 20037.0, 147754.0, 1408210.0, 2232876.0, 327943.0, 36035.0, 7654.0, 2462.0, 1002.0, 478.0, 263.0, 159.0, 128.0, 78.0, 68.0, 43.0, 28.0, 25.0, 14.0, 11.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.03125, -19.42724609375, -18.8232421875, -18.21923828125, -17.615234375, -17.01123046875, -16.4072265625, -15.80322265625, -15.19921875, -14.59521484375, -13.9912109375, -13.38720703125, -12.783203125, -12.17919921875, -11.5751953125, -10.97119140625, -10.3671875, -9.76318359375, -9.1591796875, -8.55517578125, -7.951171875, -7.34716796875, -6.7431640625, -6.13916015625, -5.53515625, -4.93115234375, -4.3271484375, -3.72314453125, -3.119140625, -2.51513671875, -1.9111328125, -1.30712890625, -0.703125, -0.09912109375, 0.5048828125, 1.10888671875, 1.712890625, 2.31689453125, 2.9208984375, 3.52490234375, 4.12890625, 4.73291015625, 5.3369140625, 5.94091796875, 6.544921875, 7.14892578125, 7.7529296875, 8.35693359375, 8.9609375, 9.56494140625, 10.1689453125, 10.77294921875, 11.376953125, 11.98095703125, 12.5849609375, 13.18896484375, 13.79296875, 14.39697265625, 15.0009765625, 15.60498046875, 16.208984375, 16.81298828125, 17.4169921875, 18.02099609375, 18.625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 22.0, 30.0, 56.0, 74.0, 107.0, 174.0, 248.0, 433.0, 691.0, 799.0, 545.0, 291.0, 204.0, 143.0, 96.0, 54.0, 32.0, 19.0, 15.0, 12.0, 8.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.520263671875, -18.68115234375, -17.842041015625, -17.0029296875, -16.163818359375, -15.32470703125, -14.485595703125, -13.646484375, -12.807373046875, -11.96826171875, -11.129150390625, -10.2900390625, -9.450927734375, -8.61181640625, -7.772705078125, -6.93359375, -6.094482421875, -5.25537109375, -4.416259765625, -3.5771484375, -2.738037109375, -1.89892578125, -1.059814453125, -0.220703125, 0.618408203125, 1.45751953125, 2.296630859375, 3.1357421875, 3.974853515625, 4.81396484375, 5.653076171875, 6.4921875, 7.331298828125, 8.17041015625, 9.009521484375, 9.8486328125, 10.687744140625, 11.52685546875, 12.365966796875, 13.205078125, 14.044189453125, 14.88330078125, 15.722412109375, 16.5615234375, 17.400634765625, 18.23974609375, 19.078857421875, 19.91796875, 20.757080078125, 21.59619140625, 22.435302734375, 23.2744140625, 24.113525390625, 24.95263671875, 25.791748046875, 26.630859375, 27.469970703125, 28.30908203125, 29.148193359375, 29.9873046875, 30.826416015625, 31.66552734375, 32.504638671875, 33.34375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 6.0, 3.0, 5.0, 10.0, 17.0, 32.0, 51.0, 94.0, 183.0, 458.0, 1042.0, 3506.0, 45980.0, 3637785.0, 492235.0, 9486.0, 2010.0, 713.0, 319.0, 165.0, 71.0, 41.0, 26.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-65.3125, -63.7099609375, -62.107421875, -60.5048828125, -58.90234375, -57.2998046875, -55.697265625, -54.0947265625, -52.4921875, -50.8896484375, -49.287109375, -47.6845703125, -46.08203125, -44.4794921875, -42.876953125, -41.2744140625, -39.671875, -38.0693359375, -36.466796875, -34.8642578125, -33.26171875, -31.6591796875, -30.056640625, -28.4541015625, -26.8515625, -25.2490234375, -23.646484375, -22.0439453125, -20.44140625, -18.8388671875, -17.236328125, -15.6337890625, -14.03125, -12.4287109375, -10.826171875, -9.2236328125, -7.62109375, -6.0185546875, -4.416015625, -2.8134765625, -1.2109375, 0.3916015625, 1.994140625, 3.5966796875, 5.19921875, 6.8017578125, 8.404296875, 10.0068359375, 11.609375, 13.2119140625, 14.814453125, 16.4169921875, 18.01953125, 19.6220703125, 21.224609375, 22.8271484375, 24.4296875, 26.0322265625, 27.634765625, 29.2373046875, 30.83984375, 32.4423828125, 34.044921875, 35.6474609375, 37.25]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1009.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-494.6995849609375, -435.8778076171875, -377.0560607910156, -318.23431396484375, -259.41253662109375, -200.59075927734375, -141.76901245117188, -82.947265625, -24.12548828125, 34.69627380371094, 93.51803588867188, 152.3397979736328, 211.16156005859375, 269.98333740234375, 328.8050842285156, 387.6268310546875, 446.4486083984375, 505.2703857421875, 564.0921630859375, 622.9138793945312, 681.7356567382812, 740.5574340820312, 799.379150390625, 858.200927734375, 917.022705078125, 975.844482421875, 1034.666259765625, 1093.488037109375, 1152.309814453125, 1211.131591796875, 1269.9532470703125, 1328.7750244140625, 1387.596923828125, 1446.418701171875, 1505.240478515625, 1564.062255859375, 1622.884033203125, 1681.705810546875, 1740.5274658203125, 1799.3492431640625, 1858.1710205078125, 1916.9927978515625, 1975.8145751953125, 2034.6363525390625, 2093.4580078125, 2152.27978515625, 2211.1015625, 2269.92333984375, 2328.7451171875, 2387.56689453125, 2446.388671875, 2505.21044921875, 2564.0322265625, 2622.85400390625, 2681.67578125, 2740.49755859375, 2799.3193359375, 2858.14111328125, 2916.962890625, 2975.78466796875, 3034.6064453125, 3093.42822265625, 3152.25, 3211.07177734375, 3269.893310546875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 8.0, 11.0, 16.0, 28.0, 33.0, 40.0, 49.0, 61.0, 71.0, 102.0, 88.0, 87.0, 100.0, 83.0, 71.0, 58.0, 36.0, 27.0, 13.0, 11.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-193.9503173828125, -189.4902801513672, -185.03024291992188, -180.5701904296875, -176.1101531982422, -171.65011596679688, -167.1900634765625, -162.7300262451172, -158.26998901367188, -153.80995178222656, -149.34991455078125, -144.88986206054688, -140.42982482910156, -135.96978759765625, -131.50973510742188, -127.04969787597656, -122.58966064453125, -118.12962341308594, -113.6695785522461, -109.20953369140625, -104.74949645996094, -100.28945922851562, -95.82941436767578, -91.36936950683594, -86.90933227539062, -82.44929504394531, -77.98925018310547, -73.52920532226562, -69.06916809082031, -64.609130859375, -60.149085998535156, -55.68904495239258, -51.22900390625, -46.76896286010742, -42.308921813964844, -37.848880767822266, -33.38883972167969, -28.92879867553711, -24.46875762939453, -20.008716583251953, -15.548675537109375, -11.088634490966797, -6.628593444824219, -2.1685523986816406, 2.2914886474609375, 6.751529693603516, 11.211570739746094, 15.671611785888672, 20.13165283203125, 24.591693878173828, 29.051734924316406, 33.511775970458984, 37.97181701660156, 42.43185806274414, 46.89189910888672, 51.3519401550293, 55.811981201171875, 60.27202224731445, 64.73206329345703, 69.19210815429688, 73.65214538574219, 78.1121826171875, 82.57222747802734, 87.03227233886719, 91.4923095703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 3.0, 6.0, 12.0, 7.0, 16.0, 15.0, 23.0, 16.0, 28.0, 28.0, 26.0, 30.0, 28.0, 37.0, 43.0, 39.0, 34.0, 41.0, 45.0, 32.0, 44.0, 45.0, 35.0, 32.0, 31.0, 34.0, 40.0, 32.0, 37.0, 20.0, 14.0, 17.0, 17.0, 17.0, 16.0, 13.0, 5.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.3671875, -7.13848876953125, -6.9097900390625, -6.68109130859375, -6.452392578125, -6.22369384765625, -5.9949951171875, -5.76629638671875, -5.53759765625, -5.30889892578125, -5.0802001953125, -4.85150146484375, -4.622802734375, -4.39410400390625, -4.1654052734375, -3.93670654296875, -3.7080078125, -3.47930908203125, -3.2506103515625, -3.02191162109375, -2.793212890625, -2.56451416015625, -2.3358154296875, -2.10711669921875, -1.87841796875, -1.64971923828125, -1.4210205078125, -1.19232177734375, -0.963623046875, -0.73492431640625, -0.5062255859375, -0.27752685546875, -0.048828125, 0.17987060546875, 0.4085693359375, 0.63726806640625, 0.865966796875, 1.09466552734375, 1.3233642578125, 1.55206298828125, 1.78076171875, 2.00946044921875, 2.2381591796875, 2.46685791015625, 2.695556640625, 2.92425537109375, 3.1529541015625, 3.38165283203125, 3.6103515625, 3.83905029296875, 4.0677490234375, 4.29644775390625, 4.525146484375, 4.75384521484375, 4.9825439453125, 5.21124267578125, 5.43994140625, 5.66864013671875, 5.8973388671875, 6.12603759765625, 6.354736328125, 6.58343505859375, 6.8121337890625, 7.04083251953125, 7.26953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 13.0, 12.0, 25.0, 37.0, 52.0, 81.0, 100.0, 141.0, 203.0, 308.0, 471.0, 676.0, 1076.0, 1693.0, 2505.0, 3921.0, 6263.0, 10565.0, 17444.0, 30825.0, 54576.0, 97339.0, 159916.0, 208239.0, 180078.0, 115218.0, 65771.0, 37132.0, 21083.0, 12301.0, 7486.0, 4524.0, 2874.0, 1852.0, 1228.0, 824.0, 559.0, 371.0, 237.0, 161.0, 108.0, 80.0, 50.0, 37.0, 31.0, 24.0, 12.0, 11.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7978515625, -0.7726516723632812, -0.7474517822265625, -0.7222518920898438, -0.697052001953125, -0.6718521118164062, -0.6466522216796875, -0.6214523315429688, -0.59625244140625, -0.5710525512695312, -0.5458526611328125, -0.5206527709960938, -0.495452880859375, -0.47025299072265625, -0.4450531005859375, -0.41985321044921875, -0.3946533203125, -0.36945343017578125, -0.3442535400390625, -0.31905364990234375, -0.293853759765625, -0.26865386962890625, -0.2434539794921875, -0.21825408935546875, -0.19305419921875, -0.16785430908203125, -0.1426544189453125, -0.11745452880859375, -0.092254638671875, -0.06705474853515625, -0.0418548583984375, -0.01665496826171875, 0.008544921875, 0.03374481201171875, 0.0589447021484375, 0.08414459228515625, 0.109344482421875, 0.13454437255859375, 0.1597442626953125, 0.18494415283203125, 0.21014404296875, 0.23534393310546875, 0.2605438232421875, 0.28574371337890625, 0.310943603515625, 0.33614349365234375, 0.3613433837890625, 0.38654327392578125, 0.4117431640625, 0.43694305419921875, 0.4621429443359375, 0.48734283447265625, 0.512542724609375, 0.5377426147460938, 0.5629425048828125, 0.5881423950195312, 0.61334228515625, 0.6385421752929688, 0.6637420654296875, 0.6889419555664062, 0.714141845703125, 0.7393417358398438, 0.7645416259765625, 0.7897415161132812, 0.81494140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 9.0, 5.0, 10.0, 13.0, 9.0, 13.0, 14.0, 17.0, 9.0, 26.0, 21.0, 20.0, 27.0, 30.0, 34.0, 37.0, 39.0, 35.0, 52.0, 51.0, 1065.0, 46.0, 28.0, 46.0, 54.0, 52.0, 28.0, 31.0, 30.0, 23.0, 24.0, 25.0, 28.0, 17.0, 16.0, 15.0, 3.0, 10.0, 5.0, 2.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0390625, -4.87493896484375, -4.7108154296875, -4.54669189453125, -4.382568359375, -4.21844482421875, -4.0543212890625, -3.89019775390625, -3.72607421875, -3.56195068359375, -3.3978271484375, -3.23370361328125, -3.069580078125, -2.90545654296875, -2.7413330078125, -2.57720947265625, -2.4130859375, -2.24896240234375, -2.0848388671875, -1.92071533203125, -1.756591796875, -1.59246826171875, -1.4283447265625, -1.26422119140625, -1.10009765625, -0.93597412109375, -0.7718505859375, -0.60772705078125, -0.443603515625, -0.27947998046875, -0.1153564453125, 0.04876708984375, 0.212890625, 0.37701416015625, 0.5411376953125, 0.70526123046875, 0.869384765625, 1.03350830078125, 1.1976318359375, 1.36175537109375, 1.52587890625, 1.69000244140625, 1.8541259765625, 2.01824951171875, 2.182373046875, 2.34649658203125, 2.5106201171875, 2.67474365234375, 2.8388671875, 3.00299072265625, 3.1671142578125, 3.33123779296875, 3.495361328125, 3.65948486328125, 3.8236083984375, 3.98773193359375, 4.15185546875, 4.31597900390625, 4.4801025390625, 4.64422607421875, 4.808349609375, 4.97247314453125, 5.1365966796875, 5.30072021484375, 5.46484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 10.0, 18.0, 37.0, 59.0, 72.0, 100.0, 154.0, 230.0, 365.0, 535.0, 809.0, 1183.0, 1657.0, 2484.0, 3522.0, 5134.0, 7504.0, 11238.0, 16855.0, 25110.0, 37302.0, 54681.0, 77230.0, 104195.0, 134710.0, 1179974.0, 121605.0, 94455.0, 68533.0, 48098.0, 32226.0, 21660.0, 14535.0, 9795.0, 6642.0, 4471.0, 3208.0, 2132.0, 1509.0, 971.0, 676.0, 471.0, 349.0, 198.0, 159.0, 92.0, 56.0, 40.0, 24.0, 15.0, 15.0, 7.0, 8.0, 5.0, 0.0, 3.0], "bins": [-0.49560546875, -0.4807319641113281, -0.46585845947265625, -0.4509849548339844, -0.4361114501953125, -0.4212379455566406, -0.40636444091796875, -0.3914909362792969, -0.376617431640625, -0.3617439270019531, -0.34687042236328125, -0.3319969177246094, -0.3171234130859375, -0.3022499084472656, -0.28737640380859375, -0.2725028991699219, -0.25762939453125, -0.24275588989257812, -0.22788238525390625, -0.21300888061523438, -0.1981353759765625, -0.18326187133789062, -0.16838836669921875, -0.15351486206054688, -0.138641357421875, -0.12376785278320312, -0.10889434814453125, -0.09402084350585938, -0.0791473388671875, -0.06427383422851562, -0.04940032958984375, -0.034526824951171875, -0.0196533203125, -0.004779815673828125, 0.01009368896484375, 0.024967193603515625, 0.0398406982421875, 0.054714202880859375, 0.06958770751953125, 0.08446121215820312, 0.099334716796875, 0.11420822143554688, 0.12908172607421875, 0.14395523071289062, 0.1588287353515625, 0.17370223999023438, 0.18857574462890625, 0.20344924926757812, 0.21832275390625, 0.23319625854492188, 0.24806976318359375, 0.2629432678222656, 0.2778167724609375, 0.2926902770996094, 0.30756378173828125, 0.3224372863769531, 0.337310791015625, 0.3521842956542969, 0.36705780029296875, 0.3819313049316406, 0.3968048095703125, 0.4116783142089844, 0.42655181884765625, 0.4414253234863281, 0.456298828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 4.0, 3.0, 9.0, 8.0, 11.0, 13.0, 14.0, 10.0, 28.0, 22.0, 32.0, 34.0, 37.0, 47.0, 47.0, 63.0, 59.0, 71.0, 54.0, 47.0, 44.0, 42.0, 40.0, 44.0, 36.0, 24.0, 26.0, 24.0, 18.0, 17.0, 6.0, 15.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0], "bins": [-0.0084075927734375, -0.008178770542144775, -0.00794994831085205, -0.007721126079559326, -0.0074923038482666016, -0.007263481616973877, -0.007034659385681152, -0.006805837154388428, -0.006577014923095703, -0.0063481926918029785, -0.006119370460510254, -0.005890548229217529, -0.005661725997924805, -0.00543290376663208, -0.0052040815353393555, -0.004975259304046631, -0.004746437072753906, -0.004517614841461182, -0.004288792610168457, -0.004059970378875732, -0.003831148147583008, -0.003602325916290283, -0.0033735036849975586, -0.003144681453704834, -0.0029158592224121094, -0.0026870369911193848, -0.00245821475982666, -0.0022293925285339355, -0.002000570297241211, -0.0017717480659484863, -0.0015429258346557617, -0.0013141036033630371, -0.0010852813720703125, -0.0008564591407775879, -0.0006276369094848633, -0.00039881467819213867, -0.00016999244689941406, 5.882978439331055e-05, 0.00028765201568603516, 0.0005164742469787598, 0.0007452964782714844, 0.000974118709564209, 0.0012029409408569336, 0.0014317631721496582, 0.0016605854034423828, 0.0018894076347351074, 0.002118229866027832, 0.0023470520973205566, 0.0025758743286132812, 0.002804696559906006, 0.0030335187911987305, 0.003262341022491455, 0.0034911632537841797, 0.0037199854850769043, 0.003948807716369629, 0.0041776299476623535, 0.004406452178955078, 0.004635274410247803, 0.004864096641540527, 0.005092918872833252, 0.0053217411041259766, 0.005550563335418701, 0.005779385566711426, 0.00600820779800415, 0.006237030029296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 7.0, 5.0, 4.0, 5.0, 13.0, 9.0, 30.0, 21.0, 30.0, 30.0, 52.0, 62.0, 78.0, 97.0, 143.0, 188.0, 270.0, 575.0, 1495.0, 823036.0, 219651.0, 1201.0, 521.0, 285.0, 175.0, 120.0, 88.0, 73.0, 58.0, 37.0, 31.0, 31.0, 15.0, 19.0, 14.0, 10.0, 7.0, 18.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.123291015625, -0.11887741088867188, -0.11446380615234375, -0.11005020141601562, -0.1056365966796875, -0.10122299194335938, -0.09680938720703125, -0.09239578247070312, -0.087982177734375, -0.08356857299804688, -0.07915496826171875, -0.07474136352539062, -0.0703277587890625, -0.06591415405273438, -0.06150054931640625, -0.057086944580078125, -0.05267333984375, -0.048259735107421875, -0.04384613037109375, -0.039432525634765625, -0.0350189208984375, -0.030605316162109375, -0.02619171142578125, -0.021778106689453125, -0.017364501953125, -0.012950897216796875, -0.00853729248046875, -0.004123687744140625, 0.0002899169921875, 0.004703521728515625, 0.00911712646484375, 0.013530731201171875, 0.0179443359375, 0.022357940673828125, 0.02677154541015625, 0.031185150146484375, 0.0355987548828125, 0.040012359619140625, 0.04442596435546875, 0.048839569091796875, 0.053253173828125, 0.057666778564453125, 0.06208038330078125, 0.06649398803710938, 0.0709075927734375, 0.07532119750976562, 0.07973480224609375, 0.08414840698242188, 0.08856201171875, 0.09297561645507812, 0.09738922119140625, 0.10180282592773438, 0.1062164306640625, 0.11063003540039062, 0.11504364013671875, 0.11945724487304688, 0.123870849609375, 0.12828445434570312, 0.13269805908203125, 0.13711166381835938, 0.1415252685546875, 0.14593887329101562, 0.15035247802734375, 0.15476608276367188, 0.1591796875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 7.0, 1004.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01850746013224125, -0.01513953972607851, -0.011771619319915771, -0.008403699845075607, -0.0050357794389128685, -0.0016678590327501297, 0.0017000604420900345, 0.005067981779575348, 0.008435901254415512, 0.011803821660578251, 0.01517174206674099, 0.018539661541581154, 0.021907582879066467, 0.02527550235390663, 0.028643421828746796, 0.03201134502887726, 0.035379260778427124, 0.03874718025326729, 0.04211509972810745, 0.045483022928237915, 0.04885094240307808, 0.05221886187791824, 0.05558678135275841, 0.05895470082759857, 0.062322624027729034, 0.0656905472278595, 0.06905846297740936, 0.07242638617753983, 0.07579430192708969, 0.07916222512722015, 0.08253014087677002, 0.08589806407690048, 0.08926597982645035, 0.09263390302658081, 0.09600181877613068, 0.09936974197626114, 0.102737657725811, 0.10610558092594147, 0.10947349667549133, 0.1128414198756218, 0.11620934307575226, 0.11957726627588272, 0.12294518202543259, 0.12631310522556305, 0.12968102097511292, 0.13304895162582397, 0.13641686737537384, 0.1397847831249237, 0.14315269887447357, 0.14652061462402344, 0.1498885452747345, 0.15325646102428436, 0.15662437677383423, 0.1599923074245453, 0.16336022317409515, 0.16672813892364502, 0.17009606957435608, 0.17346398532390594, 0.176831915974617, 0.18019983172416687, 0.18356774747371674, 0.1869356632232666, 0.19030359387397766, 0.19367150962352753, 0.1970394253730774]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 11.0, 13.0, 22.0, 33.0, 40.0, 66.0, 65.0, 81.0, 92.0, 79.0, 81.0, 88.0, 69.0, 66.0, 60.0, 39.0, 28.0, 22.0, 14.0, 17.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.011212050914764404, -0.010908388532698154, -0.010604726150631905, -0.010301063768565655, -0.009997401386499405, -0.009693739004433155, -0.009390076622366905, -0.009086414240300655, -0.008782751858234406, -0.008479089476168156, -0.008175427094101906, -0.007871764712035656, -0.007568102329969406, -0.007264439947903156, -0.006960777565836906, -0.006657115183770657, -0.006353452801704407, -0.006049790419638157, -0.005746128037571907, -0.005442465655505657, -0.005138803273439407, -0.0048351408913731575, -0.004531478509306908, -0.004227816127240658, -0.003924153745174408, -0.003620491363108158, -0.0033168289810419083, -0.0030131665989756584, -0.0027095042169094086, -0.0024058418348431587, -0.002102179452776909, -0.001798517070710659, -0.0014948546886444092, -0.0011911923065781593, -0.0008875299245119095, -0.0005838675424456596, -0.0002802051603794098, 2.3457221686840057e-05, 0.0003271196037530899, 0.0006307819858193398, 0.0009344443678855896, 0.0012381067499518394, 0.0015417691320180893, 0.0018454315140843391, 0.002149093896150589, 0.002452756278216839, 0.0027564186602830887, 0.0030600810423493385, 0.0033637434244155884, 0.0036674058064818382, 0.003971068188548088, 0.004274730570614338, 0.004578392952680588, 0.004882055334746838, 0.0051857177168130875, 0.005489380098879337, 0.005793042480945587, 0.006096704863011837, 0.006400367245078087, 0.006704029627144337, 0.0070076920092105865, 0.007311354391276836, 0.007615016773343086, 0.007918679155409336, 0.008222341537475586]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 3.0, 6.0, 12.0, 7.0, 16.0, 15.0, 23.0, 16.0, 28.0, 28.0, 26.0, 30.0, 28.0, 37.0, 43.0, 39.0, 34.0, 41.0, 45.0, 32.0, 44.0, 45.0, 35.0, 32.0, 31.0, 34.0, 40.0, 32.0, 37.0, 20.0, 14.0, 17.0, 17.0, 17.0, 16.0, 13.0, 5.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.3671875, -7.13848876953125, -6.9097900390625, -6.68109130859375, -6.452392578125, -6.22369384765625, -5.9949951171875, -5.76629638671875, -5.53759765625, -5.30889892578125, -5.0802001953125, -4.85150146484375, -4.622802734375, -4.39410400390625, -4.1654052734375, -3.93670654296875, -3.7080078125, -3.47930908203125, -3.2506103515625, -3.02191162109375, -2.793212890625, -2.56451416015625, -2.3358154296875, -2.10711669921875, -1.87841796875, -1.64971923828125, -1.4210205078125, -1.19232177734375, -0.963623046875, -0.73492431640625, -0.5062255859375, -0.27752685546875, -0.048828125, 0.17987060546875, 0.4085693359375, 0.63726806640625, 0.865966796875, 1.09466552734375, 1.3233642578125, 1.55206298828125, 1.78076171875, 2.00946044921875, 2.2381591796875, 2.46685791015625, 2.695556640625, 2.92425537109375, 3.1529541015625, 3.38165283203125, 3.6103515625, 3.83905029296875, 4.0677490234375, 4.29644775390625, 4.525146484375, 4.75384521484375, 4.9825439453125, 5.21124267578125, 5.43994140625, 5.66864013671875, 5.8973388671875, 6.12603759765625, 6.354736328125, 6.58343505859375, 6.8121337890625, 7.04083251953125, 7.26953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 1.0, 5.0, 5.0, 6.0, 14.0, 11.0, 29.0, 31.0, 32.0, 60.0, 69.0, 85.0, 127.0, 170.0, 246.0, 333.0, 451.0, 689.0, 936.0, 1399.0, 2109.0, 3659.0, 9466.0, 64929.0, 655245.0, 270107.0, 24034.0, 5736.0, 2770.0, 1788.0, 1171.0, 805.0, 571.0, 417.0, 286.0, 190.0, 140.0, 112.0, 77.0, 65.0, 53.0, 41.0, 18.0, 18.0, 12.0, 10.0, 6.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.515625, -17.9140625, -17.3125, -16.7109375, -16.109375, -15.5078125, -14.90625, -14.3046875, -13.703125, -13.1015625, -12.5, -11.8984375, -11.296875, -10.6953125, -10.09375, -9.4921875, -8.890625, -8.2890625, -7.6875, -7.0859375, -6.484375, -5.8828125, -5.28125, -4.6796875, -4.078125, -3.4765625, -2.875, -2.2734375, -1.671875, -1.0703125, -0.46875, 0.1328125, 0.734375, 1.3359375, 1.9375, 2.5390625, 3.140625, 3.7421875, 4.34375, 4.9453125, 5.546875, 6.1484375, 6.75, 7.3515625, 7.953125, 8.5546875, 9.15625, 9.7578125, 10.359375, 10.9609375, 11.5625, 12.1640625, 12.765625, 13.3671875, 13.96875, 14.5703125, 15.171875, 15.7734375, 16.375, 16.9765625, 17.578125, 18.1796875, 18.78125, 19.3828125, 19.984375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 10.0, 9.0, 5.0, 10.0, 12.0, 16.0, 25.0, 28.0, 24.0, 40.0, 49.0, 44.0, 53.0, 71.0, 93.0, 223.0, 1622.0, 207.0, 108.0, 66.0, 49.0, 42.0, 38.0, 31.0, 31.0, 31.0, 13.0, 15.0, 13.0, 9.0, 16.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.853759765625, -21.11376953125, -20.373779296875, -19.6337890625, -18.893798828125, -18.15380859375, -17.413818359375, -16.673828125, -15.933837890625, -15.19384765625, -14.453857421875, -13.7138671875, -12.973876953125, -12.23388671875, -11.493896484375, -10.75390625, -10.013916015625, -9.27392578125, -8.533935546875, -7.7939453125, -7.053955078125, -6.31396484375, -5.573974609375, -4.833984375, -4.093994140625, -3.35400390625, -2.614013671875, -1.8740234375, -1.134033203125, -0.39404296875, 0.345947265625, 1.0859375, 1.825927734375, 2.56591796875, 3.305908203125, 4.0458984375, 4.785888671875, 5.52587890625, 6.265869140625, 7.005859375, 7.745849609375, 8.48583984375, 9.225830078125, 9.9658203125, 10.705810546875, 11.44580078125, 12.185791015625, 12.92578125, 13.665771484375, 14.40576171875, 15.145751953125, 15.8857421875, 16.625732421875, 17.36572265625, 18.105712890625, 18.845703125, 19.585693359375, 20.32568359375, 21.065673828125, 21.8056640625, 22.545654296875, 23.28564453125, 24.025634765625, 24.765625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 5.0, 6.0, 11.0, 9.0, 12.0, 22.0, 30.0, 31.0, 36.0, 49.0, 59.0, 90.0, 93.0, 163.0, 246.0, 468.0, 926.0, 3390.0, 2998684.0, 137543.0, 1887.0, 752.0, 379.0, 211.0, 142.0, 95.0, 90.0, 74.0, 41.0, 26.0, 24.0, 27.0, 12.0, 13.0, 14.0, 7.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-65.6875, -63.74609375, -61.8046875, -59.86328125, -57.921875, -55.98046875, -54.0390625, -52.09765625, -50.15625, -48.21484375, -46.2734375, -44.33203125, -42.390625, -40.44921875, -38.5078125, -36.56640625, -34.625, -32.68359375, -30.7421875, -28.80078125, -26.859375, -24.91796875, -22.9765625, -21.03515625, -19.09375, -17.15234375, -15.2109375, -13.26953125, -11.328125, -9.38671875, -7.4453125, -5.50390625, -3.5625, -1.62109375, 0.3203125, 2.26171875, 4.203125, 6.14453125, 8.0859375, 10.02734375, 11.96875, 13.91015625, 15.8515625, 17.79296875, 19.734375, 21.67578125, 23.6171875, 25.55859375, 27.5, 29.44140625, 31.3828125, 33.32421875, 35.265625, 37.20703125, 39.1484375, 41.08984375, 43.03125, 44.97265625, 46.9140625, 48.85546875, 50.796875, 52.73828125, 54.6796875, 56.62109375, 58.5625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [7.0, 89.0, 569.0, 320.0, 33.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.345535278320312, -13.693492889404297, -6.041450500488281, 1.6105918884277344, 9.26263427734375, 16.914676666259766, 24.56671905517578, 32.2187614440918, 39.87080383300781, 47.52284622192383, 55.174888610839844, 62.82693099975586, 70.47897338867188, 78.13101196289062, 85.7830581665039, 93.43510437011719, 101.08714294433594, 108.73918151855469, 116.39122772216797, 124.04327392578125, 131.6953125, 139.34735107421875, 146.9993896484375, 154.6514434814453, 162.30348205566406, 169.9555206298828, 177.60757446289062, 185.25961303710938, 192.91165161132812, 200.56369018554688, 208.21572875976562, 215.86778259277344, 223.51983642578125, 231.171875, 238.82391357421875, 246.47596740722656, 254.1280059814453, 261.7800598144531, 269.4320983886719, 277.0841369628906, 284.7361755371094, 292.3882141113281, 300.0402526855469, 307.6922912597656, 315.3443603515625, 322.99639892578125, 330.6484375, 338.30047607421875, 345.9525146484375, 353.60455322265625, 361.256591796875, 368.90863037109375, 376.5606689453125, 384.2127380371094, 391.8647766113281, 399.5168151855469, 407.1688537597656, 414.8208923339844, 422.4729309082031, 430.1249694824219, 437.77703857421875, 445.4290771484375, 453.08111572265625, 460.733154296875, 468.38519287109375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 13.0, 18.0, 10.0, 9.0, 16.0, 17.0, 19.0, 19.0, 23.0, 21.0, 29.0, 22.0, 34.0, 26.0, 30.0, 34.0, 46.0, 32.0, 33.0, 40.0, 49.0, 39.0, 34.0, 29.0, 29.0, 38.0, 34.0, 25.0, 32.0, 23.0, 23.0, 20.0, 14.0, 15.0, 16.0, 8.0, 7.0, 6.0, 9.0, 7.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.63916015625, -49.982940673828125, -48.32672119140625, -46.670501708984375, -45.0142822265625, -43.358062744140625, -41.701847076416016, -40.04562759399414, -38.389408111572266, -36.73318862915039, -35.076969146728516, -33.42074966430664, -31.7645320892334, -30.108312606811523, -28.45209503173828, -26.795875549316406, -25.13965606689453, -23.483436584472656, -21.82721710205078, -20.17099952697754, -18.514780044555664, -16.85856056213379, -15.20234203338623, -13.546123504638672, -11.889904022216797, -10.233684539794922, -8.577466011047363, -6.9212470054626465, -5.26502799987793, -3.6088085174560547, -1.952589988708496, -0.2963714599609375, 1.3598480224609375, 3.0160670280456543, 4.672286033630371, 6.328505039215088, 7.984724044799805, 9.64094352722168, 11.297162055969238, 12.953380584716797, 14.609600067138672, 16.265819549560547, 17.922039031982422, 19.578256607055664, 21.23447608947754, 22.890695571899414, 24.546913146972656, 26.20313262939453, 27.859352111816406, 29.51557159423828, 31.171791076660156, 32.82801055908203, 34.484230041503906, 36.14044952392578, 37.79666519165039, 39.452884674072266, 41.10910415649414, 42.765323638916016, 44.42154312133789, 46.077762603759766, 47.733978271484375, 49.39019775390625, 51.046417236328125, 52.70263671875, 54.358856201171875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 10.0, 6.0, 9.0, 15.0, 11.0, 18.0, 16.0, 27.0, 35.0, 34.0, 34.0, 48.0, 36.0, 47.0, 29.0, 40.0, 38.0, 35.0, 45.0, 42.0, 48.0, 32.0, 40.0, 36.0, 34.0, 24.0, 31.0, 25.0, 17.0, 25.0, 13.0, 12.0, 16.0, 9.0, 3.0, 16.0, 5.0, 3.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.359375, -8.110107421875, -7.86083984375, -7.611572265625, -7.3623046875, -7.113037109375, -6.86376953125, -6.614501953125, -6.365234375, -6.115966796875, -5.86669921875, -5.617431640625, -5.3681640625, -5.118896484375, -4.86962890625, -4.620361328125, -4.37109375, -4.121826171875, -3.87255859375, -3.623291015625, -3.3740234375, -3.124755859375, -2.87548828125, -2.626220703125, -2.376953125, -2.127685546875, -1.87841796875, -1.629150390625, -1.3798828125, -1.130615234375, -0.88134765625, -0.632080078125, -0.3828125, -0.133544921875, 0.11572265625, 0.364990234375, 0.6142578125, 0.863525390625, 1.11279296875, 1.362060546875, 1.611328125, 1.860595703125, 2.10986328125, 2.359130859375, 2.6083984375, 2.857666015625, 3.10693359375, 3.356201171875, 3.60546875, 3.854736328125, 4.10400390625, 4.353271484375, 4.6025390625, 4.851806640625, 5.10107421875, 5.350341796875, 5.599609375, 5.848876953125, 6.09814453125, 6.347412109375, 6.5966796875, 6.845947265625, 7.09521484375, 7.344482421875, 7.59375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 6.0, 9.0, 10.0, 14.0, 15.0, 22.0, 25.0, 32.0, 49.0, 69.0, 104.0, 115.0, 162.0, 266.0, 412.0, 680.0, 1125.0, 1819.0, 3285.0, 6476.0, 15654.0, 58917.0, 388698.0, 1786196.0, 1550733.0, 301917.0, 50007.0, 13796.0, 5877.0, 3081.0, 1747.0, 1002.0, 660.0, 397.0, 261.0, 169.0, 123.0, 70.0, 70.0, 50.0, 39.0, 25.0, 18.0, 15.0, 23.0, 9.0, 10.0, 8.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-13.5390625, -13.14013671875, -12.7412109375, -12.34228515625, -11.943359375, -11.54443359375, -11.1455078125, -10.74658203125, -10.34765625, -9.94873046875, -9.5498046875, -9.15087890625, -8.751953125, -8.35302734375, -7.9541015625, -7.55517578125, -7.15625, -6.75732421875, -6.3583984375, -5.95947265625, -5.560546875, -5.16162109375, -4.7626953125, -4.36376953125, -3.96484375, -3.56591796875, -3.1669921875, -2.76806640625, -2.369140625, -1.97021484375, -1.5712890625, -1.17236328125, -0.7734375, -0.37451171875, 0.0244140625, 0.42333984375, 0.822265625, 1.22119140625, 1.6201171875, 2.01904296875, 2.41796875, 2.81689453125, 3.2158203125, 3.61474609375, 4.013671875, 4.41259765625, 4.8115234375, 5.21044921875, 5.609375, 6.00830078125, 6.4072265625, 6.80615234375, 7.205078125, 7.60400390625, 8.0029296875, 8.40185546875, 8.80078125, 9.19970703125, 9.5986328125, 9.99755859375, 10.396484375, 10.79541015625, 11.1943359375, 11.59326171875, 11.9921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 16.0, 23.0, 50.0, 123.0, 288.0, 687.0, 1342.0, 889.0, 390.0, 165.0, 65.0, 23.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.625, -37.40625, -36.1875, -34.96875, -33.75, -32.53125, -31.3125, -30.09375, -28.875, -27.65625, -26.4375, -25.21875, -24.0, -22.78125, -21.5625, -20.34375, -19.125, -17.90625, -16.6875, -15.46875, -14.25, -13.03125, -11.8125, -10.59375, -9.375, -8.15625, -6.9375, -5.71875, -4.5, -3.28125, -2.0625, -0.84375, 0.375, 1.59375, 2.8125, 4.03125, 5.25, 6.46875, 7.6875, 8.90625, 10.125, 11.34375, 12.5625, 13.78125, 15.0, 16.21875, 17.4375, 18.65625, 19.875, 21.09375, 22.3125, 23.53125, 24.75, 25.96875, 27.1875, 28.40625, 29.625, 30.84375, 32.0625, 33.28125, 34.5, 35.71875, 36.9375, 38.15625, 39.375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 2.0, 9.0, 10.0, 35.0, 91.0, 227.0, 693.0, 2876.0, 1582489.0, 2603416.0, 3207.0, 752.0, 269.0, 105.0, 53.0, 18.0, 10.0, 3.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.9375, -82.365234375, -79.79296875, -77.220703125, -74.6484375, -72.076171875, -69.50390625, -66.931640625, -64.359375, -61.787109375, -59.21484375, -56.642578125, -54.0703125, -51.498046875, -48.92578125, -46.353515625, -43.78125, -41.208984375, -38.63671875, -36.064453125, -33.4921875, -30.919921875, -28.34765625, -25.775390625, -23.203125, -20.630859375, -18.05859375, -15.486328125, -12.9140625, -10.341796875, -7.76953125, -5.197265625, -2.625, -0.052734375, 2.51953125, 5.091796875, 7.6640625, 10.236328125, 12.80859375, 15.380859375, 17.953125, 20.525390625, 23.09765625, 25.669921875, 28.2421875, 30.814453125, 33.38671875, 35.958984375, 38.53125, 41.103515625, 43.67578125, 46.248046875, 48.8203125, 51.392578125, 53.96484375, 56.537109375, 59.109375, 61.681640625, 64.25390625, 66.826171875, 69.3984375, 71.970703125, 74.54296875, 77.115234375, 79.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 84.0, 923.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.2861022949219, -308.18603515625, -285.08599853515625, -261.9859619140625, -238.88589477539062, -215.7858428955078, -192.685791015625, -169.5857391357422, -146.48568725585938, -123.38563537597656, -100.28558349609375, -77.18553161621094, -54.085479736328125, -30.985427856445312, -7.8853759765625, 15.214675903320312, 38.314727783203125, 61.41477966308594, 84.51483154296875, 107.61488342285156, 130.71493530273438, 153.8149871826172, 176.9150390625, 200.0150909423828, 223.11514282226562, 246.21519470214844, 269.31524658203125, 292.415283203125, 315.5153503417969, 338.61541748046875, 361.7154541015625, 384.81549072265625, 407.91552734375, 431.01556396484375, 454.1156311035156, 477.2156982421875, 500.31573486328125, 523.415771484375, 546.515869140625, 569.6159057617188, 592.7159423828125, 615.8159790039062, 638.916015625, 662.01611328125, 685.1161499023438, 708.2161865234375, 731.3162841796875, 754.4163208007812, 777.516357421875, 800.6163940429688, 823.7164306640625, 846.8165283203125, 869.9165649414062, 893.0166015625, 916.11669921875, 939.2167358398438, 962.3167724609375, 985.4168090820312, 1008.516845703125, 1031.616943359375, 1054.717041015625, 1077.8170166015625, 1100.9171142578125, 1124.01708984375, 1147.1171875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 2.0, 9.0, 9.0, 11.0, 14.0, 11.0, 14.0, 14.0, 18.0, 24.0, 25.0, 25.0, 28.0, 24.0, 37.0, 43.0, 44.0, 43.0, 50.0, 52.0, 52.0, 37.0, 47.0, 54.0, 41.0, 29.0, 37.0, 34.0, 32.0, 22.0, 20.0, 16.0, 21.0, 13.0, 11.0, 9.0, 5.0, 8.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.85218811035156, -50.176151275634766, -48.50011444091797, -46.82408142089844, -45.14804458618164, -43.472007751464844, -41.79597091674805, -40.11993408203125, -38.44390106201172, -36.76786422729492, -35.091827392578125, -33.415794372558594, -31.739757537841797, -30.063720703125, -28.387683868408203, -26.711647033691406, -25.03561019897461, -23.359573364257812, -21.68353843688965, -20.00750160217285, -18.331466674804688, -16.65542984008789, -14.979393005371094, -13.303357124328613, -11.627321243286133, -9.951285362243652, -8.275249481201172, -6.599212646484375, -4.9231767654418945, -3.247140884399414, -1.5711040496826172, 0.10493183135986328, 1.7809677124023438, 3.4570038318634033, 5.133039951324463, 6.809076309204102, 8.485112190246582, 10.161148071289062, 11.83718490600586, 13.51322078704834, 15.18925666809082, 16.865293502807617, 18.54132843017578, 20.217365264892578, 21.893402099609375, 23.56943702697754, 25.245473861694336, 26.9215087890625, 28.597545623779297, 30.273582458496094, 31.949617385864258, 33.62565612792969, 35.30168914794922, 36.977725982666016, 38.65376281738281, 40.32979965209961, 42.005836486816406, 43.6818733215332, 45.35791015625, 47.03394317626953, 48.70998001098633, 50.386016845703125, 52.06205368041992, 53.73809051513672, 55.41412353515625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 4.0, 9.0, 12.0, 11.0, 17.0, 14.0, 19.0, 32.0, 29.0, 34.0, 36.0, 41.0, 27.0, 34.0, 49.0, 62.0, 50.0, 33.0, 38.0, 58.0, 41.0, 38.0, 43.0, 27.0, 27.0, 22.0, 29.0, 18.0, 25.0, 23.0, 17.0, 18.0, 11.0, 13.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.4884033203125, -6.269775390625, -6.0511474609375, -5.83251953125, -5.6138916015625, -5.395263671875, -5.1766357421875, -4.9580078125, -4.7393798828125, -4.520751953125, -4.3021240234375, -4.08349609375, -3.8648681640625, -3.646240234375, -3.4276123046875, -3.208984375, -2.9903564453125, -2.771728515625, -2.5531005859375, -2.33447265625, -2.1158447265625, -1.897216796875, -1.6785888671875, -1.4599609375, -1.2413330078125, -1.022705078125, -0.8040771484375, -0.58544921875, -0.3668212890625, -0.148193359375, 0.0704345703125, 0.2890625, 0.5076904296875, 0.726318359375, 0.9449462890625, 1.16357421875, 1.3822021484375, 1.600830078125, 1.8194580078125, 2.0380859375, 2.2567138671875, 2.475341796875, 2.6939697265625, 2.91259765625, 3.1312255859375, 3.349853515625, 3.5684814453125, 3.787109375, 4.0057373046875, 4.224365234375, 4.4429931640625, 4.66162109375, 4.8802490234375, 5.098876953125, 5.3175048828125, 5.5361328125, 5.7547607421875, 5.973388671875, 6.1920166015625, 6.41064453125, 6.6292724609375, 6.847900390625, 7.0665283203125, 7.28515625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 8.0, 8.0, 15.0, 19.0, 23.0, 42.0, 45.0, 72.0, 99.0, 127.0, 206.0, 309.0, 443.0, 668.0, 921.0, 1546.0, 2302.0, 3663.0, 5739.0, 9362.0, 15206.0, 25161.0, 41386.0, 69276.0, 115801.0, 175645.0, 198594.0, 148383.0, 92592.0, 54966.0, 32884.0, 19912.0, 12187.0, 7472.0, 4652.0, 2998.0, 1995.0, 1281.0, 814.0, 548.0, 366.0, 284.0, 166.0, 121.0, 76.0, 49.0, 47.0, 37.0, 15.0, 11.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.6318359375, -0.61163330078125, -0.5914306640625, -0.57122802734375, -0.551025390625, -0.53082275390625, -0.5106201171875, -0.49041748046875, -0.47021484375, -0.45001220703125, -0.4298095703125, -0.40960693359375, -0.389404296875, -0.36920166015625, -0.3489990234375, -0.32879638671875, -0.30859375, -0.28839111328125, -0.2681884765625, -0.24798583984375, -0.227783203125, -0.20758056640625, -0.1873779296875, -0.16717529296875, -0.14697265625, -0.12677001953125, -0.1065673828125, -0.08636474609375, -0.066162109375, -0.04595947265625, -0.0257568359375, -0.00555419921875, 0.0146484375, 0.03485107421875, 0.0550537109375, 0.07525634765625, 0.095458984375, 0.11566162109375, 0.1358642578125, 0.15606689453125, 0.17626953125, 0.19647216796875, 0.2166748046875, 0.23687744140625, 0.257080078125, 0.27728271484375, 0.2974853515625, 0.31768798828125, 0.337890625, 0.35809326171875, 0.3782958984375, 0.39849853515625, 0.418701171875, 0.43890380859375, 0.4591064453125, 0.47930908203125, 0.49951171875, 0.51971435546875, 0.5399169921875, 0.56011962890625, 0.580322265625, 0.60052490234375, 0.6207275390625, 0.64093017578125, 0.6611328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 15.0, 15.0, 10.0, 19.0, 16.0, 17.0, 17.0, 24.0, 29.0, 31.0, 26.0, 43.0, 32.0, 34.0, 35.0, 44.0, 39.0, 48.0, 1065.0, 43.0, 43.0, 34.0, 43.0, 26.0, 28.0, 46.0, 25.0, 23.0, 18.0, 20.0, 21.0, 10.0, 13.0, 15.0, 8.0, 7.0, 7.0, 13.0, 3.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0546875, -3.9244384765625, -3.794189453125, -3.6639404296875, -3.53369140625, -3.4034423828125, -3.273193359375, -3.1429443359375, -3.0126953125, -2.8824462890625, -2.752197265625, -2.6219482421875, -2.49169921875, -2.3614501953125, -2.231201171875, -2.1009521484375, -1.970703125, -1.8404541015625, -1.710205078125, -1.5799560546875, -1.44970703125, -1.3194580078125, -1.189208984375, -1.0589599609375, -0.9287109375, -0.7984619140625, -0.668212890625, -0.5379638671875, -0.40771484375, -0.2774658203125, -0.147216796875, -0.0169677734375, 0.11328125, 0.2435302734375, 0.373779296875, 0.5040283203125, 0.63427734375, 0.7645263671875, 0.894775390625, 1.0250244140625, 1.1552734375, 1.2855224609375, 1.415771484375, 1.5460205078125, 1.67626953125, 1.8065185546875, 1.936767578125, 2.0670166015625, 2.197265625, 2.3275146484375, 2.457763671875, 2.5880126953125, 2.71826171875, 2.8485107421875, 2.978759765625, 3.1090087890625, 3.2392578125, 3.3695068359375, 3.499755859375, 3.6300048828125, 3.76025390625, 3.8905029296875, 4.020751953125, 4.1510009765625, 4.28125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 8.0, 10.0, 8.0, 11.0, 23.0, 32.0, 66.0, 98.0, 184.0, 283.0, 462.0, 791.0, 1214.0, 2005.0, 3322.0, 5603.0, 9395.0, 15640.0, 26810.0, 44978.0, 74079.0, 114177.0, 157156.0, 1222533.0, 148361.0, 104458.0, 66820.0, 40107.0, 23725.0, 13966.0, 8271.0, 4871.0, 2948.0, 1804.0, 1050.0, 740.0, 442.0, 251.0, 147.0, 107.0, 60.0, 34.0, 27.0, 17.0, 11.0, 13.0, 5.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5015640258789062, -0.4850616455078125, -0.46855926513671875, -0.452056884765625, -0.43555450439453125, -0.4190521240234375, -0.40254974365234375, -0.38604736328125, -0.36954498291015625, -0.3530426025390625, -0.33654022216796875, -0.320037841796875, -0.30353546142578125, -0.2870330810546875, -0.27053070068359375, -0.2540283203125, -0.23752593994140625, -0.2210235595703125, -0.20452117919921875, -0.188018798828125, -0.17151641845703125, -0.1550140380859375, -0.13851165771484375, -0.12200927734375, -0.10550689697265625, -0.0890045166015625, -0.07250213623046875, -0.055999755859375, -0.03949737548828125, -0.0229949951171875, -0.00649261474609375, 0.010009765625, 0.02651214599609375, 0.0430145263671875, 0.05951690673828125, 0.076019287109375, 0.09252166748046875, 0.1090240478515625, 0.12552642822265625, 0.14202880859375, 0.15853118896484375, 0.1750335693359375, 0.19153594970703125, 0.208038330078125, 0.22454071044921875, 0.2410430908203125, 0.25754547119140625, 0.2740478515625, 0.29055023193359375, 0.3070526123046875, 0.32355499267578125, 0.340057373046875, 0.35655975341796875, 0.3730621337890625, 0.38956451416015625, 0.40606689453125, 0.42256927490234375, 0.4390716552734375, 0.45557403564453125, 0.472076416015625, 0.48857879638671875, 0.5050811767578125, 0.5215835571289062, 0.5380859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 8.0, 14.0, 17.0, 15.0, 14.0, 29.0, 27.0, 33.0, 38.0, 45.0, 53.0, 49.0, 61.0, 75.0, 65.0, 55.0, 71.0, 47.0, 35.0, 40.0, 29.0, 23.0, 24.0, 24.0, 15.0, 12.0, 14.0, 12.0, 7.0, 8.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00457000732421875, -0.004423201084136963, -0.004276394844055176, -0.004129588603973389, -0.0039827823638916016, -0.0038359761238098145, -0.0036891698837280273, -0.0035423636436462402, -0.003395557403564453, -0.003248751163482666, -0.003101944923400879, -0.002955138683319092, -0.0028083324432373047, -0.0026615262031555176, -0.0025147199630737305, -0.0023679137229919434, -0.0022211074829101562, -0.002074301242828369, -0.001927495002746582, -0.001780688762664795, -0.0016338825225830078, -0.0014870762825012207, -0.0013402700424194336, -0.0011934638023376465, -0.0010466575622558594, -0.0008998513221740723, -0.0007530450820922852, -0.000606238842010498, -0.00045943260192871094, -0.00031262636184692383, -0.00016582012176513672, -1.901388168334961e-05, 0.0001277923583984375, 0.0002745985984802246, 0.0004214048385620117, 0.0005682110786437988, 0.0007150173187255859, 0.000861823558807373, 0.0010086297988891602, 0.0011554360389709473, 0.0013022422790527344, 0.0014490485191345215, 0.0015958547592163086, 0.0017426609992980957, 0.0018894672393798828, 0.00203627347946167, 0.002183079719543457, 0.002329885959625244, 0.0024766921997070312, 0.0026234984397888184, 0.0027703046798706055, 0.0029171109199523926, 0.0030639171600341797, 0.003210723400115967, 0.003357529640197754, 0.003504335880279541, 0.003651142120361328, 0.0037979483604431152, 0.003944754600524902, 0.0040915608406066895, 0.0042383670806884766, 0.004385173320770264, 0.004531979560852051, 0.004678785800933838, 0.004825592041015625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 3.0, 13.0, 7.0, 17.0, 11.0, 26.0, 24.0, 26.0, 35.0, 44.0, 77.0, 87.0, 119.0, 134.0, 179.0, 338.0, 558.0, 1332.0, 552272.0, 490196.0, 1271.0, 571.0, 325.0, 227.0, 156.0, 114.0, 94.0, 72.0, 34.0, 50.0, 26.0, 27.0, 17.0, 12.0, 13.0, 3.0, 6.0, 9.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.08001708984375, -0.0775918960571289, -0.07516670227050781, -0.07274150848388672, -0.07031631469726562, -0.06789112091064453, -0.06546592712402344, -0.06304073333740234, -0.06061553955078125, -0.058190345764160156, -0.05576515197753906, -0.05333995819091797, -0.050914764404296875, -0.04848957061767578, -0.04606437683105469, -0.043639183044433594, -0.0412139892578125, -0.038788795471191406, -0.03636360168457031, -0.03393840789794922, -0.031513214111328125, -0.02908802032470703, -0.026662826538085938, -0.024237632751464844, -0.02181243896484375, -0.019387245178222656, -0.016962051391601562, -0.014536857604980469, -0.012111663818359375, -0.009686470031738281, -0.0072612762451171875, -0.004836082458496094, -0.002410888671875, 1.430511474609375e-05, 0.0024394989013671875, 0.004864692687988281, 0.007289886474609375, 0.009715080261230469, 0.012140274047851562, 0.014565467834472656, 0.01699066162109375, 0.019415855407714844, 0.021841049194335938, 0.02426624298095703, 0.026691436767578125, 0.02911663055419922, 0.03154182434082031, 0.033967018127441406, 0.0363922119140625, 0.038817405700683594, 0.04124259948730469, 0.04366779327392578, 0.046092987060546875, 0.04851818084716797, 0.05094337463378906, 0.053368568420410156, 0.05579376220703125, 0.058218955993652344, 0.06064414978027344, 0.06306934356689453, 0.06549453735351562, 0.06791973114013672, 0.07034492492675781, 0.0727701187133789, 0.0751953125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 990.0, 23.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04008892551064491, -0.03816116228699684, -0.03623339906334877, -0.0343056358397007, -0.03237787261605263, -0.030450109392404556, -0.028522348031401634, -0.026594584807753563, -0.02466682158410549, -0.02273905836045742, -0.02081129513680935, -0.018883533775806427, -0.016955770552158356, -0.01502800639718771, -0.013100244104862213, -0.011172480881214142, -0.00924471765756607, -0.007316954433917999, -0.005389191675931215, -0.0034614289179444313, -0.00153366569429636, 0.0003940975293517113, 0.002321859821677208, 0.004249623045325279, 0.0061773862689733505, 0.008105149492621422, 0.010032912716269493, 0.01196067500859499, 0.013888438232243061, 0.015816200524568558, 0.01774396374821663, 0.0196717269718647, 0.02159949392080307, 0.02352725714445114, 0.025455020368099213, 0.027382783591747284, 0.029310546815395355, 0.031238310039043427, 0.0331660732626915, 0.03509383648633957, 0.03702159970998764, 0.03894936293363571, 0.04087712615728378, 0.042804889380931854, 0.044732652604579926, 0.046660415828228, 0.04858817905187607, 0.05051594227552414, 0.05244370177388191, 0.054371464997529984, 0.056299228221178055, 0.058226991444826126, 0.0601547546684742, 0.06208251789212227, 0.06401027739048004, 0.06593804061412811, 0.06786580383777618, 0.06979356706142426, 0.07172133028507233, 0.0736490935087204, 0.07557685673236847, 0.07750461995601654, 0.07943238317966461, 0.08136014640331268, 0.08328790962696075]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 18.0, 15.0, 37.0, 39.0, 45.0, 78.0, 82.0, 83.0, 89.0, 95.0, 87.0, 92.0, 84.0, 36.0, 38.0, 30.0, 16.0, 16.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005775809288024902, -0.00559038482606411, -0.005404960364103317, -0.005219535902142525, -0.005034111440181732, -0.00484868697822094, -0.004663262516260147, -0.0044778380542993546, -0.004292413592338562, -0.0041069891303777695, -0.003921564668416977, -0.0037361402064561844, -0.003550715744495392, -0.0033652912825345993, -0.0031798668205738068, -0.0029944423586130142, -0.0028090178966522217, -0.002623593434691429, -0.0024381689727306366, -0.002252744510769844, -0.0020673200488090515, -0.001881895586848259, -0.0016964711248874664, -0.0015110466629266739, -0.0013256222009658813, -0.0011401977390050888, -0.0009547732770442963, -0.0007693488150835037, -0.0005839243531227112, -0.00039849989116191864, -0.0002130754292011261, -2.7650967240333557e-05, 0.00015777349472045898, 0.0003431979566812515, 0.0005286224186420441, 0.0007140468806028366, 0.0008994713425636292, 0.0010848958045244217, 0.0012703202664852142, 0.0014557447284460068, 0.0016411691904067993, 0.0018265936523675919, 0.0020120181143283844, 0.002197442576289177, 0.0023828670382499695, 0.002568291500210762, 0.0027537159621715546, 0.002939140424132347, 0.0031245648860931396, 0.003309989348053932, 0.0034954138100147247, 0.0036808382719755173, 0.00386626273393631, 0.004051687195897102, 0.004237111657857895, 0.0044225361198186874, 0.00460796058177948, 0.0047933850437402725, 0.004978809505701065, 0.005164233967661858, 0.00534965842962265, 0.005535082891583443, 0.005720507353544235, 0.005905931815505028, 0.00609135627746582]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 4.0, 9.0, 12.0, 11.0, 17.0, 14.0, 19.0, 32.0, 29.0, 34.0, 36.0, 41.0, 27.0, 34.0, 49.0, 62.0, 50.0, 33.0, 38.0, 58.0, 41.0, 39.0, 42.0, 27.0, 27.0, 22.0, 29.0, 18.0, 25.0, 23.0, 17.0, 18.0, 11.0, 13.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.4884033203125, -6.269775390625, -6.0511474609375, -5.83251953125, -5.6138916015625, -5.395263671875, -5.1766357421875, -4.9580078125, -4.7393798828125, -4.520751953125, -4.3021240234375, -4.08349609375, -3.8648681640625, -3.646240234375, -3.4276123046875, -3.208984375, -2.9903564453125, -2.771728515625, -2.5531005859375, -2.33447265625, -2.1158447265625, -1.897216796875, -1.6785888671875, -1.4599609375, -1.2413330078125, -1.022705078125, -0.8040771484375, -0.58544921875, -0.3668212890625, -0.148193359375, 0.0704345703125, 0.2890625, 0.5076904296875, 0.726318359375, 0.9449462890625, 1.16357421875, 1.3822021484375, 1.600830078125, 1.8194580078125, 2.0380859375, 2.2567138671875, 2.475341796875, 2.6939697265625, 2.91259765625, 3.1312255859375, 3.349853515625, 3.5684814453125, 3.787109375, 4.0057373046875, 4.224365234375, 4.4429931640625, 4.66162109375, 4.8802490234375, 5.098876953125, 5.3175048828125, 5.5361328125, 5.7547607421875, 5.973388671875, 6.1920166015625, 6.41064453125, 6.6292724609375, 6.847900390625, 7.0665283203125, 7.28515625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 14.0, 11.0, 16.0, 21.0, 34.0, 47.0, 58.0, 80.0, 98.0, 159.0, 250.0, 378.0, 615.0, 931.0, 1658.0, 3617.0, 10492.0, 43585.0, 302098.0, 574311.0, 82397.0, 17129.0, 5191.0, 2219.0, 1142.0, 624.0, 403.0, 267.0, 194.0, 130.0, 112.0, 74.0, 54.0, 47.0, 24.0, 19.0, 15.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.857177734375, -11.46435546875, -11.071533203125, -10.6787109375, -10.285888671875, -9.89306640625, -9.500244140625, -9.107421875, -8.714599609375, -8.32177734375, -7.928955078125, -7.5361328125, -7.143310546875, -6.75048828125, -6.357666015625, -5.96484375, -5.572021484375, -5.17919921875, -4.786376953125, -4.3935546875, -4.000732421875, -3.60791015625, -3.215087890625, -2.822265625, -2.429443359375, -2.03662109375, -1.643798828125, -1.2509765625, -0.858154296875, -0.46533203125, -0.072509765625, 0.3203125, 0.713134765625, 1.10595703125, 1.498779296875, 1.8916015625, 2.284423828125, 2.67724609375, 3.070068359375, 3.462890625, 3.855712890625, 4.24853515625, 4.641357421875, 5.0341796875, 5.427001953125, 5.81982421875, 6.212646484375, 6.60546875, 6.998291015625, 7.39111328125, 7.783935546875, 8.1767578125, 8.569580078125, 8.96240234375, 9.355224609375, 9.748046875, 10.140869140625, 10.53369140625, 10.926513671875, 11.3193359375, 11.712158203125, 12.10498046875, 12.497802734375, 12.890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 11.0, 9.0, 6.0, 11.0, 13.0, 19.0, 28.0, 21.0, 26.0, 41.0, 48.0, 68.0, 66.0, 82.0, 246.0, 1542.0, 286.0, 123.0, 81.0, 61.0, 45.0, 38.0, 33.0, 35.0, 18.0, 20.0, 13.0, 10.0, 7.0, 2.0, 11.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-23.40625, -22.708740234375, -22.01123046875, -21.313720703125, -20.6162109375, -19.918701171875, -19.22119140625, -18.523681640625, -17.826171875, -17.128662109375, -16.43115234375, -15.733642578125, -15.0361328125, -14.338623046875, -13.64111328125, -12.943603515625, -12.24609375, -11.548583984375, -10.85107421875, -10.153564453125, -9.4560546875, -8.758544921875, -8.06103515625, -7.363525390625, -6.666015625, -5.968505859375, -5.27099609375, -4.573486328125, -3.8759765625, -3.178466796875, -2.48095703125, -1.783447265625, -1.0859375, -0.388427734375, 0.30908203125, 1.006591796875, 1.7041015625, 2.401611328125, 3.09912109375, 3.796630859375, 4.494140625, 5.191650390625, 5.88916015625, 6.586669921875, 7.2841796875, 7.981689453125, 8.67919921875, 9.376708984375, 10.07421875, 10.771728515625, 11.46923828125, 12.166748046875, 12.8642578125, 13.561767578125, 14.25927734375, 14.956787109375, 15.654296875, 16.351806640625, 17.04931640625, 17.746826171875, 18.4443359375, 19.141845703125, 19.83935546875, 20.536865234375, 21.234375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 7.0, 5.0, 3.0, 7.0, 6.0, 16.0, 21.0, 23.0, 36.0, 65.0, 74.0, 129.0, 251.0, 475.0, 1385.0, 151575.0, 2988473.0, 1837.0, 595.0, 264.0, 161.0, 91.0, 49.0, 51.0, 33.0, 19.0, 14.0, 7.0, 10.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.90625, -59.85009765625, -57.7939453125, -55.73779296875, -53.681640625, -51.62548828125, -49.5693359375, -47.51318359375, -45.45703125, -43.40087890625, -41.3447265625, -39.28857421875, -37.232421875, -35.17626953125, -33.1201171875, -31.06396484375, -29.0078125, -26.95166015625, -24.8955078125, -22.83935546875, -20.783203125, -18.72705078125, -16.6708984375, -14.61474609375, -12.55859375, -10.50244140625, -8.4462890625, -6.39013671875, -4.333984375, -2.27783203125, -0.2216796875, 1.83447265625, 3.890625, 5.94677734375, 8.0029296875, 10.05908203125, 12.115234375, 14.17138671875, 16.2275390625, 18.28369140625, 20.33984375, 22.39599609375, 24.4521484375, 26.50830078125, 28.564453125, 30.62060546875, 32.6767578125, 34.73291015625, 36.7890625, 38.84521484375, 40.9013671875, 42.95751953125, 45.013671875, 47.06982421875, 49.1259765625, 51.18212890625, 53.23828125, 55.29443359375, 57.3505859375, 59.40673828125, 61.462890625, 63.51904296875, 65.5751953125, 67.63134765625, 69.6875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 34.0, 260.0, 603.0, 108.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.34366607666016, -63.65916442871094, -59.97466278076172, -56.290164947509766, -52.60566329956055, -48.92116165161133, -45.236663818359375, -41.552162170410156, -37.86766052246094, -34.18315887451172, -30.498659133911133, -26.814159393310547, -23.129657745361328, -19.44515609741211, -15.760656356811523, -12.076156616210938, -8.391654968261719, -4.707154273986816, -1.022653579711914, 2.6618471145629883, 6.346347808837891, 10.03084945678711, 13.715349197387695, 17.39984893798828, 21.0843505859375, 24.76885223388672, 28.453351974487305, 32.13785171508789, 35.82235336303711, 39.50685501098633, 43.19135284423828, 46.8758544921875, 50.56036376953125, 54.24486541748047, 57.92936706542969, 61.61386489868164, 65.29837036132812, 68.98286437988281, 72.66736602783203, 76.35186767578125, 80.03636932373047, 83.72087097167969, 87.4053726196289, 91.08987426757812, 94.77436828613281, 98.45887756347656, 102.14337158203125, 105.82787322998047, 109.51237487792969, 113.1968765258789, 116.88137817382812, 120.56587982177734, 124.25038146972656, 127.93487548828125, 131.619384765625, 135.3038787841797, 138.98837280273438, 142.67286682128906, 146.3573760986328, 150.0418701171875, 153.72637939453125, 157.41087341308594, 161.0953826904297, 164.77987670898438, 168.46438598632812]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 9.0, 3.0, 6.0, 11.0, 11.0, 17.0, 16.0, 26.0, 19.0, 27.0, 25.0, 25.0, 37.0, 37.0, 39.0, 38.0, 49.0, 46.0, 36.0, 41.0, 37.0, 47.0, 35.0, 50.0, 37.0, 33.0, 43.0, 29.0, 28.0, 20.0, 22.0, 12.0, 18.0, 10.0, 12.0, 12.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.211280822753906, -42.739295959472656, -41.267311096191406, -39.79533004760742, -38.32334518432617, -36.85136032104492, -35.37937545776367, -33.90739440917969, -32.43540954589844, -30.963424682617188, -29.49144172668457, -28.01945686340332, -26.547473907470703, -25.075489044189453, -23.603504180908203, -22.131521224975586, -20.659536361694336, -19.187551498413086, -17.71556854248047, -16.24358367919922, -14.771600723266602, -13.299615859985352, -11.827631950378418, -10.355648040771484, -8.88366413116455, -7.411680221557617, -5.939696311950684, -4.467711925506592, -2.995728015899658, -1.5237441062927246, -0.05175971984863281, 1.4202241897583008, 2.8922080993652344, 4.364192008972168, 5.836175918579102, 7.308160305023193, 8.780143737792969, 10.252128601074219, 11.724112510681152, 13.196096420288086, 14.66808032989502, 16.140064239501953, 17.612049102783203, 19.08403205871582, 20.55601692199707, 22.027999877929688, 23.499984741210938, 24.971969604492188, 26.443952560424805, 27.915937423706055, 29.387920379638672, 30.859905242919922, 32.33189010620117, 33.803871154785156, 35.275856018066406, 36.747840881347656, 38.219825744628906, 39.691810607910156, 41.163795471191406, 42.63577651977539, 44.10776138305664, 45.57974624633789, 47.05173110961914, 48.523712158203125, 49.995697021484375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 13.0, 14.0, 16.0, 22.0, 20.0, 27.0, 30.0, 24.0, 40.0, 36.0, 40.0, 44.0, 62.0, 57.0, 51.0, 45.0, 47.0, 31.0, 36.0, 35.0, 38.0, 36.0, 27.0, 33.0, 13.0, 26.0, 17.0, 17.0, 14.0, 15.0, 12.0, 5.0, 6.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.485595703125, -8.22119140625, -7.956787109375, -7.6923828125, -7.427978515625, -7.16357421875, -6.899169921875, -6.634765625, -6.370361328125, -6.10595703125, -5.841552734375, -5.5771484375, -5.312744140625, -5.04833984375, -4.783935546875, -4.51953125, -4.255126953125, -3.99072265625, -3.726318359375, -3.4619140625, -3.197509765625, -2.93310546875, -2.668701171875, -2.404296875, -2.139892578125, -1.87548828125, -1.611083984375, -1.3466796875, -1.082275390625, -0.81787109375, -0.553466796875, -0.2890625, -0.024658203125, 0.23974609375, 0.504150390625, 0.7685546875, 1.032958984375, 1.29736328125, 1.561767578125, 1.826171875, 2.090576171875, 2.35498046875, 2.619384765625, 2.8837890625, 3.148193359375, 3.41259765625, 3.677001953125, 3.94140625, 4.205810546875, 4.47021484375, 4.734619140625, 4.9990234375, 5.263427734375, 5.52783203125, 5.792236328125, 6.056640625, 6.321044921875, 6.58544921875, 6.849853515625, 7.1142578125, 7.378662109375, 7.64306640625, 7.907470703125, 8.171875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 10.0, 8.0, 8.0, 11.0, 15.0, 17.0, 35.0, 49.0, 58.0, 78.0, 72.0, 117.0, 149.0, 212.0, 257.0, 379.0, 628.0, 1230.0, 4251.0, 46035.0, 3483162.0, 641235.0, 11403.0, 2157.0, 840.0, 484.0, 328.0, 270.0, 181.0, 128.0, 107.0, 79.0, 70.0, 56.0, 43.0, 39.0, 17.0, 15.0, 6.0, 10.0, 7.0, 5.0, 7.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-48.625, -47.1845703125, -45.744140625, -44.3037109375, -42.86328125, -41.4228515625, -39.982421875, -38.5419921875, -37.1015625, -35.6611328125, -34.220703125, -32.7802734375, -31.33984375, -29.8994140625, -28.458984375, -27.0185546875, -25.578125, -24.1376953125, -22.697265625, -21.2568359375, -19.81640625, -18.3759765625, -16.935546875, -15.4951171875, -14.0546875, -12.6142578125, -11.173828125, -9.7333984375, -8.29296875, -6.8525390625, -5.412109375, -3.9716796875, -2.53125, -1.0908203125, 0.349609375, 1.7900390625, 3.23046875, 4.6708984375, 6.111328125, 7.5517578125, 8.9921875, 10.4326171875, 11.873046875, 13.3134765625, 14.75390625, 16.1943359375, 17.634765625, 19.0751953125, 20.515625, 21.9560546875, 23.396484375, 24.8369140625, 26.27734375, 27.7177734375, 29.158203125, 30.5986328125, 32.0390625, 33.4794921875, 34.919921875, 36.3603515625, 37.80078125, 39.2412109375, 40.681640625, 42.1220703125, 43.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 15.0, 36.0, 62.0, 115.0, 181.0, 352.0, 622.0, 889.0, 767.0, 445.0, 225.0, 121.0, 77.0, 49.0, 38.0, 15.0, 9.0, 7.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.921875, -18.21484375, -17.5078125, -16.80078125, -16.09375, -15.38671875, -14.6796875, -13.97265625, -13.265625, -12.55859375, -11.8515625, -11.14453125, -10.4375, -9.73046875, -9.0234375, -8.31640625, -7.609375, -6.90234375, -6.1953125, -5.48828125, -4.78125, -4.07421875, -3.3671875, -2.66015625, -1.953125, -1.24609375, -0.5390625, 0.16796875, 0.875, 1.58203125, 2.2890625, 2.99609375, 3.703125, 4.41015625, 5.1171875, 5.82421875, 6.53125, 7.23828125, 7.9453125, 8.65234375, 9.359375, 10.06640625, 10.7734375, 11.48046875, 12.1875, 12.89453125, 13.6015625, 14.30859375, 15.015625, 15.72265625, 16.4296875, 17.13671875, 17.84375, 18.55078125, 19.2578125, 19.96484375, 20.671875, 21.37890625, 22.0859375, 22.79296875, 23.5, 24.20703125, 24.9140625, 25.62109375, 26.328125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 2.0, 8.0, 4.0, 15.0, 29.0, 45.0, 116.0, 334.0, 1020.0, 4402.0, 44350.0, 3414229.0, 709601.0, 16507.0, 2457.0, 727.0, 243.0, 96.0, 42.0, 22.0, 11.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.703125, -27.591552734375, -26.47998046875, -25.368408203125, -24.2568359375, -23.145263671875, -22.03369140625, -20.922119140625, -19.810546875, -18.698974609375, -17.58740234375, -16.475830078125, -15.3642578125, -14.252685546875, -13.14111328125, -12.029541015625, -10.91796875, -9.806396484375, -8.69482421875, -7.583251953125, -6.4716796875, -5.360107421875, -4.24853515625, -3.136962890625, -2.025390625, -0.913818359375, 0.19775390625, 1.309326171875, 2.4208984375, 3.532470703125, 4.64404296875, 5.755615234375, 6.8671875, 7.978759765625, 9.09033203125, 10.201904296875, 11.3134765625, 12.425048828125, 13.53662109375, 14.648193359375, 15.759765625, 16.871337890625, 17.98291015625, 19.094482421875, 20.2060546875, 21.317626953125, 22.42919921875, 23.540771484375, 24.65234375, 25.763916015625, 26.87548828125, 27.987060546875, 29.0986328125, 30.210205078125, 31.32177734375, 32.433349609375, 33.544921875, 34.656494140625, 35.76806640625, 36.879638671875, 37.9912109375, 39.102783203125, 40.21435546875, 41.325927734375, 42.4375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 18.0, 22.0, 42.0, 78.0, 125.0, 137.0, 155.0, 156.0, 101.0, 64.0, 44.0, 26.0, 14.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.293460845947266, -50.813377380371094, -46.333290100097656, -41.853206634521484, -37.37312316894531, -32.89303970336914, -28.412954330444336, -23.93286895751953, -19.45278549194336, -14.972701072692871, -10.492616653442383, -6.0125322341918945, -1.5324478149414062, 2.9476356506347656, 7.42772102355957, 11.907806396484375, 16.387889862060547, 20.86797332763672, 25.348058700561523, 29.828144073486328, 34.3082275390625, 38.78831100463867, 43.268394470214844, 47.74848175048828, 52.22856521606445, 56.708648681640625, 61.18873596191406, 65.66881561279297, 70.1489028930664, 74.62898254394531, 79.10906982421875, 83.58915710449219, 88.06924438476562, 92.54933166503906, 97.02941131591797, 101.5094985961914, 105.98957824707031, 110.46966552734375, 114.94975280761719, 119.42984008789062, 123.90991973876953, 128.38999938964844, 132.87008666992188, 137.3501739501953, 141.83026123046875, 146.31033325195312, 150.79042053222656, 155.2705078125, 159.75059509277344, 164.23068237304688, 168.7107696533203, 173.1908416748047, 177.67092895507812, 182.15101623535156, 186.631103515625, 191.11119079589844, 195.59127807617188, 200.0713653564453, 204.55145263671875, 209.03152465820312, 213.51161193847656, 217.99169921875, 222.47178649902344, 226.95187377929688, 231.43194580078125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 15.0, 10.0, 15.0, 25.0, 24.0, 36.0, 42.0, 41.0, 58.0, 68.0, 47.0, 56.0, 65.0, 61.0, 67.0, 58.0, 54.0, 42.0, 48.0, 36.0, 28.0, 18.0, 29.0, 14.0, 18.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.00747680664062, -70.64595794677734, -68.2844467163086, -65.92292785644531, -63.56141662597656, -61.19989776611328, -58.838382720947266, -56.47686767578125, -54.115352630615234, -51.75383758544922, -49.3923225402832, -47.03080749511719, -44.669288635253906, -42.307777404785156, -39.946258544921875, -37.58474349975586, -35.223228454589844, -32.86171340942383, -30.500198364257812, -28.138681411743164, -25.77716636657715, -23.415651321411133, -21.054134368896484, -18.69261932373047, -16.331104278564453, -13.969589233398438, -11.608073234558105, -9.246557235717773, -6.885042190551758, -4.523527145385742, -2.16201114654541, 0.19950485229492188, 2.5610198974609375, 4.922535419464111, 7.284050941467285, 9.645566940307617, 12.007081985473633, 14.368597030639648, 16.730113983154297, 19.091629028320312, 21.453144073486328, 23.814659118652344, 26.17617416381836, 28.537691116333008, 30.899206161499023, 33.260719299316406, 35.62223815917969, 37.9837532043457, 40.34526824951172, 42.706783294677734, 45.06829833984375, 47.429813385009766, 49.79132843017578, 52.15284729003906, 54.51436233520508, 56.875877380371094, 59.23739242553711, 61.598907470703125, 63.96042251586914, 66.32193756103516, 68.68345642089844, 71.04496765136719, 73.40648651123047, 75.76800537109375, 78.1295166015625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 12.0, 17.0, 25.0, 22.0, 28.0, 42.0, 41.0, 56.0, 58.0, 82.0, 54.0, 60.0, 71.0, 63.0, 62.0, 55.0, 47.0, 38.0, 33.0, 29.0, 26.0, 22.0, 18.0, 15.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.6875, -112.5146484375, -108.341796875, -104.1689453125, -99.99609375, -95.8232421875, -91.650390625, -87.4775390625, -83.3046875, -79.1318359375, -74.958984375, -70.7861328125, -66.61328125, -62.4404296875, -58.267578125, -54.0947265625, -49.921875, -45.7490234375, -41.576171875, -37.4033203125, -33.23046875, -29.0576171875, -24.884765625, -20.7119140625, -16.5390625, -12.3662109375, -8.193359375, -4.0205078125, 0.15234375, 4.3251953125, 8.498046875, 12.6708984375, 16.84375, 21.0166015625, 25.189453125, 29.3623046875, 33.53515625, 37.7080078125, 41.880859375, 46.0537109375, 50.2265625, 54.3994140625, 58.572265625, 62.7451171875, 66.91796875, 71.0908203125, 75.263671875, 79.4365234375, 83.609375, 87.7822265625, 91.955078125, 96.1279296875, 100.30078125, 104.4736328125, 108.646484375, 112.8193359375, 116.9921875, 121.1650390625, 125.337890625, 129.5107421875, 133.68359375, 137.8564453125, 142.029296875, 146.2021484375, 150.375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 18.0, 21.0, 26.0, 30.0, 50.0, 102.0, 103.0, 192.0, 303.0, 543.0, 906.0, 1586.0, 2777.0, 4496.0, 7960.0, 13928.0, 24163.0, 42263.0, 73599.0, 124959.0, 187678.0, 203549.0, 147532.0, 90031.0, 52017.0, 29535.0, 16871.0, 9620.0, 5603.0, 3252.0, 2014.0, 1123.0, 635.0, 383.0, 233.0, 152.0, 81.0, 54.0, 47.0, 33.0, 20.0, 12.0, 7.0, 6.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.21875, -8.94091796875, -8.6630859375, -8.38525390625, -8.107421875, -7.82958984375, -7.5517578125, -7.27392578125, -6.99609375, -6.71826171875, -6.4404296875, -6.16259765625, -5.884765625, -5.60693359375, -5.3291015625, -5.05126953125, -4.7734375, -4.49560546875, -4.2177734375, -3.93994140625, -3.662109375, -3.38427734375, -3.1064453125, -2.82861328125, -2.55078125, -2.27294921875, -1.9951171875, -1.71728515625, -1.439453125, -1.16162109375, -0.8837890625, -0.60595703125, -0.328125, -0.05029296875, 0.2275390625, 0.50537109375, 0.783203125, 1.06103515625, 1.3388671875, 1.61669921875, 1.89453125, 2.17236328125, 2.4501953125, 2.72802734375, 3.005859375, 3.28369140625, 3.5615234375, 3.83935546875, 4.1171875, 4.39501953125, 4.6728515625, 4.95068359375, 5.228515625, 5.50634765625, 5.7841796875, 6.06201171875, 6.33984375, 6.61767578125, 6.8955078125, 7.17333984375, 7.451171875, 7.72900390625, 8.0068359375, 8.28466796875, 8.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 10.0, 16.0, 11.0, 11.0, 21.0, 21.0, 29.0, 22.0, 22.0, 31.0, 44.0, 46.0, 31.0, 43.0, 44.0, 38.0, 42.0, 1074.0, 51.0, 46.0, 44.0, 33.0, 28.0, 41.0, 30.0, 29.0, 29.0, 23.0, 22.0, 15.0, 15.0, 9.0, 12.0, 9.0, 2.0, 3.0, 10.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.3125, -60.43896484375, -58.5654296875, -56.69189453125, -54.818359375, -52.94482421875, -51.0712890625, -49.19775390625, -47.32421875, -45.45068359375, -43.5771484375, -41.70361328125, -39.830078125, -37.95654296875, -36.0830078125, -34.20947265625, -32.3359375, -30.46240234375, -28.5888671875, -26.71533203125, -24.841796875, -22.96826171875, -21.0947265625, -19.22119140625, -17.34765625, -15.47412109375, -13.6005859375, -11.72705078125, -9.853515625, -7.97998046875, -6.1064453125, -4.23291015625, -2.359375, -0.48583984375, 1.3876953125, 3.26123046875, 5.134765625, 7.00830078125, 8.8818359375, 10.75537109375, 12.62890625, 14.50244140625, 16.3759765625, 18.24951171875, 20.123046875, 21.99658203125, 23.8701171875, 25.74365234375, 27.6171875, 29.49072265625, 31.3642578125, 33.23779296875, 35.111328125, 36.98486328125, 38.8583984375, 40.73193359375, 42.60546875, 44.47900390625, 46.3525390625, 48.22607421875, 50.099609375, 51.97314453125, 53.8466796875, 55.72021484375, 57.59375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 28.0, 24.0, 48.0, 71.0, 105.0, 132.0, 222.0, 347.0, 518.0, 734.0, 1160.0, 1816.0, 2661.0, 4042.0, 6166.0, 9444.0, 14784.0, 23460.0, 37372.0, 58738.0, 91229.0, 132533.0, 1210425.0, 160812.0, 119807.0, 80326.0, 51087.0, 32020.0, 20525.0, 12855.0, 8129.0, 5306.0, 3442.0, 2335.0, 1463.0, 961.0, 650.0, 437.0, 308.0, 177.0, 140.0, 102.0, 56.0, 41.0, 21.0, 26.0, 16.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.7109375, -6.49334716796875, -6.2757568359375, -6.05816650390625, -5.840576171875, -5.62298583984375, -5.4053955078125, -5.18780517578125, -4.97021484375, -4.75262451171875, -4.5350341796875, -4.31744384765625, -4.099853515625, -3.88226318359375, -3.6646728515625, -3.44708251953125, -3.2294921875, -3.01190185546875, -2.7943115234375, -2.57672119140625, -2.359130859375, -2.14154052734375, -1.9239501953125, -1.70635986328125, -1.48876953125, -1.27117919921875, -1.0535888671875, -0.83599853515625, -0.618408203125, -0.40081787109375, -0.1832275390625, 0.03436279296875, 0.251953125, 0.46954345703125, 0.6871337890625, 0.90472412109375, 1.122314453125, 1.33990478515625, 1.5574951171875, 1.77508544921875, 1.99267578125, 2.21026611328125, 2.4278564453125, 2.64544677734375, 2.863037109375, 3.08062744140625, 3.2982177734375, 3.51580810546875, 3.7333984375, 3.95098876953125, 4.1685791015625, 4.38616943359375, 4.603759765625, 4.82135009765625, 5.0389404296875, 5.25653076171875, 5.47412109375, 5.69171142578125, 5.9093017578125, 6.12689208984375, 6.344482421875, 6.56207275390625, 6.7796630859375, 6.99725341796875, 7.21484375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 2.0, 10.0, 11.0, 6.0, 11.0, 12.0, 10.0, 12.0, 18.0, 22.0, 32.0, 35.0, 58.0, 54.0, 59.0, 88.0, 69.0, 69.0, 70.0, 76.0, 51.0, 47.0, 31.0, 25.0, 16.0, 10.0, 12.0, 11.0, 7.0, 6.0, 7.0, 5.0, 9.0, 4.0, 2.0, 10.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.07086181640625, -0.0685739517211914, -0.06628608703613281, -0.06399822235107422, -0.061710357666015625, -0.05942249298095703, -0.05713462829589844, -0.054846763610839844, -0.05255889892578125, -0.050271034240722656, -0.04798316955566406, -0.04569530487060547, -0.043407440185546875, -0.04111957550048828, -0.03883171081542969, -0.036543846130371094, -0.0342559814453125, -0.031968116760253906, -0.029680252075195312, -0.02739238739013672, -0.025104522705078125, -0.02281665802001953, -0.020528793334960938, -0.018240928649902344, -0.01595306396484375, -0.013665199279785156, -0.011377334594726562, -0.009089469909667969, -0.006801605224609375, -0.004513740539550781, -0.0022258758544921875, 6.198883056640625e-05, 0.002349853515625, 0.004637718200683594, 0.0069255828857421875, 0.009213447570800781, 0.011501312255859375, 0.013789176940917969, 0.016077041625976562, 0.018364906311035156, 0.02065277099609375, 0.022940635681152344, 0.025228500366210938, 0.02751636505126953, 0.029804229736328125, 0.03209209442138672, 0.03437995910644531, 0.036667823791503906, 0.0389556884765625, 0.041243553161621094, 0.04353141784667969, 0.04581928253173828, 0.048107147216796875, 0.05039501190185547, 0.05268287658691406, 0.054970741271972656, 0.05725860595703125, 0.059546470642089844, 0.06183433532714844, 0.06412220001220703, 0.06641006469726562, 0.06869792938232422, 0.07098579406738281, 0.0732736587524414, 0.0755615234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 7.0, 10.0, 12.0, 20.0, 22.0, 25.0, 35.0, 55.0, 54.0, 74.0, 87.0, 143.0, 161.0, 236.0, 338.0, 641.0, 1161.0, 2505.0, 6020.0, 16795.0, 65098.0, 401296.0, 449366.0, 73771.0, 18258.0, 6379.0, 2634.0, 1233.0, 660.0, 377.0, 289.0, 207.0, 145.0, 82.0, 78.0, 65.0, 50.0, 34.0, 25.0, 19.0, 19.0, 11.0, 10.0, 4.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.47412109375, -0.45977020263671875, -0.4454193115234375, -0.43106842041015625, -0.416717529296875, -0.40236663818359375, -0.3880157470703125, -0.37366485595703125, -0.35931396484375, -0.34496307373046875, -0.3306121826171875, -0.31626129150390625, -0.301910400390625, -0.28755950927734375, -0.2732086181640625, -0.25885772705078125, -0.2445068359375, -0.23015594482421875, -0.2158050537109375, -0.20145416259765625, -0.187103271484375, -0.17275238037109375, -0.1584014892578125, -0.14405059814453125, -0.12969970703125, -0.11534881591796875, -0.1009979248046875, -0.08664703369140625, -0.072296142578125, -0.05794525146484375, -0.0435943603515625, -0.02924346923828125, -0.014892578125, -0.00054168701171875, 0.0138092041015625, 0.02816009521484375, 0.042510986328125, 0.05686187744140625, 0.0712127685546875, 0.08556365966796875, 0.09991455078125, 0.11426544189453125, 0.1286163330078125, 0.14296722412109375, 0.157318115234375, 0.17166900634765625, 0.1860198974609375, 0.20037078857421875, 0.2147216796875, 0.22907257080078125, 0.2434234619140625, 0.25777435302734375, 0.272125244140625, 0.28647613525390625, 0.3008270263671875, 0.31517791748046875, 0.32952880859375, 0.34387969970703125, 0.3582305908203125, 0.37258148193359375, 0.386932373046875, 0.40128326416015625, 0.4156341552734375, 0.42998504638671875, 0.4443359375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 26.0, 122.0, 368.0, 267.0, 109.0, 40.0, 24.0, 10.0, 10.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24437034130096436, -0.23556004464626312, -0.2267497479915619, -0.21793943643569946, -0.20912913978099823, -0.200318843126297, -0.19150853157043457, -0.18269823491573334, -0.1738879382610321, -0.16507764160633087, -0.15626734495162964, -0.1474570333957672, -0.13864673674106598, -0.12983644008636475, -0.12102613598108292, -0.11221583187580109, -0.10340553522109985, -0.09459523856639862, -0.08578493446111679, -0.07697463035583496, -0.06816433370113373, -0.0593540333211422, -0.050543732941150665, -0.041733432561159134, -0.0329231321811676, -0.02411283180117607, -0.01530253142118454, -0.006492231041193008, 0.002318069338798523, 0.011128369718790054, 0.019938670098781586, 0.028748970478773117, 0.03755924105644226, 0.04636954143643379, 0.055179841816425323, 0.06399014592170715, 0.07280044257640839, 0.08161073923110962, 0.09042104333639145, 0.09923134744167328, 0.10804164409637451, 0.11685194075107574, 0.12566223740577698, 0.1344725489616394, 0.14328284561634064, 0.15209314227104187, 0.1609034538269043, 0.16971375048160553, 0.17852404713630676, 0.187334343791008, 0.19614464044570923, 0.20495495200157166, 0.2137652486562729, 0.22257554531097412, 0.23138585686683655, 0.24019615352153778, 0.249006450176239, 0.25781676173210144, 0.2666270434856415, 0.2754373550415039, 0.28424763679504395, 0.29305794835090637, 0.3018682599067688, 0.31067854166030884, 0.31948885321617126]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 3.0, 9.0, 10.0, 9.0, 14.0, 18.0, 27.0, 22.0, 30.0, 20.0, 26.0, 31.0, 37.0, 34.0, 36.0, 45.0, 45.0, 29.0, 43.0, 37.0, 40.0, 48.0, 34.0, 37.0, 35.0, 39.0, 34.0, 38.0, 24.0, 22.0, 21.0, 14.0, 13.0, 6.0, 9.0, 8.0, 12.0, 6.0, 4.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06726968288421631, -0.0653594583272934, -0.06344922631978989, -0.061539001762866974, -0.05962877348065376, -0.05771854519844055, -0.05580832064151764, -0.05389809235930443, -0.05198786407709122, -0.050077635794878006, -0.048167407512664795, -0.04625718295574188, -0.04434695467352867, -0.04243672639131546, -0.04052650183439255, -0.03861627355217934, -0.036706045269966125, -0.034795816987752914, -0.0328855887055397, -0.03097536414861679, -0.02906513586640358, -0.02715490758419037, -0.025244681164622307, -0.023334454745054245, -0.021424226462841034, -0.019513998180627823, -0.01760377176105976, -0.0156935453414917, -0.013783317059278488, -0.011873089708387852, -0.009962862357497215, -0.008052635006606579, -0.006142407655715942, -0.004232180304825306, -0.0023219529539346695, -0.00041172560304403305, 0.0014985017478466034, 0.00340872909873724, 0.005318956449627876, 0.007229183800518513, 0.00913941115140915, 0.011049638502299786, 0.012959865853190422, 0.014870093204081059, 0.016780320554971695, 0.018690548837184906, 0.020600775256752968, 0.02251100167632103, 0.02442122995853424, 0.026331458240747452, 0.028241684660315514, 0.030151911079883575, 0.032062139362096786, 0.03397236764431, 0.03588259220123291, 0.03779282048344612, 0.03970304876565933, 0.04161327704787254, 0.043523505330085754, 0.04543372988700867, 0.04734395816922188, 0.04925418645143509, 0.051164411008358, 0.05307463929057121, 0.054984867572784424]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 12.0, 17.0, 25.0, 23.0, 29.0, 41.0, 41.0, 56.0, 57.0, 82.0, 53.0, 61.0, 67.0, 67.0, 62.0, 54.0, 48.0, 37.0, 34.0, 30.0, 26.0, 22.0, 17.0, 15.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.4375, -112.2724609375, -108.107421875, -103.9423828125, -99.77734375, -95.6123046875, -91.447265625, -87.2822265625, -83.1171875, -78.9521484375, -74.787109375, -70.6220703125, -66.45703125, -62.2919921875, -58.126953125, -53.9619140625, -49.796875, -45.6318359375, -41.466796875, -37.3017578125, -33.13671875, -28.9716796875, -24.806640625, -20.6416015625, -16.4765625, -12.3115234375, -8.146484375, -3.9814453125, 0.18359375, 4.3486328125, 8.513671875, 12.6787109375, 16.84375, 21.0087890625, 25.173828125, 29.3388671875, 33.50390625, 37.6689453125, 41.833984375, 45.9990234375, 50.1640625, 54.3291015625, 58.494140625, 62.6591796875, 66.82421875, 70.9892578125, 75.154296875, 79.3193359375, 83.484375, 87.6494140625, 91.814453125, 95.9794921875, 100.14453125, 104.3095703125, 108.474609375, 112.6396484375, 116.8046875, 120.9697265625, 125.134765625, 129.2998046875, 133.46484375, 137.6298828125, 141.794921875, 145.9599609375, 150.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 11.0, 20.0, 23.0, 43.0, 65.0, 104.0, 187.0, 385.0, 942.0, 2322.0, 7234.0, 34993.0, 470455.0, 484643.0, 35943.0, 7081.0, 2319.0, 918.0, 387.0, 180.0, 107.0, 64.0, 44.0, 37.0, 18.0, 7.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.359375, -28.272216796875, -27.18505859375, -26.097900390625, -25.0107421875, -23.923583984375, -22.83642578125, -21.749267578125, -20.662109375, -19.574951171875, -18.48779296875, -17.400634765625, -16.3134765625, -15.226318359375, -14.13916015625, -13.052001953125, -11.96484375, -10.877685546875, -9.79052734375, -8.703369140625, -7.6162109375, -6.529052734375, -5.44189453125, -4.354736328125, -3.267578125, -2.180419921875, -1.09326171875, -0.006103515625, 1.0810546875, 2.168212890625, 3.25537109375, 4.342529296875, 5.4296875, 6.516845703125, 7.60400390625, 8.691162109375, 9.7783203125, 10.865478515625, 11.95263671875, 13.039794921875, 14.126953125, 15.214111328125, 16.30126953125, 17.388427734375, 18.4755859375, 19.562744140625, 20.64990234375, 21.737060546875, 22.82421875, 23.911376953125, 24.99853515625, 26.085693359375, 27.1728515625, 28.260009765625, 29.34716796875, 30.434326171875, 31.521484375, 32.608642578125, 33.69580078125, 34.782958984375, 35.8701171875, 36.957275390625, 38.04443359375, 39.131591796875, 40.21875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 8.0, 13.0, 21.0, 28.0, 30.0, 37.0, 52.0, 69.0, 55.0, 79.0, 225.0, 1987.0, 77.0, 79.0, 54.0, 49.0, 41.0, 35.0, 27.0, 14.0, 10.0, 9.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-205.0, -198.404296875, -191.80859375, -185.212890625, -178.6171875, -172.021484375, -165.42578125, -158.830078125, -152.234375, -145.638671875, -139.04296875, -132.447265625, -125.8515625, -119.255859375, -112.66015625, -106.064453125, -99.46875, -92.873046875, -86.27734375, -79.681640625, -73.0859375, -66.490234375, -59.89453125, -53.298828125, -46.703125, -40.107421875, -33.51171875, -26.916015625, -20.3203125, -13.724609375, -7.12890625, -0.533203125, 6.0625, 12.658203125, 19.25390625, 25.849609375, 32.4453125, 39.041015625, 45.63671875, 52.232421875, 58.828125, 65.423828125, 72.01953125, 78.615234375, 85.2109375, 91.806640625, 98.40234375, 104.998046875, 111.59375, 118.189453125, 124.78515625, 131.380859375, 137.9765625, 144.572265625, 151.16796875, 157.763671875, 164.359375, 170.955078125, 177.55078125, 184.146484375, 190.7421875, 197.337890625, 203.93359375, 210.529296875, 217.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 12.0, 7.0, 15.0, 20.0, 34.0, 36.0, 62.0, 108.0, 158.0, 289.0, 540.0, 1185.0, 3914.0, 42279.0, 2981650.0, 106332.0, 6076.0, 1475.0, 649.0, 345.0, 190.0, 118.0, 57.0, 46.0, 43.0, 21.0, 13.0, 15.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34375, -45.74560546875, -44.1474609375, -42.54931640625, -40.951171875, -39.35302734375, -37.7548828125, -36.15673828125, -34.55859375, -32.96044921875, -31.3623046875, -29.76416015625, -28.166015625, -26.56787109375, -24.9697265625, -23.37158203125, -21.7734375, -20.17529296875, -18.5771484375, -16.97900390625, -15.380859375, -13.78271484375, -12.1845703125, -10.58642578125, -8.98828125, -7.39013671875, -5.7919921875, -4.19384765625, -2.595703125, -0.99755859375, 0.6005859375, 2.19873046875, 3.796875, 5.39501953125, 6.9931640625, 8.59130859375, 10.189453125, 11.78759765625, 13.3857421875, 14.98388671875, 16.58203125, 18.18017578125, 19.7783203125, 21.37646484375, 22.974609375, 24.57275390625, 26.1708984375, 27.76904296875, 29.3671875, 30.96533203125, 32.5634765625, 34.16162109375, 35.759765625, 37.35791015625, 38.9560546875, 40.55419921875, 42.15234375, 43.75048828125, 45.3486328125, 46.94677734375, 48.544921875, 50.14306640625, 51.7412109375, 53.33935546875, 54.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 14.0, 24.0, 85.0, 186.0, 297.0, 186.0, 92.0, 45.0, 26.0, 11.0, 9.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.56553649902344, -133.92076110839844, -122.27598571777344, -110.63121032714844, -98.98643493652344, -87.34165954589844, -75.69689178466797, -64.05211639404297, -52.40734100341797, -40.76256561279297, -29.1177921295166, -17.473018646240234, -5.828243255615234, 5.816532135009766, 17.4613037109375, 29.1060791015625, 40.7508544921875, 52.3956298828125, 64.0404052734375, 75.6851806640625, 87.3299560546875, 98.9747314453125, 110.61949920654297, 122.26427459716797, 133.9090576171875, 145.5538330078125, 157.1986083984375, 168.8433837890625, 180.4881591796875, 192.1329345703125, 203.7777099609375, 215.4224853515625, 227.06723022460938, 238.71200561523438, 250.35678100585938, 262.0015563964844, 273.6463317871094, 285.2911071777344, 296.9358825683594, 308.5806579589844, 320.2254333496094, 331.8702087402344, 343.5149841308594, 355.1597595214844, 366.8045349121094, 378.4493103027344, 390.0940856933594, 401.7388610839844, 413.38360595703125, 425.02838134765625, 436.67315673828125, 448.31793212890625, 459.96270751953125, 471.60748291015625, 483.25225830078125, 494.89703369140625, 506.54180908203125, 518.1865844726562, 529.8313598632812, 541.4761352539062, 553.1209106445312, 564.7656860351562, 576.4104614257812, 588.0552368164062, 599.7000122070312]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 13.0, 5.0, 8.0, 14.0, 20.0, 25.0, 29.0, 29.0, 29.0, 44.0, 31.0, 50.0, 63.0, 63.0, 49.0, 66.0, 54.0, 52.0, 51.0, 44.0, 45.0, 33.0, 37.0, 33.0, 20.0, 21.0, 14.0, 5.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-258.65252685546875, -251.70884704589844, -244.76516723632812, -237.82150268554688, -230.87782287597656, -223.93414306640625, -216.990478515625, -210.0467987060547, -203.10311889648438, -196.15943908691406, -189.21575927734375, -182.2720947265625, -175.3284149169922, -168.38473510742188, -161.44107055664062, -154.4973907470703, -147.5537109375, -140.6100311279297, -133.66635131835938, -126.72268676757812, -119.77900695800781, -112.8353271484375, -105.89165496826172, -98.94798278808594, -92.00430297851562, -85.06062316894531, -78.11695098876953, -71.17327880859375, -64.22959899902344, -57.28592300415039, -50.342247009277344, -43.3985710144043, -36.45489501953125, -29.511219024658203, -22.567543029785156, -15.62386703491211, -8.680191040039062, -1.7365150451660156, 5.207160949707031, 12.150836944580078, 19.094512939453125, 26.038188934326172, 32.98186492919922, 39.925540924072266, 46.86921691894531, 53.81289291381836, 60.756568908691406, 67.70024108886719, 74.6439208984375, 81.58760070800781, 88.5312728881836, 95.47494506835938, 102.41862487792969, 109.3623046875, 116.30597686767578, 123.24964904785156, 130.19332885742188, 137.1370086669922, 144.0806884765625, 151.02435302734375, 157.96803283691406, 164.91171264648438, 171.85537719726562, 178.79905700683594, 185.74273681640625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 11.0, 14.0, 13.0, 25.0, 29.0, 47.0, 61.0, 71.0, 104.0, 96.0, 156.0, 183.0, 222.0, 289.0, 413.0, 499.0, 713.0, 1070.0, 1039838.0, 1226.0, 922.0, 573.0, 445.0, 325.0, 285.0, 209.0, 161.0, 127.0, 114.0, 87.0, 55.0, 32.0, 30.0, 23.0, 20.0, 16.0, 15.0, 7.0, 11.0, 2.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.28384017944336, -52.57477569580078, -50.86570739746094, -49.15664291381836, -47.44757843017578, -45.7385139465332, -44.029449462890625, -42.32038116455078, -40.6113166809082, -38.902252197265625, -37.19318389892578, -35.4841194152832, -33.775054931640625, -32.06599044799805, -30.356924057006836, -28.647857666015625, -26.938793182373047, -25.22972869873047, -23.520662307739258, -21.811595916748047, -20.10253143310547, -18.39346694946289, -16.68440055847168, -14.975335121154785, -13.26626968383789, -11.557204246520996, -9.848138809204102, -8.139073371887207, -6.4300079345703125, -4.720942497253418, -3.0118770599365234, -1.302811622619629, 0.40625, 2.1153154373168945, 3.824380874633789, 5.533446311950684, 7.242511749267578, 8.951577186584473, 10.660642623901367, 12.369708061218262, 14.078773498535156, 15.78783893585205, 17.496904373168945, 19.205970764160156, 20.915035247802734, 22.624099731445312, 24.333166122436523, 26.042232513427734, 27.751296997070312, 29.46036148071289, 31.1694278717041, 32.87849426269531, 34.58755874633789, 36.29662322998047, 38.00569152832031, 39.71475601196289, 41.42382049560547, 43.13288497924805, 44.841949462890625, 46.55101776123047, 48.26008224487305, 49.969146728515625, 51.67821502685547, 53.38727951049805, 55.096343994140625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 13.0, 10.0, 16.0, 76.0, 873.0, 51462040.0, 56.0, 15.0, 7.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5690.978515625, -5473.685546875, -5256.392578125, -5039.09912109375, -4821.80615234375, -4604.51318359375, -4387.2197265625, -4169.9267578125, -3952.6337890625, -3735.3408203125, -3518.047607421875, -3300.75439453125, -3083.46142578125, -2866.16845703125, -2648.875244140625, -2431.58203125, -2214.2890625, -1996.9959716796875, -1779.702880859375, -1562.4097900390625, -1345.11669921875, -1127.8236083984375, -910.530517578125, -693.2374267578125, -475.9443359375, -258.6512451171875, -41.358154296875, 175.9349365234375, 393.22802734375, 610.5211181640625, 827.814208984375, 1045.1072998046875, 1262.400390625, 1479.6934814453125, 1696.986572265625, 1914.2796630859375, 2131.57275390625, 2348.86572265625, 2566.158935546875, 2783.4521484375, 3000.7451171875, 3218.0380859375, 3435.331298828125, 3652.62451171875, 3869.91748046875, 4087.21044921875, 4304.50390625, 4521.796875, 4739.08984375, 4956.3828125, 5173.67578125, 5390.96923828125, 5608.26220703125, 5825.55517578125, 6042.8486328125, 6260.1416015625, 6477.4345703125, 6694.7275390625, 6912.0205078125, 7129.31396484375, 7346.60693359375, 7563.89990234375, 7781.193359375, 7998.486328125, 8215.779296875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 6.0, 18.0, 25.0, 54.0, 67.0, 89.0, 141.0, 206.0, 329.0, 475.0, 772.0, 1165.0, 1784.0, 2863.0, 4461.0, 7431.0, 11966.0, 19382.0, 32006.0, 53278.0, 88133.0, 142322.0, 225605.0, 337179.0, 499887.0, 3569745.0, 439555.0, 312748.0, 207841.0, 129647.0, 79426.0, 47723.0, 28995.0, 17386.0, 10923.0, 6414.0, 4013.0, 2637.0, 1700.0, 1033.0, 656.0, 478.0, 285.0, 212.0, 131.0, 77.0, 57.0, 40.0, 32.0, 22.0, 13.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.40625, -2.32440185546875, -2.2425537109375, -2.16070556640625, -2.078857421875, -1.99700927734375, -1.9151611328125, -1.83331298828125, -1.75146484375, -1.66961669921875, -1.5877685546875, -1.50592041015625, -1.424072265625, -1.34222412109375, -1.2603759765625, -1.17852783203125, -1.0966796875, -1.01483154296875, -0.9329833984375, -0.85113525390625, -0.769287109375, -0.68743896484375, -0.6055908203125, -0.52374267578125, -0.44189453125, -0.36004638671875, -0.2781982421875, -0.19635009765625, -0.114501953125, -0.03265380859375, 0.0491943359375, 0.13104248046875, 0.212890625, 0.29473876953125, 0.3765869140625, 0.45843505859375, 0.540283203125, 0.62213134765625, 0.7039794921875, 0.78582763671875, 0.86767578125, 0.94952392578125, 1.0313720703125, 1.11322021484375, 1.195068359375, 1.27691650390625, 1.3587646484375, 1.44061279296875, 1.5224609375, 1.60430908203125, 1.6861572265625, 1.76800537109375, 1.849853515625, 1.93170166015625, 2.0135498046875, 2.09539794921875, 2.17724609375, 2.25909423828125, 2.3409423828125, 2.42279052734375, 2.504638671875, 2.58648681640625, 2.6683349609375, 2.75018310546875, 2.83203125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 4.0, 3.0, 9.0, 9.0, 12.0, 8.0, 12.0, 19.0, 9.0, 12.0, 14.0, 26.0, 26.0, 29.0, 31.0, 30.0, 31.0, 38.0, 30.0, 39.0, 49.0, 41.0, 355.0, 705.0, 66.0, 33.0, 31.0, 39.0, 29.0, 29.0, 26.0, 29.0, 23.0, 19.0, 33.0, 20.0, 29.0, 15.0, 13.0, 10.0, 12.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.531494140625, -16.96923828125, -16.406982421875, -15.8447265625, -15.282470703125, -14.72021484375, -14.157958984375, -13.595703125, -13.033447265625, -12.47119140625, -11.908935546875, -11.3466796875, -10.784423828125, -10.22216796875, -9.659912109375, -9.09765625, -8.535400390625, -7.97314453125, -7.410888671875, -6.8486328125, -6.286376953125, -5.72412109375, -5.161865234375, -4.599609375, -4.037353515625, -3.47509765625, -2.912841796875, -2.3505859375, -1.788330078125, -1.22607421875, -0.663818359375, -0.1015625, 0.460693359375, 1.02294921875, 1.585205078125, 2.1474609375, 2.709716796875, 3.27197265625, 3.834228515625, 4.396484375, 4.958740234375, 5.52099609375, 6.083251953125, 6.6455078125, 7.207763671875, 7.77001953125, 8.332275390625, 8.89453125, 9.456787109375, 10.01904296875, 10.581298828125, 11.1435546875, 11.705810546875, 12.26806640625, 12.830322265625, 13.392578125, 13.954833984375, 14.51708984375, 15.079345703125, 15.6416015625, 16.203857421875, 16.76611328125, 17.328369140625, 17.890625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 13.0, 22.0, 35.0, 54.0, 105.0, 139.0, 233.0, 386.0, 545.0, 804.0, 1309.0, 2124.0, 3265.0, 4930.0, 7702.0, 12401.0, 20134.0, 32479.0, 53945.0, 89832.0, 145680.0, 227393.0, 332992.0, 500873.0, 3500994.0, 459177.0, 320505.0, 217632.0, 138059.0, 84204.0, 50994.0, 31386.0, 18921.0, 11624.0, 7405.0, 4668.0, 3080.0, 1975.0, 1266.0, 795.0, 497.0, 335.0, 214.0, 119.0, 75.0, 32.0, 40.0, 13.0, 12.0, 8.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.369140625, -2.29132080078125, -2.2135009765625, -2.13568115234375, -2.057861328125, -1.98004150390625, -1.9022216796875, -1.82440185546875, -1.74658203125, -1.66876220703125, -1.5909423828125, -1.51312255859375, -1.435302734375, -1.35748291015625, -1.2796630859375, -1.20184326171875, -1.1240234375, -1.04620361328125, -0.9683837890625, -0.89056396484375, -0.812744140625, -0.73492431640625, -0.6571044921875, -0.57928466796875, -0.50146484375, -0.42364501953125, -0.3458251953125, -0.26800537109375, -0.190185546875, -0.11236572265625, -0.0345458984375, 0.04327392578125, 0.12109375, 0.19891357421875, 0.2767333984375, 0.35455322265625, 0.432373046875, 0.51019287109375, 0.5880126953125, 0.66583251953125, 0.74365234375, 0.82147216796875, 0.8992919921875, 0.97711181640625, 1.054931640625, 1.13275146484375, 1.2105712890625, 1.28839111328125, 1.3662109375, 1.44403076171875, 1.5218505859375, 1.59967041015625, 1.677490234375, 1.75531005859375, 1.8331298828125, 1.91094970703125, 1.98876953125, 2.06658935546875, 2.1444091796875, 2.22222900390625, 2.300048828125, 2.37786865234375, 2.4556884765625, 2.53350830078125, 2.611328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 3.0, 7.0, 13.0, 16.0, 17.0, 10.0, 26.0, 31.0, 22.0, 18.0, 38.0, 24.0, 32.0, 40.0, 35.0, 43.0, 53.0, 45.0, 373.0, 688.0, 77.0, 38.0, 50.0, 36.0, 30.0, 25.0, 31.0, 32.0, 24.0, 15.0, 20.0, 12.0, 21.0, 14.0, 14.0, 11.0, 9.0, 1.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0, -11.55908203125, -11.1181640625, -10.67724609375, -10.236328125, -9.79541015625, -9.3544921875, -8.91357421875, -8.47265625, -8.03173828125, -7.5908203125, -7.14990234375, -6.708984375, -6.26806640625, -5.8271484375, -5.38623046875, -4.9453125, -4.50439453125, -4.0634765625, -3.62255859375, -3.181640625, -2.74072265625, -2.2998046875, -1.85888671875, -1.41796875, -0.97705078125, -0.5361328125, -0.09521484375, 0.345703125, 0.78662109375, 1.2275390625, 1.66845703125, 2.109375, 2.55029296875, 2.9912109375, 3.43212890625, 3.873046875, 4.31396484375, 4.7548828125, 5.19580078125, 5.63671875, 6.07763671875, 6.5185546875, 6.95947265625, 7.400390625, 7.84130859375, 8.2822265625, 8.72314453125, 9.1640625, 9.60498046875, 10.0458984375, 10.48681640625, 10.927734375, 11.36865234375, 11.8095703125, 12.25048828125, 12.69140625, 13.13232421875, 13.5732421875, 14.01416015625, 14.455078125, 14.89599609375, 15.3369140625, 15.77783203125, 16.21875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 14.0, 18.0, 21.0, 37.0, 44.0, 64.0, 75.0, 105.0, 157.0, 229.0, 365.0, 501.0, 698.0, 1121.0, 1900.0, 3019.0, 5459.0, 10440.0, 21688.0, 46996.0, 110431.0, 5608109.0, 313857.0, 88196.0, 38864.0, 18009.0, 8936.0, 4622.0, 2710.0, 1598.0, 1021.0, 671.0, 415.0, 287.0, 221.0, 155.0, 100.0, 89.0, 51.0, 41.0, 32.0, 17.0, 10.0, 9.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.4375, -9.150390625, -8.86328125, -8.576171875, -8.2890625, -8.001953125, -7.71484375, -7.427734375, -7.140625, -6.853515625, -6.56640625, -6.279296875, -5.9921875, -5.705078125, -5.41796875, -5.130859375, -4.84375, -4.556640625, -4.26953125, -3.982421875, -3.6953125, -3.408203125, -3.12109375, -2.833984375, -2.546875, -2.259765625, -1.97265625, -1.685546875, -1.3984375, -1.111328125, -0.82421875, -0.537109375, -0.25, 0.037109375, 0.32421875, 0.611328125, 0.8984375, 1.185546875, 1.47265625, 1.759765625, 2.046875, 2.333984375, 2.62109375, 2.908203125, 3.1953125, 3.482421875, 3.76953125, 4.056640625, 4.34375, 4.630859375, 4.91796875, 5.205078125, 5.4921875, 5.779296875, 6.06640625, 6.353515625, 6.640625, 6.927734375, 7.21484375, 7.501953125, 7.7890625, 8.076171875, 8.36328125, 8.650390625, 8.9375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 5.0, 5.0, 10.0, 6.0, 11.0, 13.0, 20.0, 19.0, 26.0, 20.0, 21.0, 24.0, 20.0, 29.0, 33.0, 22.0, 28.0, 31.0, 44.0, 47.0, 156.0, 667.0, 282.0, 53.0, 32.0, 37.0, 43.0, 40.0, 28.0, 27.0, 22.0, 22.0, 19.0, 21.0, 21.0, 14.0, 16.0, 20.0, 8.0, 5.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.2578125, -8.9560546875, -8.654296875, -8.3525390625, -8.05078125, -7.7490234375, -7.447265625, -7.1455078125, -6.84375, -6.5419921875, -6.240234375, -5.9384765625, -5.63671875, -5.3349609375, -5.033203125, -4.7314453125, -4.4296875, -4.1279296875, -3.826171875, -3.5244140625, -3.22265625, -2.9208984375, -2.619140625, -2.3173828125, -2.015625, -1.7138671875, -1.412109375, -1.1103515625, -0.80859375, -0.5068359375, -0.205078125, 0.0966796875, 0.3984375, 0.7001953125, 1.001953125, 1.3037109375, 1.60546875, 1.9072265625, 2.208984375, 2.5107421875, 2.8125, 3.1142578125, 3.416015625, 3.7177734375, 4.01953125, 4.3212890625, 4.623046875, 4.9248046875, 5.2265625, 5.5283203125, 5.830078125, 6.1318359375, 6.43359375, 6.7353515625, 7.037109375, 7.3388671875, 7.640625, 7.9423828125, 8.244140625, 8.5458984375, 8.84765625, 9.1494140625, 9.451171875, 9.7529296875, 10.0546875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 8.0, 12.0, 16.0, 32.0, 41.0, 65.0, 74.0, 124.0, 148.0, 139.0, 115.0, 67.0, 45.0, 46.0, 23.0, 16.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.156448364257812, -30.262786865234375, -29.369123458862305, -28.475461959838867, -27.581798553466797, -26.68813705444336, -25.794475555419922, -24.90081214904785, -24.00714874267578, -23.113487243652344, -22.219823837280273, -21.326162338256836, -20.432498931884766, -19.538837432861328, -18.64517593383789, -17.75151252746582, -16.857851028442383, -15.964188575744629, -15.070526123046875, -14.176864624023438, -13.283201217651367, -12.38953971862793, -11.495877265930176, -10.602214813232422, -9.708552360534668, -8.814889907836914, -7.92122745513916, -7.0275654792785645, -6.1339030265808105, -5.240240573883057, -4.346578598022461, -3.452916145324707, -2.559253692626953, -1.6655913591384888, -0.7719290256500244, 0.12173318862915039, 1.0153956413269043, 1.9090580940246582, 2.802720069885254, 3.696382522583008, 4.590044975280762, 5.483707427978516, 6.3773698806762695, 7.271031856536865, 8.164693832397461, 9.058357238769531, 9.952018737792969, 10.845681190490723, 11.739343643188477, 12.63300609588623, 13.526668548583984, 14.420330047607422, 15.313993453979492, 16.20765495300293, 17.101318359375, 17.994979858398438, 18.888641357421875, 19.782302856445312, 20.675966262817383, 21.56962776184082, 22.46329116821289, 23.356952667236328, 24.250614166259766, 25.144277572631836, 26.037940979003906]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 10.0, 9.0, 5.0, 6.0, 5.0, 8.0, 10.0, 19.0, 17.0, 16.0, 28.0, 32.0, 36.0, 34.0, 41.0, 48.0, 42.0, 34.0, 53.0, 60.0, 51.0, 40.0, 48.0, 65.0, 56.0, 30.0, 45.0, 31.0, 24.0, 20.0, 12.0, 16.0, 9.0, 14.0, 11.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.59416961669922, -20.966276168823242, -20.338382720947266, -19.710487365722656, -19.08259391784668, -18.454700469970703, -17.826807022094727, -17.19891357421875, -16.57101821899414, -15.943124771118164, -15.315230369567871, -14.687336921691895, -14.059442520141602, -13.431549072265625, -12.803655624389648, -12.175761222839355, -11.547867774963379, -10.919974327087402, -10.29207992553711, -9.664186477661133, -9.03629207611084, -8.408398628234863, -7.7805047035217285, -7.152610778808594, -6.524716854095459, -5.896822929382324, -5.2689290046691895, -4.641035079956055, -4.013141632080078, -3.3852474689483643, -2.7573537826538086, -2.129459857940674, -1.501565933227539, -0.8736720681190491, -0.24577820301055908, 0.38211560249328613, 1.010009527206421, 1.6379034519195557, 2.2657971382141113, 2.893691062927246, 3.521584987640381, 4.149478912353516, 4.77737283706665, 5.405266761779785, 6.033160209655762, 6.661054611206055, 7.288948059082031, 7.916841983795166, 8.5447359085083, 9.172629356384277, 9.80052375793457, 10.428417205810547, 11.05631160736084, 11.684205055236816, 12.31209945678711, 12.939992904663086, 13.567886352539062, 14.195779800415039, 14.823674201965332, 15.451567649841309, 16.0794620513916, 16.707355499267578, 17.335248947143555, 17.96314239501953, 18.59103775024414]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 7.0, 12.0, 19.0, 19.0, 20.0, 33.0, 36.0, 56.0, 83.0, 115.0, 180.0, 231.0, 336.0, 479.0, 763.0, 1335.0, 2152.0, 3804.0, 7556.0, 17123.0, 53340.0, 3664084.0, 376709.0, 38988.0, 13137.0, 5661.0, 3065.0, 1720.0, 1023.0, 655.0, 455.0, 308.0, 220.0, 149.0, 104.0, 69.0, 57.0, 50.0, 36.0, 22.0, 15.0, 15.0, 11.0, 7.0, 8.0, 7.0, 1.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.82373046875, -0.7952346801757812, -0.7667388916015625, -0.7382431030273438, -0.709747314453125, -0.6812515258789062, -0.6527557373046875, -0.6242599487304688, -0.59576416015625, -0.5672683715820312, -0.5387725830078125, -0.5102767944335938, -0.481781005859375, -0.45328521728515625, -0.4247894287109375, -0.39629364013671875, -0.3677978515625, -0.33930206298828125, -0.3108062744140625, -0.28231048583984375, -0.253814697265625, -0.22531890869140625, -0.1968231201171875, -0.16832733154296875, -0.13983154296875, -0.11133575439453125, -0.0828399658203125, -0.05434417724609375, -0.025848388671875, 0.00264739990234375, 0.0311431884765625, 0.05963897705078125, 0.088134765625, 0.11663055419921875, 0.1451263427734375, 0.17362213134765625, 0.202117919921875, 0.23061370849609375, 0.2591094970703125, 0.28760528564453125, 0.31610107421875, 0.34459686279296875, 0.3730926513671875, 0.40158843994140625, 0.430084228515625, 0.45858001708984375, 0.4870758056640625, 0.5155715942382812, 0.5440673828125, 0.5725631713867188, 0.6010589599609375, 0.6295547485351562, 0.658050537109375, 0.6865463256835938, 0.7150421142578125, 0.7435379028320312, 0.77203369140625, 0.8005294799804688, 0.8290252685546875, 0.8575210571289062, 0.886016845703125, 0.9145126342773438, 0.9430084228515625, 0.9715042114257812, 1.0]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 6.0, 8.0, 8.0, 7.0, 16.0, 13.0, 21.0, 26.0, 774.0, 28.0, 18.0, 11.0, 10.0, 9.0, 6.0, 5.0, 7.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2278728485107422, -0.22124862670898438, -0.21462440490722656, -0.20800018310546875, -0.20137596130371094, -0.19475173950195312, -0.1881275177001953, -0.1815032958984375, -0.1748790740966797, -0.16825485229492188, -0.16163063049316406, -0.15500640869140625, -0.14838218688964844, -0.14175796508789062, -0.1351337432861328, -0.128509521484375, -0.12188529968261719, -0.11526107788085938, -0.10863685607910156, -0.10201263427734375, -0.09538841247558594, -0.08876419067382812, -0.08213996887207031, -0.0755157470703125, -0.06889152526855469, -0.062267303466796875, -0.05564308166503906, -0.04901885986328125, -0.04239463806152344, -0.035770416259765625, -0.029146194458007812, -0.02252197265625, -0.015897750854492188, -0.009273529052734375, -0.0026493072509765625, 0.00397491455078125, 0.010599136352539062, 0.017223358154296875, 0.023847579956054688, 0.0304718017578125, 0.03709602355957031, 0.043720245361328125, 0.05034446716308594, 0.05696868896484375, 0.06359291076660156, 0.07021713256835938, 0.07684135437011719, 0.083465576171875, 0.09008979797363281, 0.09671401977539062, 0.10333824157714844, 0.10996246337890625, 0.11658668518066406, 0.12321090698242188, 0.1298351287841797, 0.1364593505859375, 0.1430835723876953, 0.14970779418945312, 0.15633201599121094, 0.16295623779296875, 0.16958045959472656, 0.17620468139648438, 0.1828289031982422, 0.189453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 19.0, 21.0, 28.0, 55.0, 82.0, 125.0, 175.0, 254.0, 476.0, 701.0, 1185.0, 1927.0, 3366.0, 6293.0, 11603.0, 24571.0, 57362.0, 165481.0, 721179.0, 2507328.0, 468786.0, 128426.0, 48021.0, 21427.0, 10886.0, 5799.0, 3325.0, 1988.0, 1289.0, 710.0, 488.0, 282.0, 201.0, 124.0, 96.0, 55.0, 42.0, 22.0, 26.0, 7.0, 7.0, 9.0, 8.0, 2.0, 6.0, 0.0, 2.0], "bins": [-0.55712890625, -0.5418128967285156, -0.5264968872070312, -0.5111808776855469, -0.4958648681640625, -0.4805488586425781, -0.46523284912109375, -0.4499168395996094, -0.434600830078125, -0.4192848205566406, -0.40396881103515625, -0.3886528015136719, -0.3733367919921875, -0.3580207824707031, -0.34270477294921875, -0.3273887634277344, -0.31207275390625, -0.2967567443847656, -0.28144073486328125, -0.2661247253417969, -0.2508087158203125, -0.23549270629882812, -0.22017669677734375, -0.20486068725585938, -0.189544677734375, -0.17422866821289062, -0.15891265869140625, -0.14359664916992188, -0.1282806396484375, -0.11296463012695312, -0.09764862060546875, -0.08233261108398438, -0.0670166015625, -0.051700592041015625, -0.03638458251953125, -0.021068572998046875, -0.0057525634765625, 0.009563446044921875, 0.02487945556640625, 0.040195465087890625, 0.055511474609375, 0.07082748413085938, 0.08614349365234375, 0.10145950317382812, 0.1167755126953125, 0.13209152221679688, 0.14740753173828125, 0.16272354125976562, 0.17803955078125, 0.19335556030273438, 0.20867156982421875, 0.22398757934570312, 0.2393035888671875, 0.2546195983886719, 0.26993560791015625, 0.2852516174316406, 0.300567626953125, 0.3158836364746094, 0.33119964599609375, 0.3465156555175781, 0.3618316650390625, 0.3771476745605469, 0.39246368408203125, 0.4077796936035156, 0.423095703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 5.0, 5.0, 1.0, 12.0, 8.0, 18.0, 18.0, 30.0, 39.0, 50.0, 88.0, 128.0, 195.0, 286.0, 502.0, 986.0, 585.0, 339.0, 217.0, 152.0, 95.0, 58.0, 49.0, 50.0, 34.0, 28.0, 27.0, 13.0, 13.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.17273902893066406, -0.16542434692382812, -0.1581096649169922, -0.15079498291015625, -0.1434803009033203, -0.13616561889648438, -0.12885093688964844, -0.1215362548828125, -0.11422157287597656, -0.10690689086914062, -0.09959220886230469, -0.09227752685546875, -0.08496284484863281, -0.07764816284179688, -0.07033348083496094, -0.063018798828125, -0.05570411682128906, -0.048389434814453125, -0.04107475280761719, -0.03376007080078125, -0.026445388793945312, -0.019130706787109375, -0.011816024780273438, -0.0045013427734375, 0.0028133392333984375, 0.010128021240234375, 0.017442703247070312, 0.02475738525390625, 0.03207206726074219, 0.039386749267578125, 0.04670143127441406, 0.05401611328125, 0.06133079528808594, 0.06864547729492188, 0.07596015930175781, 0.08327484130859375, 0.09058952331542969, 0.09790420532226562, 0.10521888732910156, 0.1125335693359375, 0.11984825134277344, 0.12716293334960938, 0.1344776153564453, 0.14179229736328125, 0.1491069793701172, 0.15642166137695312, 0.16373634338378906, 0.171051025390625, 0.17836570739746094, 0.18568038940429688, 0.1929950714111328, 0.20030975341796875, 0.2076244354248047, 0.21493911743164062, 0.22225379943847656, 0.2295684814453125, 0.23688316345214844, 0.24419784545898438, 0.2515125274658203, 0.25882720947265625, 0.2661418914794922, 0.2734565734863281, 0.28077125549316406, 0.2880859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 11.0, 12.0, 21.0, 30.0, 44.0, 69.0, 92.0, 131.0, 131.0, 106.0, 93.0, 77.0, 43.0, 34.0, 32.0, 17.0, 14.0, 7.0, 6.0, 1.0, 12.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9362760186195374, -0.8914228677749634, -0.8465697765350342, -0.8017166256904602, -0.7568634748458862, -0.712010383605957, -0.6671572327613831, -0.6223040819168091, -0.5774509906768799, -0.5325978398323059, -0.4877447485923767, -0.44289159774780273, -0.39803847670555115, -0.35318535566329956, -0.3083322048187256, -0.263479083776474, -0.2186259627342224, -0.17377284169197083, -0.12891970574855804, -0.08406656980514526, -0.03921344876289368, 0.00563967227935791, 0.050492823123931885, 0.09534594416618347, 0.14019906520843506, 0.18505218625068665, 0.22990532219409943, 0.2747584581375122, 0.3196115791797638, 0.3644647002220154, 0.40931785106658936, 0.45417097210884094, 0.4990241527557373, 0.5438773036003113, 0.5887303948402405, 0.6335835456848145, 0.6784366369247437, 0.7232897877693176, 0.7681429386138916, 0.8129960298538208, 0.8578491806983948, 0.9027023315429688, 0.947555422782898, 0.9924085736274719, 1.037261724472046, 1.082114815711975, 1.1269679069519043, 1.171821117401123, 1.2166742086410522, 1.2615272998809814, 1.3063805103302002, 1.3512336015701294, 1.3960866928100586, 1.4409399032592773, 1.4857929944992065, 1.5306460857391357, 1.5754992961883545, 1.6203523874282837, 1.6652055978775024, 1.7100586891174316, 1.7549117803573608, 1.79976487159729, 1.8446180820465088, 1.889471173286438, 1.9343242645263672]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 7.0, 5.0, 9.0, 11.0, 21.0, 26.0, 22.0, 32.0, 33.0, 40.0, 44.0, 52.0, 45.0, 53.0, 46.0, 62.0, 58.0, 69.0, 46.0, 50.0, 53.0, 37.0, 40.0, 28.0, 22.0, 16.0, 11.0, 17.0, 7.0, 13.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1244583129882812, -1.0869141817092896, -1.0493699312210083, -1.0118257999420166, -0.9742815494537354, -0.9367374181747437, -0.8991932272911072, -0.8616490364074707, -0.8241048455238342, -0.7865606546401978, -0.7490164637565613, -0.7114722728729248, -0.6739281415939331, -0.6363838911056519, -0.5988397598266602, -0.5612955689430237, -0.5237513780593872, -0.48620718717575073, -0.44866299629211426, -0.41111883521080017, -0.3735746443271637, -0.3360304534435272, -0.29848629236221313, -0.26094210147857666, -0.22339791059494019, -0.1858537197113037, -0.14830954372882843, -0.11076536029577255, -0.07322117686271667, -0.0356769859790802, 0.0018671900033950806, 0.03941136598587036, 0.07695543766021729, 0.11449962109327316, 0.15204380452632904, 0.18958798050880432, 0.2271321713924408, 0.26467636227607727, 0.30222052335739136, 0.33976471424102783, 0.3773089051246643, 0.4148530960083008, 0.45239728689193726, 0.48994144797325134, 0.5274856090545654, 0.5650298595428467, 0.6025739908218384, 0.6401181817054749, 0.6776623725891113, 0.7152065634727478, 0.7527507543563843, 0.7902949452400208, 0.8278391361236572, 0.8653832674026489, 0.9029274582862854, 0.9404716491699219, 0.9780158400535583, 1.0155600309371948, 1.0531041622161865, 1.0906484127044678, 1.1281925439834595, 1.1657367944717407, 1.2032809257507324, 1.2408251762390137, 1.2783693075180054]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 4.0, 3.0, 7.0, 13.0, 18.0, 20.0, 27.0, 45.0, 56.0, 89.0, 143.0, 197.0, 255.0, 401.0, 573.0, 927.0, 1479.0, 2290.0, 3558.0, 5694.0, 9408.0, 16536.0, 33004.0, 411660.0, 484977.0, 34823.0, 16545.0, 9723.0, 5773.0, 3666.0, 2275.0, 1466.0, 938.0, 701.0, 418.0, 243.0, 185.0, 118.0, 90.0, 56.0, 42.0, 44.0, 18.0, 19.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7431640625, -0.719207763671875, -0.69525146484375, -0.671295166015625, -0.6473388671875, -0.623382568359375, -0.59942626953125, -0.575469970703125, -0.551513671875, -0.527557373046875, -0.50360107421875, -0.479644775390625, -0.4556884765625, -0.431732177734375, -0.40777587890625, -0.383819580078125, -0.35986328125, -0.335906982421875, -0.31195068359375, -0.287994384765625, -0.2640380859375, -0.240081787109375, -0.21612548828125, -0.192169189453125, -0.168212890625, -0.144256591796875, -0.12030029296875, -0.096343994140625, -0.0723876953125, -0.048431396484375, -0.02447509765625, -0.000518798828125, 0.0234375, 0.047393798828125, 0.07135009765625, 0.095306396484375, 0.1192626953125, 0.143218994140625, 0.16717529296875, 0.191131591796875, 0.215087890625, 0.239044189453125, 0.26300048828125, 0.286956787109375, 0.3109130859375, 0.334869384765625, 0.35882568359375, 0.382781982421875, 0.40673828125, 0.430694580078125, 0.45465087890625, 0.478607177734375, 0.5025634765625, 0.526519775390625, 0.55047607421875, 0.574432373046875, 0.598388671875, 0.622344970703125, 0.64630126953125, 0.670257568359375, 0.6942138671875, 0.718170166015625, 0.74212646484375, 0.766082763671875, 0.7900390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 6.0, 6.0, 6.0, 10.0, 16.0, 16.0, 22.0, 147.0, 368.0, 251.0, 64.0, 23.0, 14.0, 9.0, 3.0, 4.0, 7.0, 8.0, 0.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.2257976531982422, -0.21929550170898438, -0.21279335021972656, -0.20629119873046875, -0.19978904724121094, -0.19328689575195312, -0.1867847442626953, -0.1802825927734375, -0.1737804412841797, -0.16727828979492188, -0.16077613830566406, -0.15427398681640625, -0.14777183532714844, -0.14126968383789062, -0.1347675323486328, -0.128265380859375, -0.12176322937011719, -0.11526107788085938, -0.10875892639160156, -0.10225677490234375, -0.09575462341308594, -0.08925247192382812, -0.08275032043457031, -0.0762481689453125, -0.06974601745605469, -0.06324386596679688, -0.05674171447753906, -0.05023956298828125, -0.04373741149902344, -0.037235260009765625, -0.030733108520507812, -0.02423095703125, -0.017728805541992188, -0.011226654052734375, -0.0047245025634765625, 0.00177764892578125, 0.008279800415039062, 0.014781951904296875, 0.021284103393554688, 0.0277862548828125, 0.03428840637207031, 0.040790557861328125, 0.04729270935058594, 0.05379486083984375, 0.06029701232910156, 0.06679916381835938, 0.07330131530761719, 0.079803466796875, 0.08630561828613281, 0.09280776977539062, 0.09930992126464844, 0.10581207275390625, 0.11231422424316406, 0.11881637573242188, 0.1253185272216797, 0.1318206787109375, 0.1383228302001953, 0.14482498168945312, 0.15132713317871094, 0.15782928466796875, 0.16433143615722656, 0.17083358764648438, 0.1773357391357422, 0.183837890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 12.0, 11.0, 26.0, 26.0, 43.0, 59.0, 108.0, 121.0, 189.0, 265.0, 458.0, 736.0, 1236.0, 2162.0, 4108.0, 8403.0, 18542.0, 45720.0, 123822.0, 322205.0, 316086.0, 122668.0, 45342.0, 18435.0, 8262.0, 4093.0, 2174.0, 1177.0, 683.0, 421.0, 286.0, 166.0, 161.0, 86.0, 65.0, 41.0, 36.0, 22.0, 16.0, 18.0, 13.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.7705078125, -0.7471542358398438, -0.7238006591796875, -0.7004470825195312, -0.677093505859375, -0.6537399291992188, -0.6303863525390625, -0.6070327758789062, -0.58367919921875, -0.5603256225585938, -0.5369720458984375, -0.5136184692382812, -0.490264892578125, -0.46691131591796875, -0.4435577392578125, -0.42020416259765625, -0.3968505859375, -0.37349700927734375, -0.3501434326171875, -0.32678985595703125, -0.303436279296875, -0.28008270263671875, -0.2567291259765625, -0.23337554931640625, -0.21002197265625, -0.18666839599609375, -0.1633148193359375, -0.13996124267578125, -0.116607666015625, -0.09325408935546875, -0.0699005126953125, -0.04654693603515625, -0.023193359375, 0.00016021728515625, 0.0235137939453125, 0.04686737060546875, 0.070220947265625, 0.09357452392578125, 0.1169281005859375, 0.14028167724609375, 0.16363525390625, 0.18698883056640625, 0.2103424072265625, 0.23369598388671875, 0.257049560546875, 0.28040313720703125, 0.3037567138671875, 0.32711029052734375, 0.3504638671875, 0.37381744384765625, 0.3971710205078125, 0.42052459716796875, 0.443878173828125, 0.46723175048828125, 0.4905853271484375, 0.5139389038085938, 0.53729248046875, 0.5606460571289062, 0.5839996337890625, 0.6073532104492188, 0.630706787109375, 0.6540603637695312, 0.6774139404296875, 0.7007675170898438, 0.72412109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 9.0, 6.0, 5.0, 10.0, 9.0, 13.0, 16.0, 17.0, 20.0, 29.0, 24.0, 25.0, 36.0, 30.0, 42.0, 33.0, 34.0, 44.0, 50.0, 48.0, 31.0, 49.0, 38.0, 35.0, 47.0, 36.0, 36.0, 31.0, 32.0, 28.0, 17.0, 20.0, 13.0, 14.0, 23.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6378173828125, -0.616943359375, -0.5960693359375, -0.5751953125, -0.5543212890625, -0.533447265625, -0.5125732421875, -0.49169921875, -0.4708251953125, -0.449951171875, -0.4290771484375, -0.408203125, -0.3873291015625, -0.366455078125, -0.3455810546875, -0.32470703125, -0.3038330078125, -0.282958984375, -0.2620849609375, -0.2412109375, -0.2203369140625, -0.199462890625, -0.1785888671875, -0.15771484375, -0.1368408203125, -0.115966796875, -0.0950927734375, -0.07421875, -0.0533447265625, -0.032470703125, -0.0115966796875, 0.00927734375, 0.0301513671875, 0.051025390625, 0.0718994140625, 0.0927734375, 0.1136474609375, 0.134521484375, 0.1553955078125, 0.17626953125, 0.1971435546875, 0.218017578125, 0.2388916015625, 0.259765625, 0.2806396484375, 0.301513671875, 0.3223876953125, 0.34326171875, 0.3641357421875, 0.385009765625, 0.4058837890625, 0.4267578125, 0.4476318359375, 0.468505859375, 0.4893798828125, 0.51025390625, 0.5311279296875, 0.552001953125, 0.5728759765625, 0.59375, 0.6146240234375, 0.635498046875, 0.6563720703125, 0.67724609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 9.0, 15.0, 16.0, 39.0, 42.0, 51.0, 78.0, 127.0, 223.0, 384.0, 758.0, 1663.0, 4702.0, 19575.0, 263743.0, 709002.0, 36567.0, 7115.0, 2334.0, 969.0, 465.0, 246.0, 131.0, 79.0, 59.0, 33.0, 39.0, 25.0, 13.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7734375, -1.7199554443359375, -1.666473388671875, -1.6129913330078125, -1.55950927734375, -1.5060272216796875, -1.452545166015625, -1.3990631103515625, -1.3455810546875, -1.2920989990234375, -1.238616943359375, -1.1851348876953125, -1.13165283203125, -1.0781707763671875, -1.024688720703125, -0.9712066650390625, -0.917724609375, -0.8642425537109375, -0.810760498046875, -0.7572784423828125, -0.70379638671875, -0.6503143310546875, -0.596832275390625, -0.5433502197265625, -0.4898681640625, -0.4363861083984375, -0.382904052734375, -0.3294219970703125, -0.27593994140625, -0.2224578857421875, -0.168975830078125, -0.1154937744140625, -0.06201171875, -0.0085296630859375, 0.044952392578125, 0.0984344482421875, 0.15191650390625, 0.2053985595703125, 0.258880615234375, 0.3123626708984375, 0.3658447265625, 0.4193267822265625, 0.472808837890625, 0.5262908935546875, 0.57977294921875, 0.6332550048828125, 0.686737060546875, 0.7402191162109375, 0.793701171875, 0.8471832275390625, 0.900665283203125, 0.9541473388671875, 1.00762939453125, 1.0611114501953125, 1.114593505859375, 1.1680755615234375, 1.2215576171875, 1.2750396728515625, 1.328521728515625, 1.3820037841796875, 1.43548583984375, 1.4889678955078125, 1.542449951171875, 1.5959320068359375, 1.6494140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 12.0, 30.0, 29.0, 62.0, 106.0, 106.0, 130.0, 151.0, 111.0, 74.0, 65.0, 30.0, 24.0, 17.0, 10.0, 10.0, 7.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.644559860229492e-05, -5.346816033124924e-05, -5.049072206020355e-05, -4.751328378915787e-05, -4.453584551811218e-05, -4.15584072470665e-05, -3.858096897602081e-05, -3.560353070497513e-05, -3.262609243392944e-05, -2.964865416288376e-05, -2.6671215891838074e-05, -2.369377762079239e-05, -2.0716339349746704e-05, -1.773890107870102e-05, -1.4761462807655334e-05, -1.178402453660965e-05, -8.806586265563965e-06, -5.82914799451828e-06, -2.8517097234725952e-06, 1.257285475730896e-07, 3.1031668186187744e-06, 6.080605089664459e-06, 9.058043360710144e-06, 1.2035481631755829e-05, 1.5012919902801514e-05, 1.79903581738472e-05, 2.0967796444892883e-05, 2.3945234715938568e-05, 2.6922672986984253e-05, 2.9900111258029938e-05, 3.287754952907562e-05, 3.585498780012131e-05, 3.883242607116699e-05, 4.180986434221268e-05, 4.478730261325836e-05, 4.776474088430405e-05, 5.074217915534973e-05, 5.3719617426395416e-05, 5.66970556974411e-05, 5.9674493968486786e-05, 6.265193223953247e-05, 6.562937051057816e-05, 6.860680878162384e-05, 7.158424705266953e-05, 7.456168532371521e-05, 7.75391235947609e-05, 8.051656186580658e-05, 8.349400013685226e-05, 8.647143840789795e-05, 8.944887667894363e-05, 9.242631494998932e-05, 9.5403753221035e-05, 9.838119149208069e-05, 0.00010135862976312637, 0.00010433606803417206, 0.00010731350630521774, 0.00011029094457626343, 0.00011326838284730911, 0.0001162458211183548, 0.00011922325938940048, 0.00012220069766044617, 0.00012517813593149185, 0.00012815557420253754, 0.00013113301247358322, 0.0001341104507446289]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 10.0, 14.0, 24.0, 36.0, 51.0, 79.0, 103.0, 164.0, 269.0, 433.0, 761.0, 1394.0, 2814.0, 6464.0, 17300.0, 61962.0, 358266.0, 481127.0, 81256.0, 21188.0, 7683.0, 3232.0, 1676.0, 868.0, 486.0, 284.0, 184.0, 111.0, 86.0, 64.0, 33.0, 34.0, 21.0, 19.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.0810546875, -1.0462799072265625, -1.011505126953125, -0.9767303466796875, -0.94195556640625, -0.9071807861328125, -0.872406005859375, -0.8376312255859375, -0.8028564453125, -0.7680816650390625, -0.733306884765625, -0.6985321044921875, -0.66375732421875, -0.6289825439453125, -0.594207763671875, -0.5594329833984375, -0.524658203125, -0.4898834228515625, -0.455108642578125, -0.4203338623046875, -0.38555908203125, -0.3507843017578125, -0.316009521484375, -0.2812347412109375, -0.2464599609375, -0.2116851806640625, -0.176910400390625, -0.1421356201171875, -0.10736083984375, -0.0725860595703125, -0.037811279296875, -0.0030364990234375, 0.03173828125, 0.0665130615234375, 0.101287841796875, 0.1360626220703125, 0.17083740234375, 0.2056121826171875, 0.240386962890625, 0.2751617431640625, 0.3099365234375, 0.3447113037109375, 0.379486083984375, 0.4142608642578125, 0.44903564453125, 0.4838104248046875, 0.518585205078125, 0.5533599853515625, 0.588134765625, 0.6229095458984375, 0.657684326171875, 0.6924591064453125, 0.72723388671875, 0.7620086669921875, 0.796783447265625, 0.8315582275390625, 0.8663330078125, 0.9011077880859375, 0.935882568359375, 0.9706573486328125, 1.00543212890625, 1.0402069091796875, 1.074981689453125, 1.1097564697265625, 1.14453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 12.0, 10.0, 20.0, 25.0, 25.0, 36.0, 58.0, 57.0, 79.0, 69.0, 78.0, 76.0, 84.0, 80.0, 50.0, 39.0, 45.0, 20.0, 19.0, 16.0, 17.0, 12.0, 7.0, 9.0, 6.0, 8.0, 7.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0207977294921875, -0.987884521484375, -0.9549713134765625, -0.92205810546875, -0.8891448974609375, -0.856231689453125, -0.8233184814453125, -0.7904052734375, -0.7574920654296875, -0.724578857421875, -0.6916656494140625, -0.65875244140625, -0.6258392333984375, -0.592926025390625, -0.5600128173828125, -0.527099609375, -0.4941864013671875, -0.461273193359375, -0.4283599853515625, -0.39544677734375, -0.3625335693359375, -0.329620361328125, -0.2967071533203125, -0.2637939453125, -0.2308807373046875, -0.197967529296875, -0.1650543212890625, -0.13214111328125, -0.0992279052734375, -0.066314697265625, -0.0334014892578125, -0.00048828125, 0.0324249267578125, 0.065338134765625, 0.0982513427734375, 0.13116455078125, 0.1640777587890625, 0.196990966796875, 0.2299041748046875, 0.2628173828125, 0.2957305908203125, 0.328643798828125, 0.3615570068359375, 0.39447021484375, 0.4273834228515625, 0.460296630859375, 0.4932098388671875, 0.526123046875, 0.5590362548828125, 0.591949462890625, 0.6248626708984375, 0.65777587890625, 0.6906890869140625, 0.723602294921875, 0.7565155029296875, 0.7894287109375, 0.8223419189453125, 0.855255126953125, 0.8881683349609375, 0.92108154296875, 0.9539947509765625, 0.986907958984375, 1.0198211669921875, 1.052734375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 7.0, 11.0, 21.0, 60.0, 196.0, 346.0, 202.0, 87.0, 29.0, 15.0, 8.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.618993759155273, -9.036643981933594, -8.454293251037598, -7.871943473815918, -7.289593696594238, -6.7072434425354, -6.1248931884765625, -5.542543411254883, -4.960193157196045, -4.377842903137207, -3.7954931259155273, -3.2131428718566895, -2.6307928562164307, -2.048442840576172, -1.466092586517334, -0.8837428092956543, -0.3013925552368164, 0.28095752000808716, 0.8633075952529907, 1.445657730102539, 2.028007745742798, 2.6103577613830566, 3.1927080154418945, 3.775057792663574, 4.357408046722412, 4.93975830078125, 5.52210807800293, 6.104458332061768, 6.6868085861206055, 7.269158363342285, 7.851508617401123, 8.433858871459961, 9.01620864868164, 9.59855842590332, 10.180909156799316, 10.763258934020996, 11.345608711242676, 11.927959442138672, 12.510309219360352, 13.092658996582031, 13.675008773803711, 14.25735855102539, 14.839709281921387, 15.422059059143066, 16.004409790039062, 16.586759567260742, 17.169109344482422, 17.7514591217041, 18.33380889892578, 18.91615867614746, 19.49850845336914, 20.080860137939453, 20.663209915161133, 21.245559692382812, 21.827909469604492, 22.410259246826172, 22.992610931396484, 23.574960708618164, 24.157310485839844, 24.739662170410156, 25.322011947631836, 25.904361724853516, 26.486711502075195, 27.069061279296875, 27.651411056518555]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 9.0, 10.0, 14.0, 21.0, 41.0, 65.0, 123.0, 182.0, 177.0, 149.0, 83.0, 38.0, 24.0, 14.0, 13.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.530311584472656, -15.962973594665527, -15.395635604858398, -14.82829761505127, -14.26095962524414, -13.693621635437012, -13.126283645629883, -12.558944702148438, -11.991607666015625, -11.424269676208496, -10.856931686401367, -10.289593696594238, -9.72225570678711, -9.15491771697998, -8.587579727172852, -8.020240783691406, -7.452902793884277, -6.885564804077148, -6.3182268142700195, -5.750888824462891, -5.183550834655762, -4.616212844848633, -4.048874378204346, -3.481536388397217, -2.914198398590088, -2.346860408782959, -1.7795222997665405, -1.212184190750122, -0.6448462009429932, -0.07750821113586426, 0.48983001708984375, 1.0571680068969727, 1.6245059967041016, 2.1918439865112305, 2.7591819763183594, 3.3265202045440674, 3.8938581943511963, 4.461195945739746, 5.028534412384033, 5.595872402191162, 6.163210391998291, 6.73054838180542, 7.297886371612549, 7.865224838256836, 8.432562828063965, 8.999900817871094, 9.567238807678223, 10.134576797485352, 10.70191478729248, 11.26925277709961, 11.836590766906738, 12.403928756713867, 12.971266746520996, 13.538604736328125, 14.10594367980957, 14.673280715942383, 15.240619659423828, 15.807957649230957, 16.375295639038086, 16.94263458251953, 17.509971618652344, 18.07731056213379, 18.6446475982666, 19.211986541748047, 19.77932357788086]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 9.0, 12.0, 16.0, 33.0, 50.0, 90.0, 141.0, 258.0, 496.0, 1016.0, 2188.0, 5773.0, 22610.0, 1490203.0, 2637357.0, 24048.0, 5897.0, 2118.0, 923.0, 473.0, 224.0, 121.0, 76.0, 55.0, 32.0, 12.0, 8.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.406036376953125, -3.29254150390625, -3.179046630859375, -3.0655517578125, -2.952056884765625, -2.83856201171875, -2.725067138671875, -2.611572265625, -2.498077392578125, -2.38458251953125, -2.271087646484375, -2.1575927734375, -2.044097900390625, -1.93060302734375, -1.817108154296875, -1.70361328125, -1.590118408203125, -1.47662353515625, -1.363128662109375, -1.2496337890625, -1.136138916015625, -1.02264404296875, -0.909149169921875, -0.795654296875, -0.682159423828125, -0.56866455078125, -0.455169677734375, -0.3416748046875, -0.228179931640625, -0.11468505859375, -0.001190185546875, 0.1123046875, 0.225799560546875, 0.33929443359375, 0.452789306640625, 0.5662841796875, 0.679779052734375, 0.79327392578125, 0.906768798828125, 1.020263671875, 1.133758544921875, 1.24725341796875, 1.360748291015625, 1.4742431640625, 1.587738037109375, 1.70123291015625, 1.814727783203125, 1.92822265625, 2.041717529296875, 2.15521240234375, 2.268707275390625, 2.3822021484375, 2.495697021484375, 2.60919189453125, 2.722686767578125, 2.836181640625, 2.949676513671875, 3.06317138671875, 3.176666259765625, 3.2901611328125, 3.403656005859375, 3.51715087890625, 3.630645751953125, 3.744140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 8.0, 8.0, 20.0, 26.0, 62.0, 128.0, 191.0, 222.0, 121.0, 80.0, 33.0, 15.0, 8.0, 11.0, 12.0, 6.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1998291015625, -0.19378089904785156, -0.18773269653320312, -0.1816844940185547, -0.17563629150390625, -0.1695880889892578, -0.16353988647460938, -0.15749168395996094, -0.1514434814453125, -0.14539527893066406, -0.13934707641601562, -0.1332988739013672, -0.12725067138671875, -0.12120246887207031, -0.11515426635742188, -0.10910606384277344, -0.103057861328125, -0.09700965881347656, -0.09096145629882812, -0.08491325378417969, -0.07886505126953125, -0.07281684875488281, -0.06676864624023438, -0.06072044372558594, -0.0546722412109375, -0.04862403869628906, -0.042575836181640625, -0.03652763366699219, -0.03047943115234375, -0.024431228637695312, -0.018383026123046875, -0.012334823608398438, -0.00628662109375, -0.0002384185791015625, 0.005809783935546875, 0.011857986450195312, 0.01790618896484375, 0.023954391479492188, 0.030002593994140625, 0.03605079650878906, 0.0420989990234375, 0.04814720153808594, 0.054195404052734375, 0.06024360656738281, 0.06629180908203125, 0.07234001159667969, 0.07838821411132812, 0.08443641662597656, 0.090484619140625, 0.09653282165527344, 0.10258102416992188, 0.10862922668457031, 0.11467742919921875, 0.12072563171386719, 0.12677383422851562, 0.13282203674316406, 0.1388702392578125, 0.14491844177246094, 0.15096664428710938, 0.1570148468017578, 0.16306304931640625, 0.1691112518310547, 0.17515945434570312, 0.18120765686035156, 0.187255859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 11.0, 2.0, 1.0, 10.0, 12.0, 7.0, 17.0, 22.0, 28.0, 48.0, 80.0, 90.0, 130.0, 183.0, 275.0, 392.0, 618.0, 970.0, 1538.0, 2536.0, 4259.0, 7770.0, 15622.0, 36450.0, 114842.0, 1010581.0, 2738096.0, 169585.0, 47747.0, 19445.0, 9368.0, 5173.0, 2980.0, 1868.0, 1158.0, 756.0, 530.0, 339.0, 232.0, 146.0, 113.0, 75.0, 60.0, 25.0, 30.0, 26.0, 12.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.2425079345703125, -1.199859619140625, -1.1572113037109375, -1.11456298828125, -1.0719146728515625, -1.029266357421875, -0.9866180419921875, -0.9439697265625, -0.9013214111328125, -0.858673095703125, -0.8160247802734375, -0.77337646484375, -0.7307281494140625, -0.688079833984375, -0.6454315185546875, -0.602783203125, -0.5601348876953125, -0.517486572265625, -0.4748382568359375, -0.43218994140625, -0.3895416259765625, -0.346893310546875, -0.3042449951171875, -0.2615966796875, -0.2189483642578125, -0.176300048828125, -0.1336517333984375, -0.09100341796875, -0.0483551025390625, -0.005706787109375, 0.0369415283203125, 0.07958984375, 0.1222381591796875, 0.164886474609375, 0.2075347900390625, 0.25018310546875, 0.2928314208984375, 0.335479736328125, 0.3781280517578125, 0.4207763671875, 0.4634246826171875, 0.506072998046875, 0.5487213134765625, 0.59136962890625, 0.6340179443359375, 0.676666259765625, 0.7193145751953125, 0.761962890625, 0.8046112060546875, 0.847259521484375, 0.8899078369140625, 0.93255615234375, 0.9752044677734375, 1.017852783203125, 1.0605010986328125, 1.1031494140625, 1.1457977294921875, 1.188446044921875, 1.2310943603515625, 1.27374267578125, 1.3163909912109375, 1.359039306640625, 1.4016876220703125, 1.4443359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 6.0, 8.0, 9.0, 16.0, 25.0, 39.0, 56.0, 85.0, 169.0, 324.0, 1115.0, 1475.0, 340.0, 137.0, 73.0, 51.0, 34.0, 15.0, 16.0, 13.0, 9.0, 11.0, 5.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30517578125, -0.29468536376953125, -0.2841949462890625, -0.27370452880859375, -0.263214111328125, -0.25272369384765625, -0.2422332763671875, -0.23174285888671875, -0.22125244140625, -0.21076202392578125, -0.2002716064453125, -0.18978118896484375, -0.179290771484375, -0.16880035400390625, -0.1583099365234375, -0.14781951904296875, -0.1373291015625, -0.12683868408203125, -0.1163482666015625, -0.10585784912109375, -0.095367431640625, -0.08487701416015625, -0.0743865966796875, -0.06389617919921875, -0.05340576171875, -0.04291534423828125, -0.0324249267578125, -0.02193450927734375, -0.011444091796875, -0.00095367431640625, 0.0095367431640625, 0.02002716064453125, 0.030517578125, 0.04100799560546875, 0.0514984130859375, 0.06198883056640625, 0.072479248046875, 0.08296966552734375, 0.0934600830078125, 0.10395050048828125, 0.11444091796875, 0.12493133544921875, 0.1354217529296875, 0.14591217041015625, 0.156402587890625, 0.16689300537109375, 0.1773834228515625, 0.18787384033203125, 0.1983642578125, 0.20885467529296875, 0.2193450927734375, 0.22983551025390625, 0.240325927734375, 0.25081634521484375, 0.2613067626953125, 0.27179718017578125, 0.28228759765625, 0.29277801513671875, 0.3032684326171875, 0.31375885009765625, 0.324249267578125, 0.33473968505859375, 0.3452301025390625, 0.35572052001953125, 0.3662109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 14.0, 8.0, 29.0, 67.0, 160.0, 251.0, 217.0, 137.0, 54.0, 19.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.637739658355713, -3.547118902206421, -3.456498384475708, -3.365877628326416, -3.275257110595703, -3.184636354446411, -3.094015598297119, -3.0033950805664062, -2.9127743244171143, -2.8221535682678223, -2.7315330505371094, -2.6409122943878174, -2.5502915382385254, -2.4596710205078125, -2.3690502643585205, -2.2784295082092285, -2.1878089904785156, -2.0971882343292236, -2.0065677165985107, -1.9159469604492188, -1.8253263235092163, -1.7347056865692139, -1.6440849304199219, -1.5534642934799194, -1.462843656539917, -1.3722230195999146, -1.281602382659912, -1.1909816265106201, -1.1003609895706177, -1.0097403526306152, -0.919119656085968, -0.8284989595413208, -0.7378783226013184, -0.6472576856613159, -0.5566369891166687, -0.46601632237434387, -0.37539565563201904, -0.2847749888896942, -0.19415432214736938, -0.10353362560272217, -0.012912988662719727, 0.0777076780796051, 0.16832834482192993, 0.25894901156425476, 0.3495696783065796, 0.4401903450489044, 0.5308110117912292, 0.6214317083358765, 0.7120523452758789, 0.8026729822158813, 0.8932936787605286, 0.9839143753051758, 1.0745350122451782, 1.1651556491851807, 1.2557764053344727, 1.346397042274475, 1.4370176792144775, 1.52763831615448, 1.6182589530944824, 1.7088797092437744, 1.7995003461837769, 1.8901209831237793, 1.9807417392730713, 2.0713624954223633, 2.161983013153076]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 9.0, 20.0, 17.0, 31.0, 43.0, 62.0, 63.0, 68.0, 97.0, 87.0, 93.0, 94.0, 76.0, 65.0, 50.0, 25.0, 28.0, 13.0, 10.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1788170337677, -2.1164371967315674, -2.0540575981140137, -1.9916777610778809, -1.9292980432510376, -1.8669182062149048, -1.8045384883880615, -1.7421586513519287, -1.6797789335250854, -1.6173992156982422, -1.5550193786621094, -1.4926396608352661, -1.4302599430084229, -1.36788010597229, -1.3055003881454468, -1.2431206703186035, -1.1807408332824707, -1.1183611154556274, -1.0559812784194946, -0.9936015605926514, -0.9312217831611633, -0.8688420057296753, -0.806462287902832, -0.744082510471344, -0.6817028522491455, -0.6193230748176575, -0.5569433569908142, -0.49456357955932617, -0.43218380212783813, -0.3698040544986725, -0.30742430686950684, -0.2450445294380188, -0.18266475200653076, -0.12028498947620392, -0.05790523439645767, 0.004474520683288574, 0.06685428321361542, 0.12923404574394226, 0.1916137933731079, 0.25399357080459595, 0.3163733184337616, 0.37875306606292725, 0.4411328434944153, 0.5035126209259033, 0.5658923387527466, 0.6282721161842346, 0.6906518936157227, 0.7530316114425659, 0.815411388874054, 0.877791166305542, 0.9401708841323853, 1.0025506019592285, 1.0649304389953613, 1.1273101568222046, 1.1896898746490479, 1.2520697116851807, 1.314449429512024, 1.3768291473388672, 1.439208984375, 1.5015887022018433, 1.5639684200286865, 1.6263482570648193, 1.6887279748916626, 1.7511076927185059, 1.8134875297546387]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 7.0, 8.0, 6.0, 12.0, 24.0, 22.0, 34.0, 47.0, 86.0, 132.0, 207.0, 337.0, 563.0, 983.0, 1849.0, 3309.0, 6402.0, 12920.0, 29984.0, 105382.0, 484089.0, 296893.0, 62908.0, 21378.0, 9893.0, 4904.0, 2649.0, 1479.0, 771.0, 458.0, 273.0, 191.0, 110.0, 83.0, 37.0, 30.0, 27.0, 20.0, 11.0, 9.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.990234375, -0.9600601196289062, -0.9298858642578125, -0.8997116088867188, -0.869537353515625, -0.8393630981445312, -0.8091888427734375, -0.7790145874023438, -0.74884033203125, -0.7186660766601562, -0.6884918212890625, -0.6583175659179688, -0.628143310546875, -0.5979690551757812, -0.5677947998046875, -0.5376205444335938, -0.5074462890625, -0.47727203369140625, -0.4470977783203125, -0.41692352294921875, -0.386749267578125, -0.35657501220703125, -0.3264007568359375, -0.29622650146484375, -0.26605224609375, -0.23587799072265625, -0.2057037353515625, -0.17552947998046875, -0.145355224609375, -0.11518096923828125, -0.0850067138671875, -0.05483245849609375, -0.024658203125, 0.00551605224609375, 0.0356903076171875, 0.06586456298828125, 0.096038818359375, 0.12621307373046875, 0.1563873291015625, 0.18656158447265625, 0.21673583984375, 0.24691009521484375, 0.2770843505859375, 0.30725860595703125, 0.337432861328125, 0.36760711669921875, 0.3977813720703125, 0.42795562744140625, 0.4581298828125, 0.48830413818359375, 0.5184783935546875, 0.5486526489257812, 0.578826904296875, 0.6090011596679688, 0.6391754150390625, 0.6693496704101562, 0.69952392578125, 0.7296981811523438, 0.7598724365234375, 0.7900466918945312, 0.820220947265625, 0.8503952026367188, 0.8805694580078125, 0.9107437133789062, 0.94091796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 16.0, 9.0, 14.0, 28.0, 34.0, 61.0, 78.0, 67.0, 80.0, 117.0, 91.0, 93.0, 67.0, 59.0, 36.0, 35.0, 21.0, 9.0, 11.0, 8.0, 9.0, 4.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.11199951171875, -0.10875606536865234, -0.10551261901855469, -0.10226917266845703, -0.09902572631835938, -0.09578227996826172, -0.09253883361816406, -0.0892953872680664, -0.08605194091796875, -0.0828084945678711, -0.07956504821777344, -0.07632160186767578, -0.07307815551757812, -0.06983470916748047, -0.06659126281738281, -0.06334781646728516, -0.0601043701171875, -0.056860923767089844, -0.05361747741699219, -0.05037403106689453, -0.047130584716796875, -0.04388713836669922, -0.04064369201660156, -0.037400245666503906, -0.03415679931640625, -0.030913352966308594, -0.027669906616210938, -0.02442646026611328, -0.021183013916015625, -0.01793956756591797, -0.014696121215820312, -0.011452674865722656, -0.008209228515625, -0.004965782165527344, -0.0017223358154296875, 0.0015211105346679688, 0.004764556884765625, 0.008008003234863281, 0.011251449584960938, 0.014494895935058594, 0.01773834228515625, 0.020981788635253906, 0.024225234985351562, 0.02746868133544922, 0.030712127685546875, 0.03395557403564453, 0.03719902038574219, 0.040442466735839844, 0.0436859130859375, 0.046929359436035156, 0.05017280578613281, 0.05341625213623047, 0.056659698486328125, 0.05990314483642578, 0.06314659118652344, 0.0663900375366211, 0.06963348388671875, 0.0728769302368164, 0.07612037658691406, 0.07936382293701172, 0.08260726928710938, 0.08585071563720703, 0.08909416198730469, 0.09233760833740234, 0.0955810546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 7.0, 5.0, 6.0, 5.0, 11.0, 29.0, 132.0, 763.0, 13436.0, 637208.0, 388412.0, 7784.0, 552.0, 126.0, 34.0, 5.0, 4.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.883056640625, -2.77978515625, -2.676513671875, -2.5732421875, -2.469970703125, -2.36669921875, -2.263427734375, -2.16015625, -2.056884765625, -1.95361328125, -1.850341796875, -1.7470703125, -1.643798828125, -1.54052734375, -1.437255859375, -1.333984375, -1.230712890625, -1.12744140625, -1.024169921875, -0.9208984375, -0.817626953125, -0.71435546875, -0.611083984375, -0.5078125, -0.404541015625, -0.30126953125, -0.197998046875, -0.0947265625, 0.008544921875, 0.11181640625, 0.215087890625, 0.318359375, 0.421630859375, 0.52490234375, 0.628173828125, 0.7314453125, 0.834716796875, 0.93798828125, 1.041259765625, 1.14453125, 1.247802734375, 1.35107421875, 1.454345703125, 1.5576171875, 1.660888671875, 1.76416015625, 1.867431640625, 1.970703125, 2.073974609375, 2.17724609375, 2.280517578125, 2.3837890625, 2.487060546875, 2.59033203125, 2.693603515625, 2.796875, 2.900146484375, 3.00341796875, 3.106689453125, 3.2099609375, 3.313232421875, 3.41650390625, 3.519775390625, 3.623046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 8.0, 7.0, 12.0, 14.0, 22.0, 19.0, 27.0, 23.0, 35.0, 35.0, 25.0, 38.0, 48.0, 45.0, 44.0, 50.0, 60.0, 57.0, 40.0, 40.0, 47.0, 33.0, 32.0, 38.0, 28.0, 20.0, 18.0, 10.0, 22.0, 17.0, 15.0, 12.0, 9.0, 8.0, 4.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.427734375, -0.4135589599609375, -0.399383544921875, -0.3852081298828125, -0.37103271484375, -0.3568572998046875, -0.342681884765625, -0.3285064697265625, -0.3143310546875, -0.3001556396484375, -0.285980224609375, -0.2718048095703125, -0.25762939453125, -0.2434539794921875, -0.229278564453125, -0.2151031494140625, -0.200927734375, -0.1867523193359375, -0.172576904296875, -0.1584014892578125, -0.14422607421875, -0.1300506591796875, -0.115875244140625, -0.1016998291015625, -0.0875244140625, -0.0733489990234375, -0.059173583984375, -0.0449981689453125, -0.03082275390625, -0.0166473388671875, -0.002471923828125, 0.0117034912109375, 0.02587890625, 0.0400543212890625, 0.054229736328125, 0.0684051513671875, 0.08258056640625, 0.0967559814453125, 0.110931396484375, 0.1251068115234375, 0.1392822265625, 0.1534576416015625, 0.167633056640625, 0.1818084716796875, 0.19598388671875, 0.2101593017578125, 0.224334716796875, 0.2385101318359375, 0.252685546875, 0.2668609619140625, 0.281036376953125, 0.2952117919921875, 0.30938720703125, 0.3235626220703125, 0.337738037109375, 0.3519134521484375, 0.3660888671875, 0.3802642822265625, 0.394439697265625, 0.4086151123046875, 0.42279052734375, 0.4369659423828125, 0.451141357421875, 0.4653167724609375, 0.4794921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 12.0, 16.0, 23.0, 69.0, 254.0, 1629.0, 51602.0, 982087.0, 11797.0, 796.0, 136.0, 44.0, 24.0, 15.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.94427490234375, -3.7752685546875, -3.60626220703125, -3.437255859375, -3.26824951171875, -3.0992431640625, -2.93023681640625, -2.76123046875, -2.59222412109375, -2.4232177734375, -2.25421142578125, -2.085205078125, -1.91619873046875, -1.7471923828125, -1.57818603515625, -1.4091796875, -1.24017333984375, -1.0711669921875, -0.90216064453125, -0.733154296875, -0.56414794921875, -0.3951416015625, -0.22613525390625, -0.05712890625, 0.11187744140625, 0.2808837890625, 0.44989013671875, 0.618896484375, 0.78790283203125, 0.9569091796875, 1.12591552734375, 1.294921875, 1.46392822265625, 1.6329345703125, 1.80194091796875, 1.970947265625, 2.13995361328125, 2.3089599609375, 2.47796630859375, 2.64697265625, 2.81597900390625, 2.9849853515625, 3.15399169921875, 3.322998046875, 3.49200439453125, 3.6610107421875, 3.83001708984375, 3.9990234375, 4.16802978515625, 4.3370361328125, 4.50604248046875, 4.675048828125, 4.84405517578125, 5.0130615234375, 5.18206787109375, 5.35107421875, 5.52008056640625, 5.6890869140625, 5.85809326171875, 6.027099609375, 6.19610595703125, 6.3651123046875, 6.53411865234375, 6.703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 10.0, 12.0, 35.0, 34.0, 49.0, 67.0, 94.0, 93.0, 126.0, 109.0, 88.0, 77.0, 61.0, 32.0, 25.0, 15.0, 15.0, 15.0, 6.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.712841033935547e-05, -7.401220500469208e-05, -7.089599967002869e-05, -6.77797943353653e-05, -6.46635890007019e-05, -6.154738366603851e-05, -5.843117833137512e-05, -5.531497299671173e-05, -5.219876766204834e-05, -4.908256232738495e-05, -4.596635699272156e-05, -4.2850151658058167e-05, -3.9733946323394775e-05, -3.6617740988731384e-05, -3.350153565406799e-05, -3.0385330319404602e-05, -2.726912498474121e-05, -2.415291965007782e-05, -2.103671431541443e-05, -1.7920508980751038e-05, -1.4804303646087646e-05, -1.1688098311424255e-05, -8.571892976760864e-06, -5.455687642097473e-06, -2.339482307434082e-06, 7.767230272293091e-07, 3.8929283618927e-06, 7.009133696556091e-06, 1.0125339031219482e-05, 1.3241544365882874e-05, 1.6357749700546265e-05, 1.9473955035209656e-05, 2.2590160369873047e-05, 2.5706365704536438e-05, 2.882257103919983e-05, 3.193877637386322e-05, 3.505498170852661e-05, 3.817118704319e-05, 4.1287392377853394e-05, 4.4403597712516785e-05, 4.7519803047180176e-05, 5.063600838184357e-05, 5.375221371650696e-05, 5.686841905117035e-05, 5.998462438583374e-05, 6.310082972049713e-05, 6.621703505516052e-05, 6.933324038982391e-05, 7.24494457244873e-05, 7.55656510591507e-05, 7.868185639381409e-05, 8.179806172847748e-05, 8.491426706314087e-05, 8.803047239780426e-05, 9.114667773246765e-05, 9.426288306713104e-05, 9.737908840179443e-05, 0.00010049529373645782, 0.00010361149907112122, 0.00010672770440578461, 0.000109843909740448, 0.00011296011507511139, 0.00011607632040977478, 0.00011919252574443817, 0.00012230873107910156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 10.0, 8.0, 13.0, 23.0, 28.0, 39.0, 61.0, 82.0, 113.0, 196.0, 332.0, 599.0, 1069.0, 2217.0, 5237.0, 14456.0, 47671.0, 197377.0, 490614.0, 211850.0, 50863.0, 15236.0, 5477.0, 2337.0, 1121.0, 608.0, 348.0, 196.0, 118.0, 81.0, 52.0, 38.0, 26.0, 15.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1474609375, -1.11688232421875, -1.0863037109375, -1.05572509765625, -1.025146484375, -0.99456787109375, -0.9639892578125, -0.93341064453125, -0.90283203125, -0.87225341796875, -0.8416748046875, -0.81109619140625, -0.780517578125, -0.74993896484375, -0.7193603515625, -0.68878173828125, -0.658203125, -0.62762451171875, -0.5970458984375, -0.56646728515625, -0.535888671875, -0.50531005859375, -0.4747314453125, -0.44415283203125, -0.41357421875, -0.38299560546875, -0.3524169921875, -0.32183837890625, -0.291259765625, -0.26068115234375, -0.2301025390625, -0.19952392578125, -0.1689453125, -0.13836669921875, -0.1077880859375, -0.07720947265625, -0.046630859375, -0.01605224609375, 0.0145263671875, 0.04510498046875, 0.07568359375, 0.10626220703125, 0.1368408203125, 0.16741943359375, 0.197998046875, 0.22857666015625, 0.2591552734375, 0.28973388671875, 0.3203125, 0.35089111328125, 0.3814697265625, 0.41204833984375, 0.442626953125, 0.47320556640625, 0.5037841796875, 0.53436279296875, 0.56494140625, 0.59552001953125, 0.6260986328125, 0.65667724609375, 0.687255859375, 0.71783447265625, 0.7484130859375, 0.77899169921875, 0.8095703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 30.0, 40.0, 67.0, 97.0, 97.0, 126.0, 133.0, 114.0, 74.0, 64.0, 36.0, 36.0, 16.0, 16.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2123870849609375, -1.177703857421875, -1.1430206298828125, -1.10833740234375, -1.0736541748046875, -1.038970947265625, -1.0042877197265625, -0.9696044921875, -0.9349212646484375, -0.900238037109375, -0.8655548095703125, -0.83087158203125, -0.7961883544921875, -0.761505126953125, -0.7268218994140625, -0.692138671875, -0.6574554443359375, -0.622772216796875, -0.5880889892578125, -0.55340576171875, -0.5187225341796875, -0.484039306640625, -0.4493560791015625, -0.4146728515625, -0.3799896240234375, -0.345306396484375, -0.3106231689453125, -0.27593994140625, -0.2412567138671875, -0.206573486328125, -0.1718902587890625, -0.13720703125, -0.1025238037109375, -0.067840576171875, -0.0331573486328125, 0.00152587890625, 0.0362091064453125, 0.070892333984375, 0.1055755615234375, 0.1402587890625, 0.1749420166015625, 0.209625244140625, 0.2443084716796875, 0.27899169921875, 0.3136749267578125, 0.348358154296875, 0.3830413818359375, 0.417724609375, 0.4524078369140625, 0.487091064453125, 0.5217742919921875, 0.55645751953125, 0.5911407470703125, 0.625823974609375, 0.6605072021484375, 0.6951904296875, 0.7298736572265625, 0.764556884765625, 0.7992401123046875, 0.83392333984375, 0.8686065673828125, 0.903289794921875, 0.9379730224609375, 0.97265625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 24.0, 84.0, 253.0, 399.0, 168.0, 42.0, 16.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.457090377807617, -8.909775733947754, -8.36246109008789, -7.8151469230651855, -7.2678327560424805, -6.720518112182617, -6.173203468322754, -5.625888824462891, -5.0785746574401855, -4.531260013580322, -3.983945846557617, -3.436631202697754, -2.8893167972564697, -2.3420023918151855, -1.7946877479553223, -1.247373342514038, -0.7000589370727539, -0.15274447202682495, 0.394569993019104, 0.9418845176696777, 1.489198923110962, 2.036513328552246, 2.5838279724121094, 3.1311423778533936, 3.6784567832946777, 4.225771427154541, 4.773085594177246, 5.320400238037109, 5.867714881896973, 6.415029048919678, 6.962343692779541, 7.509657859802246, 8.05697250366211, 8.604287147521973, 9.151601791381836, 9.698915481567383, 10.246230125427246, 10.79354476928711, 11.340859413146973, 11.888174057006836, 12.435487747192383, 12.982802391052246, 13.53011703491211, 14.077430725097656, 14.62474536895752, 15.172060012817383, 15.719374656677246, 16.26668930053711, 16.814002990722656, 17.361316680908203, 17.908632278442383, 18.45594596862793, 19.00326156616211, 19.550575256347656, 20.097888946533203, 20.645204544067383, 21.192520141601562, 21.73983383178711, 22.28714942932129, 22.834463119506836, 23.381778717041016, 23.929092407226562, 24.47640609741211, 25.02372169494629, 25.571035385131836]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 17.0, 18.0, 25.0, 33.0, 37.0, 40.0, 55.0, 52.0, 53.0, 64.0, 57.0, 67.0, 73.0, 55.0, 60.0, 56.0, 36.0, 29.0, 28.0, 30.0, 19.0, 7.0, 6.0, 13.0, 8.0, 9.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.642788410186768, -4.488044738769531, -4.333301067352295, -4.178557872772217, -4.0238142013549805, -3.869070529937744, -3.714326858520508, -3.5595831871032715, -3.4048397541046143, -3.250096082687378, -3.0953526496887207, -2.9406089782714844, -2.785865306854248, -2.631121873855591, -2.4763782024383545, -2.3216347694396973, -2.166891098022461, -2.0121474266052246, -1.8574039936065674, -1.702660322189331, -1.5479167699813843, -1.3931732177734375, -1.2384295463562012, -1.0836859941482544, -0.9289424419403076, -0.7741988897323608, -0.6194552779197693, -0.4647116959095001, -0.30996811389923096, -0.15522456169128418, -0.00048094987869262695, 0.15426266193389893, 0.3090066909790039, 0.46375027298927307, 0.6184938549995422, 0.7732374668121338, 0.9279810190200806, 1.0827245712280273, 1.2374682426452637, 1.3922117948532104, 1.5469553470611572, 1.701698899269104, 1.8564424514770508, 2.011186122894287, 2.1659297943115234, 2.3206732273101807, 2.475416898727417, 2.630160331726074, 2.7849040031433105, 2.939647674560547, 3.094391107559204, 3.2491347789764404, 3.4038782119750977, 3.558621883392334, 3.7133655548095703, 3.8681092262268066, 4.022852897644043, 4.177596569061279, 4.332340240478516, 4.487083435058594, 4.64182710647583, 4.796570777893066, 4.951314449310303, 5.106058120727539, 5.260801315307617]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 14.0, 12.0, 18.0, 30.0, 37.0, 73.0, 82.0, 135.0, 219.0, 367.0, 598.0, 1088.0, 2333.0, 5585.0, 18394.0, 127608.0, 3879592.0, 131450.0, 17524.0, 5054.0, 2025.0, 897.0, 435.0, 251.0, 171.0, 89.0, 67.0, 35.0, 32.0, 14.0, 10.0, 12.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.820953369140625, -2.72198486328125, -2.623016357421875, -2.5240478515625, -2.425079345703125, -2.32611083984375, -2.227142333984375, -2.128173828125, -2.029205322265625, -1.93023681640625, -1.831268310546875, -1.7322998046875, -1.633331298828125, -1.53436279296875, -1.435394287109375, -1.33642578125, -1.237457275390625, -1.13848876953125, -1.039520263671875, -0.9405517578125, -0.841583251953125, -0.74261474609375, -0.643646240234375, -0.544677734375, -0.445709228515625, -0.34674072265625, -0.247772216796875, -0.1488037109375, -0.049835205078125, 0.04913330078125, 0.148101806640625, 0.2470703125, 0.346038818359375, 0.44500732421875, 0.543975830078125, 0.6429443359375, 0.741912841796875, 0.84088134765625, 0.939849853515625, 1.038818359375, 1.137786865234375, 1.23675537109375, 1.335723876953125, 1.4346923828125, 1.533660888671875, 1.63262939453125, 1.731597900390625, 1.83056640625, 1.929534912109375, 2.02850341796875, 2.127471923828125, 2.2264404296875, 2.325408935546875, 2.42437744140625, 2.523345947265625, 2.622314453125, 2.721282958984375, 2.82025146484375, 2.919219970703125, 3.0181884765625, 3.117156982421875, 3.21612548828125, 3.315093994140625, 3.4140625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 7.0, 7.0, 16.0, 15.0, 26.0, 29.0, 25.0, 54.0, 54.0, 79.0, 77.0, 83.0, 80.0, 80.0, 75.0, 61.0, 47.0, 42.0, 28.0, 26.0, 13.0, 15.0, 10.0, 5.0, 6.0, 9.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.111541748046875, -0.10833740234375, -0.105133056640625, -0.1019287109375, -0.098724365234375, -0.09552001953125, -0.092315673828125, -0.089111328125, -0.085906982421875, -0.08270263671875, -0.079498291015625, -0.0762939453125, -0.073089599609375, -0.06988525390625, -0.066680908203125, -0.0634765625, -0.060272216796875, -0.05706787109375, -0.053863525390625, -0.0506591796875, -0.047454833984375, -0.04425048828125, -0.041046142578125, -0.037841796875, -0.034637451171875, -0.03143310546875, -0.028228759765625, -0.0250244140625, -0.021820068359375, -0.01861572265625, -0.015411376953125, -0.01220703125, -0.009002685546875, -0.00579833984375, -0.002593994140625, 0.0006103515625, 0.003814697265625, 0.00701904296875, 0.010223388671875, 0.013427734375, 0.016632080078125, 0.01983642578125, 0.023040771484375, 0.0262451171875, 0.029449462890625, 0.03265380859375, 0.035858154296875, 0.0390625, 0.042266845703125, 0.04547119140625, 0.048675537109375, 0.0518798828125, 0.055084228515625, 0.05828857421875, 0.061492919921875, 0.064697265625, 0.067901611328125, 0.07110595703125, 0.074310302734375, 0.0775146484375, 0.080718994140625, 0.08392333984375, 0.087127685546875, 0.09033203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 13.0, 32.0, 23.0, 38.0, 55.0, 103.0, 166.0, 517.0, 9013.0, 4104932.0, 77430.0, 1229.0, 232.0, 133.0, 97.0, 62.0, 49.0, 31.0, 20.0, 11.0, 17.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.6484375, -10.341552734375, -10.03466796875, -9.727783203125, -9.4208984375, -9.114013671875, -8.80712890625, -8.500244140625, -8.193359375, -7.886474609375, -7.57958984375, -7.272705078125, -6.9658203125, -6.658935546875, -6.35205078125, -6.045166015625, -5.73828125, -5.431396484375, -5.12451171875, -4.817626953125, -4.5107421875, -4.203857421875, -3.89697265625, -3.590087890625, -3.283203125, -2.976318359375, -2.66943359375, -2.362548828125, -2.0556640625, -1.748779296875, -1.44189453125, -1.135009765625, -0.828125, -0.521240234375, -0.21435546875, 0.092529296875, 0.3994140625, 0.706298828125, 1.01318359375, 1.320068359375, 1.626953125, 1.933837890625, 2.24072265625, 2.547607421875, 2.8544921875, 3.161376953125, 3.46826171875, 3.775146484375, 4.08203125, 4.388916015625, 4.69580078125, 5.002685546875, 5.3095703125, 5.616455078125, 5.92333984375, 6.230224609375, 6.537109375, 6.843994140625, 7.15087890625, 7.457763671875, 7.7646484375, 8.071533203125, 8.37841796875, 8.685302734375, 8.9921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 6.0, 9.0, 10.0, 12.0, 24.0, 40.0, 57.0, 92.0, 104.0, 201.0, 345.0, 881.0, 1267.0, 430.0, 239.0, 135.0, 66.0, 45.0, 31.0, 20.0, 15.0, 19.0, 7.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.24686050415039062, -0.23664093017578125, -0.22642135620117188, -0.2162017822265625, -0.20598220825195312, -0.19576263427734375, -0.18554306030273438, -0.175323486328125, -0.16510391235351562, -0.15488433837890625, -0.14466476440429688, -0.1344451904296875, -0.12422561645507812, -0.11400604248046875, -0.10378646850585938, -0.09356689453125, -0.08334732055664062, -0.07312774658203125, -0.06290817260742188, -0.0526885986328125, -0.042469024658203125, -0.03224945068359375, -0.022029876708984375, -0.011810302734375, -0.001590728759765625, 0.00862884521484375, 0.018848419189453125, 0.0290679931640625, 0.039287567138671875, 0.04950714111328125, 0.059726715087890625, 0.0699462890625, 0.08016586303710938, 0.09038543701171875, 0.10060501098632812, 0.1108245849609375, 0.12104415893554688, 0.13126373291015625, 0.14148330688476562, 0.151702880859375, 0.16192245483398438, 0.17214202880859375, 0.18236160278320312, 0.1925811767578125, 0.20280075073242188, 0.21302032470703125, 0.22323989868164062, 0.23345947265625, 0.24367904663085938, 0.25389862060546875, 0.2641181945800781, 0.2743377685546875, 0.2845573425292969, 0.29477691650390625, 0.3049964904785156, 0.315216064453125, 0.3254356384277344, 0.33565521240234375, 0.3458747863769531, 0.3560943603515625, 0.3663139343261719, 0.37653350830078125, 0.3867530822753906, 0.39697265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 11.0, 13.0, 36.0, 78.0, 145.0, 233.0, 227.0, 141.0, 60.0, 39.0, 11.0, 9.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.055519104003906, -3.94917368888855, -3.8428282737731934, -3.736482620239258, -3.6301372051239014, -3.523791790008545, -3.4174463748931885, -3.311100959777832, -3.2047553062438965, -3.09840989112854, -2.9920644760131836, -2.885718822479248, -2.7793734073638916, -2.673027992248535, -2.5666825771331787, -2.4603371620178223, -2.353991746902466, -2.2476463317871094, -2.141300916671753, -2.0349555015563965, -1.928609848022461, -1.8222644329071045, -1.715919017791748, -1.6095736026763916, -1.5032280683517456, -1.3968826532363892, -1.2905371189117432, -1.1841917037963867, -1.0778462886810303, -0.9715007543563843, -0.8651553392410278, -0.7588098645210266, -0.6524643898010254, -0.5461189150810242, -0.43977347016334534, -0.3334280252456665, -0.22708255052566528, -0.12073707580566406, -0.014391660690307617, 0.0919538140296936, 0.19829928874969482, 0.30464476346969604, 0.4109902083873749, 0.5173356533050537, 0.6236811280250549, 0.7300266027450562, 0.8363720178604126, 0.9427174925804138, 1.049062967300415, 1.1554083824157715, 1.2617539167404175, 1.368099331855774, 1.47444486618042, 1.5807902812957764, 1.6871356964111328, 1.7934811115264893, 1.8998266458511353, 2.0061721801757812, 2.1125175952911377, 2.218863010406494, 2.3252084255218506, 2.431553840637207, 2.5378994941711426, 2.644244909286499, 2.7505903244018555]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 10.0, 8.0, 25.0, 26.0, 24.0, 23.0, 39.0, 43.0, 42.0, 39.0, 46.0, 46.0, 55.0, 58.0, 50.0, 61.0, 53.0, 52.0, 38.0, 48.0, 32.0, 38.0, 30.0, 20.0, 17.0, 13.0, 13.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0891273021697998, -1.054241418838501, -1.0193555355072021, -0.9844696521759033, -0.9495837688446045, -0.9146978855133057, -0.8798120021820068, -0.844926118850708, -0.8100402355194092, -0.7751543521881104, -0.7402684688568115, -0.7053825855255127, -0.6704967021942139, -0.635610818862915, -0.6007249355316162, -0.5658390522003174, -0.5309531092643738, -0.49606722593307495, -0.4611813426017761, -0.4262954592704773, -0.39140957593917847, -0.35652369260787964, -0.3216377794742584, -0.2867518961429596, -0.25186601281166077, -0.21698012948036194, -0.1820942461490631, -0.1472083479166031, -0.11232246458530426, -0.07743658125400543, -0.04255068302154541, -0.007664799690246582, 0.027221083641052246, 0.06210697069764137, 0.0969928577542305, 0.13187874853610992, 0.16676463186740875, 0.20165051519870758, 0.2365364134311676, 0.27142229676246643, 0.30630818009376526, 0.3411940634250641, 0.3760799467563629, 0.41096585988998413, 0.44585174322128296, 0.4807376265525818, 0.5156235098838806, 0.5505093932151794, 0.5853952765464783, 0.6202811598777771, 0.6551670432090759, 0.6900529265403748, 0.7249388098716736, 0.7598246932029724, 0.794710636138916, 0.8295965194702148, 0.8644824028015137, 0.8993682861328125, 0.9342541694641113, 0.9691400527954102, 1.004025936126709, 1.0389118194580078, 1.0737977027893066, 1.1086835861206055, 1.1435694694519043]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 21.0, 20.0, 19.0, 37.0, 40.0, 65.0, 91.0, 127.0, 200.0, 300.0, 469.0, 741.0, 1206.0, 2181.0, 4363.0, 8825.0, 20638.0, 54194.0, 149385.0, 346597.0, 280558.0, 108194.0, 39436.0, 15770.0, 6825.0, 3350.0, 1889.0, 1046.0, 637.0, 411.0, 265.0, 206.0, 117.0, 83.0, 67.0, 41.0, 30.0, 27.0, 20.0, 14.0, 11.0, 7.0, 11.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7763671875, -0.7503509521484375, -0.724334716796875, -0.6983184814453125, -0.67230224609375, -0.6462860107421875, -0.620269775390625, -0.5942535400390625, -0.5682373046875, -0.5422210693359375, -0.516204833984375, -0.4901885986328125, -0.46417236328125, -0.4381561279296875, -0.412139892578125, -0.3861236572265625, -0.360107421875, -0.3340911865234375, -0.308074951171875, -0.2820587158203125, -0.25604248046875, -0.2300262451171875, -0.204010009765625, -0.1779937744140625, -0.1519775390625, -0.1259613037109375, -0.099945068359375, -0.0739288330078125, -0.04791259765625, -0.0218963623046875, 0.004119873046875, 0.0301361083984375, 0.05615234375, 0.0821685791015625, 0.108184814453125, 0.1342010498046875, 0.16021728515625, 0.1862335205078125, 0.212249755859375, 0.2382659912109375, 0.2642822265625, 0.2902984619140625, 0.316314697265625, 0.3423309326171875, 0.36834716796875, 0.3943634033203125, 0.420379638671875, 0.4463958740234375, 0.472412109375, 0.4984283447265625, 0.524444580078125, 0.5504608154296875, 0.57647705078125, 0.6024932861328125, 0.628509521484375, 0.6545257568359375, 0.6805419921875, 0.7065582275390625, 0.732574462890625, 0.7585906982421875, 0.78460693359375, 0.8106231689453125, 0.836639404296875, 0.8626556396484375, 0.888671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 6.0, 10.0, 5.0, 5.0, 16.0, 13.0, 18.0, 30.0, 34.0, 31.0, 42.0, 65.0, 70.0, 66.0, 88.0, 87.0, 78.0, 60.0, 42.0, 49.0, 47.0, 38.0, 30.0, 24.0, 14.0, 10.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1165771484375, -0.11322689056396484, -0.10987663269042969, -0.10652637481689453, -0.10317611694335938, -0.09982585906982422, -0.09647560119628906, -0.0931253433227539, -0.08977508544921875, -0.0864248275756836, -0.08307456970214844, -0.07972431182861328, -0.07637405395507812, -0.07302379608154297, -0.06967353820800781, -0.06632328033447266, -0.0629730224609375, -0.059622764587402344, -0.05627250671386719, -0.05292224884033203, -0.049571990966796875, -0.04622173309326172, -0.04287147521972656, -0.039521217346191406, -0.03617095947265625, -0.032820701599121094, -0.029470443725585938, -0.02612018585205078, -0.022769927978515625, -0.01941967010498047, -0.016069412231445312, -0.012719154357910156, -0.009368896484375, -0.006018638610839844, -0.0026683807373046875, 0.0006818771362304688, 0.004032135009765625, 0.007382392883300781, 0.010732650756835938, 0.014082908630371094, 0.01743316650390625, 0.020783424377441406, 0.024133682250976562, 0.02748394012451172, 0.030834197998046875, 0.03418445587158203, 0.03753471374511719, 0.040884971618652344, 0.0442352294921875, 0.047585487365722656, 0.05093574523925781, 0.05428600311279297, 0.057636260986328125, 0.06098651885986328, 0.06433677673339844, 0.0676870346069336, 0.07103729248046875, 0.0743875503540039, 0.07773780822753906, 0.08108806610107422, 0.08443832397460938, 0.08778858184814453, 0.09113883972167969, 0.09448909759521484, 0.09783935546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 7.0, 17.0, 31.0, 28.0, 36.0, 68.0, 67.0, 94.0, 164.0, 220.0, 306.0, 479.0, 739.0, 1301.0, 2257.0, 4021.0, 7199.0, 13490.0, 25959.0, 52703.0, 105703.0, 191621.0, 247630.0, 186587.0, 102257.0, 50841.0, 25312.0, 13022.0, 6823.0, 3783.0, 2191.0, 1279.0, 748.0, 474.0, 314.0, 217.0, 146.0, 117.0, 76.0, 61.0, 54.0, 31.0, 17.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.6591796875, -0.6382369995117188, -0.6172943115234375, -0.5963516235351562, -0.575408935546875, -0.5544662475585938, -0.5335235595703125, -0.5125808715820312, -0.49163818359375, -0.47069549560546875, -0.4497528076171875, -0.42881011962890625, -0.407867431640625, -0.38692474365234375, -0.3659820556640625, -0.34503936767578125, -0.3240966796875, -0.30315399169921875, -0.2822113037109375, -0.26126861572265625, -0.240325927734375, -0.21938323974609375, -0.1984405517578125, -0.17749786376953125, -0.15655517578125, -0.13561248779296875, -0.1146697998046875, -0.09372711181640625, -0.072784423828125, -0.05184173583984375, -0.0308990478515625, -0.00995635986328125, 0.010986328125, 0.03192901611328125, 0.0528717041015625, 0.07381439208984375, 0.094757080078125, 0.11569976806640625, 0.1366424560546875, 0.15758514404296875, 0.17852783203125, 0.19947052001953125, 0.2204132080078125, 0.24135589599609375, 0.262298583984375, 0.28324127197265625, 0.3041839599609375, 0.32512664794921875, 0.3460693359375, 0.36701202392578125, 0.3879547119140625, 0.40889739990234375, 0.429840087890625, 0.45078277587890625, 0.4717254638671875, 0.49266815185546875, 0.51361083984375, 0.5345535278320312, 0.5554962158203125, 0.5764389038085938, 0.597381591796875, 0.6183242797851562, 0.6392669677734375, 0.6602096557617188, 0.68115234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 10.0, 6.0, 6.0, 11.0, 24.0, 17.0, 9.0, 25.0, 25.0, 30.0, 34.0, 37.0, 44.0, 45.0, 39.0, 26.0, 50.0, 52.0, 40.0, 46.0, 51.0, 45.0, 45.0, 43.0, 28.0, 35.0, 21.0, 31.0, 25.0, 19.0, 21.0, 16.0, 7.0, 8.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5128326416015625, -0.494415283203125, -0.4759979248046875, -0.45758056640625, -0.4391632080078125, -0.420745849609375, -0.4023284912109375, -0.3839111328125, -0.3654937744140625, -0.347076416015625, -0.3286590576171875, -0.31024169921875, -0.2918243408203125, -0.273406982421875, -0.2549896240234375, -0.236572265625, -0.2181549072265625, -0.199737548828125, -0.1813201904296875, -0.16290283203125, -0.1444854736328125, -0.126068115234375, -0.1076507568359375, -0.0892333984375, -0.0708160400390625, -0.052398681640625, -0.0339813232421875, -0.01556396484375, 0.0028533935546875, 0.021270751953125, 0.0396881103515625, 0.05810546875, 0.0765228271484375, 0.094940185546875, 0.1133575439453125, 0.13177490234375, 0.1501922607421875, 0.168609619140625, 0.1870269775390625, 0.2054443359375, 0.2238616943359375, 0.242279052734375, 0.2606964111328125, 0.27911376953125, 0.2975311279296875, 0.315948486328125, 0.3343658447265625, 0.352783203125, 0.3712005615234375, 0.389617919921875, 0.4080352783203125, 0.42645263671875, 0.4448699951171875, 0.463287353515625, 0.4817047119140625, 0.5001220703125, 0.5185394287109375, 0.536956787109375, 0.5553741455078125, 0.57379150390625, 0.5922088623046875, 0.610626220703125, 0.6290435791015625, 0.6474609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 7.0, 8.0, 9.0, 21.0, 26.0, 44.0, 88.0, 160.0, 396.0, 1124.0, 3912.0, 26767.0, 656836.0, 339562.0, 15379.0, 2771.0, 794.0, 319.0, 141.0, 77.0, 41.0, 15.0, 21.0, 16.0, 8.0, 6.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.49298095703125, -2.4215087890625, -2.35003662109375, -2.278564453125, -2.20709228515625, -2.1356201171875, -2.06414794921875, -1.99267578125, -1.92120361328125, -1.8497314453125, -1.77825927734375, -1.706787109375, -1.63531494140625, -1.5638427734375, -1.49237060546875, -1.4208984375, -1.34942626953125, -1.2779541015625, -1.20648193359375, -1.135009765625, -1.06353759765625, -0.9920654296875, -0.92059326171875, -0.84912109375, -0.77764892578125, -0.7061767578125, -0.63470458984375, -0.563232421875, -0.49176025390625, -0.4202880859375, -0.34881591796875, -0.27734375, -0.20587158203125, -0.1343994140625, -0.06292724609375, 0.008544921875, 0.08001708984375, 0.1514892578125, 0.22296142578125, 0.29443359375, 0.36590576171875, 0.4373779296875, 0.50885009765625, 0.580322265625, 0.65179443359375, 0.7232666015625, 0.79473876953125, 0.8662109375, 0.93768310546875, 1.0091552734375, 1.08062744140625, 1.152099609375, 1.22357177734375, 1.2950439453125, 1.36651611328125, 1.43798828125, 1.50946044921875, 1.5809326171875, 1.65240478515625, 1.723876953125, 1.79534912109375, 1.8668212890625, 1.93829345703125, 2.009765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 7.0, 14.0, 23.0, 22.0, 58.0, 54.0, 100.0, 100.0, 105.0, 91.0, 116.0, 88.0, 59.0, 56.0, 26.0, 15.0, 12.0, 9.0, 7.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.72747802734375e-05, -9.3020498752594e-05, -8.876621723175049e-05, -8.451193571090698e-05, -8.025765419006348e-05, -7.600337266921997e-05, -7.174909114837646e-05, -6.749480962753296e-05, -6.324052810668945e-05, -5.898624658584595e-05, -5.473196506500244e-05, -5.0477683544158936e-05, -4.622340202331543e-05, -4.1969120502471924e-05, -3.771483898162842e-05, -3.346055746078491e-05, -2.9206275939941406e-05, -2.49519944190979e-05, -2.0697712898254395e-05, -1.644343137741089e-05, -1.2189149856567383e-05, -7.934868335723877e-06, -3.680586814880371e-06, 5.736947059631348e-07, 4.827976226806641e-06, 9.082257747650146e-06, 1.3336539268493652e-05, 1.7590820789337158e-05, 2.1845102310180664e-05, 2.609938383102417e-05, 3.0353665351867676e-05, 3.460794687271118e-05, 3.886222839355469e-05, 4.311650991439819e-05, 4.73707914352417e-05, 5.1625072956085205e-05, 5.587935447692871e-05, 6.013363599777222e-05, 6.438791751861572e-05, 6.864219903945923e-05, 7.289648056030273e-05, 7.715076208114624e-05, 8.140504360198975e-05, 8.565932512283325e-05, 8.991360664367676e-05, 9.416788816452026e-05, 9.842216968536377e-05, 0.00010267645120620728, 0.00010693073272705078, 0.00011118501424789429, 0.00011543929576873779, 0.0001196935772895813, 0.0001239478588104248, 0.0001282021403312683, 0.00013245642185211182, 0.00013671070337295532, 0.00014096498489379883, 0.00014521926641464233, 0.00014947354793548584, 0.00015372782945632935, 0.00015798211097717285, 0.00016223639249801636, 0.00016649067401885986, 0.00017074495553970337, 0.00017499923706054688]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 22.0, 29.0, 44.0, 65.0, 97.0, 185.0, 500.0, 2762.0, 60308.0, 950455.0, 31231.0, 2016.0, 445.0, 182.0, 94.0, 58.0, 22.0, 14.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.755859375, -3.658111572265625, -3.56036376953125, -3.462615966796875, -3.3648681640625, -3.267120361328125, -3.16937255859375, -3.071624755859375, -2.973876953125, -2.876129150390625, -2.77838134765625, -2.680633544921875, -2.5828857421875, -2.485137939453125, -2.38739013671875, -2.289642333984375, -2.19189453125, -2.094146728515625, -1.99639892578125, -1.898651123046875, -1.8009033203125, -1.703155517578125, -1.60540771484375, -1.507659912109375, -1.409912109375, -1.312164306640625, -1.21441650390625, -1.116668701171875, -1.0189208984375, -0.921173095703125, -0.82342529296875, -0.725677490234375, -0.6279296875, -0.530181884765625, -0.43243408203125, -0.334686279296875, -0.2369384765625, -0.139190673828125, -0.04144287109375, 0.056304931640625, 0.154052734375, 0.251800537109375, 0.34954833984375, 0.447296142578125, 0.5450439453125, 0.642791748046875, 0.74053955078125, 0.838287353515625, 0.93603515625, 1.033782958984375, 1.13153076171875, 1.229278564453125, 1.3270263671875, 1.424774169921875, 1.52252197265625, 1.620269775390625, 1.718017578125, 1.815765380859375, 1.91351318359375, 2.011260986328125, 2.1090087890625, 2.206756591796875, 2.30450439453125, 2.402252197265625, 2.5]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 13.0, 42.0, 98.0, 183.0, 269.0, 200.0, 97.0, 51.0, 20.0, 15.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.9740142822265625, -1.926544189453125, -1.8790740966796875, -1.83160400390625, -1.7841339111328125, -1.736663818359375, -1.6891937255859375, -1.6417236328125, -1.5942535400390625, -1.546783447265625, -1.4993133544921875, -1.45184326171875, -1.4043731689453125, -1.356903076171875, -1.3094329833984375, -1.261962890625, -1.2144927978515625, -1.167022705078125, -1.1195526123046875, -1.07208251953125, -1.0246124267578125, -0.977142333984375, -0.9296722412109375, -0.8822021484375, -0.8347320556640625, -0.787261962890625, -0.7397918701171875, -0.69232177734375, -0.6448516845703125, -0.597381591796875, -0.5499114990234375, -0.50244140625, -0.4549713134765625, -0.407501220703125, -0.3600311279296875, -0.31256103515625, -0.2650909423828125, -0.217620849609375, -0.1701507568359375, -0.1226806640625, -0.0752105712890625, -0.027740478515625, 0.0197296142578125, 0.06719970703125, 0.1146697998046875, 0.162139892578125, 0.2096099853515625, 0.257080078125, 0.3045501708984375, 0.352020263671875, 0.3994903564453125, 0.44696044921875, 0.4944305419921875, 0.541900634765625, 0.5893707275390625, 0.6368408203125, 0.6843109130859375, 0.731781005859375, 0.7792510986328125, 0.82672119140625, 0.8741912841796875, 0.921661376953125, 0.9691314697265625, 1.0166015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 11.0, 19.0, 34.0, 204.0, 431.0, 221.0, 58.0, 21.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.39303970336914, -33.69886779785156, -33.00469970703125, -32.31052780151367, -31.616355895996094, -30.92218589782715, -30.228015899658203, -29.533843994140625, -28.839672088623047, -28.1455020904541, -27.451330184936523, -26.757160186767578, -26.06298828125, -25.368818283081055, -24.67464828491211, -23.98047637939453, -23.286306381225586, -22.59213638305664, -21.897964477539062, -21.203794479370117, -20.50962257385254, -19.815452575683594, -19.121280670166016, -18.42711067199707, -17.732940673828125, -17.03877067565918, -16.3445987701416, -15.650428771972656, -14.956256866455078, -14.262086868286133, -13.567915916442871, -12.87374496459961, -12.179571151733398, -11.485400199890137, -10.791229248046875, -10.09705924987793, -9.402887344360352, -8.708717346191406, -8.014546394348145, -7.320375442504883, -6.626204490661621, -5.932033538818359, -5.237862586975098, -4.543692111968994, -3.8495211601257324, -3.1553502082824707, -2.461179733276367, -1.7670087814331055, -1.0728378295898438, -0.3786669969558716, 0.3155038356781006, 1.0096745491027832, 1.703845500946045, 2.3980164527893066, 3.09218692779541, 3.786357879638672, 4.480528831481934, 5.174699783325195, 5.868870735168457, 6.5630412101745605, 7.257212162017822, 7.951383113861084, 8.645553588867188, 9.33972454071045, 10.033895492553711]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 13.0, 5.0, 20.0, 30.0, 18.0, 34.0, 34.0, 39.0, 44.0, 62.0, 67.0, 66.0, 60.0, 62.0, 64.0, 56.0, 55.0, 44.0, 52.0, 36.0, 24.0, 26.0, 13.0, 14.0, 14.0, 9.0, 8.0, 1.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.47700834274292, -5.293737888336182, -5.110467433929443, -4.927196979522705, -4.743926525115967, -4.5606560707092285, -4.377385139465332, -4.194114685058594, -4.0108442306518555, -3.827573776245117, -3.644303321838379, -3.4610328674316406, -3.2777624130249023, -3.094491958618164, -2.9112212657928467, -2.7279508113861084, -2.544680595397949, -2.361410140991211, -2.1781396865844727, -1.9948691129684448, -1.8115986585617065, -1.6283282041549683, -1.4450576305389404, -1.2617871761322021, -1.0785167217254639, -0.8952462673187256, -0.7119757533073425, -0.5287052392959595, -0.3454347848892212, -0.1621643304824829, 0.021106243133544922, 0.2043766975402832, 0.3876466751098633, 0.5709171295166016, 0.7541876435279846, 0.9374581575393677, 1.120728611946106, 1.3039990663528442, 1.487269639968872, 1.6705400943756104, 1.8538105487823486, 2.037081003189087, 2.220351457595825, 2.4036221504211426, 2.586892604827881, 2.770163059234619, 2.9534335136413574, 3.1367039680480957, 3.319974422454834, 3.5032448768615723, 3.6865153312683105, 3.869785785675049, 4.053056240081787, 4.236326694488525, 4.419597625732422, 4.60286808013916, 4.786138534545898, 4.969408988952637, 5.152679443359375, 5.335949897766113, 5.519220352172852, 5.70249080657959, 5.885761260986328, 6.069031715393066, 6.252302169799805]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 14.0, 23.0, 34.0, 77.0, 132.0, 307.0, 841.0, 3226.0, 29911.0, 4010883.0, 139240.0, 7537.0, 1293.0, 401.0, 153.0, 67.0, 52.0, 23.0, 13.0, 11.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3828125, -8.141357421875, -7.89990234375, -7.658447265625, -7.4169921875, -7.175537109375, -6.93408203125, -6.692626953125, -6.451171875, -6.209716796875, -5.96826171875, -5.726806640625, -5.4853515625, -5.243896484375, -5.00244140625, -4.760986328125, -4.51953125, -4.278076171875, -4.03662109375, -3.795166015625, -3.5537109375, -3.312255859375, -3.07080078125, -2.829345703125, -2.587890625, -2.346435546875, -2.10498046875, -1.863525390625, -1.6220703125, -1.380615234375, -1.13916015625, -0.897705078125, -0.65625, -0.414794921875, -0.17333984375, 0.068115234375, 0.3095703125, 0.551025390625, 0.79248046875, 1.033935546875, 1.275390625, 1.516845703125, 1.75830078125, 1.999755859375, 2.2412109375, 2.482666015625, 2.72412109375, 2.965576171875, 3.20703125, 3.448486328125, 3.68994140625, 3.931396484375, 4.1728515625, 4.414306640625, 4.65576171875, 4.897216796875, 5.138671875, 5.380126953125, 5.62158203125, 5.863037109375, 6.1044921875, 6.345947265625, 6.58740234375, 6.828857421875, 7.0703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 15.0, 24.0, 43.0, 45.0, 60.0, 72.0, 83.0, 92.0, 107.0, 85.0, 90.0, 67.0, 50.0, 39.0, 33.0, 18.0, 16.0, 13.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20661544799804688, -0.20021820068359375, -0.19382095336914062, -0.1874237060546875, -0.18102645874023438, -0.17462921142578125, -0.16823196411132812, -0.161834716796875, -0.15543746948242188, -0.14904022216796875, -0.14264297485351562, -0.1362457275390625, -0.12984848022460938, -0.12345123291015625, -0.11705398559570312, -0.11065673828125, -0.10425949096679688, -0.09786224365234375, -0.09146499633789062, -0.0850677490234375, -0.07867050170898438, -0.07227325439453125, -0.06587600708007812, -0.059478759765625, -0.053081512451171875, -0.04668426513671875, -0.040287017822265625, -0.0338897705078125, -0.027492523193359375, -0.02109527587890625, -0.014698028564453125, -0.00830078125, -0.001903533935546875, 0.00449371337890625, 0.010890960693359375, 0.0172882080078125, 0.023685455322265625, 0.03008270263671875, 0.036479949951171875, 0.042877197265625, 0.049274444580078125, 0.05567169189453125, 0.062068939208984375, 0.0684661865234375, 0.07486343383789062, 0.08126068115234375, 0.08765792846679688, 0.09405517578125, 0.10045242309570312, 0.10684967041015625, 0.11324691772460938, 0.1196441650390625, 0.12604141235351562, 0.13243865966796875, 0.13883590698242188, 0.145233154296875, 0.15163040161132812, 0.15802764892578125, 0.16442489624023438, 0.1708221435546875, 0.17721939086914062, 0.18361663818359375, 0.19001388549804688, 0.1964111328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 15.0, 27.0, 71.0, 155.0, 380.0, 973.0, 2950.0, 11206.0, 61554.0, 1511884.0, 2516427.0, 70878.0, 12641.0, 3321.0, 1074.0, 389.0, 171.0, 76.0, 36.0, 18.0, 12.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.807586669921875, -3.71478271484375, -3.621978759765625, -3.5291748046875, -3.436370849609375, -3.34356689453125, -3.250762939453125, -3.157958984375, -3.065155029296875, -2.97235107421875, -2.879547119140625, -2.7867431640625, -2.693939208984375, -2.60113525390625, -2.508331298828125, -2.41552734375, -2.322723388671875, -2.22991943359375, -2.137115478515625, -2.0443115234375, -1.951507568359375, -1.85870361328125, -1.765899658203125, -1.673095703125, -1.580291748046875, -1.48748779296875, -1.394683837890625, -1.3018798828125, -1.209075927734375, -1.11627197265625, -1.023468017578125, -0.9306640625, -0.837860107421875, -0.74505615234375, -0.652252197265625, -0.5594482421875, -0.466644287109375, -0.37384033203125, -0.281036376953125, -0.188232421875, -0.095428466796875, -0.00262451171875, 0.090179443359375, 0.1829833984375, 0.275787353515625, 0.36859130859375, 0.461395263671875, 0.55419921875, 0.647003173828125, 0.73980712890625, 0.832611083984375, 0.9254150390625, 1.018218994140625, 1.11102294921875, 1.203826904296875, 1.296630859375, 1.389434814453125, 1.48223876953125, 1.575042724609375, 1.6678466796875, 1.760650634765625, 1.85345458984375, 1.946258544921875, 2.0390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 9.0, 3.0, 9.0, 15.0, 14.0, 14.0, 23.0, 32.0, 37.0, 47.0, 103.0, 158.0, 268.0, 573.0, 1511.0, 534.0, 218.0, 143.0, 87.0, 59.0, 49.0, 41.0, 26.0, 19.0, 19.0, 14.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.406005859375, -0.39488983154296875, -0.3837738037109375, -0.37265777587890625, -0.361541748046875, -0.35042572021484375, -0.3393096923828125, -0.32819366455078125, -0.31707763671875, -0.30596160888671875, -0.2948455810546875, -0.28372955322265625, -0.272613525390625, -0.26149749755859375, -0.2503814697265625, -0.23926544189453125, -0.2281494140625, -0.21703338623046875, -0.2059173583984375, -0.19480133056640625, -0.183685302734375, -0.17256927490234375, -0.1614532470703125, -0.15033721923828125, -0.13922119140625, -0.12810516357421875, -0.1169891357421875, -0.10587310791015625, -0.094757080078125, -0.08364105224609375, -0.0725250244140625, -0.06140899658203125, -0.05029296875, -0.03917694091796875, -0.0280609130859375, -0.01694488525390625, -0.005828857421875, 0.00528717041015625, 0.0164031982421875, 0.02751922607421875, 0.03863525390625, 0.04975128173828125, 0.0608673095703125, 0.07198333740234375, 0.083099365234375, 0.09421539306640625, 0.1053314208984375, 0.11644744873046875, 0.1275634765625, 0.13867950439453125, 0.1497955322265625, 0.16091156005859375, 0.172027587890625, 0.18314361572265625, 0.1942596435546875, 0.20537567138671875, 0.21649169921875, 0.22760772705078125, 0.2387237548828125, 0.24983978271484375, 0.260955810546875, 0.27207183837890625, 0.2831878662109375, 0.29430389404296875, 0.305419921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 9.0, 25.0, 85.0, 223.0, 340.0, 219.0, 64.0, 31.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.954348564147949, -5.7595438957214355, -5.56473970413208, -5.369935035705566, -5.175130844116211, -4.980326175689697, -4.785521507263184, -4.590717315673828, -4.3959126472473145, -4.201107978820801, -4.006303787231445, -3.8114991188049316, -3.616694688796997, -3.4218902587890625, -3.227085590362549, -3.0322811603546143, -2.8374767303466797, -2.642672300338745, -2.4478678703308105, -2.253063201904297, -2.0582587718963623, -1.8634543418884277, -1.6686497926712036, -1.4738452434539795, -1.279040813446045, -1.0842363834381104, -0.8894318342208862, -0.6946273446083069, -0.49982285499572754, -0.3050183653831482, -0.11021387577056885, 0.08459067344665527, 0.27939558029174805, 0.4742000699043274, 0.6690045595169067, 0.8638090491294861, 1.0586135387420654, 1.25341796875, 1.4482225179672241, 1.6430270671844482, 1.8378314971923828, 2.0326359272003174, 2.227440357208252, 2.4222450256347656, 2.6170494556427, 2.8118538856506348, 3.0066585540771484, 3.201462984085083, 3.3962674140930176, 3.591071844100952, 3.7858762741088867, 3.9806809425354004, 4.175485610961914, 4.3702898025512695, 4.565094470977783, 4.759899139404297, 4.954703330993652, 5.149507999420166, 5.3443121910095215, 5.539116859436035, 5.733921051025391, 5.928725719451904, 6.123530387878418, 6.318334579467773, 6.513139247894287]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 5.0, 12.0, 19.0, 24.0, 25.0, 37.0, 46.0, 50.0, 71.0, 62.0, 70.0, 76.0, 80.0, 73.0, 59.0, 64.0, 54.0, 53.0, 28.0, 31.0, 16.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1704611778259277, -2.0985894203186035, -2.0267179012298584, -1.9548462629318237, -1.882974624633789, -1.8111029863357544, -1.7392313480377197, -1.667359709739685, -1.5954880714416504, -1.5236164331436157, -1.451744794845581, -1.3798731565475464, -1.3080015182495117, -1.236129879951477, -1.1642582416534424, -1.0923866033554077, -1.020514965057373, -0.9486433267593384, -0.8767716884613037, -0.804900050163269, -0.7330284118652344, -0.6611567735671997, -0.589285135269165, -0.5174134969711304, -0.4455418586730957, -0.37367022037506104, -0.30179858207702637, -0.2299269437789917, -0.15805530548095703, -0.08618366718292236, -0.014312028884887695, 0.05755960941314697, 0.12943124771118164, 0.2013028860092163, 0.273174524307251, 0.34504616260528564, 0.4169178009033203, 0.488789439201355, 0.5606610774993896, 0.6325327157974243, 0.704404354095459, 0.7762759923934937, 0.8481476306915283, 0.920019268989563, 0.9918909072875977, 1.0637625455856323, 1.135634183883667, 1.2075058221817017, 1.2793774604797363, 1.351249098777771, 1.4231207370758057, 1.4949923753738403, 1.566864013671875, 1.6387356519699097, 1.7106072902679443, 1.782478928565979, 1.8543505668640137, 1.9262222051620483, 1.998093843460083, 2.069965362548828, 2.1418371200561523, 2.2137088775634766, 2.2855803966522217, 2.357451915740967, 2.429323673248291]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 19.0, 25.0, 25.0, 35.0, 46.0, 69.0, 103.0, 131.0, 206.0, 270.0, 440.0, 668.0, 1161.0, 2210.0, 5278.0, 15056.0, 59429.0, 276037.0, 489519.0, 147496.0, 32568.0, 9647.0, 3667.0, 1782.0, 934.0, 541.0, 371.0, 219.0, 125.0, 124.0, 73.0, 58.0, 39.0, 31.0, 34.0, 15.0, 19.0, 12.0, 14.0, 8.0, 5.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.3333892822265625, -1.287872314453125, -1.2423553466796875, -1.19683837890625, -1.1513214111328125, -1.105804443359375, -1.0602874755859375, -1.0147705078125, -0.9692535400390625, -0.923736572265625, -0.8782196044921875, -0.83270263671875, -0.7871856689453125, -0.741668701171875, -0.6961517333984375, -0.650634765625, -0.6051177978515625, -0.559600830078125, -0.5140838623046875, -0.46856689453125, -0.4230499267578125, -0.377532958984375, -0.3320159912109375, -0.2864990234375, -0.2409820556640625, -0.195465087890625, -0.1499481201171875, -0.10443115234375, -0.0589141845703125, -0.013397216796875, 0.0321197509765625, 0.07763671875, 0.1231536865234375, 0.168670654296875, 0.2141876220703125, 0.25970458984375, 0.3052215576171875, 0.350738525390625, 0.3962554931640625, 0.4417724609375, 0.4872894287109375, 0.532806396484375, 0.5783233642578125, 0.62384033203125, 0.6693572998046875, 0.714874267578125, 0.7603912353515625, 0.805908203125, 0.8514251708984375, 0.896942138671875, 0.9424591064453125, 0.98797607421875, 1.0334930419921875, 1.079010009765625, 1.1245269775390625, 1.1700439453125, 1.2155609130859375, 1.261077880859375, 1.3065948486328125, 1.35211181640625, 1.3976287841796875, 1.443145751953125, 1.4886627197265625, 1.5341796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 3.0, 7.0, 8.0, 5.0, 11.0, 22.0, 46.0, 56.0, 50.0, 81.0, 91.0, 133.0, 105.0, 110.0, 83.0, 67.0, 41.0, 32.0, 22.0, 12.0, 7.0, 11.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1947021484375, -0.1871776580810547, -0.17965316772460938, -0.17212867736816406, -0.16460418701171875, -0.15707969665527344, -0.14955520629882812, -0.1420307159423828, -0.1345062255859375, -0.1269817352294922, -0.11945724487304688, -0.11193275451660156, -0.10440826416015625, -0.09688377380371094, -0.08935928344726562, -0.08183479309082031, -0.074310302734375, -0.06678581237792969, -0.059261322021484375, -0.05173683166503906, -0.04421234130859375, -0.03668785095214844, -0.029163360595703125, -0.021638870239257812, -0.0141143798828125, -0.0065898895263671875, 0.000934600830078125, 0.008459091186523438, 0.01598358154296875, 0.023508071899414062, 0.031032562255859375, 0.03855705261230469, 0.04608154296875, 0.05360603332519531, 0.061130523681640625, 0.06865501403808594, 0.07617950439453125, 0.08370399475097656, 0.09122848510742188, 0.09875297546386719, 0.1062774658203125, 0.11380195617675781, 0.12132644653320312, 0.12885093688964844, 0.13637542724609375, 0.14389991760253906, 0.15142440795898438, 0.1589488983154297, 0.166473388671875, 0.1739978790283203, 0.18152236938476562, 0.18904685974121094, 0.19657135009765625, 0.20409584045410156, 0.21162033081054688, 0.2191448211669922, 0.2266693115234375, 0.2341938018798828, 0.24171829223632812, 0.24924278259277344, 0.25676727294921875, 0.26429176330566406, 0.2718162536621094, 0.2793407440185547, 0.286865234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 2.0, 7.0, 9.0, 13.0, 12.0, 16.0, 25.0, 31.0, 45.0, 68.0, 89.0, 135.0, 227.0, 358.0, 619.0, 1076.0, 1998.0, 4200.0, 9716.0, 26996.0, 89041.0, 304921.0, 407246.0, 136895.0, 40398.0, 13540.0, 5279.0, 2455.0, 1241.0, 734.0, 467.0, 241.0, 148.0, 96.0, 61.0, 45.0, 28.0, 16.0, 20.0, 13.0, 4.0, 4.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.07421875, -1.0386199951171875, -1.003021240234375, -0.9674224853515625, -0.93182373046875, -0.8962249755859375, -0.860626220703125, -0.8250274658203125, -0.7894287109375, -0.7538299560546875, -0.718231201171875, -0.6826324462890625, -0.64703369140625, -0.6114349365234375, -0.575836181640625, -0.5402374267578125, -0.504638671875, -0.4690399169921875, -0.433441162109375, -0.3978424072265625, -0.36224365234375, -0.3266448974609375, -0.291046142578125, -0.2554473876953125, -0.2198486328125, -0.1842498779296875, -0.148651123046875, -0.1130523681640625, -0.07745361328125, -0.0418548583984375, -0.006256103515625, 0.0293426513671875, 0.06494140625, 0.1005401611328125, 0.136138916015625, 0.1717376708984375, 0.20733642578125, 0.2429351806640625, 0.278533935546875, 0.3141326904296875, 0.3497314453125, 0.3853302001953125, 0.420928955078125, 0.4565277099609375, 0.49212646484375, 0.5277252197265625, 0.563323974609375, 0.5989227294921875, 0.634521484375, 0.6701202392578125, 0.705718994140625, 0.7413177490234375, 0.77691650390625, 0.8125152587890625, 0.848114013671875, 0.8837127685546875, 0.9193115234375, 0.9549102783203125, 0.990509033203125, 1.0261077880859375, 1.06170654296875, 1.0973052978515625, 1.132904052734375, 1.1685028076171875, 1.2041015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 5.0, 20.0, 11.0, 16.0, 20.0, 17.0, 25.0, 36.0, 31.0, 35.0, 33.0, 39.0, 51.0, 57.0, 55.0, 57.0, 58.0, 33.0, 51.0, 29.0, 24.0, 33.0, 25.0, 39.0, 25.0, 24.0, 20.0, 23.0, 19.0, 14.0, 18.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.708984375, -0.6881866455078125, -0.667388916015625, -0.6465911865234375, -0.62579345703125, -0.6049957275390625, -0.584197998046875, -0.5634002685546875, -0.5426025390625, -0.5218048095703125, -0.501007080078125, -0.4802093505859375, -0.45941162109375, -0.4386138916015625, -0.417816162109375, -0.3970184326171875, -0.376220703125, -0.3554229736328125, -0.334625244140625, -0.3138275146484375, -0.29302978515625, -0.2722320556640625, -0.251434326171875, -0.2306365966796875, -0.2098388671875, -0.1890411376953125, -0.168243408203125, -0.1474456787109375, -0.12664794921875, -0.1058502197265625, -0.085052490234375, -0.0642547607421875, -0.04345703125, -0.0226593017578125, -0.001861572265625, 0.0189361572265625, 0.03973388671875, 0.0605316162109375, 0.081329345703125, 0.1021270751953125, 0.1229248046875, 0.1437225341796875, 0.164520263671875, 0.1853179931640625, 0.20611572265625, 0.2269134521484375, 0.247711181640625, 0.2685089111328125, 0.289306640625, 0.3101043701171875, 0.330902099609375, 0.3516998291015625, 0.37249755859375, 0.3932952880859375, 0.414093017578125, 0.4348907470703125, 0.4556884765625, 0.4764862060546875, 0.497283935546875, 0.5180816650390625, 0.53887939453125, 0.5596771240234375, 0.580474853515625, 0.6012725830078125, 0.6220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 14.0, 29.0, 50.0, 70.0, 134.0, 188.0, 380.0, 1199.0, 6741.0, 502635.0, 528244.0, 6744.0, 1232.0, 384.0, 180.0, 106.0, 63.0, 53.0, 21.0, 18.0, 12.0, 11.0, 11.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.660247802734375, -3.51385498046875, -3.367462158203125, -3.2210693359375, -3.074676513671875, -2.92828369140625, -2.781890869140625, -2.635498046875, -2.489105224609375, -2.34271240234375, -2.196319580078125, -2.0499267578125, -1.903533935546875, -1.75714111328125, -1.610748291015625, -1.46435546875, -1.317962646484375, -1.17156982421875, -1.025177001953125, -0.8787841796875, -0.732391357421875, -0.58599853515625, -0.439605712890625, -0.293212890625, -0.146820068359375, -0.00042724609375, 0.145965576171875, 0.2923583984375, 0.438751220703125, 0.58514404296875, 0.731536865234375, 0.8779296875, 1.024322509765625, 1.17071533203125, 1.317108154296875, 1.4635009765625, 1.609893798828125, 1.75628662109375, 1.902679443359375, 2.049072265625, 2.195465087890625, 2.34185791015625, 2.488250732421875, 2.6346435546875, 2.781036376953125, 2.92742919921875, 3.073822021484375, 3.22021484375, 3.366607666015625, 3.51300048828125, 3.659393310546875, 3.8057861328125, 3.952178955078125, 4.09857177734375, 4.244964599609375, 4.391357421875, 4.537750244140625, 4.68414306640625, 4.830535888671875, 4.9769287109375, 5.123321533203125, 5.26971435546875, 5.416107177734375, 5.5625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 14.0, 23.0, 62.0, 178.0, 334.0, 225.0, 88.0, 44.0, 21.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038242340087890625, -0.000371687114238739, -0.0003609508275985718, -0.00035021454095840454, -0.0003394782543182373, -0.00032874196767807007, -0.00031800568103790283, -0.0003072693943977356, -0.00029653310775756836, -0.0002857968211174011, -0.0002750605344772339, -0.00026432424783706665, -0.0002535879611968994, -0.00024285167455673218, -0.00023211538791656494, -0.0002213791012763977, -0.00021064281463623047, -0.00019990652799606323, -0.000189170241355896, -0.00017843395471572876, -0.00016769766807556152, -0.0001569613814353943, -0.00014622509479522705, -0.00013548880815505981, -0.00012475252151489258, -0.00011401623487472534, -0.0001032799482345581, -9.254366159439087e-05, -8.180737495422363e-05, -7.10710883140564e-05, -6.033480167388916e-05, -4.9598515033721924e-05, -3.886222839355469e-05, -2.812594175338745e-05, -1.7389655113220215e-05, -6.6533684730529785e-06, 4.082918167114258e-06, 1.4819204807281494e-05, 2.555549144744873e-05, 3.629177808761597e-05, 4.70280647277832e-05, 5.776435136795044e-05, 6.850063800811768e-05, 7.923692464828491e-05, 8.997321128845215e-05, 0.00010070949792861938, 0.00011144578456878662, 0.00012218207120895386, 0.0001329183578491211, 0.00014365464448928833, 0.00015439093112945557, 0.0001651272177696228, 0.00017586350440979004, 0.00018659979104995728, 0.0001973360776901245, 0.00020807236433029175, 0.00021880865097045898, 0.00022954493761062622, 0.00024028122425079346, 0.0002510175108909607, 0.00026175379753112793, 0.00027249008417129517, 0.0002832263708114624, 0.00029396265745162964, 0.0003046989440917969]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 4.0, 20.0, 25.0, 45.0, 64.0, 122.0, 271.0, 694.0, 2861.0, 14496.0, 949080.0, 72916.0, 5820.0, 1321.0, 423.0, 167.0, 100.0, 44.0, 28.0, 24.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.12530517578125, -3.0084228515625, -2.89154052734375, -2.774658203125, -2.65777587890625, -2.5408935546875, -2.42401123046875, -2.30712890625, -2.19024658203125, -2.0733642578125, -1.95648193359375, -1.839599609375, -1.72271728515625, -1.6058349609375, -1.48895263671875, -1.3720703125, -1.25518798828125, -1.1383056640625, -1.02142333984375, -0.904541015625, -0.78765869140625, -0.6707763671875, -0.55389404296875, -0.43701171875, -0.32012939453125, -0.2032470703125, -0.08636474609375, 0.030517578125, 0.14739990234375, 0.2642822265625, 0.38116455078125, 0.498046875, 0.61492919921875, 0.7318115234375, 0.84869384765625, 0.965576171875, 1.08245849609375, 1.1993408203125, 1.31622314453125, 1.43310546875, 1.54998779296875, 1.6668701171875, 1.78375244140625, 1.900634765625, 2.01751708984375, 2.1343994140625, 2.25128173828125, 2.3681640625, 2.48504638671875, 2.6019287109375, 2.71881103515625, 2.835693359375, 2.95257568359375, 3.0694580078125, 3.18634033203125, 3.30322265625, 3.42010498046875, 3.5369873046875, 3.65386962890625, 3.770751953125, 3.88763427734375, 4.0045166015625, 4.12139892578125, 4.23828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 32.0, 116.0, 243.0, 278.0, 167.0, 65.0, 28.0, 16.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.103729248046875, -1.05999755859375, -1.016265869140625, -0.9725341796875, -0.928802490234375, -0.88507080078125, -0.841339111328125, -0.797607421875, -0.753875732421875, -0.71014404296875, -0.666412353515625, -0.6226806640625, -0.578948974609375, -0.53521728515625, -0.491485595703125, -0.44775390625, -0.404022216796875, -0.36029052734375, -0.316558837890625, -0.2728271484375, -0.229095458984375, -0.18536376953125, -0.141632080078125, -0.097900390625, -0.054168701171875, -0.01043701171875, 0.033294677734375, 0.0770263671875, 0.120758056640625, 0.16448974609375, 0.208221435546875, 0.251953125, 0.295684814453125, 0.33941650390625, 0.383148193359375, 0.4268798828125, 0.470611572265625, 0.51434326171875, 0.558074951171875, 0.601806640625, 0.645538330078125, 0.68927001953125, 0.733001708984375, 0.7767333984375, 0.820465087890625, 0.86419677734375, 0.907928466796875, 0.95166015625, 0.995391845703125, 1.03912353515625, 1.082855224609375, 1.1265869140625, 1.170318603515625, 1.21405029296875, 1.257781982421875, 1.301513671875, 1.345245361328125, 1.38897705078125, 1.432708740234375, 1.4764404296875, 1.520172119140625, 1.56390380859375, 1.607635498046875, 1.6513671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 7.0, 8.0, 11.0, 55.0, 97.0, 175.0, 224.0, 201.0, 108.0, 56.0, 25.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.00646686553955, -9.63134765625, -9.25622844696045, -8.881109237670898, -8.505989074707031, -8.13086986541748, -7.75575065612793, -7.380631446838379, -7.005512237548828, -6.630393028259277, -6.255273818969727, -5.880154132843018, -5.505034923553467, -5.129915714263916, -4.754796028137207, -4.379676818847656, -4.0045576095581055, -3.6294384002685547, -3.254318952560425, -2.879199504852295, -2.504080295562744, -2.1289610862731934, -1.7538416385650635, -1.3787221908569336, -1.0036029815673828, -0.6284836530685425, -0.25336432456970215, 0.12175500392913818, 0.4968743324279785, 0.8719936609268188, 1.2471129894256592, 1.622232437133789, 1.9973506927490234, 2.372469902038574, 2.747589349746704, 3.122708797454834, 3.4978280067443848, 3.8729472160339355, 4.2480669021606445, 4.623186111450195, 4.998305320739746, 5.373424530029297, 5.748543739318848, 6.123663425445557, 6.498782634735107, 6.873901844024658, 7.249021530151367, 7.624140739440918, 7.999259948730469, 8.37437915802002, 8.74949836730957, 9.124617576599121, 9.499736785888672, 9.874856948852539, 10.24997615814209, 10.62509536743164, 11.000214576721191, 11.375333786010742, 11.750452995300293, 12.125572204589844, 12.500692367553711, 12.875811576843262, 13.250930786132812, 13.626049995422363, 14.001169204711914]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 10.0, 7.0, 11.0, 8.0, 19.0, 28.0, 24.0, 24.0, 35.0, 29.0, 47.0, 44.0, 32.0, 51.0, 53.0, 43.0, 53.0, 52.0, 53.0, 34.0, 46.0, 38.0, 42.0, 37.0, 26.0, 28.0, 25.0, 23.0, 13.0, 15.0, 13.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.452207565307617, -5.282741546630859, -5.113275051116943, -4.943808555603027, -4.7743425369262695, -4.604876518249512, -4.435410022735596, -4.26594352722168, -4.096477508544922, -3.927011251449585, -3.757544994354248, -3.588078737258911, -3.418612480163574, -3.2491462230682373, -3.0796799659729004, -2.9102137088775635, -2.7407474517822266, -2.5712811946868896, -2.4018149375915527, -2.232348680496216, -2.062882423400879, -1.893416166305542, -1.723949909210205, -1.5544836521148682, -1.3850173950195312, -1.2155511379241943, -1.0460848808288574, -0.8766186237335205, -0.7071523666381836, -0.5376861095428467, -0.36821985244750977, -0.19875359535217285, -0.029287338256835938, 0.14017891883850098, 0.3096451759338379, 0.4791114330291748, 0.6485776901245117, 0.8180439472198486, 0.9875102043151855, 1.1569764614105225, 1.3264427185058594, 1.4959089756011963, 1.6653752326965332, 1.8348414897918701, 2.004307746887207, 2.173774003982544, 2.343240261077881, 2.5127065181732178, 2.6821727752685547, 2.8516390323638916, 3.0211052894592285, 3.1905715465545654, 3.3600378036499023, 3.5295040607452393, 3.698970317840576, 3.868436574935913, 4.03790283203125, 4.207368850708008, 4.376835346221924, 4.54630184173584, 4.715767860412598, 4.8852338790893555, 5.0547003746032715, 5.2241668701171875, 5.393632888793945]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 8.0, 12.0, 20.0, 34.0, 50.0, 67.0, 114.0, 170.0, 221.0, 398.0, 670.0, 1219.0, 2449.0, 5035.0, 11850.0, 33159.0, 133754.0, 3296363.0, 600122.0, 71345.0, 21337.0, 8204.0, 3537.0, 1714.0, 975.0, 539.0, 322.0, 211.0, 107.0, 86.0, 44.0, 37.0, 32.0, 8.0, 9.0, 17.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.751953125, -1.7001190185546875, -1.648284912109375, -1.5964508056640625, -1.54461669921875, -1.4927825927734375, -1.440948486328125, -1.3891143798828125, -1.3372802734375, -1.2854461669921875, -1.233612060546875, -1.1817779541015625, -1.12994384765625, -1.0781097412109375, -1.026275634765625, -0.9744415283203125, -0.922607421875, -0.8707733154296875, -0.818939208984375, -0.7671051025390625, -0.71527099609375, -0.6634368896484375, -0.611602783203125, -0.5597686767578125, -0.5079345703125, -0.4561004638671875, -0.404266357421875, -0.3524322509765625, -0.30059814453125, -0.2487640380859375, -0.196929931640625, -0.1450958251953125, -0.09326171875, -0.0414276123046875, 0.010406494140625, 0.0622406005859375, 0.11407470703125, 0.1659088134765625, 0.217742919921875, 0.2695770263671875, 0.3214111328125, 0.3732452392578125, 0.425079345703125, 0.4769134521484375, 0.52874755859375, 0.5805816650390625, 0.632415771484375, 0.6842498779296875, 0.736083984375, 0.7879180908203125, 0.839752197265625, 0.8915863037109375, 0.94342041015625, 0.9952545166015625, 1.047088623046875, 1.0989227294921875, 1.1507568359375, 1.2025909423828125, 1.254425048828125, 1.3062591552734375, 1.35809326171875, 1.4099273681640625, 1.461761474609375, 1.5135955810546875, 1.5654296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 9.0, 8.0, 7.0, 14.0, 22.0, 28.0, 25.0, 30.0, 40.0, 42.0, 53.0, 55.0, 59.0, 67.0, 78.0, 60.0, 58.0, 48.0, 44.0, 48.0, 41.0, 35.0, 24.0, 27.0, 17.0, 14.0, 9.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1990966796875, -0.19328689575195312, -0.18747711181640625, -0.18166732788085938, -0.1758575439453125, -0.17004776000976562, -0.16423797607421875, -0.15842819213867188, -0.152618408203125, -0.14680862426757812, -0.14099884033203125, -0.13518905639648438, -0.1293792724609375, -0.12356948852539062, -0.11775970458984375, -0.11194992065429688, -0.10614013671875, -0.10033035278320312, -0.09452056884765625, -0.08871078491210938, -0.0829010009765625, -0.07709121704101562, -0.07128143310546875, -0.06547164916992188, -0.059661865234375, -0.053852081298828125, -0.04804229736328125, -0.042232513427734375, -0.0364227294921875, -0.030612945556640625, -0.02480316162109375, -0.018993377685546875, -0.01318359375, -0.007373809814453125, -0.00156402587890625, 0.004245758056640625, 0.0100555419921875, 0.015865325927734375, 0.02167510986328125, 0.027484893798828125, 0.033294677734375, 0.039104461669921875, 0.04491424560546875, 0.050724029541015625, 0.0565338134765625, 0.062343597412109375, 0.06815338134765625, 0.07396316528320312, 0.07977294921875, 0.08558273315429688, 0.09139251708984375, 0.09720230102539062, 0.1030120849609375, 0.10882186889648438, 0.11463165283203125, 0.12044143676757812, 0.126251220703125, 0.13206100463867188, 0.13787078857421875, 0.14368057250976562, 0.1494903564453125, 0.15530014038085938, 0.16110992431640625, 0.16691970825195312, 0.1727294921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 12.0, 19.0, 34.0, 47.0, 117.0, 245.0, 803.0, 3749.0, 35357.0, 3889407.0, 252031.0, 9878.0, 1693.0, 482.0, 199.0, 69.0, 53.0, 31.0, 21.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9951171875, -3.865234375, -3.7353515625, -3.60546875, -3.4755859375, -3.345703125, -3.2158203125, -3.0859375, -2.9560546875, -2.826171875, -2.6962890625, -2.56640625, -2.4365234375, -2.306640625, -2.1767578125, -2.046875, -1.9169921875, -1.787109375, -1.6572265625, -1.52734375, -1.3974609375, -1.267578125, -1.1376953125, -1.0078125, -0.8779296875, -0.748046875, -0.6181640625, -0.48828125, -0.3583984375, -0.228515625, -0.0986328125, 0.03125, 0.1611328125, 0.291015625, 0.4208984375, 0.55078125, 0.6806640625, 0.810546875, 0.9404296875, 1.0703125, 1.2001953125, 1.330078125, 1.4599609375, 1.58984375, 1.7197265625, 1.849609375, 1.9794921875, 2.109375, 2.2392578125, 2.369140625, 2.4990234375, 2.62890625, 2.7587890625, 2.888671875, 3.0185546875, 3.1484375, 3.2783203125, 3.408203125, 3.5380859375, 3.66796875, 3.7978515625, 3.927734375, 4.0576171875, 4.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 4.0, 8.0, 5.0, 12.0, 13.0, 17.0, 18.0, 34.0, 36.0, 62.0, 107.0, 205.0, 555.0, 1709.0, 634.0, 251.0, 142.0, 81.0, 48.0, 41.0, 22.0, 14.0, 14.0, 6.0, 12.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36474609375, -0.3515434265136719, -0.33834075927734375, -0.3251380920410156, -0.3119354248046875, -0.2987327575683594, -0.28553009033203125, -0.2723274230957031, -0.259124755859375, -0.24592208862304688, -0.23271942138671875, -0.21951675415039062, -0.2063140869140625, -0.19311141967773438, -0.17990875244140625, -0.16670608520507812, -0.15350341796875, -0.14030075073242188, -0.12709808349609375, -0.11389541625976562, -0.1006927490234375, -0.08749008178710938, -0.07428741455078125, -0.061084747314453125, -0.047882080078125, -0.034679412841796875, -0.02147674560546875, -0.008274078369140625, 0.0049285888671875, 0.018131256103515625, 0.03133392333984375, 0.044536590576171875, 0.0577392578125, 0.07094192504882812, 0.08414459228515625, 0.09734725952148438, 0.1105499267578125, 0.12375259399414062, 0.13695526123046875, 0.15015792846679688, 0.163360595703125, 0.17656326293945312, 0.18976593017578125, 0.20296859741210938, 0.2161712646484375, 0.22937393188476562, 0.24257659912109375, 0.2557792663574219, 0.26898193359375, 0.2821846008300781, 0.29538726806640625, 0.3085899353027344, 0.3217926025390625, 0.3349952697753906, 0.34819793701171875, 0.3614006042480469, 0.374603271484375, 0.3878059387207031, 0.40100860595703125, 0.4142112731933594, 0.4274139404296875, 0.4406166076660156, 0.45381927490234375, 0.4670219421386719, 0.480224609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 10.0, 7.0, 32.0, 101.0, 303.0, 315.0, 160.0, 52.0, 16.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.755788803100586, -7.571357250213623, -7.386925220489502, -7.202493667602539, -7.018061637878418, -6.833630084991455, -6.649198055267334, -6.464766502380371, -6.28033447265625, -6.095902919769287, -5.911470890045166, -5.727039337158203, -5.542607307434082, -5.358175754547119, -5.173743724822998, -4.989312171936035, -4.804880142211914, -4.620448589324951, -4.43601655960083, -4.251585006713867, -4.067152976989746, -3.882721185684204, -3.698289394378662, -3.513857841491699, -3.3294262886047363, -3.1449944972991943, -2.9605627059936523, -2.7761309146881104, -2.5916991233825684, -2.4072673320770264, -2.2228355407714844, -2.0384039878845215, -1.8539719581604004, -1.6695401668548584, -1.4851083755493164, -1.3006765842437744, -1.1162447929382324, -0.9318130612373352, -0.747381329536438, -0.562949538230896, -0.378517746925354, -0.1940859705209732, -0.009654194116592407, 0.1747775673866272, 0.3592093586921692, 0.5436411499977112, 0.7280728816986084, 0.9125046730041504, 1.0969364643096924, 1.2813682556152344, 1.4658000469207764, 1.6502318382263184, 1.8346636295318604, 2.0190954208374023, 2.2035269737243652, 2.3879590034484863, 2.572390556335449, 2.756822347640991, 2.941254138946533, 3.125685930252075, 3.310117721557617, 3.494549512863159, 3.678981304168701, 3.863412857055664, 4.047844886779785]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 11.0, 21.0, 16.0, 19.0, 21.0, 40.0, 34.0, 51.0, 40.0, 49.0, 45.0, 61.0, 51.0, 76.0, 64.0, 48.0, 59.0, 54.0, 29.0, 44.0, 22.0, 22.0, 25.0, 14.0, 10.0, 14.0, 13.0, 5.0, 13.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5961822271347046, -1.543816328048706, -1.4914504289627075, -1.439084529876709, -1.38671875, -1.334352731704712, -1.281986951828003, -1.2296210527420044, -1.1772551536560059, -1.1248892545700073, -1.0725233554840088, -1.0201574563980103, -0.9677916169166565, -0.915425717830658, -0.8630598783493042, -0.8106939792633057, -0.7583280801773071, -0.7059621810913086, -0.6535962820053101, -0.6012304425239563, -0.5488645434379578, -0.49649864435195923, -0.4441327750682831, -0.39176690578460693, -0.3394010066986084, -0.28703510761260986, -0.23466923832893372, -0.18230335414409637, -0.12993746995925903, -0.0775715708732605, -0.02520570158958435, 0.027160167694091797, 0.07952618598937988, 0.13189207017421722, 0.18425795435905457, 0.2366238385438919, 0.28898972272872925, 0.3413556218147278, 0.39372149109840393, 0.4460873603820801, 0.4984532594680786, 0.5508191585540771, 0.6031850576400757, 0.6555508971214294, 0.707916796207428, 0.7602826952934265, 0.8126485347747803, 0.8650144338607788, 0.9173803329467773, 0.9697462320327759, 1.0221121311187744, 1.074478030204773, 1.1268439292907715, 1.1792097091674805, 1.231575608253479, 1.2839415073394775, 1.336307406425476, 1.3886733055114746, 1.4410392045974731, 1.4934051036834717, 1.5457708835601807, 1.5981369018554688, 1.6505026817321777, 1.7028685808181763, 1.7552344799041748]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 3.0, 8.0, 15.0, 22.0, 50.0, 38.0, 70.0, 87.0, 149.0, 252.0, 371.0, 635.0, 1066.0, 2199.0, 4555.0, 11479.0, 34255.0, 117780.0, 344811.0, 351788.0, 121963.0, 35480.0, 11740.0, 4746.0, 2150.0, 1079.0, 628.0, 424.0, 249.0, 168.0, 113.0, 67.0, 33.0, 24.0, 26.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0548553466796875, -1.020843505859375, -0.9868316650390625, -0.95281982421875, -0.9188079833984375, -0.884796142578125, -0.8507843017578125, -0.8167724609375, -0.7827606201171875, -0.748748779296875, -0.7147369384765625, -0.68072509765625, -0.6467132568359375, -0.612701416015625, -0.5786895751953125, -0.544677734375, -0.5106658935546875, -0.476654052734375, -0.4426422119140625, -0.40863037109375, -0.3746185302734375, -0.340606689453125, -0.3065948486328125, -0.2725830078125, -0.2385711669921875, -0.204559326171875, -0.1705474853515625, -0.13653564453125, -0.1025238037109375, -0.068511962890625, -0.0345001220703125, -0.00048828125, 0.0335235595703125, 0.067535400390625, 0.1015472412109375, 0.13555908203125, 0.1695709228515625, 0.203582763671875, 0.2375946044921875, 0.2716064453125, 0.3056182861328125, 0.339630126953125, 0.3736419677734375, 0.40765380859375, 0.4416656494140625, 0.475677490234375, 0.5096893310546875, 0.543701171875, 0.5777130126953125, 0.611724853515625, 0.6457366943359375, 0.67974853515625, 0.7137603759765625, 0.747772216796875, 0.7817840576171875, 0.8157958984375, 0.8498077392578125, 0.883819580078125, 0.9178314208984375, 0.95184326171875, 0.9858551025390625, 1.019866943359375, 1.0538787841796875, 1.087890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 7.0, 11.0, 8.0, 20.0, 24.0, 23.0, 38.0, 54.0, 57.0, 68.0, 93.0, 95.0, 84.0, 79.0, 70.0, 58.0, 57.0, 45.0, 33.0, 25.0, 12.0, 9.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23473548889160156, -0.22691726684570312, -0.2190990447998047, -0.21128082275390625, -0.2034626007080078, -0.19564437866210938, -0.18782615661621094, -0.1800079345703125, -0.17218971252441406, -0.16437149047851562, -0.1565532684326172, -0.14873504638671875, -0.1409168243408203, -0.13309860229492188, -0.12528038024902344, -0.117462158203125, -0.10964393615722656, -0.10182571411132812, -0.09400749206542969, -0.08618927001953125, -0.07837104797363281, -0.07055282592773438, -0.06273460388183594, -0.0549163818359375, -0.04709815979003906, -0.039279937744140625, -0.03146171569824219, -0.02364349365234375, -0.015825271606445312, -0.008007049560546875, -0.0001888275146484375, 0.00762939453125, 0.015447616577148438, 0.023265838623046875, 0.031084060668945312, 0.03890228271484375, 0.04672050476074219, 0.054538726806640625, 0.06235694885253906, 0.0701751708984375, 0.07799339294433594, 0.08581161499023438, 0.09362983703613281, 0.10144805908203125, 0.10926628112792969, 0.11708450317382812, 0.12490272521972656, 0.132720947265625, 0.14053916931152344, 0.14835739135742188, 0.1561756134033203, 0.16399383544921875, 0.1718120574951172, 0.17963027954101562, 0.18744850158691406, 0.1952667236328125, 0.20308494567871094, 0.21090316772460938, 0.2187213897705078, 0.22653961181640625, 0.2343578338623047, 0.24217605590820312, 0.24999427795410156, 0.2578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 3.0, 9.0, 14.0, 8.0, 22.0, 29.0, 40.0, 52.0, 73.0, 117.0, 189.0, 279.0, 431.0, 726.0, 1223.0, 2361.0, 4814.0, 10556.0, 25293.0, 66427.0, 184581.0, 354162.0, 245056.0, 92129.0, 33686.0, 13601.0, 5999.0, 2920.0, 1530.0, 851.0, 471.0, 305.0, 176.0, 119.0, 87.0, 71.0, 33.0, 32.0, 22.0, 18.0, 13.0, 10.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72607421875, -0.6998214721679688, -0.6735687255859375, -0.6473159790039062, -0.621063232421875, -0.5948104858398438, -0.5685577392578125, -0.5423049926757812, -0.51605224609375, -0.48979949951171875, -0.4635467529296875, -0.43729400634765625, -0.411041259765625, -0.38478851318359375, -0.3585357666015625, -0.33228302001953125, -0.3060302734375, -0.27977752685546875, -0.2535247802734375, -0.22727203369140625, -0.201019287109375, -0.17476654052734375, -0.1485137939453125, -0.12226104736328125, -0.09600830078125, -0.06975555419921875, -0.0435028076171875, -0.01725006103515625, 0.009002685546875, 0.03525543212890625, 0.0615081787109375, 0.08776092529296875, 0.114013671875, 0.14026641845703125, 0.1665191650390625, 0.19277191162109375, 0.219024658203125, 0.24527740478515625, 0.2715301513671875, 0.29778289794921875, 0.32403564453125, 0.35028839111328125, 0.3765411376953125, 0.40279388427734375, 0.429046630859375, 0.45529937744140625, 0.4815521240234375, 0.5078048706054688, 0.5340576171875, 0.5603103637695312, 0.5865631103515625, 0.6128158569335938, 0.639068603515625, 0.6653213500976562, 0.6915740966796875, 0.7178268432617188, 0.74407958984375, 0.7703323364257812, 0.7965850830078125, 0.8228378295898438, 0.849090576171875, 0.8753433227539062, 0.9015960693359375, 0.9278488159179688, 0.9541015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 3.0, 12.0, 11.0, 20.0, 17.0, 20.0, 23.0, 23.0, 30.0, 38.0, 25.0, 49.0, 38.0, 52.0, 46.0, 53.0, 56.0, 45.0, 41.0, 58.0, 49.0, 43.0, 36.0, 30.0, 23.0, 28.0, 18.0, 19.0, 16.0, 11.0, 8.0, 11.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.712432861328125, -0.68658447265625, -0.660736083984375, -0.6348876953125, -0.609039306640625, -0.58319091796875, -0.557342529296875, -0.531494140625, -0.505645751953125, -0.47979736328125, -0.453948974609375, -0.4281005859375, -0.402252197265625, -0.37640380859375, -0.350555419921875, -0.32470703125, -0.298858642578125, -0.27301025390625, -0.247161865234375, -0.2213134765625, -0.195465087890625, -0.16961669921875, -0.143768310546875, -0.117919921875, -0.092071533203125, -0.06622314453125, -0.040374755859375, -0.0145263671875, 0.011322021484375, 0.03717041015625, 0.063018798828125, 0.0888671875, 0.114715576171875, 0.14056396484375, 0.166412353515625, 0.1922607421875, 0.218109130859375, 0.24395751953125, 0.269805908203125, 0.295654296875, 0.321502685546875, 0.34735107421875, 0.373199462890625, 0.3990478515625, 0.424896240234375, 0.45074462890625, 0.476593017578125, 0.50244140625, 0.528289794921875, 0.55413818359375, 0.579986572265625, 0.6058349609375, 0.631683349609375, 0.65753173828125, 0.683380126953125, 0.709228515625, 0.735076904296875, 0.76092529296875, 0.786773681640625, 0.8126220703125, 0.838470458984375, 0.86431884765625, 0.890167236328125, 0.916015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 5.0, 6.0, 9.0, 15.0, 7.0, 22.0, 22.0, 39.0, 70.0, 99.0, 182.0, 347.0, 729.0, 1635.0, 4089.0, 12433.0, 66377.0, 692005.0, 234716.0, 24476.0, 6712.0, 2461.0, 993.0, 478.0, 229.0, 124.0, 84.0, 43.0, 39.0, 26.0, 15.0, 16.0, 9.0, 9.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7314453125, -0.7083969116210938, -0.6853485107421875, -0.6623001098632812, -0.639251708984375, -0.6162033081054688, -0.5931549072265625, -0.5701065063476562, -0.54705810546875, -0.5240097045898438, -0.5009613037109375, -0.47791290283203125, -0.454864501953125, -0.43181610107421875, -0.4087677001953125, -0.38571929931640625, -0.3626708984375, -0.33962249755859375, -0.3165740966796875, -0.29352569580078125, -0.270477294921875, -0.24742889404296875, -0.2243804931640625, -0.20133209228515625, -0.17828369140625, -0.15523529052734375, -0.1321868896484375, -0.10913848876953125, -0.086090087890625, -0.06304168701171875, -0.0399932861328125, -0.01694488525390625, 0.006103515625, 0.02915191650390625, 0.0522003173828125, 0.07524871826171875, 0.098297119140625, 0.12134552001953125, 0.1443939208984375, 0.16744232177734375, 0.19049072265625, 0.21353912353515625, 0.2365875244140625, 0.25963592529296875, 0.282684326171875, 0.30573272705078125, 0.3287811279296875, 0.35182952880859375, 0.3748779296875, 0.39792633056640625, 0.4209747314453125, 0.44402313232421875, 0.467071533203125, 0.49011993408203125, 0.5131683349609375, 0.5362167358398438, 0.55926513671875, 0.5823135375976562, 0.6053619384765625, 0.6284103393554688, 0.651458740234375, 0.6745071411132812, 0.6975555419921875, 0.7206039428710938, 0.74365234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 14.0, 12.0, 32.0, 27.0, 50.0, 57.0, 93.0, 116.0, 121.0, 102.0, 99.0, 64.0, 50.0, 36.0, 32.0, 19.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.398294448852539e-05, -8.123181760311127e-05, -7.848069071769714e-05, -7.572956383228302e-05, -7.29784369468689e-05, -7.022731006145477e-05, -6.747618317604065e-05, -6.472505629062653e-05, -6.19739294052124e-05, -5.922280251979828e-05, -5.6471675634384155e-05, -5.372054874897003e-05, -5.096942186355591e-05, -4.8218294978141785e-05, -4.546716809272766e-05, -4.271604120731354e-05, -3.9964914321899414e-05, -3.721378743648529e-05, -3.446266055107117e-05, -3.1711533665657043e-05, -2.896040678024292e-05, -2.6209279894828796e-05, -2.3458153009414673e-05, -2.070702612400055e-05, -1.7955899238586426e-05, -1.5204772353172302e-05, -1.2453645467758179e-05, -9.702518582344055e-06, -6.951391696929932e-06, -4.200264811515808e-06, -1.4491379261016846e-06, 1.301988959312439e-06, 4.0531158447265625e-06, 6.804242730140686e-06, 9.55536961555481e-06, 1.2306496500968933e-05, 1.5057623386383057e-05, 1.780875027179718e-05, 2.0559877157211304e-05, 2.3311004042625427e-05, 2.606213092803955e-05, 2.8813257813453674e-05, 3.15643846988678e-05, 3.431551158428192e-05, 3.7066638469696045e-05, 3.981776535511017e-05, 4.256889224052429e-05, 4.5320019125938416e-05, 4.807114601135254e-05, 5.082227289676666e-05, 5.3573399782180786e-05, 5.632452666759491e-05, 5.907565355300903e-05, 6.182678043842316e-05, 6.457790732383728e-05, 6.73290342092514e-05, 7.008016109466553e-05, 7.283128798007965e-05, 7.558241486549377e-05, 7.83335417509079e-05, 8.108466863632202e-05, 8.383579552173615e-05, 8.658692240715027e-05, 8.933804929256439e-05, 9.208917617797852e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 17.0, 25.0, 26.0, 45.0, 86.0, 114.0, 189.0, 327.0, 676.0, 1368.0, 2948.0, 7312.0, 22490.0, 142944.0, 697682.0, 137122.0, 21968.0, 7445.0, 2879.0, 1364.0, 644.0, 345.0, 190.0, 92.0, 61.0, 48.0, 28.0, 26.0, 19.0, 14.0, 3.0, 5.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6794204711914062, -0.6591339111328125, -0.6388473510742188, -0.618560791015625, -0.5982742309570312, -0.5779876708984375, -0.5577011108398438, -0.53741455078125, -0.5171279907226562, -0.4968414306640625, -0.47655487060546875, -0.456268310546875, -0.43598175048828125, -0.4156951904296875, -0.39540863037109375, -0.3751220703125, -0.35483551025390625, -0.3345489501953125, -0.31426239013671875, -0.293975830078125, -0.27368927001953125, -0.2534027099609375, -0.23311614990234375, -0.21282958984375, -0.19254302978515625, -0.1722564697265625, -0.15196990966796875, -0.131683349609375, -0.11139678955078125, -0.0911102294921875, -0.07082366943359375, -0.050537109375, -0.03025054931640625, -0.0099639892578125, 0.01032257080078125, 0.030609130859375, 0.05089569091796875, 0.0711822509765625, 0.09146881103515625, 0.11175537109375, 0.13204193115234375, 0.1523284912109375, 0.17261505126953125, 0.192901611328125, 0.21318817138671875, 0.2334747314453125, 0.25376129150390625, 0.2740478515625, 0.29433441162109375, 0.3146209716796875, 0.33490753173828125, 0.355194091796875, 0.37548065185546875, 0.3957672119140625, 0.41605377197265625, 0.43634033203125, 0.45662689208984375, 0.4769134521484375, 0.49720001220703125, 0.517486572265625, 0.5377731323242188, 0.5580596923828125, 0.5783462524414062, 0.5986328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 5.0, 1.0, 10.0, 8.0, 10.0, 13.0, 26.0, 45.0, 71.0, 88.0, 138.0, 164.0, 132.0, 103.0, 65.0, 35.0, 18.0, 18.0, 9.0, 6.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5564956665039062, -0.5392608642578125, -0.5220260620117188, -0.504791259765625, -0.48755645751953125, -0.4703216552734375, -0.45308685302734375, -0.43585205078125, -0.41861724853515625, -0.4013824462890625, -0.38414764404296875, -0.366912841796875, -0.34967803955078125, -0.3324432373046875, -0.31520843505859375, -0.2979736328125, -0.28073883056640625, -0.2635040283203125, -0.24626922607421875, -0.229034423828125, -0.21179962158203125, -0.1945648193359375, -0.17733001708984375, -0.16009521484375, -0.14286041259765625, -0.1256256103515625, -0.10839080810546875, -0.091156005859375, -0.07392120361328125, -0.0566864013671875, -0.03945159912109375, -0.022216796875, -0.00498199462890625, 0.0122528076171875, 0.02948760986328125, 0.046722412109375, 0.06395721435546875, 0.0811920166015625, 0.09842681884765625, 0.11566162109375, 0.13289642333984375, 0.1501312255859375, 0.16736602783203125, 0.184600830078125, 0.20183563232421875, 0.2190704345703125, 0.23630523681640625, 0.2535400390625, 0.27077484130859375, 0.2880096435546875, 0.30524444580078125, 0.322479248046875, 0.33971405029296875, 0.3569488525390625, 0.37418365478515625, 0.39141845703125, 0.40865325927734375, 0.4258880615234375, 0.44312286376953125, 0.460357666015625, 0.47759246826171875, 0.4948272705078125, 0.5120620727539062, 0.529296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 16.0, 45.0, 203.0, 370.0, 239.0, 86.0, 30.0, 11.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.228866577148438, -17.65174674987793, -17.074626922607422, -16.497507095336914, -15.920388221740723, -15.343268394470215, -14.766149520874023, -14.189029693603516, -13.611909866333008, -13.0347900390625, -12.457670211791992, -11.8805513381958, -11.303431510925293, -10.726311683654785, -10.149192810058594, -9.572072982788086, -8.994953155517578, -8.41783332824707, -7.840713977813721, -7.263594627380371, -6.686474800109863, -6.1093549728393555, -5.532235622406006, -4.955116271972656, -4.377996444702148, -3.8008768558502197, -3.223757266998291, -2.6466376781463623, -2.0695180892944336, -1.4923985004425049, -0.9152789115905762, -0.33815956115722656, 0.23896026611328125, 0.81607985496521, 1.3931994438171387, 1.9703190326690674, 2.547438621520996, 3.124558210372925, 3.7016777992248535, 4.278797149658203, 4.855916976928711, 5.433036804199219, 6.010156154632568, 6.587275505065918, 7.164395332336426, 7.741515159606934, 8.318634033203125, 8.895753860473633, 9.47287368774414, 10.049993515014648, 10.627113342285156, 11.204232215881348, 11.781352043151855, 12.358471870422363, 12.935590744018555, 13.512710571289062, 14.08983039855957, 14.666950225830078, 15.244070053100586, 15.821188926696777, 16.39830780029297, 16.975427627563477, 17.552547454833984, 18.129667282104492, 18.706787109375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 16.0, 14.0, 14.0, 24.0, 27.0, 34.0, 33.0, 30.0, 45.0, 48.0, 47.0, 54.0, 50.0, 66.0, 63.0, 45.0, 44.0, 45.0, 34.0, 36.0, 39.0, 29.0, 22.0, 23.0, 21.0, 9.0, 13.0, 10.0, 10.0, 3.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6068220138549805, -5.43815803527832, -5.269493579864502, -5.100829601287842, -4.932165622711182, -4.763501167297363, -4.594837188720703, -4.426173210144043, -4.257508754730225, -4.0888447761535645, -3.920180559158325, -3.751516342163086, -3.5828521251678467, -3.4141879081726074, -3.2455239295959473, -3.076859712600708, -2.908195734024048, -2.7395315170288086, -2.5708675384521484, -2.402203321456909, -2.23353910446167, -2.0648751258850098, -1.8962109088897705, -1.7275466918945312, -1.5588825941085815, -1.3902184963226318, -1.2215542793273926, -1.0528901815414429, -0.8842260241508484, -0.7155618667602539, -0.5468977689743042, -0.37823355197906494, -0.20956945419311523, -0.040905311703681946, 0.12775883078575134, 0.29642295837402344, 0.4650871157646179, 0.6337512731552124, 0.8024153709411621, 0.9710795879364014, 1.139743685722351, 1.3084077835083008, 1.47707200050354, 1.6457360982894897, 1.8144001960754395, 1.9830644130706787, 2.151728630065918, 2.320392608642578, 2.4890568256378174, 2.6577210426330566, 2.826385021209717, 2.995049238204956, 3.1637134552001953, 3.3323774337768555, 3.5010416507720947, 3.669705867767334, 3.838369846343994, 4.007033824920654, 4.175698280334473, 4.344362258911133, 4.513026237487793, 4.681690692901611, 4.8503546714782715, 5.01901912689209, 5.18768310546875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 13.0, 24.0, 24.0, 55.0, 61.0, 85.0, 128.0, 202.0, 340.0, 560.0, 1052.0, 2326.0, 5525.0, 15219.0, 62830.0, 1247936.0, 2755939.0, 74373.0, 16773.0, 5788.0, 2439.0, 1103.0, 560.0, 289.0, 217.0, 101.0, 91.0, 47.0, 49.0, 25.0, 21.0, 18.0, 12.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8468399047851562, -0.8084259033203125, -0.7700119018554688, -0.731597900390625, -0.6931838989257812, -0.6547698974609375, -0.6163558959960938, -0.57794189453125, -0.5395278930664062, -0.5011138916015625, -0.46269989013671875, -0.424285888671875, -0.38587188720703125, -0.3474578857421875, -0.30904388427734375, -0.2706298828125, -0.23221588134765625, -0.1938018798828125, -0.15538787841796875, -0.116973876953125, -0.07855987548828125, -0.0401458740234375, -0.00173187255859375, 0.03668212890625, 0.07509613037109375, 0.1135101318359375, 0.15192413330078125, 0.190338134765625, 0.22875213623046875, 0.2671661376953125, 0.30558013916015625, 0.343994140625, 0.38240814208984375, 0.4208221435546875, 0.45923614501953125, 0.497650146484375, 0.5360641479492188, 0.5744781494140625, 0.6128921508789062, 0.65130615234375, 0.6897201538085938, 0.7281341552734375, 0.7665481567382812, 0.804962158203125, 0.8433761596679688, 0.8817901611328125, 0.9202041625976562, 0.9586181640625, 0.9970321655273438, 1.0354461669921875, 1.0738601684570312, 1.112274169921875, 1.1506881713867188, 1.1891021728515625, 1.2275161743164062, 1.26593017578125, 1.3043441772460938, 1.3427581787109375, 1.3811721801757812, 1.419586181640625, 1.4580001831054688, 1.4964141845703125, 1.5348281860351562, 1.5732421875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 13.0, 17.0, 25.0, 28.0, 52.0, 65.0, 64.0, 73.0, 85.0, 93.0, 86.0, 68.0, 81.0, 58.0, 46.0, 41.0, 27.0, 21.0, 12.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24267578125, -0.23416519165039062, -0.22565460205078125, -0.21714401245117188, -0.2086334228515625, -0.20012283325195312, -0.19161224365234375, -0.18310165405273438, -0.174591064453125, -0.16608047485351562, -0.15756988525390625, -0.14905929565429688, -0.1405487060546875, -0.13203811645507812, -0.12352752685546875, -0.11501693725585938, -0.10650634765625, -0.09799575805664062, -0.08948516845703125, -0.08097457885742188, -0.0724639892578125, -0.06395339965820312, -0.05544281005859375, -0.046932220458984375, -0.038421630859375, -0.029911041259765625, -0.02140045166015625, -0.012889862060546875, -0.0043792724609375, 0.004131317138671875, 0.01264190673828125, 0.021152496337890625, 0.0296630859375, 0.038173675537109375, 0.04668426513671875, 0.055194854736328125, 0.0637054443359375, 0.07221603393554688, 0.08072662353515625, 0.08923721313476562, 0.097747802734375, 0.10625839233398438, 0.11476898193359375, 0.12327957153320312, 0.1317901611328125, 0.14030075073242188, 0.14881134033203125, 0.15732192993164062, 0.16583251953125, 0.17434310913085938, 0.18285369873046875, 0.19136428833007812, 0.1998748779296875, 0.20838546752929688, 0.21689605712890625, 0.22540664672851562, 0.233917236328125, 0.24242782592773438, 0.25093841552734375, 0.2594490051269531, 0.2679595947265625, 0.2764701843261719, 0.28498077392578125, 0.2934913635253906, 0.302001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 10.0, 5.0, 10.0, 28.0, 46.0, 137.0, 290.0, 782.0, 2196.0, 9859.0, 94740.0, 3901921.0, 167574.0, 12737.0, 2492.0, 821.0, 357.0, 135.0, 68.0, 43.0, 12.0, 9.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.546875, -1.48394775390625, -1.4210205078125, -1.35809326171875, -1.295166015625, -1.23223876953125, -1.1693115234375, -1.10638427734375, -1.04345703125, -0.98052978515625, -0.9176025390625, -0.85467529296875, -0.791748046875, -0.72882080078125, -0.6658935546875, -0.60296630859375, -0.5400390625, -0.47711181640625, -0.4141845703125, -0.35125732421875, -0.288330078125, -0.22540283203125, -0.1624755859375, -0.09954833984375, -0.03662109375, 0.02630615234375, 0.0892333984375, 0.15216064453125, 0.215087890625, 0.27801513671875, 0.3409423828125, 0.40386962890625, 0.466796875, 0.52972412109375, 0.5926513671875, 0.65557861328125, 0.718505859375, 0.78143310546875, 0.8443603515625, 0.90728759765625, 0.97021484375, 1.03314208984375, 1.0960693359375, 1.15899658203125, 1.221923828125, 1.28485107421875, 1.3477783203125, 1.41070556640625, 1.4736328125, 1.53656005859375, 1.5994873046875, 1.66241455078125, 1.725341796875, 1.78826904296875, 1.8511962890625, 1.91412353515625, 1.97705078125, 2.03997802734375, 2.1029052734375, 2.16583251953125, 2.228759765625, 2.29168701171875, 2.3546142578125, 2.41754150390625, 2.48046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 10.0, 14.0, 38.0, 35.0, 71.0, 149.0, 321.0, 1053.0, 1616.0, 367.0, 161.0, 84.0, 38.0, 25.0, 22.0, 14.0, 11.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33447265625, -0.32297515869140625, -0.3114776611328125, -0.29998016357421875, -0.288482666015625, -0.27698516845703125, -0.2654876708984375, -0.25399017333984375, -0.24249267578125, -0.23099517822265625, -0.2194976806640625, -0.20800018310546875, -0.196502685546875, -0.18500518798828125, -0.1735076904296875, -0.16201019287109375, -0.1505126953125, -0.13901519775390625, -0.1275177001953125, -0.11602020263671875, -0.104522705078125, -0.09302520751953125, -0.0815277099609375, -0.07003021240234375, -0.05853271484375, -0.04703521728515625, -0.0355377197265625, -0.02404022216796875, -0.012542724609375, -0.00104522705078125, 0.0104522705078125, 0.02194976806640625, 0.033447265625, 0.04494476318359375, 0.0564422607421875, 0.06793975830078125, 0.079437255859375, 0.09093475341796875, 0.1024322509765625, 0.11392974853515625, 0.12542724609375, 0.13692474365234375, 0.1484222412109375, 0.15991973876953125, 0.171417236328125, 0.18291473388671875, 0.1944122314453125, 0.20590972900390625, 0.2174072265625, 0.22890472412109375, 0.2404022216796875, 0.25189971923828125, 0.263397216796875, 0.27489471435546875, 0.2863922119140625, 0.29788970947265625, 0.30938720703125, 0.32088470458984375, 0.3323822021484375, 0.34387969970703125, 0.355377197265625, 0.36687469482421875, 0.3783721923828125, 0.38986968994140625, 0.4013671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 30.0, 90.0, 205.0, 313.0, 225.0, 93.0, 33.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.004284858703613, -5.883307933807373, -5.762331008911133, -5.641354560852051, -5.5203776359558105, -5.39940071105957, -5.27842378616333, -5.15744686126709, -5.036470413208008, -4.915493488311768, -4.794516563415527, -4.673540115356445, -4.552563190460205, -4.431586265563965, -4.310609340667725, -4.189632415771484, -4.068655490875244, -3.947678565979004, -3.8267018795013428, -3.7057249546051025, -3.5847482681274414, -3.463771343231201, -3.342794418334961, -3.2218177318573, -3.1008410453796387, -2.9798641204833984, -2.8588874340057373, -2.737910509109497, -2.616933822631836, -2.4959568977355957, -2.3749799728393555, -2.2540032863616943, -2.133026361465454, -2.012049436569214, -1.8910727500915527, -1.7700958251953125, -1.6491190195083618, -1.5281422138214111, -1.4071654081344604, -1.2861886024475098, -1.1652116775512695, -1.0442348718643188, -0.9232580065727234, -0.8022812008857727, -0.6813043355941772, -0.5603275299072266, -0.4393507242202759, -0.3183738589286804, -0.1973971128463745, -0.07642028480768204, 0.04455654323101044, 0.16553336381912231, 0.2865101993083954, 0.40748703479766846, 0.5284638404846191, 0.6494407057762146, 0.7704175114631653, 0.891394317150116, 1.0123711824417114, 1.133347988128662, 1.2543247938156128, 1.3753015995025635, 1.4962785243988037, 1.6172553300857544, 1.738232135772705]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 3.0, 5.0, 1.0, 10.0, 12.0, 14.0, 26.0, 27.0, 24.0, 25.0, 36.0, 19.0, 47.0, 51.0, 54.0, 60.0, 41.0, 41.0, 38.0, 50.0, 60.0, 47.0, 51.0, 34.0, 46.0, 37.0, 37.0, 15.0, 20.0, 19.0, 12.0, 7.0, 10.0, 10.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8928457498550415, -0.8597777485847473, -0.8267097473144531, -0.7936418056488037, -0.7605738043785095, -0.7275058031082153, -0.6944378614425659, -0.6613698601722717, -0.6283018589019775, -0.5952338576316833, -0.5621658563613892, -0.5290979146957397, -0.49602991342544556, -0.46296191215515137, -0.42989394068717957, -0.39682596921920776, -0.3637579679489136, -0.3306899666786194, -0.2976219952106476, -0.2645540237426758, -0.2314860224723816, -0.1984180361032486, -0.1653500497341156, -0.1322820633649826, -0.09921407699584961, -0.06614609062671661, -0.03307810425758362, -1.0117888450622559e-05, 0.03305786848068237, 0.06612585484981537, 0.09919384121894836, 0.13226182758808136, 0.1653299331665039, 0.1983979195356369, 0.2314659059047699, 0.2645338773727417, 0.2976018786430359, 0.3306698799133301, 0.3637378513813019, 0.3968058228492737, 0.42987382411956787, 0.46294182538986206, 0.49600979685783386, 0.5290777683258057, 0.5621457695960999, 0.595213770866394, 0.6282817125320435, 0.6613497138023376, 0.6944177150726318, 0.727485716342926, 0.7605537176132202, 0.7936216592788696, 0.8266896605491638, 0.859757661819458, 0.8928256034851074, 0.9258936047554016, 0.9589616060256958, 0.99202960729599, 1.0250976085662842, 1.0581655502319336, 1.091233491897583, 1.124301552772522, 1.1573694944381714, 1.1904375553131104, 1.2235054969787598]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 7.0, 3.0, 11.0, 14.0, 26.0, 34.0, 42.0, 47.0, 125.0, 164.0, 295.0, 454.0, 812.0, 1379.0, 2544.0, 5355.0, 13937.0, 45341.0, 166895.0, 400789.0, 284636.0, 85233.0, 24193.0, 8358.0, 3500.0, 1818.0, 986.0, 601.0, 357.0, 202.0, 138.0, 87.0, 57.0, 32.0, 22.0, 20.0, 17.0, 6.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85791015625, -0.8258285522460938, -0.7937469482421875, -0.7616653442382812, -0.729583740234375, -0.6975021362304688, -0.6654205322265625, -0.6333389282226562, -0.60125732421875, -0.5691757202148438, -0.5370941162109375, -0.5050125122070312, -0.472930908203125, -0.44084930419921875, -0.4087677001953125, -0.37668609619140625, -0.3446044921875, -0.31252288818359375, -0.2804412841796875, -0.24835968017578125, -0.216278076171875, -0.18419647216796875, -0.1521148681640625, -0.12003326416015625, -0.08795166015625, -0.05587005615234375, -0.0237884521484375, 0.00829315185546875, 0.040374755859375, 0.07245635986328125, 0.1045379638671875, 0.13661956787109375, 0.168701171875, 0.20078277587890625, 0.2328643798828125, 0.26494598388671875, 0.297027587890625, 0.32910919189453125, 0.3611907958984375, 0.39327239990234375, 0.42535400390625, 0.45743560791015625, 0.4895172119140625, 0.5215988159179688, 0.553680419921875, 0.5857620239257812, 0.6178436279296875, 0.6499252319335938, 0.6820068359375, 0.7140884399414062, 0.7461700439453125, 0.7782516479492188, 0.810333251953125, 0.8424148559570312, 0.8744964599609375, 0.9065780639648438, 0.93865966796875, 0.9707412719726562, 1.0028228759765625, 1.0349044799804688, 1.066986083984375, 1.0990676879882812, 1.1311492919921875, 1.1632308959960938, 1.1953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 15.0, 20.0, 21.0, 27.0, 43.0, 42.0, 46.0, 69.0, 75.0, 90.0, 72.0, 76.0, 78.0, 52.0, 70.0, 54.0, 43.0, 24.0, 24.0, 15.0, 10.0, 9.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2110595703125, -0.20310020446777344, -0.19514083862304688, -0.1871814727783203, -0.17922210693359375, -0.1712627410888672, -0.16330337524414062, -0.15534400939941406, -0.1473846435546875, -0.13942527770996094, -0.13146591186523438, -0.12350654602050781, -0.11554718017578125, -0.10758781433105469, -0.09962844848632812, -0.09166908264160156, -0.083709716796875, -0.07575035095214844, -0.06779098510742188, -0.05983161926269531, -0.05187225341796875, -0.04391288757324219, -0.035953521728515625, -0.027994155883789062, -0.0200347900390625, -0.012075424194335938, -0.004116058349609375, 0.0038433074951171875, 0.01180267333984375, 0.019762039184570312, 0.027721405029296875, 0.03568077087402344, 0.04364013671875, 0.05159950256347656, 0.059558868408203125, 0.06751823425292969, 0.07547760009765625, 0.08343696594238281, 0.09139633178710938, 0.09935569763183594, 0.1073150634765625, 0.11527442932128906, 0.12323379516601562, 0.1311931610107422, 0.13915252685546875, 0.1471118927001953, 0.15507125854492188, 0.16303062438964844, 0.170989990234375, 0.17894935607910156, 0.18690872192382812, 0.1948680877685547, 0.20282745361328125, 0.2107868194580078, 0.21874618530273438, 0.22670555114746094, 0.2346649169921875, 0.24262428283691406, 0.2505836486816406, 0.2585430145263672, 0.26650238037109375, 0.2744617462158203, 0.2824211120605469, 0.29038047790527344, 0.29833984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 7.0, 20.0, 28.0, 18.0, 26.0, 46.0, 64.0, 96.0, 144.0, 193.0, 273.0, 461.0, 758.0, 1268.0, 2403.0, 4595.0, 9732.0, 22015.0, 53122.0, 133348.0, 284667.0, 292437.0, 141863.0, 56337.0, 23455.0, 10289.0, 4869.0, 2479.0, 1341.0, 775.0, 458.0, 291.0, 190.0, 128.0, 94.0, 55.0, 45.0, 43.0, 33.0, 19.0, 16.0, 17.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6816482543945312, -0.6596832275390625, -0.6377182006835938, -0.615753173828125, -0.5937881469726562, -0.5718231201171875, -0.5498580932617188, -0.52789306640625, -0.5059280395507812, -0.4839630126953125, -0.46199798583984375, -0.440032958984375, -0.41806793212890625, -0.3961029052734375, -0.37413787841796875, -0.3521728515625, -0.33020782470703125, -0.3082427978515625, -0.28627777099609375, -0.264312744140625, -0.24234771728515625, -0.2203826904296875, -0.19841766357421875, -0.17645263671875, -0.15448760986328125, -0.1325225830078125, -0.11055755615234375, -0.088592529296875, -0.06662750244140625, -0.0446624755859375, -0.02269744873046875, -0.000732421875, 0.02123260498046875, 0.0431976318359375, 0.06516265869140625, 0.087127685546875, 0.10909271240234375, 0.1310577392578125, 0.15302276611328125, 0.17498779296875, 0.19695281982421875, 0.2189178466796875, 0.24088287353515625, 0.262847900390625, 0.28481292724609375, 0.3067779541015625, 0.32874298095703125, 0.3507080078125, 0.37267303466796875, 0.3946380615234375, 0.41660308837890625, 0.438568115234375, 0.46053314208984375, 0.4824981689453125, 0.5044631958007812, 0.52642822265625, 0.5483932495117188, 0.5703582763671875, 0.5923233032226562, 0.614288330078125, 0.6362533569335938, 0.6582183837890625, 0.6801834106445312, 0.7021484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 9.0, 18.0, 15.0, 18.0, 18.0, 22.0, 15.0, 28.0, 30.0, 30.0, 44.0, 60.0, 40.0, 52.0, 30.0, 43.0, 53.0, 31.0, 39.0, 42.0, 52.0, 36.0, 24.0, 41.0, 25.0, 26.0, 28.0, 16.0, 26.0, 10.0, 13.0, 12.0, 6.0, 4.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.83203125, -0.80712890625, -0.7822265625, -0.75732421875, -0.732421875, -0.70751953125, -0.6826171875, -0.65771484375, -0.6328125, -0.60791015625, -0.5830078125, -0.55810546875, -0.533203125, -0.50830078125, -0.4833984375, -0.45849609375, -0.43359375, -0.40869140625, -0.3837890625, -0.35888671875, -0.333984375, -0.30908203125, -0.2841796875, -0.25927734375, -0.234375, -0.20947265625, -0.1845703125, -0.15966796875, -0.134765625, -0.10986328125, -0.0849609375, -0.06005859375, -0.03515625, -0.01025390625, 0.0146484375, 0.03955078125, 0.064453125, 0.08935546875, 0.1142578125, 0.13916015625, 0.1640625, 0.18896484375, 0.2138671875, 0.23876953125, 0.263671875, 0.28857421875, 0.3134765625, 0.33837890625, 0.36328125, 0.38818359375, 0.4130859375, 0.43798828125, 0.462890625, 0.48779296875, 0.5126953125, 0.53759765625, 0.5625, 0.58740234375, 0.6123046875, 0.63720703125, 0.662109375, 0.68701171875, 0.7119140625, 0.73681640625, 0.76171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 13.0, 15.0, 31.0, 55.0, 89.0, 145.0, 303.0, 588.0, 1412.0, 5072.0, 29641.0, 467891.0, 503126.0, 32242.0, 5147.0, 1556.0, 623.0, 248.0, 139.0, 69.0, 47.0, 23.0, 29.0, 10.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.5990447998046875, -0.576019287109375, -0.5529937744140625, -0.52996826171875, -0.5069427490234375, -0.483917236328125, -0.4608917236328125, -0.4378662109375, -0.4148406982421875, -0.391815185546875, -0.3687896728515625, -0.34576416015625, -0.3227386474609375, -0.299713134765625, -0.2766876220703125, -0.253662109375, -0.2306365966796875, -0.207611083984375, -0.1845855712890625, -0.16156005859375, -0.1385345458984375, -0.115509033203125, -0.0924835205078125, -0.0694580078125, -0.0464324951171875, -0.023406982421875, -0.0003814697265625, 0.02264404296875, 0.0456695556640625, 0.068695068359375, 0.0917205810546875, 0.11474609375, 0.1377716064453125, 0.160797119140625, 0.1838226318359375, 0.20684814453125, 0.2298736572265625, 0.252899169921875, 0.2759246826171875, 0.2989501953125, 0.3219757080078125, 0.345001220703125, 0.3680267333984375, 0.39105224609375, 0.4140777587890625, 0.437103271484375, 0.4601287841796875, 0.483154296875, 0.5061798095703125, 0.529205322265625, 0.5522308349609375, 0.57525634765625, 0.5982818603515625, 0.621307373046875, 0.6443328857421875, 0.6673583984375, 0.6903839111328125, 0.713409423828125, 0.7364349365234375, 0.75946044921875, 0.7824859619140625, 0.805511474609375, 0.8285369873046875, 0.8515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 11.0, 25.0, 20.0, 22.0, 51.0, 85.0, 121.0, 118.0, 134.0, 115.0, 84.0, 56.0, 44.0, 33.0, 18.0, 23.0, 7.0, 11.0, 4.0, 7.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001055598258972168, -0.00010246876627206802, -9.937770664691925e-05, -9.628664702177048e-05, -9.31955873966217e-05, -9.010452777147293e-05, -8.701346814632416e-05, -8.392240852117538e-05, -8.083134889602661e-05, -7.774028927087784e-05, -7.464922964572906e-05, -7.155817002058029e-05, -6.846711039543152e-05, -6.537605077028275e-05, -6.228499114513397e-05, -5.91939315199852e-05, -5.6102871894836426e-05, -5.301181226968765e-05, -4.992075264453888e-05, -4.6829693019390106e-05, -4.373863339424133e-05, -4.064757376909256e-05, -3.755651414394379e-05, -3.4465454518795013e-05, -3.137439489364624e-05, -2.8283335268497467e-05, -2.5192275643348694e-05, -2.210121601819992e-05, -1.9010156393051147e-05, -1.5919096767902374e-05, -1.2828037142753601e-05, -9.736977517604828e-06, -6.645917892456055e-06, -3.5548582673072815e-06, -4.637986421585083e-07, 2.627260982990265e-06, 5.718320608139038e-06, 8.809380233287811e-06, 1.1900439858436584e-05, 1.4991499483585358e-05, 1.808255910873413e-05, 2.1173618733882904e-05, 2.4264678359031677e-05, 2.735573798418045e-05, 3.0446797609329224e-05, 3.3537857234478e-05, 3.662891685962677e-05, 3.971997648477554e-05, 4.2811036109924316e-05, 4.590209573507309e-05, 4.899315536022186e-05, 5.2084214985370636e-05, 5.517527461051941e-05, 5.826633423566818e-05, 6.135739386081696e-05, 6.444845348596573e-05, 6.75395131111145e-05, 7.063057273626328e-05, 7.372163236141205e-05, 7.681269198656082e-05, 7.99037516117096e-05, 8.299481123685837e-05, 8.608587086200714e-05, 8.917693048715591e-05, 9.226799011230469e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 5.0, 14.0, 15.0, 23.0, 35.0, 43.0, 78.0, 133.0, 215.0, 389.0, 709.0, 1666.0, 4380.0, 15878.0, 100422.0, 616490.0, 263336.0, 32639.0, 7379.0, 2435.0, 1039.0, 518.0, 249.0, 171.0, 111.0, 60.0, 46.0, 21.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.468505859375, -0.4527397155761719, -0.43697357177734375, -0.4212074279785156, -0.4054412841796875, -0.3896751403808594, -0.37390899658203125, -0.3581428527832031, -0.342376708984375, -0.3266105651855469, -0.31084442138671875, -0.2950782775878906, -0.2793121337890625, -0.2635459899902344, -0.24777984619140625, -0.23201370239257812, -0.21624755859375, -0.20048141479492188, -0.18471527099609375, -0.16894912719726562, -0.1531829833984375, -0.13741683959960938, -0.12165069580078125, -0.10588455200195312, -0.090118408203125, -0.07435226440429688, -0.05858612060546875, -0.042819976806640625, -0.0270538330078125, -0.011287689208984375, 0.00447845458984375, 0.020244598388671875, 0.0360107421875, 0.051776885986328125, 0.06754302978515625, 0.08330917358398438, 0.0990753173828125, 0.11484146118164062, 0.13060760498046875, 0.14637374877929688, 0.162139892578125, 0.17790603637695312, 0.19367218017578125, 0.20943832397460938, 0.2252044677734375, 0.24097061157226562, 0.25673675537109375, 0.2725028991699219, 0.28826904296875, 0.3040351867675781, 0.31980133056640625, 0.3355674743652344, 0.3513336181640625, 0.3670997619628906, 0.38286590576171875, 0.3986320495605469, 0.414398193359375, 0.4301643371582031, 0.44593048095703125, 0.4616966247558594, 0.4774627685546875, 0.4932289123535156, 0.5089950561523438, 0.5247611999511719, 0.54052734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 19.0, 34.0, 60.0, 88.0, 139.0, 163.0, 151.0, 116.0, 73.0, 57.0, 27.0, 19.0, 10.0, 9.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5049362182617188, -0.4874114990234375, -0.46988677978515625, -0.452362060546875, -0.43483734130859375, -0.4173126220703125, -0.39978790283203125, -0.38226318359375, -0.36473846435546875, -0.3472137451171875, -0.32968902587890625, -0.312164306640625, -0.29463958740234375, -0.2771148681640625, -0.25959014892578125, -0.2420654296875, -0.22454071044921875, -0.2070159912109375, -0.18949127197265625, -0.171966552734375, -0.15444183349609375, -0.1369171142578125, -0.11939239501953125, -0.10186767578125, -0.08434295654296875, -0.0668182373046875, -0.04929351806640625, -0.031768798828125, -0.01424407958984375, 0.0032806396484375, 0.02080535888671875, 0.038330078125, 0.05585479736328125, 0.0733795166015625, 0.09090423583984375, 0.108428955078125, 0.12595367431640625, 0.1434783935546875, 0.16100311279296875, 0.17852783203125, 0.19605255126953125, 0.2135772705078125, 0.23110198974609375, 0.248626708984375, 0.26615142822265625, 0.2836761474609375, 0.30120086669921875, 0.3187255859375, 0.33625030517578125, 0.3537750244140625, 0.37129974365234375, 0.388824462890625, 0.40634918212890625, 0.4238739013671875, 0.44139862060546875, 0.45892333984375, 0.47644805908203125, 0.4939727783203125, 0.5114974975585938, 0.529022216796875, 0.5465469360351562, 0.5640716552734375, 0.5815963745117188, 0.59912109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 15.0, 27.0, 46.0, 104.0, 190.0, 201.0, 152.0, 113.0, 74.0, 29.0, 16.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6962890625, -13.401540756225586, -13.106792449951172, -12.812044143676758, -12.517295837402344, -12.22254753112793, -11.927799224853516, -11.633050918579102, -11.338302612304688, -11.043554306030273, -10.74880599975586, -10.454057693481445, -10.159309387207031, -9.864561080932617, -9.569812774658203, -9.275064468383789, -8.980317115783691, -8.685568809509277, -8.390820503234863, -8.09607219696045, -7.801323890686035, -7.506575584411621, -7.211827754974365, -6.917079448699951, -6.622331142425537, -6.327582836151123, -6.032834529876709, -5.738086223602295, -5.443338394165039, -5.148590087890625, -4.853841781616211, -4.559093475341797, -4.264345169067383, -3.9695968627929688, -3.6748485565185547, -3.3801004886627197, -3.0853521823883057, -2.7906038761138916, -2.4958558082580566, -2.2011075019836426, -1.9063591957092285, -1.6116108894348145, -1.31686270236969, -1.0221145153045654, -0.7273662090301514, -0.4326179027557373, -0.1378697156906128, 0.15687847137451172, 0.4516267776489258, 0.7463750243186951, 1.0411232709884644, 1.3358714580535889, 1.630619764328003, 1.925368070602417, 2.220116138458252, 2.514864444732666, 2.80961275100708, 3.104361057281494, 3.399109363555908, 3.693857431411743, 3.9886057376861572, 4.283353805541992, 4.578102111816406, 4.87285041809082, 5.167598724365234]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 10.0, 11.0, 13.0, 21.0, 24.0, 33.0, 21.0, 39.0, 37.0, 38.0, 35.0, 55.0, 47.0, 51.0, 54.0, 58.0, 53.0, 43.0, 45.0, 41.0, 29.0, 33.0, 26.0, 25.0, 31.0, 21.0, 12.0, 15.0, 9.0, 13.0, 7.0, 4.0, 4.0, 0.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.2443342208862305, -5.084080696105957, -4.923826694488525, -4.763573169708252, -4.60331916809082, -4.443065643310547, -4.282812118530273, -4.122558116912842, -3.9623045921325684, -3.802050828933716, -3.6417970657348633, -3.48154354095459, -3.3212897777557373, -3.1610360145568848, -3.0007822513580322, -2.8405284881591797, -2.680274724960327, -2.5200209617614746, -2.359767198562622, -2.1995134353637695, -2.039259910583496, -1.8790061473846436, -1.718752384185791, -1.558498740196228, -1.3982449769973755, -1.237991213798523, -1.07773756980896, -0.9174838066101074, -0.7572301030158997, -0.5969763994216919, -0.43672263622283936, -0.27646899223327637, -0.11621522903442383, 0.04403848946094513, 0.2042922079563141, 0.36454594135284424, 0.524799644947052, 0.6850533485412598, 0.8453071117401123, 1.0055607557296753, 1.1658145189285278, 1.3260682821273804, 1.4863219261169434, 1.646575689315796, 1.8068294525146484, 1.9670830965042114, 2.1273369789123535, 2.287590503692627, 2.4478442668914795, 2.608098030090332, 2.7683517932891846, 2.928605556488037, 3.0888590812683105, 3.249112844467163, 3.4093666076660156, 3.569620132446289, 3.7298741340637207, 3.8901278972625732, 4.050381660461426, 4.210635185241699, 4.370889186859131, 4.531142711639404, 4.691396713256836, 4.851650238037109, 5.011903762817383]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 17.0, 11.0, 15.0, 25.0, 43.0, 48.0, 99.0, 175.0, 298.0, 664.0, 1450.0, 3969.0, 14462.0, 116904.0, 3881082.0, 151480.0, 16367.0, 4256.0, 1483.0, 687.0, 303.0, 169.0, 97.0, 61.0, 29.0, 26.0, 17.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.0689697265625, -2.001220703125, -1.9334716796875, -1.86572265625, -1.7979736328125, -1.730224609375, -1.6624755859375, -1.5947265625, -1.5269775390625, -1.459228515625, -1.3914794921875, -1.32373046875, -1.2559814453125, -1.188232421875, -1.1204833984375, -1.052734375, -0.9849853515625, -0.917236328125, -0.8494873046875, -0.78173828125, -0.7139892578125, -0.646240234375, -0.5784912109375, -0.5107421875, -0.4429931640625, -0.375244140625, -0.3074951171875, -0.23974609375, -0.1719970703125, -0.104248046875, -0.0364990234375, 0.03125, 0.0989990234375, 0.166748046875, 0.2344970703125, 0.30224609375, 0.3699951171875, 0.437744140625, 0.5054931640625, 0.5732421875, 0.6409912109375, 0.708740234375, 0.7764892578125, 0.84423828125, 0.9119873046875, 0.979736328125, 1.0474853515625, 1.115234375, 1.1829833984375, 1.250732421875, 1.3184814453125, 1.38623046875, 1.4539794921875, 1.521728515625, 1.5894775390625, 1.6572265625, 1.7249755859375, 1.792724609375, 1.8604736328125, 1.92822265625, 1.9959716796875, 2.063720703125, 2.1314697265625, 2.19921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 19.0, 28.0, 40.0, 52.0, 91.0, 95.0, 114.0, 129.0, 106.0, 81.0, 82.0, 39.0, 38.0, 30.0, 19.0, 13.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3688812255859375, -0.357147216796875, -0.3454132080078125, -0.33367919921875, -0.3219451904296875, -0.310211181640625, -0.2984771728515625, -0.2867431640625, -0.2750091552734375, -0.263275146484375, -0.2515411376953125, -0.23980712890625, -0.2280731201171875, -0.216339111328125, -0.2046051025390625, -0.19287109375, -0.1811370849609375, -0.169403076171875, -0.1576690673828125, -0.14593505859375, -0.1342010498046875, -0.122467041015625, -0.1107330322265625, -0.0989990234375, -0.0872650146484375, -0.075531005859375, -0.0637969970703125, -0.05206298828125, -0.0403289794921875, -0.028594970703125, -0.0168609619140625, -0.005126953125, 0.0066070556640625, 0.018341064453125, 0.0300750732421875, 0.04180908203125, 0.0535430908203125, 0.065277099609375, 0.0770111083984375, 0.0887451171875, 0.1004791259765625, 0.112213134765625, 0.1239471435546875, 0.13568115234375, 0.1474151611328125, 0.159149169921875, 0.1708831787109375, 0.1826171875, 0.1943511962890625, 0.206085205078125, 0.2178192138671875, 0.22955322265625, 0.2412872314453125, 0.253021240234375, 0.2647552490234375, 0.2764892578125, 0.2882232666015625, 0.299957275390625, 0.3116912841796875, 0.32342529296875, 0.3351593017578125, 0.346893310546875, 0.3586273193359375, 0.370361328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 9.0, 19.0, 30.0, 54.0, 108.0, 217.0, 484.0, 1067.0, 2816.0, 8564.0, 45985.0, 3508525.0, 592327.0, 24177.0, 5952.0, 2197.0, 839.0, 416.0, 229.0, 106.0, 59.0, 30.0, 17.0, 17.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.722412109375, -1.65576171875, -1.589111328125, -1.5224609375, -1.455810546875, -1.38916015625, -1.322509765625, -1.255859375, -1.189208984375, -1.12255859375, -1.055908203125, -0.9892578125, -0.922607421875, -0.85595703125, -0.789306640625, -0.72265625, -0.656005859375, -0.58935546875, -0.522705078125, -0.4560546875, -0.389404296875, -0.32275390625, -0.256103515625, -0.189453125, -0.122802734375, -0.05615234375, 0.010498046875, 0.0771484375, 0.143798828125, 0.21044921875, 0.277099609375, 0.34375, 0.410400390625, 0.47705078125, 0.543701171875, 0.6103515625, 0.677001953125, 0.74365234375, 0.810302734375, 0.876953125, 0.943603515625, 1.01025390625, 1.076904296875, 1.1435546875, 1.210205078125, 1.27685546875, 1.343505859375, 1.41015625, 1.476806640625, 1.54345703125, 1.610107421875, 1.6767578125, 1.743408203125, 1.81005859375, 1.876708984375, 1.943359375, 2.010009765625, 2.07666015625, 2.143310546875, 2.2099609375, 2.276611328125, 2.34326171875, 2.409912109375, 2.4765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 9.0, 15.0, 32.0, 44.0, 122.0, 348.0, 1620.0, 1317.0, 299.0, 112.0, 55.0, 22.0, 16.0, 13.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6304931640625, -0.606201171875, -0.5819091796875, -0.5576171875, -0.5333251953125, -0.509033203125, -0.4847412109375, -0.46044921875, -0.4361572265625, -0.411865234375, -0.3875732421875, -0.36328125, -0.3389892578125, -0.314697265625, -0.2904052734375, -0.26611328125, -0.2418212890625, -0.217529296875, -0.1932373046875, -0.1689453125, -0.1446533203125, -0.120361328125, -0.0960693359375, -0.07177734375, -0.0474853515625, -0.023193359375, 0.0010986328125, 0.025390625, 0.0496826171875, 0.073974609375, 0.0982666015625, 0.12255859375, 0.1468505859375, 0.171142578125, 0.1954345703125, 0.2197265625, 0.2440185546875, 0.268310546875, 0.2926025390625, 0.31689453125, 0.3411865234375, 0.365478515625, 0.3897705078125, 0.4140625, 0.4383544921875, 0.462646484375, 0.4869384765625, 0.51123046875, 0.5355224609375, 0.559814453125, 0.5841064453125, 0.6083984375, 0.6326904296875, 0.656982421875, 0.6812744140625, 0.70556640625, 0.7298583984375, 0.754150390625, 0.7784423828125, 0.802734375, 0.8270263671875, 0.851318359375, 0.8756103515625, 0.89990234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 9.0, 20.0, 59.0, 152.0, 295.0, 284.0, 107.0, 39.0, 13.0, 6.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6997599601745605, -4.510450839996338, -4.321142196655273, -4.131833076477051, -3.9425241947174072, -3.7532153129577637, -3.563906192779541, -3.3745973110198975, -3.185288429260254, -2.9959795475006104, -2.806670665740967, -2.617361545562744, -2.4280526638031006, -2.238743782043457, -2.0494346618652344, -1.8601257801055908, -1.6708168983459473, -1.4815080165863037, -1.2921990156173706, -1.1028900146484375, -0.913581132888794, -0.7242721915245056, -0.5349632501602173, -0.3456542491912842, -0.15634536743164062, 0.032963573932647705, 0.22227251529693604, 0.41158145666122437, 0.6008903980255127, 0.790199339389801, 0.9795082807540894, 1.1688172817230225, 1.3581256866455078, 1.5474345684051514, 1.7367435693740845, 1.9260525703430176, 2.115361452102661, 2.3046703338623047, 2.4939794540405273, 2.683288335800171, 2.8725972175598145, 3.061906099319458, 3.2512149810791016, 3.440524101257324, 3.6298329830169678, 3.8191418647766113, 4.008450984954834, 4.197759628295898, 4.387068748474121, 4.576377868652344, 4.765686511993408, 4.954995632171631, 5.144304275512695, 5.333613395690918, 5.522922515869141, 5.712231636047363, 5.901540279388428, 6.09084939956665, 6.280158042907715, 6.4694671630859375, 6.65877628326416, 6.848084926605225, 7.037394046783447, 7.226702690124512, 7.416011810302734]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 13.0, 25.0, 33.0, 65.0, 90.0, 105.0, 97.0, 127.0, 110.0, 117.0, 81.0, 49.0, 36.0, 23.0, 10.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6562447547912598, -2.543438673019409, -2.4306323528289795, -2.317826271057129, -2.205019950866699, -2.0922138690948486, -1.979407787322998, -1.866601586341858, -1.7537953853607178, -1.6409891843795776, -1.5281829833984375, -1.415376901626587, -1.3025707006454468, -1.1897644996643066, -1.076958417892456, -0.9641522169113159, -0.8513460159301758, -0.7385398149490356, -0.6257336735725403, -0.5129275321960449, -0.4001213312149048, -0.28731513023376465, -0.1745089888572693, -0.061702847480773926, 0.05110335350036621, 0.16390952467918396, 0.2767156958580017, 0.38952186703681946, 0.5023280382156372, 0.6151342391967773, 0.7279403805732727, 0.8407465219497681, 0.9535527229309082, 1.0663589239120483, 1.1791651248931885, 1.291971206665039, 1.4047774076461792, 1.5175836086273193, 1.63038969039917, 1.74319589138031, 1.8560020923614502, 1.9688082933425903, 2.0816144943237305, 2.194420576095581, 2.3072266578674316, 2.4200329780578613, 2.532839059829712, 2.6456451416015625, 2.758451461791992, 2.8712575435638428, 2.9840638637542725, 3.096869945526123, 3.2096762657165527, 3.3224823474884033, 3.435288429260254, 3.5480947494506836, 3.660900831222534, 3.7737069129943848, 3.8865132331848145, 3.999319314956665, 4.112125396728516, 4.224931716918945, 4.337738037109375, 4.4505438804626465, 4.563350200653076]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 3.0, 5.0, 12.0, 8.0, 20.0, 20.0, 26.0, 49.0, 67.0, 96.0, 153.0, 216.0, 337.0, 538.0, 998.0, 1784.0, 4195.0, 15273.0, 113198.0, 628724.0, 243848.0, 27482.0, 6200.0, 2348.0, 1163.0, 645.0, 406.0, 235.0, 173.0, 96.0, 61.0, 47.0, 38.0, 35.0, 11.0, 15.0, 11.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.711578369140625, -1.65753173828125, -1.603485107421875, -1.5494384765625, -1.495391845703125, -1.44134521484375, -1.387298583984375, -1.333251953125, -1.279205322265625, -1.22515869140625, -1.171112060546875, -1.1170654296875, -1.063018798828125, -1.00897216796875, -0.954925537109375, -0.90087890625, -0.846832275390625, -0.79278564453125, -0.738739013671875, -0.6846923828125, -0.630645751953125, -0.57659912109375, -0.522552490234375, -0.468505859375, -0.414459228515625, -0.36041259765625, -0.306365966796875, -0.2523193359375, -0.198272705078125, -0.14422607421875, -0.090179443359375, -0.0361328125, 0.017913818359375, 0.07196044921875, 0.126007080078125, 0.1800537109375, 0.234100341796875, 0.28814697265625, 0.342193603515625, 0.396240234375, 0.450286865234375, 0.50433349609375, 0.558380126953125, 0.6124267578125, 0.666473388671875, 0.72052001953125, 0.774566650390625, 0.82861328125, 0.882659912109375, 0.93670654296875, 0.990753173828125, 1.0447998046875, 1.098846435546875, 1.15289306640625, 1.206939697265625, 1.260986328125, 1.315032958984375, 1.36907958984375, 1.423126220703125, 1.4771728515625, 1.531219482421875, 1.58526611328125, 1.639312744140625, 1.693359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 27.0, 49.0, 87.0, 141.0, 157.0, 168.0, 138.0, 96.0, 59.0, 37.0, 13.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447265625, -0.43018341064453125, -0.4131011962890625, -0.39601898193359375, -0.378936767578125, -0.36185455322265625, -0.3447723388671875, -0.32769012451171875, -0.31060791015625, -0.29352569580078125, -0.2764434814453125, -0.25936126708984375, -0.242279052734375, -0.22519683837890625, -0.2081146240234375, -0.19103240966796875, -0.1739501953125, -0.15686798095703125, -0.1397857666015625, -0.12270355224609375, -0.105621337890625, -0.08853912353515625, -0.0714569091796875, -0.05437469482421875, -0.03729248046875, -0.02021026611328125, -0.0031280517578125, 0.01395416259765625, 0.031036376953125, 0.04811859130859375, 0.0652008056640625, 0.08228302001953125, 0.099365234375, 0.11644744873046875, 0.1335296630859375, 0.15061187744140625, 0.167694091796875, 0.18477630615234375, 0.2018585205078125, 0.21894073486328125, 0.23602294921875, 0.25310516357421875, 0.2701873779296875, 0.28726959228515625, 0.304351806640625, 0.32143402099609375, 0.3385162353515625, 0.35559844970703125, 0.3726806640625, 0.38976287841796875, 0.4068450927734375, 0.42392730712890625, 0.441009521484375, 0.45809173583984375, 0.4751739501953125, 0.49225616455078125, 0.50933837890625, 0.5264205932617188, 0.5435028076171875, 0.5605850219726562, 0.577667236328125, 0.5947494506835938, 0.6118316650390625, 0.6289138793945312, 0.64599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 13.0, 12.0, 14.0, 15.0, 37.0, 47.0, 64.0, 82.0, 150.0, 226.0, 381.0, 687.0, 1269.0, 2638.0, 5944.0, 14561.0, 38778.0, 107195.0, 260445.0, 332837.0, 176050.0, 65581.0, 23779.0, 9364.0, 3985.0, 1902.0, 1018.0, 563.0, 333.0, 197.0, 141.0, 73.0, 55.0, 35.0, 27.0, 13.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6384124755859375, -0.618621826171875, -0.5988311767578125, -0.57904052734375, -0.5592498779296875, -0.539459228515625, -0.5196685791015625, -0.4998779296875, -0.4800872802734375, -0.460296630859375, -0.4405059814453125, -0.42071533203125, -0.4009246826171875, -0.381134033203125, -0.3613433837890625, -0.341552734375, -0.3217620849609375, -0.301971435546875, -0.2821807861328125, -0.26239013671875, -0.2425994873046875, -0.222808837890625, -0.2030181884765625, -0.1832275390625, -0.1634368896484375, -0.143646240234375, -0.1238555908203125, -0.10406494140625, -0.0842742919921875, -0.064483642578125, -0.0446929931640625, -0.02490234375, -0.0051116943359375, 0.014678955078125, 0.0344696044921875, 0.05426025390625, 0.0740509033203125, 0.093841552734375, 0.1136322021484375, 0.1334228515625, 0.1532135009765625, 0.173004150390625, 0.1927947998046875, 0.21258544921875, 0.2323760986328125, 0.252166748046875, 0.2719573974609375, 0.291748046875, 0.3115386962890625, 0.331329345703125, 0.3511199951171875, 0.37091064453125, 0.3907012939453125, 0.410491943359375, 0.4302825927734375, 0.4500732421875, 0.4698638916015625, 0.489654541015625, 0.5094451904296875, 0.52923583984375, 0.5490264892578125, 0.568817138671875, 0.5886077880859375, 0.6083984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 11.0, 12.0, 7.0, 10.0, 14.0, 19.0, 21.0, 30.0, 35.0, 25.0, 26.0, 46.0, 45.0, 51.0, 44.0, 48.0, 53.0, 47.0, 57.0, 49.0, 47.0, 39.0, 31.0, 33.0, 33.0, 27.0, 23.0, 23.0, 12.0, 13.0, 11.0, 10.0, 13.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.828125, -0.8059234619140625, -0.783721923828125, -0.7615203857421875, -0.73931884765625, -0.7171173095703125, -0.694915771484375, -0.6727142333984375, -0.6505126953125, -0.6283111572265625, -0.606109619140625, -0.5839080810546875, -0.56170654296875, -0.5395050048828125, -0.517303466796875, -0.4951019287109375, -0.472900390625, -0.4506988525390625, -0.428497314453125, -0.4062957763671875, -0.38409423828125, -0.3618927001953125, -0.339691162109375, -0.3174896240234375, -0.2952880859375, -0.2730865478515625, -0.250885009765625, -0.2286834716796875, -0.20648193359375, -0.1842803955078125, -0.162078857421875, -0.1398773193359375, -0.11767578125, -0.0954742431640625, -0.073272705078125, -0.0510711669921875, -0.02886962890625, -0.0066680908203125, 0.015533447265625, 0.0377349853515625, 0.0599365234375, 0.0821380615234375, 0.104339599609375, 0.1265411376953125, 0.14874267578125, 0.1709442138671875, 0.193145751953125, 0.2153472900390625, 0.237548828125, 0.2597503662109375, 0.281951904296875, 0.3041534423828125, 0.32635498046875, 0.3485565185546875, 0.370758056640625, 0.3929595947265625, 0.4151611328125, 0.4373626708984375, 0.459564208984375, 0.4817657470703125, 0.50396728515625, 0.5261688232421875, 0.548370361328125, 0.5705718994140625, 0.5927734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 10.0, 15.0, 16.0, 17.0, 27.0, 29.0, 40.0, 78.0, 111.0, 147.0, 207.0, 359.0, 662.0, 1394.0, 3212.0, 9475.0, 43817.0, 356741.0, 532221.0, 78019.0, 13929.0, 4310.0, 1652.0, 812.0, 426.0, 242.0, 167.0, 115.0, 64.0, 56.0, 45.0, 21.0, 26.0, 12.0, 17.0, 13.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44775390625, -0.4333763122558594, -0.41899871826171875, -0.4046211242675781, -0.3902435302734375, -0.3758659362792969, -0.36148834228515625, -0.3471107482910156, -0.332733154296875, -0.3183555603027344, -0.30397796630859375, -0.2896003723144531, -0.2752227783203125, -0.2608451843261719, -0.24646759033203125, -0.23208999633789062, -0.21771240234375, -0.20333480834960938, -0.18895721435546875, -0.17457962036132812, -0.1602020263671875, -0.14582443237304688, -0.13144683837890625, -0.11706924438476562, -0.102691650390625, -0.08831405639648438, -0.07393646240234375, -0.059558868408203125, -0.0451812744140625, -0.030803680419921875, -0.01642608642578125, -0.002048492431640625, 0.0123291015625, 0.026706695556640625, 0.04108428955078125, 0.055461883544921875, 0.0698394775390625, 0.08421707153320312, 0.09859466552734375, 0.11297225952148438, 0.127349853515625, 0.14172744750976562, 0.15610504150390625, 0.17048263549804688, 0.1848602294921875, 0.19923782348632812, 0.21361541748046875, 0.22799301147460938, 0.24237060546875, 0.2567481994628906, 0.27112579345703125, 0.2855033874511719, 0.2998809814453125, 0.3142585754394531, 0.32863616943359375, 0.3430137634277344, 0.357391357421875, 0.3717689514160156, 0.38614654541015625, 0.4005241394042969, 0.4149017333984375, 0.4292793273925781, 0.44365692138671875, 0.4580345153808594, 0.472412109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 7.0, 6.0, 17.0, 18.0, 38.0, 53.0, 82.0, 101.0, 113.0, 128.0, 95.0, 98.0, 71.0, 53.0, 33.0, 32.0, 14.0, 16.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.26716423034668e-05, -8.011981844902039e-05, -7.756799459457397e-05, -7.501617074012756e-05, -7.246434688568115e-05, -6.991252303123474e-05, -6.736069917678833e-05, -6.480887532234192e-05, -6.225705146789551e-05, -5.97052276134491e-05, -5.7153403759002686e-05, -5.4601579904556274e-05, -5.204975605010986e-05, -4.949793219566345e-05, -4.694610834121704e-05, -4.439428448677063e-05, -4.184246063232422e-05, -3.929063677787781e-05, -3.6738812923431396e-05, -3.4186989068984985e-05, -3.1635165214538574e-05, -2.9083341360092163e-05, -2.6531517505645752e-05, -2.397969365119934e-05, -2.142786979675293e-05, -1.887604594230652e-05, -1.6324222087860107e-05, -1.3772398233413696e-05, -1.1220574378967285e-05, -8.668750524520874e-06, -6.116926670074463e-06, -3.5651028156280518e-06, -1.0132789611816406e-06, 1.5385448932647705e-06, 4.090368747711182e-06, 6.642192602157593e-06, 9.194016456604004e-06, 1.1745840311050415e-05, 1.4297664165496826e-05, 1.6849488019943237e-05, 1.940131187438965e-05, 2.195313572883606e-05, 2.450495958328247e-05, 2.7056783437728882e-05, 2.9608607292175293e-05, 3.2160431146621704e-05, 3.4712255001068115e-05, 3.7264078855514526e-05, 3.981590270996094e-05, 4.236772656440735e-05, 4.491955041885376e-05, 4.747137427330017e-05, 5.002319812774658e-05, 5.257502198219299e-05, 5.5126845836639404e-05, 5.7678669691085815e-05, 6.0230493545532227e-05, 6.278231739997864e-05, 6.533414125442505e-05, 6.788596510887146e-05, 7.043778896331787e-05, 7.298961281776428e-05, 7.55414366722107e-05, 7.80932605266571e-05, 8.064508438110352e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 17.0, 17.0, 37.0, 51.0, 75.0, 133.0, 225.0, 404.0, 761.0, 1594.0, 3680.0, 9744.0, 32624.0, 156958.0, 491402.0, 271699.0, 55068.0, 14685.0, 4995.0, 2087.0, 1013.0, 510.0, 287.0, 179.0, 108.0, 65.0, 35.0, 30.0, 26.0, 12.0, 10.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.33306884765625, -0.3228759765625, -0.31268310546875, -0.302490234375, -0.29229736328125, -0.2821044921875, -0.27191162109375, -0.26171875, -0.25152587890625, -0.2413330078125, -0.23114013671875, -0.220947265625, -0.21075439453125, -0.2005615234375, -0.19036865234375, -0.18017578125, -0.16998291015625, -0.1597900390625, -0.14959716796875, -0.139404296875, -0.12921142578125, -0.1190185546875, -0.10882568359375, -0.0986328125, -0.08843994140625, -0.0782470703125, -0.06805419921875, -0.057861328125, -0.04766845703125, -0.0374755859375, -0.02728271484375, -0.01708984375, -0.00689697265625, 0.0032958984375, 0.01348876953125, 0.023681640625, 0.03387451171875, 0.0440673828125, 0.05426025390625, 0.064453125, 0.07464599609375, 0.0848388671875, 0.09503173828125, 0.105224609375, 0.11541748046875, 0.1256103515625, 0.13580322265625, 0.14599609375, 0.15618896484375, 0.1663818359375, 0.17657470703125, 0.186767578125, 0.19696044921875, 0.2071533203125, 0.21734619140625, 0.2275390625, 0.23773193359375, 0.2479248046875, 0.25811767578125, 0.268310546875, 0.27850341796875, 0.2886962890625, 0.29888916015625, 0.30908203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 13.0, 11.0, 17.0, 17.0, 37.0, 29.0, 53.0, 78.0, 83.0, 120.0, 87.0, 121.0, 94.0, 44.0, 59.0, 28.0, 25.0, 16.0, 13.0, 13.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.414794921875, -0.40430450439453125, -0.3938140869140625, -0.38332366943359375, -0.372833251953125, -0.36234283447265625, -0.3518524169921875, -0.34136199951171875, -0.33087158203125, -0.32038116455078125, -0.3098907470703125, -0.29940032958984375, -0.288909912109375, -0.27841949462890625, -0.2679290771484375, -0.25743865966796875, -0.2469482421875, -0.23645782470703125, -0.2259674072265625, -0.21547698974609375, -0.204986572265625, -0.19449615478515625, -0.1840057373046875, -0.17351531982421875, -0.16302490234375, -0.15253448486328125, -0.1420440673828125, -0.13155364990234375, -0.121063232421875, -0.11057281494140625, -0.1000823974609375, -0.08959197998046875, -0.0791015625, -0.06861114501953125, -0.0581207275390625, -0.04763031005859375, -0.037139892578125, -0.02664947509765625, -0.0161590576171875, -0.00566864013671875, 0.00482177734375, 0.01531219482421875, 0.0258026123046875, 0.03629302978515625, 0.046783447265625, 0.05727386474609375, 0.0677642822265625, 0.07825469970703125, 0.0887451171875, 0.09923553466796875, 0.1097259521484375, 0.12021636962890625, 0.130706787109375, 0.14119720458984375, 0.1516876220703125, 0.16217803955078125, 0.17266845703125, 0.18315887451171875, 0.1936492919921875, 0.20413970947265625, 0.214630126953125, 0.22512054443359375, 0.2356109619140625, 0.24610137939453125, 0.256591796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 11.0, 34.0, 45.0, 73.0, 118.0, 156.0, 195.0, 137.0, 93.0, 55.0, 38.0, 13.0, 7.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.495314598083496, -6.294703483581543, -6.094092845916748, -5.893482208251953, -5.69287109375, -5.492259979248047, -5.291649341583252, -5.091038703918457, -4.890427589416504, -4.689816474914551, -4.489205837249756, -4.288595199584961, -4.087984085083008, -3.887373208999634, -3.6867623329162598, -3.4861514568328857, -3.2855405807495117, -3.0849297046661377, -2.8843188285827637, -2.6837079524993896, -2.4830970764160156, -2.2824862003326416, -2.0818753242492676, -1.8812644481658936, -1.6806535720825195, -1.4800426959991455, -1.2794318199157715, -1.0788209438323975, -0.8782100677490234, -0.6775991916656494, -0.4769883155822754, -0.27637743949890137, -0.07576656341552734, 0.12484431266784668, 0.3254551887512207, 0.5260660648345947, 0.7266769409179688, 0.9272878170013428, 1.1278986930847168, 1.3285095691680908, 1.5291204452514648, 1.7297313213348389, 1.930342197418213, 2.130953073501587, 2.331563949584961, 2.532174825668335, 2.732785701751709, 2.933396577835083, 3.134007453918457, 3.334618330001831, 3.535229206085205, 3.735840082168579, 3.936450958251953, 4.137062072753906, 4.337672710418701, 4.538283348083496, 4.738894462585449, 4.939505577087402, 5.140116214752197, 5.340726852416992, 5.541337966918945, 5.741949081420898, 5.942559719085693, 6.143170356750488, 6.343781471252441]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 6.0, 13.0, 26.0, 31.0, 29.0, 46.0, 53.0, 59.0, 60.0, 61.0, 66.0, 70.0, 87.0, 70.0, 57.0, 44.0, 46.0, 42.0, 32.0, 33.0, 12.0, 16.0, 9.0, 5.0, 10.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.679933071136475, -7.50173807144165, -7.323543548583984, -7.14534854888916, -6.967154026031494, -6.78895902633667, -6.610764503479004, -6.43256950378418, -6.2543745040893555, -6.076179504394531, -5.897984981536865, -5.719789981842041, -5.541595458984375, -5.363400459289551, -5.185205459594727, -5.0070109367370605, -4.8288164138793945, -4.65062141418457, -4.472426891326904, -4.29423189163208, -4.116037368774414, -3.93784236907959, -3.7596476078033447, -3.5814528465270996, -3.4032580852508545, -3.2250633239746094, -3.0468685626983643, -2.868673801422119, -2.690478801727295, -2.512284278869629, -2.3340892791748047, -2.1558945178985596, -1.9776997566223145, -1.7995049953460693, -1.6213102340698242, -1.4431153535842896, -1.2649205923080444, -1.0867258310317993, -0.9085309505462646, -0.7303361892700195, -0.5521414279937744, -0.3739466369152069, -0.1957518458366394, -0.01755702495574951, 0.1606377363204956, 0.3388324975967407, 0.5170273780822754, 0.6952221393585205, 0.8734169006347656, 1.0516116619110107, 1.2298064231872559, 1.4080013036727905, 1.5861960649490356, 1.7643908262252808, 1.9425857067108154, 2.1207804679870605, 2.2989752292633057, 2.477169990539551, 2.655364751815796, 2.833559513092041, 3.0117545127868652, 3.1899490356445312, 3.3681440353393555, 3.5463387966156006, 3.7245335578918457]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 12.0, 14.0, 19.0, 64.0, 143.0, 383.0, 1597.0, 20587.0, 4150592.0, 18907.0, 1332.0, 369.0, 140.0, 55.0, 34.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.771453857421875, -2.64251708984375, -2.513580322265625, -2.3846435546875, -2.255706787109375, -2.12677001953125, -1.997833251953125, -1.868896484375, -1.739959716796875, -1.61102294921875, -1.482086181640625, -1.3531494140625, -1.224212646484375, -1.09527587890625, -0.966339111328125, -0.83740234375, -0.708465576171875, -0.57952880859375, -0.450592041015625, -0.3216552734375, -0.192718505859375, -0.06378173828125, 0.065155029296875, 0.194091796875, 0.323028564453125, 0.45196533203125, 0.580902099609375, 0.7098388671875, 0.838775634765625, 0.96771240234375, 1.096649169921875, 1.2255859375, 1.354522705078125, 1.48345947265625, 1.612396240234375, 1.7413330078125, 1.870269775390625, 1.99920654296875, 2.128143310546875, 2.257080078125, 2.386016845703125, 2.51495361328125, 2.643890380859375, 2.7728271484375, 2.901763916015625, 3.03070068359375, 3.159637451171875, 3.28857421875, 3.417510986328125, 3.54644775390625, 3.675384521484375, 3.8043212890625, 3.933258056640625, 4.06219482421875, 4.191131591796875, 4.320068359375, 4.449005126953125, 4.57794189453125, 4.706878662109375, 4.8358154296875, 4.964752197265625, 5.09368896484375, 5.222625732421875, 5.3515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 5.0, 10.0, 21.0, 47.0, 77.0, 105.0, 160.0, 147.0, 140.0, 126.0, 66.0, 52.0, 24.0, 11.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416748046875, -0.3997306823730469, -0.38271331787109375, -0.3656959533691406, -0.3486785888671875, -0.3316612243652344, -0.31464385986328125, -0.2976264953613281, -0.280609130859375, -0.2635917663574219, -0.24657440185546875, -0.22955703735351562, -0.2125396728515625, -0.19552230834960938, -0.17850494384765625, -0.16148757934570312, -0.14447021484375, -0.12745285034179688, -0.11043548583984375, -0.09341812133789062, -0.0764007568359375, -0.059383392333984375, -0.04236602783203125, -0.025348663330078125, -0.008331298828125, 0.008686065673828125, 0.02570343017578125, 0.042720794677734375, 0.0597381591796875, 0.07675552368164062, 0.09377288818359375, 0.11079025268554688, 0.1278076171875, 0.14482498168945312, 0.16184234619140625, 0.17885971069335938, 0.1958770751953125, 0.21289443969726562, 0.22991180419921875, 0.24692916870117188, 0.263946533203125, 0.2809638977050781, 0.29798126220703125, 0.3149986267089844, 0.3320159912109375, 0.3490333557128906, 0.36605072021484375, 0.3830680847167969, 0.40008544921875, 0.4171028137207031, 0.43412017822265625, 0.4511375427246094, 0.4681549072265625, 0.4851722717285156, 0.5021896362304688, 0.5192070007324219, 0.536224365234375, 0.5532417297363281, 0.5702590942382812, 0.5872764587402344, 0.6042938232421875, 0.6213111877441406, 0.6383285522460938, 0.6553459167480469, 0.67236328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 17.0, 24.0, 39.0, 43.0, 78.0, 125.0, 195.0, 345.0, 684.0, 1491.0, 3740.0, 11610.0, 51101.0, 695298.0, 3278450.0, 120242.0, 20357.0, 5949.0, 2220.0, 964.0, 498.0, 292.0, 168.0, 86.0, 69.0, 46.0, 32.0, 22.0, 21.0, 15.0, 10.0, 8.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.798828125, -0.7705078125, -0.7421875, -0.7138671875, -0.685546875, -0.6572265625, -0.62890625, -0.6005859375, -0.572265625, -0.5439453125, -0.515625, -0.4873046875, -0.458984375, -0.4306640625, -0.40234375, -0.3740234375, -0.345703125, -0.3173828125, -0.2890625, -0.2607421875, -0.232421875, -0.2041015625, -0.17578125, -0.1474609375, -0.119140625, -0.0908203125, -0.0625, -0.0341796875, -0.005859375, 0.0224609375, 0.05078125, 0.0791015625, 0.107421875, 0.1357421875, 0.1640625, 0.1923828125, 0.220703125, 0.2490234375, 0.27734375, 0.3056640625, 0.333984375, 0.3623046875, 0.390625, 0.4189453125, 0.447265625, 0.4755859375, 0.50390625, 0.5322265625, 0.560546875, 0.5888671875, 0.6171875, 0.6455078125, 0.673828125, 0.7021484375, 0.73046875, 0.7587890625, 0.787109375, 0.8154296875, 0.84375, 0.8720703125, 0.900390625, 0.9287109375, 0.95703125, 0.9853515625, 1.013671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 8.0, 13.0, 24.0, 16.0, 19.0, 52.0, 96.0, 169.0, 415.0, 1437.0, 1080.0, 337.0, 159.0, 102.0, 39.0, 27.0, 14.0, 19.0, 12.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230712890625, -0.22019195556640625, -0.2096710205078125, -0.19915008544921875, -0.188629150390625, -0.17810821533203125, -0.1675872802734375, -0.15706634521484375, -0.14654541015625, -0.13602447509765625, -0.1255035400390625, -0.11498260498046875, -0.104461669921875, -0.09394073486328125, -0.0834197998046875, -0.07289886474609375, -0.0623779296875, -0.05185699462890625, -0.0413360595703125, -0.03081512451171875, -0.020294189453125, -0.00977325439453125, 0.0007476806640625, 0.01126861572265625, 0.02178955078125, 0.03231048583984375, 0.0428314208984375, 0.05335235595703125, 0.063873291015625, 0.07439422607421875, 0.0849151611328125, 0.09543609619140625, 0.10595703125, 0.11647796630859375, 0.1269989013671875, 0.13751983642578125, 0.148040771484375, 0.15856170654296875, 0.1690826416015625, 0.17960357666015625, 0.19012451171875, 0.20064544677734375, 0.2111663818359375, 0.22168731689453125, 0.232208251953125, 0.24272918701171875, 0.2532501220703125, 0.26377105712890625, 0.2742919921875, 0.28481292724609375, 0.2953338623046875, 0.30585479736328125, 0.316375732421875, 0.32689666748046875, 0.3374176025390625, 0.34793853759765625, 0.35845947265625, 0.36898040771484375, 0.3795013427734375, 0.39002227783203125, 0.400543212890625, 0.41106414794921875, 0.4215850830078125, 0.43210601806640625, 0.442626953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 11.0, 30.0, 79.0, 176.0, 272.0, 243.0, 131.0, 37.0, 15.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6337122917175293, -1.5219603776931763, -1.4102085828781128, -1.2984566688537598, -1.1867048740386963, -1.0749529600143433, -0.9632010459899902, -0.851449191570282, -0.7396973371505737, -0.6279454827308655, -0.5161936283111572, -0.4044417142868042, -0.29268985986709595, -0.1809380054473877, -0.06918609142303467, 0.042565762996673584, 0.15431761741638184, 0.2660694718360901, 0.3778213560581207, 0.48957324028015137, 0.6013250946998596, 0.7130769491195679, 0.8248288631439209, 0.9365807175636292, 1.0483325719833374, 1.1600844860076904, 1.271836280822754, 1.383588194847107, 1.49534010887146, 1.6070919036865234, 1.7188438177108765, 1.8305957317352295, 1.942347526550293, 2.0540993213653564, 2.165851354598999, 2.2776031494140625, 2.389354944229126, 2.5011067390441895, 2.612858772277832, 2.7246105670928955, 2.836362361907959, 2.9481141567230225, 3.059866189956665, 3.1716179847717285, 3.283369779586792, 3.3951215744018555, 3.506873607635498, 3.6186254024505615, 3.730377435684204, 3.8421292304992676, 3.95388126373291, 4.0656328201293945, 4.177384853363037, 4.28913688659668, 4.400888442993164, 4.512640476226807, 4.624392509460449, 4.736144542694092, 4.847896099090576, 4.959648132324219, 5.071400165557861, 5.183151721954346, 5.294903755187988, 5.406655788421631, 5.518407344818115]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 9.0, 13.0, 26.0, 25.0, 23.0, 38.0, 49.0, 65.0, 73.0, 74.0, 73.0, 73.0, 89.0, 73.0, 48.0, 51.0, 43.0, 28.0, 33.0, 24.0, 26.0, 14.0, 10.0, 13.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8544617295265198, -0.8084994554519653, -0.7625371813774109, -0.7165749073028564, -0.670612633228302, -0.6246503591537476, -0.5786880254745483, -0.5327258110046387, -0.48676350712776184, -0.4408012330532074, -0.39483895897865295, -0.3488766551017761, -0.3029143810272217, -0.25695210695266724, -0.2109898328781128, -0.16502755880355835, -0.1190652847290039, -0.07310301065444946, -0.027140729129314423, 0.018821552395820618, 0.06478382647037506, 0.1107461005449295, 0.15670838952064514, 0.20267066359519958, 0.24863293766975403, 0.29459521174430847, 0.3405574858188629, 0.38651978969573975, 0.4324820637702942, 0.47844433784484863, 0.5244066119194031, 0.5703688859939575, 0.6163312196731567, 0.6622934937477112, 0.7082557678222656, 0.7542180418968201, 0.8001803159713745, 0.846142590045929, 0.8921048641204834, 0.9380671977996826, 0.9840294122695923, 1.0299917459487915, 1.0759539604187012, 1.1219162940979004, 1.16787850856781, 1.2138408422470093, 1.259803056716919, 1.3057653903961182, 1.3517277240753174, 1.3976900577545166, 1.4436522722244263, 1.4896146059036255, 1.5355768203735352, 1.5815391540527344, 1.627501368522644, 1.6734637022018433, 1.719425916671753, 1.7653882503509521, 1.8113504648208618, 1.857312798500061, 1.9032750129699707, 1.94923734664917, 1.9951995611190796, 2.0411617755889893, 2.0871241092681885]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 12.0, 14.0, 13.0, 19.0, 28.0, 38.0, 61.0, 108.0, 139.0, 204.0, 324.0, 550.0, 872.0, 1466.0, 3145.0, 9094.0, 46416.0, 337429.0, 530089.0, 94448.0, 14897.0, 4418.0, 1899.0, 1057.0, 644.0, 402.0, 239.0, 160.0, 104.0, 72.0, 51.0, 32.0, 37.0, 21.0, 13.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4462890625, -1.3983612060546875, -1.350433349609375, -1.3025054931640625, -1.25457763671875, -1.2066497802734375, -1.158721923828125, -1.1107940673828125, -1.0628662109375, -1.0149383544921875, -0.967010498046875, -0.9190826416015625, -0.87115478515625, -0.8232269287109375, -0.775299072265625, -0.7273712158203125, -0.679443359375, -0.6315155029296875, -0.583587646484375, -0.5356597900390625, -0.48773193359375, -0.4398040771484375, -0.391876220703125, -0.3439483642578125, -0.2960205078125, -0.2480926513671875, -0.200164794921875, -0.1522369384765625, -0.10430908203125, -0.0563812255859375, -0.008453369140625, 0.0394744873046875, 0.08740234375, 0.1353302001953125, 0.183258056640625, 0.2311859130859375, 0.27911376953125, 0.3270416259765625, 0.374969482421875, 0.4228973388671875, 0.4708251953125, 0.5187530517578125, 0.566680908203125, 0.6146087646484375, 0.66253662109375, 0.7104644775390625, 0.758392333984375, 0.8063201904296875, 0.854248046875, 0.9021759033203125, 0.950103759765625, 0.9980316162109375, 1.04595947265625, 1.0938873291015625, 1.141815185546875, 1.1897430419921875, 1.2376708984375, 1.2855987548828125, 1.333526611328125, 1.3814544677734375, 1.42938232421875, 1.4773101806640625, 1.525238037109375, 1.5731658935546875, 1.62109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 1.0, 4.0, 4.0, 9.0, 19.0, 44.0, 77.0, 104.0, 142.0, 165.0, 151.0, 123.0, 70.0, 47.0, 26.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4030723571777344, -0.38597869873046875, -0.3688850402832031, -0.3517913818359375, -0.3346977233886719, -0.31760406494140625, -0.3005104064941406, -0.283416748046875, -0.2663230895996094, -0.24922943115234375, -0.23213577270507812, -0.2150421142578125, -0.19794845581054688, -0.18085479736328125, -0.16376113891601562, -0.14666748046875, -0.12957382202148438, -0.11248016357421875, -0.09538650512695312, -0.0782928466796875, -0.061199188232421875, -0.04410552978515625, -0.027011871337890625, -0.009918212890625, 0.007175445556640625, 0.02426910400390625, 0.041362762451171875, 0.0584564208984375, 0.07555007934570312, 0.09264373779296875, 0.10973739624023438, 0.1268310546875, 0.14392471313476562, 0.16101837158203125, 0.17811203002929688, 0.1952056884765625, 0.21229934692382812, 0.22939300537109375, 0.24648666381835938, 0.263580322265625, 0.2806739807128906, 0.29776763916015625, 0.3148612976074219, 0.3319549560546875, 0.3490486145019531, 0.36614227294921875, 0.3832359313964844, 0.40032958984375, 0.4174232482910156, 0.43451690673828125, 0.4516105651855469, 0.4687042236328125, 0.4857978820800781, 0.5028915405273438, 0.5199851989746094, 0.537078857421875, 0.5541725158691406, 0.5712661743164062, 0.5883598327636719, 0.6054534912109375, 0.6225471496582031, 0.6396408081054688, 0.6567344665527344, 0.673828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 13.0, 12.0, 18.0, 43.0, 49.0, 80.0, 110.0, 181.0, 288.0, 432.0, 809.0, 1471.0, 3068.0, 6603.0, 16276.0, 42173.0, 114131.0, 269195.0, 325726.0, 165239.0, 61466.0, 23411.0, 9286.0, 4054.0, 1952.0, 1045.0, 547.0, 310.0, 181.0, 113.0, 81.0, 48.0, 35.0, 30.0, 15.0, 17.0, 9.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.640625, -0.6224212646484375, -0.604217529296875, -0.5860137939453125, -0.56781005859375, -0.5496063232421875, -0.531402587890625, -0.5131988525390625, -0.4949951171875, -0.4767913818359375, -0.458587646484375, -0.4403839111328125, -0.42218017578125, -0.4039764404296875, -0.385772705078125, -0.3675689697265625, -0.349365234375, -0.3311614990234375, -0.312957763671875, -0.2947540283203125, -0.27655029296875, -0.2583465576171875, -0.240142822265625, -0.2219390869140625, -0.2037353515625, -0.1855316162109375, -0.167327880859375, -0.1491241455078125, -0.13092041015625, -0.1127166748046875, -0.094512939453125, -0.0763092041015625, -0.05810546875, -0.0399017333984375, -0.021697998046875, -0.0034942626953125, 0.01470947265625, 0.0329132080078125, 0.051116943359375, 0.0693206787109375, 0.0875244140625, 0.1057281494140625, 0.123931884765625, 0.1421356201171875, 0.16033935546875, 0.1785430908203125, 0.196746826171875, 0.2149505615234375, 0.233154296875, 0.2513580322265625, 0.269561767578125, 0.2877655029296875, 0.30596923828125, 0.3241729736328125, 0.342376708984375, 0.3605804443359375, 0.3787841796875, 0.3969879150390625, 0.415191650390625, 0.4333953857421875, 0.45159912109375, 0.4698028564453125, 0.488006591796875, 0.5062103271484375, 0.5244140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 10.0, 10.0, 13.0, 23.0, 24.0, 27.0, 32.0, 38.0, 25.0, 35.0, 39.0, 42.0, 67.0, 51.0, 49.0, 53.0, 52.0, 37.0, 53.0, 52.0, 38.0, 25.0, 31.0, 32.0, 26.0, 16.0, 16.0, 14.0, 11.0, 11.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7675399780273438, -0.7430877685546875, -0.7186355590820312, -0.694183349609375, -0.6697311401367188, -0.6452789306640625, -0.6208267211914062, -0.59637451171875, -0.5719223022460938, -0.5474700927734375, -0.5230178833007812, -0.498565673828125, -0.47411346435546875, -0.4496612548828125, -0.42520904541015625, -0.4007568359375, -0.37630462646484375, -0.3518524169921875, -0.32740020751953125, -0.302947998046875, -0.27849578857421875, -0.2540435791015625, -0.22959136962890625, -0.20513916015625, -0.18068695068359375, -0.1562347412109375, -0.13178253173828125, -0.107330322265625, -0.08287811279296875, -0.0584259033203125, -0.03397369384765625, -0.009521484375, 0.01493072509765625, 0.0393829345703125, 0.06383514404296875, 0.088287353515625, 0.11273956298828125, 0.1371917724609375, 0.16164398193359375, 0.18609619140625, 0.21054840087890625, 0.2350006103515625, 0.25945281982421875, 0.283905029296875, 0.30835723876953125, 0.3328094482421875, 0.35726165771484375, 0.3817138671875, 0.40616607666015625, 0.4306182861328125, 0.45507049560546875, 0.479522705078125, 0.5039749145507812, 0.5284271240234375, 0.5528793334960938, 0.57733154296875, 0.6017837524414062, 0.6262359619140625, 0.6506881713867188, 0.675140380859375, 0.6995925903320312, 0.7240447998046875, 0.7484970092773438, 0.77294921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 10.0, 11.0, 19.0, 32.0, 77.0, 125.0, 228.0, 418.0, 964.0, 2407.0, 9227.0, 62138.0, 435082.0, 455972.0, 67280.0, 9994.0, 2674.0, 990.0, 407.0, 216.0, 117.0, 63.0, 30.0, 24.0, 20.0, 10.0, 3.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317626953125, -0.304931640625, -0.292236328125, -0.279541015625, -0.266845703125, -0.254150390625, -0.241455078125, -0.228759765625, -0.216064453125, -0.203369140625, -0.190673828125, -0.177978515625, -0.165283203125, -0.152587890625, -0.139892578125, -0.127197265625, -0.114501953125, -0.101806640625, -0.089111328125, -0.076416015625, -0.063720703125, -0.051025390625, -0.038330078125, -0.025634765625, -0.012939453125, -0.000244140625, 0.012451171875, 0.025146484375, 0.037841796875, 0.050537109375, 0.063232421875, 0.075927734375, 0.088623046875, 0.101318359375, 0.114013671875, 0.126708984375, 0.139404296875, 0.152099609375, 0.164794921875, 0.177490234375, 0.190185546875, 0.202880859375, 0.215576171875, 0.228271484375, 0.240966796875, 0.253662109375, 0.266357421875, 0.279052734375, 0.291748046875, 0.304443359375, 0.317138671875, 0.329833984375, 0.342529296875, 0.355224609375, 0.367919921875, 0.380615234375, 0.393310546875, 0.406005859375, 0.418701171875, 0.431396484375, 0.444091796875, 0.456787109375, 0.469482421875, 0.482177734375, 0.494873046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 8.0, 11.0, 24.0, 23.0, 51.0, 69.0, 75.0, 102.0, 98.0, 95.0, 102.0, 76.0, 62.0, 40.0, 47.0, 38.0, 20.0, 12.0, 14.0, 6.0, 9.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.666515350341797e-05, -8.45668837428093e-05, -8.246861398220062e-05, -8.037034422159195e-05, -7.827207446098328e-05, -7.61738047003746e-05, -7.407553493976593e-05, -7.197726517915726e-05, -6.987899541854858e-05, -6.778072565793991e-05, -6.568245589733124e-05, -6.358418613672256e-05, -6.148591637611389e-05, -5.938764661550522e-05, -5.7289376854896545e-05, -5.519110709428787e-05, -5.30928373336792e-05, -5.0994567573070526e-05, -4.889629781246185e-05, -4.679802805185318e-05, -4.469975829124451e-05, -4.2601488530635834e-05, -4.050321877002716e-05, -3.840494900941849e-05, -3.6306679248809814e-05, -3.420840948820114e-05, -3.211013972759247e-05, -3.0011869966983795e-05, -2.7913600206375122e-05, -2.581533044576645e-05, -2.3717060685157776e-05, -2.1618790924549103e-05, -1.952052116394043e-05, -1.7422251403331757e-05, -1.5323981642723083e-05, -1.322571188211441e-05, -1.1127442121505737e-05, -9.029172360897064e-06, -6.930902600288391e-06, -4.832632839679718e-06, -2.734363079071045e-06, -6.360933184623718e-07, 1.4621764421463013e-06, 3.5604462027549744e-06, 5.6587159633636475e-06, 7.75698572397232e-06, 9.855255484580994e-06, 1.1953525245189667e-05, 1.405179500579834e-05, 1.6150064766407013e-05, 1.8248334527015686e-05, 2.034660428762436e-05, 2.2444874048233032e-05, 2.4543143808841705e-05, 2.664141356945038e-05, 2.873968333005905e-05, 3.0837953090667725e-05, 3.29362228512764e-05, 3.503449261188507e-05, 3.7132762372493744e-05, 3.923103213310242e-05, 4.132930189371109e-05, 4.342757165431976e-05, 4.5525841414928436e-05, 4.762411117553711e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 11.0, 19.0, 14.0, 22.0, 36.0, 73.0, 100.0, 168.0, 262.0, 497.0, 956.0, 1947.0, 4636.0, 14477.0, 53751.0, 207791.0, 422933.0, 246236.0, 66952.0, 17400.0, 5703.0, 2141.0, 1029.0, 557.0, 317.0, 179.0, 107.0, 76.0, 50.0, 28.0, 17.0, 14.0, 7.0, 8.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.26904296875, -0.2610301971435547, -0.2530174255371094, -0.24500465393066406, -0.23699188232421875, -0.22897911071777344, -0.22096633911132812, -0.2129535675048828, -0.2049407958984375, -0.1969280242919922, -0.18891525268554688, -0.18090248107910156, -0.17288970947265625, -0.16487693786621094, -0.15686416625976562, -0.1488513946533203, -0.140838623046875, -0.1328258514404297, -0.12481307983398438, -0.11680030822753906, -0.10878753662109375, -0.10077476501464844, -0.09276199340820312, -0.08474922180175781, -0.0767364501953125, -0.06872367858886719, -0.060710906982421875, -0.05269813537597656, -0.04468536376953125, -0.03667259216308594, -0.028659820556640625, -0.020647048950195312, -0.01263427734375, -0.0046215057373046875, 0.003391265869140625, 0.011404037475585938, 0.01941680908203125, 0.027429580688476562, 0.035442352294921875, 0.04345512390136719, 0.0514678955078125, 0.05948066711425781, 0.06749343872070312, 0.07550621032714844, 0.08351898193359375, 0.09153175354003906, 0.09954452514648438, 0.10755729675292969, 0.115570068359375, 0.12358283996582031, 0.13159561157226562, 0.13960838317871094, 0.14762115478515625, 0.15563392639160156, 0.16364669799804688, 0.1716594696044922, 0.1796722412109375, 0.1876850128173828, 0.19569778442382812, 0.20371055603027344, 0.21172332763671875, 0.21973609924316406, 0.22774887084960938, 0.2357616424560547, 0.2437744140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 7.0, 7.0, 6.0, 15.0, 21.0, 26.0, 22.0, 41.0, 45.0, 52.0, 74.0, 68.0, 92.0, 84.0, 59.0, 80.0, 72.0, 48.0, 44.0, 33.0, 36.0, 17.0, 9.0, 7.0, 10.0, 5.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2232666015625, -0.21481895446777344, -0.20637130737304688, -0.1979236602783203, -0.18947601318359375, -0.1810283660888672, -0.17258071899414062, -0.16413307189941406, -0.1556854248046875, -0.14723777770996094, -0.13879013061523438, -0.1303424835205078, -0.12189483642578125, -0.11344718933105469, -0.10499954223632812, -0.09655189514160156, -0.088104248046875, -0.07965660095214844, -0.07120895385742188, -0.06276130676269531, -0.05431365966796875, -0.04586601257324219, -0.037418365478515625, -0.028970718383789062, -0.0205230712890625, -0.012075424194335938, -0.003627777099609375, 0.0048198699951171875, 0.01326751708984375, 0.021715164184570312, 0.030162811279296875, 0.03861045837402344, 0.04705810546875, 0.05550575256347656, 0.06395339965820312, 0.07240104675292969, 0.08084869384765625, 0.08929634094238281, 0.09774398803710938, 0.10619163513183594, 0.1146392822265625, 0.12308692932128906, 0.13153457641601562, 0.1399822235107422, 0.14842987060546875, 0.1568775177001953, 0.16532516479492188, 0.17377281188964844, 0.182220458984375, 0.19066810607910156, 0.19911575317382812, 0.2075634002685547, 0.21601104736328125, 0.2244586944580078, 0.23290634155273438, 0.24135398864746094, 0.2498016357421875, 0.25824928283691406, 0.2666969299316406, 0.2751445770263672, 0.28359222412109375, 0.2920398712158203, 0.3004875183105469, 0.30893516540527344, 0.3173828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 29.0, 54.0, 138.0, 259.0, 240.0, 156.0, 63.0, 32.0, 14.0, 6.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.155750274658203, -15.839024543762207, -15.522297859191895, -15.205572128295898, -14.888845443725586, -14.57211971282959, -14.255393981933594, -13.938667297363281, -13.621941566467285, -13.305215835571289, -12.988489151000977, -12.67176342010498, -12.355037689208984, -12.038311004638672, -11.721585273742676, -11.40485954284668, -11.088132858276367, -10.771407127380371, -10.454680442810059, -10.137954711914062, -9.82122802734375, -9.504502296447754, -9.187776565551758, -8.871049880981445, -8.55432415008545, -8.237598419189453, -7.920871734619141, -7.6041460037231445, -7.28741979598999, -6.970693588256836, -6.65396785736084, -6.3372416496276855, -6.020516395568848, -5.703790187835693, -5.387063980102539, -5.070338249206543, -4.753612041473389, -4.436885833740234, -4.120160102844238, -3.803433895111084, -3.4867076873779297, -3.1699814796447754, -2.8532555103302, -2.536529541015625, -2.2198033332824707, -1.903077244758606, -1.5863511562347412, -1.269625186920166, -0.9528989791870117, -0.636172890663147, -0.3194468021392822, -0.0027207136154174805, 0.31400537490844727, 0.630731463432312, 0.9474575519561768, 1.264183521270752, 1.5809097290039062, 1.897635817527771, 2.2143619060516357, 2.531087875366211, 2.8478140830993652, 3.1645402908325195, 3.4812662601470947, 3.79799222946167, 4.114718437194824]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 3.0, 5.0, 4.0, 12.0, 15.0, 15.0, 9.0, 22.0, 18.0, 30.0, 31.0, 36.0, 31.0, 40.0, 33.0, 37.0, 52.0, 46.0, 36.0, 49.0, 50.0, 47.0, 40.0, 42.0, 44.0, 38.0, 24.0, 23.0, 20.0, 17.0, 23.0, 18.0, 23.0, 12.0, 14.0, 10.0, 8.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.395662546157837, -3.2700700759887695, -3.1444778442382812, -3.018885612487793, -2.8932931423187256, -2.767700672149658, -2.64210844039917, -2.5165162086486816, -2.3909237384796143, -2.265331268310547, -2.1397390365600586, -2.0141468048095703, -1.888554334640503, -1.762961983680725, -1.6373696327209473, -1.5117772817611694, -1.3861849308013916, -1.2605925798416138, -1.135000228881836, -1.009407877922058, -0.8838155269622803, -0.7582231760025024, -0.6326308250427246, -0.5070384740829468, -0.38144612312316895, -0.2558537721633911, -0.13026142120361328, -0.004669070243835449, 0.12092328071594238, 0.24651563167572021, 0.37210798263549805, 0.4977003335952759, 0.6232929229736328, 0.7488852739334106, 0.8744776248931885, 1.0000699758529663, 1.1256623268127441, 1.251254677772522, 1.3768470287322998, 1.5024393796920776, 1.6280317306518555, 1.7536240816116333, 1.8792164325714111, 2.0048089027404785, 2.130401134490967, 2.255993366241455, 2.3815858364105225, 2.50717830657959, 2.632770538330078, 2.7583627700805664, 2.883955240249634, 3.009547710418701, 3.1351399421691895, 3.2607321739196777, 3.386324644088745, 3.5119171142578125, 3.637509346008301, 3.763101577758789, 3.8886940479278564, 4.014286518096924, 4.139878749847412, 4.2654709815979, 4.391063690185547, 4.516655921936035, 4.642248153686523]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 16.0, 27.0, 50.0, 110.0, 248.0, 565.0, 1967.0, 13269.0, 3811730.0, 357600.0, 6677.0, 1256.0, 430.0, 149.0, 75.0, 42.0, 23.0, 15.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.3394775390625, -2.241455078125, -2.1434326171875, -2.04541015625, -1.9473876953125, -1.849365234375, -1.7513427734375, -1.6533203125, -1.5552978515625, -1.457275390625, -1.3592529296875, -1.26123046875, -1.1632080078125, -1.065185546875, -0.9671630859375, -0.869140625, -0.7711181640625, -0.673095703125, -0.5750732421875, -0.47705078125, -0.3790283203125, -0.281005859375, -0.1829833984375, -0.0849609375, 0.0130615234375, 0.111083984375, 0.2091064453125, 0.30712890625, 0.4051513671875, 0.503173828125, 0.6011962890625, 0.69921875, 0.7972412109375, 0.895263671875, 0.9932861328125, 1.09130859375, 1.1893310546875, 1.287353515625, 1.3853759765625, 1.4833984375, 1.5814208984375, 1.679443359375, 1.7774658203125, 1.87548828125, 1.9735107421875, 2.071533203125, 2.1695556640625, 2.267578125, 2.3656005859375, 2.463623046875, 2.5616455078125, 2.65966796875, 2.7576904296875, 2.855712890625, 2.9537353515625, 3.0517578125, 3.1497802734375, 3.247802734375, 3.3458251953125, 3.44384765625, 3.5418701171875, 3.639892578125, 3.7379150390625, 3.8359375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 12.0, 24.0, 34.0, 55.0, 85.0, 114.0, 151.0, 133.0, 133.0, 101.0, 72.0, 36.0, 25.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419189453125, -0.4018287658691406, -0.38446807861328125, -0.3671073913574219, -0.3497467041015625, -0.3323860168457031, -0.31502532958984375, -0.2976646423339844, -0.280303955078125, -0.2629432678222656, -0.24558258056640625, -0.22822189331054688, -0.2108612060546875, -0.19350051879882812, -0.17613983154296875, -0.15877914428710938, -0.14141845703125, -0.12405776977539062, -0.10669708251953125, -0.08933639526367188, -0.0719757080078125, -0.054615020751953125, -0.03725433349609375, -0.019893646240234375, -0.002532958984375, 0.014827728271484375, 0.03218841552734375, 0.049549102783203125, 0.0669097900390625, 0.08427047729492188, 0.10163116455078125, 0.11899185180664062, 0.1363525390625, 0.15371322631835938, 0.17107391357421875, 0.18843460083007812, 0.2057952880859375, 0.22315597534179688, 0.24051666259765625, 0.2578773498535156, 0.275238037109375, 0.2925987243652344, 0.30995941162109375, 0.3273200988769531, 0.3446807861328125, 0.3620414733886719, 0.37940216064453125, 0.3967628479003906, 0.41412353515625, 0.4314842224121094, 0.44884490966796875, 0.4662055969238281, 0.4835662841796875, 0.5009269714355469, 0.5182876586914062, 0.5356483459472656, 0.553009033203125, 0.5703697204589844, 0.5877304077148438, 0.6050910949707031, 0.6224517822265625, 0.6398124694824219, 0.6571731567382812, 0.6745338439941406, 0.69189453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 12.0, 9.0, 24.0, 30.0, 56.0, 57.0, 105.0, 139.0, 211.0, 320.0, 535.0, 982.0, 2172.0, 6056.0, 24667.0, 230419.0, 3621398.0, 268472.0, 26884.0, 6559.0, 2446.0, 1098.0, 559.0, 340.0, 229.0, 152.0, 101.0, 83.0, 51.0, 33.0, 22.0, 20.0, 13.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8834304809570312, -0.8513336181640625, -0.8192367553710938, -0.787139892578125, -0.7550430297851562, -0.7229461669921875, -0.6908493041992188, -0.65875244140625, -0.6266555786132812, -0.5945587158203125, -0.5624618530273438, -0.530364990234375, -0.49826812744140625, -0.4661712646484375, -0.43407440185546875, -0.4019775390625, -0.36988067626953125, -0.3377838134765625, -0.30568695068359375, -0.273590087890625, -0.24149322509765625, -0.2093963623046875, -0.17729949951171875, -0.14520263671875, -0.11310577392578125, -0.0810089111328125, -0.04891204833984375, -0.016815185546875, 0.01528167724609375, 0.0473785400390625, 0.07947540283203125, 0.111572265625, 0.14366912841796875, 0.1757659912109375, 0.20786285400390625, 0.239959716796875, 0.27205657958984375, 0.3041534423828125, 0.33625030517578125, 0.36834716796875, 0.40044403076171875, 0.4325408935546875, 0.46463775634765625, 0.496734619140625, 0.5288314819335938, 0.5609283447265625, 0.5930252075195312, 0.6251220703125, 0.6572189331054688, 0.6893157958984375, 0.7214126586914062, 0.753509521484375, 0.7856063842773438, 0.8177032470703125, 0.8498001098632812, 0.88189697265625, 0.9139938354492188, 0.9460906982421875, 0.9781875610351562, 1.010284423828125, 1.0423812866210938, 1.0744781494140625, 1.1065750122070312, 1.138671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 14.0, 10.0, 28.0, 49.0, 106.0, 313.0, 1355.0, 1550.0, 371.0, 137.0, 61.0, 26.0, 17.0, 11.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.624237060546875, -0.60345458984375, -0.582672119140625, -0.5618896484375, -0.541107177734375, -0.52032470703125, -0.499542236328125, -0.478759765625, -0.457977294921875, -0.43719482421875, -0.416412353515625, -0.3956298828125, -0.374847412109375, -0.35406494140625, -0.333282470703125, -0.3125, -0.291717529296875, -0.27093505859375, -0.250152587890625, -0.2293701171875, -0.208587646484375, -0.18780517578125, -0.167022705078125, -0.146240234375, -0.125457763671875, -0.10467529296875, -0.083892822265625, -0.0631103515625, -0.042327880859375, -0.02154541015625, -0.000762939453125, 0.02001953125, 0.040802001953125, 0.06158447265625, 0.082366943359375, 0.1031494140625, 0.123931884765625, 0.14471435546875, 0.165496826171875, 0.186279296875, 0.207061767578125, 0.22784423828125, 0.248626708984375, 0.2694091796875, 0.290191650390625, 0.31097412109375, 0.331756591796875, 0.3525390625, 0.373321533203125, 0.39410400390625, 0.414886474609375, 0.4356689453125, 0.456451416015625, 0.47723388671875, 0.498016357421875, 0.518798828125, 0.539581298828125, 0.56036376953125, 0.581146240234375, 0.6019287109375, 0.622711181640625, 0.64349365234375, 0.664276123046875, 0.68505859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 15.0, 55.0, 411.0, 428.0, 81.0, 12.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8225123882293701, -1.513832688331604, -1.205152988433838, -0.8964731693267822, -0.5877934694290161, -0.27911376953125, 0.029566049575805664, 0.3382456302642822, 0.6469254493713379, 0.955605149269104, 1.2642848491668701, 1.5729646682739258, 1.881644368171692, 2.190324068069458, 2.4990038871765137, 2.8076834678649902, 3.116363286972046, 3.4250431060791016, 3.733722686767578, 4.042402267456055, 4.3510823249816895, 4.659761905670166, 4.968441963195801, 5.277121543884277, 5.585801124572754, 5.8944807052612305, 6.203160762786865, 6.511840343475342, 6.820519924163818, 7.129199981689453, 7.43787956237793, 7.746559143066406, 8.0552396774292, 8.363919258117676, 8.672598838806152, 8.981279373168945, 9.289958953857422, 9.598638534545898, 9.907318115234375, 10.215997695922852, 10.524677276611328, 10.833356857299805, 11.142036437988281, 11.450716018676758, 11.75939655303955, 12.068076133728027, 12.376755714416504, 12.68543529510498, 12.994115829467773, 13.30279541015625, 13.611474990844727, 13.920154571533203, 14.228835105895996, 14.537514686584473, 14.84619426727295, 15.154873847961426, 15.463553428649902, 15.772233009338379, 16.080913543701172, 16.38959312438965, 16.698272705078125, 17.0069522857666, 17.315631866455078, 17.624311447143555, 17.93299102783203]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 6.0, 9.0, 6.0, 9.0, 12.0, 10.0, 20.0, 15.0, 18.0, 27.0, 27.0, 31.0, 29.0, 45.0, 49.0, 45.0, 48.0, 45.0, 42.0, 40.0, 37.0, 58.0, 37.0, 46.0, 41.0, 35.0, 34.0, 26.0, 25.0, 24.0, 16.0, 14.0, 15.0, 13.0, 11.0, 12.0, 6.0, 9.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.127223014831543, -1.0846521854400635, -1.042081356048584, -0.9995105266571045, -0.956939697265625, -0.9143688678741455, -0.8717980980873108, -0.8292272686958313, -0.7866564393043518, -0.7440856099128723, -0.7015147805213928, -0.6589440107345581, -0.6163731813430786, -0.5738023519515991, -0.5312315225601196, -0.48866069316864014, -0.44608986377716064, -0.40351903438568115, -0.36094820499420166, -0.31837740540504456, -0.27580657601356506, -0.23323574662208557, -0.19066494703292847, -0.14809411764144897, -0.10552328824996948, -0.06295246630907059, -0.020381644368171692, 0.022189170122146606, 0.0647599995136261, 0.10733082890510559, 0.1499016284942627, 0.1924724578857422, 0.23504328727722168, 0.27761411666870117, 0.32018494606018066, 0.36275574564933777, 0.40532657504081726, 0.44789740443229675, 0.49046820402145386, 0.5330390334129333, 0.5756098628044128, 0.6181806921958923, 0.6607515215873718, 0.7033222913742065, 0.745893120765686, 0.7884639501571655, 0.831034779548645, 0.8736056089401245, 0.916176438331604, 0.9587472677230835, 1.001318097114563, 1.0438889265060425, 1.086459755897522, 1.1290305852890015, 1.1716012954711914, 1.214172124862671, 1.2567429542541504, 1.2993137836456299, 1.3418846130371094, 1.3844554424285889, 1.4270262718200684, 1.4695971012115479, 1.5121679306030273, 1.5547387599945068, 1.5973095893859863]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 4.0, 20.0, 26.0, 34.0, 45.0, 74.0, 113.0, 182.0, 312.0, 533.0, 1104.0, 2418.0, 6652.0, 28423.0, 238027.0, 654874.0, 93074.0, 14738.0, 4248.0, 1695.0, 809.0, 429.0, 232.0, 179.0, 91.0, 61.0, 34.0, 30.0, 18.0, 14.0, 15.0, 5.0, 7.0, 5.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7578125, -1.7065582275390625, -1.655303955078125, -1.6040496826171875, -1.55279541015625, -1.5015411376953125, -1.450286865234375, -1.3990325927734375, -1.3477783203125, -1.2965240478515625, -1.245269775390625, -1.1940155029296875, -1.14276123046875, -1.0915069580078125, -1.040252685546875, -0.9889984130859375, -0.937744140625, -0.8864898681640625, -0.835235595703125, -0.7839813232421875, -0.73272705078125, -0.6814727783203125, -0.630218505859375, -0.5789642333984375, -0.5277099609375, -0.4764556884765625, -0.425201416015625, -0.3739471435546875, -0.32269287109375, -0.2714385986328125, -0.220184326171875, -0.1689300537109375, -0.11767578125, -0.0664215087890625, -0.015167236328125, 0.0360870361328125, 0.08734130859375, 0.1385955810546875, 0.189849853515625, 0.2411041259765625, 0.2923583984375, 0.3436126708984375, 0.394866943359375, 0.4461212158203125, 0.49737548828125, 0.5486297607421875, 0.599884033203125, 0.6511383056640625, 0.702392578125, 0.7536468505859375, 0.804901123046875, 0.8561553955078125, 0.90740966796875, 0.9586639404296875, 1.009918212890625, 1.0611724853515625, 1.1124267578125, 1.1636810302734375, 1.214935302734375, 1.2661895751953125, 1.31744384765625, 1.3686981201171875, 1.419952392578125, 1.4712066650390625, 1.5224609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 22.0, 30.0, 43.0, 58.0, 92.0, 122.0, 151.0, 132.0, 115.0, 94.0, 57.0, 37.0, 22.0, 9.0, 3.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.39624786376953125, -0.3789215087890625, -0.36159515380859375, -0.344268798828125, -0.32694244384765625, -0.3096160888671875, -0.29228973388671875, -0.27496337890625, -0.25763702392578125, -0.2403106689453125, -0.22298431396484375, -0.205657958984375, -0.18833160400390625, -0.1710052490234375, -0.15367889404296875, -0.1363525390625, -0.11902618408203125, -0.1016998291015625, -0.08437347412109375, -0.067047119140625, -0.04972076416015625, -0.0323944091796875, -0.01506805419921875, 0.00225830078125, 0.01958465576171875, 0.0369110107421875, 0.05423736572265625, 0.071563720703125, 0.08889007568359375, 0.1062164306640625, 0.12354278564453125, 0.140869140625, 0.15819549560546875, 0.1755218505859375, 0.19284820556640625, 0.210174560546875, 0.22750091552734375, 0.2448272705078125, 0.26215362548828125, 0.27947998046875, 0.29680633544921875, 0.3141326904296875, 0.33145904541015625, 0.348785400390625, 0.36611175537109375, 0.3834381103515625, 0.40076446533203125, 0.4180908203125, 0.43541717529296875, 0.4527435302734375, 0.47006988525390625, 0.487396240234375, 0.5047225952148438, 0.5220489501953125, 0.5393753051757812, 0.55670166015625, 0.5740280151367188, 0.5913543701171875, 0.6086807250976562, 0.626007080078125, 0.6433334350585938, 0.6606597900390625, 0.6779861450195312, 0.6953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 16.0, 11.0, 11.0, 25.0, 38.0, 39.0, 47.0, 87.0, 148.0, 191.0, 336.0, 597.0, 1237.0, 2489.0, 6074.0, 16111.0, 46632.0, 153416.0, 408421.0, 280295.0, 86512.0, 27912.0, 10014.0, 3946.0, 1782.0, 842.0, 425.0, 272.0, 172.0, 104.0, 68.0, 53.0, 33.0, 39.0, 30.0, 26.0, 25.0, 15.0, 13.0, 6.0, 7.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.58984375, -0.5693359375, -0.548828125, -0.5283203125, -0.5078125, -0.4873046875, -0.466796875, -0.4462890625, -0.42578125, -0.4052734375, -0.384765625, -0.3642578125, -0.34375, -0.3232421875, -0.302734375, -0.2822265625, -0.26171875, -0.2412109375, -0.220703125, -0.2001953125, -0.1796875, -0.1591796875, -0.138671875, -0.1181640625, -0.09765625, -0.0771484375, -0.056640625, -0.0361328125, -0.015625, 0.0048828125, 0.025390625, 0.0458984375, 0.06640625, 0.0869140625, 0.107421875, 0.1279296875, 0.1484375, 0.1689453125, 0.189453125, 0.2099609375, 0.23046875, 0.2509765625, 0.271484375, 0.2919921875, 0.3125, 0.3330078125, 0.353515625, 0.3740234375, 0.39453125, 0.4150390625, 0.435546875, 0.4560546875, 0.4765625, 0.4970703125, 0.517578125, 0.5380859375, 0.55859375, 0.5791015625, 0.599609375, 0.6201171875, 0.640625, 0.6611328125, 0.681640625, 0.7021484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 16.0, 12.0, 14.0, 20.0, 15.0, 23.0, 29.0, 29.0, 30.0, 41.0, 34.0, 46.0, 29.0, 55.0, 52.0, 28.0, 52.0, 35.0, 44.0, 27.0, 37.0, 24.0, 47.0, 20.0, 25.0, 20.0, 19.0, 20.0, 23.0, 18.0, 14.0, 15.0, 13.0, 6.0, 7.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.65478515625, -0.632293701171875, -0.60980224609375, -0.587310791015625, -0.5648193359375, -0.542327880859375, -0.51983642578125, -0.497344970703125, -0.474853515625, -0.452362060546875, -0.42987060546875, -0.407379150390625, -0.3848876953125, -0.362396240234375, -0.33990478515625, -0.317413330078125, -0.294921875, -0.272430419921875, -0.24993896484375, -0.227447509765625, -0.2049560546875, -0.182464599609375, -0.15997314453125, -0.137481689453125, -0.114990234375, -0.092498779296875, -0.07000732421875, -0.047515869140625, -0.0250244140625, -0.002532958984375, 0.01995849609375, 0.042449951171875, 0.06494140625, 0.087432861328125, 0.10992431640625, 0.132415771484375, 0.1549072265625, 0.177398681640625, 0.19989013671875, 0.222381591796875, 0.244873046875, 0.267364501953125, 0.28985595703125, 0.312347412109375, 0.3348388671875, 0.357330322265625, 0.37982177734375, 0.402313232421875, 0.4248046875, 0.447296142578125, 0.46978759765625, 0.492279052734375, 0.5147705078125, 0.537261962890625, 0.55975341796875, 0.582244873046875, 0.604736328125, 0.627227783203125, 0.64971923828125, 0.672210693359375, 0.6947021484375, 0.717193603515625, 0.73968505859375, 0.762176513671875, 0.78466796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 14.0, 24.0, 43.0, 102.0, 238.0, 797.0, 3512.0, 53713.0, 903145.0, 81382.0, 4197.0, 884.0, 293.0, 108.0, 56.0, 19.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6689453125, -0.6455154418945312, -0.6220855712890625, -0.5986557006835938, -0.575225830078125, -0.5517959594726562, -0.5283660888671875, -0.5049362182617188, -0.48150634765625, -0.45807647705078125, -0.4346466064453125, -0.41121673583984375, -0.387786865234375, -0.36435699462890625, -0.3409271240234375, -0.31749725341796875, -0.2940673828125, -0.27063751220703125, -0.2472076416015625, -0.22377777099609375, -0.200347900390625, -0.17691802978515625, -0.1534881591796875, -0.13005828857421875, -0.10662841796875, -0.08319854736328125, -0.0597686767578125, -0.03633880615234375, -0.012908935546875, 0.01052093505859375, 0.0339508056640625, 0.05738067626953125, 0.080810546875, 0.10424041748046875, 0.1276702880859375, 0.15110015869140625, 0.174530029296875, 0.19795989990234375, 0.2213897705078125, 0.24481964111328125, 0.26824951171875, 0.29167938232421875, 0.3151092529296875, 0.33853912353515625, 0.361968994140625, 0.38539886474609375, 0.4088287353515625, 0.43225860595703125, 0.4556884765625, 0.47911834716796875, 0.5025482177734375, 0.5259780883789062, 0.549407958984375, 0.5728378295898438, 0.5962677001953125, 0.6196975708007812, 0.64312744140625, 0.6665573120117188, 0.6899871826171875, 0.7134170532226562, 0.736846923828125, 0.7602767944335938, 0.7837066650390625, 0.8071365356445312, 0.83056640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 0.0, 3.0, 10.0, 4.0, 7.0, 14.0, 18.0, 22.0, 36.0, 33.0, 45.0, 47.0, 56.0, 74.0, 68.0, 77.0, 76.0, 80.0, 62.0, 64.0, 46.0, 33.0, 32.0, 24.0, 16.0, 8.0, 12.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.808736801147461e-05, -3.6646611988544464e-05, -3.520585596561432e-05, -3.3765099942684174e-05, -3.232434391975403e-05, -3.088358789682388e-05, -2.9442831873893738e-05, -2.8002075850963593e-05, -2.6561319828033447e-05, -2.5120563805103302e-05, -2.3679807782173157e-05, -2.223905175924301e-05, -2.0798295736312866e-05, -1.935753971338272e-05, -1.7916783690452576e-05, -1.647602766752243e-05, -1.5035271644592285e-05, -1.359451562166214e-05, -1.2153759598731995e-05, -1.071300357580185e-05, -9.272247552871704e-06, -7.831491529941559e-06, -6.3907355070114136e-06, -4.949979484081268e-06, -3.509223461151123e-06, -2.0684674382209778e-06, -6.277114152908325e-07, 8.130446076393127e-07, 2.253800630569458e-06, 3.6945566534996033e-06, 5.1353126764297485e-06, 6.576068699359894e-06, 8.016824722290039e-06, 9.457580745220184e-06, 1.089833676815033e-05, 1.2339092791080475e-05, 1.377984881401062e-05, 1.5220604836940765e-05, 1.666136085987091e-05, 1.8102116882801056e-05, 1.95428729057312e-05, 2.0983628928661346e-05, 2.2424384951591492e-05, 2.3865140974521637e-05, 2.5305896997451782e-05, 2.6746653020381927e-05, 2.8187409043312073e-05, 2.9628165066242218e-05, 3.106892108917236e-05, 3.250967711210251e-05, 3.3950433135032654e-05, 3.53911891579628e-05, 3.6831945180892944e-05, 3.827270120382309e-05, 3.9713457226753235e-05, 4.115421324968338e-05, 4.2594969272613525e-05, 4.403572529554367e-05, 4.5476481318473816e-05, 4.691723734140396e-05, 4.8357993364334106e-05, 4.979874938726425e-05, 5.12395054101944e-05, 5.268026143312454e-05, 5.412101745605469e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 11.0, 8.0, 15.0, 29.0, 37.0, 63.0, 117.0, 220.0, 490.0, 1430.0, 7848.0, 128488.0, 835713.0, 66818.0, 5269.0, 1169.0, 409.0, 191.0, 81.0, 52.0, 28.0, 28.0, 17.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72021484375, -0.700958251953125, -0.68170166015625, -0.662445068359375, -0.6431884765625, -0.623931884765625, -0.60467529296875, -0.585418701171875, -0.566162109375, -0.546905517578125, -0.52764892578125, -0.508392333984375, -0.4891357421875, -0.469879150390625, -0.45062255859375, -0.431365966796875, -0.412109375, -0.392852783203125, -0.37359619140625, -0.354339599609375, -0.3350830078125, -0.315826416015625, -0.29656982421875, -0.277313232421875, -0.258056640625, -0.238800048828125, -0.21954345703125, -0.200286865234375, -0.1810302734375, -0.161773681640625, -0.14251708984375, -0.123260498046875, -0.10400390625, -0.084747314453125, -0.06549072265625, -0.046234130859375, -0.0269775390625, -0.007720947265625, 0.01153564453125, 0.030792236328125, 0.050048828125, 0.069305419921875, 0.08856201171875, 0.107818603515625, 0.1270751953125, 0.146331787109375, 0.16558837890625, 0.184844970703125, 0.2041015625, 0.223358154296875, 0.24261474609375, 0.261871337890625, 0.2811279296875, 0.300384521484375, 0.31964111328125, 0.338897705078125, 0.358154296875, 0.377410888671875, 0.39666748046875, 0.415924072265625, 0.4351806640625, 0.454437255859375, 0.47369384765625, 0.492950439453125, 0.51220703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 15.0, 23.0, 51.0, 84.0, 146.0, 213.0, 203.0, 112.0, 76.0, 37.0, 23.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8778495788574219, -0.8562850952148438, -0.8347206115722656, -0.8131561279296875, -0.7915916442871094, -0.7700271606445312, -0.7484626770019531, -0.726898193359375, -0.7053337097167969, -0.6837692260742188, -0.6622047424316406, -0.6406402587890625, -0.6190757751464844, -0.5975112915039062, -0.5759468078613281, -0.55438232421875, -0.5328178405761719, -0.5112533569335938, -0.4896888732910156, -0.4681243896484375, -0.4465599060058594, -0.42499542236328125, -0.4034309387207031, -0.381866455078125, -0.3603019714355469, -0.33873748779296875, -0.3171730041503906, -0.2956085205078125, -0.2740440368652344, -0.25247955322265625, -0.23091506958007812, -0.2093505859375, -0.18778610229492188, -0.16622161865234375, -0.14465713500976562, -0.1230926513671875, -0.10152816772460938, -0.07996368408203125, -0.058399200439453125, -0.036834716796875, -0.015270233154296875, 0.00629425048828125, 0.027858734130859375, 0.0494232177734375, 0.07098770141601562, 0.09255218505859375, 0.11411666870117188, 0.13568115234375, 0.15724563598632812, 0.17881011962890625, 0.20037460327148438, 0.2219390869140625, 0.24350357055664062, 0.26506805419921875, 0.2866325378417969, 0.308197021484375, 0.3297615051269531, 0.35132598876953125, 0.3728904724121094, 0.3944549560546875, 0.4160194396972656, 0.43758392333984375, 0.4591484069824219, 0.480712890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 7.0, 5.0, 16.0, 32.0, 45.0, 61.0, 115.0, 154.0, 163.0, 135.0, 106.0, 62.0, 43.0, 23.0, 15.0, 13.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.048084735870361, -6.868906021118164, -6.689726829528809, -6.510548114776611, -6.331369400024414, -6.152190685272217, -5.9730119705200195, -5.793832778930664, -5.614654064178467, -5.4354753494262695, -5.256296157836914, -5.077117443084717, -4.8979387283325195, -4.718760013580322, -4.539581298828125, -4.3604021072387695, -4.181223392486572, -4.002044677734375, -3.8228657245635986, -3.6436867713928223, -3.464508056640625, -3.2853293418884277, -3.1061503887176514, -2.926971435546875, -2.7477927207946777, -2.5686140060424805, -2.389435052871704, -2.2102560997009277, -2.0310773849487305, -1.8518985509872437, -1.6727197170257568, -1.49354088306427, -1.3143625259399414, -1.1351836919784546, -0.9560048580169678, -0.776826024055481, -0.5976471900939941, -0.4184683561325073, -0.2392895221710205, -0.06011068820953369, 0.11906814575195312, 0.29824697971343994, 0.47742581367492676, 0.6566046476364136, 0.8357834815979004, 1.0149623155593872, 1.194141149520874, 1.3733199834823608, 1.5524988174438477, 1.7316776514053345, 1.9108564853668213, 2.0900354385375977, 2.269214153289795, 2.448392868041992, 2.6275718212127686, 2.806750774383545, 2.985929489135742, 3.1651082038879395, 3.344287157058716, 3.523466110229492, 3.7026448249816895, 3.8818235397338867, 4.061002731323242, 4.2401814460754395, 4.419360160827637]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 8.0, 8.0, 8.0, 11.0, 12.0, 8.0, 24.0, 23.0, 18.0, 20.0, 26.0, 25.0, 37.0, 24.0, 36.0, 45.0, 44.0, 40.0, 47.0, 42.0, 37.0, 36.0, 39.0, 43.0, 41.0, 39.0, 32.0, 35.0, 33.0, 29.0, 17.0, 17.0, 20.0, 8.0, 11.0, 12.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4207098484039307, -3.305483818054199, -3.1902575492858887, -3.0750315189361572, -2.959805488586426, -2.8445792198181152, -2.729353189468384, -2.6141271591186523, -2.498900890350342, -2.3836748600006104, -2.2684485912323, -2.1532225608825684, -2.037996292114258, -1.9227702617645264, -1.807544231414795, -1.692318081855774, -1.577091932296753, -1.461865782737732, -1.346639633178711, -1.2314136028289795, -1.1161874532699585, -1.0009613037109375, -0.8857352137565613, -0.7705091238021851, -0.6552829742431641, -0.5400568246841431, -0.42483073472976685, -0.30960461497306824, -0.19437849521636963, -0.07915234565734863, 0.03607374429702759, 0.1512998342514038, 0.2665262222290039, 0.3817523419857025, 0.4969784617424011, 0.6122045516967773, 0.7274307012557983, 0.8426568508148193, 0.9578829407691956, 1.0731090307235718, 1.1883351802825928, 1.3035613298416138, 1.4187874794006348, 1.5340135097503662, 1.6492396593093872, 1.7644658088684082, 1.8796918392181396, 1.9949179887771606, 2.1101441383361816, 2.225370168685913, 2.3405964374542236, 2.455822467803955, 2.5710487365722656, 2.686274766921997, 2.8015007972717285, 2.916727066040039, 3.0319530963897705, 3.147179126739502, 3.2624053955078125, 3.377631425857544, 3.4928574562072754, 3.608083724975586, 3.7233097553253174, 3.838535785675049, 3.9537620544433594]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 6.0, 19.0, 19.0, 30.0, 41.0, 62.0, 101.0, 171.0, 351.0, 704.0, 1520.0, 4479.0, 20468.0, 457920.0, 3657590.0, 40785.0, 6543.0, 1850.0, 774.0, 374.0, 174.0, 101.0, 55.0, 44.0, 32.0, 24.0, 12.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.666534423828125, -1.61627197265625, -1.566009521484375, -1.5157470703125, -1.465484619140625, -1.41522216796875, -1.364959716796875, -1.314697265625, -1.264434814453125, -1.21417236328125, -1.163909912109375, -1.1136474609375, -1.063385009765625, -1.01312255859375, -0.962860107421875, -0.91259765625, -0.862335205078125, -0.81207275390625, -0.761810302734375, -0.7115478515625, -0.661285400390625, -0.61102294921875, -0.560760498046875, -0.510498046875, -0.460235595703125, -0.40997314453125, -0.359710693359375, -0.3094482421875, -0.259185791015625, -0.20892333984375, -0.158660888671875, -0.1083984375, -0.058135986328125, -0.00787353515625, 0.042388916015625, 0.0926513671875, 0.142913818359375, 0.19317626953125, 0.243438720703125, 0.293701171875, 0.343963623046875, 0.39422607421875, 0.444488525390625, 0.4947509765625, 0.545013427734375, 0.59527587890625, 0.645538330078125, 0.69580078125, 0.746063232421875, 0.79632568359375, 0.846588134765625, 0.8968505859375, 0.947113037109375, 0.99737548828125, 1.047637939453125, 1.097900390625, 1.148162841796875, 1.19842529296875, 1.248687744140625, 1.2989501953125, 1.349212646484375, 1.39947509765625, 1.449737548828125, 1.5]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 11.0, 22.0, 26.0, 38.0, 70.0, 76.0, 105.0, 138.0, 121.0, 123.0, 102.0, 57.0, 50.0, 26.0, 20.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41796875, -0.40061187744140625, -0.3832550048828125, -0.36589813232421875, -0.348541259765625, -0.33118438720703125, -0.3138275146484375, -0.29647064208984375, -0.27911376953125, -0.26175689697265625, -0.2444000244140625, -0.22704315185546875, -0.209686279296875, -0.19232940673828125, -0.1749725341796875, -0.15761566162109375, -0.1402587890625, -0.12290191650390625, -0.1055450439453125, -0.08818817138671875, -0.070831298828125, -0.05347442626953125, -0.0361175537109375, -0.01876068115234375, -0.00140380859375, 0.01595306396484375, 0.0333099365234375, 0.05066680908203125, 0.068023681640625, 0.08538055419921875, 0.1027374267578125, 0.12009429931640625, 0.137451171875, 0.15480804443359375, 0.1721649169921875, 0.18952178955078125, 0.206878662109375, 0.22423553466796875, 0.2415924072265625, 0.25894927978515625, 0.27630615234375, 0.29366302490234375, 0.3110198974609375, 0.32837677001953125, 0.345733642578125, 0.36309051513671875, 0.3804473876953125, 0.39780426025390625, 0.4151611328125, 0.43251800537109375, 0.4498748779296875, 0.46723175048828125, 0.484588623046875, 0.5019454956054688, 0.5193023681640625, 0.5366592407226562, 0.55401611328125, 0.5713729858398438, 0.5887298583984375, 0.6060867309570312, 0.623443603515625, 0.6408004760742188, 0.6581573486328125, 0.6755142211914062, 0.69287109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 5.0, 13.0, 8.0, 7.0, 18.0, 22.0, 33.0, 53.0, 60.0, 62.0, 98.0, 169.0, 341.0, 852.0, 3008.0, 17451.0, 289387.0, 3804477.0, 67085.0, 8139.0, 1699.0, 543.0, 233.0, 142.0, 91.0, 80.0, 54.0, 45.0, 33.0, 13.0, 16.0, 17.0, 15.0, 3.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.2833404541015625, -1.239532470703125, -1.1957244873046875, -1.15191650390625, -1.1081085205078125, -1.064300537109375, -1.0204925537109375, -0.9766845703125, -0.9328765869140625, -0.889068603515625, -0.8452606201171875, -0.80145263671875, -0.7576446533203125, -0.713836669921875, -0.6700286865234375, -0.626220703125, -0.5824127197265625, -0.538604736328125, -0.4947967529296875, -0.45098876953125, -0.4071807861328125, -0.363372802734375, -0.3195648193359375, -0.2757568359375, -0.2319488525390625, -0.188140869140625, -0.1443328857421875, -0.10052490234375, -0.0567169189453125, -0.012908935546875, 0.0308990478515625, 0.07470703125, 0.1185150146484375, 0.162322998046875, 0.2061309814453125, 0.24993896484375, 0.2937469482421875, 0.337554931640625, 0.3813629150390625, 0.4251708984375, 0.4689788818359375, 0.512786865234375, 0.5565948486328125, 0.60040283203125, 0.6442108154296875, 0.688018798828125, 0.7318267822265625, 0.775634765625, 0.8194427490234375, 0.863250732421875, 0.9070587158203125, 0.95086669921875, 0.9946746826171875, 1.038482666015625, 1.0822906494140625, 1.1260986328125, 1.1699066162109375, 1.213714599609375, 1.2575225830078125, 1.30133056640625, 1.3451385498046875, 1.388946533203125, 1.4327545166015625, 1.4765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 24.0, 33.0, 73.0, 296.0, 2428.0, 977.0, 150.0, 47.0, 21.0, 16.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82861328125, -0.8033676147460938, -0.7781219482421875, -0.7528762817382812, -0.727630615234375, -0.7023849487304688, -0.6771392822265625, -0.6518936157226562, -0.62664794921875, -0.6014022827148438, -0.5761566162109375, -0.5509109497070312, -0.525665283203125, -0.5004196166992188, -0.4751739501953125, -0.44992828369140625, -0.4246826171875, -0.39943695068359375, -0.3741912841796875, -0.34894561767578125, -0.323699951171875, -0.29845428466796875, -0.2732086181640625, -0.24796295166015625, -0.22271728515625, -0.19747161865234375, -0.1722259521484375, -0.14698028564453125, -0.121734619140625, -0.09648895263671875, -0.0712432861328125, -0.04599761962890625, -0.020751953125, 0.00449371337890625, 0.0297393798828125, 0.05498504638671875, 0.080230712890625, 0.10547637939453125, 0.1307220458984375, 0.15596771240234375, 0.18121337890625, 0.20645904541015625, 0.2317047119140625, 0.25695037841796875, 0.282196044921875, 0.30744171142578125, 0.3326873779296875, 0.35793304443359375, 0.3831787109375, 0.40842437744140625, 0.4336700439453125, 0.45891571044921875, 0.484161376953125, 0.5094070434570312, 0.5346527099609375, 0.5598983764648438, 0.58514404296875, 0.6103897094726562, 0.6356353759765625, 0.6608810424804688, 0.686126708984375, 0.7113723754882812, 0.7366180419921875, 0.7618637084960938, 0.787109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 9.0, 16.0, 35.0, 83.0, 173.0, 246.0, 198.0, 118.0, 68.0, 32.0, 11.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.369837760925293, -1.2773617506027222, -1.1848856210708618, -1.092409610748291, -0.9999335408210754, -0.9074574708938599, -0.8149814605712891, -0.7225053906440735, -0.6300293207168579, -0.5375532507896423, -0.44507721066474915, -0.35260117053985596, -0.2601251006126404, -0.1676490306854248, -0.075173020362854, 0.017303049564361572, 0.10977911949157715, 0.20225517451763153, 0.2947312295436859, 0.3872072696685791, 0.4796833395957947, 0.5721594095230103, 0.664635419845581, 0.7571114897727966, 0.8495875597000122, 0.9420636296272278, 1.0345396995544434, 1.1270157098770142, 1.219491720199585, 1.3119678497314453, 1.4044438600540161, 1.496919870376587, 1.5893959999084473, 1.681872010231018, 1.7743481397628784, 1.8668241500854492, 1.9593002796173096, 2.05177640914917, 2.144252300262451, 2.2367284297943115, 2.329204559326172, 2.4216806888580322, 2.5141565799713135, 2.606632709503174, 2.699108839035034, 2.7915849685668945, 2.884060859680176, 2.976536989212036, 3.0690128803253174, 3.1614890098571777, 3.253964900970459, 3.3464410305023193, 3.4389171600341797, 3.531393051147461, 3.6238691806793213, 3.7163453102111816, 3.808821201324463, 3.9012973308563232, 3.9937732219696045, 4.086249351501465, 4.178725242614746, 4.2712016105651855, 4.363677501678467, 4.456153392791748, 4.5486297607421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 15.0, 17.0, 21.0, 19.0, 21.0, 39.0, 40.0, 48.0, 49.0, 41.0, 59.0, 56.0, 67.0, 56.0, 53.0, 61.0, 44.0, 41.0, 29.0, 45.0, 30.0, 31.0, 18.0, 17.0, 25.0, 5.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9604644775390625, -0.924887478351593, -0.8893104791641235, -0.8537335395812988, -0.8181565403938293, -0.7825795412063599, -0.7470025420188904, -0.7114255428314209, -0.6758486032485962, -0.6402716040611267, -0.6046946048736572, -0.5691176652908325, -0.533540666103363, -0.49796366691589355, -0.4623866677284241, -0.4268096685409546, -0.3912326693534851, -0.3556556701660156, -0.32007870078086853, -0.28450170159339905, -0.24892471730709076, -0.21334773302078247, -0.177770733833313, -0.1421937495470047, -0.10661676526069641, -0.07103978097438812, -0.03546278923749924, 0.00011420249938964844, 0.03569118678569794, 0.07126817107200623, 0.10684517025947571, 0.142422154545784, 0.17799913883209229, 0.21357612311840057, 0.24915310740470886, 0.28473010659217834, 0.32030707597732544, 0.3558840751647949, 0.3914610743522644, 0.4270380735397339, 0.462615042924881, 0.49819204211235046, 0.5337690114974976, 0.569346010684967, 0.6049230098724365, 0.6404999494552612, 0.6760770082473755, 0.7116539478302002, 0.7472309470176697, 0.7828079462051392, 0.8183849453926086, 0.8539619445800781, 0.8895388841629028, 0.9251158833503723, 0.9606928825378418, 0.9962698817253113, 1.0318468809127808, 1.0674238204956055, 1.1030008792877197, 1.1385778188705444, 1.1741548776626587, 1.2097318172454834, 1.2453088760375977, 1.2808858156204224, 1.316462755203247]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 15.0, 26.0, 39.0, 82.0, 129.0, 231.0, 422.0, 764.0, 1722.0, 4647.0, 24768.0, 303162.0, 644084.0, 56310.0, 7633.0, 2335.0, 1039.0, 543.0, 259.0, 135.0, 74.0, 54.0, 32.0, 17.0, 4.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87109375, -1.8110809326171875, -1.751068115234375, -1.6910552978515625, -1.63104248046875, -1.5710296630859375, -1.511016845703125, -1.4510040283203125, -1.3909912109375, -1.3309783935546875, -1.270965576171875, -1.2109527587890625, -1.15093994140625, -1.0909271240234375, -1.030914306640625, -0.9709014892578125, -0.910888671875, -0.8508758544921875, -0.790863037109375, -0.7308502197265625, -0.67083740234375, -0.6108245849609375, -0.550811767578125, -0.4907989501953125, -0.4307861328125, -0.3707733154296875, -0.310760498046875, -0.2507476806640625, -0.19073486328125, -0.1307220458984375, -0.070709228515625, -0.0106964111328125, 0.04931640625, 0.1093292236328125, 0.169342041015625, 0.2293548583984375, 0.28936767578125, 0.3493804931640625, 0.409393310546875, 0.4694061279296875, 0.5294189453125, 0.5894317626953125, 0.649444580078125, 0.7094573974609375, 0.76947021484375, 0.8294830322265625, 0.889495849609375, 0.9495086669921875, 1.009521484375, 1.0695343017578125, 1.129547119140625, 1.1895599365234375, 1.24957275390625, 1.3095855712890625, 1.369598388671875, 1.4296112060546875, 1.4896240234375, 1.5496368408203125, 1.609649658203125, 1.6696624755859375, 1.72967529296875, 1.7896881103515625, 1.849700927734375, 1.9097137451171875, 1.9697265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 14.0, 23.0, 46.0, 61.0, 84.0, 89.0, 131.0, 149.0, 115.0, 97.0, 70.0, 44.0, 34.0, 18.0, 5.0, 8.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4274482727050781, -0.40982818603515625, -0.3922080993652344, -0.3745880126953125, -0.3569679260253906, -0.33934783935546875, -0.3217277526855469, -0.304107666015625, -0.2864875793457031, -0.26886749267578125, -0.2512474060058594, -0.2336273193359375, -0.21600723266601562, -0.19838714599609375, -0.18076705932617188, -0.16314697265625, -0.14552688598632812, -0.12790679931640625, -0.11028671264648438, -0.0926666259765625, -0.07504653930664062, -0.05742645263671875, -0.039806365966796875, -0.022186279296875, -0.004566192626953125, 0.01305389404296875, 0.030673980712890625, 0.0482940673828125, 0.06591415405273438, 0.08353424072265625, 0.10115432739257812, 0.1187744140625, 0.13639450073242188, 0.15401458740234375, 0.17163467407226562, 0.1892547607421875, 0.20687484741210938, 0.22449493408203125, 0.24211502075195312, 0.259735107421875, 0.2773551940917969, 0.29497528076171875, 0.3125953674316406, 0.3302154541015625, 0.3478355407714844, 0.36545562744140625, 0.3830757141113281, 0.40069580078125, 0.4183158874511719, 0.43593597412109375, 0.4535560607910156, 0.4711761474609375, 0.4887962341308594, 0.5064163208007812, 0.5240364074707031, 0.541656494140625, 0.5592765808105469, 0.5768966674804688, 0.5945167541503906, 0.6121368408203125, 0.6297569274902344, 0.6473770141601562, 0.6649971008300781, 0.6826171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 11.0, 8.0, 4.0, 10.0, 14.0, 23.0, 22.0, 38.0, 50.0, 81.0, 121.0, 192.0, 298.0, 523.0, 1006.0, 2117.0, 5167.0, 14257.0, 46185.0, 149166.0, 401605.0, 289024.0, 93621.0, 28589.0, 9470.0, 3604.0, 1451.0, 698.0, 419.0, 230.0, 172.0, 93.0, 78.0, 51.0, 44.0, 22.0, 31.0, 19.0, 7.0, 11.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.6611328125, -0.6409759521484375, -0.620819091796875, -0.6006622314453125, -0.58050537109375, -0.5603485107421875, -0.540191650390625, -0.5200347900390625, -0.4998779296875, -0.4797210693359375, -0.459564208984375, -0.4394073486328125, -0.41925048828125, -0.3990936279296875, -0.378936767578125, -0.3587799072265625, -0.338623046875, -0.3184661865234375, -0.298309326171875, -0.2781524658203125, -0.25799560546875, -0.2378387451171875, -0.217681884765625, -0.1975250244140625, -0.1773681640625, -0.1572113037109375, -0.137054443359375, -0.1168975830078125, -0.09674072265625, -0.0765838623046875, -0.056427001953125, -0.0362701416015625, -0.01611328125, 0.0040435791015625, 0.024200439453125, 0.0443572998046875, 0.06451416015625, 0.0846710205078125, 0.104827880859375, 0.1249847412109375, 0.1451416015625, 0.1652984619140625, 0.185455322265625, 0.2056121826171875, 0.22576904296875, 0.2459259033203125, 0.266082763671875, 0.2862396240234375, 0.306396484375, 0.3265533447265625, 0.346710205078125, 0.3668670654296875, 0.38702392578125, 0.4071807861328125, 0.427337646484375, 0.4474945068359375, 0.4676513671875, 0.4878082275390625, 0.507965087890625, 0.5281219482421875, 0.54827880859375, 0.5684356689453125, 0.588592529296875, 0.6087493896484375, 0.62890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 7.0, 5.0, 6.0, 4.0, 10.0, 16.0, 22.0, 16.0, 21.0, 27.0, 21.0, 39.0, 32.0, 49.0, 50.0, 51.0, 41.0, 49.0, 52.0, 49.0, 50.0, 47.0, 54.0, 46.0, 42.0, 24.0, 36.0, 29.0, 27.0, 20.0, 16.0, 10.0, 12.0, 3.0, 6.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8833770751953125, -0.855133056640625, -0.8268890380859375, -0.79864501953125, -0.7704010009765625, -0.742156982421875, -0.7139129638671875, -0.6856689453125, -0.6574249267578125, -0.629180908203125, -0.6009368896484375, -0.57269287109375, -0.5444488525390625, -0.516204833984375, -0.4879608154296875, -0.459716796875, -0.4314727783203125, -0.403228759765625, -0.3749847412109375, -0.34674072265625, -0.3184967041015625, -0.290252685546875, -0.2620086669921875, -0.2337646484375, -0.2055206298828125, -0.177276611328125, -0.1490325927734375, -0.12078857421875, -0.0925445556640625, -0.064300537109375, -0.0360565185546875, -0.0078125, 0.0204315185546875, 0.048675537109375, 0.0769195556640625, 0.10516357421875, 0.1334075927734375, 0.161651611328125, 0.1898956298828125, 0.2181396484375, 0.2463836669921875, 0.274627685546875, 0.3028717041015625, 0.33111572265625, 0.3593597412109375, 0.387603759765625, 0.4158477783203125, 0.444091796875, 0.4723358154296875, 0.500579833984375, 0.5288238525390625, 0.55706787109375, 0.5853118896484375, 0.613555908203125, 0.6417999267578125, 0.6700439453125, 0.6982879638671875, 0.726531982421875, 0.7547760009765625, 0.78302001953125, 0.8112640380859375, 0.839508056640625, 0.8677520751953125, 0.89599609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 14.0, 18.0, 27.0, 57.0, 109.0, 171.0, 270.0, 505.0, 1065.0, 2796.0, 10464.0, 59456.0, 376841.0, 487435.0, 88877.0, 14250.0, 3593.0, 1166.0, 655.0, 318.0, 181.0, 102.0, 70.0, 41.0, 32.0, 14.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.28638458251953125, -0.2768707275390625, -0.26735687255859375, -0.257843017578125, -0.24832916259765625, -0.2388153076171875, -0.22930145263671875, -0.21978759765625, -0.21027374267578125, -0.2007598876953125, -0.19124603271484375, -0.181732177734375, -0.17221832275390625, -0.1627044677734375, -0.15319061279296875, -0.1436767578125, -0.13416290283203125, -0.1246490478515625, -0.11513519287109375, -0.105621337890625, -0.09610748291015625, -0.0865936279296875, -0.07707977294921875, -0.06756591796875, -0.05805206298828125, -0.0485382080078125, -0.03902435302734375, -0.029510498046875, -0.01999664306640625, -0.0104827880859375, -0.00096893310546875, 0.008544921875, 0.01805877685546875, 0.0275726318359375, 0.03708648681640625, 0.046600341796875, 0.05611419677734375, 0.0656280517578125, 0.07514190673828125, 0.08465576171875, 0.09416961669921875, 0.1036834716796875, 0.11319732666015625, 0.122711181640625, 0.13222503662109375, 0.1417388916015625, 0.15125274658203125, 0.1607666015625, 0.17028045654296875, 0.1797943115234375, 0.18930816650390625, 0.198822021484375, 0.20833587646484375, 0.2178497314453125, 0.22736358642578125, 0.23687744140625, 0.24639129638671875, 0.2559051513671875, 0.26541900634765625, 0.274932861328125, 0.28444671630859375, 0.2939605712890625, 0.30347442626953125, 0.31298828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 18.0, 23.0, 32.0, 31.0, 55.0, 79.0, 93.0, 124.0, 104.0, 90.0, 94.0, 61.0, 60.0, 37.0, 25.0, 22.0, 11.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3048133850097656e-05, -5.1276758313179016e-05, -4.9505382776260376e-05, -4.7734007239341736e-05, -4.5962631702423096e-05, -4.4191256165504456e-05, -4.2419880628585815e-05, -4.0648505091667175e-05, -3.8877129554748535e-05, -3.7105754017829895e-05, -3.5334378480911255e-05, -3.3563002943992615e-05, -3.1791627407073975e-05, -3.0020251870155334e-05, -2.8248876333236694e-05, -2.6477500796318054e-05, -2.4706125259399414e-05, -2.2934749722480774e-05, -2.1163374185562134e-05, -1.9391998648643494e-05, -1.7620623111724854e-05, -1.5849247574806213e-05, -1.4077872037887573e-05, -1.2306496500968933e-05, -1.0535120964050293e-05, -8.763745427131653e-06, -6.992369890213013e-06, -5.2209943532943726e-06, -3.4496188163757324e-06, -1.6782432794570923e-06, 9.313225746154785e-08, 1.864507794380188e-06, 3.635883331298828e-06, 5.407258868217468e-06, 7.178634405136108e-06, 8.950009942054749e-06, 1.0721385478973389e-05, 1.2492761015892029e-05, 1.4264136552810669e-05, 1.603551208972931e-05, 1.780688762664795e-05, 1.957826316356659e-05, 2.134963870048523e-05, 2.312101423740387e-05, 2.489238977432251e-05, 2.666376531124115e-05, 2.843514084815979e-05, 3.020651638507843e-05, 3.197789192199707e-05, 3.374926745891571e-05, 3.552064299583435e-05, 3.729201853275299e-05, 3.906339406967163e-05, 4.083476960659027e-05, 4.260614514350891e-05, 4.437752068042755e-05, 4.614889621734619e-05, 4.792027175426483e-05, 4.969164729118347e-05, 5.146302282810211e-05, 5.323439836502075e-05, 5.500577390193939e-05, 5.677714943885803e-05, 5.854852497577667e-05, 6.031990051269531e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 16.0, 27.0, 71.0, 153.0, 416.0, 1439.0, 9446.0, 278992.0, 729326.0, 25066.0, 2519.0, 661.0, 251.0, 97.0, 35.0, 7.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49591064453125, -0.4776611328125, -0.45941162109375, -0.441162109375, -0.42291259765625, -0.4046630859375, -0.38641357421875, -0.3681640625, -0.34991455078125, -0.3316650390625, -0.31341552734375, -0.295166015625, -0.27691650390625, -0.2586669921875, -0.24041748046875, -0.22216796875, -0.20391845703125, -0.1856689453125, -0.16741943359375, -0.149169921875, -0.13092041015625, -0.1126708984375, -0.09442138671875, -0.076171875, -0.05792236328125, -0.0396728515625, -0.02142333984375, -0.003173828125, 0.01507568359375, 0.0333251953125, 0.05157470703125, 0.06982421875, 0.08807373046875, 0.1063232421875, 0.12457275390625, 0.142822265625, 0.16107177734375, 0.1793212890625, 0.19757080078125, 0.2158203125, 0.23406982421875, 0.2523193359375, 0.27056884765625, 0.288818359375, 0.30706787109375, 0.3253173828125, 0.34356689453125, 0.36181640625, 0.38006591796875, 0.3983154296875, 0.41656494140625, 0.434814453125, 0.45306396484375, 0.4713134765625, 0.48956298828125, 0.5078125, 0.52606201171875, 0.5443115234375, 0.56256103515625, 0.580810546875, 0.59906005859375, 0.6173095703125, 0.63555908203125, 0.65380859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 10.0, 18.0, 14.0, 30.0, 48.0, 55.0, 72.0, 96.0, 115.0, 98.0, 96.0, 80.0, 73.0, 50.0, 37.0, 21.0, 22.0, 9.0, 8.0, 9.0, 10.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21826171875, -0.20923233032226562, -0.20020294189453125, -0.19117355346679688, -0.1821441650390625, -0.17311477661132812, -0.16408538818359375, -0.15505599975585938, -0.146026611328125, -0.13699722290039062, -0.12796783447265625, -0.11893844604492188, -0.1099090576171875, -0.10087966918945312, -0.09185028076171875, -0.08282089233398438, -0.07379150390625, -0.06476211547851562, -0.05573272705078125, -0.046703338623046875, -0.0376739501953125, -0.028644561767578125, -0.01961517333984375, -0.010585784912109375, -0.001556396484375, 0.007472991943359375, 0.01650238037109375, 0.025531768798828125, 0.0345611572265625, 0.043590545654296875, 0.05261993408203125, 0.061649322509765625, 0.0706787109375, 0.07970809936523438, 0.08873748779296875, 0.09776687622070312, 0.1067962646484375, 0.11582565307617188, 0.12485504150390625, 0.13388442993164062, 0.142913818359375, 0.15194320678710938, 0.16097259521484375, 0.17000198364257812, 0.1790313720703125, 0.18806076049804688, 0.19709014892578125, 0.20611953735351562, 0.21514892578125, 0.22417831420898438, 0.23320770263671875, 0.24223709106445312, 0.2512664794921875, 0.2602958679199219, 0.26932525634765625, 0.2783546447753906, 0.287384033203125, 0.2964134216308594, 0.30544281005859375, 0.3144721984863281, 0.3235015869140625, 0.3325309753417969, 0.34156036376953125, 0.3505897521972656, 0.359619140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 14.0, 16.0, 31.0, 57.0, 98.0, 113.0, 128.0, 134.0, 120.0, 95.0, 76.0, 45.0, 26.0, 21.0, 8.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.726189613342285, -4.572580814361572, -4.418972015380859, -4.265363693237305, -4.111754894256592, -3.958146095275879, -3.804537296295166, -3.650928497314453, -3.4973196983337402, -3.3437108993530273, -3.1901023387908936, -3.0364935398101807, -2.8828847408294678, -2.729276180267334, -2.575667381286621, -2.422058582305908, -2.2684500217437744, -2.1148412227630615, -1.9612325429916382, -1.8076238632202148, -1.654015064239502, -1.5004063844680786, -1.3467977046966553, -1.1931889057159424, -1.039580225944519, -0.8859714865684509, -0.7323627471923828, -0.5787540674209595, -0.42514532804489136, -0.27153658866882324, -0.1179279088973999, 0.03568089008331299, 0.18928956985473633, 0.34289830923080444, 0.49650701880455017, 0.6501157283782959, 0.803724467754364, 0.9573332071304321, 1.1109418869018555, 1.2645506858825684, 1.4181593656539917, 1.571768045425415, 1.725376844406128, 1.8789855241775513, 2.0325942039489746, 2.1862030029296875, 2.3398118019104004, 2.4934206008911133, 2.647029161453247, 2.80063796043396, 2.9542465209960938, 3.1078553199768066, 3.2614641189575195, 3.4150729179382324, 3.568681478500366, 3.722290277481079, 3.875898838043213, 4.029507637023926, 4.183116436004639, 4.336725234985352, 4.490333557128906, 4.643942356109619, 4.797551155090332, 4.951159954071045, 5.104768753051758]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 8.0, 13.0, 8.0, 7.0, 10.0, 15.0, 14.0, 24.0, 16.0, 25.0, 31.0, 31.0, 23.0, 40.0, 41.0, 46.0, 38.0, 51.0, 51.0, 41.0, 33.0, 44.0, 45.0, 32.0, 34.0, 36.0, 29.0, 27.0, 26.0, 21.0, 21.0, 17.0, 18.0, 17.0, 18.0, 12.0, 6.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.694124221801758, -3.58223295211792, -3.470341444015503, -3.358450174331665, -3.246558666229248, -3.13466739654541, -3.0227761268615723, -2.9108848571777344, -2.7989933490753174, -2.6871020793914795, -2.5752105712890625, -2.4633193016052246, -2.3514280319213867, -2.2395365238189697, -2.127645254135132, -2.015753746032715, -1.903862476348877, -1.7919710874557495, -1.680079698562622, -1.5681884288787842, -1.4562970399856567, -1.3444056510925293, -1.2325143814086914, -1.120622992515564, -1.0087316036224365, -0.8968402147293091, -0.7849488854408264, -0.6730575561523438, -0.5611661672592163, -0.44927477836608887, -0.3373834490776062, -0.22549211978912354, -0.1136009693145752, -0.0017096102237701416, 0.11018174886703491, 0.22207310795783997, 0.333964467048645, 0.44585585594177246, 0.5577471852302551, 0.6696385145187378, 0.7815299034118652, 0.8934212923049927, 1.0053126811981201, 1.117203950881958, 1.2290953397750854, 1.340986728668213, 1.4528779983520508, 1.5647693872451782, 1.6766607761383057, 1.788552165031433, 1.9004435539245605, 2.0123348236083984, 2.1242260932922363, 2.2361176013946533, 2.348008871078491, 2.459900379180908, 2.571791648864746, 2.683682918548584, 2.795574426651001, 2.907465696334839, 3.019357204437256, 3.1312484741210938, 3.2431397438049316, 3.3550310134887695, 3.4669225215911865]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 10.0, 9.0, 10.0, 9.0, 15.0, 28.0, 30.0, 38.0, 55.0, 98.0, 142.0, 222.0, 391.0, 753.0, 1528.0, 3056.0, 7592.0, 28285.0, 559956.0, 3536141.0, 40129.0, 9138.0, 3159.0, 1563.0, 799.0, 405.0, 243.0, 151.0, 90.0, 69.0, 46.0, 36.0, 16.0, 18.0, 12.0, 7.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.8447265625, -1.7872467041015625, -1.729766845703125, -1.6722869873046875, -1.61480712890625, -1.5573272705078125, -1.499847412109375, -1.4423675537109375, -1.3848876953125, -1.3274078369140625, -1.269927978515625, -1.2124481201171875, -1.15496826171875, -1.0974884033203125, -1.040008544921875, -0.9825286865234375, -0.925048828125, -0.8675689697265625, -0.810089111328125, -0.7526092529296875, -0.69512939453125, -0.6376495361328125, -0.580169677734375, -0.5226898193359375, -0.4652099609375, -0.4077301025390625, -0.350250244140625, -0.2927703857421875, -0.23529052734375, -0.1778106689453125, -0.120330810546875, -0.0628509521484375, -0.00537109375, 0.0521087646484375, 0.109588623046875, 0.1670684814453125, 0.22454833984375, 0.2820281982421875, 0.339508056640625, 0.3969879150390625, 0.4544677734375, 0.5119476318359375, 0.569427490234375, 0.6269073486328125, 0.68438720703125, 0.7418670654296875, 0.799346923828125, 0.8568267822265625, 0.914306640625, 0.9717864990234375, 1.029266357421875, 1.0867462158203125, 1.14422607421875, 1.2017059326171875, 1.259185791015625, 1.3166656494140625, 1.3741455078125, 1.4316253662109375, 1.489105224609375, 1.5465850830078125, 1.60406494140625, 1.6615447998046875, 1.719024658203125, 1.7765045166015625, 1.833984375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 10.0, 24.0, 30.0, 55.0, 69.0, 75.0, 91.0, 122.0, 139.0, 121.0, 86.0, 71.0, 34.0, 31.0, 19.0, 12.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441162109375, -0.4235343933105469, -0.40590667724609375, -0.3882789611816406, -0.3706512451171875, -0.3530235290527344, -0.33539581298828125, -0.3177680969238281, -0.300140380859375, -0.2825126647949219, -0.26488494873046875, -0.24725723266601562, -0.2296295166015625, -0.21200180053710938, -0.19437408447265625, -0.17674636840820312, -0.15911865234375, -0.14149093627929688, -0.12386322021484375, -0.10623550415039062, -0.0886077880859375, -0.07098007202148438, -0.05335235595703125, -0.035724639892578125, -0.018096923828125, -0.000469207763671875, 0.01715850830078125, 0.034786224365234375, 0.0524139404296875, 0.07004165649414062, 0.08766937255859375, 0.10529708862304688, 0.1229248046875, 0.14055252075195312, 0.15818023681640625, 0.17580795288085938, 0.1934356689453125, 0.21106338500976562, 0.22869110107421875, 0.24631881713867188, 0.263946533203125, 0.2815742492675781, 0.29920196533203125, 0.3168296813964844, 0.3344573974609375, 0.3520851135253906, 0.36971282958984375, 0.3873405456542969, 0.40496826171875, 0.4225959777832031, 0.44022369384765625, 0.4578514099121094, 0.4754791259765625, 0.4931068420410156, 0.5107345581054688, 0.5283622741699219, 0.545989990234375, 0.5636177062988281, 0.5812454223632812, 0.5988731384277344, 0.6165008544921875, 0.6341285705566406, 0.6517562866210938, 0.6693840026855469, 0.68701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 6.0, 17.0, 24.0, 14.0, 32.0, 54.0, 57.0, 94.0, 128.0, 189.0, 346.0, 571.0, 1136.0, 2571.0, 6956.0, 24483.0, 238595.0, 3807294.0, 87700.0, 14966.0, 4813.0, 1988.0, 893.0, 474.0, 278.0, 164.0, 117.0, 73.0, 52.0, 51.0, 26.0, 29.0, 23.0, 12.0, 14.0, 9.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1465301513671875, -1.104583740234375, -1.0626373291015625, -1.02069091796875, -0.9787445068359375, -0.936798095703125, -0.8948516845703125, -0.8529052734375, -0.8109588623046875, -0.769012451171875, -0.7270660400390625, -0.68511962890625, -0.6431732177734375, -0.601226806640625, -0.5592803955078125, -0.517333984375, -0.4753875732421875, -0.433441162109375, -0.3914947509765625, -0.34954833984375, -0.3076019287109375, -0.265655517578125, -0.2237091064453125, -0.1817626953125, -0.1398162841796875, -0.097869873046875, -0.0559234619140625, -0.01397705078125, 0.0279693603515625, 0.069915771484375, 0.1118621826171875, 0.15380859375, 0.1957550048828125, 0.237701416015625, 0.2796478271484375, 0.32159423828125, 0.3635406494140625, 0.405487060546875, 0.4474334716796875, 0.4893798828125, 0.5313262939453125, 0.573272705078125, 0.6152191162109375, 0.65716552734375, 0.6991119384765625, 0.741058349609375, 0.7830047607421875, 0.824951171875, 0.8668975830078125, 0.908843994140625, 0.9507904052734375, 0.99273681640625, 1.0346832275390625, 1.076629638671875, 1.1185760498046875, 1.1605224609375, 1.2024688720703125, 1.244415283203125, 1.2863616943359375, 1.32830810546875, 1.3702545166015625, 1.412200927734375, 1.4541473388671875, 1.49609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 9.0, 1.0, 6.0, 8.0, 17.0, 30.0, 47.0, 100.0, 428.0, 2868.0, 378.0, 92.0, 39.0, 19.0, 15.0, 8.0, 3.0, 8.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5366744995117188, -0.5128021240234375, -0.48892974853515625, -0.465057373046875, -0.44118499755859375, -0.4173126220703125, -0.39344024658203125, -0.36956787109375, -0.34569549560546875, -0.3218231201171875, -0.29795074462890625, -0.274078369140625, -0.25020599365234375, -0.2263336181640625, -0.20246124267578125, -0.1785888671875, -0.15471649169921875, -0.1308441162109375, -0.10697174072265625, -0.083099365234375, -0.05922698974609375, -0.0353546142578125, -0.01148223876953125, 0.01239013671875, 0.03626251220703125, 0.0601348876953125, 0.08400726318359375, 0.107879638671875, 0.13175201416015625, 0.1556243896484375, 0.17949676513671875, 0.203369140625, 0.22724151611328125, 0.2511138916015625, 0.27498626708984375, 0.298858642578125, 0.32273101806640625, 0.3466033935546875, 0.37047576904296875, 0.39434814453125, 0.41822052001953125, 0.4420928955078125, 0.46596527099609375, 0.489837646484375, 0.5137100219726562, 0.5375823974609375, 0.5614547729492188, 0.5853271484375, 0.6091995239257812, 0.6330718994140625, 0.6569442749023438, 0.680816650390625, 0.7046890258789062, 0.7285614013671875, 0.7524337768554688, 0.77630615234375, 0.8001785278320312, 0.8240509033203125, 0.8479232788085938, 0.871795654296875, 0.8956680297851562, 0.9195404052734375, 0.9434127807617188, 0.96728515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 7.0, 23.0, 40.0, 73.0, 139.0, 175.0, 191.0, 134.0, 74.0, 64.0, 28.0, 15.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.583125352859497, -2.507763624191284, -2.4324021339416504, -2.3570404052734375, -2.2816786766052246, -2.206317186355591, -2.130955457687378, -2.055593967437744, -1.9802322387695312, -1.904870629310608, -1.8295090198516846, -1.7541472911834717, -1.6787856817245483, -1.603424072265625, -1.528062343597412, -1.4527007341384888, -1.3773391246795654, -1.301977515220642, -1.2266159057617188, -1.1512541770935059, -1.0758925676345825, -1.0005309581756592, -0.9251692891120911, -0.849807620048523, -0.7744460105895996, -0.6990844011306763, -0.6237227320671082, -0.54836106300354, -0.4729994535446167, -0.39763781428337097, -0.32227617502212524, -0.24691450595855713, -0.1715531349182129, -0.09619149565696716, -0.020829856395721436, 0.05453178286552429, 0.12989342212677002, 0.20525506138801575, 0.2806167006492615, 0.3559783697128296, 0.43133997917175293, 0.5067015886306763, 0.5820632576942444, 0.6574249267578125, 0.7327865362167358, 0.8081481456756592, 0.8835098147392273, 0.9588714838027954, 1.0342330932617188, 1.109594702720642, 1.1849563121795654, 1.2603180408477783, 1.3356796503067017, 1.411041259765625, 1.486402988433838, 1.5617645978927612, 1.6371262073516846, 1.712487816810608, 1.7878494262695312, 1.8632111549377441, 1.9385727643966675, 2.013934373855591, 2.0892961025238037, 2.1646575927734375, 2.2400193214416504]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 11.0, 9.0, 16.0, 11.0, 20.0, 24.0, 31.0, 38.0, 40.0, 52.0, 55.0, 52.0, 68.0, 59.0, 52.0, 64.0, 43.0, 54.0, 52.0, 37.0, 36.0, 36.0, 27.0, 15.0, 16.0, 16.0, 11.0, 8.0, 12.0, 6.0, 4.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2836978435516357, -1.2408756017684937, -1.1980534791946411, -1.155231237411499, -1.1124091148376465, -1.0695868730545044, -1.0267646312713623, -0.983942449092865, -0.9411202669143677, -0.8982980847358704, -0.855475902557373, -0.812653660774231, -0.7698314785957336, -0.7270092964172363, -0.6841870546340942, -0.6413648724555969, -0.5985426902770996, -0.5557205080986023, -0.512898325920105, -0.4700760841369629, -0.4272539019584656, -0.38443171977996826, -0.34160950779914856, -0.29878729581832886, -0.25596511363983154, -0.21314291656017303, -0.17032071948051453, -0.12749852240085602, -0.08467632532119751, -0.041854128241539, 0.0009680688381195068, 0.04379028081893921, 0.08661246299743652, 0.12943466007709503, 0.17225685715675354, 0.21507905423641205, 0.25790125131607056, 0.30072343349456787, 0.3435456454753876, 0.3863678574562073, 0.4291900396347046, 0.4720122218132019, 0.5148344039916992, 0.5576566457748413, 0.6004788279533386, 0.6433010101318359, 0.686123251914978, 0.7289454340934753, 0.7717676162719727, 0.81458979845047, 0.8574119806289673, 0.9002342224121094, 0.9430564045906067, 0.985878586769104, 1.028700828552246, 1.0715229511260986, 1.1143451929092407, 1.1571674346923828, 1.1999895572662354, 1.2428117990493774, 1.2856340408325195, 1.328456163406372, 1.3712784051895142, 1.4141006469726562, 1.4569227695465088]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 6.0, 21.0, 20.0, 29.0, 40.0, 82.0, 122.0, 174.0, 327.0, 513.0, 879.0, 1774.0, 4172.0, 13600.0, 70885.0, 466884.0, 410193.0, 59300.0, 11950.0, 3806.0, 1573.0, 878.0, 482.0, 311.0, 192.0, 110.0, 70.0, 47.0, 37.0, 19.0, 19.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6689453125, -1.6183013916015625, -1.567657470703125, -1.5170135498046875, -1.46636962890625, -1.4157257080078125, -1.365081787109375, -1.3144378662109375, -1.2637939453125, -1.2131500244140625, -1.162506103515625, -1.1118621826171875, -1.06121826171875, -1.0105743408203125, -0.959930419921875, -0.9092864990234375, -0.858642578125, -0.8079986572265625, -0.757354736328125, -0.7067108154296875, -0.65606689453125, -0.6054229736328125, -0.554779052734375, -0.5041351318359375, -0.4534912109375, -0.4028472900390625, -0.352203369140625, -0.3015594482421875, -0.25091552734375, -0.2002716064453125, -0.149627685546875, -0.0989837646484375, -0.04833984375, 0.0023040771484375, 0.052947998046875, 0.1035919189453125, 0.15423583984375, 0.2048797607421875, 0.255523681640625, 0.3061676025390625, 0.3568115234375, 0.4074554443359375, 0.458099365234375, 0.5087432861328125, 0.55938720703125, 0.6100311279296875, 0.660675048828125, 0.7113189697265625, 0.761962890625, 0.8126068115234375, 0.863250732421875, 0.9138946533203125, 0.96453857421875, 1.0151824951171875, 1.065826416015625, 1.1164703369140625, 1.1671142578125, 1.2177581787109375, 1.268402099609375, 1.3190460205078125, 1.36968994140625, 1.4203338623046875, 1.470977783203125, 1.5216217041015625, 1.572265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 22.0, 34.0, 46.0, 59.0, 80.0, 92.0, 122.0, 143.0, 110.0, 77.0, 86.0, 47.0, 24.0, 26.0, 16.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451904296875, -0.4339866638183594, -0.41606903076171875, -0.3981513977050781, -0.3802337646484375, -0.3623161315917969, -0.34439849853515625, -0.3264808654785156, -0.308563232421875, -0.2906455993652344, -0.27272796630859375, -0.2548103332519531, -0.2368927001953125, -0.21897506713867188, -0.20105743408203125, -0.18313980102539062, -0.16522216796875, -0.14730453491210938, -0.12938690185546875, -0.11146926879882812, -0.0935516357421875, -0.07563400268554688, -0.05771636962890625, -0.039798736572265625, -0.021881103515625, -0.003963470458984375, 0.01395416259765625, 0.031871795654296875, 0.0497894287109375, 0.06770706176757812, 0.08562469482421875, 0.10354232788085938, 0.1214599609375, 0.13937759399414062, 0.15729522705078125, 0.17521286010742188, 0.1931304931640625, 0.21104812622070312, 0.22896575927734375, 0.24688339233398438, 0.264801025390625, 0.2827186584472656, 0.30063629150390625, 0.3185539245605469, 0.3364715576171875, 0.3543891906738281, 0.37230682373046875, 0.3902244567871094, 0.40814208984375, 0.4260597229003906, 0.44397735595703125, 0.4618949890136719, 0.4798126220703125, 0.4977302551269531, 0.5156478881835938, 0.5335655212402344, 0.551483154296875, 0.5694007873535156, 0.5873184204101562, 0.6052360534667969, 0.6231536865234375, 0.6410713195800781, 0.6589889526367188, 0.6769065856933594, 0.69482421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 15.0, 9.0, 18.0, 16.0, 21.0, 28.0, 61.0, 75.0, 102.0, 177.0, 316.0, 579.0, 1000.0, 2068.0, 4224.0, 10668.0, 31991.0, 115788.0, 371659.0, 354070.0, 106808.0, 30249.0, 10287.0, 4051.0, 1891.0, 959.0, 520.0, 326.0, 194.0, 120.0, 77.0, 56.0, 40.0, 31.0, 14.0, 9.0, 6.0, 8.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.79638671875, -0.7722320556640625, -0.748077392578125, -0.7239227294921875, -0.69976806640625, -0.6756134033203125, -0.651458740234375, -0.6273040771484375, -0.6031494140625, -0.5789947509765625, -0.554840087890625, -0.5306854248046875, -0.50653076171875, -0.4823760986328125, -0.458221435546875, -0.4340667724609375, -0.409912109375, -0.3857574462890625, -0.361602783203125, -0.3374481201171875, -0.31329345703125, -0.2891387939453125, -0.264984130859375, -0.2408294677734375, -0.2166748046875, -0.1925201416015625, -0.168365478515625, -0.1442108154296875, -0.12005615234375, -0.0959014892578125, -0.071746826171875, -0.0475921630859375, -0.0234375, 0.0007171630859375, 0.024871826171875, 0.0490264892578125, 0.07318115234375, 0.0973358154296875, 0.121490478515625, 0.1456451416015625, 0.1697998046875, 0.1939544677734375, 0.218109130859375, 0.2422637939453125, 0.26641845703125, 0.2905731201171875, 0.314727783203125, 0.3388824462890625, 0.363037109375, 0.3871917724609375, 0.411346435546875, 0.4355010986328125, 0.45965576171875, 0.4838104248046875, 0.507965087890625, 0.5321197509765625, 0.5562744140625, 0.5804290771484375, 0.604583740234375, 0.6287384033203125, 0.65289306640625, 0.6770477294921875, 0.701202392578125, 0.7253570556640625, 0.74951171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 7.0, 6.0, 10.0, 9.0, 15.0, 6.0, 13.0, 18.0, 35.0, 32.0, 32.0, 40.0, 38.0, 50.0, 41.0, 56.0, 50.0, 70.0, 56.0, 48.0, 46.0, 44.0, 50.0, 27.0, 31.0, 29.0, 31.0, 28.0, 22.0, 14.0, 13.0, 6.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1376953125, -1.1014556884765625, -1.065216064453125, -1.0289764404296875, -0.99273681640625, -0.9564971923828125, -0.920257568359375, -0.8840179443359375, -0.8477783203125, -0.8115386962890625, -0.775299072265625, -0.7390594482421875, -0.70281982421875, -0.6665802001953125, -0.630340576171875, -0.5941009521484375, -0.557861328125, -0.5216217041015625, -0.485382080078125, -0.4491424560546875, -0.41290283203125, -0.3766632080078125, -0.340423583984375, -0.3041839599609375, -0.2679443359375, -0.2317047119140625, -0.195465087890625, -0.1592254638671875, -0.12298583984375, -0.0867462158203125, -0.050506591796875, -0.0142669677734375, 0.02197265625, 0.0582122802734375, 0.094451904296875, 0.1306915283203125, 0.16693115234375, 0.2031707763671875, 0.239410400390625, 0.2756500244140625, 0.3118896484375, 0.3481292724609375, 0.384368896484375, 0.4206085205078125, 0.45684814453125, 0.4930877685546875, 0.529327392578125, 0.5655670166015625, 0.601806640625, 0.6380462646484375, 0.674285888671875, 0.7105255126953125, 0.74676513671875, 0.7830047607421875, 0.819244384765625, 0.8554840087890625, 0.8917236328125, 0.9279632568359375, 0.964202880859375, 1.0004425048828125, 1.03668212890625, 1.0729217529296875, 1.109161376953125, 1.1454010009765625, 1.181640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 8.0, 9.0, 14.0, 25.0, 23.0, 41.0, 47.0, 80.0, 114.0, 194.0, 343.0, 529.0, 1134.0, 2389.0, 6016.0, 19286.0, 91089.0, 440110.0, 385410.0, 75445.0, 16314.0, 5389.0, 2216.0, 968.0, 523.0, 278.0, 179.0, 116.0, 71.0, 51.0, 38.0, 21.0, 22.0, 14.0, 11.0, 6.0, 6.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3581581115722656, -0.34790802001953125, -0.3376579284667969, -0.3274078369140625, -0.3171577453613281, -0.30690765380859375, -0.2966575622558594, -0.286407470703125, -0.2761573791503906, -0.26590728759765625, -0.2556571960449219, -0.2454071044921875, -0.23515701293945312, -0.22490692138671875, -0.21465682983398438, -0.20440673828125, -0.19415664672851562, -0.18390655517578125, -0.17365646362304688, -0.1634063720703125, -0.15315628051757812, -0.14290618896484375, -0.13265609741210938, -0.122406005859375, -0.11215591430664062, -0.10190582275390625, -0.09165573120117188, -0.0814056396484375, -0.07115554809570312, -0.06090545654296875, -0.050655364990234375, -0.0404052734375, -0.030155181884765625, -0.01990509033203125, -0.009654998779296875, 0.0005950927734375, 0.010845184326171875, 0.02109527587890625, 0.031345367431640625, 0.041595458984375, 0.051845550537109375, 0.06209564208984375, 0.07234573364257812, 0.0825958251953125, 0.09284591674804688, 0.10309600830078125, 0.11334609985351562, 0.12359619140625, 0.13384628295898438, 0.14409637451171875, 0.15434646606445312, 0.1645965576171875, 0.17484664916992188, 0.18509674072265625, 0.19534683227539062, 0.205596923828125, 0.21584701538085938, 0.22609710693359375, 0.23634719848632812, 0.2465972900390625, 0.2568473815917969, 0.26709747314453125, 0.2773475646972656, 0.28759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 11.0, 12.0, 16.0, 12.0, 21.0, 36.0, 44.0, 48.0, 58.0, 81.0, 100.0, 91.0, 99.0, 89.0, 63.0, 59.0, 41.0, 40.0, 20.0, 12.0, 11.0, 13.0, 6.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.447864532470703e-05, -5.2741728723049164e-05, -5.1004812121391296e-05, -4.926789551973343e-05, -4.753097891807556e-05, -4.5794062316417694e-05, -4.405714571475983e-05, -4.232022911310196e-05, -4.058331251144409e-05, -3.8846395909786224e-05, -3.710947930812836e-05, -3.537256270647049e-05, -3.363564610481262e-05, -3.1898729503154755e-05, -3.0161812901496887e-05, -2.842489629983902e-05, -2.6687979698181152e-05, -2.4951063096523285e-05, -2.3214146494865417e-05, -2.147722989320755e-05, -1.9740313291549683e-05, -1.8003396689891815e-05, -1.6266480088233948e-05, -1.452956348657608e-05, -1.2792646884918213e-05, -1.1055730283260345e-05, -9.318813681602478e-06, -7.581897079944611e-06, -5.844980478286743e-06, -4.108063876628876e-06, -2.3711472749710083e-06, -6.342306733131409e-07, 1.1026859283447266e-06, 2.839602530002594e-06, 4.5765191316604614e-06, 6.313435733318329e-06, 8.050352334976196e-06, 9.787268936634064e-06, 1.1524185538291931e-05, 1.3261102139949799e-05, 1.4998018741607666e-05, 1.6734935343265533e-05, 1.84718519449234e-05, 2.020876854658127e-05, 2.1945685148239136e-05, 2.3682601749897003e-05, 2.541951835155487e-05, 2.7156434953212738e-05, 2.8893351554870605e-05, 3.063026815652847e-05, 3.236718475818634e-05, 3.410410135984421e-05, 3.5841017961502075e-05, 3.757793456315994e-05, 3.931485116481781e-05, 4.105176776647568e-05, 4.2788684368133545e-05, 4.452560096979141e-05, 4.626251757144928e-05, 4.799943417310715e-05, 4.9736350774765015e-05, 5.147326737642288e-05, 5.321018397808075e-05, 5.494710057973862e-05, 5.6684017181396484e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 8.0, 12.0, 18.0, 35.0, 46.0, 123.0, 250.0, 521.0, 1559.0, 6041.0, 32493.0, 263106.0, 618350.0, 105794.0, 15171.0, 3292.0, 958.0, 365.0, 172.0, 88.0, 54.0, 39.0, 21.0, 10.0, 6.0, 6.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.2829399108886719, -0.26827239990234375, -0.2536048889160156, -0.2389373779296875, -0.22426986694335938, -0.20960235595703125, -0.19493484497070312, -0.180267333984375, -0.16559982299804688, -0.15093231201171875, -0.13626480102539062, -0.1215972900390625, -0.10692977905273438, -0.09226226806640625, -0.07759475708007812, -0.06292724609375, -0.048259735107421875, -0.03359222412109375, -0.018924713134765625, -0.0042572021484375, 0.010410308837890625, 0.02507781982421875, 0.039745330810546875, 0.054412841796875, 0.06908035278320312, 0.08374786376953125, 0.09841537475585938, 0.1130828857421875, 0.12775039672851562, 0.14241790771484375, 0.15708541870117188, 0.1717529296875, 0.18642044067382812, 0.20108795166015625, 0.21575546264648438, 0.2304229736328125, 0.24509048461914062, 0.25975799560546875, 0.2744255065917969, 0.289093017578125, 0.3037605285644531, 0.31842803955078125, 0.3330955505371094, 0.3477630615234375, 0.3624305725097656, 0.37709808349609375, 0.3917655944824219, 0.40643310546875, 0.4211006164550781, 0.43576812744140625, 0.4504356384277344, 0.4651031494140625, 0.4797706604003906, 0.49443817138671875, 0.5091056823730469, 0.523773193359375, 0.5384407043457031, 0.5531082153320312, 0.5677757263183594, 0.5824432373046875, 0.5971107482910156, 0.6117782592773438, 0.6264457702636719, 0.64111328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 8.0, 4.0, 5.0, 12.0, 8.0, 14.0, 16.0, 18.0, 32.0, 49.0, 37.0, 59.0, 75.0, 79.0, 86.0, 93.0, 92.0, 76.0, 54.0, 50.0, 31.0, 36.0, 16.0, 8.0, 15.0, 7.0, 4.0, 4.0, 10.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.422119140625, -0.4091911315917969, -0.39626312255859375, -0.3833351135253906, -0.3704071044921875, -0.3574790954589844, -0.34455108642578125, -0.3316230773925781, -0.318695068359375, -0.3057670593261719, -0.29283905029296875, -0.2799110412597656, -0.2669830322265625, -0.2540550231933594, -0.24112701416015625, -0.22819900512695312, -0.21527099609375, -0.20234298706054688, -0.18941497802734375, -0.17648696899414062, -0.1635589599609375, -0.15063095092773438, -0.13770294189453125, -0.12477493286132812, -0.111846923828125, -0.09891891479492188, -0.08599090576171875, -0.07306289672851562, -0.0601348876953125, -0.047206878662109375, -0.03427886962890625, -0.021350860595703125, -0.0084228515625, 0.004505157470703125, 0.01743316650390625, 0.030361175537109375, 0.0432891845703125, 0.056217193603515625, 0.06914520263671875, 0.08207321166992188, 0.095001220703125, 0.10792922973632812, 0.12085723876953125, 0.13378524780273438, 0.1467132568359375, 0.15964126586914062, 0.17256927490234375, 0.18549728393554688, 0.19842529296875, 0.21135330200195312, 0.22428131103515625, 0.23720932006835938, 0.2501373291015625, 0.2630653381347656, 0.27599334716796875, 0.2889213562011719, 0.301849365234375, 0.3147773742675781, 0.32770538330078125, 0.3406333923339844, 0.3535614013671875, 0.3664894104003906, 0.37941741943359375, 0.3923454284667969, 0.4052734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 6.0, 7.0, 5.0, 11.0, 21.0, 31.0, 57.0, 92.0, 123.0, 150.0, 134.0, 130.0, 86.0, 54.0, 30.0, 20.0, 17.0, 11.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7573747634887695, -7.535057544708252, -7.312740325927734, -7.090423107147217, -6.868105888366699, -6.645788669586182, -6.423471450805664, -6.2011542320251465, -5.978837013244629, -5.756519794464111, -5.534202575683594, -5.311885356903076, -5.089568138122559, -4.867250919342041, -4.644933700561523, -4.422616481781006, -4.200299263000488, -3.9779820442199707, -3.755664825439453, -3.5333476066589355, -3.311030387878418, -3.0887131690979004, -2.866395950317383, -2.6440787315368652, -2.4217615127563477, -2.19944429397583, -1.9771270751953125, -1.754809856414795, -1.5324926376342773, -1.3101754188537598, -1.0878582000732422, -0.8655409812927246, -0.6432232856750488, -0.42090606689453125, -0.19858884811401367, 0.023728370666503906, 0.24604558944702148, 0.46836280822753906, 0.6906800270080566, 0.9129972457885742, 1.1353144645690918, 1.3576316833496094, 1.579948902130127, 1.8022661209106445, 2.024583339691162, 2.2469005584716797, 2.4692177772521973, 2.691534996032715, 2.9138522148132324, 3.13616943359375, 3.3584866523742676, 3.580803871154785, 3.8031210899353027, 4.02543830871582, 4.247755527496338, 4.4700727462768555, 4.692389965057373, 4.914707183837891, 5.137024402618408, 5.359341621398926, 5.581658840179443, 5.803976058959961, 6.0262932777404785, 6.248610496520996, 6.470927715301514]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 2.0, 4.0, 7.0, 10.0, 4.0, 11.0, 11.0, 14.0, 15.0, 20.0, 21.0, 21.0, 23.0, 29.0, 23.0, 27.0, 27.0, 41.0, 35.0, 42.0, 35.0, 43.0, 32.0, 32.0, 46.0, 23.0, 38.0, 40.0, 42.0, 30.0, 16.0, 30.0, 21.0, 23.0, 19.0, 19.0, 15.0, 14.0, 20.0, 15.0, 11.0, 8.0, 5.0, 9.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-5.144678115844727, -4.988236904144287, -4.831796169281006, -4.675354957580566, -4.518914222717285, -4.362473011016846, -4.2060322761535645, -4.049591064453125, -3.8931503295898438, -3.7367093563079834, -3.580268383026123, -3.4238274097442627, -3.2673864364624023, -3.110945463180542, -2.9545044898986816, -2.798063278198242, -2.641622304916382, -2.4851813316345215, -2.328740358352661, -2.172299385070801, -2.0158584117889404, -1.85941743850708, -1.7029763460159302, -1.5465353727340698, -1.3900943994522095, -1.2336534261703491, -1.0772124528884888, -0.9207714200019836, -0.7643304467201233, -0.6078894734382629, -0.4514484405517578, -0.29500746726989746, -0.1385664939880371, 0.017874494194984436, 0.17431548237800598, 0.3307564854621887, 0.4871974587440491, 0.6436384320259094, 0.8000794649124146, 0.9565204381942749, 1.1129614114761353, 1.2694023847579956, 1.425843358039856, 1.5822844505310059, 1.7387254238128662, 1.8951663970947266, 2.051607370376587, 2.2080483436584473, 2.3644893169403076, 2.520930290222168, 2.6773712635040283, 2.8338122367858887, 2.990253210067749, 3.1466941833496094, 3.303135395050049, 3.45957612991333, 3.6160173416137695, 3.77245831489563, 3.9288992881774902, 4.08534049987793, 4.241781234741211, 4.39822244644165, 4.554663181304932, 4.711104393005371, 4.867545127868652]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 7.0, 13.0, 13.0, 36.0, 39.0, 41.0, 68.0, 109.0, 175.0, 268.0, 376.0, 735.0, 1437.0, 2865.0, 6516.0, 18736.0, 79728.0, 3610921.0, 411157.0, 40102.0, 11745.0, 4506.0, 2022.0, 1078.0, 581.0, 341.0, 195.0, 132.0, 87.0, 51.0, 42.0, 30.0, 36.0, 22.0, 11.0, 13.0, 8.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.798828125, -1.74560546875, -1.6923828125, -1.63916015625, -1.5859375, -1.53271484375, -1.4794921875, -1.42626953125, -1.373046875, -1.31982421875, -1.2666015625, -1.21337890625, -1.16015625, -1.10693359375, -1.0537109375, -1.00048828125, -0.947265625, -0.89404296875, -0.8408203125, -0.78759765625, -0.734375, -0.68115234375, -0.6279296875, -0.57470703125, -0.521484375, -0.46826171875, -0.4150390625, -0.36181640625, -0.30859375, -0.25537109375, -0.2021484375, -0.14892578125, -0.095703125, -0.04248046875, 0.0107421875, 0.06396484375, 0.1171875, 0.17041015625, 0.2236328125, 0.27685546875, 0.330078125, 0.38330078125, 0.4365234375, 0.48974609375, 0.54296875, 0.59619140625, 0.6494140625, 0.70263671875, 0.755859375, 0.80908203125, 0.8623046875, 0.91552734375, 0.96875, 1.02197265625, 1.0751953125, 1.12841796875, 1.181640625, 1.23486328125, 1.2880859375, 1.34130859375, 1.39453125, 1.44775390625, 1.5009765625, 1.55419921875, 1.607421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 11.0, 10.0, 22.0, 35.0, 46.0, 55.0, 75.0, 70.0, 92.0, 95.0, 108.0, 84.0, 70.0, 63.0, 58.0, 32.0, 27.0, 14.0, 12.0, 6.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437744140625, -0.4200477600097656, -0.40235137939453125, -0.3846549987792969, -0.3669586181640625, -0.3492622375488281, -0.33156585693359375, -0.3138694763183594, -0.296173095703125, -0.2784767150878906, -0.26078033447265625, -0.24308395385742188, -0.2253875732421875, -0.20769119262695312, -0.18999481201171875, -0.17229843139648438, -0.15460205078125, -0.13690567016601562, -0.11920928955078125, -0.10151290893554688, -0.0838165283203125, -0.06612014770507812, -0.04842376708984375, -0.030727386474609375, -0.013031005859375, 0.004665374755859375, 0.02236175537109375, 0.040058135986328125, 0.0577545166015625, 0.07545089721679688, 0.09314727783203125, 0.11084365844726562, 0.1285400390625, 0.14623641967773438, 0.16393280029296875, 0.18162918090820312, 0.1993255615234375, 0.21702194213867188, 0.23471832275390625, 0.2524147033691406, 0.270111083984375, 0.2878074645996094, 0.30550384521484375, 0.3232002258300781, 0.3408966064453125, 0.3585929870605469, 0.37628936767578125, 0.3939857482910156, 0.41168212890625, 0.4293785095214844, 0.44707489013671875, 0.4647712707519531, 0.4824676513671875, 0.5001640319824219, 0.5178604125976562, 0.5355567932128906, 0.553253173828125, 0.5709495544433594, 0.5886459350585938, 0.6063423156738281, 0.6240386962890625, 0.6417350769042969, 0.6594314575195312, 0.6771278381347656, 0.69482421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 20.0, 16.0, 21.0, 41.0, 41.0, 62.0, 79.0, 120.0, 183.0, 334.0, 599.0, 1015.0, 2062.0, 5089.0, 17558.0, 137976.0, 3877090.0, 125653.0, 16922.0, 4868.0, 1977.0, 1072.0, 502.0, 330.0, 210.0, 124.0, 86.0, 59.0, 35.0, 30.0, 22.0, 15.0, 9.0, 8.0, 14.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5625, -1.5095062255859375, -1.456512451171875, -1.4035186767578125, -1.35052490234375, -1.2975311279296875, -1.244537353515625, -1.1915435791015625, -1.1385498046875, -1.0855560302734375, -1.032562255859375, -0.9795684814453125, -0.92657470703125, -0.8735809326171875, -0.820587158203125, -0.7675933837890625, -0.714599609375, -0.6616058349609375, -0.608612060546875, -0.5556182861328125, -0.50262451171875, -0.4496307373046875, -0.396636962890625, -0.3436431884765625, -0.2906494140625, -0.2376556396484375, -0.184661865234375, -0.1316680908203125, -0.07867431640625, -0.0256805419921875, 0.027313232421875, 0.0803070068359375, 0.13330078125, 0.1862945556640625, 0.239288330078125, 0.2922821044921875, 0.34527587890625, 0.3982696533203125, 0.451263427734375, 0.5042572021484375, 0.5572509765625, 0.6102447509765625, 0.663238525390625, 0.7162322998046875, 0.76922607421875, 0.8222198486328125, 0.875213623046875, 0.9282073974609375, 0.981201171875, 1.0341949462890625, 1.087188720703125, 1.1401824951171875, 1.19317626953125, 1.2461700439453125, 1.299163818359375, 1.3521575927734375, 1.4051513671875, 1.4581451416015625, 1.511138916015625, 1.5641326904296875, 1.61712646484375, 1.6701202392578125, 1.723114013671875, 1.7761077880859375, 1.8291015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 15.0, 12.0, 29.0, 51.0, 177.0, 1564.0, 1916.0, 150.0, 67.0, 36.0, 8.0, 17.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.732757568359375, -0.69207763671875, -0.651397705078125, -0.6107177734375, -0.570037841796875, -0.52935791015625, -0.488677978515625, -0.447998046875, -0.407318115234375, -0.36663818359375, -0.325958251953125, -0.2852783203125, -0.244598388671875, -0.20391845703125, -0.163238525390625, -0.12255859375, -0.081878662109375, -0.04119873046875, -0.000518798828125, 0.0401611328125, 0.080841064453125, 0.12152099609375, 0.162200927734375, 0.202880859375, 0.243560791015625, 0.28424072265625, 0.324920654296875, 0.3656005859375, 0.406280517578125, 0.44696044921875, 0.487640380859375, 0.5283203125, 0.569000244140625, 0.60968017578125, 0.650360107421875, 0.6910400390625, 0.731719970703125, 0.77239990234375, 0.813079833984375, 0.853759765625, 0.894439697265625, 0.93511962890625, 0.975799560546875, 1.0164794921875, 1.057159423828125, 1.09783935546875, 1.138519287109375, 1.17919921875, 1.219879150390625, 1.26055908203125, 1.301239013671875, 1.3419189453125, 1.382598876953125, 1.42327880859375, 1.463958740234375, 1.504638671875, 1.545318603515625, 1.58599853515625, 1.626678466796875, 1.6673583984375, 1.708038330078125, 1.74871826171875, 1.789398193359375, 1.830078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 21.0, 27.0, 41.0, 77.0, 110.0, 170.0, 168.0, 147.0, 92.0, 54.0, 28.0, 16.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.304532527923584, -2.1892147064208984, -2.073896646499634, -1.9585788249969482, -1.8432607650756836, -1.727942943572998, -1.612625002861023, -1.4973070621490479, -1.3819891214370728, -1.2666711807250977, -1.1513532400131226, -1.0360352993011475, -0.9207174181938171, -0.805399477481842, -0.6900815963745117, -0.5747636556625366, -0.4594457149505615, -0.3441277742385864, -0.22880986332893372, -0.113491952419281, 0.0018259882926940918, 0.11714392900466919, 0.2324618101119995, 0.3477797508239746, 0.4630976915359497, 0.5784156322479248, 0.6937335729598999, 0.8090514540672302, 0.9243693947792053, 1.0396873950958252, 1.1550052165985107, 1.2703231573104858, 1.385641098022461, 1.500959038734436, 1.6162769794464111, 1.7315948009490967, 1.8469128608703613, 1.9622306823730469, 2.0775485038757324, 2.192866563796997, 2.3081846237182617, 2.4235024452209473, 2.538820505142212, 2.6541383266448975, 2.769456386566162, 2.8847742080688477, 3.000092029571533, 3.115410089492798, 3.2307279109954834, 3.346045732498169, 3.4613637924194336, 3.576681613922119, 3.691999673843384, 3.8073174953460693, 3.922635555267334, 4.0379533767700195, 4.153271198272705, 4.268589019775391, 4.383906841278076, 4.49922513961792, 4.6145429611206055, 4.729860782623291, 4.845178604125977, 4.96049690246582, 5.075814723968506]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 14.0, 19.0, 20.0, 29.0, 45.0, 54.0, 64.0, 74.0, 81.0, 65.0, 73.0, 79.0, 65.0, 61.0, 59.0, 50.0, 33.0, 33.0, 15.0, 12.0, 17.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.718045234680176, -3.6175076961517334, -3.516970157623291, -3.4164326190948486, -3.3158950805664062, -3.215357780456543, -3.1148202419281006, -3.014282703399658, -2.913745164871216, -2.8132076263427734, -2.712670087814331, -2.6121325492858887, -2.5115952491760254, -2.411057472229004, -2.3105201721191406, -2.2099826335906982, -2.109445095062256, -2.0089075565338135, -1.908370018005371, -1.8078325986862183, -1.7072950601577759, -1.6067575216293335, -1.5062201023101807, -1.4056825637817383, -1.305145025253296, -1.2046074867248535, -1.1040699481964111, -1.0035325288772583, -0.9029949903488159, -0.8024574518203735, -0.7019199728965759, -0.6013824939727783, -0.5008449554443359, -0.40030744671821594, -0.29976993799209595, -0.19923242926597595, -0.09869492053985596, 0.0018426179885864258, 0.10238009691238403, 0.20291757583618164, 0.303455114364624, 0.403992623090744, 0.504530131816864, 0.6050676107406616, 0.705605149269104, 0.8061426877975464, 0.906680166721344, 1.0072176456451416, 1.107755184173584, 1.2082927227020264, 1.3088302612304688, 1.4093676805496216, 1.509905219078064, 1.6104427576065063, 1.7109801769256592, 1.8115177154541016, 1.912055253982544, 2.0125927925109863, 2.1131303310394287, 2.213667869567871, 2.3142051696777344, 2.414742946624756, 2.515280246734619, 2.6158177852630615, 2.716355323791504]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 6.0, 11.0, 16.0, 29.0, 34.0, 72.0, 81.0, 123.0, 185.0, 301.0, 382.0, 670.0, 1160.0, 2115.0, 4161.0, 10134.0, 28945.0, 104495.0, 357406.0, 375320.0, 111941.0, 30847.0, 10391.0, 4437.0, 2070.0, 1221.0, 673.0, 442.0, 275.0, 183.0, 123.0, 86.0, 60.0, 41.0, 29.0, 23.0, 17.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2392578125, -1.196563720703125, -1.15386962890625, -1.111175537109375, -1.0684814453125, -1.025787353515625, -0.98309326171875, -0.940399169921875, -0.897705078125, -0.855010986328125, -0.81231689453125, -0.769622802734375, -0.7269287109375, -0.684234619140625, -0.64154052734375, -0.598846435546875, -0.55615234375, -0.513458251953125, -0.47076416015625, -0.428070068359375, -0.3853759765625, -0.342681884765625, -0.29998779296875, -0.257293701171875, -0.214599609375, -0.171905517578125, -0.12921142578125, -0.086517333984375, -0.0438232421875, -0.001129150390625, 0.04156494140625, 0.084259033203125, 0.126953125, 0.169647216796875, 0.21234130859375, 0.255035400390625, 0.2977294921875, 0.340423583984375, 0.38311767578125, 0.425811767578125, 0.468505859375, 0.511199951171875, 0.55389404296875, 0.596588134765625, 0.6392822265625, 0.681976318359375, 0.72467041015625, 0.767364501953125, 0.81005859375, 0.852752685546875, 0.89544677734375, 0.938140869140625, 0.9808349609375, 1.023529052734375, 1.06622314453125, 1.108917236328125, 1.151611328125, 1.194305419921875, 1.23699951171875, 1.279693603515625, 1.3223876953125, 1.365081787109375, 1.40777587890625, 1.450469970703125, 1.4931640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 8.0, 24.0, 20.0, 30.0, 48.0, 42.0, 73.0, 86.0, 75.0, 89.0, 93.0, 89.0, 80.0, 58.0, 55.0, 42.0, 29.0, 25.0, 9.0, 7.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478759765625, -0.4603004455566406, -0.44184112548828125, -0.4233818054199219, -0.4049224853515625, -0.3864631652832031, -0.36800384521484375, -0.3495445251464844, -0.331085205078125, -0.3126258850097656, -0.29416656494140625, -0.2757072448730469, -0.2572479248046875, -0.23878860473632812, -0.22032928466796875, -0.20186996459960938, -0.18341064453125, -0.16495132446289062, -0.14649200439453125, -0.12803268432617188, -0.1095733642578125, -0.09111404418945312, -0.07265472412109375, -0.054195404052734375, -0.035736083984375, -0.017276763916015625, 0.00118255615234375, 0.019641876220703125, 0.0381011962890625, 0.056560516357421875, 0.07501983642578125, 0.09347915649414062, 0.1119384765625, 0.13039779663085938, 0.14885711669921875, 0.16731643676757812, 0.1857757568359375, 0.20423507690429688, 0.22269439697265625, 0.24115371704101562, 0.259613037109375, 0.2780723571777344, 0.29653167724609375, 0.3149909973144531, 0.3334503173828125, 0.3519096374511719, 0.37036895751953125, 0.3888282775878906, 0.40728759765625, 0.4257469177246094, 0.44420623779296875, 0.4626655578613281, 0.4811248779296875, 0.4995841979980469, 0.5180435180664062, 0.5365028381347656, 0.554962158203125, 0.5734214782714844, 0.5918807983398438, 0.6103401184082031, 0.6287994384765625, 0.6472587585449219, 0.6657180786132812, 0.6841773986816406, 0.70263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 8.0, 9.0, 6.0, 14.0, 20.0, 34.0, 53.0, 107.0, 154.0, 341.0, 720.0, 1626.0, 4007.0, 12011.0, 44285.0, 240247.0, 575900.0, 128513.0, 27427.0, 7986.0, 2813.0, 1171.0, 498.0, 266.0, 107.0, 79.0, 64.0, 34.0, 17.0, 10.0, 10.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.689453125, -1.641632080078125, -1.59381103515625, -1.545989990234375, -1.4981689453125, -1.450347900390625, -1.40252685546875, -1.354705810546875, -1.306884765625, -1.259063720703125, -1.21124267578125, -1.163421630859375, -1.1156005859375, -1.067779541015625, -1.01995849609375, -0.972137451171875, -0.92431640625, -0.876495361328125, -0.82867431640625, -0.780853271484375, -0.7330322265625, -0.685211181640625, -0.63739013671875, -0.589569091796875, -0.541748046875, -0.493927001953125, -0.44610595703125, -0.398284912109375, -0.3504638671875, -0.302642822265625, -0.25482177734375, -0.207000732421875, -0.1591796875, -0.111358642578125, -0.06353759765625, -0.015716552734375, 0.0321044921875, 0.079925537109375, 0.12774658203125, 0.175567626953125, 0.223388671875, 0.271209716796875, 0.31903076171875, 0.366851806640625, 0.4146728515625, 0.462493896484375, 0.51031494140625, 0.558135986328125, 0.60595703125, 0.653778076171875, 0.70159912109375, 0.749420166015625, 0.7972412109375, 0.845062255859375, 0.89288330078125, 0.940704345703125, 0.988525390625, 1.036346435546875, 1.08416748046875, 1.131988525390625, 1.1798095703125, 1.227630615234375, 1.27545166015625, 1.323272705078125, 1.37109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 6.0, 5.0, 10.0, 9.0, 19.0, 21.0, 21.0, 23.0, 34.0, 37.0, 44.0, 42.0, 48.0, 60.0, 69.0, 67.0, 59.0, 63.0, 36.0, 50.0, 40.0, 40.0, 39.0, 19.0, 30.0, 22.0, 14.0, 22.0, 7.0, 8.0, 8.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0], "bins": [-2.609375, -2.5466461181640625, -2.483917236328125, -2.4211883544921875, -2.35845947265625, -2.2957305908203125, -2.233001708984375, -2.1702728271484375, -2.1075439453125, -2.0448150634765625, -1.982086181640625, -1.9193572998046875, -1.85662841796875, -1.7938995361328125, -1.731170654296875, -1.6684417724609375, -1.605712890625, -1.5429840087890625, -1.480255126953125, -1.4175262451171875, -1.35479736328125, -1.2920684814453125, -1.229339599609375, -1.1666107177734375, -1.1038818359375, -1.0411529541015625, -0.978424072265625, -0.9156951904296875, -0.85296630859375, -0.7902374267578125, -0.727508544921875, -0.6647796630859375, -0.60205078125, -0.5393218994140625, -0.476593017578125, -0.4138641357421875, -0.35113525390625, -0.2884063720703125, -0.225677490234375, -0.1629486083984375, -0.1002197265625, -0.0374908447265625, 0.025238037109375, 0.0879669189453125, 0.15069580078125, 0.2134246826171875, 0.276153564453125, 0.3388824462890625, 0.401611328125, 0.4643402099609375, 0.527069091796875, 0.5897979736328125, 0.65252685546875, 0.7152557373046875, 0.777984619140625, 0.8407135009765625, 0.9034423828125, 0.9661712646484375, 1.028900146484375, 1.0916290283203125, 1.15435791015625, 1.2170867919921875, 1.279815673828125, 1.3425445556640625, 1.4052734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 12.0, 14.0, 31.0, 42.0, 66.0, 96.0, 227.0, 391.0, 928.0, 2684.0, 11911.0, 135493.0, 823309.0, 62173.0, 7681.0, 2021.0, 725.0, 324.0, 184.0, 101.0, 58.0, 28.0, 17.0, 13.0, 5.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0636138916015625, -1.028594970703125, -0.9935760498046875, -0.95855712890625, -0.9235382080078125, -0.888519287109375, -0.8535003662109375, -0.8184814453125, -0.7834625244140625, -0.748443603515625, -0.7134246826171875, -0.67840576171875, -0.6433868408203125, -0.608367919921875, -0.5733489990234375, -0.538330078125, -0.5033111572265625, -0.468292236328125, -0.4332733154296875, -0.39825439453125, -0.3632354736328125, -0.328216552734375, -0.2931976318359375, -0.2581787109375, -0.2231597900390625, -0.188140869140625, -0.1531219482421875, -0.11810302734375, -0.0830841064453125, -0.048065185546875, -0.0130462646484375, 0.02197265625, 0.0569915771484375, 0.092010498046875, 0.1270294189453125, 0.16204833984375, 0.1970672607421875, 0.232086181640625, 0.2671051025390625, 0.3021240234375, 0.3371429443359375, 0.372161865234375, 0.4071807861328125, 0.44219970703125, 0.4772186279296875, 0.512237548828125, 0.5472564697265625, 0.582275390625, 0.6172943115234375, 0.652313232421875, 0.6873321533203125, 0.72235107421875, 0.7573699951171875, 0.792388916015625, 0.8274078369140625, 0.8624267578125, 0.8974456787109375, 0.932464599609375, 0.9674835205078125, 1.00250244140625, 1.0375213623046875, 1.072540283203125, 1.1075592041015625, 1.142578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 1.0, 13.0, 6.0, 24.0, 26.0, 43.0, 73.0, 116.0, 140.0, 152.0, 158.0, 79.0, 58.0, 39.0, 32.0, 11.0, 13.0, 4.0, 8.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010031461715698242, -9.675044566392899e-05, -9.318627417087555e-05, -8.962210267782211e-05, -8.605793118476868e-05, -8.249375969171524e-05, -7.89295881986618e-05, -7.536541670560837e-05, -7.180124521255493e-05, -6.82370737195015e-05, -6.467290222644806e-05, -6.110873073339462e-05, -5.7544559240341187e-05, -5.398038774728775e-05, -5.0416216254234314e-05, -4.685204476118088e-05, -4.328787326812744e-05, -3.9723701775074005e-05, -3.615953028202057e-05, -3.259535878896713e-05, -2.9031187295913696e-05, -2.546701580286026e-05, -2.1902844309806824e-05, -1.8338672816753387e-05, -1.4774501323699951e-05, -1.1210329830646515e-05, -7.646158337593079e-06, -4.081986844539642e-06, -5.178153514862061e-07, 3.0463561415672302e-06, 6.6105276346206665e-06, 1.0174699127674103e-05, 1.3738870620727539e-05, 1.7303042113780975e-05, 2.086721360683441e-05, 2.4431385099887848e-05, 2.7995556592941284e-05, 3.155972808599472e-05, 3.512389957904816e-05, 3.868807107210159e-05, 4.225224256515503e-05, 4.5816414058208466e-05, 4.93805855512619e-05, 5.294475704431534e-05, 5.6508928537368774e-05, 6.007310003042221e-05, 6.363727152347565e-05, 6.720144301652908e-05, 7.076561450958252e-05, 7.432978600263596e-05, 7.789395749568939e-05, 8.145812898874283e-05, 8.502230048179626e-05, 8.85864719748497e-05, 9.215064346790314e-05, 9.571481496095657e-05, 9.927898645401001e-05, 0.00010284315794706345, 0.00010640732944011688, 0.00010997150093317032, 0.00011353567242622375, 0.00011709984391927719, 0.00012066401541233063, 0.00012422818690538406, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 18.0, 16.0, 31.0, 50.0, 91.0, 139.0, 194.0, 345.0, 586.0, 1196.0, 2756.0, 8341.0, 39937.0, 364184.0, 548447.0, 63895.0, 11675.0, 3462.0, 1432.0, 689.0, 378.0, 229.0, 165.0, 99.0, 49.0, 40.0, 29.0, 13.0, 15.0, 4.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5602645874023438, -0.5370330810546875, -0.5138015747070312, -0.490570068359375, -0.46733856201171875, -0.4441070556640625, -0.42087554931640625, -0.39764404296875, -0.37441253662109375, -0.3511810302734375, -0.32794952392578125, -0.304718017578125, -0.28148651123046875, -0.2582550048828125, -0.23502349853515625, -0.2117919921875, -0.18856048583984375, -0.1653289794921875, -0.14209747314453125, -0.118865966796875, -0.09563446044921875, -0.0724029541015625, -0.04917144775390625, -0.02593994140625, -0.00270843505859375, 0.0205230712890625, 0.04375457763671875, 0.066986083984375, 0.09021759033203125, 0.1134490966796875, 0.13668060302734375, 0.159912109375, 0.18314361572265625, 0.2063751220703125, 0.22960662841796875, 0.252838134765625, 0.27606964111328125, 0.2993011474609375, 0.32253265380859375, 0.34576416015625, 0.36899566650390625, 0.3922271728515625, 0.41545867919921875, 0.438690185546875, 0.46192169189453125, 0.4851531982421875, 0.5083847045898438, 0.5316162109375, 0.5548477172851562, 0.5780792236328125, 0.6013107299804688, 0.624542236328125, 0.6477737426757812, 0.6710052490234375, 0.6942367553710938, 0.71746826171875, 0.7406997680664062, 0.7639312744140625, 0.7871627807617188, 0.810394287109375, 0.8336257934570312, 0.8568572998046875, 0.8800888061523438, 0.9033203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 18.0, 30.0, 32.0, 70.0, 112.0, 183.0, 174.0, 112.0, 78.0, 48.0, 42.0, 26.0, 15.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5205078125, -1.479461669921875, -1.43841552734375, -1.397369384765625, -1.3563232421875, -1.315277099609375, -1.27423095703125, -1.233184814453125, -1.192138671875, -1.151092529296875, -1.11004638671875, -1.069000244140625, -1.0279541015625, -0.986907958984375, -0.94586181640625, -0.904815673828125, -0.86376953125, -0.822723388671875, -0.78167724609375, -0.740631103515625, -0.6995849609375, -0.658538818359375, -0.61749267578125, -0.576446533203125, -0.535400390625, -0.494354248046875, -0.45330810546875, -0.412261962890625, -0.3712158203125, -0.330169677734375, -0.28912353515625, -0.248077392578125, -0.20703125, -0.165985107421875, -0.12493896484375, -0.083892822265625, -0.0428466796875, -0.001800537109375, 0.03924560546875, 0.080291748046875, 0.121337890625, 0.162384033203125, 0.20343017578125, 0.244476318359375, 0.2855224609375, 0.326568603515625, 0.36761474609375, 0.408660888671875, 0.44970703125, 0.490753173828125, 0.53179931640625, 0.572845458984375, 0.6138916015625, 0.654937744140625, 0.69598388671875, 0.737030029296875, 0.778076171875, 0.819122314453125, 0.86016845703125, 0.901214599609375, 0.9422607421875, 0.983306884765625, 1.02435302734375, 1.065399169921875, 1.1064453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 6.0, 20.0, 73.0, 132.0, 206.0, 268.0, 172.0, 66.0, 28.0, 17.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.202939987182617, -27.565452575683594, -26.92796516418457, -26.290477752685547, -25.652990341186523, -25.0155029296875, -24.37801742553711, -23.740530014038086, -23.103042602539062, -22.46555519104004, -21.828067779541016, -21.190580368041992, -20.55309295654297, -19.915607452392578, -19.278118133544922, -18.64063262939453, -18.003143310546875, -17.36565589904785, -16.728168487548828, -16.090681076049805, -15.453194618225098, -14.815707206726074, -14.17821979522705, -13.540733337402344, -12.90324592590332, -12.265758514404297, -11.628271102905273, -10.99078369140625, -10.353297233581543, -9.71580982208252, -9.078322410583496, -8.440835952758789, -7.803347587585449, -7.165860176086426, -6.5283732414245605, -5.890885829925537, -5.253398895263672, -4.615911483764648, -3.978424072265625, -3.3409371376037598, -2.7034497261047363, -2.065962553024292, -1.428475260734558, -0.7909879684448242, -0.15350079536437988, 0.48398637771606445, 1.121473789215088, 1.7589607238769531, 2.3964481353759766, 3.033935308456421, 3.6714224815368652, 4.308909893035889, 4.946396827697754, 5.583884239196777, 6.221371650695801, 6.858858585357666, 7.4963459968566895, 8.133832931518555, 8.771320343017578, 9.408807754516602, 10.046295166015625, 10.683782577514648, 11.321269989013672, 11.958756446838379, 12.596243858337402]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 10.0, 2.0, 6.0, 6.0, 12.0, 11.0, 11.0, 13.0, 29.0, 21.0, 37.0, 22.0, 42.0, 41.0, 40.0, 48.0, 43.0, 50.0, 51.0, 44.0, 55.0, 47.0, 42.0, 37.0, 38.0, 27.0, 35.0, 26.0, 30.0, 32.0, 11.0, 11.0, 16.0, 4.0, 12.0, 11.0, 5.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.04537582397461, -10.709592819213867, -10.373810768127441, -10.0380277633667, -9.702244758605957, -9.366462707519531, -9.030679702758789, -8.694896697998047, -8.359114646911621, -8.023331642150879, -7.687549114227295, -7.351766586303711, -7.015984058380127, -6.680201530456543, -6.344418525695801, -6.008635997772217, -5.672852993011475, -5.337070465087891, -5.001287460327148, -4.6655049324035645, -4.3297224044799805, -3.9939396381378174, -3.6581568717956543, -3.3223743438720703, -2.9865915775299072, -2.650808811187744, -2.31502628326416, -1.979243516921997, -1.6434608697891235, -1.30767822265625, -0.9718954563140869, -0.6361129283905029, -0.30033016204833984, 0.03545251488685608, 0.371235191822052, 0.7070178985595703, 1.0428005456924438, 1.3785831928253174, 1.7143659591674805, 2.0501484870910645, 2.3859312534332275, 2.7217140197753906, 3.0574965476989746, 3.3932793140411377, 3.729062080383301, 4.064844608306885, 4.400627136230469, 4.736410140991211, 5.072192668914795, 5.407975196838379, 5.743758201599121, 6.079540729522705, 6.415323257446289, 6.751106262207031, 7.086888790130615, 7.422671318054199, 7.758454322814941, 8.094237327575684, 8.43001937866211, 8.765802383422852, 9.101585388183594, 9.43736743927002, 9.773150444030762, 10.108932495117188, 10.44471549987793]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 14.0, 30.0, 41.0, 51.0, 78.0, 118.0, 192.0, 328.0, 636.0, 1307.0, 2965.0, 9080.0, 36883.0, 3858815.0, 247669.0, 24416.0, 6876.0, 2468.0, 1067.0, 467.0, 268.0, 173.0, 117.0, 52.0, 43.0, 27.0, 13.0, 15.0, 9.0, 7.0, 0.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.998046875, -1.9407501220703125, -1.883453369140625, -1.8261566162109375, -1.76885986328125, -1.7115631103515625, -1.654266357421875, -1.5969696044921875, -1.5396728515625, -1.4823760986328125, -1.425079345703125, -1.3677825927734375, -1.31048583984375, -1.2531890869140625, -1.195892333984375, -1.1385955810546875, -1.081298828125, -1.0240020751953125, -0.966705322265625, -0.9094085693359375, -0.85211181640625, -0.7948150634765625, -0.737518310546875, -0.6802215576171875, -0.6229248046875, -0.5656280517578125, -0.508331298828125, -0.4510345458984375, -0.39373779296875, -0.3364410400390625, -0.279144287109375, -0.2218475341796875, -0.16455078125, -0.1072540283203125, -0.049957275390625, 0.0073394775390625, 0.06463623046875, 0.1219329833984375, 0.179229736328125, 0.2365264892578125, 0.2938232421875, 0.3511199951171875, 0.408416748046875, 0.4657135009765625, 0.52301025390625, 0.5803070068359375, 0.637603759765625, 0.6949005126953125, 0.752197265625, 0.8094940185546875, 0.866790771484375, 0.9240875244140625, 0.98138427734375, 1.0386810302734375, 1.095977783203125, 1.1532745361328125, 1.2105712890625, 1.2678680419921875, 1.325164794921875, 1.3824615478515625, 1.43975830078125, 1.4970550537109375, 1.554351806640625, 1.6116485595703125, 1.6689453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 8.0, 15.0, 14.0, 14.0, 19.0, 36.0, 38.0, 35.0, 40.0, 45.0, 53.0, 76.0, 71.0, 73.0, 63.0, 59.0, 62.0, 46.0, 38.0, 39.0, 39.0, 37.0, 11.0, 23.0, 8.0, 10.0, 8.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4945220947265625, -0.475860595703125, -0.4571990966796875, -0.43853759765625, -0.4198760986328125, -0.401214599609375, -0.3825531005859375, -0.3638916015625, -0.3452301025390625, -0.326568603515625, -0.3079071044921875, -0.28924560546875, -0.2705841064453125, -0.251922607421875, -0.2332611083984375, -0.214599609375, -0.1959381103515625, -0.177276611328125, -0.1586151123046875, -0.13995361328125, -0.1212921142578125, -0.102630615234375, -0.0839691162109375, -0.0653076171875, -0.0466461181640625, -0.027984619140625, -0.0093231201171875, 0.00933837890625, 0.0279998779296875, 0.046661376953125, 0.0653228759765625, 0.083984375, 0.1026458740234375, 0.121307373046875, 0.1399688720703125, 0.15863037109375, 0.1772918701171875, 0.195953369140625, 0.2146148681640625, 0.2332763671875, 0.2519378662109375, 0.270599365234375, 0.2892608642578125, 0.30792236328125, 0.3265838623046875, 0.345245361328125, 0.3639068603515625, 0.382568359375, 0.4012298583984375, 0.419891357421875, 0.4385528564453125, 0.45721435546875, 0.4758758544921875, 0.494537353515625, 0.5131988525390625, 0.5318603515625, 0.5505218505859375, 0.569183349609375, 0.5878448486328125, 0.60650634765625, 0.6251678466796875, 0.643829345703125, 0.6624908447265625, 0.68115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 12.0, 18.0, 15.0, 22.0, 34.0, 52.0, 48.0, 62.0, 102.0, 120.0, 146.0, 265.0, 395.0, 631.0, 1074.0, 2505.0, 7091.0, 34913.0, 3895593.0, 224658.0, 17568.0, 4700.0, 1837.0, 799.0, 499.0, 275.0, 224.0, 162.0, 106.0, 80.0, 57.0, 53.0, 47.0, 18.0, 25.0, 11.0, 12.0, 8.0, 5.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.572265625, -2.496185302734375, -2.42010498046875, -2.344024658203125, -2.2679443359375, -2.191864013671875, -2.11578369140625, -2.039703369140625, -1.963623046875, -1.887542724609375, -1.81146240234375, -1.735382080078125, -1.6593017578125, -1.583221435546875, -1.50714111328125, -1.431060791015625, -1.35498046875, -1.278900146484375, -1.20281982421875, -1.126739501953125, -1.0506591796875, -0.974578857421875, -0.89849853515625, -0.822418212890625, -0.746337890625, -0.670257568359375, -0.59417724609375, -0.518096923828125, -0.4420166015625, -0.365936279296875, -0.28985595703125, -0.213775634765625, -0.1376953125, -0.061614990234375, 0.01446533203125, 0.090545654296875, 0.1666259765625, 0.242706298828125, 0.31878662109375, 0.394866943359375, 0.470947265625, 0.547027587890625, 0.62310791015625, 0.699188232421875, 0.7752685546875, 0.851348876953125, 0.92742919921875, 1.003509521484375, 1.07958984375, 1.155670166015625, 1.23175048828125, 1.307830810546875, 1.3839111328125, 1.459991455078125, 1.53607177734375, 1.612152099609375, 1.688232421875, 1.764312744140625, 1.84039306640625, 1.916473388671875, 1.9925537109375, 2.068634033203125, 2.14471435546875, 2.220794677734375, 2.296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 18.0, 32.0, 97.0, 3431.0, 376.0, 64.0, 22.0, 8.0, 5.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.1188201904296875, -1.089202880859375, -1.0595855712890625, -1.02996826171875, -1.0003509521484375, -0.970733642578125, -0.9411163330078125, -0.9114990234375, -0.8818817138671875, -0.852264404296875, -0.8226470947265625, -0.79302978515625, -0.7634124755859375, -0.733795166015625, -0.7041778564453125, -0.674560546875, -0.6449432373046875, -0.615325927734375, -0.5857086181640625, -0.55609130859375, -0.5264739990234375, -0.496856689453125, -0.4672393798828125, -0.4376220703125, -0.4080047607421875, -0.378387451171875, -0.3487701416015625, -0.31915283203125, -0.2895355224609375, -0.259918212890625, -0.2303009033203125, -0.20068359375, -0.1710662841796875, -0.141448974609375, -0.1118316650390625, -0.08221435546875, -0.0525970458984375, -0.022979736328125, 0.0066375732421875, 0.0362548828125, 0.0658721923828125, 0.095489501953125, 0.1251068115234375, 0.15472412109375, 0.1843414306640625, 0.213958740234375, 0.2435760498046875, 0.273193359375, 0.3028106689453125, 0.332427978515625, 0.3620452880859375, 0.39166259765625, 0.4212799072265625, 0.450897216796875, 0.4805145263671875, 0.5101318359375, 0.5397491455078125, 0.569366455078125, 0.5989837646484375, 0.62860107421875, 0.6582183837890625, 0.687835693359375, 0.7174530029296875, 0.7470703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 11.0, 20.0, 36.0, 105.0, 169.0, 251.0, 189.0, 107.0, 64.0, 23.0, 12.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.188333988189697, -4.084510803222656, -3.9806878566741943, -3.8768649101257324, -3.7730417251586914, -3.6692187786102295, -3.5653958320617676, -3.4615726470947266, -3.3577497005462646, -3.2539267539978027, -3.1501035690307617, -3.0462806224823, -2.942457675933838, -2.838634490966797, -2.734811544418335, -2.630988597869873, -2.527165412902832, -2.42334246635437, -2.319519281387329, -2.215696334838867, -2.111873149871826, -2.0080502033233643, -1.9042272567749023, -1.8004041910171509, -1.6965811252593994, -1.592758059501648, -1.4889349937438965, -1.3851120471954346, -1.281288981437683, -1.1774659156799316, -1.0736429691314697, -0.9698199033737183, -0.8659965991973877, -0.7621735334396362, -0.6583505272865295, -0.5545275211334229, -0.4507044553756714, -0.3468813896179199, -0.24305838346481323, -0.13923537731170654, -0.03541231155395508, 0.068410724401474, 0.17223376035690308, 0.27605679631233215, 0.37987983226776123, 0.4837028980255127, 0.5875259041786194, 0.6913489103317261, 0.7951719760894775, 0.898995041847229, 1.0028181076049805, 1.1066410541534424, 1.2104641199111938, 1.3142871856689453, 1.4181101322174072, 1.5219331979751587, 1.6257562637329102, 1.7295793294906616, 1.833402395248413, 1.937225341796875, 2.041048526763916, 2.144871473312378, 2.24869441986084, 2.352517604827881, 2.4563405513763428]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 7.0, 13.0, 10.0, 8.0, 19.0, 25.0, 31.0, 21.0, 22.0, 42.0, 36.0, 33.0, 53.0, 53.0, 56.0, 50.0, 51.0, 46.0, 39.0, 60.0, 38.0, 35.0, 34.0, 39.0, 37.0, 21.0, 23.0, 22.0, 14.0, 16.0, 10.0, 11.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3935050964355469, -1.344226360321045, -1.294947624206543, -1.2456687688827515, -1.1963900327682495, -1.1471112966537476, -1.097832441329956, -1.048553705215454, -0.9992749691009521, -0.9499962329864502, -0.9007174372673035, -0.8514386415481567, -0.8021599054336548, -0.7528811693191528, -0.7036023736000061, -0.6543235778808594, -0.6050448417663574, -0.5557661056518555, -0.5064873099327087, -0.4572085440158844, -0.40792977809906006, -0.3586510121822357, -0.3093722462654114, -0.26009348034858704, -0.2108147144317627, -0.16153594851493835, -0.11225718259811401, -0.06297841668128967, -0.013699650764465332, 0.03557911515235901, 0.08485788106918335, 0.1341366469860077, 0.18341553211212158, 0.23269429802894592, 0.28197306394577026, 0.3312518298625946, 0.38053059577941895, 0.4298093616962433, 0.4790881276130676, 0.5283669233322144, 0.5776456594467163, 0.6269243955612183, 0.676203191280365, 0.7254819869995117, 0.7747607231140137, 0.8240394592285156, 0.8733182549476624, 0.9225970506668091, 0.971875786781311, 1.021154522895813, 1.0704333782196045, 1.1197121143341064, 1.1689908504486084, 1.2182695865631104, 1.2675483226776123, 1.3168271780014038, 1.3661059141159058, 1.4153846502304077, 1.4646635055541992, 1.5139422416687012, 1.5632209777832031, 1.612499713897705, 1.661778450012207, 1.7110573053359985, 1.7603360414505005]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 16.0, 28.0, 70.0, 105.0, 218.0, 368.0, 788.0, 1755.0, 4166.0, 12062.0, 41250.0, 175982.0, 492285.0, 239648.0, 55392.0, 15446.0, 5140.0, 1953.0, 947.0, 416.0, 218.0, 112.0, 71.0, 43.0, 25.0, 18.0, 7.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.283203125, -2.225555419921875, -2.16790771484375, -2.110260009765625, -2.0526123046875, -1.994964599609375, -1.93731689453125, -1.879669189453125, -1.822021484375, -1.764373779296875, -1.70672607421875, -1.649078369140625, -1.5914306640625, -1.533782958984375, -1.47613525390625, -1.418487548828125, -1.36083984375, -1.303192138671875, -1.24554443359375, -1.187896728515625, -1.1302490234375, -1.072601318359375, -1.01495361328125, -0.957305908203125, -0.899658203125, -0.842010498046875, -0.78436279296875, -0.726715087890625, -0.6690673828125, -0.611419677734375, -0.55377197265625, -0.496124267578125, -0.4384765625, -0.380828857421875, -0.32318115234375, -0.265533447265625, -0.2078857421875, -0.150238037109375, -0.09259033203125, -0.034942626953125, 0.022705078125, 0.080352783203125, 0.13800048828125, 0.195648193359375, 0.2532958984375, 0.310943603515625, 0.36859130859375, 0.426239013671875, 0.48388671875, 0.541534423828125, 0.59918212890625, 0.656829833984375, 0.7144775390625, 0.772125244140625, 0.82977294921875, 0.887420654296875, 0.945068359375, 1.002716064453125, 1.06036376953125, 1.118011474609375, 1.1756591796875, 1.233306884765625, 1.29095458984375, 1.348602294921875, 1.40625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 6.0, 13.0, 11.0, 9.0, 24.0, 16.0, 20.0, 29.0, 35.0, 31.0, 49.0, 42.0, 44.0, 59.0, 55.0, 58.0, 46.0, 60.0, 55.0, 46.0, 50.0, 41.0, 34.0, 32.0, 20.0, 25.0, 23.0, 15.0, 11.0, 11.0, 4.0, 11.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5013656616210938, -0.4827117919921875, -0.46405792236328125, -0.445404052734375, -0.42675018310546875, -0.4080963134765625, -0.38944244384765625, -0.37078857421875, -0.35213470458984375, -0.3334808349609375, -0.31482696533203125, -0.296173095703125, -0.27751922607421875, -0.2588653564453125, -0.24021148681640625, -0.2215576171875, -0.20290374755859375, -0.1842498779296875, -0.16559600830078125, -0.146942138671875, -0.12828826904296875, -0.1096343994140625, -0.09098052978515625, -0.07232666015625, -0.05367279052734375, -0.0350189208984375, -0.01636505126953125, 0.002288818359375, 0.02094268798828125, 0.0395965576171875, 0.05825042724609375, 0.076904296875, 0.09555816650390625, 0.1142120361328125, 0.13286590576171875, 0.151519775390625, 0.17017364501953125, 0.1888275146484375, 0.20748138427734375, 0.22613525390625, 0.24478912353515625, 0.2634429931640625, 0.28209686279296875, 0.300750732421875, 0.31940460205078125, 0.3380584716796875, 0.35671234130859375, 0.3753662109375, 0.39402008056640625, 0.4126739501953125, 0.43132781982421875, 0.449981689453125, 0.46863555908203125, 0.4872894287109375, 0.5059432983398438, 0.52459716796875, 0.5432510375976562, 0.5619049072265625, 0.5805587768554688, 0.599212646484375, 0.6178665161132812, 0.6365203857421875, 0.6551742553710938, 0.673828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 3.0, 6.0, 4.0, 5.0, 13.0, 17.0, 20.0, 33.0, 36.0, 76.0, 93.0, 151.0, 267.0, 483.0, 876.0, 1798.0, 4093.0, 10447.0, 31441.0, 122537.0, 518310.0, 270316.0, 58353.0, 17236.0, 6398.0, 2759.0, 1229.0, 611.0, 362.0, 201.0, 124.0, 74.0, 55.0, 35.0, 24.0, 17.0, 15.0, 6.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6201171875, -1.5617218017578125, -1.503326416015625, -1.4449310302734375, -1.38653564453125, -1.3281402587890625, -1.269744873046875, -1.2113494873046875, -1.1529541015625, -1.0945587158203125, -1.036163330078125, -0.9777679443359375, -0.91937255859375, -0.8609771728515625, -0.802581787109375, -0.7441864013671875, -0.685791015625, -0.6273956298828125, -0.569000244140625, -0.5106048583984375, -0.45220947265625, -0.3938140869140625, -0.335418701171875, -0.2770233154296875, -0.2186279296875, -0.1602325439453125, -0.101837158203125, -0.0434417724609375, 0.01495361328125, 0.0733489990234375, 0.131744384765625, 0.1901397705078125, 0.24853515625, 0.3069305419921875, 0.365325927734375, 0.4237213134765625, 0.48211669921875, 0.5405120849609375, 0.598907470703125, 0.6573028564453125, 0.7156982421875, 0.7740936279296875, 0.832489013671875, 0.8908843994140625, 0.94927978515625, 1.0076751708984375, 1.066070556640625, 1.1244659423828125, 1.182861328125, 1.2412567138671875, 1.299652099609375, 1.3580474853515625, 1.41644287109375, 1.4748382568359375, 1.533233642578125, 1.5916290283203125, 1.6500244140625, 1.7084197998046875, 1.766815185546875, 1.8252105712890625, 1.88360595703125, 1.9420013427734375, 2.000396728515625, 2.0587921142578125, 2.1171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 9.0, 6.0, 12.0, 9.0, 20.0, 25.0, 18.0, 39.0, 38.0, 35.0, 61.0, 62.0, 56.0, 66.0, 64.0, 66.0, 54.0, 71.0, 60.0, 51.0, 36.0, 24.0, 24.0, 19.0, 21.0, 11.0, 10.0, 8.0, 5.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.7373046875, -2.603515625, -2.4697265625, -2.3359375, -2.2021484375, -2.068359375, -1.9345703125, -1.80078125, -1.6669921875, -1.533203125, -1.3994140625, -1.265625, -1.1318359375, -0.998046875, -0.8642578125, -0.73046875, -0.5966796875, -0.462890625, -0.3291015625, -0.1953125, -0.0615234375, 0.072265625, 0.2060546875, 0.33984375, 0.4736328125, 0.607421875, 0.7412109375, 0.875, 1.0087890625, 1.142578125, 1.2763671875, 1.41015625, 1.5439453125, 1.677734375, 1.8115234375, 1.9453125, 2.0791015625, 2.212890625, 2.3466796875, 2.48046875, 2.6142578125, 2.748046875, 2.8818359375, 3.015625, 3.1494140625, 3.283203125, 3.4169921875, 3.55078125, 3.6845703125, 3.818359375, 3.9521484375, 4.0859375, 4.2197265625, 4.353515625, 4.4873046875, 4.62109375, 4.7548828125, 4.888671875, 5.0224609375, 5.15625, 5.2900390625, 5.423828125, 5.5576171875, 5.69140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 0.0, 2.0, 2.0, 8.0, 10.0, 25.0, 29.0, 49.0, 82.0, 162.0, 328.0, 788.0, 2872.0, 31419.0, 997360.0, 12237.0, 1938.0, 658.0, 259.0, 132.0, 77.0, 55.0, 27.0, 10.0, 8.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.6175537109375, -2.518310546875, -2.4190673828125, -2.31982421875, -2.2205810546875, -2.121337890625, -2.0220947265625, -1.9228515625, -1.8236083984375, -1.724365234375, -1.6251220703125, -1.52587890625, -1.4266357421875, -1.327392578125, -1.2281494140625, -1.12890625, -1.0296630859375, -0.930419921875, -0.8311767578125, -0.73193359375, -0.6326904296875, -0.533447265625, -0.4342041015625, -0.3349609375, -0.2357177734375, -0.136474609375, -0.0372314453125, 0.06201171875, 0.1612548828125, 0.260498046875, 0.3597412109375, 0.458984375, 0.5582275390625, 0.657470703125, 0.7567138671875, 0.85595703125, 0.9552001953125, 1.054443359375, 1.1536865234375, 1.2529296875, 1.3521728515625, 1.451416015625, 1.5506591796875, 1.64990234375, 1.7491455078125, 1.848388671875, 1.9476318359375, 2.046875, 2.1461181640625, 2.245361328125, 2.3446044921875, 2.44384765625, 2.5430908203125, 2.642333984375, 2.7415771484375, 2.8408203125, 2.9400634765625, 3.039306640625, 3.1385498046875, 3.23779296875, 3.3370361328125, 3.436279296875, 3.5355224609375, 3.634765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 14.0, 16.0, 24.0, 48.0, 43.0, 90.0, 100.0, 114.0, 137.0, 111.0, 91.0, 63.0, 46.0, 29.0, 19.0, 17.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014662742614746094, -0.00014279503375291824, -0.00013896264135837555, -0.00013513024896383286, -0.00013129785656929016, -0.00012746546417474747, -0.00012363307178020477, -0.00011980067938566208, -0.00011596828699111938, -0.00011213589459657669, -0.000108303502202034, -0.0001044711098074913, -0.00010063871741294861, -9.680632501840591e-05, -9.297393262386322e-05, -8.914154022932053e-05, -8.530914783477783e-05, -8.147675544023514e-05, -7.764436304569244e-05, -7.381197065114975e-05, -6.997957825660706e-05, -6.614718586206436e-05, -6.231479346752167e-05, -5.8482401072978973e-05, -5.465000867843628e-05, -5.0817616283893585e-05, -4.698522388935089e-05, -4.31528314948082e-05, -3.93204391002655e-05, -3.548804670572281e-05, -3.1655654311180115e-05, -2.782326191663742e-05, -2.3990869522094727e-05, -2.0158477127552032e-05, -1.632608473300934e-05, -1.2493692338466644e-05, -8.66129994392395e-06, -4.828907549381256e-06, -9.96515154838562e-07, 2.835877239704132e-06, 6.668269634246826e-06, 1.050066202878952e-05, 1.4333054423332214e-05, 1.816544681787491e-05, 2.1997839212417603e-05, 2.5830231606960297e-05, 2.966262400150299e-05, 3.3495016396045685e-05, 3.732740879058838e-05, 4.115980118513107e-05, 4.499219357967377e-05, 4.882458597421646e-05, 5.2656978368759155e-05, 5.648937076330185e-05, 6.0321763157844543e-05, 6.415415555238724e-05, 6.798654794692993e-05, 7.181894034147263e-05, 7.565133273601532e-05, 7.948372513055801e-05, 8.331611752510071e-05, 8.71485099196434e-05, 9.09809023141861e-05, 9.481329470872879e-05, 9.864568710327148e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 16.0, 6.0, 17.0, 32.0, 43.0, 104.0, 190.0, 416.0, 885.0, 2129.0, 7192.0, 118147.0, 886708.0, 25705.0, 4180.0, 1491.0, 605.0, 321.0, 150.0, 86.0, 40.0, 22.0, 25.0, 15.0, 9.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.82073974609375, -1.7625732421875, -1.70440673828125, -1.646240234375, -1.58807373046875, -1.5299072265625, -1.47174072265625, -1.41357421875, -1.35540771484375, -1.2972412109375, -1.23907470703125, -1.180908203125, -1.12274169921875, -1.0645751953125, -1.00640869140625, -0.9482421875, -0.89007568359375, -0.8319091796875, -0.77374267578125, -0.715576171875, -0.65740966796875, -0.5992431640625, -0.54107666015625, -0.48291015625, -0.42474365234375, -0.3665771484375, -0.30841064453125, -0.250244140625, -0.19207763671875, -0.1339111328125, -0.07574462890625, -0.017578125, 0.04058837890625, 0.0987548828125, 0.15692138671875, 0.215087890625, 0.27325439453125, 0.3314208984375, 0.38958740234375, 0.44775390625, 0.50592041015625, 0.5640869140625, 0.62225341796875, 0.680419921875, 0.73858642578125, 0.7967529296875, 0.85491943359375, 0.9130859375, 0.97125244140625, 1.0294189453125, 1.08758544921875, 1.145751953125, 1.20391845703125, 1.2620849609375, 1.32025146484375, 1.37841796875, 1.43658447265625, 1.4947509765625, 1.55291748046875, 1.611083984375, 1.66925048828125, 1.7274169921875, 1.78558349609375, 1.84375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 9.0, 28.0, 70.0, 156.0, 289.0, 238.0, 112.0, 48.0, 15.0, 10.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.4366455078125, -3.347900390625, -3.2591552734375, -3.17041015625, -3.0816650390625, -2.992919921875, -2.9041748046875, -2.8154296875, -2.7266845703125, -2.637939453125, -2.5491943359375, -2.46044921875, -2.3717041015625, -2.282958984375, -2.1942138671875, -2.10546875, -2.0167236328125, -1.927978515625, -1.8392333984375, -1.75048828125, -1.6617431640625, -1.572998046875, -1.4842529296875, -1.3955078125, -1.3067626953125, -1.218017578125, -1.1292724609375, -1.04052734375, -0.9517822265625, -0.863037109375, -0.7742919921875, -0.685546875, -0.5968017578125, -0.508056640625, -0.4193115234375, -0.33056640625, -0.2418212890625, -0.153076171875, -0.0643310546875, 0.0244140625, 0.1131591796875, 0.201904296875, 0.2906494140625, 0.37939453125, 0.4681396484375, 0.556884765625, 0.6456298828125, 0.734375, 0.8231201171875, 0.911865234375, 1.0006103515625, 1.08935546875, 1.1781005859375, 1.266845703125, 1.3555908203125, 1.4443359375, 1.5330810546875, 1.621826171875, 1.7105712890625, 1.79931640625, 1.8880615234375, 1.976806640625, 2.0655517578125, 2.154296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 17.0, 22.0, 56.0, 117.0, 216.0, 235.0, 156.0, 97.0, 43.0, 22.0, 12.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.19236755371094, -47.25567626953125, -46.3189811706543, -45.382286071777344, -44.445594787597656, -43.50890350341797, -42.572208404541016, -41.63551330566406, -40.698822021484375, -39.76213073730469, -38.825435638427734, -37.88874053955078, -36.952049255371094, -36.015357971191406, -35.07866287231445, -34.1419677734375, -33.20527648925781, -32.268585205078125, -31.331890106201172, -30.39519691467285, -29.45850372314453, -28.52181053161621, -27.58511734008789, -26.64842414855957, -25.71173095703125, -24.77503776550293, -23.83834457397461, -22.90165138244629, -21.96495819091797, -21.02826499938965, -20.091571807861328, -19.154878616333008, -18.218185424804688, -17.281492233276367, -16.344799041748047, -15.408105850219727, -14.471412658691406, -13.534719467163086, -12.598026275634766, -11.661333084106445, -10.724639892578125, -9.787946701049805, -8.851253509521484, -7.914560317993164, -6.977867126464844, -6.041173934936523, -5.104480743408203, -4.167787551879883, -3.2310943603515625, -2.294401168823242, -1.3577079772949219, -0.42101478576660156, 0.5156784057617188, 1.452371597290039, 2.3890647888183594, 3.3257579803466797, 4.262451171875, 5.19914436340332, 6.135837554931641, 7.072530746459961, 8.009223937988281, 8.945917129516602, 9.882610321044922, 10.819303512573242, 11.755996704101562]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 10.0, 10.0, 9.0, 11.0, 18.0, 21.0, 11.0, 19.0, 20.0, 23.0, 27.0, 30.0, 30.0, 39.0, 31.0, 54.0, 48.0, 50.0, 41.0, 55.0, 53.0, 29.0, 38.0, 37.0, 45.0, 33.0, 24.0, 26.0, 16.0, 19.0, 16.0, 20.0, 13.0, 5.0, 15.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.521869659423828, -16.038021087646484, -15.554170608520508, -15.070322036743164, -14.586472511291504, -14.102622985839844, -13.618773460388184, -13.134923934936523, -12.65107536315918, -12.16722583770752, -11.68337631225586, -11.199527740478516, -10.715678215026855, -10.231828689575195, -9.747979164123535, -9.264129638671875, -8.780281066894531, -8.296431541442871, -7.812582492828369, -7.328732967376709, -6.844883918762207, -6.361034393310547, -5.877184867858887, -5.393335819244385, -4.909485816955566, -4.425636291503906, -3.9417872428894043, -3.457937717437744, -2.974088668823242, -2.490239143371582, -2.006389856338501, -1.52254056930542, -1.038691520690918, -0.5548422336578369, -0.07099288702011108, 0.41285645961761475, 0.8967057466506958, 1.3805551528930664, 1.8644044399261475, 2.3482537269592285, 2.8321030139923096, 3.3159523010253906, 3.7998015880584717, 4.283650875091553, 4.767500400543213, 5.251349449157715, 5.735198974609375, 6.219048500061035, 6.702897548675537, 7.186747074127197, 7.670596122741699, 8.15444564819336, 8.63829517364502, 9.12214469909668, 9.605993270874023, 10.089842796325684, 10.573692321777344, 11.057541847229004, 11.541391372680664, 12.025239944458008, 12.509089469909668, 12.992938995361328, 13.476788520812988, 13.960638046264648, 14.444486618041992]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 3.0, 8.0, 11.0, 18.0, 28.0, 26.0, 39.0, 50.0, 52.0, 70.0, 110.0, 119.0, 219.0, 337.0, 508.0, 877.0, 1579.0, 3146.0, 7370.0, 24684.0, 212926.0, 3876838.0, 45428.0, 11102.0, 4285.0, 1900.0, 975.0, 566.0, 302.0, 198.0, 144.0, 108.0, 55.0, 37.0, 39.0, 31.0, 20.0, 14.0, 4.0, 8.0, 8.0, 5.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7531280517578125, -1.698638916015625, -1.6441497802734375, -1.58966064453125, -1.5351715087890625, -1.480682373046875, -1.4261932373046875, -1.3717041015625, -1.3172149658203125, -1.262725830078125, -1.2082366943359375, -1.15374755859375, -1.0992584228515625, -1.044769287109375, -0.9902801513671875, -0.935791015625, -0.8813018798828125, -0.826812744140625, -0.7723236083984375, -0.71783447265625, -0.6633453369140625, -0.608856201171875, -0.5543670654296875, -0.4998779296875, -0.4453887939453125, -0.390899658203125, -0.3364105224609375, -0.28192138671875, -0.2274322509765625, -0.172943115234375, -0.1184539794921875, -0.06396484375, -0.0094757080078125, 0.045013427734375, 0.0995025634765625, 0.15399169921875, 0.2084808349609375, 0.262969970703125, 0.3174591064453125, 0.3719482421875, 0.4264373779296875, 0.480926513671875, 0.5354156494140625, 0.58990478515625, 0.6443939208984375, 0.698883056640625, 0.7533721923828125, 0.807861328125, 0.8623504638671875, 0.916839599609375, 0.9713287353515625, 1.02581787109375, 1.0803070068359375, 1.134796142578125, 1.1892852783203125, 1.2437744140625, 1.2982635498046875, 1.352752685546875, 1.4072418212890625, 1.46173095703125, 1.5162200927734375, 1.570709228515625, 1.6251983642578125, 1.6796875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 10.0, 8.0, 9.0, 21.0, 17.0, 22.0, 28.0, 30.0, 45.0, 51.0, 47.0, 70.0, 62.0, 48.0, 74.0, 68.0, 51.0, 64.0, 55.0, 42.0, 37.0, 30.0, 23.0, 16.0, 11.0, 15.0, 9.0, 11.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.6896743774414062, -0.6659698486328125, -0.6422653198242188, -0.618560791015625, -0.5948562622070312, -0.5711517333984375, -0.5474472045898438, -0.52374267578125, -0.5000381469726562, -0.4763336181640625, -0.45262908935546875, -0.428924560546875, -0.40522003173828125, -0.3815155029296875, -0.35781097412109375, -0.3341064453125, -0.31040191650390625, -0.2866973876953125, -0.26299285888671875, -0.239288330078125, -0.21558380126953125, -0.1918792724609375, -0.16817474365234375, -0.14447021484375, -0.12076568603515625, -0.0970611572265625, -0.07335662841796875, -0.049652099609375, -0.02594757080078125, -0.0022430419921875, 0.02146148681640625, 0.045166015625, 0.06887054443359375, 0.0925750732421875, 0.11627960205078125, 0.139984130859375, 0.16368865966796875, 0.1873931884765625, 0.21109771728515625, 0.23480224609375, 0.25850677490234375, 0.2822113037109375, 0.30591583251953125, 0.329620361328125, 0.35332489013671875, 0.3770294189453125, 0.40073394775390625, 0.4244384765625, 0.44814300537109375, 0.4718475341796875, 0.49555206298828125, 0.519256591796875, 0.5429611206054688, 0.5666656494140625, 0.5903701782226562, 0.61407470703125, 0.6377792358398438, 0.6614837646484375, 0.6851882934570312, 0.708892822265625, 0.7325973510742188, 0.7563018798828125, 0.7800064086914062, 0.8037109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 10.0, 22.0, 27.0, 45.0, 62.0, 83.0, 94.0, 134.0, 192.0, 274.0, 415.0, 678.0, 983.0, 1533.0, 2741.0, 5142.0, 10204.0, 25273.0, 90024.0, 3586189.0, 377830.0, 55870.0, 18225.0, 7874.0, 4064.0, 2252.0, 1406.0, 847.0, 570.0, 346.0, 254.0, 172.0, 114.0, 90.0, 64.0, 53.0, 29.0, 36.0, 17.0, 7.0, 14.0, 13.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.5, -1.456939697265625, -1.41387939453125, -1.370819091796875, -1.3277587890625, -1.284698486328125, -1.24163818359375, -1.198577880859375, -1.155517578125, -1.112457275390625, -1.06939697265625, -1.026336669921875, -0.9832763671875, -0.940216064453125, -0.89715576171875, -0.854095458984375, -0.81103515625, -0.767974853515625, -0.72491455078125, -0.681854248046875, -0.6387939453125, -0.595733642578125, -0.55267333984375, -0.509613037109375, -0.466552734375, -0.423492431640625, -0.38043212890625, -0.337371826171875, -0.2943115234375, -0.251251220703125, -0.20819091796875, -0.165130615234375, -0.1220703125, -0.079010009765625, -0.03594970703125, 0.007110595703125, 0.0501708984375, 0.093231201171875, 0.13629150390625, 0.179351806640625, 0.222412109375, 0.265472412109375, 0.30853271484375, 0.351593017578125, 0.3946533203125, 0.437713623046875, 0.48077392578125, 0.523834228515625, 0.56689453125, 0.609954833984375, 0.65301513671875, 0.696075439453125, 0.7391357421875, 0.782196044921875, 0.82525634765625, 0.868316650390625, 0.911376953125, 0.954437255859375, 0.99749755859375, 1.040557861328125, 1.0836181640625, 1.126678466796875, 1.16973876953125, 1.212799072265625, 1.255859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 7.0, 7.0, 10.0, 16.0, 35.0, 63.0, 91.0, 222.0, 3009.0, 344.0, 97.0, 66.0, 37.0, 15.0, 14.0, 7.0, 8.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.492919921875, -0.4757423400878906, -0.45856475830078125, -0.4413871765136719, -0.4242095947265625, -0.4070320129394531, -0.38985443115234375, -0.3726768493652344, -0.355499267578125, -0.3383216857910156, -0.32114410400390625, -0.3039665222167969, -0.2867889404296875, -0.2696113586425781, -0.25243377685546875, -0.23525619506835938, -0.21807861328125, -0.20090103149414062, -0.18372344970703125, -0.16654586791992188, -0.1493682861328125, -0.13219070434570312, -0.11501312255859375, -0.09783554077148438, -0.080657958984375, -0.06348037719726562, -0.04630279541015625, -0.029125213623046875, -0.0119476318359375, 0.005229949951171875, 0.02240753173828125, 0.039585113525390625, 0.0567626953125, 0.07394027709960938, 0.09111785888671875, 0.10829544067382812, 0.1254730224609375, 0.14265060424804688, 0.15982818603515625, 0.17700576782226562, 0.194183349609375, 0.21136093139648438, 0.22853851318359375, 0.24571609497070312, 0.2628936767578125, 0.2800712585449219, 0.29724884033203125, 0.3144264221191406, 0.33160400390625, 0.3487815856933594, 0.36595916748046875, 0.3831367492675781, 0.4003143310546875, 0.4174919128417969, 0.43466949462890625, 0.4518470764160156, 0.469024658203125, 0.4862022399902344, 0.5033798217773438, 0.5205574035644531, 0.5377349853515625, 0.5549125671386719, 0.5720901489257812, 0.5892677307128906, 0.6064453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 15.0, 27.0, 42.0, 77.0, 113.0, 145.0, 140.0, 135.0, 102.0, 108.0, 44.0, 27.0, 17.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.461196422576904, -4.375263214111328, -4.289329528808594, -4.203396320343018, -4.117463111877441, -4.031529426574707, -3.945596218109131, -3.8596630096435547, -3.7737295627593994, -3.687796115875244, -3.601862907409668, -3.5159294605255127, -3.4299962520599365, -3.3440628051757812, -3.258129596710205, -3.17219614982605, -3.0862627029418945, -3.0003292560577393, -2.914396047592163, -2.828462600708008, -2.7425293922424316, -2.6565959453582764, -2.570662498474121, -2.484729290008545, -2.3987960815429688, -2.3128626346588135, -2.2269294261932373, -2.140995979309082, -2.055062770843506, -1.9691293239593506, -1.8831959962844849, -1.7972626686096191, -1.7113293409347534, -1.6253960132598877, -1.539462685585022, -1.4535293579101562, -1.367595911026001, -1.2816625833511353, -1.1957292556762695, -1.1097958087921143, -1.023862600326538, -0.9379292726516724, -0.8519958853721619, -0.7660625576972961, -0.6801291704177856, -0.5941958427429199, -0.5082625150680542, -0.4223291277885437, -0.3363957405090332, -0.2504623830318451, -0.16452904045581818, -0.07859569787979126, 0.007337659597396851, 0.09327101707458496, 0.17920434474945068, 0.2651377320289612, 0.3510710597038269, 0.437004417181015, 0.5229377746582031, 0.6088711023330688, 0.6948044300079346, 0.7807378172874451, 0.8666711449623108, 0.9526045322418213, 1.038537859916687]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 9.0, 9.0, 15.0, 20.0, 21.0, 15.0, 24.0, 24.0, 26.0, 37.0, 31.0, 35.0, 44.0, 36.0, 52.0, 45.0, 48.0, 36.0, 36.0, 47.0, 36.0, 47.0, 31.0, 37.0, 31.0, 29.0, 27.0, 23.0, 22.0, 18.0, 11.0, 12.0, 12.0, 4.0, 6.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1898448467254639, -1.1543632745742798, -1.1188818216323853, -1.0834002494812012, -1.0479187965393066, -1.0124372243881226, -0.9769556522369385, -0.9414741396903992, -0.9059926271438599, -0.8705111145973206, -0.8350296020507812, -0.7995480298995972, -0.7640665173530579, -0.7285850048065186, -0.6931034326553345, -0.6576219201087952, -0.6221404075622559, -0.5866588950157166, -0.5511773824691772, -0.5156958103179932, -0.48021429777145386, -0.44473278522491455, -0.40925124287605286, -0.37376970052719116, -0.33828818798065186, -0.30280667543411255, -0.26732513308525085, -0.23184360563755035, -0.19636207818984985, -0.16088055074214935, -0.12539902329444885, -0.08991749584674835, -0.05443596839904785, -0.01895444095134735, 0.01652708649635315, 0.05200861394405365, 0.08749014139175415, 0.12297166883945465, 0.15845319628715515, 0.19393472373485565, 0.22941625118255615, 0.26489776372909546, 0.30037930607795715, 0.33586084842681885, 0.37134236097335815, 0.40682387351989746, 0.44230541586875916, 0.47778695821762085, 0.5132684707641602, 0.5487499833106995, 0.5842314958572388, 0.6197130680084229, 0.6551945805549622, 0.6906760931015015, 0.7261576652526855, 0.7616391777992249, 0.7971206903457642, 0.8326022028923035, 0.8680837154388428, 0.9035652875900269, 0.9390468001365662, 0.9745283126831055, 1.0100098848342896, 1.045491337776184, 1.0809729099273682]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 9.0, 11.0, 17.0, 29.0, 47.0, 78.0, 103.0, 148.0, 232.0, 366.0, 528.0, 921.0, 1540.0, 2980.0, 5474.0, 11110.0, 24301.0, 58245.0, 144497.0, 292038.0, 278483.0, 130608.0, 52686.0, 22175.0, 10203.0, 5012.0, 2696.0, 1545.0, 888.0, 546.0, 323.0, 210.0, 153.0, 113.0, 73.0, 40.0, 32.0, 19.0, 17.0, 16.0, 7.0, 10.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0109710693359375, -0.976043701171875, -0.9411163330078125, -0.90618896484375, -0.8712615966796875, -0.836334228515625, -0.8014068603515625, -0.7664794921875, -0.7315521240234375, -0.696624755859375, -0.6616973876953125, -0.62677001953125, -0.5918426513671875, -0.556915283203125, -0.5219879150390625, -0.487060546875, -0.4521331787109375, -0.417205810546875, -0.3822784423828125, -0.34735107421875, -0.3124237060546875, -0.277496337890625, -0.2425689697265625, -0.2076416015625, -0.1727142333984375, -0.137786865234375, -0.1028594970703125, -0.06793212890625, -0.0330047607421875, 0.001922607421875, 0.0368499755859375, 0.07177734375, 0.1067047119140625, 0.141632080078125, 0.1765594482421875, 0.21148681640625, 0.2464141845703125, 0.281341552734375, 0.3162689208984375, 0.3511962890625, 0.3861236572265625, 0.421051025390625, 0.4559783935546875, 0.49090576171875, 0.5258331298828125, 0.560760498046875, 0.5956878662109375, 0.630615234375, 0.6655426025390625, 0.700469970703125, 0.7353973388671875, 0.77032470703125, 0.8052520751953125, 0.840179443359375, 0.8751068115234375, 0.9100341796875, 0.9449615478515625, 0.979888916015625, 1.0148162841796875, 1.04974365234375, 1.0846710205078125, 1.119598388671875, 1.1545257568359375, 1.189453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 12.0, 19.0, 15.0, 22.0, 17.0, 30.0, 48.0, 39.0, 46.0, 56.0, 65.0, 52.0, 68.0, 47.0, 70.0, 41.0, 46.0, 56.0, 46.0, 37.0, 23.0, 24.0, 20.0, 19.0, 8.0, 11.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5738677978515625, -0.551544189453125, -0.5292205810546875, -0.50689697265625, -0.4845733642578125, -0.462249755859375, -0.4399261474609375, -0.4176025390625, -0.3952789306640625, -0.372955322265625, -0.3506317138671875, -0.32830810546875, -0.3059844970703125, -0.283660888671875, -0.2613372802734375, -0.239013671875, -0.2166900634765625, -0.194366455078125, -0.1720428466796875, -0.14971923828125, -0.1273956298828125, -0.105072021484375, -0.0827484130859375, -0.0604248046875, -0.0381011962890625, -0.015777587890625, 0.0065460205078125, 0.02886962890625, 0.0511932373046875, 0.073516845703125, 0.0958404541015625, 0.1181640625, 0.1404876708984375, 0.162811279296875, 0.1851348876953125, 0.20745849609375, 0.2297821044921875, 0.252105712890625, 0.2744293212890625, 0.2967529296875, 0.3190765380859375, 0.341400146484375, 0.3637237548828125, 0.38604736328125, 0.4083709716796875, 0.430694580078125, 0.4530181884765625, 0.475341796875, 0.4976654052734375, 0.519989013671875, 0.5423126220703125, 0.56463623046875, 0.5869598388671875, 0.609283447265625, 0.6316070556640625, 0.6539306640625, 0.6762542724609375, 0.698577880859375, 0.7209014892578125, 0.74322509765625, 0.7655487060546875, 0.787872314453125, 0.8101959228515625, 0.83251953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 8.0, 6.0, 13.0, 14.0, 16.0, 25.0, 30.0, 55.0, 77.0, 124.0, 264.0, 533.0, 1279.0, 3447.0, 11802.0, 53972.0, 369240.0, 510117.0, 75347.0, 15004.0, 4314.0, 1493.0, 620.0, 285.0, 144.0, 100.0, 65.0, 45.0, 34.0, 29.0, 11.0, 15.0, 5.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.578125, -2.5066986083984375, -2.435272216796875, -2.3638458251953125, -2.29241943359375, -2.2209930419921875, -2.149566650390625, -2.0781402587890625, -2.0067138671875, -1.9352874755859375, -1.863861083984375, -1.7924346923828125, -1.72100830078125, -1.6495819091796875, -1.578155517578125, -1.5067291259765625, -1.435302734375, -1.3638763427734375, -1.292449951171875, -1.2210235595703125, -1.14959716796875, -1.0781707763671875, -1.006744384765625, -0.9353179931640625, -0.8638916015625, -0.7924652099609375, -0.721038818359375, -0.6496124267578125, -0.57818603515625, -0.5067596435546875, -0.435333251953125, -0.3639068603515625, -0.29248046875, -0.2210540771484375, -0.149627685546875, -0.0782012939453125, -0.00677490234375, 0.0646514892578125, 0.136077880859375, 0.2075042724609375, 0.2789306640625, 0.3503570556640625, 0.421783447265625, 0.4932098388671875, 0.56463623046875, 0.6360626220703125, 0.707489013671875, 0.7789154052734375, 0.850341796875, 0.9217681884765625, 0.993194580078125, 1.0646209716796875, 1.13604736328125, 1.2074737548828125, 1.278900146484375, 1.3503265380859375, 1.4217529296875, 1.4931793212890625, 1.564605712890625, 1.6360321044921875, 1.70745849609375, 1.7788848876953125, 1.850311279296875, 1.9217376708984375, 1.9931640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 5.0, 5.0, 6.0, 5.0, 18.0, 10.0, 18.0, 27.0, 30.0, 14.0, 21.0, 37.0, 38.0, 36.0, 47.0, 52.0, 47.0, 48.0, 64.0, 58.0, 57.0, 43.0, 41.0, 47.0, 39.0, 33.0, 24.0, 31.0, 17.0, 19.0, 10.0, 13.0, 6.0, 5.0, 9.0, 2.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08203125, -2.985107421875, -2.88818359375, -2.791259765625, -2.6943359375, -2.597412109375, -2.50048828125, -2.403564453125, -2.306640625, -2.209716796875, -2.11279296875, -2.015869140625, -1.9189453125, -1.822021484375, -1.72509765625, -1.628173828125, -1.53125, -1.434326171875, -1.33740234375, -1.240478515625, -1.1435546875, -1.046630859375, -0.94970703125, -0.852783203125, -0.755859375, -0.658935546875, -0.56201171875, -0.465087890625, -0.3681640625, -0.271240234375, -0.17431640625, -0.077392578125, 0.01953125, 0.116455078125, 0.21337890625, 0.310302734375, 0.4072265625, 0.504150390625, 0.60107421875, 0.697998046875, 0.794921875, 0.891845703125, 0.98876953125, 1.085693359375, 1.1826171875, 1.279541015625, 1.37646484375, 1.473388671875, 1.5703125, 1.667236328125, 1.76416015625, 1.861083984375, 1.9580078125, 2.054931640625, 2.15185546875, 2.248779296875, 2.345703125, 2.442626953125, 2.53955078125, 2.636474609375, 2.7333984375, 2.830322265625, 2.92724609375, 3.024169921875, 3.12109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 7.0, 15.0, 17.0, 30.0, 50.0, 78.0, 128.0, 189.0, 400.0, 859.0, 2678.0, 13161.0, 253839.0, 740050.0, 30250.0, 4371.0, 1270.0, 501.0, 271.0, 130.0, 78.0, 59.0, 38.0, 14.0, 14.0, 4.0, 12.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1953125, -2.136260986328125, -2.07720947265625, -2.018157958984375, -1.9591064453125, -1.900054931640625, -1.84100341796875, -1.781951904296875, -1.722900390625, -1.663848876953125, -1.60479736328125, -1.545745849609375, -1.4866943359375, -1.427642822265625, -1.36859130859375, -1.309539794921875, -1.25048828125, -1.191436767578125, -1.13238525390625, -1.073333740234375, -1.0142822265625, -0.955230712890625, -0.89617919921875, -0.837127685546875, -0.778076171875, -0.719024658203125, -0.65997314453125, -0.600921630859375, -0.5418701171875, -0.482818603515625, -0.42376708984375, -0.364715576171875, -0.3056640625, -0.246612548828125, -0.18756103515625, -0.128509521484375, -0.0694580078125, -0.010406494140625, 0.04864501953125, 0.107696533203125, 0.166748046875, 0.225799560546875, 0.28485107421875, 0.343902587890625, 0.4029541015625, 0.462005615234375, 0.52105712890625, 0.580108642578125, 0.63916015625, 0.698211669921875, 0.75726318359375, 0.816314697265625, 0.8753662109375, 0.934417724609375, 0.99346923828125, 1.052520751953125, 1.111572265625, 1.170623779296875, 1.22967529296875, 1.288726806640625, 1.3477783203125, 1.406829833984375, 1.46588134765625, 1.524932861328125, 1.583984375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 5.0, 10.0, 10.0, 16.0, 20.0, 30.0, 43.0, 64.0, 81.0, 122.0, 129.0, 114.0, 104.0, 81.0, 49.0, 35.0, 31.0, 10.0, 19.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010776519775390625, -0.00010203570127487183, -9.63062047958374e-05, -9.057670831680298e-05, -8.484721183776855e-05, -7.911771535873413e-05, -7.338821887969971e-05, -6.765872240066528e-05, -6.192922592163086e-05, -5.6199729442596436e-05, -5.047023296356201e-05, -4.474073648452759e-05, -3.9011240005493164e-05, -3.328174352645874e-05, -2.7552247047424316e-05, -2.1822750568389893e-05, -1.609325408935547e-05, -1.0363757610321045e-05, -4.634261131286621e-06, 1.0952353477478027e-06, 6.8247318267822266e-06, 1.255422830581665e-05, 1.8283724784851074e-05, 2.4013221263885498e-05, 2.9742717742919922e-05, 3.5472214221954346e-05, 4.120171070098877e-05, 4.693120718002319e-05, 5.266070365905762e-05, 5.839020013809204e-05, 6.411969661712646e-05, 6.984919309616089e-05, 7.557868957519531e-05, 8.130818605422974e-05, 8.703768253326416e-05, 9.276717901229858e-05, 9.849667549133301e-05, 0.00010422617197036743, 0.00010995566844940186, 0.00011568516492843628, 0.0001214146614074707, 0.00012714415788650513, 0.00013287365436553955, 0.00013860315084457397, 0.0001443326473236084, 0.00015006214380264282, 0.00015579164028167725, 0.00016152113676071167, 0.0001672506332397461, 0.00017298012971878052, 0.00017870962619781494, 0.00018443912267684937, 0.0001901686191558838, 0.0001958981156349182, 0.00020162761211395264, 0.00020735710859298706, 0.00021308660507202148, 0.0002188161015510559, 0.00022454559803009033, 0.00023027509450912476, 0.00023600459098815918, 0.0002417340874671936, 0.00024746358394622803, 0.00025319308042526245, 0.0002589225769042969]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 14.0, 14.0, 38.0, 60.0, 86.0, 168.0, 357.0, 915.0, 2893.0, 18212.0, 416652.0, 580126.0, 23629.0, 3486.0, 1033.0, 405.0, 197.0, 95.0, 69.0, 31.0, 25.0, 16.0, 7.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4964447021484375, -1.441131591796875, -1.3858184814453125, -1.33050537109375, -1.2751922607421875, -1.219879150390625, -1.1645660400390625, -1.1092529296875, -1.0539398193359375, -0.998626708984375, -0.9433135986328125, -0.88800048828125, -0.8326873779296875, -0.777374267578125, -0.7220611572265625, -0.666748046875, -0.6114349365234375, -0.556121826171875, -0.5008087158203125, -0.44549560546875, -0.3901824951171875, -0.334869384765625, -0.2795562744140625, -0.2242431640625, -0.1689300537109375, -0.113616943359375, -0.0583038330078125, -0.00299072265625, 0.0523223876953125, 0.107635498046875, 0.1629486083984375, 0.21826171875, 0.2735748291015625, 0.328887939453125, 0.3842010498046875, 0.43951416015625, 0.4948272705078125, 0.550140380859375, 0.6054534912109375, 0.6607666015625, 0.7160797119140625, 0.771392822265625, 0.8267059326171875, 0.88201904296875, 0.9373321533203125, 0.992645263671875, 1.0479583740234375, 1.103271484375, 1.1585845947265625, 1.213897705078125, 1.2692108154296875, 1.32452392578125, 1.3798370361328125, 1.435150146484375, 1.4904632568359375, 1.5457763671875, 1.6010894775390625, 1.656402587890625, 1.7117156982421875, 1.76702880859375, 1.8223419189453125, 1.877655029296875, 1.9329681396484375, 1.98828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 12.0, 19.0, 31.0, 48.0, 69.0, 83.0, 134.0, 122.0, 120.0, 108.0, 82.0, 54.0, 38.0, 24.0, 12.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.5359649658203125, -1.491851806640625, -1.4477386474609375, -1.40362548828125, -1.3595123291015625, -1.315399169921875, -1.2712860107421875, -1.2271728515625, -1.1830596923828125, -1.138946533203125, -1.0948333740234375, -1.05072021484375, -1.0066070556640625, -0.962493896484375, -0.9183807373046875, -0.874267578125, -0.8301544189453125, -0.786041259765625, -0.7419281005859375, -0.69781494140625, -0.6537017822265625, -0.609588623046875, -0.5654754638671875, -0.5213623046875, -0.4772491455078125, -0.433135986328125, -0.3890228271484375, -0.34490966796875, -0.3007965087890625, -0.256683349609375, -0.2125701904296875, -0.16845703125, -0.1243438720703125, -0.080230712890625, -0.0361175537109375, 0.00799560546875, 0.0521087646484375, 0.096221923828125, 0.1403350830078125, 0.1844482421875, 0.2285614013671875, 0.272674560546875, 0.3167877197265625, 0.36090087890625, 0.4050140380859375, 0.449127197265625, 0.4932403564453125, 0.537353515625, 0.5814666748046875, 0.625579833984375, 0.6696929931640625, 0.71380615234375, 0.7579193115234375, 0.802032470703125, 0.8461456298828125, 0.8902587890625, 0.9343719482421875, 0.978485107421875, 1.0225982666015625, 1.06671142578125, 1.1108245849609375, 1.154937744140625, 1.1990509033203125, 1.2431640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 26.0, 44.0, 77.0, 92.0, 131.0, 142.0, 138.0, 118.0, 78.0, 54.0, 28.0, 24.0, 12.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.407135009765625, -16.81833839416504, -16.229541778564453, -15.64074420928955, -15.051946640014648, -14.463150024414062, -13.874353408813477, -13.28555679321289, -12.696759223937988, -12.107962608337402, -11.5191650390625, -10.930368423461914, -10.341571807861328, -9.752774238586426, -9.16397762298584, -8.575180053710938, -7.986383438110352, -7.397586345672607, -6.808789253234863, -6.219992637634277, -5.631195545196533, -5.042398452758789, -4.453601837158203, -3.864804744720459, -3.276007652282715, -2.6872105598449707, -2.0984137058258057, -1.509616732597351, -0.9208197593688965, -0.33202266693115234, 0.2567741870880127, 0.8455710411071777, 1.4343681335449219, 2.023165225982666, 2.611962080001831, 3.200758934020996, 3.7895560264587402, 4.378353118896484, 4.96714973449707, 5.5559468269348145, 6.144743919372559, 6.733541011810303, 7.322338104248047, 7.911134719848633, 8.499931335449219, 9.088728904724121, 9.677525520324707, 10.26632308959961, 10.855119705200195, 11.443916320800781, 12.032713890075684, 12.62151050567627, 13.210308074951172, 13.799104690551758, 14.387901306152344, 14.97669792175293, 15.565495491027832, 16.154293060302734, 16.74308967590332, 17.331886291503906, 17.920682907104492, 18.509479522705078, 19.098278045654297, 19.687074661254883, 20.27587127685547]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 10.0, 13.0, 20.0, 17.0, 18.0, 23.0, 23.0, 39.0, 52.0, 37.0, 44.0, 56.0, 51.0, 56.0, 48.0, 50.0, 49.0, 50.0, 44.0, 40.0, 40.0, 32.0, 30.0, 19.0, 23.0, 14.0, 25.0, 19.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.589033126831055, -15.140758514404297, -14.692483901977539, -14.244209289550781, -13.795934677124023, -13.347660064697266, -12.899386405944824, -12.451111793518066, -12.002837181091309, -11.55456256866455, -11.106287956237793, -10.658013343811035, -10.209739685058594, -9.761465072631836, -9.313190460205078, -8.86491584777832, -8.416641235351562, -7.968366622924805, -7.520092010498047, -7.071817874908447, -6.6235432624816895, -6.175268650054932, -5.726994514465332, -5.278719902038574, -4.830445289611816, -4.382170677185059, -3.93389630317688, -3.485621929168701, -3.0373473167419434, -2.5890727043151855, -2.140798330307007, -1.6925239562988281, -1.2442502975463867, -0.7959758043289185, -0.3477013111114502, 0.10057318210601807, 0.5488476753234863, 0.9971222877502441, 1.4453966617584229, 1.8936710357666016, 2.3419456481933594, 2.790220260620117, 3.238494634628296, 3.6867690086364746, 4.135043621063232, 4.58331823348999, 5.03159236907959, 5.479866981506348, 5.9281415939331055, 6.376416206359863, 6.824690818786621, 7.272964954376221, 7.7212395668029785, 8.169513702392578, 8.617788314819336, 9.066062927246094, 9.514337539672852, 9.96261215209961, 10.410886764526367, 10.859161376953125, 11.307435989379883, 11.75571060180664, 12.203984260559082, 12.65225887298584, 13.100533485412598]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 4.0, 5.0, 8.0, 19.0, 21.0, 25.0, 51.0, 61.0, 74.0, 114.0, 160.0, 260.0, 389.0, 589.0, 1087.0, 2238.0, 5621.0, 18598.0, 3975729.0, 163295.0, 16165.0, 5013.0, 2116.0, 1008.0, 584.0, 341.0, 238.0, 124.0, 90.0, 70.0, 39.0, 37.0, 23.0, 17.0, 13.0, 16.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.5390625, -2.468414306640625, -2.39776611328125, -2.327117919921875, -2.2564697265625, -2.185821533203125, -2.11517333984375, -2.044525146484375, -1.973876953125, -1.903228759765625, -1.83258056640625, -1.761932373046875, -1.6912841796875, -1.620635986328125, -1.54998779296875, -1.479339599609375, -1.40869140625, -1.338043212890625, -1.26739501953125, -1.196746826171875, -1.1260986328125, -1.055450439453125, -0.98480224609375, -0.914154052734375, -0.843505859375, -0.772857666015625, -0.70220947265625, -0.631561279296875, -0.5609130859375, -0.490264892578125, -0.41961669921875, -0.348968505859375, -0.2783203125, -0.207672119140625, -0.13702392578125, -0.066375732421875, 0.0042724609375, 0.074920654296875, 0.14556884765625, 0.216217041015625, 0.286865234375, 0.357513427734375, 0.42816162109375, 0.498809814453125, 0.5694580078125, 0.640106201171875, 0.71075439453125, 0.781402587890625, 0.85205078125, 0.922698974609375, 0.99334716796875, 1.063995361328125, 1.1346435546875, 1.205291748046875, 1.27593994140625, 1.346588134765625, 1.417236328125, 1.487884521484375, 1.55853271484375, 1.629180908203125, 1.6998291015625, 1.770477294921875, 1.84112548828125, 1.911773681640625, 1.982421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 5.0, 0.0, 2.0, 9.0, 7.0, 8.0, 14.0, 24.0, 19.0, 34.0, 18.0, 44.0, 39.0, 47.0, 53.0, 76.0, 63.0, 60.0, 69.0, 61.0, 51.0, 51.0, 52.0, 29.0, 28.0, 29.0, 22.0, 12.0, 24.0, 13.0, 11.0, 7.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74462890625, -0.7203369140625, -0.696044921875, -0.6717529296875, -0.6474609375, -0.6231689453125, -0.598876953125, -0.5745849609375, -0.55029296875, -0.5260009765625, -0.501708984375, -0.4774169921875, -0.453125, -0.4288330078125, -0.404541015625, -0.3802490234375, -0.35595703125, -0.3316650390625, -0.307373046875, -0.2830810546875, -0.2587890625, -0.2344970703125, -0.210205078125, -0.1859130859375, -0.16162109375, -0.1373291015625, -0.113037109375, -0.0887451171875, -0.064453125, -0.0401611328125, -0.015869140625, 0.0084228515625, 0.03271484375, 0.0570068359375, 0.081298828125, 0.1055908203125, 0.1298828125, 0.1541748046875, 0.178466796875, 0.2027587890625, 0.22705078125, 0.2513427734375, 0.275634765625, 0.2999267578125, 0.32421875, 0.3485107421875, 0.372802734375, 0.3970947265625, 0.42138671875, 0.4456787109375, 0.469970703125, 0.4942626953125, 0.5185546875, 0.5428466796875, 0.567138671875, 0.5914306640625, 0.61572265625, 0.6400146484375, 0.664306640625, 0.6885986328125, 0.712890625, 0.7371826171875, 0.761474609375, 0.7857666015625, 0.81005859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 1.0, 4.0, 6.0, 5.0, 23.0, 20.0, 32.0, 47.0, 82.0, 120.0, 181.0, 290.0, 468.0, 845.0, 1463.0, 2771.0, 6274.0, 17697.0, 104771.0, 4005764.0, 34555.0, 9923.0, 4131.0, 2040.0, 1094.0, 568.0, 422.0, 215.0, 159.0, 83.0, 72.0, 45.0, 38.0, 23.0, 15.0, 6.0, 7.0, 10.0, 3.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.130859375, -2.055419921875, -1.97998046875, -1.904541015625, -1.8291015625, -1.753662109375, -1.67822265625, -1.602783203125, -1.52734375, -1.451904296875, -1.37646484375, -1.301025390625, -1.2255859375, -1.150146484375, -1.07470703125, -0.999267578125, -0.923828125, -0.848388671875, -0.77294921875, -0.697509765625, -0.6220703125, -0.546630859375, -0.47119140625, -0.395751953125, -0.3203125, -0.244873046875, -0.16943359375, -0.093994140625, -0.0185546875, 0.056884765625, 0.13232421875, 0.207763671875, 0.283203125, 0.358642578125, 0.43408203125, 0.509521484375, 0.5849609375, 0.660400390625, 0.73583984375, 0.811279296875, 0.88671875, 0.962158203125, 1.03759765625, 1.113037109375, 1.1884765625, 1.263916015625, 1.33935546875, 1.414794921875, 1.490234375, 1.565673828125, 1.64111328125, 1.716552734375, 1.7919921875, 1.867431640625, 1.94287109375, 2.018310546875, 2.09375, 2.169189453125, 2.24462890625, 2.320068359375, 2.3955078125, 2.470947265625, 2.54638671875, 2.621826171875, 2.697265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 14.0, 23.0, 15.0, 40.0, 106.0, 3585.0, 133.0, 46.0, 29.0, 13.0, 11.0, 5.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.6606521606445312, -0.6430816650390625, -0.6255111694335938, -0.607940673828125, -0.5903701782226562, -0.5727996826171875, -0.5552291870117188, -0.53765869140625, -0.5200881958007812, -0.5025177001953125, -0.48494720458984375, -0.467376708984375, -0.44980621337890625, -0.4322357177734375, -0.41466522216796875, -0.3970947265625, -0.37952423095703125, -0.3619537353515625, -0.34438323974609375, -0.326812744140625, -0.30924224853515625, -0.2916717529296875, -0.27410125732421875, -0.25653076171875, -0.23896026611328125, -0.2213897705078125, -0.20381927490234375, -0.186248779296875, -0.16867828369140625, -0.1511077880859375, -0.13353729248046875, -0.115966796875, -0.09839630126953125, -0.0808258056640625, -0.06325531005859375, -0.045684814453125, -0.02811431884765625, -0.0105438232421875, 0.00702667236328125, 0.02459716796875, 0.04216766357421875, 0.0597381591796875, 0.07730865478515625, 0.094879150390625, 0.11244964599609375, 0.1300201416015625, 0.14759063720703125, 0.1651611328125, 0.18273162841796875, 0.2003021240234375, 0.21787261962890625, 0.235443115234375, 0.25301361083984375, 0.2705841064453125, 0.28815460205078125, 0.30572509765625, 0.32329559326171875, 0.3408660888671875, 0.35843658447265625, 0.376007080078125, 0.39357757568359375, 0.4111480712890625, 0.42871856689453125, 0.4462890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 11.0, 20.0, 85.0, 280.0, 410.0, 174.0, 26.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.367841720581055, -10.129673957824707, -9.89150619506836, -9.653338432312012, -9.415170669555664, -9.177002906799316, -8.938835144042969, -8.700667381286621, -8.462499618530273, -8.224331855773926, -7.986164093017578, -7.7479963302612305, -7.509828567504883, -7.271660804748535, -7.0334930419921875, -6.79532527923584, -6.557157516479492, -6.3189897537231445, -6.080821990966797, -5.842654228210449, -5.604486465454102, -5.366318702697754, -5.128150939941406, -4.889983177185059, -4.651815414428711, -4.413647651672363, -4.175479888916016, -3.937312126159668, -3.6991443634033203, -3.4609766006469727, -3.222808837890625, -2.9846410751342773, -2.7464733123779297, -2.508305549621582, -2.2701377868652344, -2.0319700241088867, -1.793802261352539, -1.5556344985961914, -1.3174667358398438, -1.079298973083496, -0.8411312103271484, -0.6029634475708008, -0.3647956848144531, -0.12662792205810547, 0.11153984069824219, 0.34970760345458984, 0.5878753662109375, 0.8260431289672852, 1.0642108917236328, 1.3023786544799805, 1.5405464172363281, 1.7787141799926758, 2.0168819427490234, 2.255049705505371, 2.4932174682617188, 2.7313852310180664, 2.969552993774414, 3.2077207565307617, 3.4458885192871094, 3.684056282043457, 3.9222240447998047, 4.160391807556152, 4.3985595703125, 4.636727333068848, 4.874895095825195]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 5.0, 8.0, 11.0, 11.0, 10.0, 20.0, 26.0, 21.0, 13.0, 28.0, 27.0, 43.0, 38.0, 36.0, 34.0, 39.0, 34.0, 43.0, 22.0, 27.0, 34.0, 46.0, 40.0, 34.0, 33.0, 34.0, 30.0, 33.0, 36.0, 31.0, 14.0, 18.0, 13.0, 12.0, 9.0, 21.0, 11.0, 8.0, 4.0, 2.0, 6.0, 3.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0931146144866943, -1.0551148653030396, -1.0171151161193848, -0.97911536693573, -0.9411156177520752, -0.9031158685684204, -0.8651160597801208, -0.8271163105964661, -0.7891165614128113, -0.7511168122291565, -0.7131170630455017, -0.6751173138618469, -0.6371175050735474, -0.5991177558898926, -0.5611180067062378, -0.523118257522583, -0.4851185083389282, -0.44711875915527344, -0.40911900997161865, -0.3711192309856415, -0.3331194818019867, -0.2951197326183319, -0.25711995363235474, -0.21912020444869995, -0.18112045526504517, -0.14312070608139038, -0.1051209419965744, -0.06712118536233902, -0.029121428728103638, 0.008878320455551147, 0.046878084540367126, 0.0848778486251831, 0.12287759780883789, 0.16087734699249268, 0.19887711107730865, 0.23687687516212463, 0.2748766243457794, 0.3128763735294342, 0.3508761525154114, 0.38887590169906616, 0.42687565088272095, 0.46487540006637573, 0.5028751492500305, 0.5408748984336853, 0.5788747072219849, 0.6168744564056396, 0.6548742055892944, 0.6928739547729492, 0.730873703956604, 0.7688734531402588, 0.8068732023239136, 0.8448729515075684, 0.8828727006912231, 0.9208724498748779, 0.9588722586631775, 0.9968720078468323, 1.0348718166351318, 1.0728715658187866, 1.1108713150024414, 1.1488710641860962, 1.186870813369751, 1.2248705625534058, 1.2628703117370605, 1.3008701801300049, 1.3388698101043701]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 8.0, 17.0, 25.0, 23.0, 39.0, 46.0, 79.0, 87.0, 164.0, 269.0, 347.0, 499.0, 818.0, 1216.0, 1998.0, 3242.0, 5658.0, 9784.0, 17909.0, 35538.0, 71024.0, 145155.0, 252231.0, 238697.0, 129708.0, 63143.0, 31819.0, 16381.0, 9023.0, 5204.0, 3102.0, 1848.0, 1188.0, 762.0, 507.0, 339.0, 214.0, 145.0, 86.0, 67.0, 44.0, 28.0, 25.0, 14.0, 10.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9423828125, -0.91375732421875, -0.8851318359375, -0.85650634765625, -0.827880859375, -0.79925537109375, -0.7706298828125, -0.74200439453125, -0.71337890625, -0.68475341796875, -0.6561279296875, -0.62750244140625, -0.598876953125, -0.57025146484375, -0.5416259765625, -0.51300048828125, -0.484375, -0.45574951171875, -0.4271240234375, -0.39849853515625, -0.369873046875, -0.34124755859375, -0.3126220703125, -0.28399658203125, -0.25537109375, -0.22674560546875, -0.1981201171875, -0.16949462890625, -0.140869140625, -0.11224365234375, -0.0836181640625, -0.05499267578125, -0.0263671875, 0.00225830078125, 0.0308837890625, 0.05950927734375, 0.088134765625, 0.11676025390625, 0.1453857421875, 0.17401123046875, 0.20263671875, 0.23126220703125, 0.2598876953125, 0.28851318359375, 0.317138671875, 0.34576416015625, 0.3743896484375, 0.40301513671875, 0.431640625, 0.46026611328125, 0.4888916015625, 0.51751708984375, 0.546142578125, 0.57476806640625, 0.6033935546875, 0.63201904296875, 0.66064453125, 0.68927001953125, 0.7178955078125, 0.74652099609375, 0.775146484375, 0.80377197265625, 0.8323974609375, 0.86102294921875, 0.8896484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 12.0, 19.0, 23.0, 32.0, 29.0, 25.0, 36.0, 30.0, 41.0, 62.0, 52.0, 49.0, 66.0, 61.0, 57.0, 58.0, 42.0, 44.0, 44.0, 33.0, 22.0, 28.0, 17.0, 17.0, 12.0, 10.0, 12.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6673049926757812, -0.6441802978515625, -0.6210556030273438, -0.597930908203125, -0.5748062133789062, -0.5516815185546875, -0.5285568237304688, -0.50543212890625, -0.48230743408203125, -0.4591827392578125, -0.43605804443359375, -0.412933349609375, -0.38980865478515625, -0.3666839599609375, -0.34355926513671875, -0.3204345703125, -0.29730987548828125, -0.2741851806640625, -0.25106048583984375, -0.227935791015625, -0.20481109619140625, -0.1816864013671875, -0.15856170654296875, -0.13543701171875, -0.11231231689453125, -0.0891876220703125, -0.06606292724609375, -0.042938232421875, -0.01981353759765625, 0.0033111572265625, 0.02643585205078125, 0.049560546875, 0.07268524169921875, 0.0958099365234375, 0.11893463134765625, 0.142059326171875, 0.16518402099609375, 0.1883087158203125, 0.21143341064453125, 0.23455810546875, 0.25768280029296875, 0.2808074951171875, 0.30393218994140625, 0.327056884765625, 0.35018157958984375, 0.3733062744140625, 0.39643096923828125, 0.4195556640625, 0.44268035888671875, 0.4658050537109375, 0.48892974853515625, 0.512054443359375, 0.5351791381835938, 0.5583038330078125, 0.5814285278320312, 0.60455322265625, 0.6276779174804688, 0.6508026123046875, 0.6739273071289062, 0.697052001953125, 0.7201766967773438, 0.7433013916015625, 0.7664260864257812, 0.78955078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 8.0, 8.0, 15.0, 20.0, 33.0, 37.0, 55.0, 95.0, 133.0, 291.0, 696.0, 1882.0, 6777.0, 37440.0, 360779.0, 569096.0, 57648.0, 9471.0, 2423.0, 852.0, 347.0, 175.0, 81.0, 62.0, 38.0, 23.0, 15.0, 11.0, 5.0, 10.0, 8.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.357421875, -3.273712158203125, -3.19000244140625, -3.106292724609375, -3.0225830078125, -2.938873291015625, -2.85516357421875, -2.771453857421875, -2.687744140625, -2.604034423828125, -2.52032470703125, -2.436614990234375, -2.3529052734375, -2.269195556640625, -2.18548583984375, -2.101776123046875, -2.01806640625, -1.934356689453125, -1.85064697265625, -1.766937255859375, -1.6832275390625, -1.599517822265625, -1.51580810546875, -1.432098388671875, -1.348388671875, -1.264678955078125, -1.18096923828125, -1.097259521484375, -1.0135498046875, -0.929840087890625, -0.84613037109375, -0.762420654296875, -0.6787109375, -0.595001220703125, -0.51129150390625, -0.427581787109375, -0.3438720703125, -0.260162353515625, -0.17645263671875, -0.092742919921875, -0.009033203125, 0.074676513671875, 0.15838623046875, 0.242095947265625, 0.3258056640625, 0.409515380859375, 0.49322509765625, 0.576934814453125, 0.66064453125, 0.744354248046875, 0.82806396484375, 0.911773681640625, 0.9954833984375, 1.079193115234375, 1.16290283203125, 1.246612548828125, 1.330322265625, 1.414031982421875, 1.49774169921875, 1.581451416015625, 1.6651611328125, 1.748870849609375, 1.83258056640625, 1.916290283203125, 2.0]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 9.0, 15.0, 11.0, 19.0, 12.0, 18.0, 37.0, 22.0, 40.0, 34.0, 40.0, 42.0, 56.0, 36.0, 46.0, 45.0, 42.0, 50.0, 42.0, 58.0, 36.0, 38.0, 33.0, 36.0, 30.0, 23.0, 21.0, 25.0, 21.0, 8.0, 14.0, 6.0, 3.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.16796875, -3.070159912109375, -2.97235107421875, -2.874542236328125, -2.7767333984375, -2.678924560546875, -2.58111572265625, -2.483306884765625, -2.385498046875, -2.287689208984375, -2.18988037109375, -2.092071533203125, -1.9942626953125, -1.896453857421875, -1.79864501953125, -1.700836181640625, -1.60302734375, -1.505218505859375, -1.40740966796875, -1.309600830078125, -1.2117919921875, -1.113983154296875, -1.01617431640625, -0.918365478515625, -0.820556640625, -0.722747802734375, -0.62493896484375, -0.527130126953125, -0.4293212890625, -0.331512451171875, -0.23370361328125, -0.135894775390625, -0.0380859375, 0.059722900390625, 0.15753173828125, 0.255340576171875, 0.3531494140625, 0.450958251953125, 0.54876708984375, 0.646575927734375, 0.744384765625, 0.842193603515625, 0.94000244140625, 1.037811279296875, 1.1356201171875, 1.233428955078125, 1.33123779296875, 1.429046630859375, 1.52685546875, 1.624664306640625, 1.72247314453125, 1.820281982421875, 1.9180908203125, 2.015899658203125, 2.11370849609375, 2.211517333984375, 2.309326171875, 2.407135009765625, 2.50494384765625, 2.602752685546875, 2.7005615234375, 2.798370361328125, 2.89617919921875, 2.993988037109375, 3.091796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 14.0, 22.0, 31.0, 56.0, 107.0, 215.0, 523.0, 1537.0, 7789.0, 197731.0, 819236.0, 17431.0, 2519.0, 726.0, 290.0, 146.0, 60.0, 33.0, 19.0, 13.0, 9.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.274688720703125, -2.20172119140625, -2.128753662109375, -2.0557861328125, -1.982818603515625, -1.90985107421875, -1.836883544921875, -1.763916015625, -1.690948486328125, -1.61798095703125, -1.545013427734375, -1.4720458984375, -1.399078369140625, -1.32611083984375, -1.253143310546875, -1.18017578125, -1.107208251953125, -1.03424072265625, -0.961273193359375, -0.8883056640625, -0.815338134765625, -0.74237060546875, -0.669403076171875, -0.596435546875, -0.523468017578125, -0.45050048828125, -0.377532958984375, -0.3045654296875, -0.231597900390625, -0.15863037109375, -0.085662841796875, -0.0126953125, 0.060272216796875, 0.13323974609375, 0.206207275390625, 0.2791748046875, 0.352142333984375, 0.42510986328125, 0.498077392578125, 0.571044921875, 0.644012451171875, 0.71697998046875, 0.789947509765625, 0.8629150390625, 0.935882568359375, 1.00885009765625, 1.081817626953125, 1.15478515625, 1.227752685546875, 1.30072021484375, 1.373687744140625, 1.4466552734375, 1.519622802734375, 1.59259033203125, 1.665557861328125, 1.738525390625, 1.811492919921875, 1.88446044921875, 1.957427978515625, 2.0303955078125, 2.103363037109375, 2.17633056640625, 2.249298095703125, 2.322265625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 10.0, 10.0, 15.0, 17.0, 22.0, 39.0, 45.0, 55.0, 79.0, 109.0, 94.0, 84.0, 100.0, 68.0, 66.0, 52.0, 27.0, 33.0, 19.0, 17.0, 4.0, 5.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017690658569335938, -0.00017259083688259125, -0.00016827508807182312, -0.000163959339261055, -0.00015964359045028687, -0.00015532784163951874, -0.0001510120928287506, -0.00014669634401798248, -0.00014238059520721436, -0.00013806484639644623, -0.0001337490975856781, -0.00012943334877490997, -0.00012511759996414185, -0.00012080185115337372, -0.00011648610234260559, -0.00011217035353183746, -0.00010785460472106934, -0.00010353885591030121, -9.922310709953308e-05, -9.490735828876495e-05, -9.059160947799683e-05, -8.62758606672287e-05, -8.196011185646057e-05, -7.764436304569244e-05, -7.332861423492432e-05, -6.901286542415619e-05, -6.469711661338806e-05, -6.0381367802619934e-05, -5.606561899185181e-05, -5.174987018108368e-05, -4.743412137031555e-05, -4.3118372559547424e-05, -3.88026237487793e-05, -3.448687493801117e-05, -3.0171126127243042e-05, -2.5855377316474915e-05, -2.1539628505706787e-05, -1.722387969493866e-05, -1.2908130884170532e-05, -8.592382073402405e-06, -4.276633262634277e-06, 3.91155481338501e-08, 4.3548643589019775e-06, 8.670613169670105e-06, 1.2986361980438232e-05, 1.730211079120636e-05, 2.1617859601974487e-05, 2.5933608412742615e-05, 3.0249357223510742e-05, 3.456510603427887e-05, 3.8880854845047e-05, 4.3196603655815125e-05, 4.751235246658325e-05, 5.182810127735138e-05, 5.614385008811951e-05, 6.0459598898887634e-05, 6.477534770965576e-05, 6.909109652042389e-05, 7.340684533119202e-05, 7.772259414196014e-05, 8.203834295272827e-05, 8.63540917634964e-05, 9.066984057426453e-05, 9.498558938503265e-05, 9.930133819580078e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 4.0, 13.0, 17.0, 22.0, 37.0, 32.0, 45.0, 89.0, 185.0, 337.0, 670.0, 1550.0, 4000.0, 16952.0, 240845.0, 732671.0, 40169.0, 6775.0, 2174.0, 892.0, 455.0, 259.0, 125.0, 69.0, 50.0, 32.0, 33.0, 21.0, 11.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.794921875, -1.7479400634765625, -1.700958251953125, -1.6539764404296875, -1.60699462890625, -1.5600128173828125, -1.513031005859375, -1.4660491943359375, -1.4190673828125, -1.3720855712890625, -1.325103759765625, -1.2781219482421875, -1.23114013671875, -1.1841583251953125, -1.137176513671875, -1.0901947021484375, -1.043212890625, -0.9962310791015625, -0.949249267578125, -0.9022674560546875, -0.85528564453125, -0.8083038330078125, -0.761322021484375, -0.7143402099609375, -0.6673583984375, -0.6203765869140625, -0.573394775390625, -0.5264129638671875, -0.47943115234375, -0.4324493408203125, -0.385467529296875, -0.3384857177734375, -0.29150390625, -0.2445220947265625, -0.197540283203125, -0.1505584716796875, -0.10357666015625, -0.0565948486328125, -0.009613037109375, 0.0373687744140625, 0.0843505859375, 0.1313323974609375, 0.178314208984375, 0.2252960205078125, 0.27227783203125, 0.3192596435546875, 0.366241455078125, 0.4132232666015625, 0.460205078125, 0.5071868896484375, 0.554168701171875, 0.6011505126953125, 0.64813232421875, 0.6951141357421875, 0.742095947265625, 0.7890777587890625, 0.8360595703125, 0.8830413818359375, 0.930023193359375, 0.9770050048828125, 1.02398681640625, 1.0709686279296875, 1.117950439453125, 1.1649322509765625, 1.2119140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 22.0, 47.0, 112.0, 239.0, 223.0, 190.0, 64.0, 36.0, 21.0, 7.0, 1.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.0908355712890625, -3.994171142578125, -3.8975067138671875, -3.80084228515625, -3.7041778564453125, -3.607513427734375, -3.5108489990234375, -3.4141845703125, -3.3175201416015625, -3.220855712890625, -3.1241912841796875, -3.02752685546875, -2.9308624267578125, -2.834197998046875, -2.7375335693359375, -2.640869140625, -2.5442047119140625, -2.447540283203125, -2.3508758544921875, -2.25421142578125, -2.1575469970703125, -2.060882568359375, -1.9642181396484375, -1.8675537109375, -1.7708892822265625, -1.674224853515625, -1.5775604248046875, -1.48089599609375, -1.3842315673828125, -1.287567138671875, -1.1909027099609375, -1.09423828125, -0.9975738525390625, -0.900909423828125, -0.8042449951171875, -0.70758056640625, -0.6109161376953125, -0.514251708984375, -0.4175872802734375, -0.3209228515625, -0.2242584228515625, -0.127593994140625, -0.0309295654296875, 0.06573486328125, 0.1623992919921875, 0.259063720703125, 0.3557281494140625, 0.452392578125, 0.5490570068359375, 0.645721435546875, 0.7423858642578125, 0.83905029296875, 0.9357147216796875, 1.032379150390625, 1.1290435791015625, 1.2257080078125, 1.3223724365234375, 1.419036865234375, 1.5157012939453125, 1.61236572265625, 1.7090301513671875, 1.805694580078125, 1.9023590087890625, 1.9990234375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 19.0, 28.0, 65.0, 147.0, 201.0, 211.0, 160.0, 87.0, 42.0, 25.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.588043212890625, -36.720909118652344, -35.85377883911133, -34.98664474487305, -34.11951446533203, -33.25238037109375, -32.38524627685547, -31.518115997314453, -30.650981903076172, -29.783849716186523, -28.916717529296875, -28.049583435058594, -27.182451248168945, -26.315319061279297, -25.44818687438965, -24.5810546875, -23.71392250061035, -22.846790313720703, -21.979658126831055, -21.112525939941406, -20.245391845703125, -19.378259658813477, -18.511127471923828, -17.64399528503418, -16.77686309814453, -15.909730911254883, -15.042597770690918, -14.17546558380127, -13.308332443237305, -12.441200256347656, -11.574068069458008, -10.70693588256836, -9.839799880981445, -8.972667694091797, -8.105534553527832, -7.238402366638184, -6.371269702911377, -5.50413703918457, -4.637004852294922, -3.7698721885681152, -2.9027395248413086, -2.035606861114502, -1.1684744358062744, -0.3013420104980469, 0.5657906532287598, 1.4329233169555664, 2.300055503845215, 3.1671881675720215, 4.034320831298828, 4.901453495025635, 5.768586158752441, 6.63571834564209, 7.5028510093688965, 8.369983673095703, 9.237115859985352, 10.104248046875, 10.971381187438965, 11.838513374328613, 12.705646514892578, 13.572778701782227, 14.439910888671875, 15.30704402923584, 16.174175262451172, 17.041309356689453, 17.9084415435791]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 8.0, 2.0, 7.0, 12.0, 16.0, 7.0, 15.0, 8.0, 20.0, 17.0, 22.0, 22.0, 24.0, 27.0, 30.0, 29.0, 43.0, 29.0, 42.0, 55.0, 52.0, 47.0, 44.0, 39.0, 45.0, 38.0, 43.0, 27.0, 28.0, 19.0, 22.0, 22.0, 13.0, 27.0, 11.0, 13.0, 17.0, 11.0, 7.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-14.619349479675293, -14.213800430297852, -13.808250427246094, -13.402701377868652, -12.997152328491211, -12.591602325439453, -12.186053276062012, -11.78050422668457, -11.374954223632812, -10.969405174255371, -10.563855171203613, -10.158306121826172, -9.752756118774414, -9.347207069396973, -8.941658020019531, -8.536108016967773, -8.130558967590332, -7.725009441375732, -7.319459915161133, -6.913910865783691, -6.508361339569092, -6.102811813354492, -5.697262763977051, -5.291713237762451, -4.886163711547852, -4.480614185333252, -4.075064659118652, -3.669515609741211, -3.2639660835266113, -2.8584165573120117, -2.452867269515991, -2.0473179817199707, -1.6417675018310547, -1.2362180948257446, -0.8306686878204346, -0.4251192808151245, -0.019569873809814453, 0.38597965240478516, 0.7915289402008057, 1.1970782279968262, 1.6026277542114258, 2.0081772804260254, 2.413726568222046, 2.8192758560180664, 3.224825382232666, 3.6303749084472656, 4.035923957824707, 4.441473484039307, 4.847023010253906, 5.252572536468506, 5.6581220626831055, 6.063671112060547, 6.4692206382751465, 6.874770164489746, 7.2803192138671875, 7.685868740081787, 8.091418266296387, 8.496967315673828, 8.902517318725586, 9.308066368103027, 9.713615417480469, 10.119165420532227, 10.524714469909668, 10.93026351928711, 11.335813522338867]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 9.0, 8.0, 15.0, 25.0, 32.0, 58.0, 93.0, 158.0, 339.0, 811.0, 2261.0, 8938.0, 97990.0, 4051958.0, 24922.0, 4302.0, 1362.0, 502.0, 234.0, 97.0, 51.0, 29.0, 24.0, 11.0, 13.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.9140625, -3.811767578125, -3.70947265625, -3.607177734375, -3.5048828125, -3.402587890625, -3.30029296875, -3.197998046875, -3.095703125, -2.993408203125, -2.89111328125, -2.788818359375, -2.6865234375, -2.584228515625, -2.48193359375, -2.379638671875, -2.27734375, -2.175048828125, -2.07275390625, -1.970458984375, -1.8681640625, -1.765869140625, -1.66357421875, -1.561279296875, -1.458984375, -1.356689453125, -1.25439453125, -1.152099609375, -1.0498046875, -0.947509765625, -0.84521484375, -0.742919921875, -0.640625, -0.538330078125, -0.43603515625, -0.333740234375, -0.2314453125, -0.129150390625, -0.02685546875, 0.075439453125, 0.177734375, 0.280029296875, 0.38232421875, 0.484619140625, 0.5869140625, 0.689208984375, 0.79150390625, 0.893798828125, 0.99609375, 1.098388671875, 1.20068359375, 1.302978515625, 1.4052734375, 1.507568359375, 1.60986328125, 1.712158203125, 1.814453125, 1.916748046875, 2.01904296875, 2.121337890625, 2.2236328125, 2.325927734375, 2.42822265625, 2.530517578125, 2.6328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 1.0, 6.0, 3.0, 12.0, 5.0, 19.0, 24.0, 36.0, 49.0, 40.0, 42.0, 68.0, 69.0, 63.0, 74.0, 68.0, 73.0, 61.0, 53.0, 39.0, 29.0, 29.0, 39.0, 24.0, 17.0, 12.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9333267211914062, -0.9047393798828125, -0.8761520385742188, -0.847564697265625, -0.8189773559570312, -0.7903900146484375, -0.7618026733398438, -0.73321533203125, -0.7046279907226562, -0.6760406494140625, -0.6474533081054688, -0.618865966796875, -0.5902786254882812, -0.5616912841796875, -0.5331039428710938, -0.5045166015625, -0.47592926025390625, -0.4473419189453125, -0.41875457763671875, -0.390167236328125, -0.36157989501953125, -0.3329925537109375, -0.30440521240234375, -0.27581787109375, -0.24723052978515625, -0.2186431884765625, -0.19005584716796875, -0.161468505859375, -0.13288116455078125, -0.1042938232421875, -0.07570648193359375, -0.047119140625, -0.01853179931640625, 0.0100555419921875, 0.03864288330078125, 0.067230224609375, 0.09581756591796875, 0.1244049072265625, 0.15299224853515625, 0.18157958984375, 0.21016693115234375, 0.2387542724609375, 0.26734161376953125, 0.295928955078125, 0.32451629638671875, 0.3531036376953125, 0.38169097900390625, 0.4102783203125, 0.43886566162109375, 0.4674530029296875, 0.49604034423828125, 0.524627685546875, 0.5532150268554688, 0.5818023681640625, 0.6103897094726562, 0.63897705078125, 0.6675643920898438, 0.6961517333984375, 0.7247390747070312, 0.753326416015625, 0.7819137573242188, 0.8105010986328125, 0.8390884399414062, 0.86767578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 4.0, 4.0, 13.0, 16.0, 21.0, 28.0, 42.0, 47.0, 79.0, 104.0, 171.0, 340.0, 809.0, 2526.0, 11997.0, 160572.0, 3977255.0, 32791.0, 4894.0, 1399.0, 497.0, 259.0, 111.0, 96.0, 63.0, 36.0, 28.0, 23.0, 26.0, 11.0, 10.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3046875, -4.1890869140625, -4.073486328125, -3.9578857421875, -3.84228515625, -3.7266845703125, -3.611083984375, -3.4954833984375, -3.3798828125, -3.2642822265625, -3.148681640625, -3.0330810546875, -2.91748046875, -2.8018798828125, -2.686279296875, -2.5706787109375, -2.455078125, -2.3394775390625, -2.223876953125, -2.1082763671875, -1.99267578125, -1.8770751953125, -1.761474609375, -1.6458740234375, -1.5302734375, -1.4146728515625, -1.299072265625, -1.1834716796875, -1.06787109375, -0.9522705078125, -0.836669921875, -0.7210693359375, -0.60546875, -0.4898681640625, -0.374267578125, -0.2586669921875, -0.14306640625, -0.0274658203125, 0.088134765625, 0.2037353515625, 0.3193359375, 0.4349365234375, 0.550537109375, 0.6661376953125, 0.78173828125, 0.8973388671875, 1.012939453125, 1.1285400390625, 1.244140625, 1.3597412109375, 1.475341796875, 1.5909423828125, 1.70654296875, 1.8221435546875, 1.937744140625, 2.0533447265625, 2.1689453125, 2.2845458984375, 2.400146484375, 2.5157470703125, 2.63134765625, 2.7469482421875, 2.862548828125, 2.9781494140625, 3.09375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 11.0, 21.0, 38.0, 71.0, 218.0, 3346.0, 229.0, 82.0, 30.0, 17.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.2540740966796875, -2.195648193359375, -2.1372222900390625, -2.07879638671875, -2.0203704833984375, -1.961944580078125, -1.9035186767578125, -1.8450927734375, -1.7866668701171875, -1.728240966796875, -1.6698150634765625, -1.61138916015625, -1.5529632568359375, -1.494537353515625, -1.4361114501953125, -1.377685546875, -1.3192596435546875, -1.260833740234375, -1.2024078369140625, -1.14398193359375, -1.0855560302734375, -1.027130126953125, -0.9687042236328125, -0.9102783203125, -0.8518524169921875, -0.793426513671875, -0.7350006103515625, -0.67657470703125, -0.6181488037109375, -0.559722900390625, -0.5012969970703125, -0.44287109375, -0.3844451904296875, -0.326019287109375, -0.2675933837890625, -0.20916748046875, -0.1507415771484375, -0.092315673828125, -0.0338897705078125, 0.0245361328125, 0.0829620361328125, 0.141387939453125, 0.1998138427734375, 0.25823974609375, 0.3166656494140625, 0.375091552734375, 0.4335174560546875, 0.491943359375, 0.5503692626953125, 0.608795166015625, 0.6672210693359375, 0.72564697265625, 0.7840728759765625, 0.842498779296875, 0.9009246826171875, 0.9593505859375, 1.0177764892578125, 1.076202392578125, 1.1346282958984375, 1.19305419921875, 1.2514801025390625, 1.309906005859375, 1.3683319091796875, 1.4267578125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 7.0, 10.0, 8.0, 12.0, 20.0, 32.0, 31.0, 54.0, 57.0, 68.0, 90.0, 105.0, 97.0, 85.0, 81.0, 68.0, 47.0, 33.0, 24.0, 17.0, 14.0, 7.0, 7.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.678887367248535, -3.5750250816345215, -3.4711625576019287, -3.367300271987915, -3.2634379863739014, -3.1595754623413086, -3.055713176727295, -2.9518508911132812, -2.8479886054992676, -2.744126319885254, -2.640263795852661, -2.5364015102386475, -2.432539224624634, -2.328676700592041, -2.2248144149780273, -2.1209521293640137, -2.017089605331421, -1.9132272005081177, -1.809364914894104, -1.7055025100708008, -1.601640224456787, -1.4977778196334839, -1.3939154148101807, -1.290053129196167, -1.1861907243728638, -1.0823283195495605, -0.9784660339355469, -0.8746036291122437, -0.7707412838935852, -0.6668789386749268, -0.5630165338516235, -0.4591541886329651, -0.35529208183288574, -0.2514297366142273, -0.14756736159324646, -0.043704986572265625, 0.06015735864639282, 0.16401970386505127, 0.2678821086883545, 0.37174445390701294, 0.4756067991256714, 0.5794691443443298, 0.6833314895629883, 0.7871938943862915, 0.89105623960495, 0.9949185848236084, 1.0987809896469116, 1.2026433944702148, 1.3065056800842285, 1.4103680849075317, 1.5142303705215454, 1.6180927753448486, 1.7219550609588623, 1.8258174657821655, 1.9296798706054688, 2.0335421562194824, 2.137404441833496, 2.2412667274475098, 2.3451292514801025, 2.448991537094116, 2.55285382270813, 2.6567163467407227, 2.7605786323547363, 2.86444091796875, 2.9683034420013428]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 6.0, 12.0, 9.0, 12.0, 17.0, 16.0, 18.0, 21.0, 18.0, 30.0, 30.0, 39.0, 33.0, 34.0, 42.0, 41.0, 45.0, 36.0, 34.0, 39.0, 33.0, 41.0, 40.0, 40.0, 24.0, 38.0, 33.0, 24.0, 29.0, 23.0, 16.0, 21.0, 15.0, 10.0, 15.0, 7.0, 8.0, 4.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-2.7551400661468506, -2.6702563762664795, -2.5853726863861084, -2.5004892349243164, -2.4156055450439453, -2.330721855163574, -2.245838165283203, -2.160954475402832, -2.07607102394104, -1.991187334060669, -1.9063037633895874, -1.8214200735092163, -1.7365365028381348, -1.6516528129577637, -1.5667691230773926, -1.481885552406311, -1.39700186252594, -1.3121181726455688, -1.2272346019744873, -1.1423509120941162, -1.0574673414230347, -0.9725836515426636, -0.8877000212669373, -0.8028163909912109, -0.7179327607154846, -0.6330491304397583, -0.548165500164032, -0.4632818400859833, -0.37839820981025696, -0.29351457953453064, -0.20863091945648193, -0.12374728918075562, -0.0388636589050293, 0.04601997882127762, 0.13090361654758453, 0.21578726172447205, 0.30067089200019836, 0.3855545222759247, 0.4704381823539734, 0.5553218126296997, 0.640205442905426, 0.7250890731811523, 0.8099727034568787, 0.894856333732605, 0.9797400236129761, 1.0646235942840576, 1.1495072841644287, 1.2343909740447998, 1.3192745447158813, 1.4041582345962524, 1.489041805267334, 1.573925495147705, 1.6588090658187866, 1.7436927556991577, 1.8285763263702393, 1.9134600162506104, 1.9983437061309814, 2.0832273960113525, 2.1681110858917236, 2.2529945373535156, 2.3378782272338867, 2.422761917114258, 2.507645606994629, 2.592529296875, 2.677412748336792]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 22.0, 20.0, 31.0, 58.0, 108.0, 197.0, 373.0, 759.0, 1613.0, 3978.0, 11437.0, 39455.0, 168955.0, 507225.0, 236676.0, 53853.0, 14951.0, 5043.0, 1953.0, 908.0, 395.0, 230.0, 120.0, 68.0, 42.0, 24.0, 17.0, 11.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.83453369140625, -1.7725830078125, -1.71063232421875, -1.648681640625, -1.58673095703125, -1.5247802734375, -1.46282958984375, -1.40087890625, -1.33892822265625, -1.2769775390625, -1.21502685546875, -1.153076171875, -1.09112548828125, -1.0291748046875, -0.96722412109375, -0.9052734375, -0.84332275390625, -0.7813720703125, -0.71942138671875, -0.657470703125, -0.59552001953125, -0.5335693359375, -0.47161865234375, -0.40966796875, -0.34771728515625, -0.2857666015625, -0.22381591796875, -0.161865234375, -0.09991455078125, -0.0379638671875, 0.02398681640625, 0.0859375, 0.14788818359375, 0.2098388671875, 0.27178955078125, 0.333740234375, 0.39569091796875, 0.4576416015625, 0.51959228515625, 0.58154296875, 0.64349365234375, 0.7054443359375, 0.76739501953125, 0.829345703125, 0.89129638671875, 0.9532470703125, 1.01519775390625, 1.0771484375, 1.13909912109375, 1.2010498046875, 1.26300048828125, 1.324951171875, 1.38690185546875, 1.4488525390625, 1.51080322265625, 1.57275390625, 1.63470458984375, 1.6966552734375, 1.75860595703125, 1.820556640625, 1.88250732421875, 1.9444580078125, 2.00640869140625, 2.068359375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 3.0, 6.0, 13.0, 19.0, 15.0, 22.0, 23.0, 35.0, 48.0, 42.0, 60.0, 56.0, 71.0, 69.0, 66.0, 80.0, 60.0, 42.0, 59.0, 38.0, 39.0, 29.0, 28.0, 16.0, 14.0, 6.0, 15.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.203125, -1.17230224609375, -1.1414794921875, -1.11065673828125, -1.079833984375, -1.04901123046875, -1.0181884765625, -0.98736572265625, -0.95654296875, -0.92572021484375, -0.8948974609375, -0.86407470703125, -0.833251953125, -0.80242919921875, -0.7716064453125, -0.74078369140625, -0.7099609375, -0.67913818359375, -0.6483154296875, -0.61749267578125, -0.586669921875, -0.55584716796875, -0.5250244140625, -0.49420166015625, -0.46337890625, -0.43255615234375, -0.4017333984375, -0.37091064453125, -0.340087890625, -0.30926513671875, -0.2784423828125, -0.24761962890625, -0.216796875, -0.18597412109375, -0.1551513671875, -0.12432861328125, -0.093505859375, -0.06268310546875, -0.0318603515625, -0.00103759765625, 0.02978515625, 0.06060791015625, 0.0914306640625, 0.12225341796875, 0.153076171875, 0.18389892578125, 0.2147216796875, 0.24554443359375, 0.2763671875, 0.30718994140625, 0.3380126953125, 0.36883544921875, 0.399658203125, 0.43048095703125, 0.4613037109375, 0.49212646484375, 0.52294921875, 0.55377197265625, 0.5845947265625, 0.61541748046875, 0.646240234375, 0.67706298828125, 0.7078857421875, 0.73870849609375, 0.76953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 9.0, 15.0, 20.0, 27.0, 38.0, 53.0, 70.0, 85.0, 126.0, 238.0, 356.0, 665.0, 1342.0, 2900.0, 7934.0, 25384.0, 112010.0, 540271.0, 280540.0, 53132.0, 14168.0, 4744.0, 2064.0, 970.0, 506.0, 277.0, 186.0, 139.0, 70.0, 47.0, 43.0, 21.0, 20.0, 13.0, 13.0, 14.0, 5.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.845703125, -1.78369140625, -1.7216796875, -1.65966796875, -1.59765625, -1.53564453125, -1.4736328125, -1.41162109375, -1.349609375, -1.28759765625, -1.2255859375, -1.16357421875, -1.1015625, -1.03955078125, -0.9775390625, -0.91552734375, -0.853515625, -0.79150390625, -0.7294921875, -0.66748046875, -0.60546875, -0.54345703125, -0.4814453125, -0.41943359375, -0.357421875, -0.29541015625, -0.2333984375, -0.17138671875, -0.109375, -0.04736328125, 0.0146484375, 0.07666015625, 0.138671875, 0.20068359375, 0.2626953125, 0.32470703125, 0.38671875, 0.44873046875, 0.5107421875, 0.57275390625, 0.634765625, 0.69677734375, 0.7587890625, 0.82080078125, 0.8828125, 0.94482421875, 1.0068359375, 1.06884765625, 1.130859375, 1.19287109375, 1.2548828125, 1.31689453125, 1.37890625, 1.44091796875, 1.5029296875, 1.56494140625, 1.626953125, 1.68896484375, 1.7509765625, 1.81298828125, 1.875, 1.93701171875, 1.9990234375, 2.06103515625, 2.123046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 9.0, 10.0, 13.0, 15.0, 15.0, 18.0, 24.0, 17.0, 29.0, 31.0, 39.0, 43.0, 44.0, 49.0, 45.0, 56.0, 54.0, 44.0, 40.0, 49.0, 51.0, 52.0, 44.0, 31.0, 31.0, 28.0, 12.0, 12.0, 16.0, 17.0, 11.0, 9.0, 4.0, 5.0, 7.0, 0.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.583984375, -3.473724365234375, -3.36346435546875, -3.253204345703125, -3.1429443359375, -3.032684326171875, -2.92242431640625, -2.812164306640625, -2.701904296875, -2.591644287109375, -2.48138427734375, -2.371124267578125, -2.2608642578125, -2.150604248046875, -2.04034423828125, -1.930084228515625, -1.81982421875, -1.709564208984375, -1.59930419921875, -1.489044189453125, -1.3787841796875, -1.268524169921875, -1.15826416015625, -1.048004150390625, -0.937744140625, -0.827484130859375, -0.71722412109375, -0.606964111328125, -0.4967041015625, -0.386444091796875, -0.27618408203125, -0.165924072265625, -0.0556640625, 0.054595947265625, 0.16485595703125, 0.275115966796875, 0.3853759765625, 0.495635986328125, 0.60589599609375, 0.716156005859375, 0.826416015625, 0.936676025390625, 1.04693603515625, 1.157196044921875, 1.2674560546875, 1.377716064453125, 1.48797607421875, 1.598236083984375, 1.70849609375, 1.818756103515625, 1.92901611328125, 2.039276123046875, 2.1495361328125, 2.259796142578125, 2.37005615234375, 2.480316162109375, 2.590576171875, 2.700836181640625, 2.81109619140625, 2.921356201171875, 3.0316162109375, 3.141876220703125, 3.25213623046875, 3.362396240234375, 3.47265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 10.0, 12.0, 14.0, 19.0, 32.0, 48.0, 73.0, 178.0, 339.0, 839.0, 2766.0, 17367.0, 443497.0, 558176.0, 20548.0, 2902.0, 936.0, 364.0, 173.0, 80.0, 63.0, 35.0, 21.0, 14.0, 14.0, 7.0, 7.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0667724609375, -1.030029296875, -0.9932861328125, -0.95654296875, -0.9197998046875, -0.883056640625, -0.8463134765625, -0.8095703125, -0.7728271484375, -0.736083984375, -0.6993408203125, -0.66259765625, -0.6258544921875, -0.589111328125, -0.5523681640625, -0.515625, -0.4788818359375, -0.442138671875, -0.4053955078125, -0.36865234375, -0.3319091796875, -0.295166015625, -0.2584228515625, -0.2216796875, -0.1849365234375, -0.148193359375, -0.1114501953125, -0.07470703125, -0.0379638671875, -0.001220703125, 0.0355224609375, 0.072265625, 0.1090087890625, 0.145751953125, 0.1824951171875, 0.21923828125, 0.2559814453125, 0.292724609375, 0.3294677734375, 0.3662109375, 0.4029541015625, 0.439697265625, 0.4764404296875, 0.51318359375, 0.5499267578125, 0.586669921875, 0.6234130859375, 0.66015625, 0.6968994140625, 0.733642578125, 0.7703857421875, 0.80712890625, 0.8438720703125, 0.880615234375, 0.9173583984375, 0.9541015625, 0.9908447265625, 1.027587890625, 1.0643310546875, 1.10107421875, 1.1378173828125, 1.174560546875, 1.2113037109375, 1.248046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 3.0, 11.0, 9.0, 19.0, 24.0, 29.0, 46.0, 60.0, 86.0, 85.0, 134.0, 125.0, 96.0, 97.0, 48.0, 37.0, 26.0, 21.0, 15.0, 10.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014841556549072266, -0.00014360807836055756, -0.00013880059123039246, -0.00013399310410022736, -0.00012918561697006226, -0.00012437812983989716, -0.00011957064270973206, -0.00011476315557956696, -0.00010995566844940186, -0.00010514818131923676, -0.00010034069418907166, -9.553320705890656e-05, -9.072571992874146e-05, -8.591823279857635e-05, -8.111074566841125e-05, -7.630325853824615e-05, -7.149577140808105e-05, -6.668828427791595e-05, -6.188079714775085e-05, -5.7073310017585754e-05, -5.2265822887420654e-05, -4.7458335757255554e-05, -4.2650848627090454e-05, -3.7843361496925354e-05, -3.3035874366760254e-05, -2.8228387236595154e-05, -2.3420900106430054e-05, -1.8613412976264954e-05, -1.3805925846099854e-05, -8.998438715934753e-06, -4.190951585769653e-06, 6.165355443954468e-07, 5.424022674560547e-06, 1.0231509804725647e-05, 1.5038996934890747e-05, 1.9846484065055847e-05, 2.4653971195220947e-05, 2.9461458325386047e-05, 3.426894545555115e-05, 3.907643258571625e-05, 4.388391971588135e-05, 4.869140684604645e-05, 5.349889397621155e-05, 5.830638110637665e-05, 6.311386823654175e-05, 6.792135536670685e-05, 7.272884249687195e-05, 7.753632962703705e-05, 8.234381675720215e-05, 8.715130388736725e-05, 9.195879101753235e-05, 9.676627814769745e-05, 0.00010157376527786255, 0.00010638125240802765, 0.00011118873953819275, 0.00011599622666835785, 0.00012080371379852295, 0.00012561120092868805, 0.00013041868805885315, 0.00013522617518901825, 0.00014003366231918335, 0.00014484114944934845, 0.00014964863657951355, 0.00015445612370967865, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 1.0, 4.0, 7.0, 21.0, 21.0, 43.0, 77.0, 146.0, 317.0, 834.0, 2663.0, 15184.0, 316558.0, 677554.0, 29169.0, 3935.0, 1141.0, 439.0, 219.0, 93.0, 59.0, 26.0, 17.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.556640625, -1.518798828125, -1.48095703125, -1.443115234375, -1.4052734375, -1.367431640625, -1.32958984375, -1.291748046875, -1.25390625, -1.216064453125, -1.17822265625, -1.140380859375, -1.1025390625, -1.064697265625, -1.02685546875, -0.989013671875, -0.951171875, -0.913330078125, -0.87548828125, -0.837646484375, -0.7998046875, -0.761962890625, -0.72412109375, -0.686279296875, -0.6484375, -0.610595703125, -0.57275390625, -0.534912109375, -0.4970703125, -0.459228515625, -0.42138671875, -0.383544921875, -0.345703125, -0.307861328125, -0.27001953125, -0.232177734375, -0.1943359375, -0.156494140625, -0.11865234375, -0.080810546875, -0.04296875, -0.005126953125, 0.03271484375, 0.070556640625, 0.1083984375, 0.146240234375, 0.18408203125, 0.221923828125, 0.259765625, 0.297607421875, 0.33544921875, 0.373291015625, 0.4111328125, 0.448974609375, 0.48681640625, 0.524658203125, 0.5625, 0.600341796875, 0.63818359375, 0.676025390625, 0.7138671875, 0.751708984375, 0.78955078125, 0.827392578125, 0.865234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 13.0, 23.0, 40.0, 69.0, 102.0, 142.0, 173.0, 139.0, 106.0, 64.0, 56.0, 27.0, 10.0, 11.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3579254150390625, -1.308624267578125, -1.2593231201171875, -1.21002197265625, -1.1607208251953125, -1.111419677734375, -1.0621185302734375, -1.0128173828125, -0.9635162353515625, -0.914215087890625, -0.8649139404296875, -0.81561279296875, -0.7663116455078125, -0.717010498046875, -0.6677093505859375, -0.618408203125, -0.5691070556640625, -0.519805908203125, -0.4705047607421875, -0.42120361328125, -0.3719024658203125, -0.322601318359375, -0.2733001708984375, -0.2239990234375, -0.1746978759765625, -0.125396728515625, -0.0760955810546875, -0.02679443359375, 0.0225067138671875, 0.071807861328125, 0.1211090087890625, 0.17041015625, 0.2197113037109375, 0.269012451171875, 0.3183135986328125, 0.36761474609375, 0.4169158935546875, 0.466217041015625, 0.5155181884765625, 0.5648193359375, 0.6141204833984375, 0.663421630859375, 0.7127227783203125, 0.76202392578125, 0.8113250732421875, 0.860626220703125, 0.9099273681640625, 0.959228515625, 1.0085296630859375, 1.057830810546875, 1.1071319580078125, 1.15643310546875, 1.2057342529296875, 1.255035400390625, 1.3043365478515625, 1.3536376953125, 1.4029388427734375, 1.452239990234375, 1.5015411376953125, 1.55084228515625, 1.6001434326171875, 1.649444580078125, 1.6987457275390625, 1.748046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 15.0, 30.0, 69.0, 163.0, 300.0, 228.0, 127.0, 45.0, 17.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.67064666748047, -51.67135238647461, -50.672054290771484, -49.672760009765625, -48.673465728759766, -47.674171447753906, -46.67487335205078, -45.67557907104492, -44.67628479003906, -43.6769905090332, -42.67769241333008, -41.67839813232422, -40.67910385131836, -39.6798095703125, -38.680511474609375, -37.681217193603516, -36.68191909790039, -35.68262481689453, -34.683326721191406, -33.68403244018555, -32.68473815917969, -31.685441970825195, -30.686145782470703, -29.686851501464844, -28.68755531311035, -27.68825912475586, -26.68896484375, -25.689668655395508, -24.690372467041016, -23.691078186035156, -22.691781997680664, -21.692485809326172, -20.693191528320312, -19.69389533996582, -18.69460105895996, -17.69530487060547, -16.69601058959961, -15.696714401245117, -14.697418212890625, -13.69812297821045, -12.698827743530273, -11.699532508850098, -10.700237274169922, -9.70094108581543, -8.701645851135254, -7.702350616455078, -6.703054904937744, -5.70375919342041, -4.704463958740234, -3.7051684856414795, -2.7058730125427246, -1.7065775394439697, -0.7072820663452148, 0.29201316833496094, 1.291308879852295, 2.290604591369629, 3.2898998260498047, 4.2891950607299805, 5.2884907722473145, 6.287786483764648, 7.287081718444824, 8.286376953125, 9.285673141479492, 10.284968376159668, 11.284263610839844]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 11.0, 9.0, 5.0, 16.0, 14.0, 20.0, 21.0, 17.0, 27.0, 25.0, 39.0, 39.0, 39.0, 48.0, 46.0, 54.0, 56.0, 61.0, 52.0, 51.0, 29.0, 37.0, 42.0, 36.0, 32.0, 24.0, 23.0, 24.0, 13.0, 14.0, 14.0, 16.0, 5.0, 8.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.212024688720703, -12.742264747619629, -12.272504806518555, -11.802745819091797, -11.332985877990723, -10.863225936889648, -10.393465995788574, -9.9237060546875, -9.453946113586426, -8.984186172485352, -8.514426231384277, -8.044666290283203, -7.574906826019287, -7.105147361755371, -6.635387420654297, -6.165627479553223, -5.695868015289307, -5.226108074188232, -4.756348609924316, -4.286588668823242, -3.816828727722168, -3.347069025039673, -2.8773093223571777, -2.4075493812561035, -1.9377896785736084, -1.4680298566818237, -0.9982700943946838, -0.528510332107544, -0.05875051021575928, 0.4110093116760254, 0.8807690143585205, 1.3505289554595947, 1.8202886581420898, 2.290048360824585, 2.759808301925659, 3.2295680046081543, 3.6993279457092285, 4.1690874099731445, 4.638847351074219, 5.108607292175293, 5.578367233276367, 6.048127174377441, 6.517886638641357, 6.987646579742432, 7.457406520843506, 7.927165985107422, 8.396925926208496, 8.86668586730957, 9.336444854736328, 9.806204795837402, 10.275964736938477, 10.745723724365234, 11.215483665466309, 11.685243606567383, 12.155003547668457, 12.624763488769531, 13.094523429870605, 13.56428337097168, 14.034043312072754, 14.503803253173828, 14.973562240600586, 15.44332218170166, 15.913082122802734, 16.382843017578125, 16.852602005004883]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 12.0, 11.0, 13.0, 6.0, 18.0, 32.0, 37.0, 67.0, 120.0, 221.0, 458.0, 897.0, 1992.0, 5347.0, 15738.0, 71554.0, 2362744.0, 1651659.0, 60295.0, 14164.0, 4857.0, 1939.0, 949.0, 447.0, 232.0, 144.0, 93.0, 83.0, 46.0, 21.0, 26.0, 11.0, 7.0, 6.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.60003662109375, -1.5447998046875, -1.48956298828125, -1.434326171875, -1.37908935546875, -1.3238525390625, -1.26861572265625, -1.21337890625, -1.15814208984375, -1.1029052734375, -1.04766845703125, -0.992431640625, -0.93719482421875, -0.8819580078125, -0.82672119140625, -0.771484375, -0.71624755859375, -0.6610107421875, -0.60577392578125, -0.550537109375, -0.49530029296875, -0.4400634765625, -0.38482666015625, -0.32958984375, -0.27435302734375, -0.2191162109375, -0.16387939453125, -0.108642578125, -0.05340576171875, 0.0018310546875, 0.05706787109375, 0.1123046875, 0.16754150390625, 0.2227783203125, 0.27801513671875, 0.333251953125, 0.38848876953125, 0.4437255859375, 0.49896240234375, 0.55419921875, 0.60943603515625, 0.6646728515625, 0.71990966796875, 0.775146484375, 0.83038330078125, 0.8856201171875, 0.94085693359375, 0.99609375, 1.05133056640625, 1.1065673828125, 1.16180419921875, 1.217041015625, 1.27227783203125, 1.3275146484375, 1.38275146484375, 1.43798828125, 1.49322509765625, 1.5484619140625, 1.60369873046875, 1.658935546875, 1.71417236328125, 1.7694091796875, 1.82464599609375, 1.8798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 12.0, 12.0, 14.0, 43.0, 61.0, 67.0, 69.0, 82.0, 102.0, 116.0, 95.0, 91.0, 63.0, 65.0, 48.0, 30.0, 11.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.214324951171875, -1.16986083984375, -1.125396728515625, -1.0809326171875, -1.036468505859375, -0.99200439453125, -0.947540283203125, -0.903076171875, -0.858612060546875, -0.81414794921875, -0.769683837890625, -0.7252197265625, -0.680755615234375, -0.63629150390625, -0.591827392578125, -0.54736328125, -0.502899169921875, -0.45843505859375, -0.413970947265625, -0.3695068359375, -0.325042724609375, -0.28057861328125, -0.236114501953125, -0.191650390625, -0.147186279296875, -0.10272216796875, -0.058258056640625, -0.0137939453125, 0.030670166015625, 0.07513427734375, 0.119598388671875, 0.1640625, 0.208526611328125, 0.25299072265625, 0.297454833984375, 0.3419189453125, 0.386383056640625, 0.43084716796875, 0.475311279296875, 0.519775390625, 0.564239501953125, 0.60870361328125, 0.653167724609375, 0.6976318359375, 0.742095947265625, 0.78656005859375, 0.831024169921875, 0.87548828125, 0.919952392578125, 0.96441650390625, 1.008880615234375, 1.0533447265625, 1.097808837890625, 1.14227294921875, 1.186737060546875, 1.231201171875, 1.275665283203125, 1.32012939453125, 1.364593505859375, 1.4090576171875, 1.453521728515625, 1.49798583984375, 1.542449951171875, 1.5869140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 2.0, 9.0, 8.0, 14.0, 24.0, 35.0, 65.0, 117.0, 272.0, 811.0, 2771.0, 13629.0, 165802.0, 3899201.0, 98336.0, 9890.0, 2175.0, 622.0, 220.0, 112.0, 47.0, 34.0, 24.0, 18.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.1241455078125, -2.033447265625, -1.9427490234375, -1.85205078125, -1.7613525390625, -1.670654296875, -1.5799560546875, -1.4892578125, -1.3985595703125, -1.307861328125, -1.2171630859375, -1.12646484375, -1.0357666015625, -0.945068359375, -0.8543701171875, -0.763671875, -0.6729736328125, -0.582275390625, -0.4915771484375, -0.40087890625, -0.3101806640625, -0.219482421875, -0.1287841796875, -0.0380859375, 0.0526123046875, 0.143310546875, 0.2340087890625, 0.32470703125, 0.4154052734375, 0.506103515625, 0.5968017578125, 0.6875, 0.7781982421875, 0.868896484375, 0.9595947265625, 1.05029296875, 1.1409912109375, 1.231689453125, 1.3223876953125, 1.4130859375, 1.5037841796875, 1.594482421875, 1.6851806640625, 1.77587890625, 1.8665771484375, 1.957275390625, 2.0479736328125, 2.138671875, 2.2293701171875, 2.320068359375, 2.4107666015625, 2.50146484375, 2.5921630859375, 2.682861328125, 2.7735595703125, 2.8642578125, 2.9549560546875, 3.045654296875, 3.1363525390625, 3.22705078125, 3.3177490234375, 3.408447265625, 3.4991455078125, 3.58984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 16.0, 23.0, 31.0, 42.0, 83.0, 131.0, 285.0, 944.0, 1407.0, 585.0, 215.0, 100.0, 64.0, 45.0, 23.0, 12.0, 10.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.994140625, -2.9198760986328125, -2.845611572265625, -2.7713470458984375, -2.69708251953125, -2.6228179931640625, -2.548553466796875, -2.4742889404296875, -2.4000244140625, -2.3257598876953125, -2.251495361328125, -2.1772308349609375, -2.10296630859375, -2.0287017822265625, -1.954437255859375, -1.8801727294921875, -1.805908203125, -1.7316436767578125, -1.657379150390625, -1.5831146240234375, -1.50885009765625, -1.4345855712890625, -1.360321044921875, -1.2860565185546875, -1.2117919921875, -1.1375274658203125, -1.063262939453125, -0.9889984130859375, -0.91473388671875, -0.8404693603515625, -0.766204833984375, -0.6919403076171875, -0.61767578125, -0.5434112548828125, -0.469146728515625, -0.3948822021484375, -0.32061767578125, -0.2463531494140625, -0.172088623046875, -0.0978240966796875, -0.0235595703125, 0.0507049560546875, 0.124969482421875, 0.1992340087890625, 0.27349853515625, 0.3477630615234375, 0.422027587890625, 0.4962921142578125, 0.570556640625, 0.6448211669921875, 0.719085693359375, 0.7933502197265625, 0.86761474609375, 0.9418792724609375, 1.016143798828125, 1.0904083251953125, 1.1646728515625, 1.2389373779296875, 1.313201904296875, 1.3874664306640625, 1.46173095703125, 1.5359954833984375, 1.610260009765625, 1.6845245361328125, 1.7587890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 36.0, 87.0, 174.0, 227.0, 229.0, 111.0, 58.0, 25.0, 9.0, 6.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.634222030639648, -14.007793426513672, -13.381364822387695, -12.754936218261719, -12.128507614135742, -11.502079010009766, -10.875650405883789, -10.249221801757812, -9.622793197631836, -8.99636459350586, -8.369935989379883, -7.743507385253906, -7.11707878112793, -6.490650177001953, -5.864221572875977, -5.23779296875, -4.611364364624023, -3.984935760498047, -3.3585071563720703, -2.7320785522460938, -2.105649948120117, -1.4792213439941406, -0.8527927398681641, -0.2263641357421875, 0.40006446838378906, 1.0264930725097656, 1.6529216766357422, 2.2793502807617188, 2.9057788848876953, 3.532207489013672, 4.158636093139648, 4.785064697265625, 5.411495208740234, 6.037923812866211, 6.6643524169921875, 7.290781021118164, 7.917209625244141, 8.543638229370117, 9.170066833496094, 9.79649543762207, 10.422924041748047, 11.049352645874023, 11.67578125, 12.302209854125977, 12.928638458251953, 13.55506706237793, 14.181495666503906, 14.807924270629883, 15.43435287475586, 16.060781478881836, 16.687210083007812, 17.31363868713379, 17.940067291259766, 18.566495895385742, 19.19292449951172, 19.819353103637695, 20.445781707763672, 21.07221031188965, 21.698638916015625, 22.3250675201416, 22.951496124267578, 23.577924728393555, 24.20435333251953, 24.830781936645508, 25.457210540771484]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 4.0, 12.0, 17.0, 14.0, 30.0, 30.0, 43.0, 57.0, 49.0, 53.0, 57.0, 75.0, 58.0, 73.0, 62.0, 56.0, 52.0, 54.0, 36.0, 40.0, 23.0, 16.0, 13.0, 24.0, 7.0, 8.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.714668273925781, -13.341004371643066, -12.967340469360352, -12.593676567077637, -12.220012664794922, -11.846348762512207, -11.472684860229492, -11.099020957946777, -10.725357055664062, -10.351693153381348, -9.978029251098633, -9.604365348815918, -9.230701446533203, -8.857037544250488, -8.483373641967773, -8.109709739685059, -7.7360453605651855, -7.362381458282471, -6.988717555999756, -6.615053653717041, -6.241389751434326, -5.867725849151611, -5.494061470031738, -5.120397567749023, -4.746733665466309, -4.373069763183594, -3.999405860900879, -3.625741958618164, -3.252078056335449, -2.8784141540527344, -2.5047500133514404, -2.1310861110687256, -1.7574224472045898, -1.383758544921875, -1.0100946426391602, -0.6364306211471558, -0.2627667188644409, 0.11089718341827393, 0.4845612049102783, 0.8582251071929932, 1.231889009475708, 1.6055529117584229, 1.9792168140411377, 2.3528809547424316, 2.7265448570251465, 3.1002087593078613, 3.473872661590576, 3.847536563873291, 4.221200466156006, 4.594864368438721, 4.9685282707214355, 5.34219217300415, 5.715856075286865, 6.08951997756958, 6.463184356689453, 6.836848258972168, 7.210512161254883, 7.584176063537598, 7.9578399658203125, 8.331503868103027, 8.705167770385742, 9.078831672668457, 9.452495574951172, 9.826159477233887, 10.199823379516602]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 14.0, 20.0, 26.0, 44.0, 51.0, 79.0, 132.0, 199.0, 240.0, 476.0, 764.0, 1390.0, 2463.0, 4679.0, 9293.0, 18994.0, 41116.0, 93036.0, 203138.0, 302234.0, 199308.0, 91743.0, 40582.0, 18547.0, 9248.0, 4684.0, 2557.0, 1415.0, 821.0, 444.0, 279.0, 193.0, 106.0, 70.0, 48.0, 30.0, 26.0, 15.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8779449462890625, -0.848175048828125, -0.8184051513671875, -0.78863525390625, -0.7588653564453125, -0.729095458984375, -0.6993255615234375, -0.6695556640625, -0.6397857666015625, -0.610015869140625, -0.5802459716796875, -0.55047607421875, -0.5207061767578125, -0.490936279296875, -0.4611663818359375, -0.431396484375, -0.4016265869140625, -0.371856689453125, -0.3420867919921875, -0.31231689453125, -0.2825469970703125, -0.252777099609375, -0.2230072021484375, -0.1932373046875, -0.1634674072265625, -0.133697509765625, -0.1039276123046875, -0.07415771484375, -0.0443878173828125, -0.014617919921875, 0.0151519775390625, 0.044921875, 0.0746917724609375, 0.104461669921875, 0.1342315673828125, 0.16400146484375, 0.1937713623046875, 0.223541259765625, 0.2533111572265625, 0.2830810546875, 0.3128509521484375, 0.342620849609375, 0.3723907470703125, 0.40216064453125, 0.4319305419921875, 0.461700439453125, 0.4914703369140625, 0.521240234375, 0.5510101318359375, 0.580780029296875, 0.6105499267578125, 0.64031982421875, 0.6700897216796875, 0.699859619140625, 0.7296295166015625, 0.7593994140625, 0.7891693115234375, 0.818939208984375, 0.8487091064453125, 0.87847900390625, 0.9082489013671875, 0.938018798828125, 0.9677886962890625, 0.99755859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 17.0, 25.0, 31.0, 31.0, 36.0, 32.0, 51.0, 53.0, 62.0, 47.0, 50.0, 55.0, 60.0, 46.0, 54.0, 56.0, 42.0, 34.0, 40.0, 30.0, 24.0, 13.0, 20.0, 20.0, 11.0, 9.0, 3.0, 6.0, 0.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87158203125, -0.8469924926757812, -0.8224029541015625, -0.7978134155273438, -0.773223876953125, -0.7486343383789062, -0.7240447998046875, -0.6994552612304688, -0.67486572265625, -0.6502761840820312, -0.6256866455078125, -0.6010971069335938, -0.576507568359375, -0.5519180297851562, -0.5273284912109375, -0.5027389526367188, -0.4781494140625, -0.45355987548828125, -0.4289703369140625, -0.40438079833984375, -0.379791259765625, -0.35520172119140625, -0.3306121826171875, -0.30602264404296875, -0.28143310546875, -0.25684356689453125, -0.2322540283203125, -0.20766448974609375, -0.183074951171875, -0.15848541259765625, -0.1338958740234375, -0.10930633544921875, -0.084716796875, -0.06012725830078125, -0.0355377197265625, -0.01094818115234375, 0.013641357421875, 0.03823089599609375, 0.0628204345703125, 0.08740997314453125, 0.11199951171875, 0.13658905029296875, 0.1611785888671875, 0.18576812744140625, 0.210357666015625, 0.23494720458984375, 0.2595367431640625, 0.28412628173828125, 0.3087158203125, 0.33330535888671875, 0.3578948974609375, 0.38248443603515625, 0.407073974609375, 0.43166351318359375, 0.4562530517578125, 0.48084259033203125, 0.50543212890625, 0.5300216674804688, 0.5546112060546875, 0.5792007446289062, 0.603790283203125, 0.6283798217773438, 0.6529693603515625, 0.6775588989257812, 0.7021484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 10.0, 14.0, 41.0, 42.0, 57.0, 112.0, 149.0, 322.0, 591.0, 1243.0, 3205.0, 12565.0, 120108.0, 787792.0, 105170.0, 11670.0, 3019.0, 1184.0, 529.0, 280.0, 177.0, 96.0, 45.0, 36.0, 26.0, 18.0, 8.0, 13.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.30078125, -3.214996337890625, -3.12921142578125, -3.043426513671875, -2.9576416015625, -2.871856689453125, -2.78607177734375, -2.700286865234375, -2.614501953125, -2.528717041015625, -2.44293212890625, -2.357147216796875, -2.2713623046875, -2.185577392578125, -2.09979248046875, -2.014007568359375, -1.92822265625, -1.842437744140625, -1.75665283203125, -1.670867919921875, -1.5850830078125, -1.499298095703125, -1.41351318359375, -1.327728271484375, -1.241943359375, -1.156158447265625, -1.07037353515625, -0.984588623046875, -0.8988037109375, -0.813018798828125, -0.72723388671875, -0.641448974609375, -0.5556640625, -0.469879150390625, -0.38409423828125, -0.298309326171875, -0.2125244140625, -0.126739501953125, -0.04095458984375, 0.044830322265625, 0.130615234375, 0.216400146484375, 0.30218505859375, 0.387969970703125, 0.4737548828125, 0.559539794921875, 0.64532470703125, 0.731109619140625, 0.81689453125, 0.902679443359375, 0.98846435546875, 1.074249267578125, 1.1600341796875, 1.245819091796875, 1.33160400390625, 1.417388916015625, 1.503173828125, 1.588958740234375, 1.67474365234375, 1.760528564453125, 1.8463134765625, 1.932098388671875, 2.01788330078125, 2.103668212890625, 2.189453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 12.0, 11.0, 20.0, 10.0, 17.0, 27.0, 31.0, 35.0, 45.0, 48.0, 53.0, 65.0, 61.0, 75.0, 71.0, 72.0, 53.0, 58.0, 44.0, 37.0, 36.0, 30.0, 13.0, 16.0, 12.0, 10.0, 10.0, 7.0, 8.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.271759033203125, -4.15289306640625, -4.034027099609375, -3.9151611328125, -3.796295166015625, -3.67742919921875, -3.558563232421875, -3.439697265625, -3.320831298828125, -3.20196533203125, -3.083099365234375, -2.9642333984375, -2.845367431640625, -2.72650146484375, -2.607635498046875, -2.48876953125, -2.369903564453125, -2.25103759765625, -2.132171630859375, -2.0133056640625, -1.894439697265625, -1.77557373046875, -1.656707763671875, -1.537841796875, -1.418975830078125, -1.30010986328125, -1.181243896484375, -1.0623779296875, -0.943511962890625, -0.82464599609375, -0.705780029296875, -0.5869140625, -0.468048095703125, -0.34918212890625, -0.230316162109375, -0.1114501953125, 0.007415771484375, 0.12628173828125, 0.245147705078125, 0.364013671875, 0.482879638671875, 0.60174560546875, 0.720611572265625, 0.8394775390625, 0.958343505859375, 1.07720947265625, 1.196075439453125, 1.31494140625, 1.433807373046875, 1.55267333984375, 1.671539306640625, 1.7904052734375, 1.909271240234375, 2.02813720703125, 2.147003173828125, 2.265869140625, 2.384735107421875, 2.50360107421875, 2.622467041015625, 2.7413330078125, 2.860198974609375, 2.97906494140625, 3.097930908203125, 3.216796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 19.0, 34.0, 65.0, 193.0, 743.0, 4660.0, 260291.0, 772851.0, 8319.0, 965.0, 239.0, 83.0, 38.0, 17.0, 5.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.9613037109375, -1.906982421875, -1.8526611328125, -1.79833984375, -1.7440185546875, -1.689697265625, -1.6353759765625, -1.5810546875, -1.5267333984375, -1.472412109375, -1.4180908203125, -1.36376953125, -1.3094482421875, -1.255126953125, -1.2008056640625, -1.146484375, -1.0921630859375, -1.037841796875, -0.9835205078125, -0.92919921875, -0.8748779296875, -0.820556640625, -0.7662353515625, -0.7119140625, -0.6575927734375, -0.603271484375, -0.5489501953125, -0.49462890625, -0.4403076171875, -0.385986328125, -0.3316650390625, -0.27734375, -0.2230224609375, -0.168701171875, -0.1143798828125, -0.06005859375, -0.0057373046875, 0.048583984375, 0.1029052734375, 0.1572265625, 0.2115478515625, 0.265869140625, 0.3201904296875, 0.37451171875, 0.4288330078125, 0.483154296875, 0.5374755859375, 0.591796875, 0.6461181640625, 0.700439453125, 0.7547607421875, 0.80908203125, 0.8634033203125, 0.917724609375, 0.9720458984375, 1.0263671875, 1.0806884765625, 1.135009765625, 1.1893310546875, 1.24365234375, 1.2979736328125, 1.352294921875, 1.4066162109375, 1.4609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 12.0, 11.0, 6.0, 10.0, 13.0, 30.0, 29.0, 39.0, 42.0, 55.0, 78.0, 77.0, 96.0, 97.0, 66.0, 47.0, 45.0, 50.0, 51.0, 29.0, 23.0, 15.0, 17.0, 9.0, 11.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.225440979003906e-05, -7.893331348896027e-05, -7.561221718788147e-05, -7.229112088680267e-05, -6.897002458572388e-05, -6.564892828464508e-05, -6.232783198356628e-05, -5.900673568248749e-05, -5.568563938140869e-05, -5.2364543080329895e-05, -4.90434467792511e-05, -4.57223504781723e-05, -4.2401254177093506e-05, -3.908015787601471e-05, -3.575906157493591e-05, -3.243796527385712e-05, -2.911686897277832e-05, -2.5795772671699524e-05, -2.2474676370620728e-05, -1.915358006954193e-05, -1.5832483768463135e-05, -1.2511387467384338e-05, -9.190291166305542e-06, -5.869194865226746e-06, -2.5480985641479492e-06, 7.729977369308472e-07, 4.0940940380096436e-06, 7.41519033908844e-06, 1.0736286640167236e-05, 1.4057382941246033e-05, 1.737847924232483e-05, 2.0699575543403625e-05, 2.4020671844482422e-05, 2.7341768145561218e-05, 3.0662864446640015e-05, 3.398396074771881e-05, 3.730505704879761e-05, 4.0626153349876404e-05, 4.39472496509552e-05, 4.7268345952033997e-05, 5.058944225311279e-05, 5.391053855419159e-05, 5.7231634855270386e-05, 6.055273115634918e-05, 6.387382745742798e-05, 6.719492375850677e-05, 7.051602005958557e-05, 7.383711636066437e-05, 7.715821266174316e-05, 8.047930896282196e-05, 8.380040526390076e-05, 8.712150156497955e-05, 9.044259786605835e-05, 9.376369416713715e-05, 9.708479046821594e-05, 0.00010040588676929474, 0.00010372698307037354, 0.00010704807937145233, 0.00011036917567253113, 0.00011369027197360992, 0.00011701136827468872, 0.00012033246457576752, 0.0001236535608768463, 0.0001269746571779251, 0.0001302957534790039]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 15.0, 17.0, 31.0, 38.0, 59.0, 80.0, 134.0, 218.0, 379.0, 858.0, 1965.0, 5730.0, 26791.0, 234514.0, 678283.0, 81228.0, 12282.0, 3334.0, 1224.0, 544.0, 318.0, 178.0, 122.0, 70.0, 42.0, 27.0, 26.0, 11.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5196075439453125, -0.498199462890625, -0.4767913818359375, -0.45538330078125, -0.4339752197265625, -0.412567138671875, -0.3911590576171875, -0.3697509765625, -0.3483428955078125, -0.326934814453125, -0.3055267333984375, -0.28411865234375, -0.2627105712890625, -0.241302490234375, -0.2198944091796875, -0.198486328125, -0.1770782470703125, -0.155670166015625, -0.1342620849609375, -0.11285400390625, -0.0914459228515625, -0.070037841796875, -0.0486297607421875, -0.0272216796875, -0.0058135986328125, 0.015594482421875, 0.0370025634765625, 0.05841064453125, 0.0798187255859375, 0.101226806640625, 0.1226348876953125, 0.14404296875, 0.1654510498046875, 0.186859130859375, 0.2082672119140625, 0.22967529296875, 0.2510833740234375, 0.272491455078125, 0.2938995361328125, 0.3153076171875, 0.3367156982421875, 0.358123779296875, 0.3795318603515625, 0.40093994140625, 0.4223480224609375, 0.443756103515625, 0.4651641845703125, 0.486572265625, 0.5079803466796875, 0.529388427734375, 0.5507965087890625, 0.57220458984375, 0.5936126708984375, 0.615020751953125, 0.6364288330078125, 0.6578369140625, 0.6792449951171875, 0.700653076171875, 0.7220611572265625, 0.74346923828125, 0.7648773193359375, 0.786285400390625, 0.8076934814453125, 0.8291015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 12.0, 18.0, 20.0, 26.0, 16.0, 28.0, 34.0, 34.0, 65.0, 70.0, 64.0, 69.0, 79.0, 72.0, 74.0, 58.0, 40.0, 42.0, 31.0, 34.0, 27.0, 12.0, 18.0, 7.0, 7.0, 7.0, 1.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6240234375, -0.6039276123046875, -0.583831787109375, -0.5637359619140625, -0.54364013671875, -0.5235443115234375, -0.503448486328125, -0.4833526611328125, -0.4632568359375, -0.4431610107421875, -0.423065185546875, -0.4029693603515625, -0.38287353515625, -0.3627777099609375, -0.342681884765625, -0.3225860595703125, -0.302490234375, -0.2823944091796875, -0.262298583984375, -0.2422027587890625, -0.22210693359375, -0.2020111083984375, -0.181915283203125, -0.1618194580078125, -0.1417236328125, -0.1216278076171875, -0.101531982421875, -0.0814361572265625, -0.06134033203125, -0.0412445068359375, -0.021148681640625, -0.0010528564453125, 0.01904296875, 0.0391387939453125, 0.059234619140625, 0.0793304443359375, 0.09942626953125, 0.1195220947265625, 0.139617919921875, 0.1597137451171875, 0.1798095703125, 0.1999053955078125, 0.220001220703125, 0.2400970458984375, 0.26019287109375, 0.2802886962890625, 0.300384521484375, 0.3204803466796875, 0.340576171875, 0.3606719970703125, 0.380767822265625, 0.4008636474609375, 0.42095947265625, 0.4410552978515625, 0.461151123046875, 0.4812469482421875, 0.5013427734375, 0.5214385986328125, 0.541534423828125, 0.5616302490234375, 0.58172607421875, 0.6018218994140625, 0.621917724609375, 0.6420135498046875, 0.662109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 16.0, 41.0, 128.0, 371.0, 279.0, 111.0, 27.0, 14.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.17041015625, -42.163047790527344, -41.15568542480469, -40.14832305908203, -39.140960693359375, -38.13359832763672, -37.12623596191406, -36.118873596191406, -35.11151123046875, -34.104148864746094, -33.09678649902344, -32.08942413330078, -31.082061767578125, -30.07469940185547, -29.067338943481445, -28.05997657775879, -27.052616119384766, -26.04525375366211, -25.037891387939453, -24.030529022216797, -23.02316665649414, -22.015804290771484, -21.00844383239746, -20.001081466674805, -18.99371910095215, -17.986356735229492, -16.978994369506836, -15.971632957458496, -14.96427059173584, -13.956908226013184, -12.949546813964844, -11.942184448242188, -10.934822082519531, -9.927459716796875, -8.920097351074219, -7.912735939025879, -6.905373573303223, -5.898011207580566, -4.890649318695068, -3.8832874298095703, -2.875925064086914, -1.868562936782837, -0.8612008094787598, 0.14616131782531738, 1.1535234451293945, 2.160885810852051, 3.168247699737549, 4.175609588623047, 5.182971954345703, 6.190334320068359, 7.197696208953857, 8.205058097839355, 9.212420463562012, 10.219782829284668, 11.227144241333008, 12.234506607055664, 13.24186897277832, 14.249231338500977, 15.256593704223633, 16.26395606994629, 17.271316528320312, 18.27867889404297, 19.286041259765625, 20.29340362548828, 21.300765991210938]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 14.0, 17.0, 21.0, 41.0, 37.0, 53.0, 52.0, 71.0, 67.0, 95.0, 107.0, 78.0, 63.0, 53.0, 49.0, 49.0, 27.0, 19.0, 21.0, 13.0, 14.0, 10.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.663875579833984, -24.01864242553711, -23.373409271240234, -22.72817611694336, -22.08294105529785, -21.437707901000977, -20.7924747467041, -20.147241592407227, -19.50200843811035, -18.856775283813477, -18.2115421295166, -17.566307067871094, -16.92107391357422, -16.275840759277344, -15.630607604980469, -14.985374450683594, -14.340140342712402, -13.694907188415527, -13.049673080444336, -12.404439926147461, -11.759206771850586, -11.113973617553711, -10.46873950958252, -9.823506355285645, -9.178272247314453, -8.533039093017578, -7.887805461883545, -7.242571830749512, -6.597338676452637, -5.9521050453186035, -5.30687141418457, -4.661638259887695, -4.01640510559082, -3.371171712875366, -2.725938320159912, -2.080704689025879, -1.4354712963104248, -0.7902379035949707, -0.1450042724609375, 0.5002288818359375, 1.1454625129699707, 1.7906959056854248, 2.435929298400879, 3.081162929534912, 3.726396322250366, 4.37162971496582, 5.0168633460998535, 5.6620965003967285, 6.307330131530762, 6.952563762664795, 7.59779691696167, 8.243030548095703, 8.888263702392578, 9.533496856689453, 10.178730964660645, 10.82396411895752, 11.469198226928711, 12.114431381225586, 12.759665489196777, 13.404898643493652, 14.050131797790527, 14.695365905761719, 15.340599060058594, 15.985832214355469, 16.631065368652344]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 8.0, 19.0, 15.0, 27.0, 31.0, 62.0, 64.0, 84.0, 143.0, 242.0, 417.0, 1439.0, 14409.0, 3583181.0, 581920.0, 10215.0, 1257.0, 323.0, 130.0, 77.0, 53.0, 25.0, 35.0, 15.0, 18.0, 14.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.091796875, -2.991668701171875, -2.89154052734375, -2.791412353515625, -2.6912841796875, -2.591156005859375, -2.49102783203125, -2.390899658203125, -2.290771484375, -2.190643310546875, -2.09051513671875, -1.990386962890625, -1.8902587890625, -1.790130615234375, -1.69000244140625, -1.589874267578125, -1.48974609375, -1.389617919921875, -1.28948974609375, -1.189361572265625, -1.0892333984375, -0.989105224609375, -0.88897705078125, -0.788848876953125, -0.688720703125, -0.588592529296875, -0.48846435546875, -0.388336181640625, -0.2882080078125, -0.188079833984375, -0.08795166015625, 0.012176513671875, 0.1123046875, 0.212432861328125, 0.31256103515625, 0.412689208984375, 0.5128173828125, 0.612945556640625, 0.71307373046875, 0.813201904296875, 0.913330078125, 1.013458251953125, 1.11358642578125, 1.213714599609375, 1.3138427734375, 1.413970947265625, 1.51409912109375, 1.614227294921875, 1.71435546875, 1.814483642578125, 1.91461181640625, 2.014739990234375, 2.1148681640625, 2.214996337890625, 2.31512451171875, 2.415252685546875, 2.515380859375, 2.615509033203125, 2.71563720703125, 2.815765380859375, 2.9158935546875, 3.016021728515625, 3.11614990234375, 3.216278076171875, 3.31640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 20.0, 40.0, 63.0, 97.0, 130.0, 124.0, 143.0, 124.0, 91.0, 70.0, 39.0, 23.0, 11.0, 11.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-2.904296875, -2.8461761474609375, -2.788055419921875, -2.7299346923828125, -2.67181396484375, -2.6136932373046875, -2.555572509765625, -2.4974517822265625, -2.4393310546875, -2.3812103271484375, -2.323089599609375, -2.2649688720703125, -2.20684814453125, -2.1487274169921875, -2.090606689453125, -2.0324859619140625, -1.974365234375, -1.9162445068359375, -1.858123779296875, -1.8000030517578125, -1.74188232421875, -1.6837615966796875, -1.625640869140625, -1.5675201416015625, -1.5093994140625, -1.4512786865234375, -1.393157958984375, -1.3350372314453125, -1.27691650390625, -1.2187957763671875, -1.160675048828125, -1.1025543212890625, -1.04443359375, -0.9863128662109375, -0.928192138671875, -0.8700714111328125, -0.81195068359375, -0.7538299560546875, -0.695709228515625, -0.6375885009765625, -0.5794677734375, -0.5213470458984375, -0.463226318359375, -0.4051055908203125, -0.34698486328125, -0.2888641357421875, -0.230743408203125, -0.1726226806640625, -0.114501953125, -0.0563812255859375, 0.001739501953125, 0.0598602294921875, 0.11798095703125, 0.1761016845703125, 0.234222412109375, 0.2923431396484375, 0.3504638671875, 0.4085845947265625, 0.466705322265625, 0.5248260498046875, 0.58294677734375, 0.6410675048828125, 0.699188232421875, 0.7573089599609375, 0.8154296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 21.0, 17.0, 47.0, 30.0, 88.0, 120.0, 180.0, 327.0, 683.0, 1512.0, 3479.0, 9045.0, 27856.0, 141432.0, 3123942.0, 792010.0, 65316.0, 17051.0, 5936.0, 2543.0, 1180.0, 610.0, 318.0, 165.0, 112.0, 67.0, 55.0, 30.0, 23.0, 17.0, 19.0, 17.0, 8.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5601348876953125, -1.517730712890625, -1.4753265380859375, -1.43292236328125, -1.3905181884765625, -1.348114013671875, -1.3057098388671875, -1.2633056640625, -1.2209014892578125, -1.178497314453125, -1.1360931396484375, -1.09368896484375, -1.0512847900390625, -1.008880615234375, -0.9664764404296875, -0.924072265625, -0.8816680908203125, -0.839263916015625, -0.7968597412109375, -0.75445556640625, -0.7120513916015625, -0.669647216796875, -0.6272430419921875, -0.5848388671875, -0.5424346923828125, -0.500030517578125, -0.4576263427734375, -0.41522216796875, -0.3728179931640625, -0.330413818359375, -0.2880096435546875, -0.24560546875, -0.2032012939453125, -0.160797119140625, -0.1183929443359375, -0.07598876953125, -0.0335845947265625, 0.008819580078125, 0.0512237548828125, 0.0936279296875, 0.1360321044921875, 0.178436279296875, 0.2208404541015625, 0.26324462890625, 0.3056488037109375, 0.348052978515625, 0.3904571533203125, 0.432861328125, 0.4752655029296875, 0.517669677734375, 0.5600738525390625, 0.60247802734375, 0.6448822021484375, 0.687286376953125, 0.7296905517578125, 0.7720947265625, 0.8144989013671875, 0.856903076171875, 0.8993072509765625, 0.94171142578125, 0.9841156005859375, 1.026519775390625, 1.0689239501953125, 1.111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 11.0, 11.0, 15.0, 11.0, 27.0, 44.0, 101.0, 232.0, 715.0, 1612.0, 779.0, 259.0, 109.0, 52.0, 35.0, 19.0, 14.0, 8.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.019561767578125, -1.94342041015625, -1.867279052734375, -1.7911376953125, -1.714996337890625, -1.63885498046875, -1.562713623046875, -1.486572265625, -1.410430908203125, -1.33428955078125, -1.258148193359375, -1.1820068359375, -1.105865478515625, -1.02972412109375, -0.953582763671875, -0.87744140625, -0.801300048828125, -0.72515869140625, -0.649017333984375, -0.5728759765625, -0.496734619140625, -0.42059326171875, -0.344451904296875, -0.268310546875, -0.192169189453125, -0.11602783203125, -0.039886474609375, 0.0362548828125, 0.112396240234375, 0.18853759765625, 0.264678955078125, 0.3408203125, 0.416961669921875, 0.49310302734375, 0.569244384765625, 0.6453857421875, 0.721527099609375, 0.79766845703125, 0.873809814453125, 0.949951171875, 1.026092529296875, 1.10223388671875, 1.178375244140625, 1.2545166015625, 1.330657958984375, 1.40679931640625, 1.482940673828125, 1.55908203125, 1.635223388671875, 1.71136474609375, 1.787506103515625, 1.8636474609375, 1.939788818359375, 2.01593017578125, 2.092071533203125, 2.168212890625, 2.244354248046875, 2.32049560546875, 2.396636962890625, 2.4727783203125, 2.548919677734375, 2.62506103515625, 2.701202392578125, 2.77734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 15.0, 74.0, 202.0, 395.0, 214.0, 68.0, 10.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.139007568359375, -8.419883728027344, -7.700760841369629, -6.981637001037598, -6.262513637542725, -5.543390274047852, -4.82426643371582, -4.105143070220947, -3.386019706726074, -2.666896343231201, -1.947772741317749, -1.2286491394042969, -0.5095257759094238, 0.20959758758544922, 0.9287214279174805, 1.6478447914123535, 2.3669681549072266, 3.0860915184020996, 3.8052151203155518, 4.524338722229004, 5.243462085723877, 5.96258544921875, 6.681709289550781, 7.400832653045654, 8.119956016540527, 8.839079856872559, 9.558202743530273, 10.277326583862305, 10.996450424194336, 11.71557331085205, 12.434697151184082, 13.153820037841797, 13.872943878173828, 14.59206771850586, 15.311190605163574, 16.030315399169922, 16.74943733215332, 17.46856117248535, 18.187685012817383, 18.906808853149414, 19.625930786132812, 20.345054626464844, 21.064178466796875, 21.783302307128906, 22.502424240112305, 23.221548080444336, 23.940671920776367, 24.6597957611084, 25.37891960144043, 26.09804344177246, 26.817167282104492, 27.53628921508789, 28.255413055419922, 28.974536895751953, 29.693660736083984, 30.412784576416016, 31.131908416748047, 31.851032257080078, 32.57015609741211, 33.28927993774414, 34.00840377807617, 34.72752380371094, 35.44664764404297, 36.165771484375, 36.88489532470703]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 16.0, 22.0, 27.0, 24.0, 44.0, 42.0, 59.0, 77.0, 72.0, 84.0, 76.0, 64.0, 75.0, 76.0, 64.0, 41.0, 37.0, 26.0, 21.0, 10.0, 9.0, 5.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.655929565429688, -12.301444053649902, -11.946958541870117, -11.592473983764648, -11.237988471984863, -10.883502960205078, -10.529017448425293, -10.174531936645508, -9.820047378540039, -9.465561866760254, -9.111076354980469, -8.756591796875, -8.402106285095215, -8.04762077331543, -7.6931352615356445, -7.338650226593018, -6.984164714813232, -6.629679203033447, -6.27519416809082, -5.920708656311035, -5.566223621368408, -5.211738109588623, -4.857253074645996, -4.502767562866211, -4.148282051086426, -3.7937967777252197, -3.4393115043640137, -3.0848259925842285, -2.7303409576416016, -2.3758554458618164, -2.0213701725006104, -1.6668848991394043, -1.3123998641967773, -0.9579145908355713, -0.6034292578697205, -0.24894392490386963, 0.10554134845733643, 0.4600266218185425, 0.8145120143890381, 1.1689972877502441, 1.5234825611114502, 1.8779678344726562, 2.2324531078338623, 2.5869383811950684, 2.9414238929748535, 3.2959089279174805, 3.6503944396972656, 4.004879951477051, 4.359364986419678, 4.713850498199463, 5.06833553314209, 5.422821044921875, 5.777306079864502, 6.131791591644287, 6.486276626586914, 6.840762138366699, 7.195247650146484, 7.5497331619262695, 7.9042181968688965, 8.258703231811523, 8.613188743591309, 8.967674255371094, 9.322159767150879, 9.676645278930664, 10.031129837036133]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 2.0, 3.0, 2.0, 18.0, 14.0, 32.0, 47.0, 85.0, 164.0, 349.0, 892.0, 2569.0, 8680.0, 33981.0, 164932.0, 543651.0, 230792.0, 45940.0, 11031.0, 3357.0, 1103.0, 450.0, 202.0, 91.0, 49.0, 45.0, 18.0, 10.0, 7.0, 11.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.7682647705078125, -1.712310791015625, -1.6563568115234375, -1.60040283203125, -1.5444488525390625, -1.488494873046875, -1.4325408935546875, -1.3765869140625, -1.3206329345703125, -1.264678955078125, -1.2087249755859375, -1.15277099609375, -1.0968170166015625, -1.040863037109375, -0.9849090576171875, -0.928955078125, -0.8730010986328125, -0.817047119140625, -0.7610931396484375, -0.70513916015625, -0.6491851806640625, -0.593231201171875, -0.5372772216796875, -0.4813232421875, -0.4253692626953125, -0.369415283203125, -0.3134613037109375, -0.25750732421875, -0.2015533447265625, -0.145599365234375, -0.0896453857421875, -0.03369140625, 0.0222625732421875, 0.078216552734375, 0.1341705322265625, 0.19012451171875, 0.2460784912109375, 0.302032470703125, 0.3579864501953125, 0.4139404296875, 0.4698944091796875, 0.525848388671875, 0.5818023681640625, 0.63775634765625, 0.6937103271484375, 0.749664306640625, 0.8056182861328125, 0.861572265625, 0.9175262451171875, 0.973480224609375, 1.0294342041015625, 1.08538818359375, 1.1413421630859375, 1.197296142578125, 1.2532501220703125, 1.3092041015625, 1.3651580810546875, 1.421112060546875, 1.4770660400390625, 1.53302001953125, 1.5889739990234375, 1.644927978515625, 1.7008819580078125, 1.7568359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 18.0, 32.0, 33.0, 51.0, 83.0, 86.0, 86.0, 97.0, 82.0, 101.0, 81.0, 55.0, 51.0, 53.0, 32.0, 19.0, 11.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.9130859375, -1.8723526000976562, -1.8316192626953125, -1.7908859252929688, -1.750152587890625, -1.7094192504882812, -1.6686859130859375, -1.6279525756835938, -1.58721923828125, -1.5464859008789062, -1.5057525634765625, -1.4650192260742188, -1.424285888671875, -1.3835525512695312, -1.3428192138671875, -1.3020858764648438, -1.2613525390625, -1.2206192016601562, -1.1798858642578125, -1.1391525268554688, -1.098419189453125, -1.0576858520507812, -1.0169525146484375, -0.9762191772460938, -0.93548583984375, -0.8947525024414062, -0.8540191650390625, -0.8132858276367188, -0.772552490234375, -0.7318191528320312, -0.6910858154296875, -0.6503524780273438, -0.609619140625, -0.5688858032226562, -0.5281524658203125, -0.48741912841796875, -0.446685791015625, -0.40595245361328125, -0.3652191162109375, -0.32448577880859375, -0.28375244140625, -0.24301910400390625, -0.2022857666015625, -0.16155242919921875, -0.120819091796875, -0.08008575439453125, -0.0393524169921875, 0.00138092041015625, 0.0421142578125, 0.08284759521484375, 0.1235809326171875, 0.16431427001953125, 0.205047607421875, 0.24578094482421875, 0.2865142822265625, 0.32724761962890625, 0.36798095703125, 0.40871429443359375, 0.4494476318359375, 0.49018096923828125, 0.530914306640625, 0.5716476440429688, 0.6123809814453125, 0.6531143188476562, 0.69384765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 8.0, 18.0, 8.0, 27.0, 25.0, 47.0, 64.0, 122.0, 192.0, 363.0, 796.0, 2127.0, 7391.0, 40943.0, 377295.0, 550779.0, 54909.0, 9010.0, 2487.0, 888.0, 429.0, 215.0, 125.0, 91.0, 61.0, 36.0, 20.0, 16.0, 11.0, 8.0, 3.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0859375, -2.016571044921875, -1.94720458984375, -1.877838134765625, -1.8084716796875, -1.739105224609375, -1.66973876953125, -1.600372314453125, -1.531005859375, -1.461639404296875, -1.39227294921875, -1.322906494140625, -1.2535400390625, -1.184173583984375, -1.11480712890625, -1.045440673828125, -0.97607421875, -0.906707763671875, -0.83734130859375, -0.767974853515625, -0.6986083984375, -0.629241943359375, -0.55987548828125, -0.490509033203125, -0.421142578125, -0.351776123046875, -0.28240966796875, -0.213043212890625, -0.1436767578125, -0.074310302734375, -0.00494384765625, 0.064422607421875, 0.1337890625, 0.203155517578125, 0.27252197265625, 0.341888427734375, 0.4112548828125, 0.480621337890625, 0.54998779296875, 0.619354248046875, 0.688720703125, 0.758087158203125, 0.82745361328125, 0.896820068359375, 0.9661865234375, 1.035552978515625, 1.10491943359375, 1.174285888671875, 1.24365234375, 1.313018798828125, 1.38238525390625, 1.451751708984375, 1.5211181640625, 1.590484619140625, 1.65985107421875, 1.729217529296875, 1.798583984375, 1.867950439453125, 1.93731689453125, 2.006683349609375, 2.0760498046875, 2.145416259765625, 2.21478271484375, 2.284149169921875, 2.353515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 7.0, 4.0, 5.0, 9.0, 6.0, 5.0, 14.0, 17.0, 26.0, 38.0, 53.0, 42.0, 48.0, 54.0, 46.0, 50.0, 48.0, 48.0, 71.0, 54.0, 44.0, 52.0, 47.0, 50.0, 21.0, 26.0, 23.0, 20.0, 15.0, 10.0, 9.0, 7.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.837890625, -2.74639892578125, -2.6549072265625, -2.56341552734375, -2.471923828125, -2.38043212890625, -2.2889404296875, -2.19744873046875, -2.10595703125, -2.01446533203125, -1.9229736328125, -1.83148193359375, -1.739990234375, -1.64849853515625, -1.5570068359375, -1.46551513671875, -1.3740234375, -1.28253173828125, -1.1910400390625, -1.09954833984375, -1.008056640625, -0.91656494140625, -0.8250732421875, -0.73358154296875, -0.64208984375, -0.55059814453125, -0.4591064453125, -0.36761474609375, -0.276123046875, -0.18463134765625, -0.0931396484375, -0.00164794921875, 0.08984375, 0.18133544921875, 0.2728271484375, 0.36431884765625, 0.455810546875, 0.54730224609375, 0.6387939453125, 0.73028564453125, 0.82177734375, 0.91326904296875, 1.0047607421875, 1.09625244140625, 1.187744140625, 1.27923583984375, 1.3707275390625, 1.46221923828125, 1.5537109375, 1.64520263671875, 1.7366943359375, 1.82818603515625, 1.919677734375, 2.01116943359375, 2.1026611328125, 2.19415283203125, 2.28564453125, 2.37713623046875, 2.4686279296875, 2.56011962890625, 2.651611328125, 2.74310302734375, 2.8345947265625, 2.92608642578125, 3.017578125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 10.0, 14.0, 12.0, 23.0, 37.0, 59.0, 112.0, 210.0, 526.0, 1708.0, 9588.0, 565000.0, 459438.0, 9205.0, 1544.0, 527.0, 225.0, 110.0, 78.0, 32.0, 27.0, 15.0, 14.0, 7.0, 8.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5693359375, -1.5202789306640625, -1.471221923828125, -1.4221649169921875, -1.37310791015625, -1.3240509033203125, -1.274993896484375, -1.2259368896484375, -1.1768798828125, -1.1278228759765625, -1.078765869140625, -1.0297088623046875, -0.98065185546875, -0.9315948486328125, -0.882537841796875, -0.8334808349609375, -0.784423828125, -0.7353668212890625, -0.686309814453125, -0.6372528076171875, -0.58819580078125, -0.5391387939453125, -0.490081787109375, -0.4410247802734375, -0.3919677734375, -0.3429107666015625, -0.293853759765625, -0.2447967529296875, -0.19573974609375, -0.1466827392578125, -0.097625732421875, -0.0485687255859375, 0.00048828125, 0.0495452880859375, 0.098602294921875, 0.1476593017578125, 0.19671630859375, 0.2457733154296875, 0.294830322265625, 0.3438873291015625, 0.3929443359375, 0.4420013427734375, 0.491058349609375, 0.5401153564453125, 0.58917236328125, 0.6382293701171875, 0.687286376953125, 0.7363433837890625, 0.785400390625, 0.8344573974609375, 0.883514404296875, 0.9325714111328125, 0.98162841796875, 1.0306854248046875, 1.079742431640625, 1.1287994384765625, 1.1778564453125, 1.2269134521484375, 1.275970458984375, 1.3250274658203125, 1.37408447265625, 1.4231414794921875, 1.472198486328125, 1.5212554931640625, 1.5703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 7.0, 16.0, 13.0, 23.0, 42.0, 62.0, 98.0, 128.0, 145.0, 128.0, 125.0, 64.0, 50.0, 39.0, 22.0, 8.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011301040649414062, -0.00010727345943450928, -0.00010153651237487793, -9.579956531524658e-05, -9.006261825561523e-05, -8.432567119598389e-05, -7.858872413635254e-05, -7.285177707672119e-05, -6.711483001708984e-05, -6.13778829574585e-05, -5.564093589782715e-05, -4.99039888381958e-05, -4.416704177856445e-05, -3.8430094718933105e-05, -3.269314765930176e-05, -2.695620059967041e-05, -2.1219253540039062e-05, -1.5482306480407715e-05, -9.745359420776367e-06, -4.0084123611450195e-06, 1.7285346984863281e-06, 7.465481758117676e-06, 1.3202428817749023e-05, 1.893937587738037e-05, 2.467632293701172e-05, 3.0413269996643066e-05, 3.6150217056274414e-05, 4.188716411590576e-05, 4.762411117553711e-05, 5.336105823516846e-05, 5.9098005294799805e-05, 6.483495235443115e-05, 7.05718994140625e-05, 7.630884647369385e-05, 8.20457935333252e-05, 8.778274059295654e-05, 9.351968765258789e-05, 9.925663471221924e-05, 0.00010499358177185059, 0.00011073052883148193, 0.00011646747589111328, 0.00012220442295074463, 0.00012794137001037598, 0.00013367831707000732, 0.00013941526412963867, 0.00014515221118927002, 0.00015088915824890137, 0.00015662610530853271, 0.00016236305236816406, 0.0001680999994277954, 0.00017383694648742676, 0.0001795738935470581, 0.00018531084060668945, 0.0001910477876663208, 0.00019678473472595215, 0.0002025216817855835, 0.00020825862884521484, 0.0002139955759048462, 0.00021973252296447754, 0.0002254694700241089, 0.00023120641708374023, 0.00023694336414337158, 0.00024268031120300293, 0.0002484172582626343, 0.0002541542053222656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 9.0, 10.0, 17.0, 24.0, 40.0, 59.0, 94.0, 173.0, 283.0, 592.0, 1361.0, 3983.0, 17625.0, 186901.0, 745614.0, 77096.0, 9967.0, 2525.0, 1057.0, 449.0, 259.0, 147.0, 93.0, 39.0, 40.0, 24.0, 17.0, 11.0, 10.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74609375, -0.7222824096679688, -0.6984710693359375, -0.6746597290039062, -0.650848388671875, -0.6270370483398438, -0.6032257080078125, -0.5794143676757812, -0.55560302734375, -0.5317916870117188, -0.5079803466796875, -0.48416900634765625, -0.460357666015625, -0.43654632568359375, -0.4127349853515625, -0.38892364501953125, -0.3651123046875, -0.34130096435546875, -0.3174896240234375, -0.29367828369140625, -0.269866943359375, -0.24605560302734375, -0.2222442626953125, -0.19843292236328125, -0.17462158203125, -0.15081024169921875, -0.1269989013671875, -0.10318756103515625, -0.079376220703125, -0.05556488037109375, -0.0317535400390625, -0.00794219970703125, 0.015869140625, 0.03968048095703125, 0.0634918212890625, 0.08730316162109375, 0.111114501953125, 0.13492584228515625, 0.1587371826171875, 0.18254852294921875, 0.20635986328125, 0.23017120361328125, 0.2539825439453125, 0.27779388427734375, 0.301605224609375, 0.32541656494140625, 0.3492279052734375, 0.37303924560546875, 0.3968505859375, 0.42066192626953125, 0.4444732666015625, 0.46828460693359375, 0.492095947265625, 0.5159072875976562, 0.5397186279296875, 0.5635299682617188, 0.58734130859375, 0.6111526489257812, 0.6349639892578125, 0.6587753295898438, 0.682586669921875, 0.7063980102539062, 0.7302093505859375, 0.7540206909179688, 0.77783203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 15.0, 28.0, 26.0, 38.0, 67.0, 75.0, 104.0, 106.0, 112.0, 85.0, 88.0, 58.0, 50.0, 44.0, 27.0, 19.0, 12.0, 13.0, 4.0, 8.0, 4.0, 0.0, 2.0], "bins": [-1.234375, -1.2091712951660156, -1.1839675903320312, -1.1587638854980469, -1.1335601806640625, -1.1083564758300781, -1.0831527709960938, -1.0579490661621094, -1.032745361328125, -1.0075416564941406, -0.9823379516601562, -0.9571342468261719, -0.9319305419921875, -0.9067268371582031, -0.8815231323242188, -0.8563194274902344, -0.83111572265625, -0.8059120178222656, -0.7807083129882812, -0.7555046081542969, -0.7303009033203125, -0.7050971984863281, -0.6798934936523438, -0.6546897888183594, -0.629486083984375, -0.6042823791503906, -0.5790786743164062, -0.5538749694824219, -0.5286712646484375, -0.5034675598144531, -0.47826385498046875, -0.4530601501464844, -0.4278564453125, -0.4026527404785156, -0.37744903564453125, -0.3522453308105469, -0.3270416259765625, -0.3018379211425781, -0.27663421630859375, -0.2514305114746094, -0.226226806640625, -0.20102310180664062, -0.17581939697265625, -0.15061569213867188, -0.1254119873046875, -0.10020828247070312, -0.07500457763671875, -0.049800872802734375, -0.02459716796875, 0.000606536865234375, 0.02581024169921875, 0.051013946533203125, 0.0762176513671875, 0.10142135620117188, 0.12662506103515625, 0.15182876586914062, 0.177032470703125, 0.20223617553710938, 0.22743988037109375, 0.2526435852050781, 0.2778472900390625, 0.3030509948730469, 0.32825469970703125, 0.3534584045410156, 0.378662109375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 5.0, 9.0, 17.0, 48.0, 161.0, 280.0, 283.0, 104.0, 65.0, 15.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75192642211914, -17.998106002807617, -17.244285583496094, -16.490463256835938, -15.736642837524414, -14.98282241821289, -14.229001998901367, -13.475181579589844, -12.721360206604004, -11.96753978729248, -11.21371841430664, -10.459897994995117, -9.706077575683594, -8.952256202697754, -8.19843578338623, -7.444614887237549, -6.690793991088867, -5.9369730949401855, -5.183152198791504, -4.4293317794799805, -3.675510883331299, -2.921689987182617, -2.1678695678710938, -1.414048671722412, -0.6602277755737305, 0.09359300136566162, 0.8474137783050537, 1.6012344360351562, 2.355055332183838, 3.1088762283325195, 3.862696647644043, 4.616517543792725, 5.370340347290039, 6.124161243438721, 6.877982139587402, 7.631802558898926, 8.385623931884766, 9.139444351196289, 9.893264770507812, 10.647085189819336, 11.400906562805176, 12.1547269821167, 12.908548355102539, 13.662368774414062, 14.416189193725586, 15.170010566711426, 15.92383098602295, 16.67765235900879, 17.431472778320312, 18.185293197631836, 18.93911361694336, 19.692935943603516, 20.44675636291504, 21.200576782226562, 21.954397201538086, 22.70821762084961, 23.462039947509766, 24.21586036682129, 24.969680786132812, 25.72350311279297, 26.477323532104492, 27.231143951416016, 27.98496437072754, 28.738784790039062, 29.492605209350586]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 8.0, 4.0, 9.0, 7.0, 17.0, 16.0, 28.0, 31.0, 28.0, 44.0, 53.0, 53.0, 67.0, 72.0, 83.0, 74.0, 70.0, 59.0, 58.0, 37.0, 36.0, 35.0, 30.0, 26.0, 8.0, 11.0, 15.0, 14.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953275680541992, -8.501081466674805, -8.0488862991333, -7.596692085266113, -7.144497394561768, -6.692302703857422, -6.240108489990234, -5.787913799285889, -5.335719108581543, -4.883524417877197, -4.43133020401001, -3.979135513305664, -3.5269408226013184, -3.0747463703155518, -2.622551918029785, -2.1703572273254395, -1.718163013458252, -1.2659684419631958, -0.8137739300727844, -0.36157941818237305, 0.0906151533126831, 0.5428097248077393, 0.9950041770935059, 1.4471988677978516, 1.8993933200836182, 2.3515877723693848, 2.8037824630737305, 3.255976915359497, 3.7081713676452637, 4.160366058349609, 4.612560272216797, 5.064755439758301, 5.516949653625488, 5.969144344329834, 6.4213385581970215, 6.873533248901367, 7.325727939605713, 7.777922630310059, 8.230116844177246, 8.68231201171875, 9.134506225585938, 9.586700439453125, 10.038895606994629, 10.491089820861816, 10.943284034729004, 11.395479202270508, 11.847673416137695, 12.299867630004883, 12.75206184387207, 13.204256057739258, 13.656451225280762, 14.10864543914795, 14.560839653015137, 15.01303482055664, 15.465229034423828, 15.917423248291016, 16.369619369506836, 16.821813583374023, 17.27400779724121, 17.72620391845703, 18.17839813232422, 18.630592346191406, 19.082786560058594, 19.53498077392578, 19.98717498779297]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 10.0, 24.0, 37.0, 68.0, 102.0, 231.0, 460.0, 1045.0, 3947.0, 25884.0, 621143.0, 3386182.0, 139648.0, 11885.0, 2257.0, 705.0, 289.0, 144.0, 76.0, 50.0, 35.0, 9.0, 15.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7392578125, -1.69500732421875, -1.6507568359375, -1.60650634765625, -1.562255859375, -1.51800537109375, -1.4737548828125, -1.42950439453125, -1.38525390625, -1.34100341796875, -1.2967529296875, -1.25250244140625, -1.208251953125, -1.16400146484375, -1.1197509765625, -1.07550048828125, -1.03125, -0.98699951171875, -0.9427490234375, -0.89849853515625, -0.854248046875, -0.80999755859375, -0.7657470703125, -0.72149658203125, -0.67724609375, -0.63299560546875, -0.5887451171875, -0.54449462890625, -0.500244140625, -0.45599365234375, -0.4117431640625, -0.36749267578125, -0.3232421875, -0.27899169921875, -0.2347412109375, -0.19049072265625, -0.146240234375, -0.10198974609375, -0.0577392578125, -0.01348876953125, 0.03076171875, 0.07501220703125, 0.1192626953125, 0.16351318359375, 0.207763671875, 0.25201416015625, 0.2962646484375, 0.34051513671875, 0.384765625, 0.42901611328125, 0.4732666015625, 0.51751708984375, 0.561767578125, 0.60601806640625, 0.6502685546875, 0.69451904296875, 0.73876953125, 0.78302001953125, 0.8272705078125, 0.87152099609375, 0.915771484375, 0.96002197265625, 1.0042724609375, 1.04852294921875, 1.0927734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 13.0, 18.0, 19.0, 33.0, 31.0, 36.0, 38.0, 36.0, 55.0, 47.0, 47.0, 51.0, 54.0, 48.0, 49.0, 56.0, 49.0, 56.0, 43.0, 37.0, 35.0, 28.0, 18.0, 31.0, 17.0, 11.0, 10.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.572967529296875, -0.55316162109375, -0.533355712890625, -0.5135498046875, -0.493743896484375, -0.47393798828125, -0.454132080078125, -0.434326171875, -0.414520263671875, -0.39471435546875, -0.374908447265625, -0.3551025390625, -0.335296630859375, -0.31549072265625, -0.295684814453125, -0.27587890625, -0.256072998046875, -0.23626708984375, -0.216461181640625, -0.1966552734375, -0.176849365234375, -0.15704345703125, -0.137237548828125, -0.117431640625, -0.097625732421875, -0.07781982421875, -0.058013916015625, -0.0382080078125, -0.018402099609375, 0.00140380859375, 0.021209716796875, 0.041015625, 0.060821533203125, 0.08062744140625, 0.100433349609375, 0.1202392578125, 0.140045166015625, 0.15985107421875, 0.179656982421875, 0.199462890625, 0.219268798828125, 0.23907470703125, 0.258880615234375, 0.2786865234375, 0.298492431640625, 0.31829833984375, 0.338104248046875, 0.35791015625, 0.377716064453125, 0.39752197265625, 0.417327880859375, 0.4371337890625, 0.456939697265625, 0.47674560546875, 0.496551513671875, 0.516357421875, 0.536163330078125, 0.55596923828125, 0.575775146484375, 0.5955810546875, 0.615386962890625, 0.63519287109375, 0.654998779296875, 0.6748046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 9.0, 8.0, 15.0, 13.0, 34.0, 62.0, 92.0, 188.0, 392.0, 997.0, 2714.0, 10792.0, 76243.0, 2502734.0, 1524890.0, 59993.0, 10311.0, 2849.0, 993.0, 462.0, 200.0, 116.0, 55.0, 46.0, 13.0, 15.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.6796875, -1.63421630859375, -1.5887451171875, -1.54327392578125, -1.497802734375, -1.45233154296875, -1.4068603515625, -1.36138916015625, -1.31591796875, -1.27044677734375, -1.2249755859375, -1.17950439453125, -1.134033203125, -1.08856201171875, -1.0430908203125, -0.99761962890625, -0.9521484375, -0.90667724609375, -0.8612060546875, -0.81573486328125, -0.770263671875, -0.72479248046875, -0.6793212890625, -0.63385009765625, -0.58837890625, -0.54290771484375, -0.4974365234375, -0.45196533203125, -0.406494140625, -0.36102294921875, -0.3155517578125, -0.27008056640625, -0.224609375, -0.17913818359375, -0.1336669921875, -0.08819580078125, -0.042724609375, 0.00274658203125, 0.0482177734375, 0.09368896484375, 0.13916015625, 0.18463134765625, 0.2301025390625, 0.27557373046875, 0.321044921875, 0.36651611328125, 0.4119873046875, 0.45745849609375, 0.5029296875, 0.54840087890625, 0.5938720703125, 0.63934326171875, 0.684814453125, 0.73028564453125, 0.7757568359375, 0.82122802734375, 0.86669921875, 0.91217041015625, 0.9576416015625, 1.00311279296875, 1.048583984375, 1.09405517578125, 1.1395263671875, 1.18499755859375, 1.23046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 11.0, 7.0, 16.0, 18.0, 36.0, 79.0, 109.0, 210.0, 468.0, 1022.0, 944.0, 552.0, 258.0, 137.0, 69.0, 50.0, 25.0, 11.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.8576202392578125, -1.803131103515625, -1.7486419677734375, -1.69415283203125, -1.6396636962890625, -1.585174560546875, -1.5306854248046875, -1.4761962890625, -1.4217071533203125, -1.367218017578125, -1.3127288818359375, -1.25823974609375, -1.2037506103515625, -1.149261474609375, -1.0947723388671875, -1.040283203125, -0.9857940673828125, -0.931304931640625, -0.8768157958984375, -0.82232666015625, -0.7678375244140625, -0.713348388671875, -0.6588592529296875, -0.6043701171875, -0.5498809814453125, -0.495391845703125, -0.4409027099609375, -0.38641357421875, -0.3319244384765625, -0.277435302734375, -0.2229461669921875, -0.16845703125, -0.1139678955078125, -0.059478759765625, -0.0049896240234375, 0.04949951171875, 0.1039886474609375, 0.158477783203125, 0.2129669189453125, 0.2674560546875, 0.3219451904296875, 0.376434326171875, 0.4309234619140625, 0.48541259765625, 0.5399017333984375, 0.594390869140625, 0.6488800048828125, 0.703369140625, 0.7578582763671875, 0.812347412109375, 0.8668365478515625, 0.92132568359375, 0.9758148193359375, 1.030303955078125, 1.0847930908203125, 1.1392822265625, 1.1937713623046875, 1.248260498046875, 1.3027496337890625, 1.35723876953125, 1.4117279052734375, 1.466217041015625, 1.5207061767578125, 1.5751953125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 12.0, 30.0, 103.0, 172.0, 225.0, 200.0, 122.0, 51.0, 33.0, 11.0, 10.0, 11.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3109540939331055, -6.874582290649414, -6.438210487365723, -6.001838684082031, -5.56546688079834, -5.129095077514648, -4.692722797393799, -4.256350994110107, -3.819979190826416, -3.3836073875427246, -2.947235584259033, -2.5108635425567627, -2.0744917392730713, -1.6381199359893799, -1.2017478942871094, -0.765376091003418, -0.32900428771972656, 0.10736757516860962, 0.5437394380569458, 0.9801113605499268, 1.4164831638336182, 1.8528549671173096, 2.28922700881958, 2.7255988121032715, 3.161970615386963, 3.5983424186706543, 4.034714221954346, 4.471086502075195, 4.907458305358887, 5.343830108642578, 5.7802019119262695, 6.216573715209961, 6.652944564819336, 7.089316368103027, 7.525688171386719, 7.96205997467041, 8.398431777954102, 8.834803581237793, 9.271175384521484, 9.707548141479492, 10.143918991088867, 10.580290794372559, 11.01666259765625, 11.453034400939941, 11.889406204223633, 12.325778007507324, 12.762149810791016, 13.198522567749023, 13.634894371032715, 14.071266174316406, 14.507637977600098, 14.944009780883789, 15.38038158416748, 15.816753387451172, 16.25312614440918, 16.689496994018555, 17.125869750976562, 17.56224250793457, 17.998613357543945, 18.434986114501953, 18.871356964111328, 19.307729721069336, 19.74410057067871, 20.18047332763672, 20.616844177246094]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 10.0, 6.0, 6.0, 9.0, 12.0, 13.0, 21.0, 16.0, 21.0, 22.0, 27.0, 26.0, 31.0, 42.0, 34.0, 41.0, 44.0, 32.0, 58.0, 48.0, 55.0, 46.0, 41.0, 46.0, 46.0, 35.0, 30.0, 31.0, 29.0, 17.0, 20.0, 14.0, 16.0, 10.0, 14.0, 7.0, 6.0, 9.0, 4.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.850091934204102, -5.671099662780762, -5.492107391357422, -5.313115119934082, -5.134122371673584, -4.955130100250244, -4.776137828826904, -4.5971455574035645, -4.418152809143066, -4.239160537719727, -4.060168266296387, -3.8811757564544678, -3.702183246612549, -3.523190975189209, -3.344198703765869, -3.1652064323425293, -2.9862141609191895, -2.8072218894958496, -2.6282293796539307, -2.449237108230591, -2.270244598388672, -2.091252326965332, -1.9122600555419922, -1.7332676649093628, -1.5542752742767334, -1.375282883644104, -1.1962904930114746, -1.0172982215881348, -0.8383058309555054, -0.659313440322876, -0.48032116889953613, -0.30132877826690674, -0.12233638763427734, 0.05665597319602966, 0.23564833402633667, 0.4146406650543213, 0.5936330556869507, 0.7726254463195801, 0.9516177177429199, 1.1306101083755493, 1.3096024990081787, 1.488594889640808, 1.6675872802734375, 1.8465795516967773, 2.025571823120117, 2.204564332962036, 2.383556604385376, 2.562549114227295, 2.7415413856506348, 2.9205336570739746, 3.0995261669158936, 3.2785184383392334, 3.4575109481811523, 3.636503219604492, 3.815495491027832, 3.994487762451172, 4.173480033874512, 4.352472305297852, 4.531464576721191, 4.710456848144531, 4.889449596405029, 5.068441867828369, 5.247434139251709, 5.426426410675049, 5.605419158935547]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 12.0, 21.0, 29.0, 51.0, 115.0, 213.0, 314.0, 675.0, 1336.0, 2883.0, 6537.0, 16148.0, 40476.0, 98210.0, 217178.0, 310172.0, 201783.0, 90096.0, 36360.0, 14616.0, 6058.0, 2641.0, 1238.0, 633.0, 316.0, 183.0, 107.0, 59.0, 29.0, 15.0, 9.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.622039794921875, -0.59759521484375, -0.573150634765625, -0.5487060546875, -0.524261474609375, -0.49981689453125, -0.475372314453125, -0.450927734375, -0.426483154296875, -0.40203857421875, -0.377593994140625, -0.3531494140625, -0.328704833984375, -0.30426025390625, -0.279815673828125, -0.25537109375, -0.230926513671875, -0.20648193359375, -0.182037353515625, -0.1575927734375, -0.133148193359375, -0.10870361328125, -0.084259033203125, -0.059814453125, -0.035369873046875, -0.01092529296875, 0.013519287109375, 0.0379638671875, 0.062408447265625, 0.08685302734375, 0.111297607421875, 0.1357421875, 0.160186767578125, 0.18463134765625, 0.209075927734375, 0.2335205078125, 0.257965087890625, 0.28240966796875, 0.306854248046875, 0.331298828125, 0.355743408203125, 0.38018798828125, 0.404632568359375, 0.4290771484375, 0.453521728515625, 0.47796630859375, 0.502410888671875, 0.52685546875, 0.551300048828125, 0.57574462890625, 0.600189208984375, 0.6246337890625, 0.649078369140625, 0.67352294921875, 0.697967529296875, 0.722412109375, 0.746856689453125, 0.77130126953125, 0.795745849609375, 0.8201904296875, 0.844635009765625, 0.86907958984375, 0.893524169921875, 0.91796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 9.0, 11.0, 13.0, 14.0, 18.0, 32.0, 27.0, 28.0, 41.0, 41.0, 55.0, 40.0, 50.0, 50.0, 65.0, 68.0, 62.0, 38.0, 53.0, 62.0, 32.0, 42.0, 36.0, 25.0, 22.0, 24.0, 16.0, 5.0, 8.0, 2.0, 5.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5804443359375, -0.560302734375, -0.5401611328125, -0.52001953125, -0.4998779296875, -0.479736328125, -0.4595947265625, -0.439453125, -0.4193115234375, -0.399169921875, -0.3790283203125, -0.35888671875, -0.3387451171875, -0.318603515625, -0.2984619140625, -0.2783203125, -0.2581787109375, -0.238037109375, -0.2178955078125, -0.19775390625, -0.1776123046875, -0.157470703125, -0.1373291015625, -0.1171875, -0.0970458984375, -0.076904296875, -0.0567626953125, -0.03662109375, -0.0164794921875, 0.003662109375, 0.0238037109375, 0.0439453125, 0.0640869140625, 0.084228515625, 0.1043701171875, 0.12451171875, 0.1446533203125, 0.164794921875, 0.1849365234375, 0.205078125, 0.2252197265625, 0.245361328125, 0.2655029296875, 0.28564453125, 0.3057861328125, 0.325927734375, 0.3460693359375, 0.3662109375, 0.3863525390625, 0.406494140625, 0.4266357421875, 0.44677734375, 0.4669189453125, 0.487060546875, 0.5072021484375, 0.52734375, 0.5474853515625, 0.567626953125, 0.5877685546875, 0.60791015625, 0.6280517578125, 0.648193359375, 0.6683349609375, 0.6884765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 13.0, 31.0, 38.0, 64.0, 75.0, 111.0, 128.0, 230.0, 363.0, 538.0, 909.0, 1758.0, 4391.0, 17981.0, 137747.0, 708370.0, 147546.0, 19014.0, 4731.0, 1873.0, 934.0, 568.0, 321.0, 239.0, 154.0, 105.0, 83.0, 52.0, 43.0, 32.0, 22.0, 11.0, 15.0, 7.0, 6.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.587890625, -1.537506103515625, -1.48712158203125, -1.436737060546875, -1.3863525390625, -1.335968017578125, -1.28558349609375, -1.235198974609375, -1.184814453125, -1.134429931640625, -1.08404541015625, -1.033660888671875, -0.9832763671875, -0.932891845703125, -0.88250732421875, -0.832122802734375, -0.78173828125, -0.731353759765625, -0.68096923828125, -0.630584716796875, -0.5802001953125, -0.529815673828125, -0.47943115234375, -0.429046630859375, -0.378662109375, -0.328277587890625, -0.27789306640625, -0.227508544921875, -0.1771240234375, -0.126739501953125, -0.07635498046875, -0.025970458984375, 0.0244140625, 0.074798583984375, 0.12518310546875, 0.175567626953125, 0.2259521484375, 0.276336669921875, 0.32672119140625, 0.377105712890625, 0.427490234375, 0.477874755859375, 0.52825927734375, 0.578643798828125, 0.6290283203125, 0.679412841796875, 0.72979736328125, 0.780181884765625, 0.83056640625, 0.880950927734375, 0.93133544921875, 0.981719970703125, 1.0321044921875, 1.082489013671875, 1.13287353515625, 1.183258056640625, 1.233642578125, 1.284027099609375, 1.33441162109375, 1.384796142578125, 1.4351806640625, 1.485565185546875, 1.53594970703125, 1.586334228515625, 1.63671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 9.0, 7.0, 8.0, 8.0, 8.0, 22.0, 20.0, 18.0, 20.0, 18.0, 34.0, 38.0, 38.0, 33.0, 43.0, 60.0, 38.0, 46.0, 50.0, 55.0, 55.0, 37.0, 46.0, 37.0, 38.0, 38.0, 31.0, 20.0, 24.0, 21.0, 12.0, 15.0, 10.0, 8.0, 6.0, 5.0, 8.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.03515625, -1.971893310546875, -1.90863037109375, -1.845367431640625, -1.7821044921875, -1.718841552734375, -1.65557861328125, -1.592315673828125, -1.529052734375, -1.465789794921875, -1.40252685546875, -1.339263916015625, -1.2760009765625, -1.212738037109375, -1.14947509765625, -1.086212158203125, -1.02294921875, -0.959686279296875, -0.89642333984375, -0.833160400390625, -0.7698974609375, -0.706634521484375, -0.64337158203125, -0.580108642578125, -0.516845703125, -0.453582763671875, -0.39031982421875, -0.327056884765625, -0.2637939453125, -0.200531005859375, -0.13726806640625, -0.074005126953125, -0.0107421875, 0.052520751953125, 0.11578369140625, 0.179046630859375, 0.2423095703125, 0.305572509765625, 0.36883544921875, 0.432098388671875, 0.495361328125, 0.558624267578125, 0.62188720703125, 0.685150146484375, 0.7484130859375, 0.811676025390625, 0.87493896484375, 0.938201904296875, 1.00146484375, 1.064727783203125, 1.12799072265625, 1.191253662109375, 1.2545166015625, 1.317779541015625, 1.38104248046875, 1.444305419921875, 1.507568359375, 1.570831298828125, 1.63409423828125, 1.697357177734375, 1.7606201171875, 1.823883056640625, 1.88714599609375, 1.950408935546875, 2.013671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 9.0, 12.0, 25.0, 46.0, 159.0, 380.0, 1563.0, 11862.0, 802651.0, 224264.0, 6063.0, 1042.0, 272.0, 115.0, 28.0, 31.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.1324310302734375, -1.096893310546875, -1.0613555908203125, -1.02581787109375, -0.9902801513671875, -0.954742431640625, -0.9192047119140625, -0.8836669921875, -0.8481292724609375, -0.812591552734375, -0.7770538330078125, -0.74151611328125, -0.7059783935546875, -0.670440673828125, -0.6349029541015625, -0.599365234375, -0.5638275146484375, -0.528289794921875, -0.4927520751953125, -0.45721435546875, -0.4216766357421875, -0.386138916015625, -0.3506011962890625, -0.3150634765625, -0.2795257568359375, -0.243988037109375, -0.2084503173828125, -0.17291259765625, -0.1373748779296875, -0.101837158203125, -0.0662994384765625, -0.03076171875, 0.0047760009765625, 0.040313720703125, 0.0758514404296875, 0.11138916015625, 0.1469268798828125, 0.182464599609375, 0.2180023193359375, 0.2535400390625, 0.2890777587890625, 0.324615478515625, 0.3601531982421875, 0.39569091796875, 0.4312286376953125, 0.466766357421875, 0.5023040771484375, 0.537841796875, 0.5733795166015625, 0.608917236328125, 0.6444549560546875, 0.67999267578125, 0.7155303955078125, 0.751068115234375, 0.7866058349609375, 0.8221435546875, 0.8576812744140625, 0.893218994140625, 0.9287567138671875, 0.96429443359375, 0.9998321533203125, 1.035369873046875, 1.0709075927734375, 1.1064453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 15.0, 34.0, 28.0, 41.0, 66.0, 75.0, 115.0, 147.0, 135.0, 109.0, 62.0, 54.0, 23.0, 24.0, 18.0, 10.0, 10.0, 12.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00021088123321533203, -0.00020604953169822693, -0.00020121783018112183, -0.00019638612866401672, -0.00019155442714691162, -0.00018672272562980652, -0.00018189102411270142, -0.0001770593225955963, -0.0001722276210784912, -0.0001673959195613861, -0.000162564218044281, -0.0001577325165271759, -0.0001529008150100708, -0.0001480691134929657, -0.0001432374119758606, -0.0001384057104587555, -0.0001335740089416504, -0.0001287423074245453, -0.00012391060590744019, -0.00011907890439033508, -0.00011424720287322998, -0.00010941550135612488, -0.00010458379983901978, -9.975209832191467e-05, -9.492039680480957e-05, -9.008869528770447e-05, -8.525699377059937e-05, -8.042529225349426e-05, -7.559359073638916e-05, -7.076188921928406e-05, -6.593018770217896e-05, -6.109848618507385e-05, -5.626678466796875e-05, -5.143508315086365e-05, -4.6603381633758545e-05, -4.177168011665344e-05, -3.693997859954834e-05, -3.210827708244324e-05, -2.7276575565338135e-05, -2.2444874048233032e-05, -1.761317253112793e-05, -1.2781471014022827e-05, -7.949769496917725e-06, -3.118067979812622e-06, 1.7136335372924805e-06, 6.545335054397583e-06, 1.1377036571502686e-05, 1.6208738088607788e-05, 2.104043960571289e-05, 2.5872141122817993e-05, 3.0703842639923096e-05, 3.55355441570282e-05, 4.03672456741333e-05, 4.51989471912384e-05, 5.0030648708343506e-05, 5.486235022544861e-05, 5.969405174255371e-05, 6.452575325965881e-05, 6.935745477676392e-05, 7.418915629386902e-05, 7.902085781097412e-05, 8.385255932807922e-05, 8.868426084518433e-05, 9.351596236228943e-05, 9.834766387939453e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 7.0, 12.0, 18.0, 24.0, 51.0, 80.0, 127.0, 223.0, 491.0, 1240.0, 3998.0, 20399.0, 313299.0, 668291.0, 32295.0, 5216.0, 1524.0, 591.0, 268.0, 144.0, 83.0, 50.0, 37.0, 23.0, 11.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5697784423828125, -0.550201416015625, -0.5306243896484375, -0.51104736328125, -0.4914703369140625, -0.471893310546875, -0.4523162841796875, -0.4327392578125, -0.4131622314453125, -0.393585205078125, -0.3740081787109375, -0.35443115234375, -0.3348541259765625, -0.315277099609375, -0.2957000732421875, -0.276123046875, -0.2565460205078125, -0.236968994140625, -0.2173919677734375, -0.19781494140625, -0.1782379150390625, -0.158660888671875, -0.1390838623046875, -0.1195068359375, -0.0999298095703125, -0.080352783203125, -0.0607757568359375, -0.04119873046875, -0.0216217041015625, -0.002044677734375, 0.0175323486328125, 0.037109375, 0.0566864013671875, 0.076263427734375, 0.0958404541015625, 0.11541748046875, 0.1349945068359375, 0.154571533203125, 0.1741485595703125, 0.1937255859375, 0.2133026123046875, 0.232879638671875, 0.2524566650390625, 0.27203369140625, 0.2916107177734375, 0.311187744140625, 0.3307647705078125, 0.350341796875, 0.3699188232421875, 0.389495849609375, 0.4090728759765625, 0.42864990234375, 0.4482269287109375, 0.467803955078125, 0.4873809814453125, 0.5069580078125, 0.5265350341796875, 0.546112060546875, 0.5656890869140625, 0.58526611328125, 0.6048431396484375, 0.624420166015625, 0.6439971923828125, 0.66357421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 0.0, 8.0, 7.0, 5.0, 15.0, 17.0, 24.0, 32.0, 36.0, 43.0, 70.0, 82.0, 97.0, 96.0, 76.0, 79.0, 84.0, 55.0, 50.0, 29.0, 31.0, 24.0, 11.0, 9.0, 11.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.6004409790039062, -0.5832061767578125, -0.5659713745117188, -0.548736572265625, -0.5315017700195312, -0.5142669677734375, -0.49703216552734375, -0.47979736328125, -0.46256256103515625, -0.4453277587890625, -0.42809295654296875, -0.410858154296875, -0.39362335205078125, -0.3763885498046875, -0.35915374755859375, -0.3419189453125, -0.32468414306640625, -0.3074493408203125, -0.29021453857421875, -0.272979736328125, -0.25574493408203125, -0.2385101318359375, -0.22127532958984375, -0.20404052734375, -0.18680572509765625, -0.1695709228515625, -0.15233612060546875, -0.135101318359375, -0.11786651611328125, -0.1006317138671875, -0.08339691162109375, -0.066162109375, -0.04892730712890625, -0.0316925048828125, -0.01445770263671875, 0.002777099609375, 0.02001190185546875, 0.0372467041015625, 0.05448150634765625, 0.07171630859375, 0.08895111083984375, 0.1061859130859375, 0.12342071533203125, 0.140655517578125, 0.15789031982421875, 0.1751251220703125, 0.19235992431640625, 0.2095947265625, 0.22682952880859375, 0.2440643310546875, 0.26129913330078125, 0.278533935546875, 0.29576873779296875, 0.3130035400390625, 0.33023834228515625, 0.34747314453125, 0.36470794677734375, 0.3819427490234375, 0.39917755126953125, 0.416412353515625, 0.43364715576171875, 0.4508819580078125, 0.46811676025390625, 0.4853515625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 7.0, 10.0, 12.0, 19.0, 57.0, 94.0, 141.0, 243.0, 159.0, 115.0, 58.0, 42.0, 17.0, 11.0, 8.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.833471298217773, -9.477264404296875, -9.121057510375977, -8.764850616455078, -8.40864372253418, -8.052436828613281, -7.696230411529541, -7.340023517608643, -6.983816623687744, -6.627609729766846, -6.271402835845947, -5.915196418762207, -5.558989524841309, -5.20278263092041, -4.846575736999512, -4.490368843078613, -4.134161949157715, -3.7779550552368164, -3.421748161315918, -3.0655415058135986, -2.7093346118927, -2.3531277179718018, -1.9969210624694824, -1.640714168548584, -1.2845072746276855, -0.9283004403114319, -0.5720936059951782, -0.21588683128356934, 0.1403200626373291, 0.49652695655822754, 0.8527336120605469, 1.2089405059814453, 1.5651473999023438, 1.9213542938232422, 2.2775611877441406, 2.63376784324646, 2.9899747371673584, 3.346181631088257, 3.702388286590576, 4.058595180511475, 4.414802074432373, 4.7710089683532715, 5.12721586227417, 5.48342227935791, 5.839629173278809, 6.195836067199707, 6.5520429611206055, 6.908249855041504, 7.264456748962402, 7.620663642883301, 7.976870536804199, 8.333077430725098, 8.689284324645996, 9.045491218566895, 9.401697158813477, 9.757904052734375, 10.114110946655273, 10.470317840576172, 10.82652473449707, 11.182731628417969, 11.538938522338867, 11.895145416259766, 12.251352310180664, 12.607559204101562, 12.963766098022461]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 0.0, 6.0, 9.0, 8.0, 5.0, 10.0, 8.0, 8.0, 18.0, 15.0, 12.0, 20.0, 19.0, 24.0, 18.0, 32.0, 27.0, 21.0, 26.0, 44.0, 30.0, 61.0, 74.0, 60.0, 58.0, 35.0, 32.0, 31.0, 42.0, 38.0, 22.0, 26.0, 18.0, 30.0, 18.0, 14.0, 15.0, 12.0, 10.0, 9.0, 10.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.116373538970947, -6.894139766693115, -6.671906471252441, -6.449672698974609, -6.227438926696777, -6.0052056312561035, -5.7829718589782715, -5.560738563537598, -5.338504791259766, -5.116271018981934, -4.89403772354126, -4.671803951263428, -4.449570178985596, -4.227336883544922, -4.00510311126709, -3.782869577407837, -3.560635805130005, -3.338402271270752, -3.11616849899292, -2.893934965133667, -2.671701431274414, -2.449467658996582, -2.227234125137329, -2.005000591278076, -1.7827669382095337, -1.5605332851409912, -1.3382997512817383, -1.1160660982131958, -0.8938325047492981, -0.6715989112854004, -0.4493652582168579, -0.22713172435760498, -0.0048980712890625, 0.2173355370759964, 0.4395691454410553, 0.6618027687072754, 0.8840363621711731, 1.1062699556350708, 1.3285036087036133, 1.5507371425628662, 1.7729707956314087, 1.9952044486999512, 2.217437982559204, 2.439671516418457, 2.661905288696289, 2.884138822555542, 3.106372356414795, 3.328606128692627, 3.55083966255188, 3.773073196411133, 3.995306968688965, 4.217540740966797, 4.439774036407471, 4.662007808685303, 4.884241104125977, 5.106474876403809, 5.328708648681641, 5.550942420959473, 5.7731757164001465, 5.9954094886779785, 6.2176432609558105, 6.439876556396484, 6.662110328674316, 6.884344100952148, 7.106577396392822]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 2.0, 7.0, 17.0, 15.0, 20.0, 30.0, 33.0, 60.0, 74.0, 146.0, 191.0, 352.0, 676.0, 1136.0, 2382.0, 5081.0, 12930.0, 37738.0, 139446.0, 619491.0, 1872081.0, 1138329.0, 264665.0, 63785.0, 20505.0, 7989.0, 3375.0, 1633.0, 860.0, 486.0, 260.0, 171.0, 82.0, 72.0, 54.0, 42.0, 23.0, 17.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.5234375, -0.5091819763183594, -0.49492645263671875, -0.4806709289550781, -0.4664154052734375, -0.4521598815917969, -0.43790435791015625, -0.4236488342285156, -0.409393310546875, -0.3951377868652344, -0.38088226318359375, -0.3666267395019531, -0.3523712158203125, -0.3381156921386719, -0.32386016845703125, -0.3096046447753906, -0.29534912109375, -0.2810935974121094, -0.26683807373046875, -0.2525825500488281, -0.2383270263671875, -0.22407150268554688, -0.20981597900390625, -0.19556045532226562, -0.181304931640625, -0.16704940795898438, -0.15279388427734375, -0.13853836059570312, -0.1242828369140625, -0.11002731323242188, -0.09577178955078125, -0.08151626586914062, -0.0672607421875, -0.053005218505859375, -0.03874969482421875, -0.024494171142578125, -0.0102386474609375, 0.004016876220703125, 0.01827239990234375, 0.032527923583984375, 0.046783447265625, 0.061038970947265625, 0.07529449462890625, 0.08955001831054688, 0.1038055419921875, 0.11806106567382812, 0.13231658935546875, 0.14657211303710938, 0.16082763671875, 0.17508316040039062, 0.18933868408203125, 0.20359420776367188, 0.2178497314453125, 0.23210525512695312, 0.24636077880859375, 0.2606163024902344, 0.274871826171875, 0.2891273498535156, 0.30338287353515625, 0.3176383972167969, 0.3318939208984375, 0.3461494445800781, 0.36040496826171875, 0.3746604919433594, 0.388916015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 10.0, 11.0, 21.0, 15.0, 34.0, 25.0, 40.0, 31.0, 47.0, 46.0, 59.0, 54.0, 57.0, 60.0, 62.0, 55.0, 72.0, 66.0, 43.0, 43.0, 32.0, 25.0, 22.0, 18.0, 11.0, 13.0, 7.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5873565673828125, -0.566802978515625, -0.5462493896484375, -0.52569580078125, -0.5051422119140625, -0.484588623046875, -0.4640350341796875, -0.4434814453125, -0.4229278564453125, -0.402374267578125, -0.3818206787109375, -0.36126708984375, -0.3407135009765625, -0.320159912109375, -0.2996063232421875, -0.279052734375, -0.2584991455078125, -0.237945556640625, -0.2173919677734375, -0.19683837890625, -0.1762847900390625, -0.155731201171875, -0.1351776123046875, -0.1146240234375, -0.0940704345703125, -0.073516845703125, -0.0529632568359375, -0.03240966796875, -0.0118560791015625, 0.008697509765625, 0.0292510986328125, 0.0498046875, 0.0703582763671875, 0.090911865234375, 0.1114654541015625, 0.13201904296875, 0.1525726318359375, 0.173126220703125, 0.1936798095703125, 0.2142333984375, 0.2347869873046875, 0.255340576171875, 0.2758941650390625, 0.29644775390625, 0.3170013427734375, 0.337554931640625, 0.3581085205078125, 0.378662109375, 0.3992156982421875, 0.419769287109375, 0.4403228759765625, 0.46087646484375, 0.4814300537109375, 0.501983642578125, 0.5225372314453125, 0.5430908203125, 0.5636444091796875, 0.584197998046875, 0.6047515869140625, 0.62530517578125, 0.6458587646484375, 0.666412353515625, 0.6869659423828125, 0.70751953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 22.0, 24.0, 64.0, 90.0, 152.0, 316.0, 683.0, 2588.0, 16996.0, 382033.0, 3703779.0, 79300.0, 6359.0, 1184.0, 359.0, 169.0, 87.0, 27.0, 16.0, 10.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.884063720703125, -1.83355712890625, -1.783050537109375, -1.7325439453125, -1.682037353515625, -1.63153076171875, -1.581024169921875, -1.530517578125, -1.480010986328125, -1.42950439453125, -1.378997802734375, -1.3284912109375, -1.277984619140625, -1.22747802734375, -1.176971435546875, -1.12646484375, -1.075958251953125, -1.02545166015625, -0.974945068359375, -0.9244384765625, -0.873931884765625, -0.82342529296875, -0.772918701171875, -0.722412109375, -0.671905517578125, -0.62139892578125, -0.570892333984375, -0.5203857421875, -0.469879150390625, -0.41937255859375, -0.368865966796875, -0.318359375, -0.267852783203125, -0.21734619140625, -0.166839599609375, -0.1163330078125, -0.065826416015625, -0.01531982421875, 0.035186767578125, 0.085693359375, 0.136199951171875, 0.18670654296875, 0.237213134765625, 0.2877197265625, 0.338226318359375, 0.38873291015625, 0.439239501953125, 0.48974609375, 0.540252685546875, 0.59075927734375, 0.641265869140625, 0.6917724609375, 0.742279052734375, 0.79278564453125, 0.843292236328125, 0.893798828125, 0.944305419921875, 0.99481201171875, 1.045318603515625, 1.0958251953125, 1.146331787109375, 1.19683837890625, 1.247344970703125, 1.2978515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 4.0, 10.0, 10.0, 7.0, 11.0, 21.0, 22.0, 50.0, 66.0, 105.0, 186.0, 330.0, 542.0, 713.0, 737.0, 511.0, 300.0, 166.0, 95.0, 63.0, 31.0, 28.0, 18.0, 13.0, 11.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3701171875, -1.334014892578125, -1.29791259765625, -1.261810302734375, -1.2257080078125, -1.189605712890625, -1.15350341796875, -1.117401123046875, -1.081298828125, -1.045196533203125, -1.00909423828125, -0.972991943359375, -0.9368896484375, -0.900787353515625, -0.86468505859375, -0.828582763671875, -0.79248046875, -0.756378173828125, -0.72027587890625, -0.684173583984375, -0.6480712890625, -0.611968994140625, -0.57586669921875, -0.539764404296875, -0.503662109375, -0.467559814453125, -0.43145751953125, -0.395355224609375, -0.3592529296875, -0.323150634765625, -0.28704833984375, -0.250946044921875, -0.21484375, -0.178741455078125, -0.14263916015625, -0.106536865234375, -0.0704345703125, -0.034332275390625, 0.00177001953125, 0.037872314453125, 0.073974609375, 0.110076904296875, 0.14617919921875, 0.182281494140625, 0.2183837890625, 0.254486083984375, 0.29058837890625, 0.326690673828125, 0.36279296875, 0.398895263671875, 0.43499755859375, 0.471099853515625, 0.5072021484375, 0.543304443359375, 0.57940673828125, 0.615509033203125, 0.651611328125, 0.687713623046875, 0.72381591796875, 0.759918212890625, 0.7960205078125, 0.832122802734375, 0.86822509765625, 0.904327392578125, 0.9404296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 14.0, 26.0, 55.0, 103.0, 155.0, 237.0, 187.0, 111.0, 54.0, 23.0, 9.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.33808708190918, -12.0036039352417, -11.669121742248535, -11.334638595581055, -11.000155448913574, -10.665672302246094, -10.33119010925293, -9.99670696258545, -9.662223815917969, -9.327740669250488, -8.993258476257324, -8.658775329589844, -8.324292182922363, -7.989809513092041, -7.655326843261719, -7.320843696594238, -6.986361026763916, -6.651878356933594, -6.317395210266113, -5.982912540435791, -5.6484293937683105, -5.313946723937988, -4.979463577270508, -4.6449809074401855, -4.310498237609863, -3.976015329360962, -3.6415324211120605, -3.3070497512817383, -2.972566604614258, -2.6380839347839355, -2.303601026535034, -1.9691181182861328, -1.6346349716186523, -1.300152063369751, -0.9656692147254944, -0.6311863660812378, -0.2967034578323364, 0.03777945041656494, 0.37226223945617676, 0.7067451477050781, 1.0412280559539795, 1.3757109642028809, 1.7101938724517822, 2.0446767807006836, 2.379159450531006, 2.7136425971984863, 3.0481252670288086, 3.38260817527771, 3.7170910835266113, 4.051573753356934, 4.386056900024414, 4.720539569854736, 5.055022716522217, 5.389505386352539, 5.7239885330200195, 6.058471202850342, 6.392953872680664, 6.727436542510986, 7.061919689178467, 7.396402359008789, 7.7308855056762695, 8.06536865234375, 8.399850845336914, 8.734333992004395, 9.068817138671875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 8.0, 7.0, 15.0, 19.0, 20.0, 19.0, 41.0, 27.0, 34.0, 32.0, 31.0, 38.0, 39.0, 40.0, 47.0, 37.0, 45.0, 49.0, 35.0, 50.0, 33.0, 30.0, 31.0, 36.0, 32.0, 26.0, 18.0, 14.0, 23.0, 18.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.490769386291504, -4.348851680755615, -4.206933975219727, -4.065016269683838, -3.923098564147949, -3.7811808586120605, -3.6392629146575928, -3.497345209121704, -3.3554275035858154, -3.2135097980499268, -3.071592092514038, -2.9296743869781494, -2.7877564430236816, -2.645838737487793, -2.5039210319519043, -2.3620033264160156, -2.220085620880127, -2.0781679153442383, -1.9362502098083496, -1.7943323850631714, -1.6524146795272827, -1.510496973991394, -1.3685791492462158, -1.2266614437103271, -1.0847437381744385, -0.9428260326385498, -0.8009082674980164, -0.6589905023574829, -0.5170727968215942, -0.37515509128570557, -0.23323732614517212, -0.09131956100463867, 0.0505986213684082, 0.19251635670661926, 0.3344340920448303, 0.4763518273830414, 0.6182695627212524, 0.7601872682571411, 0.9021050333976746, 1.044022798538208, 1.1859405040740967, 1.3278582096099854, 1.469775915145874, 1.6116937398910522, 1.753611445426941, 1.8955291509628296, 2.037446975708008, 2.1793646812438965, 2.321282386779785, 2.463200092315674, 2.6051177978515625, 2.747035503387451, 2.88895320892334, 3.0308709144592285, 3.1727888584136963, 3.314706563949585, 3.4566242694854736, 3.5985419750213623, 3.740459680557251, 3.8823773860931396, 4.024295330047607, 4.166213035583496, 4.308130741119385, 4.450048446655273, 4.591966152191162]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 13.0, 24.0, 40.0, 52.0, 107.0, 148.0, 213.0, 348.0, 618.0, 1094.0, 2008.0, 3593.0, 6960.0, 14183.0, 29257.0, 61393.0, 128536.0, 240242.0, 263536.0, 153313.0, 73284.0, 35133.0, 16547.0, 8307.0, 4220.0, 2317.0, 1208.0, 745.0, 415.0, 238.0, 160.0, 102.0, 68.0, 29.0, 28.0, 27.0, 11.0, 8.0, 3.0, 1.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.657745361328125, -0.63726806640625, -0.616790771484375, -0.5963134765625, -0.575836181640625, -0.55535888671875, -0.534881591796875, -0.514404296875, -0.493927001953125, -0.47344970703125, -0.452972412109375, -0.4324951171875, -0.412017822265625, -0.39154052734375, -0.371063232421875, -0.3505859375, -0.330108642578125, -0.30963134765625, -0.289154052734375, -0.2686767578125, -0.248199462890625, -0.22772216796875, -0.207244873046875, -0.186767578125, -0.166290283203125, -0.14581298828125, -0.125335693359375, -0.1048583984375, -0.084381103515625, -0.06390380859375, -0.043426513671875, -0.02294921875, -0.002471923828125, 0.01800537109375, 0.038482666015625, 0.0589599609375, 0.079437255859375, 0.09991455078125, 0.120391845703125, 0.140869140625, 0.161346435546875, 0.18182373046875, 0.202301025390625, 0.2227783203125, 0.243255615234375, 0.26373291015625, 0.284210205078125, 0.3046875, 0.325164794921875, 0.34564208984375, 0.366119384765625, 0.3865966796875, 0.407073974609375, 0.42755126953125, 0.448028564453125, 0.468505859375, 0.488983154296875, 0.50946044921875, 0.529937744140625, 0.5504150390625, 0.570892333984375, 0.59136962890625, 0.611846923828125, 0.63232421875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 7.0, 17.0, 23.0, 21.0, 27.0, 30.0, 34.0, 34.0, 48.0, 57.0, 60.0, 68.0, 65.0, 71.0, 64.0, 76.0, 51.0, 52.0, 34.0, 28.0, 22.0, 23.0, 20.0, 23.0, 9.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6340255737304688, -0.6127777099609375, -0.5915298461914062, -0.570281982421875, -0.5490341186523438, -0.5277862548828125, -0.5065383911132812, -0.48529052734375, -0.46404266357421875, -0.4427947998046875, -0.42154693603515625, -0.400299072265625, -0.37905120849609375, -0.3578033447265625, -0.33655548095703125, -0.3153076171875, -0.29405975341796875, -0.2728118896484375, -0.25156402587890625, -0.230316162109375, -0.20906829833984375, -0.1878204345703125, -0.16657257080078125, -0.14532470703125, -0.12407684326171875, -0.1028289794921875, -0.08158111572265625, -0.060333251953125, -0.03908538818359375, -0.0178375244140625, 0.00341033935546875, 0.024658203125, 0.04590606689453125, 0.0671539306640625, 0.08840179443359375, 0.109649658203125, 0.13089752197265625, 0.1521453857421875, 0.17339324951171875, 0.19464111328125, 0.21588897705078125, 0.2371368408203125, 0.25838470458984375, 0.279632568359375, 0.30088043212890625, 0.3221282958984375, 0.34337615966796875, 0.3646240234375, 0.38587188720703125, 0.4071197509765625, 0.42836761474609375, 0.449615478515625, 0.47086334228515625, 0.4921112060546875, 0.5133590698242188, 0.53460693359375, 0.5558547973632812, 0.5771026611328125, 0.5983505249023438, 0.619598388671875, 0.6408462524414062, 0.6620941162109375, 0.6833419799804688, 0.70458984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 3.0, 13.0, 9.0, 17.0, 33.0, 27.0, 41.0, 53.0, 60.0, 96.0, 130.0, 179.0, 265.0, 341.0, 584.0, 1027.0, 2127.0, 5935.0, 25623.0, 168464.0, 685631.0, 127672.0, 20322.0, 5143.0, 1986.0, 972.0, 543.0, 373.0, 234.0, 174.0, 133.0, 92.0, 68.0, 55.0, 28.0, 24.0, 17.0, 13.0, 14.0, 11.0, 6.0, 5.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5771484375, -1.5285186767578125, -1.479888916015625, -1.4312591552734375, -1.38262939453125, -1.3339996337890625, -1.285369873046875, -1.2367401123046875, -1.1881103515625, -1.1394805908203125, -1.090850830078125, -1.0422210693359375, -0.99359130859375, -0.9449615478515625, -0.896331787109375, -0.8477020263671875, -0.799072265625, -0.7504425048828125, -0.701812744140625, -0.6531829833984375, -0.60455322265625, -0.5559234619140625, -0.507293701171875, -0.4586639404296875, -0.4100341796875, -0.3614044189453125, -0.312774658203125, -0.2641448974609375, -0.21551513671875, -0.1668853759765625, -0.118255615234375, -0.0696258544921875, -0.02099609375, 0.0276336669921875, 0.076263427734375, 0.1248931884765625, 0.17352294921875, 0.2221527099609375, 0.270782470703125, 0.3194122314453125, 0.3680419921875, 0.4166717529296875, 0.465301513671875, 0.5139312744140625, 0.56256103515625, 0.6111907958984375, 0.659820556640625, 0.7084503173828125, 0.757080078125, 0.8057098388671875, 0.854339599609375, 0.9029693603515625, 0.95159912109375, 1.0002288818359375, 1.048858642578125, 1.0974884033203125, 1.1461181640625, 1.1947479248046875, 1.243377685546875, 1.2920074462890625, 1.34063720703125, 1.3892669677734375, 1.437896728515625, 1.4865264892578125, 1.53515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 11.0, 15.0, 13.0, 16.0, 20.0, 27.0, 25.0, 25.0, 32.0, 50.0, 36.0, 48.0, 41.0, 51.0, 43.0, 51.0, 44.0, 45.0, 47.0, 45.0, 37.0, 51.0, 24.0, 22.0, 27.0, 27.0, 18.0, 15.0, 17.0, 9.0, 7.0, 5.0, 17.0, 7.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5794525146484375, -1.519256591796875, -1.4590606689453125, -1.39886474609375, -1.3386688232421875, -1.278472900390625, -1.2182769775390625, -1.1580810546875, -1.0978851318359375, -1.037689208984375, -0.9774932861328125, -0.91729736328125, -0.8571014404296875, -0.796905517578125, -0.7367095947265625, -0.676513671875, -0.6163177490234375, -0.556121826171875, -0.4959259033203125, -0.43572998046875, -0.3755340576171875, -0.315338134765625, -0.2551422119140625, -0.1949462890625, -0.1347503662109375, -0.074554443359375, -0.0143585205078125, 0.04583740234375, 0.1060333251953125, 0.166229248046875, 0.2264251708984375, 0.28662109375, 0.3468170166015625, 0.407012939453125, 0.4672088623046875, 0.52740478515625, 0.5876007080078125, 0.647796630859375, 0.7079925537109375, 0.7681884765625, 0.8283843994140625, 0.888580322265625, 0.9487762451171875, 1.00897216796875, 1.0691680908203125, 1.129364013671875, 1.1895599365234375, 1.249755859375, 1.3099517822265625, 1.370147705078125, 1.4303436279296875, 1.49053955078125, 1.5507354736328125, 1.610931396484375, 1.6711273193359375, 1.7313232421875, 1.7915191650390625, 1.851715087890625, 1.9119110107421875, 1.97210693359375, 2.0323028564453125, 2.092498779296875, 2.1526947021484375, 2.212890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 10.0, 15.0, 13.0, 30.0, 66.0, 109.0, 174.0, 331.0, 680.0, 1736.0, 4444.0, 15615.0, 93454.0, 726090.0, 172217.0, 23494.0, 6160.0, 2128.0, 898.0, 413.0, 189.0, 119.0, 65.0, 34.0, 16.0, 14.0, 12.0, 8.0, 11.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.45458984375, -0.43752288818359375, -0.4204559326171875, -0.40338897705078125, -0.386322021484375, -0.36925506591796875, -0.3521881103515625, -0.33512115478515625, -0.31805419921875, -0.30098724365234375, -0.2839202880859375, -0.26685333251953125, -0.249786376953125, -0.23271942138671875, -0.2156524658203125, -0.19858551025390625, -0.1815185546875, -0.16445159912109375, -0.1473846435546875, -0.13031768798828125, -0.113250732421875, -0.09618377685546875, -0.0791168212890625, -0.06204986572265625, -0.04498291015625, -0.02791595458984375, -0.0108489990234375, 0.00621795654296875, 0.023284912109375, 0.04035186767578125, 0.0574188232421875, 0.07448577880859375, 0.091552734375, 0.10861968994140625, 0.1256866455078125, 0.14275360107421875, 0.159820556640625, 0.17688751220703125, 0.1939544677734375, 0.21102142333984375, 0.22808837890625, 0.24515533447265625, 0.2622222900390625, 0.27928924560546875, 0.296356201171875, 0.31342315673828125, 0.3304901123046875, 0.34755706787109375, 0.3646240234375, 0.38169097900390625, 0.3987579345703125, 0.41582489013671875, 0.432891845703125, 0.44995880126953125, 0.4670257568359375, 0.48409271240234375, 0.50115966796875, 0.5182266235351562, 0.5352935791015625, 0.5523605346679688, 0.569427490234375, 0.5864944458007812, 0.6035614013671875, 0.6206283569335938, 0.6376953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 3.0, 12.0, 8.0, 12.0, 16.0, 25.0, 29.0, 46.0, 63.0, 74.0, 116.0, 125.0, 120.0, 95.0, 75.0, 49.0, 41.0, 18.0, 19.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013685226440429688, -0.00013221986591815948, -0.0001275874674320221, -0.0001229550689458847, -0.00011832267045974731, -0.00011369027197360992, -0.00010905787348747253, -0.00010442547500133514, -9.979307651519775e-05, -9.516067802906036e-05, -9.052827954292297e-05, -8.589588105678558e-05, -8.12634825706482e-05, -7.66310840845108e-05, -7.199868559837341e-05, -6.736628711223602e-05, -6.273388862609863e-05, -5.810149013996124e-05, -5.346909165382385e-05, -4.883669316768646e-05, -4.420429468154907e-05, -3.957189619541168e-05, -3.493949770927429e-05, -3.0307099223136902e-05, -2.5674700736999512e-05, -2.104230225086212e-05, -1.640990376472473e-05, -1.1777505278587341e-05, -7.145106792449951e-06, -2.512708306312561e-06, 2.119690179824829e-06, 6.752088665962219e-06, 1.138448715209961e-05, 1.6016885638237e-05, 2.064928412437439e-05, 2.528168261051178e-05, 2.991408109664917e-05, 3.454647958278656e-05, 3.917887806892395e-05, 4.381127655506134e-05, 4.844367504119873e-05, 5.307607352733612e-05, 5.770847201347351e-05, 6.23408704996109e-05, 6.697326898574829e-05, 7.160566747188568e-05, 7.623806595802307e-05, 8.087046444416046e-05, 8.550286293029785e-05, 9.013526141643524e-05, 9.476765990257263e-05, 9.940005838871002e-05, 0.00010403245687484741, 0.0001086648553609848, 0.00011329725384712219, 0.00011792965233325958, 0.00012256205081939697, 0.00012719444930553436, 0.00013182684779167175, 0.00013645924627780914, 0.00014109164476394653, 0.00014572404325008392, 0.0001503564417362213, 0.0001549888402223587, 0.0001596212387084961]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 4.0, 10.0, 13.0, 22.0, 33.0, 43.0, 58.0, 64.0, 155.0, 238.0, 467.0, 912.0, 1947.0, 5309.0, 20169.0, 142955.0, 736392.0, 114058.0, 17155.0, 4825.0, 1751.0, 835.0, 438.0, 243.0, 137.0, 81.0, 55.0, 42.0, 23.0, 26.0, 16.0, 17.0, 9.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4892578125, -0.47370147705078125, -0.4581451416015625, -0.44258880615234375, -0.427032470703125, -0.41147613525390625, -0.3959197998046875, -0.38036346435546875, -0.36480712890625, -0.34925079345703125, -0.3336944580078125, -0.31813812255859375, -0.302581787109375, -0.28702545166015625, -0.2714691162109375, -0.25591278076171875, -0.2403564453125, -0.22480010986328125, -0.2092437744140625, -0.19368743896484375, -0.178131103515625, -0.16257476806640625, -0.1470184326171875, -0.13146209716796875, -0.11590576171875, -0.10034942626953125, -0.0847930908203125, -0.06923675537109375, -0.053680419921875, -0.03812408447265625, -0.0225677490234375, -0.00701141357421875, 0.008544921875, 0.02410125732421875, 0.0396575927734375, 0.05521392822265625, 0.070770263671875, 0.08632659912109375, 0.1018829345703125, 0.11743927001953125, 0.13299560546875, 0.14855194091796875, 0.1641082763671875, 0.17966461181640625, 0.195220947265625, 0.21077728271484375, 0.2263336181640625, 0.24188995361328125, 0.2574462890625, 0.27300262451171875, 0.2885589599609375, 0.30411529541015625, 0.319671630859375, 0.33522796630859375, 0.3507843017578125, 0.36634063720703125, 0.38189697265625, 0.39745330810546875, 0.4130096435546875, 0.42856597900390625, 0.444122314453125, 0.45967864990234375, 0.4752349853515625, 0.49079132080078125, 0.50634765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 8.0, 10.0, 12.0, 10.0, 12.0, 24.0, 35.0, 33.0, 44.0, 50.0, 54.0, 87.0, 89.0, 68.0, 71.0, 90.0, 63.0, 38.0, 46.0, 23.0, 26.0, 24.0, 16.0, 9.0, 15.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.475341796875, -0.4611091613769531, -0.44687652587890625, -0.4326438903808594, -0.4184112548828125, -0.4041786193847656, -0.38994598388671875, -0.3757133483886719, -0.361480712890625, -0.3472480773925781, -0.33301544189453125, -0.3187828063964844, -0.3045501708984375, -0.2903175354003906, -0.27608489990234375, -0.2618522644042969, -0.24761962890625, -0.23338699340820312, -0.21915435791015625, -0.20492172241210938, -0.1906890869140625, -0.17645645141601562, -0.16222381591796875, -0.14799118041992188, -0.133758544921875, -0.11952590942382812, -0.10529327392578125, -0.09106063842773438, -0.0768280029296875, -0.06259536743164062, -0.04836273193359375, -0.034130096435546875, -0.0198974609375, -0.005664825439453125, 0.00856781005859375, 0.022800445556640625, 0.0370330810546875, 0.051265716552734375, 0.06549835205078125, 0.07973098754882812, 0.093963623046875, 0.10819625854492188, 0.12242889404296875, 0.13666152954101562, 0.1508941650390625, 0.16512680053710938, 0.17935943603515625, 0.19359207153320312, 0.20782470703125, 0.22205734252929688, 0.23628997802734375, 0.2505226135253906, 0.2647552490234375, 0.2789878845214844, 0.29322052001953125, 0.3074531555175781, 0.321685791015625, 0.3359184265136719, 0.35015106201171875, 0.3643836975097656, 0.3786163330078125, 0.3928489685058594, 0.40708160400390625, 0.4213142395019531, 0.435546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 32.0, 96.0, 328.0, 327.0, 124.0, 50.0, 18.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.992441177368164, -15.2954683303833, -14.598494529724121, -13.901521682739258, -13.204548835754395, -12.507575988769531, -11.810602188110352, -11.113629341125488, -10.416656494140625, -9.719683647155762, -9.022709846496582, -8.325736999511719, -7.6287641525268555, -6.931790828704834, -6.2348175048828125, -5.537844657897949, -4.8408708572387695, -4.143897533416748, -3.4469246864318848, -2.7499513626098633, -2.052978277206421, -1.3560051918029785, -0.659031867980957, 0.03794097900390625, 0.7349143028259277, 1.4318873882293701, 2.1288604736328125, 2.825833797454834, 3.5228068828582764, 4.219779968261719, 4.91675329208374, 5.6137261390686035, 6.310699462890625, 7.0076727867126465, 7.70464563369751, 8.401618957519531, 9.098591804504395, 9.795564651489258, 10.492538452148438, 11.1895112991333, 11.886484146118164, 12.583456993103027, 13.280430793762207, 13.97740364074707, 14.674376487731934, 15.371349334716797, 16.068323135375977, 16.765296936035156, 17.462268829345703, 18.159242630004883, 18.85621452331543, 19.55318832397461, 20.25016212463379, 20.947134017944336, 21.644107818603516, 22.341079711914062, 23.038055419921875, 23.735029220581055, 24.4320011138916, 25.12897491455078, 25.82594871520996, 26.522920608520508, 27.219894409179688, 27.916866302490234, 28.613840103149414]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 3.0, 14.0, 11.0, 20.0, 16.0, 20.0, 22.0, 25.0, 21.0, 29.0, 38.0, 41.0, 52.0, 67.0, 67.0, 66.0, 85.0, 49.0, 47.0, 45.0, 27.0, 40.0, 28.0, 21.0, 20.0, 21.0, 15.0, 19.0, 16.0, 12.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.939767837524414, -7.671344757080078, -7.402921676635742, -7.134498596191406, -6.8660759925842285, -6.597652912139893, -6.329229831695557, -6.060806751251221, -5.792384147644043, -5.523961067199707, -5.255537986755371, -4.987114906311035, -4.718692302703857, -4.4502692222595215, -4.1818461418151855, -3.9134230613708496, -3.6449999809265137, -3.3765769004821777, -3.108154058456421, -2.839730978012085, -2.571308135986328, -2.302885055541992, -2.0344619750976562, -1.7660390138626099, -1.4976160526275635, -1.229193091392517, -0.9607700705528259, -0.6923470497131348, -0.4239240884780884, -0.155501127243042, 0.11292195320129395, 0.38134491443634033, 0.6497678756713867, 0.9181908369064331, 1.1866137981414795, 1.4550368785858154, 1.7234598398208618, 1.9918828010559082, 2.260305881500244, 2.52872896194458, 2.797151803970337, 3.065574884414673, 3.3339977264404297, 3.6024208068847656, 3.8708438873291016, 4.1392669677734375, 4.407690048217773, 4.676112651824951, 4.944535732269287, 5.212958812713623, 5.481381893157959, 5.749804496765137, 6.018227577209473, 6.286650657653809, 6.5550737380981445, 6.8234968185424805, 7.091919898986816, 7.360342979431152, 7.628766059875488, 7.897189140319824, 8.16561222076416, 8.43403434753418, 8.702457427978516, 8.970880508422852, 9.239303588867188]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 12.0, 9.0, 12.0, 25.0, 21.0, 37.0, 47.0, 92.0, 133.0, 231.0, 434.0, 946.0, 2403.0, 7641.0, 35277.0, 304348.0, 2282918.0, 1388473.0, 142195.0, 20582.0, 5115.0, 1776.0, 674.0, 314.0, 196.0, 121.0, 82.0, 54.0, 30.0, 16.0, 26.0, 11.0, 14.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.861328125, -0.8407402038574219, -0.8201522827148438, -0.7995643615722656, -0.7789764404296875, -0.7583885192871094, -0.7378005981445312, -0.7172126770019531, -0.696624755859375, -0.6760368347167969, -0.6554489135742188, -0.6348609924316406, -0.6142730712890625, -0.5936851501464844, -0.5730972290039062, -0.5525093078613281, -0.53192138671875, -0.5113334655761719, -0.49074554443359375, -0.4701576232910156, -0.4495697021484375, -0.4289817810058594, -0.40839385986328125, -0.3878059387207031, -0.367218017578125, -0.3466300964355469, -0.32604217529296875, -0.3054542541503906, -0.2848663330078125, -0.2642784118652344, -0.24369049072265625, -0.22310256958007812, -0.2025146484375, -0.18192672729492188, -0.16133880615234375, -0.14075088500976562, -0.1201629638671875, -0.09957504272460938, -0.07898712158203125, -0.058399200439453125, -0.037811279296875, -0.017223358154296875, 0.00336456298828125, 0.023952484130859375, 0.0445404052734375, 0.06512832641601562, 0.08571624755859375, 0.10630416870117188, 0.12689208984375, 0.14748001098632812, 0.16806793212890625, 0.18865585327148438, 0.2092437744140625, 0.22983169555664062, 0.25041961669921875, 0.2710075378417969, 0.291595458984375, 0.3121833801269531, 0.33277130126953125, 0.3533592224121094, 0.3739471435546875, 0.3945350646972656, 0.41512298583984375, 0.4357109069824219, 0.456298828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 17.0, 10.0, 17.0, 18.0, 29.0, 26.0, 30.0, 52.0, 42.0, 61.0, 76.0, 85.0, 67.0, 63.0, 60.0, 63.0, 63.0, 47.0, 47.0, 23.0, 33.0, 19.0, 19.0, 16.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64892578125, -0.6270294189453125, -0.605133056640625, -0.5832366943359375, -0.56134033203125, -0.5394439697265625, -0.517547607421875, -0.4956512451171875, -0.4737548828125, -0.4518585205078125, -0.429962158203125, -0.4080657958984375, -0.38616943359375, -0.3642730712890625, -0.342376708984375, -0.3204803466796875, -0.298583984375, -0.2766876220703125, -0.254791259765625, -0.2328948974609375, -0.21099853515625, -0.1891021728515625, -0.167205810546875, -0.1453094482421875, -0.1234130859375, -0.1015167236328125, -0.079620361328125, -0.0577239990234375, -0.03582763671875, -0.0139312744140625, 0.007965087890625, 0.0298614501953125, 0.0517578125, 0.0736541748046875, 0.095550537109375, 0.1174468994140625, 0.13934326171875, 0.1612396240234375, 0.183135986328125, 0.2050323486328125, 0.2269287109375, 0.2488250732421875, 0.270721435546875, 0.2926177978515625, 0.31451416015625, 0.3364105224609375, 0.358306884765625, 0.3802032470703125, 0.402099609375, 0.4239959716796875, 0.445892333984375, 0.4677886962890625, 0.48968505859375, 0.5115814208984375, 0.533477783203125, 0.5553741455078125, 0.5772705078125, 0.5991668701171875, 0.621063232421875, 0.6429595947265625, 0.66485595703125, 0.6867523193359375, 0.708648681640625, 0.7305450439453125, 0.75244140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 35.0, 73.0, 166.0, 377.0, 790.0, 3284.0, 50525.0, 4006073.0, 125950.0, 5128.0, 999.0, 403.0, 205.0, 114.0, 50.0, 41.0, 16.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.025604248046875, -1.95941162109375, -1.893218994140625, -1.8270263671875, -1.760833740234375, -1.69464111328125, -1.628448486328125, -1.562255859375, -1.496063232421875, -1.42987060546875, -1.363677978515625, -1.2974853515625, -1.231292724609375, -1.16510009765625, -1.098907470703125, -1.03271484375, -0.966522216796875, -0.90032958984375, -0.834136962890625, -0.7679443359375, -0.701751708984375, -0.63555908203125, -0.569366455078125, -0.503173828125, -0.436981201171875, -0.37078857421875, -0.304595947265625, -0.2384033203125, -0.172210693359375, -0.10601806640625, -0.039825439453125, 0.0263671875, 0.092559814453125, 0.15875244140625, 0.224945068359375, 0.2911376953125, 0.357330322265625, 0.42352294921875, 0.489715576171875, 0.555908203125, 0.622100830078125, 0.68829345703125, 0.754486083984375, 0.8206787109375, 0.886871337890625, 0.95306396484375, 1.019256591796875, 1.08544921875, 1.151641845703125, 1.21783447265625, 1.284027099609375, 1.3502197265625, 1.416412353515625, 1.48260498046875, 1.548797607421875, 1.614990234375, 1.681182861328125, 1.74737548828125, 1.813568115234375, 1.8797607421875, 1.945953369140625, 2.01214599609375, 2.078338623046875, 2.14453125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 24.0, 44.0, 66.0, 235.0, 713.0, 1520.0, 964.0, 306.0, 108.0, 52.0, 13.0, 12.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.9967041015625, -1.927001953125, -1.8572998046875, -1.78759765625, -1.7178955078125, -1.648193359375, -1.5784912109375, -1.5087890625, -1.4390869140625, -1.369384765625, -1.2996826171875, -1.22998046875, -1.1602783203125, -1.090576171875, -1.0208740234375, -0.951171875, -0.8814697265625, -0.811767578125, -0.7420654296875, -0.67236328125, -0.6026611328125, -0.532958984375, -0.4632568359375, -0.3935546875, -0.3238525390625, -0.254150390625, -0.1844482421875, -0.11474609375, -0.0450439453125, 0.024658203125, 0.0943603515625, 0.1640625, 0.2337646484375, 0.303466796875, 0.3731689453125, 0.44287109375, 0.5125732421875, 0.582275390625, 0.6519775390625, 0.7216796875, 0.7913818359375, 0.861083984375, 0.9307861328125, 1.00048828125, 1.0701904296875, 1.139892578125, 1.2095947265625, 1.279296875, 1.3489990234375, 1.418701171875, 1.4884033203125, 1.55810546875, 1.6278076171875, 1.697509765625, 1.7672119140625, 1.8369140625, 1.9066162109375, 1.976318359375, 2.0460205078125, 2.11572265625, 2.1854248046875, 2.255126953125, 2.3248291015625, 2.39453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 37.0, 302.0, 500.0, 124.0, 15.0, 9.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.2139892578125, -15.415182113647461, -14.616374969482422, -13.817566871643066, -13.018759727478027, -12.219952583312988, -11.421144485473633, -10.622337341308594, -9.823530197143555, -9.024723052978516, -8.225915908813477, -7.427107810974121, -6.628300666809082, -5.829493522644043, -5.030685901641846, -4.231878280639648, -3.4330711364746094, -2.634263753890991, -1.835456371307373, -1.0366489887237549, -0.23784160614013672, 0.5609657764434814, 1.3597731590270996, 2.158580780029297, 2.957387924194336, 3.756195306777954, 4.555002689361572, 5.3538103103637695, 6.152617454528809, 6.951424598693848, 7.750232219696045, 8.549039840698242, 9.347846984863281, 10.14665412902832, 10.94546127319336, 11.744269371032715, 12.543076515197754, 13.341883659362793, 14.140691757202148, 14.939498901367188, 15.738306045532227, 16.537113189697266, 17.335920333862305, 18.134727478027344, 18.933536529541016, 19.732343673706055, 20.531150817871094, 21.329957962036133, 22.128765106201172, 22.92757225036621, 23.72637939453125, 24.52518653869629, 25.323993682861328, 26.122802734375, 26.92160987854004, 27.720417022705078, 28.519224166870117, 29.318031311035156, 30.116838455200195, 30.915645599365234, 31.714454650878906, 32.51325988769531, 33.312068939208984, 34.110877990722656, 34.90968322753906]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 5.0, 8.0, 9.0, 11.0, 18.0, 42.0, 36.0, 54.0, 40.0, 51.0, 40.0, 59.0, 75.0, 76.0, 62.0, 84.0, 56.0, 61.0, 43.0, 35.0, 34.0, 24.0, 15.0, 17.0, 11.0, 12.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.721892833709717, -4.524106025695801, -4.326318740844727, -4.1285319328308105, -3.9307448863983154, -3.7329578399658203, -3.5351710319519043, -3.337383985519409, -3.139596939086914, -2.941809892654419, -2.744022846221924, -2.546236038208008, -2.3484489917755127, -2.1506619453430176, -1.952875018119812, -1.7550880908966064, -1.5573010444641113, -1.3595139980316162, -1.1617270708084106, -0.9639400839805603, -0.76615309715271, -0.5683661103248596, -0.3705791234970093, -0.1727921962738037, 0.024994850158691406, 0.22278183698654175, 0.4205688238143921, 0.6183558106422424, 0.8161427974700928, 1.013929843902588, 1.2117167711257935, 1.409503698348999, 1.607290267944336, 1.805077314376831, 2.002864360809326, 2.200651168823242, 2.3984382152557373, 2.5962252616882324, 2.7940120697021484, 2.9917991161346436, 3.1895861625671387, 3.387373208999634, 3.585160255432129, 3.782947063446045, 3.98073410987854, 4.178521156311035, 4.376307964324951, 4.574094772338867, 4.771882057189941, 4.969668865203857, 5.167456150054932, 5.365242958068848, 5.563030242919922, 5.760817050933838, 5.958603858947754, 6.156391143798828, 6.354177951812744, 6.55196475982666, 6.749752044677734, 6.94753885269165, 7.145325660705566, 7.343112945556641, 7.540899753570557, 7.738686561584473, 7.936473846435547]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 16.0, 23.0, 29.0, 39.0, 69.0, 96.0, 174.0, 231.0, 382.0, 643.0, 1092.0, 1897.0, 3607.0, 6960.0, 14086.0, 29581.0, 63115.0, 132530.0, 232365.0, 251644.0, 159363.0, 78464.0, 36842.0, 17188.0, 8351.0, 4267.0, 2232.0, 1262.0, 755.0, 430.0, 313.0, 149.0, 106.0, 76.0, 42.0, 32.0, 18.0, 19.0, 11.0, 8.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.564453125, -0.5468902587890625, -0.529327392578125, -0.5117645263671875, -0.49420166015625, -0.4766387939453125, -0.459075927734375, -0.4415130615234375, -0.4239501953125, -0.4063873291015625, -0.388824462890625, -0.3712615966796875, -0.35369873046875, -0.3361358642578125, -0.318572998046875, -0.3010101318359375, -0.283447265625, -0.2658843994140625, -0.248321533203125, -0.2307586669921875, -0.21319580078125, -0.1956329345703125, -0.178070068359375, -0.1605072021484375, -0.1429443359375, -0.1253814697265625, -0.107818603515625, -0.0902557373046875, -0.07269287109375, -0.0551300048828125, -0.037567138671875, -0.0200042724609375, -0.00244140625, 0.0151214599609375, 0.032684326171875, 0.0502471923828125, 0.06781005859375, 0.0853729248046875, 0.102935791015625, 0.1204986572265625, 0.1380615234375, 0.1556243896484375, 0.173187255859375, 0.1907501220703125, 0.20831298828125, 0.2258758544921875, 0.243438720703125, 0.2610015869140625, 0.278564453125, 0.2961273193359375, 0.313690185546875, 0.3312530517578125, 0.34881591796875, 0.3663787841796875, 0.383941650390625, 0.4015045166015625, 0.4190673828125, 0.4366302490234375, 0.454193115234375, 0.4717559814453125, 0.48931884765625, 0.5068817138671875, 0.524444580078125, 0.5420074462890625, 0.5595703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 12.0, 8.0, 13.0, 22.0, 29.0, 23.0, 29.0, 39.0, 50.0, 53.0, 51.0, 68.0, 72.0, 70.0, 69.0, 55.0, 64.0, 55.0, 45.0, 40.0, 35.0, 21.0, 16.0, 18.0, 13.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.6126937866210938, -0.5911102294921875, -0.5695266723632812, -0.547943115234375, -0.5263595581054688, -0.5047760009765625, -0.48319244384765625, -0.46160888671875, -0.44002532958984375, -0.4184417724609375, -0.39685821533203125, -0.375274658203125, -0.35369110107421875, -0.3321075439453125, -0.31052398681640625, -0.2889404296875, -0.26735687255859375, -0.2457733154296875, -0.22418975830078125, -0.202606201171875, -0.18102264404296875, -0.1594390869140625, -0.13785552978515625, -0.11627197265625, -0.09468841552734375, -0.0731048583984375, -0.05152130126953125, -0.029937744140625, -0.00835418701171875, 0.0132293701171875, 0.03481292724609375, 0.056396484375, 0.07798004150390625, 0.0995635986328125, 0.12114715576171875, 0.142730712890625, 0.16431427001953125, 0.1858978271484375, 0.20748138427734375, 0.22906494140625, 0.25064849853515625, 0.2722320556640625, 0.29381561279296875, 0.315399169921875, 0.33698272705078125, 0.3585662841796875, 0.38014984130859375, 0.4017333984375, 0.42331695556640625, 0.4449005126953125, 0.46648406982421875, 0.488067626953125, 0.5096511840820312, 0.5312347412109375, 0.5528182983398438, 0.57440185546875, 0.5959854125976562, 0.6175689697265625, 0.6391525268554688, 0.660736083984375, 0.6823196411132812, 0.7039031982421875, 0.7254867553710938, 0.7470703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 8.0, 5.0, 8.0, 7.0, 15.0, 15.0, 21.0, 37.0, 51.0, 69.0, 134.0, 236.0, 473.0, 1156.0, 3547.0, 15135.0, 85447.0, 586908.0, 291847.0, 49539.0, 9678.0, 2567.0, 803.0, 328.0, 178.0, 92.0, 87.0, 42.0, 28.0, 18.0, 15.0, 18.0, 17.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4326171875, -1.391510009765625, -1.35040283203125, -1.309295654296875, -1.2681884765625, -1.227081298828125, -1.18597412109375, -1.144866943359375, -1.103759765625, -1.062652587890625, -1.02154541015625, -0.980438232421875, -0.9393310546875, -0.898223876953125, -0.85711669921875, -0.816009521484375, -0.77490234375, -0.733795166015625, -0.69268798828125, -0.651580810546875, -0.6104736328125, -0.569366455078125, -0.52825927734375, -0.487152099609375, -0.446044921875, -0.404937744140625, -0.36383056640625, -0.322723388671875, -0.2816162109375, -0.240509033203125, -0.19940185546875, -0.158294677734375, -0.1171875, -0.076080322265625, -0.03497314453125, 0.006134033203125, 0.0472412109375, 0.088348388671875, 0.12945556640625, 0.170562744140625, 0.211669921875, 0.252777099609375, 0.29388427734375, 0.334991455078125, 0.3760986328125, 0.417205810546875, 0.45831298828125, 0.499420166015625, 0.54052734375, 0.581634521484375, 0.62274169921875, 0.663848876953125, 0.7049560546875, 0.746063232421875, 0.78717041015625, 0.828277587890625, 0.869384765625, 0.910491943359375, 0.95159912109375, 0.992706298828125, 1.0338134765625, 1.074920654296875, 1.11602783203125, 1.157135009765625, 1.1982421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 11.0, 7.0, 8.0, 10.0, 18.0, 16.0, 20.0, 21.0, 26.0, 17.0, 48.0, 29.0, 40.0, 35.0, 43.0, 56.0, 46.0, 35.0, 41.0, 55.0, 53.0, 37.0, 37.0, 41.0, 35.0, 32.0, 35.0, 20.0, 22.0, 18.0, 17.0, 15.0, 12.0, 10.0, 8.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8359375, -1.7828521728515625, -1.729766845703125, -1.6766815185546875, -1.62359619140625, -1.5705108642578125, -1.517425537109375, -1.4643402099609375, -1.4112548828125, -1.3581695556640625, -1.305084228515625, -1.2519989013671875, -1.19891357421875, -1.1458282470703125, -1.092742919921875, -1.0396575927734375, -0.986572265625, -0.9334869384765625, -0.880401611328125, -0.8273162841796875, -0.77423095703125, -0.7211456298828125, -0.668060302734375, -0.6149749755859375, -0.5618896484375, -0.5088043212890625, -0.455718994140625, -0.4026336669921875, -0.34954833984375, -0.2964630126953125, -0.243377685546875, -0.1902923583984375, -0.13720703125, -0.0841217041015625, -0.031036376953125, 0.0220489501953125, 0.07513427734375, 0.1282196044921875, 0.181304931640625, 0.2343902587890625, 0.2874755859375, 0.3405609130859375, 0.393646240234375, 0.4467315673828125, 0.49981689453125, 0.5529022216796875, 0.605987548828125, 0.6590728759765625, 0.712158203125, 0.7652435302734375, 0.818328857421875, 0.8714141845703125, 0.92449951171875, 0.9775848388671875, 1.030670166015625, 1.0837554931640625, 1.1368408203125, 1.1899261474609375, 1.243011474609375, 1.2960968017578125, 1.34918212890625, 1.4022674560546875, 1.455352783203125, 1.5084381103515625, 1.5615234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 9.0, 15.0, 20.0, 18.0, 20.0, 42.0, 53.0, 88.0, 139.0, 184.0, 327.0, 520.0, 868.0, 1623.0, 3264.0, 6988.0, 16419.0, 42309.0, 118242.0, 469633.0, 242863.0, 88661.0, 31752.0, 12770.0, 5625.0, 2697.0, 1401.0, 717.0, 407.0, 302.0, 187.0, 123.0, 81.0, 48.0, 35.0, 23.0, 17.0, 17.0, 9.0, 9.0, 3.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2239990234375, -0.21718215942382812, -0.21036529541015625, -0.20354843139648438, -0.1967315673828125, -0.18991470336914062, -0.18309783935546875, -0.17628097534179688, -0.169464111328125, -0.16264724731445312, -0.15583038330078125, -0.14901351928710938, -0.1421966552734375, -0.13537979125976562, -0.12856292724609375, -0.12174606323242188, -0.11492919921875, -0.10811233520507812, -0.10129547119140625, -0.09447860717773438, -0.0876617431640625, -0.08084487915039062, -0.07402801513671875, -0.06721115112304688, -0.060394287109375, -0.053577423095703125, -0.04676055908203125, -0.039943695068359375, -0.0331268310546875, -0.026309967041015625, -0.01949310302734375, -0.012676239013671875, -0.005859375, 0.000957489013671875, 0.00777435302734375, 0.014591217041015625, 0.0214080810546875, 0.028224945068359375, 0.03504180908203125, 0.041858673095703125, 0.048675537109375, 0.055492401123046875, 0.06230926513671875, 0.06912612915039062, 0.0759429931640625, 0.08275985717773438, 0.08957672119140625, 0.09639358520507812, 0.10321044921875, 0.11002731323242188, 0.11684417724609375, 0.12366104125976562, 0.1304779052734375, 0.13729476928710938, 0.14411163330078125, 0.15092849731445312, 0.157745361328125, 0.16456222534179688, 0.17137908935546875, 0.17819595336914062, 0.1850128173828125, 0.19182968139648438, 0.19864654541015625, 0.20546340942382812, 0.2122802734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 18.0, 32.0, 60.0, 74.0, 139.0, 142.0, 152.0, 116.0, 92.0, 50.0, 29.0, 19.0, 17.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001957416534423828, -0.00019058212637901306, -0.0001854225993156433, -0.00018026307225227356, -0.0001751035451889038, -0.00016994401812553406, -0.0001647844910621643, -0.00015962496399879456, -0.0001544654369354248, -0.00014930590987205505, -0.0001441463828086853, -0.00013898685574531555, -0.0001338273286819458, -0.00012866780161857605, -0.0001235082745552063, -0.00011834874749183655, -0.0001131892204284668, -0.00010802969336509705, -0.0001028701663017273, -9.771063923835754e-05, -9.255111217498779e-05, -8.739158511161804e-05, -8.223205804824829e-05, -7.707253098487854e-05, -7.191300392150879e-05, -6.675347685813904e-05, -6.159394979476929e-05, -5.6434422731399536e-05, -5.1274895668029785e-05, -4.6115368604660034e-05, -4.095584154129028e-05, -3.579631447792053e-05, -3.063678741455078e-05, -2.547726035118103e-05, -2.031773328781128e-05, -1.5158206224441528e-05, -9.998679161071777e-06, -4.839152097702026e-06, 3.203749656677246e-07, 5.479902029037476e-06, 1.0639429092407227e-05, 1.5798956155776978e-05, 2.095848321914673e-05, 2.611801028251648e-05, 3.127753734588623e-05, 3.643706440925598e-05, 4.159659147262573e-05, 4.6756118535995483e-05, 5.1915645599365234e-05, 5.7075172662734985e-05, 6.223469972610474e-05, 6.739422678947449e-05, 7.255375385284424e-05, 7.771328091621399e-05, 8.287280797958374e-05, 8.803233504295349e-05, 9.319186210632324e-05, 9.835138916969299e-05, 0.00010351091623306274, 0.0001086704432964325, 0.00011382997035980225, 0.000118989497423172, 0.00012414902448654175, 0.0001293085515499115, 0.00013446807861328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 15.0, 17.0, 19.0, 31.0, 44.0, 50.0, 83.0, 160.0, 297.0, 601.0, 1304.0, 3236.0, 9888.0, 35094.0, 150112.0, 593167.0, 191095.0, 44415.0, 11978.0, 3842.0, 1535.0, 680.0, 346.0, 193.0, 111.0, 75.0, 55.0, 22.0, 16.0, 14.0, 14.0, 8.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.35400390625, -0.34405517578125, -0.3341064453125, -0.32415771484375, -0.314208984375, -0.30426025390625, -0.2943115234375, -0.28436279296875, -0.2744140625, -0.26446533203125, -0.2545166015625, -0.24456787109375, -0.234619140625, -0.22467041015625, -0.2147216796875, -0.20477294921875, -0.19482421875, -0.18487548828125, -0.1749267578125, -0.16497802734375, -0.155029296875, -0.14508056640625, -0.1351318359375, -0.12518310546875, -0.115234375, -0.10528564453125, -0.0953369140625, -0.08538818359375, -0.075439453125, -0.06549072265625, -0.0555419921875, -0.04559326171875, -0.03564453125, -0.02569580078125, -0.0157470703125, -0.00579833984375, 0.004150390625, 0.01409912109375, 0.0240478515625, 0.03399658203125, 0.0439453125, 0.05389404296875, 0.0638427734375, 0.07379150390625, 0.083740234375, 0.09368896484375, 0.1036376953125, 0.11358642578125, 0.12353515625, 0.13348388671875, 0.1434326171875, 0.15338134765625, 0.163330078125, 0.17327880859375, 0.1832275390625, 0.19317626953125, 0.203125, 0.21307373046875, 0.2230224609375, 0.23297119140625, 0.242919921875, 0.25286865234375, 0.2628173828125, 0.27276611328125, 0.28271484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 4.0, 10.0, 9.0, 6.0, 6.0, 19.0, 24.0, 24.0, 49.0, 31.0, 47.0, 61.0, 55.0, 63.0, 62.0, 59.0, 74.0, 60.0, 54.0, 42.0, 42.0, 33.0, 34.0, 26.0, 21.0, 15.0, 12.0, 6.0, 5.0, 6.0, 7.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.265869140625, -0.25635528564453125, -0.2468414306640625, -0.23732757568359375, -0.227813720703125, -0.21829986572265625, -0.2087860107421875, -0.19927215576171875, -0.18975830078125, -0.18024444580078125, -0.1707305908203125, -0.16121673583984375, -0.151702880859375, -0.14218902587890625, -0.1326751708984375, -0.12316131591796875, -0.1136474609375, -0.10413360595703125, -0.0946197509765625, -0.08510589599609375, -0.075592041015625, -0.06607818603515625, -0.0565643310546875, -0.04705047607421875, -0.03753662109375, -0.02802276611328125, -0.0185089111328125, -0.00899505615234375, 0.000518798828125, 0.01003265380859375, 0.0195465087890625, 0.02906036376953125, 0.03857421875, 0.04808807373046875, 0.0576019287109375, 0.06711578369140625, 0.076629638671875, 0.08614349365234375, 0.0956573486328125, 0.10517120361328125, 0.11468505859375, 0.12419891357421875, 0.1337127685546875, 0.14322662353515625, 0.152740478515625, 0.16225433349609375, 0.1717681884765625, 0.18128204345703125, 0.1907958984375, 0.20030975341796875, 0.2098236083984375, 0.21933746337890625, 0.228851318359375, 0.23836517333984375, 0.2478790283203125, 0.25739288330078125, 0.26690673828125, 0.27642059326171875, 0.2859344482421875, 0.29544830322265625, 0.304962158203125, 0.31447601318359375, 0.3239898681640625, 0.33350372314453125, 0.343017578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 2.0, 5.0, 11.0, 24.0, 42.0, 85.0, 180.0, 279.0, 172.0, 109.0, 49.0, 21.0, 11.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.356524467468262, -5.011242866516113, -4.665961265563965, -4.320679187774658, -3.9753975868225098, -3.6301159858703613, -3.284834146499634, -2.9395523071289062, -2.594270706176758, -2.2489891052246094, -1.9037072658538818, -1.5584255456924438, -1.2131438255310059, -0.8678621053695679, -0.5225803852081299, -0.17729854583740234, 0.1679830551147461, 0.5132647752761841, 0.8585464954376221, 1.20382821559906, 1.549109935760498, 1.894391655921936, 2.239673376083374, 2.5849552154541016, 2.93023681640625, 3.2755184173583984, 3.620800256729126, 3.9660820960998535, 4.311363697052002, 4.65664529800415, 5.001927375793457, 5.3472089767456055, 5.6924896240234375, 6.037771224975586, 6.383052825927734, 6.728334903717041, 7.0736165046691895, 7.418898105621338, 7.7641801834106445, 8.109461784362793, 8.454743385314941, 8.80002498626709, 9.145306587219238, 9.490588188171387, 9.835870742797852, 10.18115234375, 10.526433944702148, 10.871715545654297, 11.216997146606445, 11.562278747558594, 11.907560348510742, 12.25284194946289, 12.598123550415039, 12.943406105041504, 13.288687705993652, 13.6339693069458, 13.97925090789795, 14.324532508850098, 14.669814109802246, 15.015095710754395, 15.36037826538086, 15.705659866333008, 16.050941467285156, 16.396223068237305, 16.741504669189453]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 4.0, 3.0, 7.0, 8.0, 7.0, 13.0, 12.0, 13.0, 12.0, 11.0, 22.0, 25.0, 24.0, 19.0, 24.0, 38.0, 38.0, 52.0, 49.0, 71.0, 68.0, 65.0, 51.0, 33.0, 37.0, 32.0, 38.0, 35.0, 28.0, 23.0, 20.0, 15.0, 18.0, 12.0, 11.0, 10.0, 9.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.6926469802856445, -6.4937005043029785, -6.294753551483154, -6.095807075500488, -5.896860599517822, -5.697914123535156, -5.498967170715332, -5.300020694732666, -5.10107421875, -4.902127742767334, -4.70318078994751, -4.504234313964844, -4.305287837982178, -4.106341361999512, -3.9073944091796875, -3.7084479331970215, -3.5095009803771973, -3.310554265975952, -3.111607789993286, -2.912661075592041, -2.713714599609375, -2.51476788520813, -2.3158211708068848, -2.1168746948242188, -1.9179279804229736, -1.718981385231018, -1.5200347900390625, -1.3210880756378174, -1.1221414804458618, -0.9231948852539062, -0.7242481708526611, -0.5253015756607056, -0.32635498046875, -0.12740835547447205, 0.07153826951980591, 0.27048492431640625, 0.4694315195083618, 0.6683781147003174, 0.8673248291015625, 1.066271424293518, 1.2652180194854736, 1.4641646146774292, 1.6631112098693848, 1.8620579242706299, 2.061004638671875, 2.259951114654541, 2.458897829055786, 2.6578445434570312, 2.8567910194396973, 3.0557377338409424, 3.2546842098236084, 3.4536309242248535, 3.6525774002075195, 3.8515241146087646, 4.05047082901001, 4.249417304992676, 4.4483642578125, 4.647310733795166, 4.84625768661499, 5.045204162597656, 5.244150638580322, 5.443097114562988, 5.6420440673828125, 5.8409905433654785, 6.0399370193481445]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 14.0, 13.0, 22.0, 35.0, 68.0, 74.0, 141.0, 261.0, 452.0, 823.0, 1543.0, 3220.0, 6866.0, 17866.0, 53242.0, 177073.0, 585530.0, 1446176.0, 1254969.0, 449269.0, 130992.0, 39698.0, 14231.0, 5939.0, 2742.0, 1332.0, 711.0, 386.0, 242.0, 116.0, 74.0, 52.0, 28.0, 19.0, 20.0, 9.0, 7.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30652618408203125, -0.2959136962890625, -0.28530120849609375, -0.274688720703125, -0.26407623291015625, -0.2534637451171875, -0.24285125732421875, -0.23223876953125, -0.22162628173828125, -0.2110137939453125, -0.20040130615234375, -0.189788818359375, -0.17917633056640625, -0.1685638427734375, -0.15795135498046875, -0.1473388671875, -0.13672637939453125, -0.1261138916015625, -0.11550140380859375, -0.104888916015625, -0.09427642822265625, -0.0836639404296875, -0.07305145263671875, -0.06243896484375, -0.05182647705078125, -0.0412139892578125, -0.03060150146484375, -0.019989013671875, -0.00937652587890625, 0.0012359619140625, 0.01184844970703125, 0.0224609375, 0.03307342529296875, 0.0436859130859375, 0.05429840087890625, 0.064910888671875, 0.07552337646484375, 0.0861358642578125, 0.09674835205078125, 0.10736083984375, 0.11797332763671875, 0.1285858154296875, 0.13919830322265625, 0.149810791015625, 0.16042327880859375, 0.1710357666015625, 0.18164825439453125, 0.1922607421875, 0.20287322998046875, 0.2134857177734375, 0.22409820556640625, 0.234710693359375, 0.24532318115234375, 0.2559356689453125, 0.26654815673828125, 0.27716064453125, 0.28777313232421875, 0.2983856201171875, 0.30899810791015625, 0.319610595703125, 0.33022308349609375, 0.3408355712890625, 0.35144805908203125, 0.362060546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 15.0, 14.0, 24.0, 21.0, 21.0, 42.0, 40.0, 56.0, 49.0, 66.0, 65.0, 75.0, 63.0, 58.0, 61.0, 64.0, 45.0, 44.0, 34.0, 42.0, 23.0, 20.0, 15.0, 14.0, 4.0, 10.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.575958251953125, -0.55474853515625, -0.533538818359375, -0.5123291015625, -0.491119384765625, -0.46990966796875, -0.448699951171875, -0.427490234375, -0.406280517578125, -0.38507080078125, -0.363861083984375, -0.3426513671875, -0.321441650390625, -0.30023193359375, -0.279022216796875, -0.2578125, -0.236602783203125, -0.21539306640625, -0.194183349609375, -0.1729736328125, -0.151763916015625, -0.13055419921875, -0.109344482421875, -0.088134765625, -0.066925048828125, -0.04571533203125, -0.024505615234375, -0.0032958984375, 0.017913818359375, 0.03912353515625, 0.060333251953125, 0.08154296875, 0.102752685546875, 0.12396240234375, 0.145172119140625, 0.1663818359375, 0.187591552734375, 0.20880126953125, 0.230010986328125, 0.251220703125, 0.272430419921875, 0.29364013671875, 0.314849853515625, 0.3360595703125, 0.357269287109375, 0.37847900390625, 0.399688720703125, 0.4208984375, 0.442108154296875, 0.46331787109375, 0.484527587890625, 0.5057373046875, 0.526947021484375, 0.54815673828125, 0.569366455078125, 0.590576171875, 0.611785888671875, 0.63299560546875, 0.654205322265625, 0.6754150390625, 0.696624755859375, 0.71783447265625, 0.739044189453125, 0.76025390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 3.0, 19.0, 19.0, 31.0, 41.0, 67.0, 124.0, 239.0, 523.0, 1648.0, 7759.0, 95218.0, 3745919.0, 324514.0, 14328.0, 2391.0, 756.0, 338.0, 129.0, 76.0, 30.0, 37.0, 13.0, 18.0, 8.0, 4.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.701171875, -1.6559906005859375, -1.610809326171875, -1.5656280517578125, -1.52044677734375, -1.4752655029296875, -1.430084228515625, -1.3849029541015625, -1.3397216796875, -1.2945404052734375, -1.249359130859375, -1.2041778564453125, -1.15899658203125, -1.1138153076171875, -1.068634033203125, -1.0234527587890625, -0.978271484375, -0.9330902099609375, -0.887908935546875, -0.8427276611328125, -0.79754638671875, -0.7523651123046875, -0.707183837890625, -0.6620025634765625, -0.6168212890625, -0.5716400146484375, -0.526458740234375, -0.4812774658203125, -0.43609619140625, -0.3909149169921875, -0.345733642578125, -0.3005523681640625, -0.25537109375, -0.2101898193359375, -0.165008544921875, -0.1198272705078125, -0.07464599609375, -0.0294647216796875, 0.015716552734375, 0.0608978271484375, 0.1060791015625, 0.1512603759765625, 0.196441650390625, 0.2416229248046875, 0.28680419921875, 0.3319854736328125, 0.377166748046875, 0.4223480224609375, 0.467529296875, 0.5127105712890625, 0.557891845703125, 0.6030731201171875, 0.64825439453125, 0.6934356689453125, 0.738616943359375, 0.7837982177734375, 0.8289794921875, 0.8741607666015625, 0.919342041015625, 0.9645233154296875, 1.00970458984375, 1.0548858642578125, 1.100067138671875, 1.1452484130859375, 1.1904296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 8.0, 11.0, 15.0, 25.0, 29.0, 41.0, 68.0, 91.0, 166.0, 340.0, 564.0, 754.0, 684.0, 487.0, 335.0, 180.0, 98.0, 68.0, 26.0, 25.0, 17.0, 10.0, 7.0, 8.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9517440795898438, -0.9176483154296875, -0.8835525512695312, -0.849456787109375, -0.8153610229492188, -0.7812652587890625, -0.7471694946289062, -0.71307373046875, -0.6789779663085938, -0.6448822021484375, -0.6107864379882812, -0.576690673828125, -0.5425949096679688, -0.5084991455078125, -0.47440338134765625, -0.4403076171875, -0.40621185302734375, -0.3721160888671875, -0.33802032470703125, -0.303924560546875, -0.26982879638671875, -0.2357330322265625, -0.20163726806640625, -0.16754150390625, -0.13344573974609375, -0.0993499755859375, -0.06525421142578125, -0.031158447265625, 0.00293731689453125, 0.0370330810546875, 0.07112884521484375, 0.105224609375, 0.13932037353515625, 0.1734161376953125, 0.20751190185546875, 0.241607666015625, 0.27570343017578125, 0.3097991943359375, 0.34389495849609375, 0.37799072265625, 0.41208648681640625, 0.4461822509765625, 0.48027801513671875, 0.514373779296875, 0.5484695434570312, 0.5825653076171875, 0.6166610717773438, 0.6507568359375, 0.6848526000976562, 0.7189483642578125, 0.7530441284179688, 0.787139892578125, 0.8212356567382812, 0.8553314208984375, 0.8894271850585938, 0.92352294921875, 0.9576187133789062, 0.9917144775390625, 1.0258102416992188, 1.059906005859375, 1.0940017700195312, 1.1280975341796875, 1.1621932983398438, 1.1962890625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 11.0, 13.0, 28.0, 74.0, 129.0, 216.0, 214.0, 147.0, 79.0, 38.0, 15.0, 13.0, 6.0, 9.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.337383270263672, -8.029167175292969, -7.720952033996582, -7.412736415863037, -7.104520797729492, -6.796304702758789, -6.488089084625244, -6.179873466491699, -5.871657848358154, -5.563442230224609, -5.2552266120910645, -4.9470109939575195, -4.638794898986816, -4.33057975769043, -4.022363662719727, -3.7141480445861816, -3.4059324264526367, -3.097716808319092, -2.789501190185547, -2.481285333633423, -2.173069715499878, -1.864854097366333, -1.5566383600234985, -1.248422622680664, -0.9402070045471191, -0.6319913268089294, -0.32377564907073975, -0.015559971332550049, 0.29265570640563965, 0.6008713245391846, 0.909087061882019, 1.2173027992248535, 1.5255184173583984, 1.8337340354919434, 2.1419496536254883, 2.4501655101776123, 2.7583811283111572, 3.066596746444702, 3.374812602996826, 3.683028221130371, 3.991243839263916, 4.299459457397461, 4.607675075531006, 4.915890693664551, 5.224106788635254, 5.532321929931641, 5.840538024902344, 6.148753643035889, 6.456969261169434, 6.7651848793029785, 7.073400497436523, 7.381616115570068, 7.689831733703613, 7.998047828674316, 8.306262969970703, 8.614479064941406, 8.92269515991211, 9.230911254882812, 9.5391263961792, 9.847342491149902, 10.155557632446289, 10.463773727416992, 10.771988868713379, 11.080204963684082, 11.388420104980469]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 9.0, 1.0, 13.0, 12.0, 18.0, 18.0, 11.0, 16.0, 22.0, 28.0, 18.0, 31.0, 27.0, 32.0, 33.0, 44.0, 36.0, 54.0, 40.0, 63.0, 48.0, 67.0, 49.0, 39.0, 42.0, 24.0, 32.0, 29.0, 24.0, 24.0, 20.0, 9.0, 12.0, 10.0, 9.0, 9.0, 5.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01992130279541, -3.8885204792022705, -3.757119655609131, -3.625718832015991, -3.4943180084228516, -3.362916946411133, -3.231516122817993, -3.1001152992248535, -2.968714475631714, -2.837313652038574, -2.7059128284454346, -2.574512004852295, -2.443110942840576, -2.3117103576660156, -2.180309295654297, -2.0489084720611572, -1.9175076484680176, -1.786106824874878, -1.6547060012817383, -1.523305058479309, -1.3919042348861694, -1.2605034112930298, -1.1291024684906006, -0.9977016448974609, -0.8663008213043213, -0.7348999977111816, -0.6034991145133972, -0.4720982611179352, -0.34069740772247314, -0.2092965841293335, -0.07789570093154907, 0.05350518226623535, 0.1849055290222168, 0.31630638241767883, 0.44770723581314087, 0.5791081190109253, 0.7105089426040649, 0.8419097661972046, 0.973310649394989, 1.1047115325927734, 1.236112356185913, 1.3675131797790527, 1.4989140033721924, 1.6303149461746216, 1.7617157697677612, 1.8931165933609009, 2.02451753616333, 2.1559183597564697, 2.2873191833496094, 2.418720006942749, 2.5501208305358887, 2.6815216541290283, 2.812922477722168, 2.9443235397338867, 3.0757243633270264, 3.207125186920166, 3.3385260105133057, 3.4699268341064453, 3.601327657699585, 3.7327284812927246, 3.8641295433044434, 3.995530128479004, 4.126931190490723, 4.258332252502441, 4.389732837677002]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 9.0, 4.0, 12.0, 11.0, 17.0, 23.0, 23.0, 61.0, 77.0, 85.0, 147.0, 237.0, 364.0, 588.0, 1002.0, 1611.0, 3010.0, 5660.0, 10516.0, 21197.0, 43129.0, 88544.0, 175006.0, 263680.0, 210531.0, 111834.0, 55007.0, 26916.0, 13495.0, 6866.0, 3706.0, 2083.0, 1166.0, 711.0, 432.0, 282.0, 168.0, 99.0, 75.0, 51.0, 31.0, 26.0, 13.0, 15.0, 12.0, 10.0, 4.0, 5.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.53515625, -0.5182571411132812, -0.5013580322265625, -0.48445892333984375, -0.467559814453125, -0.45066070556640625, -0.4337615966796875, -0.41686248779296875, -0.39996337890625, -0.38306427001953125, -0.3661651611328125, -0.34926605224609375, -0.332366943359375, -0.31546783447265625, -0.2985687255859375, -0.28166961669921875, -0.2647705078125, -0.24787139892578125, -0.2309722900390625, -0.21407318115234375, -0.197174072265625, -0.18027496337890625, -0.1633758544921875, -0.14647674560546875, -0.12957763671875, -0.11267852783203125, -0.0957794189453125, -0.07888031005859375, -0.061981201171875, -0.04508209228515625, -0.0281829833984375, -0.01128387451171875, 0.005615234375, 0.02251434326171875, 0.0394134521484375, 0.05631256103515625, 0.073211669921875, 0.09011077880859375, 0.1070098876953125, 0.12390899658203125, 0.14080810546875, 0.15770721435546875, 0.1746063232421875, 0.19150543212890625, 0.208404541015625, 0.22530364990234375, 0.2422027587890625, 0.25910186767578125, 0.2760009765625, 0.29290008544921875, 0.3097991943359375, 0.32669830322265625, 0.343597412109375, 0.36049652099609375, 0.3773956298828125, 0.39429473876953125, 0.41119384765625, 0.42809295654296875, 0.4449920654296875, 0.46189117431640625, 0.478790283203125, 0.49568939208984375, 0.5125885009765625, 0.5294876098632812, 0.54638671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 12.0, 15.0, 18.0, 19.0, 31.0, 49.0, 47.0, 61.0, 50.0, 59.0, 73.0, 67.0, 64.0, 55.0, 78.0, 46.0, 54.0, 39.0, 30.0, 31.0, 19.0, 15.0, 16.0, 8.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5736846923828125, -0.552154541015625, -0.5306243896484375, -0.50909423828125, -0.4875640869140625, -0.466033935546875, -0.4445037841796875, -0.4229736328125, -0.4014434814453125, -0.379913330078125, -0.3583831787109375, -0.33685302734375, -0.3153228759765625, -0.293792724609375, -0.2722625732421875, -0.250732421875, -0.2292022705078125, -0.207672119140625, -0.1861419677734375, -0.16461181640625, -0.1430816650390625, -0.121551513671875, -0.1000213623046875, -0.0784912109375, -0.0569610595703125, -0.035430908203125, -0.0139007568359375, 0.00762939453125, 0.0291595458984375, 0.050689697265625, 0.0722198486328125, 0.09375, 0.1152801513671875, 0.136810302734375, 0.1583404541015625, 0.17987060546875, 0.2014007568359375, 0.222930908203125, 0.2444610595703125, 0.2659912109375, 0.2875213623046875, 0.309051513671875, 0.3305816650390625, 0.35211181640625, 0.3736419677734375, 0.395172119140625, 0.4167022705078125, 0.438232421875, 0.4597625732421875, 0.481292724609375, 0.5028228759765625, 0.52435302734375, 0.5458831787109375, 0.567413330078125, 0.5889434814453125, 0.6104736328125, 0.6320037841796875, 0.653533935546875, 0.6750640869140625, 0.69659423828125, 0.7181243896484375, 0.739654541015625, 0.7611846923828125, 0.78271484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 4.0, 10.0, 9.0, 15.0, 22.0, 31.0, 38.0, 58.0, 85.0, 128.0, 186.0, 249.0, 357.0, 587.0, 1155.0, 2520.0, 7326.0, 29148.0, 152323.0, 665268.0, 147963.0, 28388.0, 7199.0, 2523.0, 1096.0, 607.0, 350.0, 242.0, 167.0, 138.0, 104.0, 60.0, 53.0, 45.0, 24.0, 21.0, 11.0, 7.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.111968994140625, -1.07550048828125, -1.039031982421875, -1.0025634765625, -0.966094970703125, -0.92962646484375, -0.893157958984375, -0.856689453125, -0.820220947265625, -0.78375244140625, -0.747283935546875, -0.7108154296875, -0.674346923828125, -0.63787841796875, -0.601409912109375, -0.56494140625, -0.528472900390625, -0.49200439453125, -0.455535888671875, -0.4190673828125, -0.382598876953125, -0.34613037109375, -0.309661865234375, -0.273193359375, -0.236724853515625, -0.20025634765625, -0.163787841796875, -0.1273193359375, -0.090850830078125, -0.05438232421875, -0.017913818359375, 0.0185546875, 0.055023193359375, 0.09149169921875, 0.127960205078125, 0.1644287109375, 0.200897216796875, 0.23736572265625, 0.273834228515625, 0.310302734375, 0.346771240234375, 0.38323974609375, 0.419708251953125, 0.4561767578125, 0.492645263671875, 0.52911376953125, 0.565582275390625, 0.60205078125, 0.638519287109375, 0.67498779296875, 0.711456298828125, 0.7479248046875, 0.784393310546875, 0.82086181640625, 0.857330322265625, 0.893798828125, 0.930267333984375, 0.96673583984375, 1.003204345703125, 1.0396728515625, 1.076141357421875, 1.11260986328125, 1.149078369140625, 1.185546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 15.0, 9.0, 17.0, 15.0, 17.0, 28.0, 25.0, 31.0, 30.0, 33.0, 40.0, 47.0, 49.0, 47.0, 40.0, 55.0, 55.0, 51.0, 53.0, 47.0, 45.0, 29.0, 28.0, 22.0, 37.0, 21.0, 15.0, 12.0, 13.0, 8.0, 13.0, 4.0, 8.0, 4.0, 3.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.628021240234375, -1.57440185546875, -1.520782470703125, -1.4671630859375, -1.413543701171875, -1.35992431640625, -1.306304931640625, -1.252685546875, -1.199066162109375, -1.14544677734375, -1.091827392578125, -1.0382080078125, -0.984588623046875, -0.93096923828125, -0.877349853515625, -0.82373046875, -0.770111083984375, -0.71649169921875, -0.662872314453125, -0.6092529296875, -0.555633544921875, -0.50201416015625, -0.448394775390625, -0.394775390625, -0.341156005859375, -0.28753662109375, -0.233917236328125, -0.1802978515625, -0.126678466796875, -0.07305908203125, -0.019439697265625, 0.0341796875, 0.087799072265625, 0.14141845703125, 0.195037841796875, 0.2486572265625, 0.302276611328125, 0.35589599609375, 0.409515380859375, 0.463134765625, 0.516754150390625, 0.57037353515625, 0.623992919921875, 0.6776123046875, 0.731231689453125, 0.78485107421875, 0.838470458984375, 0.89208984375, 0.945709228515625, 0.99932861328125, 1.052947998046875, 1.1065673828125, 1.160186767578125, 1.21380615234375, 1.267425537109375, 1.321044921875, 1.374664306640625, 1.42828369140625, 1.481903076171875, 1.5355224609375, 1.589141845703125, 1.64276123046875, 1.696380615234375, 1.75]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 16.0, 17.0, 22.0, 20.0, 58.0, 76.0, 105.0, 156.0, 243.0, 377.0, 670.0, 1192.0, 2338.0, 4911.0, 10956.0, 26842.0, 71457.0, 227633.0, 536906.0, 100751.0, 36595.0, 14531.0, 6221.0, 2911.0, 1434.0, 764.0, 474.0, 276.0, 177.0, 125.0, 83.0, 59.0, 41.0, 32.0, 20.0, 7.0, 6.0, 10.0, 7.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.2420654296875, -0.23476600646972656, -0.22746658325195312, -0.2201671600341797, -0.21286773681640625, -0.2055683135986328, -0.19826889038085938, -0.19096946716308594, -0.1836700439453125, -0.17637062072753906, -0.16907119750976562, -0.1617717742919922, -0.15447235107421875, -0.1471729278564453, -0.13987350463867188, -0.13257408142089844, -0.125274658203125, -0.11797523498535156, -0.11067581176757812, -0.10337638854980469, -0.09607696533203125, -0.08877754211425781, -0.08147811889648438, -0.07417869567871094, -0.0668792724609375, -0.05957984924316406, -0.052280426025390625, -0.04498100280761719, -0.03768157958984375, -0.030382156372070312, -0.023082733154296875, -0.015783309936523438, -0.00848388671875, -0.0011844635009765625, 0.006114959716796875, 0.013414382934570312, 0.02071380615234375, 0.028013229370117188, 0.035312652587890625, 0.04261207580566406, 0.0499114990234375, 0.05721092224121094, 0.06451034545898438, 0.07180976867675781, 0.07910919189453125, 0.08640861511230469, 0.09370803833007812, 0.10100746154785156, 0.108306884765625, 0.11560630798339844, 0.12290573120117188, 0.1302051544189453, 0.13750457763671875, 0.1448040008544922, 0.15210342407226562, 0.15940284729003906, 0.1667022705078125, 0.17400169372558594, 0.18130111694335938, 0.1886005401611328, 0.19589996337890625, 0.2031993865966797, 0.21049880981445312, 0.21779823303222656, 0.22509765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 10.0, 15.0, 20.0, 20.0, 16.0, 19.0, 39.0, 25.0, 47.0, 69.0, 94.0, 129.0, 121.0, 91.0, 50.0, 43.0, 32.0, 33.0, 35.0, 23.0, 16.0, 8.0, 13.0, 3.0, 2.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.875131607055664e-05, -8.468236774206161e-05, -8.061341941356659e-05, -7.654447108507156e-05, -7.247552275657654e-05, -6.840657442808151e-05, -6.433762609958649e-05, -6.026867777109146e-05, -5.6199729442596436e-05, -5.213078111410141e-05, -4.8061832785606384e-05, -4.399288445711136e-05, -3.992393612861633e-05, -3.585498780012131e-05, -3.178603947162628e-05, -2.7717091143131256e-05, -2.364814281463623e-05, -1.9579194486141205e-05, -1.551024615764618e-05, -1.1441297829151154e-05, -7.372349500656128e-06, -3.3034011721611023e-06, 7.655471563339233e-07, 4.834495484828949e-06, 8.903443813323975e-06, 1.2972392141819e-05, 1.7041340470314026e-05, 2.111028879880905e-05, 2.5179237127304077e-05, 2.9248185455799103e-05, 3.331713378429413e-05, 3.7386082112789154e-05, 4.145503044128418e-05, 4.5523978769779205e-05, 4.959292709827423e-05, 5.3661875426769257e-05, 5.773082375526428e-05, 6.179977208375931e-05, 6.586872041225433e-05, 6.993766874074936e-05, 7.400661706924438e-05, 7.807556539773941e-05, 8.214451372623444e-05, 8.621346205472946e-05, 9.028241038322449e-05, 9.435135871171951e-05, 9.842030704021454e-05, 0.00010248925536870956, 0.00010655820369720459, 0.00011062715202569962, 0.00011469610035419464, 0.00011876504868268967, 0.0001228339970111847, 0.00012690294533967972, 0.00013097189366817474, 0.00013504084199666977, 0.0001391097903251648, 0.00014317873865365982, 0.00014724768698215485, 0.00015131663531064987, 0.0001553855836391449, 0.00015945453196763992, 0.00016352348029613495, 0.00016759242862462997, 0.000171661376953125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 16.0, 21.0, 27.0, 44.0, 83.0, 103.0, 204.0, 296.0, 560.0, 1260.0, 3510.0, 12823.0, 64033.0, 648880.0, 264060.0, 39272.0, 8542.0, 2558.0, 1033.0, 516.0, 247.0, 152.0, 95.0, 63.0, 27.0, 42.0, 25.0, 12.0, 9.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.36767578125, -0.3553619384765625, -0.343048095703125, -0.3307342529296875, -0.31842041015625, -0.3061065673828125, -0.293792724609375, -0.2814788818359375, -0.2691650390625, -0.2568511962890625, -0.244537353515625, -0.2322235107421875, -0.21990966796875, -0.2075958251953125, -0.195281982421875, -0.1829681396484375, -0.170654296875, -0.1583404541015625, -0.146026611328125, -0.1337127685546875, -0.12139892578125, -0.1090850830078125, -0.096771240234375, -0.0844573974609375, -0.0721435546875, -0.0598297119140625, -0.047515869140625, -0.0352020263671875, -0.02288818359375, -0.0105743408203125, 0.001739501953125, 0.0140533447265625, 0.0263671875, 0.0386810302734375, 0.050994873046875, 0.0633087158203125, 0.07562255859375, 0.0879364013671875, 0.100250244140625, 0.1125640869140625, 0.1248779296875, 0.1371917724609375, 0.149505615234375, 0.1618194580078125, 0.17413330078125, 0.1864471435546875, 0.198760986328125, 0.2110748291015625, 0.223388671875, 0.2357025146484375, 0.248016357421875, 0.2603302001953125, 0.27264404296875, 0.2849578857421875, 0.297271728515625, 0.3095855712890625, 0.3218994140625, 0.3342132568359375, 0.346527099609375, 0.3588409423828125, 0.37115478515625, 0.3834686279296875, 0.395782470703125, 0.4080963134765625, 0.42041015625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 4.0, 5.0, 5.0, 15.0, 13.0, 14.0, 17.0, 20.0, 33.0, 30.0, 56.0, 56.0, 102.0, 87.0, 92.0, 86.0, 84.0, 53.0, 56.0, 47.0, 32.0, 27.0, 15.0, 11.0, 9.0, 11.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3427734375, -0.3322181701660156, -0.32166290283203125, -0.3111076354980469, -0.3005523681640625, -0.2899971008300781, -0.27944183349609375, -0.2688865661621094, -0.258331298828125, -0.24777603149414062, -0.23722076416015625, -0.22666549682617188, -0.2161102294921875, -0.20555496215820312, -0.19499969482421875, -0.18444442749023438, -0.17388916015625, -0.16333389282226562, -0.15277862548828125, -0.14222335815429688, -0.1316680908203125, -0.12111282348632812, -0.11055755615234375, -0.10000228881835938, -0.089447021484375, -0.07889175415039062, -0.06833648681640625, -0.057781219482421875, -0.0472259521484375, -0.036670684814453125, -0.02611541748046875, -0.015560150146484375, -0.0050048828125, 0.005550384521484375, 0.01610565185546875, 0.026660919189453125, 0.0372161865234375, 0.047771453857421875, 0.05832672119140625, 0.06888198852539062, 0.079437255859375, 0.08999252319335938, 0.10054779052734375, 0.11110305786132812, 0.1216583251953125, 0.13221359252929688, 0.14276885986328125, 0.15332412719726562, 0.16387939453125, 0.17443466186523438, 0.18498992919921875, 0.19554519653320312, 0.2061004638671875, 0.21665573120117188, 0.22721099853515625, 0.23776626586914062, 0.248321533203125, 0.2588768005371094, 0.26943206787109375, 0.2799873352050781, 0.2905426025390625, 0.3010978698730469, 0.31165313720703125, 0.3222084045410156, 0.332763671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 23.0, 35.0, 47.0, 108.0, 247.0, 185.0, 117.0, 86.0, 64.0, 29.0, 19.0, 10.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.926670074462891, -4.664752960205078, -4.402835845947266, -4.140918731689453, -3.8790018558502197, -3.6170847415924072, -3.355167865753174, -3.0932507514953613, -2.831333637237549, -2.5694165229797363, -2.307499408721924, -2.0455825328826904, -1.783665418624878, -1.5217483043670654, -1.2598313093185425, -0.9979143142700195, -0.735997200012207, -0.4740801453590393, -0.21216309070587158, 0.04975396394729614, 0.31167101860046387, 0.5735881328582764, 0.8355051279067993, 1.0974221229553223, 1.3593392372131348, 1.6212563514709473, 1.8831733465194702, 2.145090341567993, 2.4070074558258057, 2.668924570083618, 2.9308414459228516, 3.192758560180664, 3.454676628112793, 3.7165937423706055, 3.978510856628418, 4.2404279708862305, 4.502345085144043, 4.7642621994018555, 5.02617883682251, 5.288095951080322, 5.550013065338135, 5.811930179595947, 6.07384729385376, 6.335764408111572, 6.597681045532227, 6.859598159790039, 7.121515274047852, 7.383432388305664, 7.645349502563477, 7.907266616821289, 8.169183731079102, 8.431100845336914, 8.693017959594727, 8.954935073852539, 9.216852188110352, 9.478769302368164, 9.740686416625977, 10.002603530883789, 10.264520645141602, 10.526437759399414, 10.788354873657227, 11.050271987915039, 11.312189102172852, 11.574106216430664, 11.83602237701416]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 7.0, 7.0, 12.0, 18.0, 14.0, 10.0, 21.0, 20.0, 22.0, 34.0, 23.0, 35.0, 31.0, 61.0, 80.0, 114.0, 101.0, 71.0, 46.0, 39.0, 35.0, 37.0, 31.0, 18.0, 15.0, 15.0, 6.0, 9.0, 18.0, 9.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.058432579040527, -6.841629981994629, -6.6248273849487305, -6.408024787902832, -6.191222190856934, -5.974419593811035, -5.757616996765137, -5.540814399719238, -5.32401180267334, -5.107209205627441, -4.890406608581543, -4.6736040115356445, -4.456801414489746, -4.239998817443848, -4.023196220397949, -3.806393623352051, -3.5895910263061523, -3.372788429260254, -3.1559858322143555, -2.939183235168457, -2.7223806381225586, -2.50557804107666, -2.2887754440307617, -2.0719728469848633, -1.8551702499389648, -1.6383676528930664, -1.421565055847168, -1.2047624588012695, -0.9879598617553711, -0.7711572647094727, -0.5543546676635742, -0.3375520706176758, -0.12074995040893555, 0.09605264663696289, 0.31285524368286133, 0.5296578407287598, 0.7464604377746582, 0.9632630348205566, 1.180065631866455, 1.3968682289123535, 1.613670825958252, 1.8304734230041504, 2.047276020050049, 2.2640786170959473, 2.4808812141418457, 2.697683811187744, 2.9144864082336426, 3.131289005279541, 3.3480916023254395, 3.564894199371338, 3.7816967964172363, 3.9984993934631348, 4.215301990509033, 4.432104587554932, 4.64890718460083, 4.8657097816467285, 5.082512378692627, 5.299314975738525, 5.516117572784424, 5.732920169830322, 5.949722766876221, 6.166525363922119, 6.383327960968018, 6.600130558013916, 6.8169331550598145]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 8.0, 12.0, 10.0, 19.0, 24.0, 27.0, 45.0, 65.0, 104.0, 167.0, 252.0, 420.0, 729.0, 1506.0, 3087.0, 7238.0, 20268.0, 71214.0, 311827.0, 1217560.0, 1750845.0, 606711.0, 144103.0, 37001.0, 12051.0, 4581.0, 2079.0, 1053.0, 488.0, 308.0, 160.0, 117.0, 63.0, 43.0, 28.0, 18.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4404296875, -0.42676544189453125, -0.4131011962890625, -0.39943695068359375, -0.385772705078125, -0.37210845947265625, -0.3584442138671875, -0.34477996826171875, -0.33111572265625, -0.31745147705078125, -0.3037872314453125, -0.29012298583984375, -0.276458740234375, -0.26279449462890625, -0.2491302490234375, -0.23546600341796875, -0.2218017578125, -0.20813751220703125, -0.1944732666015625, -0.18080902099609375, -0.167144775390625, -0.15348052978515625, -0.1398162841796875, -0.12615203857421875, -0.11248779296875, -0.09882354736328125, -0.0851593017578125, -0.07149505615234375, -0.057830810546875, -0.04416656494140625, -0.0305023193359375, -0.01683807373046875, -0.003173828125, 0.01049041748046875, 0.0241546630859375, 0.03781890869140625, 0.051483154296875, 0.06514739990234375, 0.0788116455078125, 0.09247589111328125, 0.10614013671875, 0.11980438232421875, 0.1334686279296875, 0.14713287353515625, 0.160797119140625, 0.17446136474609375, 0.1881256103515625, 0.20178985595703125, 0.2154541015625, 0.22911834716796875, 0.2427825927734375, 0.25644683837890625, 0.270111083984375, 0.28377532958984375, 0.2974395751953125, 0.31110382080078125, 0.32476806640625, 0.33843231201171875, 0.3520965576171875, 0.36576080322265625, 0.379425048828125, 0.39308929443359375, 0.4067535400390625, 0.42041778564453125, 0.43408203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 4.0, 4.0, 10.0, 11.0, 14.0, 25.0, 28.0, 33.0, 48.0, 47.0, 61.0, 51.0, 71.0, 71.0, 51.0, 73.0, 65.0, 59.0, 57.0, 57.0, 35.0, 38.0, 19.0, 20.0, 13.0, 10.0, 8.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.564849853515625, -0.54327392578125, -0.521697998046875, -0.5001220703125, -0.478546142578125, -0.45697021484375, -0.435394287109375, -0.413818359375, -0.392242431640625, -0.37066650390625, -0.349090576171875, -0.3275146484375, -0.305938720703125, -0.28436279296875, -0.262786865234375, -0.2412109375, -0.219635009765625, -0.19805908203125, -0.176483154296875, -0.1549072265625, -0.133331298828125, -0.11175537109375, -0.090179443359375, -0.068603515625, -0.047027587890625, -0.02545166015625, -0.003875732421875, 0.0177001953125, 0.039276123046875, 0.06085205078125, 0.082427978515625, 0.10400390625, 0.125579833984375, 0.14715576171875, 0.168731689453125, 0.1903076171875, 0.211883544921875, 0.23345947265625, 0.255035400390625, 0.276611328125, 0.298187255859375, 0.31976318359375, 0.341339111328125, 0.3629150390625, 0.384490966796875, 0.40606689453125, 0.427642822265625, 0.44921875, 0.470794677734375, 0.49237060546875, 0.513946533203125, 0.5355224609375, 0.557098388671875, 0.57867431640625, 0.600250244140625, 0.621826171875, 0.643402099609375, 0.66497802734375, 0.686553955078125, 0.7081298828125, 0.729705810546875, 0.75128173828125, 0.772857666015625, 0.79443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 13.0, 12.0, 28.0, 39.0, 61.0, 103.0, 207.0, 406.0, 1032.0, 3855.0, 32233.0, 2500595.0, 1625217.0, 25319.0, 3337.0, 959.0, 406.0, 193.0, 101.0, 50.0, 29.0, 30.0, 18.0, 6.0, 7.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4669189453125, -1.416259765625, -1.3656005859375, -1.31494140625, -1.2642822265625, -1.213623046875, -1.1629638671875, -1.1123046875, -1.0616455078125, -1.010986328125, -0.9603271484375, -0.90966796875, -0.8590087890625, -0.808349609375, -0.7576904296875, -0.70703125, -0.6563720703125, -0.605712890625, -0.5550537109375, -0.50439453125, -0.4537353515625, -0.403076171875, -0.3524169921875, -0.3017578125, -0.2510986328125, -0.200439453125, -0.1497802734375, -0.09912109375, -0.0484619140625, 0.002197265625, 0.0528564453125, 0.103515625, 0.1541748046875, 0.204833984375, 0.2554931640625, 0.30615234375, 0.3568115234375, 0.407470703125, 0.4581298828125, 0.5087890625, 0.5594482421875, 0.610107421875, 0.6607666015625, 0.71142578125, 0.7620849609375, 0.812744140625, 0.8634033203125, 0.9140625, 0.9647216796875, 1.015380859375, 1.0660400390625, 1.11669921875, 1.1673583984375, 1.218017578125, 1.2686767578125, 1.3193359375, 1.3699951171875, 1.420654296875, 1.4713134765625, 1.52197265625, 1.5726318359375, 1.623291015625, 1.6739501953125, 1.724609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 9.0, 8.0, 9.0, 15.0, 23.0, 29.0, 43.0, 71.0, 90.0, 143.0, 227.0, 405.0, 602.0, 658.0, 589.0, 415.0, 279.0, 172.0, 111.0, 55.0, 27.0, 29.0, 12.0, 10.0, 15.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.7934188842773438, -0.7611541748046875, -0.7288894653320312, -0.696624755859375, -0.6643600463867188, -0.6320953369140625, -0.5998306274414062, -0.56756591796875, -0.5353012084960938, -0.5030364990234375, -0.47077178955078125, -0.438507080078125, -0.40624237060546875, -0.3739776611328125, -0.34171295166015625, -0.3094482421875, -0.27718353271484375, -0.2449188232421875, -0.21265411376953125, -0.180389404296875, -0.14812469482421875, -0.1158599853515625, -0.08359527587890625, -0.05133056640625, -0.01906585693359375, 0.0131988525390625, 0.04546356201171875, 0.077728271484375, 0.10999298095703125, 0.1422576904296875, 0.17452239990234375, 0.206787109375, 0.23905181884765625, 0.2713165283203125, 0.30358123779296875, 0.335845947265625, 0.36811065673828125, 0.4003753662109375, 0.43264007568359375, 0.46490478515625, 0.49716949462890625, 0.5294342041015625, 0.5616989135742188, 0.593963623046875, 0.6262283325195312, 0.6584930419921875, 0.6907577514648438, 0.7230224609375, 0.7552871704101562, 0.7875518798828125, 0.8198165893554688, 0.852081298828125, 0.8843460083007812, 0.9166107177734375, 0.9488754272460938, 0.98114013671875, 1.0134048461914062, 1.0456695556640625, 1.0779342651367188, 1.110198974609375, 1.1424636840820312, 1.1747283935546875, 1.2069931030273438, 1.2392578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 9.0, 10.0, 17.0, 21.0, 42.0, 83.0, 139.0, 167.0, 171.0, 129.0, 78.0, 49.0, 25.0, 16.0, 12.0, 9.0, 13.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.989684104919434, -10.714859008789062, -10.440033912658691, -10.16520881652832, -9.89038372039795, -9.615558624267578, -9.34073257446289, -9.06590747833252, -8.791082382202148, -8.516257286071777, -8.241432189941406, -7.966607093811035, -7.691781520843506, -7.416956424713135, -7.142131328582764, -6.867306232452393, -6.5924811363220215, -6.31765604019165, -6.042830944061279, -5.76800537109375, -5.493180274963379, -5.218355178833008, -4.943530082702637, -4.668704986572266, -4.3938798904418945, -4.119054794311523, -3.8442294597625732, -3.569404363632202, -3.294579029083252, -3.019753932952881, -2.7449288368225098, -2.4701037406921387, -2.1952786445617676, -1.920453429222107, -1.6456282138824463, -1.3708031177520752, -1.0959779024124146, -0.8211526870727539, -0.5463275909423828, -0.27150237560272217, 0.0033228397369384766, 0.27814802527427673, 0.552973210811615, 0.8277983665466309, 1.1026235818862915, 1.3774487972259521, 1.6522738933563232, 1.9270991086959839, 2.2019243240356445, 2.4767494201660156, 2.751574754714966, 3.026399850845337, 3.301225185394287, 3.576050281524658, 3.8508753776550293, 4.1257004737854, 4.40052604675293, 4.675351142883301, 4.950176239013672, 5.225001335144043, 5.499826908111572, 5.774652004241943, 6.0494771003723145, 6.3243021965026855, 6.599127292633057]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 9.0, 12.0, 21.0, 22.0, 21.0, 34.0, 31.0, 32.0, 45.0, 41.0, 40.0, 47.0, 37.0, 35.0, 38.0, 37.0, 37.0, 42.0, 42.0, 53.0, 35.0, 36.0, 29.0, 29.0, 20.0, 25.0, 18.0, 9.0, 13.0, 19.0, 7.0, 14.0, 5.0, 2.0, 2.0, 3.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.031878471374512, -3.915288209915161, -3.7986979484558105, -3.682107448577881, -3.5655171871185303, -3.4489269256591797, -3.332336664199829, -3.2157464027404785, -3.099155902862549, -2.9825656414031982, -2.8659753799438477, -2.749384880065918, -2.6327946186065674, -2.516204357147217, -2.399614095687866, -2.2830238342285156, -2.166433572769165, -2.0498433113098145, -1.9332529306411743, -1.8166626691818237, -1.7000722885131836, -1.583482027053833, -1.4668917655944824, -1.3503015041351318, -1.2337111234664917, -1.1171208620071411, -1.000530481338501, -0.8839402198791504, -0.767349898815155, -0.6507595777511597, -0.5341693162918091, -0.4175789952278137, -0.30098843574523926, -0.1843981295824051, -0.06780782341957092, 0.04878246784210205, 0.1653727889060974, 0.2819631099700928, 0.39855337142944336, 0.5151436924934387, 0.6317340135574341, 0.7483243346214294, 0.8649146556854248, 0.9815049171447754, 1.098095178604126, 1.2146855592727661, 1.3312758207321167, 1.4478662014007568, 1.5644564628601074, 1.681046724319458, 1.7976371049880981, 1.9142273664474487, 2.030817747116089, 2.1474080085754395, 2.26399827003479, 2.3805885314941406, 2.4971790313720703, 2.613769292831421, 2.7303595542907715, 2.846950054168701, 2.9635403156280518, 3.0801305770874023, 3.196720838546753, 3.3133111000061035, 3.429901361465454]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 3.0, 12.0, 10.0, 21.0, 33.0, 43.0, 79.0, 118.0, 240.0, 421.0, 915.0, 1832.0, 4164.0, 10838.0, 30423.0, 101628.0, 363080.0, 377098.0, 106814.0, 31449.0, 10938.0, 4443.0, 1928.0, 940.0, 444.0, 255.0, 150.0, 77.0, 52.0, 25.0, 26.0, 19.0, 16.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1505889892578125, -1.114654541015625, -1.0787200927734375, -1.04278564453125, -1.0068511962890625, -0.970916748046875, -0.9349822998046875, -0.8990478515625, -0.8631134033203125, -0.827178955078125, -0.7912445068359375, -0.75531005859375, -0.7193756103515625, -0.683441162109375, -0.6475067138671875, -0.611572265625, -0.5756378173828125, -0.539703369140625, -0.5037689208984375, -0.46783447265625, -0.4319000244140625, -0.395965576171875, -0.3600311279296875, -0.3240966796875, -0.2881622314453125, -0.252227783203125, -0.2162933349609375, -0.18035888671875, -0.1444244384765625, -0.108489990234375, -0.0725555419921875, -0.03662109375, -0.0006866455078125, 0.035247802734375, 0.0711822509765625, 0.10711669921875, 0.1430511474609375, 0.178985595703125, 0.2149200439453125, 0.2508544921875, 0.2867889404296875, 0.322723388671875, 0.3586578369140625, 0.39459228515625, 0.4305267333984375, 0.466461181640625, 0.5023956298828125, 0.538330078125, 0.5742645263671875, 0.610198974609375, 0.6461334228515625, 0.68206787109375, 0.7180023193359375, 0.753936767578125, 0.7898712158203125, 0.8258056640625, 0.8617401123046875, 0.897674560546875, 0.9336090087890625, 0.96954345703125, 1.0054779052734375, 1.041412353515625, 1.0773468017578125, 1.11328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 9.0, 12.0, 13.0, 17.0, 23.0, 34.0, 27.0, 40.0, 57.0, 54.0, 64.0, 68.0, 66.0, 68.0, 73.0, 56.0, 77.0, 48.0, 44.0, 33.0, 36.0, 18.0, 18.0, 10.0, 13.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5726165771484375, -0.550506591796875, -0.5283966064453125, -0.50628662109375, -0.4841766357421875, -0.462066650390625, -0.4399566650390625, -0.4178466796875, -0.3957366943359375, -0.373626708984375, -0.3515167236328125, -0.32940673828125, -0.3072967529296875, -0.285186767578125, -0.2630767822265625, -0.240966796875, -0.2188568115234375, -0.196746826171875, -0.1746368408203125, -0.15252685546875, -0.1304168701171875, -0.108306884765625, -0.0861968994140625, -0.0640869140625, -0.0419769287109375, -0.019866943359375, 0.0022430419921875, 0.02435302734375, 0.0464630126953125, 0.068572998046875, 0.0906829833984375, 0.11279296875, 0.1349029541015625, 0.157012939453125, 0.1791229248046875, 0.20123291015625, 0.2233428955078125, 0.245452880859375, 0.2675628662109375, 0.2896728515625, 0.3117828369140625, 0.333892822265625, 0.3560028076171875, 0.37811279296875, 0.4002227783203125, 0.422332763671875, 0.4444427490234375, 0.466552734375, 0.4886627197265625, 0.510772705078125, 0.5328826904296875, 0.55499267578125, 0.5771026611328125, 0.599212646484375, 0.6213226318359375, 0.6434326171875, 0.6655426025390625, 0.687652587890625, 0.7097625732421875, 0.73187255859375, 0.7539825439453125, 0.776092529296875, 0.7982025146484375, 0.8203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 15.0, 18.0, 35.0, 30.0, 45.0, 81.0, 124.0, 141.0, 221.0, 337.0, 515.0, 849.0, 1808.0, 4769.0, 21223.0, 164704.0, 760603.0, 74869.0, 11712.0, 3102.0, 1285.0, 715.0, 446.0, 300.0, 164.0, 122.0, 81.0, 58.0, 55.0, 29.0, 24.0, 13.0, 18.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.513671875, -1.4620513916015625, -1.410430908203125, -1.3588104248046875, -1.30718994140625, -1.2555694580078125, -1.203948974609375, -1.1523284912109375, -1.1007080078125, -1.0490875244140625, -0.997467041015625, -0.9458465576171875, -0.89422607421875, -0.8426055908203125, -0.790985107421875, -0.7393646240234375, -0.687744140625, -0.6361236572265625, -0.584503173828125, -0.5328826904296875, -0.48126220703125, -0.4296417236328125, -0.378021240234375, -0.3264007568359375, -0.2747802734375, -0.2231597900390625, -0.171539306640625, -0.1199188232421875, -0.06829833984375, -0.0166778564453125, 0.034942626953125, 0.0865631103515625, 0.13818359375, 0.1898040771484375, 0.241424560546875, 0.2930450439453125, 0.34466552734375, 0.3962860107421875, 0.447906494140625, 0.4995269775390625, 0.5511474609375, 0.6027679443359375, 0.654388427734375, 0.7060089111328125, 0.75762939453125, 0.8092498779296875, 0.860870361328125, 0.9124908447265625, 0.964111328125, 1.0157318115234375, 1.067352294921875, 1.1189727783203125, 1.17059326171875, 1.2222137451171875, 1.273834228515625, 1.3254547119140625, 1.3770751953125, 1.4286956787109375, 1.480316162109375, 1.5319366455078125, 1.58355712890625, 1.6351776123046875, 1.686798095703125, 1.7384185791015625, 1.7900390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 13.0, 9.0, 11.0, 14.0, 13.0, 25.0, 26.0, 23.0, 33.0, 34.0, 39.0, 53.0, 58.0, 58.0, 60.0, 60.0, 49.0, 57.0, 47.0, 39.0, 51.0, 41.0, 24.0, 31.0, 32.0, 22.0, 13.0, 9.0, 12.0, 4.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.828765869140625, -1.76885986328125, -1.708953857421875, -1.6490478515625, -1.589141845703125, -1.52923583984375, -1.469329833984375, -1.409423828125, -1.349517822265625, -1.28961181640625, -1.229705810546875, -1.1697998046875, -1.109893798828125, -1.04998779296875, -0.990081787109375, -0.93017578125, -0.870269775390625, -0.81036376953125, -0.750457763671875, -0.6905517578125, -0.630645751953125, -0.57073974609375, -0.510833740234375, -0.450927734375, -0.391021728515625, -0.33111572265625, -0.271209716796875, -0.2113037109375, -0.151397705078125, -0.09149169921875, -0.031585693359375, 0.0283203125, 0.088226318359375, 0.14813232421875, 0.208038330078125, 0.2679443359375, 0.327850341796875, 0.38775634765625, 0.447662353515625, 0.507568359375, 0.567474365234375, 0.62738037109375, 0.687286376953125, 0.7471923828125, 0.807098388671875, 0.86700439453125, 0.926910400390625, 0.98681640625, 1.046722412109375, 1.10662841796875, 1.166534423828125, 1.2264404296875, 1.286346435546875, 1.34625244140625, 1.406158447265625, 1.466064453125, 1.525970458984375, 1.58587646484375, 1.645782470703125, 1.7056884765625, 1.765594482421875, 1.82550048828125, 1.885406494140625, 1.9453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 8.0, 2.0, 1.0, 9.0, 10.0, 11.0, 4.0, 13.0, 20.0, 22.0, 27.0, 50.0, 57.0, 87.0, 128.0, 229.0, 312.0, 560.0, 1015.0, 2094.0, 4749.0, 13322.0, 45670.0, 194862.0, 656809.0, 90529.0, 23753.0, 7791.0, 2996.0, 1435.0, 771.0, 423.0, 255.0, 145.0, 107.0, 65.0, 49.0, 41.0, 29.0, 30.0, 16.0, 11.0, 8.0, 12.0, 7.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.328857421875, -0.3189659118652344, -0.30907440185546875, -0.2991828918457031, -0.2892913818359375, -0.2793998718261719, -0.26950836181640625, -0.2596168518066406, -0.249725341796875, -0.23983383178710938, -0.22994232177734375, -0.22005081176757812, -0.2101593017578125, -0.20026779174804688, -0.19037628173828125, -0.18048477172851562, -0.17059326171875, -0.16070175170898438, -0.15081024169921875, -0.14091873168945312, -0.1310272216796875, -0.12113571166992188, -0.11124420166015625, -0.10135269165039062, -0.091461181640625, -0.08156967163085938, -0.07167816162109375, -0.061786651611328125, -0.0518951416015625, -0.042003631591796875, -0.03211212158203125, -0.022220611572265625, -0.0123291015625, -0.002437591552734375, 0.00745391845703125, 0.017345428466796875, 0.0272369384765625, 0.037128448486328125, 0.04701995849609375, 0.056911468505859375, 0.066802978515625, 0.07669448852539062, 0.08658599853515625, 0.09647750854492188, 0.1063690185546875, 0.11626052856445312, 0.12615203857421875, 0.13604354858398438, 0.14593505859375, 0.15582656860351562, 0.16571807861328125, 0.17560958862304688, 0.1855010986328125, 0.19539260864257812, 0.20528411865234375, 0.21517562866210938, 0.225067138671875, 0.23495864868164062, 0.24485015869140625, 0.2547416687011719, 0.2646331787109375, 0.2745246887207031, 0.28441619873046875, 0.2943077087402344, 0.30419921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 15.0, 17.0, 26.0, 50.0, 73.0, 125.0, 227.0, 169.0, 117.0, 63.0, 34.0, 20.0, 10.0, 12.0, 7.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002734661102294922, -0.0002648457884788513, -0.00025622546672821045, -0.0002476051449775696, -0.0002389848232269287, -0.00023036450147628784, -0.00022174417972564697, -0.0002131238579750061, -0.00020450353622436523, -0.00019588321447372437, -0.0001872628927230835, -0.00017864257097244263, -0.00017002224922180176, -0.0001614019274711609, -0.00015278160572052002, -0.00014416128396987915, -0.00013554096221923828, -0.0001269206404685974, -0.00011830031871795654, -0.00010967999696731567, -0.0001010596752166748, -9.243935346603394e-05, -8.381903171539307e-05, -7.51987099647522e-05, -6.657838821411133e-05, -5.795806646347046e-05, -4.933774471282959e-05, -4.071742296218872e-05, -3.209710121154785e-05, -2.3476779460906982e-05, -1.4856457710266113e-05, -6.236135959625244e-06, 2.384185791015625e-06, 1.1004507541656494e-05, 1.9624829292297363e-05, 2.8245151042938232e-05, 3.68654727935791e-05, 4.548579454421997e-05, 5.410611629486084e-05, 6.272643804550171e-05, 7.134675979614258e-05, 7.996708154678345e-05, 8.858740329742432e-05, 9.720772504806519e-05, 0.00010582804679870605, 0.00011444836854934692, 0.0001230686902999878, 0.00013168901205062866, 0.00014030933380126953, 0.0001489296555519104, 0.00015754997730255127, 0.00016617029905319214, 0.000174790620803833, 0.00018341094255447388, 0.00019203126430511475, 0.00020065158605575562, 0.00020927190780639648, 0.00021789222955703735, 0.00022651255130767822, 0.0002351328730583191, 0.00024375319480895996, 0.00025237351655960083, 0.0002609938383102417, 0.00026961416006088257, 0.00027823448181152344]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 12.0, 14.0, 16.0, 24.0, 24.0, 49.0, 71.0, 111.0, 205.0, 320.0, 709.0, 1765.0, 5735.0, 28629.0, 264249.0, 691040.0, 43911.0, 7710.0, 2122.0, 810.0, 400.0, 230.0, 135.0, 63.0, 54.0, 48.0, 19.0, 19.0, 12.0, 12.0, 10.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.50634765625, -0.4923248291015625, -0.478302001953125, -0.4642791748046875, -0.45025634765625, -0.4362335205078125, -0.422210693359375, -0.4081878662109375, -0.3941650390625, -0.3801422119140625, -0.366119384765625, -0.3520965576171875, -0.33807373046875, -0.3240509033203125, -0.310028076171875, -0.2960052490234375, -0.281982421875, -0.2679595947265625, -0.253936767578125, -0.2399139404296875, -0.22589111328125, -0.2118682861328125, -0.197845458984375, -0.1838226318359375, -0.1697998046875, -0.1557769775390625, -0.141754150390625, -0.1277313232421875, -0.11370849609375, -0.0996856689453125, -0.085662841796875, -0.0716400146484375, -0.0576171875, -0.0435943603515625, -0.029571533203125, -0.0155487060546875, -0.00152587890625, 0.0124969482421875, 0.026519775390625, 0.0405426025390625, 0.0545654296875, 0.0685882568359375, 0.082611083984375, 0.0966339111328125, 0.11065673828125, 0.1246795654296875, 0.138702392578125, 0.1527252197265625, 0.166748046875, 0.1807708740234375, 0.194793701171875, 0.2088165283203125, 0.22283935546875, 0.2368621826171875, 0.250885009765625, 0.2649078369140625, 0.2789306640625, 0.2929534912109375, 0.306976318359375, 0.3209991455078125, 0.33502197265625, 0.3490447998046875, 0.363067626953125, 0.3770904541015625, 0.39111328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 11.0, 9.0, 14.0, 19.0, 20.0, 22.0, 39.0, 50.0, 60.0, 79.0, 96.0, 85.0, 79.0, 80.0, 71.0, 51.0, 50.0, 28.0, 28.0, 19.0, 10.0, 12.0, 9.0, 14.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281494140625, -0.271392822265625, -0.26129150390625, -0.251190185546875, -0.2410888671875, -0.230987548828125, -0.22088623046875, -0.210784912109375, -0.20068359375, -0.190582275390625, -0.18048095703125, -0.170379638671875, -0.1602783203125, -0.150177001953125, -0.14007568359375, -0.129974365234375, -0.119873046875, -0.109771728515625, -0.09967041015625, -0.089569091796875, -0.0794677734375, -0.069366455078125, -0.05926513671875, -0.049163818359375, -0.0390625, -0.028961181640625, -0.01885986328125, -0.008758544921875, 0.0013427734375, 0.011444091796875, 0.02154541015625, 0.031646728515625, 0.041748046875, 0.051849365234375, 0.06195068359375, 0.072052001953125, 0.0821533203125, 0.092254638671875, 0.10235595703125, 0.112457275390625, 0.12255859375, 0.132659912109375, 0.14276123046875, 0.152862548828125, 0.1629638671875, 0.173065185546875, 0.18316650390625, 0.193267822265625, 0.203369140625, 0.213470458984375, 0.22357177734375, 0.233673095703125, 0.2437744140625, 0.253875732421875, 0.26397705078125, 0.274078369140625, 0.2841796875, 0.294281005859375, 0.30438232421875, 0.314483642578125, 0.3245849609375, 0.334686279296875, 0.34478759765625, 0.354888916015625, 0.364990234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 18.0, 47.0, 108.0, 404.0, 238.0, 103.0, 38.0, 23.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.926727294921875, -12.384035110473633, -11.841343879699707, -11.298652648925781, -10.755960464477539, -10.213268280029297, -9.670577049255371, -9.127885818481445, -8.585193634033203, -8.042501449584961, -7.499810218811035, -6.957118511199951, -6.414426803588867, -5.871735095977783, -5.329043388366699, -4.786351680755615, -4.243659973144531, -3.7009682655334473, -3.1582765579223633, -2.6155848503112793, -2.0728931427001953, -1.5302014350891113, -0.9875097274780273, -0.44481801986694336, 0.09787368774414062, 0.6405653953552246, 1.1832571029663086, 1.7259488105773926, 2.2686405181884766, 2.8113322257995605, 3.3540239334106445, 3.8967156410217285, 4.4394073486328125, 4.9820990562438965, 5.5247907638549805, 6.0674824714660645, 6.610174179077148, 7.152865886688232, 7.695557594299316, 8.238248825073242, 8.780941009521484, 9.323633193969727, 9.866324424743652, 10.409015655517578, 10.95170783996582, 11.494400024414062, 12.037091255187988, 12.579782485961914, 13.122474670410156, 13.665166854858398, 14.207858085632324, 14.75054931640625, 15.293241500854492, 15.835933685302734, 16.378623962402344, 16.921316146850586, 17.464008331298828, 18.00670051574707, 18.549392700195312, 19.092082977294922, 19.634775161743164, 20.177467346191406, 20.720157623291016, 21.262849807739258, 21.8055419921875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 7.0, 9.0, 8.0, 14.0, 9.0, 17.0, 15.0, 34.0, 22.0, 35.0, 50.0, 25.0, 46.0, 67.0, 112.0, 140.0, 72.0, 40.0, 40.0, 44.0, 30.0, 22.0, 18.0, 11.0, 14.0, 14.0, 13.0, 7.0, 12.0, 5.0, 6.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.515538215637207, -5.303569316864014, -5.09160041809082, -4.879631519317627, -4.667662620544434, -4.455694198608398, -4.243725299835205, -4.031756401062012, -3.8197875022888184, -3.607818603515625, -3.3958497047424316, -3.1838810443878174, -2.971912145614624, -2.7599432468414307, -2.5479745864868164, -2.336005687713623, -2.1240367889404297, -1.9120678901672363, -1.7000991106033325, -1.4881303310394287, -1.2761614322662354, -1.064192533493042, -0.8522237539291382, -0.6402549743652344, -0.428286075592041, -0.21631723642349243, -0.004348397254943848, 0.20762044191360474, 0.4195892810821533, 0.6315581798553467, 0.8435269594192505, 1.0554957389831543, 1.2674646377563477, 1.479433536529541, 1.6914023160934448, 1.9033710956573486, 2.115339994430542, 2.3273088932037354, 2.5392775535583496, 2.751246452331543, 2.9632153511047363, 3.1751842498779297, 3.387153148651123, 3.5991218090057373, 3.8110907077789307, 4.023059844970703, 4.235028266906738, 4.446997165679932, 4.658966064453125, 4.870934963226318, 5.082903861999512, 5.294872760772705, 5.506841659545898, 5.718810081481934, 5.930778980255127, 6.14274787902832, 6.354716777801514, 6.566685676574707, 6.7786545753479, 6.990623474121094, 7.202591896057129, 7.4145612716674805, 7.626529693603516, 7.838498592376709, 8.050467491149902]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 2.0, 5.0, 8.0, 16.0, 22.0, 39.0, 64.0, 129.0, 224.0, 513.0, 1052.0, 2481.0, 8209.0, 42842.0, 449865.0, 2630525.0, 955178.0, 83239.0, 13707.0, 3641.0, 1316.0, 574.0, 281.0, 151.0, 84.0, 41.0, 23.0, 19.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3974609375, -1.3639144897460938, -1.3303680419921875, -1.2968215942382812, -1.263275146484375, -1.2297286987304688, -1.1961822509765625, -1.1626358032226562, -1.12908935546875, -1.0955429077148438, -1.0619964599609375, -1.0284500122070312, -0.994903564453125, -0.9613571166992188, -0.9278106689453125, -0.8942642211914062, -0.8607177734375, -0.8271713256835938, -0.7936248779296875, -0.7600784301757812, -0.726531982421875, -0.6929855346679688, -0.6594390869140625, -0.6258926391601562, -0.59234619140625, -0.5587997436523438, -0.5252532958984375, -0.49170684814453125, -0.458160400390625, -0.42461395263671875, -0.3910675048828125, -0.35752105712890625, -0.323974609375, -0.29042816162109375, -0.2568817138671875, -0.22333526611328125, -0.189788818359375, -0.15624237060546875, -0.1226959228515625, -0.08914947509765625, -0.05560302734375, -0.02205657958984375, 0.0114898681640625, 0.04503631591796875, 0.078582763671875, 0.11212921142578125, 0.1456756591796875, 0.17922210693359375, 0.2127685546875, 0.24631500244140625, 0.2798614501953125, 0.31340789794921875, 0.346954345703125, 0.38050079345703125, 0.4140472412109375, 0.44759368896484375, 0.48114013671875, 0.5146865844726562, 0.5482330322265625, 0.5817794799804688, 0.615325927734375, 0.6488723754882812, 0.6824188232421875, 0.7159652709960938, 0.74951171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 12.0, 15.0, 22.0, 24.0, 43.0, 42.0, 53.0, 62.0, 65.0, 84.0, 88.0, 69.0, 66.0, 65.0, 63.0, 45.0, 46.0, 29.0, 23.0, 20.0, 16.0, 19.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6741256713867188, -0.6514739990234375, -0.6288223266601562, -0.606170654296875, -0.5835189819335938, -0.5608673095703125, -0.5382156372070312, -0.51556396484375, -0.49291229248046875, -0.4702606201171875, -0.44760894775390625, -0.424957275390625, -0.40230560302734375, -0.3796539306640625, -0.35700225830078125, -0.3343505859375, -0.31169891357421875, -0.2890472412109375, -0.26639556884765625, -0.243743896484375, -0.22109222412109375, -0.1984405517578125, -0.17578887939453125, -0.15313720703125, -0.13048553466796875, -0.1078338623046875, -0.08518218994140625, -0.062530517578125, -0.03987884521484375, -0.0172271728515625, 0.00542449951171875, 0.028076171875, 0.05072784423828125, 0.0733795166015625, 0.09603118896484375, 0.118682861328125, 0.14133453369140625, 0.1639862060546875, 0.18663787841796875, 0.20928955078125, 0.23194122314453125, 0.2545928955078125, 0.27724456787109375, 0.299896240234375, 0.32254791259765625, 0.3451995849609375, 0.36785125732421875, 0.3905029296875, 0.41315460205078125, 0.4358062744140625, 0.45845794677734375, 0.481109619140625, 0.5037612915039062, 0.5264129638671875, 0.5490646362304688, 0.57171630859375, 0.5943679809570312, 0.6170196533203125, 0.6396713256835938, 0.662322998046875, 0.6849746704101562, 0.7076263427734375, 0.7302780151367188, 0.7529296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 15.0, 24.0, 38.0, 64.0, 123.0, 267.0, 539.0, 1465.0, 6464.0, 559507.0, 3612858.0, 9861.0, 1821.0, 615.0, 287.0, 138.0, 63.0, 51.0, 21.0, 21.0, 6.0, 6.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.58001708984375, -4.4373779296875, -4.29473876953125, -4.152099609375, -4.00946044921875, -3.8668212890625, -3.72418212890625, -3.58154296875, -3.43890380859375, -3.2962646484375, -3.15362548828125, -3.010986328125, -2.86834716796875, -2.7257080078125, -2.58306884765625, -2.4404296875, -2.29779052734375, -2.1551513671875, -2.01251220703125, -1.869873046875, -1.72723388671875, -1.5845947265625, -1.44195556640625, -1.29931640625, -1.15667724609375, -1.0140380859375, -0.87139892578125, -0.728759765625, -0.58612060546875, -0.4434814453125, -0.30084228515625, -0.158203125, -0.01556396484375, 0.1270751953125, 0.26971435546875, 0.412353515625, 0.55499267578125, 0.6976318359375, 0.84027099609375, 0.98291015625, 1.12554931640625, 1.2681884765625, 1.41082763671875, 1.553466796875, 1.69610595703125, 1.8387451171875, 1.98138427734375, 2.1240234375, 2.26666259765625, 2.4093017578125, 2.55194091796875, 2.694580078125, 2.83721923828125, 2.9798583984375, 3.12249755859375, 3.26513671875, 3.40777587890625, 3.5504150390625, 3.69305419921875, 3.835693359375, 3.97833251953125, 4.1209716796875, 4.26361083984375, 4.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 10.0, 17.0, 23.0, 32.0, 59.0, 134.0, 211.0, 356.0, 591.0, 849.0, 741.0, 462.0, 216.0, 141.0, 100.0, 43.0, 25.0, 18.0, 10.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.854095458984375, -2.77655029296875, -2.699005126953125, -2.6214599609375, -2.543914794921875, -2.46636962890625, -2.388824462890625, -2.311279296875, -2.233734130859375, -2.15618896484375, -2.078643798828125, -2.0010986328125, -1.923553466796875, -1.84600830078125, -1.768463134765625, -1.69091796875, -1.613372802734375, -1.53582763671875, -1.458282470703125, -1.3807373046875, -1.303192138671875, -1.22564697265625, -1.148101806640625, -1.070556640625, -0.993011474609375, -0.91546630859375, -0.837921142578125, -0.7603759765625, -0.682830810546875, -0.60528564453125, -0.527740478515625, -0.4501953125, -0.372650146484375, -0.29510498046875, -0.217559814453125, -0.1400146484375, -0.062469482421875, 0.01507568359375, 0.092620849609375, 0.170166015625, 0.247711181640625, 0.32525634765625, 0.402801513671875, 0.4803466796875, 0.557891845703125, 0.63543701171875, 0.712982177734375, 0.79052734375, 0.868072509765625, 0.94561767578125, 1.023162841796875, 1.1007080078125, 1.178253173828125, 1.25579833984375, 1.333343505859375, 1.410888671875, 1.488433837890625, 1.56597900390625, 1.643524169921875, 1.7210693359375, 1.798614501953125, 1.87615966796875, 1.953704833984375, 2.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 11.0, 20.0, 56.0, 107.0, 184.0, 233.0, 178.0, 100.0, 53.0, 17.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.60967254638672, -33.83175277709961, -33.0538330078125, -32.275917053222656, -31.497997283935547, -30.720077514648438, -29.94215965270996, -29.164241790771484, -28.386322021484375, -27.608402252197266, -26.83048439025879, -26.052566528320312, -25.274646759033203, -24.496726989746094, -23.718809127807617, -22.94089126586914, -22.16297149658203, -21.385051727294922, -20.607133865356445, -19.82921600341797, -19.05129623413086, -18.27337646484375, -17.495458602905273, -16.717540740966797, -15.939620971679688, -15.161702156066895, -14.383783340454102, -13.605864524841309, -12.827945709228516, -12.050026893615723, -11.27210807800293, -10.494189262390137, -9.716272354125977, -8.938353538513184, -8.16043472290039, -7.382515907287598, -6.604597091674805, -5.826678276062012, -5.048759460449219, -4.270840644836426, -3.492921829223633, -2.71500301361084, -1.9370841979980469, -1.159165382385254, -0.38124656677246094, 0.39667224884033203, 1.174591064453125, 1.952509880065918, 2.730428695678711, 3.508347511291504, 4.286266326904297, 5.06418514251709, 5.842103958129883, 6.620022773742676, 7.397941589355469, 8.175860404968262, 8.953779220581055, 9.731698036193848, 10.50961685180664, 11.287535667419434, 12.065454483032227, 12.84337329864502, 13.621292114257812, 14.399210929870605, 15.177129745483398]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 3.0, 11.0, 8.0, 13.0, 13.0, 7.0, 20.0, 19.0, 29.0, 26.0, 27.0, 32.0, 33.0, 43.0, 48.0, 47.0, 51.0, 57.0, 72.0, 48.0, 57.0, 57.0, 44.0, 46.0, 31.0, 31.0, 28.0, 14.0, 14.0, 18.0, 7.0, 9.0, 8.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.906109809875488, -10.568514823913574, -10.230918884277344, -9.89332389831543, -9.5557279586792, -9.218132972717285, -8.880537033081055, -8.54294204711914, -8.205347061157227, -7.867751598358154, -7.530156135559082, -7.192561149597168, -6.8549652099609375, -6.517370223999023, -6.179774761199951, -5.842179298400879, -5.504583358764648, -5.166987895965576, -4.829392433166504, -4.49179744720459, -4.154201507568359, -3.816606283187866, -3.479011058807373, -3.141415596008301, -2.8038201332092285, -2.4662246704101562, -2.128629207611084, -1.7910339832305908, -1.4534385204315186, -1.1158430576324463, -0.7782478332519531, -0.44065237045288086, -0.10305595397949219, 0.2345394492149353, 0.5721348524093628, 0.9097301959991455, 1.2473256587982178, 1.58492112159729, 1.9225163459777832, 2.2601118087768555, 2.5977072715759277, 2.935302734375, 3.2728981971740723, 3.6104934215545654, 3.9480888843536377, 4.285684585571289, 4.623279571533203, 4.960875034332275, 5.298470497131348, 5.63606595993042, 5.973661422729492, 6.311256408691406, 6.648852348327637, 6.986447334289551, 7.324042797088623, 7.661638259887695, 7.999233722686768, 8.33682918548584, 8.674424171447754, 9.012020111083984, 9.349615097045898, 9.687211036682129, 10.024806022644043, 10.362401962280273, 10.699996948242188]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 16.0, 16.0, 35.0, 37.0, 89.0, 168.0, 372.0, 1017.0, 3030.0, 12202.0, 104381.0, 820031.0, 91507.0, 11045.0, 2842.0, 969.0, 370.0, 197.0, 80.0, 38.0, 41.0, 18.0, 12.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.8203125, -2.74700927734375, -2.6737060546875, -2.60040283203125, -2.527099609375, -2.45379638671875, -2.3804931640625, -2.30718994140625, -2.23388671875, -2.16058349609375, -2.0872802734375, -2.01397705078125, -1.940673828125, -1.86737060546875, -1.7940673828125, -1.72076416015625, -1.6474609375, -1.57415771484375, -1.5008544921875, -1.42755126953125, -1.354248046875, -1.28094482421875, -1.2076416015625, -1.13433837890625, -1.06103515625, -0.98773193359375, -0.9144287109375, -0.84112548828125, -0.767822265625, -0.69451904296875, -0.6212158203125, -0.54791259765625, -0.474609375, -0.40130615234375, -0.3280029296875, -0.25469970703125, -0.181396484375, -0.10809326171875, -0.0347900390625, 0.03851318359375, 0.11181640625, 0.18511962890625, 0.2584228515625, 0.33172607421875, 0.405029296875, 0.47833251953125, 0.5516357421875, 0.62493896484375, 0.6982421875, 0.77154541015625, 0.8448486328125, 0.91815185546875, 0.991455078125, 1.06475830078125, 1.1380615234375, 1.21136474609375, 1.28466796875, 1.35797119140625, 1.4312744140625, 1.50457763671875, 1.577880859375, 1.65118408203125, 1.7244873046875, 1.79779052734375, 1.87109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 9.0, 26.0, 19.0, 30.0, 33.0, 39.0, 40.0, 60.0, 89.0, 73.0, 81.0, 71.0, 81.0, 71.0, 52.0, 58.0, 45.0, 40.0, 25.0, 20.0, 8.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2080078125, -1.1775970458984375, -1.147186279296875, -1.1167755126953125, -1.08636474609375, -1.0559539794921875, -1.025543212890625, -0.9951324462890625, -0.9647216796875, -0.9343109130859375, -0.903900146484375, -0.8734893798828125, -0.84307861328125, -0.8126678466796875, -0.782257080078125, -0.7518463134765625, -0.721435546875, -0.6910247802734375, -0.660614013671875, -0.6302032470703125, -0.59979248046875, -0.5693817138671875, -0.538970947265625, -0.5085601806640625, -0.4781494140625, -0.4477386474609375, -0.417327880859375, -0.3869171142578125, -0.35650634765625, -0.3260955810546875, -0.295684814453125, -0.2652740478515625, -0.23486328125, -0.2044525146484375, -0.174041748046875, -0.1436309814453125, -0.11322021484375, -0.0828094482421875, -0.052398681640625, -0.0219879150390625, 0.0084228515625, 0.0388336181640625, 0.069244384765625, 0.0996551513671875, 0.13006591796875, 0.1604766845703125, 0.190887451171875, 0.2212982177734375, 0.251708984375, 0.2821197509765625, 0.312530517578125, 0.3429412841796875, 0.37335205078125, 0.4037628173828125, 0.434173583984375, 0.4645843505859375, 0.4949951171875, 0.5254058837890625, 0.555816650390625, 0.5862274169921875, 0.61663818359375, 0.6470489501953125, 0.677459716796875, 0.7078704833984375, 0.73828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 17.0, 15.0, 24.0, 19.0, 37.0, 56.0, 56.0, 98.0, 163.0, 236.0, 445.0, 805.0, 1754.0, 4506.0, 18602.0, 146347.0, 821745.0, 40251.0, 8097.0, 2618.0, 1111.0, 554.0, 295.0, 200.0, 141.0, 91.0, 76.0, 52.0, 34.0, 21.0, 17.0, 19.0, 9.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4482421875, -1.404632568359375, -1.36102294921875, -1.317413330078125, -1.2738037109375, -1.230194091796875, -1.18658447265625, -1.142974853515625, -1.099365234375, -1.055755615234375, -1.01214599609375, -0.968536376953125, -0.9249267578125, -0.881317138671875, -0.83770751953125, -0.794097900390625, -0.75048828125, -0.706878662109375, -0.66326904296875, -0.619659423828125, -0.5760498046875, -0.532440185546875, -0.48883056640625, -0.445220947265625, -0.401611328125, -0.358001708984375, -0.31439208984375, -0.270782470703125, -0.2271728515625, -0.183563232421875, -0.13995361328125, -0.096343994140625, -0.052734375, -0.009124755859375, 0.03448486328125, 0.078094482421875, 0.1217041015625, 0.165313720703125, 0.20892333984375, 0.252532958984375, 0.296142578125, 0.339752197265625, 0.38336181640625, 0.426971435546875, 0.4705810546875, 0.514190673828125, 0.55780029296875, 0.601409912109375, 0.64501953125, 0.688629150390625, 0.73223876953125, 0.775848388671875, 0.8194580078125, 0.863067626953125, 0.90667724609375, 0.950286865234375, 0.993896484375, 1.037506103515625, 1.08111572265625, 1.124725341796875, 1.1683349609375, 1.211944580078125, 1.25555419921875, 1.299163818359375, 1.3427734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 4.0, 5.0, 11.0, 4.0, 8.0, 13.0, 15.0, 12.0, 15.0, 26.0, 20.0, 36.0, 34.0, 32.0, 57.0, 73.0, 69.0, 63.0, 61.0, 80.0, 51.0, 47.0, 34.0, 29.0, 23.0, 28.0, 19.0, 15.0, 16.0, 11.0, 17.0, 12.0, 9.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.234375, -2.167388916015625, -2.10040283203125, -2.033416748046875, -1.9664306640625, -1.899444580078125, -1.83245849609375, -1.765472412109375, -1.698486328125, -1.631500244140625, -1.56451416015625, -1.497528076171875, -1.4305419921875, -1.363555908203125, -1.29656982421875, -1.229583740234375, -1.16259765625, -1.095611572265625, -1.02862548828125, -0.961639404296875, -0.8946533203125, -0.827667236328125, -0.76068115234375, -0.693695068359375, -0.626708984375, -0.559722900390625, -0.49273681640625, -0.425750732421875, -0.3587646484375, -0.291778564453125, -0.22479248046875, -0.157806396484375, -0.0908203125, -0.023834228515625, 0.04315185546875, 0.110137939453125, 0.1771240234375, 0.244110107421875, 0.31109619140625, 0.378082275390625, 0.445068359375, 0.512054443359375, 0.57904052734375, 0.646026611328125, 0.7130126953125, 0.779998779296875, 0.84698486328125, 0.913970947265625, 0.98095703125, 1.047943115234375, 1.11492919921875, 1.181915283203125, 1.2489013671875, 1.315887451171875, 1.38287353515625, 1.449859619140625, 1.516845703125, 1.583831787109375, 1.65081787109375, 1.717803955078125, 1.7847900390625, 1.851776123046875, 1.91876220703125, 1.985748291015625, 2.052734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 8.0, 13.0, 10.0, 15.0, 26.0, 33.0, 56.0, 78.0, 100.0, 139.0, 220.0, 374.0, 620.0, 1172.0, 2460.0, 5404.0, 14153.0, 54450.0, 822610.0, 110797.0, 21626.0, 7471.0, 3145.0, 1527.0, 785.0, 397.0, 255.0, 193.0, 102.0, 97.0, 51.0, 40.0, 39.0, 21.0, 11.0, 9.0, 12.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2093505859375, -0.20229721069335938, -0.19524383544921875, -0.18819046020507812, -0.1811370849609375, -0.17408370971679688, -0.16703033447265625, -0.15997695922851562, -0.152923583984375, -0.14587020874023438, -0.13881683349609375, -0.13176345825195312, -0.1247100830078125, -0.11765670776367188, -0.11060333251953125, -0.10354995727539062, -0.09649658203125, -0.08944320678710938, -0.08238983154296875, -0.07533645629882812, -0.0682830810546875, -0.061229705810546875, -0.05417633056640625, -0.047122955322265625, -0.040069580078125, -0.033016204833984375, -0.02596282958984375, -0.018909454345703125, -0.0118560791015625, -0.004802703857421875, 0.00225067138671875, 0.009304046630859375, 0.016357421875, 0.023410797119140625, 0.03046417236328125, 0.037517547607421875, 0.0445709228515625, 0.051624298095703125, 0.05867767333984375, 0.06573104858398438, 0.072784423828125, 0.07983779907226562, 0.08689117431640625, 0.09394454956054688, 0.1009979248046875, 0.10805130004882812, 0.11510467529296875, 0.12215805053710938, 0.12921142578125, 0.13626480102539062, 0.14331817626953125, 0.15037155151367188, 0.1574249267578125, 0.16447830200195312, 0.17153167724609375, 0.17858505249023438, 0.185638427734375, 0.19269180297851562, 0.19974517822265625, 0.20679855346679688, 0.2138519287109375, 0.22090530395507812, 0.22795867919921875, 0.23501205444335938, 0.2420654296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 15.0, 15.0, 18.0, 34.0, 50.0, 72.0, 120.0, 177.0, 169.0, 103.0, 66.0, 37.0, 36.0, 21.0, 15.0, 17.0, 1.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014209747314453125, -0.0001383572816848755, -0.00013461709022521973, -0.00013087689876556396, -0.0001271367073059082, -0.00012339651584625244, -0.00011965632438659668, -0.00011591613292694092, -0.00011217594146728516, -0.0001084357500076294, -0.00010469555854797363, -0.00010095536708831787, -9.721517562866211e-05, -9.347498416900635e-05, -8.973479270935059e-05, -8.599460124969482e-05, -8.225440979003906e-05, -7.85142183303833e-05, -7.477402687072754e-05, -7.103383541107178e-05, -6.729364395141602e-05, -6.355345249176025e-05, -5.981326103210449e-05, -5.607306957244873e-05, -5.233287811279297e-05, -4.859268665313721e-05, -4.4852495193481445e-05, -4.1112303733825684e-05, -3.737211227416992e-05, -3.363192081451416e-05, -2.98917293548584e-05, -2.6151537895202637e-05, -2.2411346435546875e-05, -1.8671154975891113e-05, -1.4930963516235352e-05, -1.119077205657959e-05, -7.450580596923828e-06, -3.7103891372680664e-06, 2.9802322387695312e-08, 3.769993782043457e-06, 7.510185241699219e-06, 1.125037670135498e-05, 1.4990568161010742e-05, 1.8730759620666504e-05, 2.2470951080322266e-05, 2.6211142539978027e-05, 2.995133399963379e-05, 3.369152545928955e-05, 3.743171691894531e-05, 4.1171908378601074e-05, 4.4912099838256836e-05, 4.86522912979126e-05, 5.239248275756836e-05, 5.613267421722412e-05, 5.987286567687988e-05, 6.361305713653564e-05, 6.73532485961914e-05, 7.109344005584717e-05, 7.483363151550293e-05, 7.857382297515869e-05, 8.231401443481445e-05, 8.605420589447021e-05, 8.979439735412598e-05, 9.353458881378174e-05, 9.72747802734375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 9.0, 8.0, 22.0, 13.0, 31.0, 34.0, 49.0, 57.0, 113.0, 155.0, 282.0, 461.0, 811.0, 1513.0, 3013.0, 7089.0, 18020.0, 65514.0, 790187.0, 117694.0, 26035.0, 9318.0, 3865.0, 1882.0, 923.0, 529.0, 291.0, 206.0, 110.0, 89.0, 59.0, 50.0, 22.0, 23.0, 18.0, 11.0, 11.0, 9.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143310546875, -0.137725830078125, -0.13214111328125, -0.126556396484375, -0.1209716796875, -0.115386962890625, -0.10980224609375, -0.104217529296875, -0.0986328125, -0.093048095703125, -0.08746337890625, -0.081878662109375, -0.0762939453125, -0.070709228515625, -0.06512451171875, -0.059539794921875, -0.053955078125, -0.048370361328125, -0.04278564453125, -0.037200927734375, -0.0316162109375, -0.026031494140625, -0.02044677734375, -0.014862060546875, -0.00927734375, -0.003692626953125, 0.00189208984375, 0.007476806640625, 0.0130615234375, 0.018646240234375, 0.02423095703125, 0.029815673828125, 0.035400390625, 0.040985107421875, 0.04656982421875, 0.052154541015625, 0.0577392578125, 0.063323974609375, 0.06890869140625, 0.074493408203125, 0.080078125, 0.085662841796875, 0.09124755859375, 0.096832275390625, 0.1024169921875, 0.108001708984375, 0.11358642578125, 0.119171142578125, 0.124755859375, 0.130340576171875, 0.13592529296875, 0.141510009765625, 0.1470947265625, 0.152679443359375, 0.15826416015625, 0.163848876953125, 0.16943359375, 0.175018310546875, 0.18060302734375, 0.186187744140625, 0.1917724609375, 0.197357177734375, 0.20294189453125, 0.208526611328125, 0.214111328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 1.0, 5.0, 6.0, 8.0, 5.0, 12.0, 12.0, 16.0, 14.0, 25.0, 29.0, 31.0, 56.0, 52.0, 68.0, 81.0, 83.0, 94.0, 66.0, 70.0, 49.0, 42.0, 25.0, 25.0, 15.0, 19.0, 10.0, 11.0, 9.0, 10.0, 6.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.16805267333984375, -0.1621551513671875, -0.15625762939453125, -0.150360107421875, -0.14446258544921875, -0.1385650634765625, -0.13266754150390625, -0.12677001953125, -0.12087249755859375, -0.1149749755859375, -0.10907745361328125, -0.103179931640625, -0.09728240966796875, -0.0913848876953125, -0.08548736572265625, -0.07958984375, -0.07369232177734375, -0.0677947998046875, -0.06189727783203125, -0.055999755859375, -0.05010223388671875, -0.0442047119140625, -0.03830718994140625, -0.03240966796875, -0.02651214599609375, -0.0206146240234375, -0.01471710205078125, -0.008819580078125, -0.00292205810546875, 0.0029754638671875, 0.00887298583984375, 0.0147705078125, 0.02066802978515625, 0.0265655517578125, 0.03246307373046875, 0.038360595703125, 0.04425811767578125, 0.0501556396484375, 0.05605316162109375, 0.06195068359375, 0.06784820556640625, 0.0737457275390625, 0.07964324951171875, 0.085540771484375, 0.09143829345703125, 0.0973358154296875, 0.10323333740234375, 0.109130859375, 0.11502838134765625, 0.1209259033203125, 0.12682342529296875, 0.132720947265625, 0.13861846923828125, 0.1445159912109375, 0.15041351318359375, 0.15631103515625, 0.16220855712890625, 0.1681060791015625, 0.17400360107421875, 0.179901123046875, 0.18579864501953125, 0.1916961669921875, 0.19759368896484375, 0.2034912109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 31.0, 91.0, 596.0, 165.0, 68.0, 28.0, 14.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.053009033203125, -16.416913986206055, -15.780818939208984, -15.14472484588623, -14.50862979888916, -13.87253475189209, -13.236440658569336, -12.600345611572266, -11.964250564575195, -11.328155517578125, -10.692060470581055, -10.0559663772583, -9.41987133026123, -8.78377628326416, -8.147682189941406, -7.511587142944336, -6.875492095947266, -6.239397048950195, -5.603302478790283, -4.967207908630371, -4.331112861633301, -3.6950180530548096, -3.0589232444763184, -2.4228286743164062, -1.786733627319336, -1.1506388187408447, -0.5145440101623535, 0.1215507984161377, 0.7576456069946289, 1.3937404155731201, 2.0298352241516113, 2.6659297943115234, 3.3020267486572266, 3.9381215572357178, 4.574216365814209, 5.210310935974121, 5.846405982971191, 6.482501029968262, 7.118595600128174, 7.754690170288086, 8.390785217285156, 9.026880264282227, 9.662975311279297, 10.29906940460205, 10.935164451599121, 11.571259498596191, 12.207353591918945, 12.843448638916016, 13.479543685913086, 14.115638732910156, 14.751733779907227, 15.38782787322998, 16.023921966552734, 16.660017013549805, 17.296112060546875, 17.932207107543945, 18.568302154541016, 19.204397201538086, 19.840492248535156, 20.476587295532227, 21.112682342529297, 21.748775482177734, 22.384870529174805, 23.020965576171875, 23.657060623168945]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 5.0, 8.0, 12.0, 12.0, 22.0, 22.0, 29.0, 28.0, 22.0, 36.0, 52.0, 332.0, 169.0, 47.0, 35.0, 25.0, 34.0, 27.0, 23.0, 16.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.9119291305542, -13.601431846618652, -13.290933609008789, -12.980436325073242, -12.669939041137695, -12.359440803527832, -12.048943519592285, -11.738445281982422, -11.427947998046875, -11.117450714111328, -10.806952476501465, -10.496455192565918, -10.185956954956055, -9.875459671020508, -9.564962387084961, -9.254465103149414, -8.94396686553955, -8.633469581604004, -8.32297134399414, -8.012474060058594, -7.701976299285889, -7.391478538513184, -7.080981254577637, -6.770483493804932, -6.459985733032227, -6.1494879722595215, -5.838990211486816, -5.5284929275512695, -5.2179951667785645, -4.907497406005859, -4.5970001220703125, -4.286502361297607, -3.9760050773620605, -3.6655073165893555, -3.3550097942352295, -3.0445122718811035, -2.7340145111083984, -2.4235167503356934, -2.1130192279815674, -1.8025217056274414, -1.4920239448547363, -1.1815263032913208, -0.8710286617279053, -0.5605310201644897, -0.2500333786010742, 0.06046426296234131, 0.37096190452575684, 0.6814594268798828, 0.9919571876525879, 1.3024548292160034, 1.612952470779419, 1.9234501123428345, 2.23394775390625, 2.544445514678955, 2.854943037033081, 3.165440559387207, 3.475938320159912, 3.786436080932617, 4.096933364868164, 4.407431125640869, 4.717928886413574, 5.028426647186279, 5.338924407958984, 5.649421691894531, 5.959919452667236]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 15.0, 14.0, 13.0, 15.0, 22.0, 29.0, 25.0, 33.0, 58.0, 97.0, 250.0, 97.0, 35.0, 34.0, 30.0, 28.0, 42.0, 23.0, 29.0, 14.0, 11.0, 14.0, 8.0, 11.0, 3.0, 7.0, 2.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.775390625, -0.7552032470703125, -0.735015869140625, -0.7148284912109375, -0.69464111328125, -0.6744537353515625, -0.654266357421875, -0.6340789794921875, -0.6138916015625, -0.5937042236328125, -0.573516845703125, -0.5533294677734375, -0.53314208984375, -0.5129547119140625, -0.492767333984375, -0.4725799560546875, -0.452392578125, -0.4322052001953125, -0.412017822265625, -0.3918304443359375, -0.37164306640625, -0.3514556884765625, -0.331268310546875, -0.3110809326171875, -0.2908935546875, -0.2707061767578125, -0.250518798828125, -0.2303314208984375, -0.21014404296875, -0.1899566650390625, -0.169769287109375, -0.1495819091796875, -0.12939453125, -0.1092071533203125, -0.089019775390625, -0.0688323974609375, -0.04864501953125, -0.0284576416015625, -0.008270263671875, 0.0119171142578125, 0.0321044921875, 0.0522918701171875, 0.072479248046875, 0.0926666259765625, 0.11285400390625, 0.1330413818359375, 0.153228759765625, 0.1734161376953125, 0.193603515625, 0.2137908935546875, 0.233978271484375, 0.2541656494140625, 0.27435302734375, 0.2945404052734375, 0.314727783203125, 0.3349151611328125, 0.3551025390625, 0.3752899169921875, 0.395477294921875, 0.4156646728515625, 0.43585205078125, 0.4560394287109375, 0.476226806640625, 0.4964141845703125, 0.5166015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 7.0, 10.0, 20.0, 13.0, 30.0, 51.0, 104.0, 381.0, 2260.0, 6394659.0, 1988038.0, 2294.0, 403.0, 133.0, 57.0, 29.0, 19.0, 9.0, 5.0, 28.0, 8.0, 6.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0], "bins": [-9.970314025878906, -9.62648868560791, -9.282662391662598, -8.938837051391602, -8.595011711120605, -8.25118637084961, -7.907360076904297, -7.563534736633301, -7.2197089195251465, -6.875883102416992, -6.532057762145996, -6.188231945037842, -5.8444061279296875, -5.500580787658691, -5.156754970550537, -4.812929153442383, -4.469103813171387, -4.125277996063232, -3.7814526557922363, -3.437626838684082, -3.093801259994507, -2.7499756813049316, -2.4061498641967773, -2.062324285507202, -1.718498706817627, -1.3746731281280518, -1.030847430229187, -0.6870217323303223, -0.34319615364074707, 0.000629425048828125, 0.3444552421569824, 0.6882808208465576, 1.0321054458618164, 1.3759310245513916, 1.7197567224502563, 2.063582420349121, 2.4074079990386963, 2.7512335777282715, 3.095059394836426, 3.438884973526001, 3.782710552215576, 4.1265363693237305, 4.470361709594727, 4.814187526702881, 5.158013343811035, 5.501838684082031, 5.8456645011901855, 6.18949031829834, 6.533315658569336, 6.87714147567749, 7.220966815948486, 7.564792633056641, 7.908617973327637, 8.252443313598633, 8.596269607543945, 8.940094947814941, 9.283920288085938, 9.627745628356934, 9.971571922302246, 10.315397262573242, 10.659222602844238, 11.003047943115234, 11.346874237060547, 11.690699577331543, 12.034525871276855]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 6.0, 5.0, 5.0, 4.0, 3.0, 7.0, 3.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8434865474700928, -2.7135863304138184, -2.583686113357544, -2.4537858963012695, -2.323885917663574, -2.1939857006073, -2.0640854835510254, -1.934185266494751, -1.8042851686477661, -1.6743849515914917, -1.5444848537445068, -1.4145846366882324, -1.284684419631958, -1.1547843217849731, -1.0248841047286987, -0.8949839472770691, -0.7650837898254395, -0.6351836323738098, -0.5052834749221802, -0.37538325786590576, -0.24548310041427612, -0.11558294296264648, 0.01431727409362793, 0.14421743154525757, 0.2741175889968872, 0.40401774644851685, 0.5339179039001465, 0.6638181209564209, 0.7937182784080505, 0.9236184358596802, 1.0535186529159546, 1.1834187507629395, 1.3133187294006348, 1.4432189464569092, 1.573119044303894, 1.7030192613601685, 1.8329193592071533, 1.9628195762634277, 2.092719793319702, 2.2226200103759766, 2.352519989013672, 2.4824202060699463, 2.6123204231262207, 2.742220401763916, 2.8721206188201904, 3.002020835876465, 3.1319210529327393, 3.2618212699890137, 3.391721487045288, 3.5216217041015625, 3.651521921157837, 3.7814221382141113, 3.9113221168518066, 4.04122257232666, 4.1711225509643555, 4.301022529602051, 4.430922985076904, 4.5608229637146, 4.690723419189453, 4.820623397827148, 4.950523853302002, 5.080423831939697, 5.210324287414551, 5.340224266052246, 5.470124244689941]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 5.0, 10.0, 10.0, 14.0, 9.0, 28.0, 41.0, 57.0, 67.0, 104.0, 172.0, 247.0, 422.0, 734.0, 1808.0, 5126.0, 16891.0, 66264.0, 224620.0, 153936.0, 38396.0, 9894.0, 3007.0, 1083.0, 499.0, 269.0, 172.0, 97.0, 75.0, 67.0, 44.0, 28.0, 19.0, 11.0, 7.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.86328125, -6.69091796875, -6.5185546875, -6.34619140625, -6.173828125, -6.00146484375, -5.8291015625, -5.65673828125, -5.484375, -5.31201171875, -5.1396484375, -4.96728515625, -4.794921875, -4.62255859375, -4.4501953125, -4.27783203125, -4.10546875, -3.93310546875, -3.7607421875, -3.58837890625, -3.416015625, -3.24365234375, -3.0712890625, -2.89892578125, -2.7265625, -2.55419921875, -2.3818359375, -2.20947265625, -2.037109375, -1.86474609375, -1.6923828125, -1.52001953125, -1.34765625, -1.17529296875, -1.0029296875, -0.83056640625, -0.658203125, -0.48583984375, -0.3134765625, -0.14111328125, 0.03125, 0.20361328125, 0.3759765625, 0.54833984375, 0.720703125, 0.89306640625, 1.0654296875, 1.23779296875, 1.41015625, 1.58251953125, 1.7548828125, 1.92724609375, 2.099609375, 2.27197265625, 2.4443359375, 2.61669921875, 2.7890625, 2.96142578125, 3.1337890625, 3.30615234375, 3.478515625, 3.65087890625, 3.8232421875, 3.99560546875, 4.16796875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 4.0, 11.0, 10.0, 13.0, 26.0, 40.0, 39.0, 42.0, 55.0, 91.0, 109.0, 92.0, 94.0, 90.0, 65.0, 55.0, 51.0, 30.0, 23.0, 22.0, 8.0, 2.0, 6.0, 1.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.1706466674804688, -1.1381683349609375, -1.1056900024414062, -1.073211669921875, -1.0407333374023438, -1.0082550048828125, -0.9757766723632812, -0.94329833984375, -0.9108200073242188, -0.8783416748046875, -0.8458633422851562, -0.813385009765625, -0.7809066772460938, -0.7484283447265625, -0.7159500122070312, -0.6834716796875, -0.6509933471679688, -0.6185150146484375, -0.5860366821289062, -0.553558349609375, -0.5210800170898438, -0.4886016845703125, -0.45612335205078125, -0.42364501953125, -0.39116668701171875, -0.3586883544921875, -0.32621002197265625, -0.293731689453125, -0.26125335693359375, -0.2287750244140625, -0.19629669189453125, -0.163818359375, -0.13134002685546875, -0.0988616943359375, -0.06638336181640625, -0.033905029296875, -0.00142669677734375, 0.0310516357421875, 0.06352996826171875, 0.09600830078125, 0.12848663330078125, 0.1609649658203125, 0.19344329833984375, 0.225921630859375, 0.25839996337890625, 0.2908782958984375, 0.32335662841796875, 0.3558349609375, 0.38831329345703125, 0.4207916259765625, 0.45326995849609375, 0.485748291015625, 0.5182266235351562, 0.5507049560546875, 0.5831832885742188, 0.61566162109375, 0.6481399536132812, 0.6806182861328125, 0.7130966186523438, 0.745574951171875, 0.7780532836914062, 0.8105316162109375, 0.8430099487304688, 0.87548828125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 9.0, 16.0, 28.0, 57.0, 128.0, 103.0, 75.0, 20.0, 16.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.168756484985352, -6.935171127319336, -6.70158576965332, -6.468000888824463, -6.234415531158447, -6.000830173492432, -5.767245292663574, -5.533659934997559, -5.300074577331543, -5.066489219665527, -4.832903861999512, -4.599318981170654, -4.365733623504639, -4.132148265838623, -3.8985631465911865, -3.66497802734375, -3.4313926696777344, -3.1978073120117188, -2.9642221927642822, -2.7306370735168457, -2.49705171585083, -2.2634663581848145, -2.029881238937378, -1.7962960004806519, -1.5627107620239258, -1.3291255235671997, -1.0955402851104736, -0.8619550466537476, -0.6283698081970215, -0.3947845697402954, -0.16119933128356934, 0.07238590717315674, 0.3059711456298828, 0.5395563840866089, 0.773141622543335, 1.006726861000061, 1.240312099456787, 1.4738973379135132, 1.7074825763702393, 1.9410678148269653, 2.1746530532836914, 2.408238410949707, 2.6418235301971436, 2.87540864944458, 3.1089940071105957, 3.3425793647766113, 3.576164484024048, 3.8097496032714844, 4.0433349609375, 4.276920318603516, 4.510505676269531, 4.744090557098389, 4.977675914764404, 5.21126127243042, 5.444846153259277, 5.678431510925293, 5.912016868591309, 6.145602226257324, 6.37918758392334, 6.612772464752197, 6.846357822418213, 7.0799431800842285, 7.313528060913086, 7.547113418579102, 7.780698776245117]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 16.0, 45.0, 65.0, 93.0, 84.0, 50.0, 26.0, 11.0, 7.0, 8.0, 6.0, 3.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.533191204071045, -3.4177706241607666, -3.3023500442504883, -3.186929225921631, -3.0715086460113525, -2.956088066101074, -2.840667247772217, -2.7252466678619385, -2.60982608795166, -2.494405508041382, -2.3789849281311035, -2.263564109802246, -2.1481435298919678, -2.0327229499816895, -1.9173022508621216, -1.8018815517425537, -1.6864609718322754, -1.571040391921997, -1.4556196928024292, -1.3401989936828613, -1.224778413772583, -1.1093578338623047, -0.9939371347427368, -0.8785164952278137, -0.7630958557128906, -0.6476752161979675, -0.5322545766830444, -0.41683393716812134, -0.30141329765319824, -0.18599265813827515, -0.07057201862335205, 0.044848620891571045, 0.16026926040649414, 0.27568989992141724, 0.39111053943634033, 0.5065311789512634, 0.6219518184661865, 0.7373724579811096, 0.8527930974960327, 0.9682137370109558, 1.083634376525879, 1.1990549564361572, 1.314475655555725, 1.429896354675293, 1.5453169345855713, 1.6607375144958496, 1.7761582136154175, 1.8915789127349854, 2.0069994926452637, 2.122420072555542, 2.2378406524658203, 2.3532614707946777, 2.468682050704956, 2.5841026306152344, 2.699523448944092, 2.81494402885437, 2.9303646087646484, 3.0457851886749268, 3.161205768585205, 3.2766265869140625, 3.392047166824341, 3.507467746734619, 3.6228885650634766, 3.738309144973755, 3.853729724884033]}, "eval/loss": 4.2075958251953125, "eval/wer": 1.9032526775089251, "eval/runtime": 947.3446, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349} \ No newline at end of file +{"train/loss": 3.5579, "train/learning_rate": 9.345794392523364e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 8515, "_timestamp": 1646106787, "_step": 1787, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 20.0, 421.0, 554.0, 21.0, 0.0, 0.0, 2.0, 1.0], "bins": [-573.1256713867188, -563.2627563476562, -553.3998413085938, -543.5369873046875, -533.674072265625, -523.8111572265625, -513.9482421875, -504.0853271484375, -494.2224426269531, -484.3595275878906, -474.49664306640625, -464.63372802734375, -454.77081298828125, -444.9079284667969, -435.0450134277344, -425.18212890625, -415.3192138671875, -405.456298828125, -395.5934143066406, -385.7304992675781, -375.8675842285156, -366.00469970703125, -356.14178466796875, -346.27886962890625, -336.41595458984375, -326.55303955078125, -316.6901550292969, -306.8272399902344, -296.9643249511719, -287.1014404296875, -277.238525390625, -267.3756103515625, -257.5126953125, -247.64979553222656, -237.78688049316406, -227.92398071289062, -218.0610809326172, -208.19818115234375, -198.33526611328125, -188.4723663330078, -178.60946655273438, -168.74656677246094, -158.88365173339844, -149.020751953125, -139.15785217285156, -129.29495239257812, -119.43203735351562, -109.56913757324219, -99.70622253417969, -89.84331512451172, -79.98041534423828, -70.11750793457031, -60.25460433959961, -50.391700744628906, -40.52879333496094, -30.6658935546875, -20.802989959716797, -10.940085411071777, -1.0771808624267578, 8.785724639892578, 18.64862823486328, 28.511531829833984, 38.37443923950195, 48.23733901977539, 58.10024642944336]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 14.0, 11.0, 17.0, 21.0, 24.0, 25.0, 30.0, 26.0, 39.0, 40.0, 38.0, 43.0, 54.0, 42.0, 45.0, 42.0, 57.0, 37.0, 38.0, 45.0, 41.0, 37.0, 26.0, 28.0, 32.0, 21.0, 10.0, 17.0, 23.0, 9.0, 12.0, 10.0, 4.0, 11.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.35408020019531, -78.11407470703125, -75.87406921386719, -73.63406372070312, -71.39405822753906, -69.154052734375, -66.91404724121094, -64.67404174804688, -62.43403625488281, -60.19403076171875, -57.95402526855469, -55.714019775390625, -53.47401428222656, -51.2340087890625, -48.99400329589844, -46.753997802734375, -44.51398849487305, -42.273983001708984, -40.03397750854492, -37.79397201538086, -35.5539665222168, -33.313961029052734, -31.07395362854004, -28.833948135375977, -26.593942642211914, -24.35393714904785, -22.11393165588379, -19.873924255371094, -17.63391876220703, -15.393914222717285, -13.153907775878906, -10.913902282714844, -8.673896789550781, -6.433891296386719, -4.193885326385498, -1.9538793563842773, 0.28612613677978516, 2.5261316299438477, 4.766138076782227, 7.006143569946289, 9.246149063110352, 11.486154556274414, 13.726160049438477, 15.966166496276855, 18.206172943115234, 20.446178436279297, 22.68618392944336, 24.926189422607422, 27.166194915771484, 29.406200408935547, 31.64620590209961, 33.88621139526367, 36.126216888427734, 38.3662223815918, 40.606231689453125, 42.84623718261719, 45.08624267578125, 47.32624816894531, 49.566253662109375, 51.80625915527344, 54.0462646484375, 56.28627014160156, 58.526275634765625, 60.76628112792969, 63.00628662109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 20.0, 22.0, 27.0, 30.0, 48.0, 41.0, 58.0, 54.0, 51.0, 62.0, 54.0, 71.0, 57.0, 61.0, 53.0, 49.0, 38.0, 36.0, 40.0, 24.0, 21.0, 15.0, 14.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.7642822265625, -6.602783203125, -6.4412841796875, -6.27978515625, -6.1182861328125, -5.956787109375, -5.7952880859375, -5.6337890625, -5.4722900390625, -5.310791015625, -5.1492919921875, -4.98779296875, -4.8262939453125, -4.664794921875, -4.5032958984375, -4.341796875, -4.1802978515625, -4.018798828125, -3.8572998046875, -3.69580078125, -3.5343017578125, -3.372802734375, -3.2113037109375, -3.0498046875, -2.8883056640625, -2.726806640625, -2.5653076171875, -2.40380859375, -2.2423095703125, -2.080810546875, -1.9193115234375, -1.7578125, -1.5963134765625, -1.434814453125, -1.2733154296875, -1.11181640625, -0.9503173828125, -0.788818359375, -0.6273193359375, -0.4658203125, -0.3043212890625, -0.142822265625, 0.0186767578125, 0.18017578125, 0.3416748046875, 0.503173828125, 0.6646728515625, 0.826171875, 0.9876708984375, 1.149169921875, 1.3106689453125, 1.47216796875, 1.6336669921875, 1.795166015625, 1.9566650390625, 2.1181640625, 2.2796630859375, 2.441162109375, 2.6026611328125, 2.76416015625, 2.9256591796875, 3.087158203125, 3.2486572265625, 3.41015625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 9.0, 11.0, 17.0, 30.0, 62.0, 86.0, 116.0, 172.0, 373.0, 714.0, 1670.0, 5326.0, 26656.0, 482826.0, 3521891.0, 133920.0, 14339.0, 3441.0, 1325.0, 585.0, 289.0, 163.0, 85.0, 52.0, 40.0, 23.0, 17.0, 9.0, 12.0, 8.0, 1.0, 1.0], "bins": [-33.09375, -32.37939453125, -31.6650390625, -30.95068359375, -30.236328125, -29.52197265625, -28.8076171875, -28.09326171875, -27.37890625, -26.66455078125, -25.9501953125, -25.23583984375, -24.521484375, -23.80712890625, -23.0927734375, -22.37841796875, -21.6640625, -20.94970703125, -20.2353515625, -19.52099609375, -18.806640625, -18.09228515625, -17.3779296875, -16.66357421875, -15.94921875, -15.23486328125, -14.5205078125, -13.80615234375, -13.091796875, -12.37744140625, -11.6630859375, -10.94873046875, -10.234375, -9.52001953125, -8.8056640625, -8.09130859375, -7.376953125, -6.66259765625, -5.9482421875, -5.23388671875, -4.51953125, -3.80517578125, -3.0908203125, -2.37646484375, -1.662109375, -0.94775390625, -0.2333984375, 0.48095703125, 1.1953125, 1.90966796875, 2.6240234375, 3.33837890625, 4.052734375, 4.76708984375, 5.4814453125, 6.19580078125, 6.91015625, 7.62451171875, 8.3388671875, 9.05322265625, 9.767578125, 10.48193359375, 11.1962890625, 11.91064453125, 12.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 34.0, 44.0, 74.0, 135.0, 237.0, 330.0, 585.0, 820.0, 699.0, 430.0, 254.0, 149.0, 100.0, 56.0, 34.0, 28.0, 16.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.219482421875, -14.54833984375, -13.877197265625, -13.2060546875, -12.534912109375, -11.86376953125, -11.192626953125, -10.521484375, -9.850341796875, -9.17919921875, -8.508056640625, -7.8369140625, -7.165771484375, -6.49462890625, -5.823486328125, -5.15234375, -4.481201171875, -3.81005859375, -3.138916015625, -2.4677734375, -1.796630859375, -1.12548828125, -0.454345703125, 0.216796875, 0.887939453125, 1.55908203125, 2.230224609375, 2.9013671875, 3.572509765625, 4.24365234375, 4.914794921875, 5.5859375, 6.257080078125, 6.92822265625, 7.599365234375, 8.2705078125, 8.941650390625, 9.61279296875, 10.283935546875, 10.955078125, 11.626220703125, 12.29736328125, 12.968505859375, 13.6396484375, 14.310791015625, 14.98193359375, 15.653076171875, 16.32421875, 16.995361328125, 17.66650390625, 18.337646484375, 19.0087890625, 19.679931640625, 20.35107421875, 21.022216796875, 21.693359375, 22.364501953125, 23.03564453125, 23.706787109375, 24.3779296875, 25.049072265625, 25.72021484375, 26.391357421875, 27.0625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 18.0, 26.0, 29.0, 66.0, 112.0, 262.0, 565.0, 1339.0, 4538.0, 526046.0, 3648990.0, 9143.0, 1741.0, 686.0, 325.0, 153.0, 91.0, 62.0, 29.0, 12.0, 8.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.5625, -70.1552734375, -67.748046875, -65.3408203125, -62.93359375, -60.5263671875, -58.119140625, -55.7119140625, -53.3046875, -50.8974609375, -48.490234375, -46.0830078125, -43.67578125, -41.2685546875, -38.861328125, -36.4541015625, -34.046875, -31.6396484375, -29.232421875, -26.8251953125, -24.41796875, -22.0107421875, -19.603515625, -17.1962890625, -14.7890625, -12.3818359375, -9.974609375, -7.5673828125, -5.16015625, -2.7529296875, -0.345703125, 2.0615234375, 4.46875, 6.8759765625, 9.283203125, 11.6904296875, 14.09765625, 16.5048828125, 18.912109375, 21.3193359375, 23.7265625, 26.1337890625, 28.541015625, 30.9482421875, 33.35546875, 35.7626953125, 38.169921875, 40.5771484375, 42.984375, 45.3916015625, 47.798828125, 50.2060546875, 52.61328125, 55.0205078125, 57.427734375, 59.8349609375, 62.2421875, 64.6494140625, 67.056640625, 69.4638671875, 71.87109375, 74.2783203125, 76.685546875, 79.0927734375, 81.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 16.0, 44.0, 193.0, 425.0, 243.0, 73.0, 14.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.2716064453125, -208.23072814941406, -204.18984985351562, -200.1489715576172, -196.10809326171875, -192.0672149658203, -188.02633666992188, -183.9854736328125, -179.944580078125, -175.90370178222656, -171.86282348632812, -167.8219451904297, -163.78106689453125, -159.7401885986328, -155.69931030273438, -151.658447265625, -147.61756896972656, -143.57669067382812, -139.5358123779297, -135.49493408203125, -131.4540557861328, -127.41317749023438, -123.37230682373047, -119.33142852783203, -115.2905502319336, -111.24967193603516, -107.20879364013672, -103.16791534423828, -99.12704467773438, -95.08616638183594, -91.0452880859375, -87.00440979003906, -82.96353149414062, -78.92265319824219, -74.88177490234375, -70.84089660644531, -66.80001831054688, -62.7591438293457, -58.71826934814453, -54.677391052246094, -50.63651657104492, -46.595638275146484, -42.55476379394531, -38.513885498046875, -34.47300720214844, -30.43212890625, -26.391252517700195, -22.35037612915039, -18.309497833251953, -14.268620491027832, -10.227743148803711, -6.18686580657959, -2.1459884643554688, 1.8948898315429688, 5.935766220092773, 9.976642608642578, 14.017520904541016, 18.058399200439453, 22.099275588989258, 26.140151977539062, 30.1810302734375, 34.22190856933594, 38.262786865234375, 42.30366134643555, 46.344539642333984]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 5.0, 9.0, 5.0, 12.0, 5.0, 20.0, 14.0, 16.0, 19.0, 22.0, 21.0, 16.0, 37.0, 31.0, 42.0, 26.0, 30.0, 44.0, 38.0, 37.0, 30.0, 30.0, 37.0, 39.0, 41.0, 33.0, 51.0, 31.0, 34.0, 28.0, 28.0, 21.0, 19.0, 14.0, 27.0, 12.0, 11.0, 7.0, 13.0, 6.0, 7.0, 6.0, 10.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0], "bins": [-44.282958984375, -43.00820541381836, -41.73345184326172, -40.45869827270508, -39.18394470214844, -37.9091911315918, -36.634437561035156, -35.35968780517578, -34.084930419921875, -32.810176849365234, -31.535423278808594, -30.260669708251953, -28.985916137695312, -27.711162567138672, -26.436410903930664, -25.161657333374023, -23.886905670166016, -22.612152099609375, -21.337398529052734, -20.062644958496094, -18.787891387939453, -17.513137817382812, -16.238386154174805, -14.963632583618164, -13.688879013061523, -12.414125442504883, -11.139371871948242, -9.864619255065918, -8.589865684509277, -7.315112113952637, -6.040359020233154, -4.765605926513672, -3.4908523559570312, -2.2160990238189697, -0.9413456916809082, 0.3334076404571533, 1.6081609725952148, 2.8829145431518555, 4.157667636871338, 5.43242073059082, 6.707174301147461, 7.981927871704102, 9.256681442260742, 10.531434059143066, 11.806187629699707, 13.080941200256348, 14.355693817138672, 15.630447387695312, 16.905200958251953, 18.179954528808594, 19.454708099365234, 20.729461669921875, 22.004215240478516, 23.278968811035156, 24.553720474243164, 25.828474044799805, 27.103227615356445, 28.377981185913086, 29.652734756469727, 30.927488327026367, 32.202239990234375, 33.476993560791016, 34.751747131347656, 36.0265007019043, 37.30125427246094]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 29.0, 46.0, 60.0, 85.0, 110.0, 191.0, 242.0, 364.0, 519.0, 720.0, 1137.0, 1540.0, 2265.0, 3384.0, 4838.0, 7391.0, 10979.0, 16461.0, 24432.0, 37086.0, 56146.0, 87430.0, 130522.0, 171932.0, 158227.0, 113185.0, 74671.0, 48235.0, 31832.0, 21042.0, 14026.0, 9492.0, 6240.0, 4304.0, 2913.0, 1946.0, 1404.0, 934.0, 659.0, 475.0, 321.0, 234.0, 148.0, 101.0, 84.0, 58.0, 31.0, 25.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.3349571228027344, -0.32372283935546875, -0.3124885559082031, -0.3012542724609375, -0.2900199890136719, -0.27878570556640625, -0.2675514221191406, -0.256317138671875, -0.24508285522460938, -0.23384857177734375, -0.22261428833007812, -0.2113800048828125, -0.20014572143554688, -0.18891143798828125, -0.17767715454101562, -0.16644287109375, -0.15520858764648438, -0.14397430419921875, -0.13274002075195312, -0.1215057373046875, -0.11027145385742188, -0.09903717041015625, -0.08780288696289062, -0.076568603515625, -0.06533432006835938, -0.05410003662109375, -0.042865753173828125, -0.0316314697265625, -0.020397186279296875, -0.00916290283203125, 0.002071380615234375, 0.0133056640625, 0.024539947509765625, 0.03577423095703125, 0.047008514404296875, 0.0582427978515625, 0.06947708129882812, 0.08071136474609375, 0.09194564819335938, 0.103179931640625, 0.11441421508789062, 0.12564849853515625, 0.13688278198242188, 0.1481170654296875, 0.15935134887695312, 0.17058563232421875, 0.18181991577148438, 0.19305419921875, 0.20428848266601562, 0.21552276611328125, 0.22675704956054688, 0.2379913330078125, 0.24922561645507812, 0.26045989990234375, 0.2716941833496094, 0.282928466796875, 0.2941627502441406, 0.30539703369140625, 0.3166313171386719, 0.3278656005859375, 0.3390998840332031, 0.35033416748046875, 0.3615684509277344, 0.372802734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 8.0, 14.0, 18.0, 16.0, 14.0, 19.0, 30.0, 31.0, 27.0, 32.0, 29.0, 46.0, 42.0, 40.0, 38.0, 47.0, 1066.0, 33.0, 33.0, 48.0, 41.0, 35.0, 32.0, 21.0, 34.0, 32.0, 25.0, 14.0, 29.0, 18.0, 14.0, 10.0, 16.0, 8.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.214141845703125, -2.14117431640625, -2.068206787109375, -1.9952392578125, -1.922271728515625, -1.84930419921875, -1.776336669921875, -1.703369140625, -1.630401611328125, -1.55743408203125, -1.484466552734375, -1.4114990234375, -1.338531494140625, -1.26556396484375, -1.192596435546875, -1.11962890625, -1.046661376953125, -0.97369384765625, -0.900726318359375, -0.8277587890625, -0.754791259765625, -0.68182373046875, -0.608856201171875, -0.535888671875, -0.462921142578125, -0.38995361328125, -0.316986083984375, -0.2440185546875, -0.171051025390625, -0.09808349609375, -0.025115966796875, 0.0478515625, 0.120819091796875, 0.19378662109375, 0.266754150390625, 0.3397216796875, 0.412689208984375, 0.48565673828125, 0.558624267578125, 0.631591796875, 0.704559326171875, 0.77752685546875, 0.850494384765625, 0.9234619140625, 0.996429443359375, 1.06939697265625, 1.142364501953125, 1.21533203125, 1.288299560546875, 1.36126708984375, 1.434234619140625, 1.5072021484375, 1.580169677734375, 1.65313720703125, 1.726104736328125, 1.799072265625, 1.872039794921875, 1.94500732421875, 2.017974853515625, 2.0909423828125, 2.163909912109375, 2.23687744140625, 2.309844970703125, 2.3828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 4.0, 11.0, 14.0, 23.0, 36.0, 58.0, 92.0, 102.0, 189.0, 303.0, 514.0, 755.0, 1359.0, 2123.0, 3583.0, 5903.0, 9968.0, 16434.0, 26980.0, 44670.0, 72015.0, 111197.0, 154575.0, 1220992.0, 148644.0, 103884.0, 67155.0, 41641.0, 25327.0, 15238.0, 9227.0, 5613.0, 3340.0, 2023.0, 1206.0, 734.0, 445.0, 258.0, 176.0, 96.0, 74.0, 52.0, 28.0, 20.0, 15.0, 14.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2753715515136719, -0.26631927490234375, -0.2572669982910156, -0.2482147216796875, -0.23916244506835938, -0.23011016845703125, -0.22105789184570312, -0.212005615234375, -0.20295333862304688, -0.19390106201171875, -0.18484878540039062, -0.1757965087890625, -0.16674423217773438, -0.15769195556640625, -0.14863967895507812, -0.13958740234375, -0.13053512573242188, -0.12148284912109375, -0.11243057250976562, -0.1033782958984375, -0.09432601928710938, -0.08527374267578125, -0.07622146606445312, -0.067169189453125, -0.058116912841796875, -0.04906463623046875, -0.040012359619140625, -0.0309600830078125, -0.021907806396484375, -0.01285552978515625, -0.003803253173828125, 0.0052490234375, 0.014301300048828125, 0.02335357666015625, 0.032405853271484375, 0.0414581298828125, 0.050510406494140625, 0.05956268310546875, 0.06861495971679688, 0.077667236328125, 0.08671951293945312, 0.09577178955078125, 0.10482406616210938, 0.1138763427734375, 0.12292861938476562, 0.13198089599609375, 0.14103317260742188, 0.15008544921875, 0.15913772583007812, 0.16819000244140625, 0.17724227905273438, 0.1862945556640625, 0.19534683227539062, 0.20439910888671875, 0.21345138549804688, 0.222503662109375, 0.23155593872070312, 0.24060821533203125, 0.24966049194335938, 0.2587127685546875, 0.2677650451660156, 0.27681732177734375, 0.2858695983886719, 0.294921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 11.0, 4.0, 20.0, 16.0, 12.0, 30.0, 38.0, 44.0, 42.0, 59.0, 65.0, 57.0, 56.0, 71.0, 75.0, 47.0, 58.0, 42.0, 54.0, 35.0, 30.0, 21.0, 12.0, 17.0, 14.0, 8.0, 10.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020160675048828125, -0.0019510090351104736, -0.0018859505653381348, -0.001820892095565796, -0.001755833625793457, -0.0016907751560211182, -0.0016257166862487793, -0.0015606582164764404, -0.0014955997467041016, -0.0014305412769317627, -0.0013654828071594238, -0.001300424337387085, -0.001235365867614746, -0.0011703073978424072, -0.0011052489280700684, -0.0010401904582977295, -0.0009751319885253906, -0.0009100735187530518, -0.0008450150489807129, -0.000779956579208374, -0.0007148981094360352, -0.0006498396396636963, -0.0005847811698913574, -0.0005197227001190186, -0.0004546642303466797, -0.0003896057605743408, -0.00032454729080200195, -0.0002594888210296631, -0.00019443035125732422, -0.00012937188148498535, -6.431341171264648e-05, 7.450580596923828e-07, 6.580352783203125e-05, 0.00013086199760437012, 0.00019592046737670898, 0.00026097893714904785, 0.0003260374069213867, 0.0003910958766937256, 0.00045615434646606445, 0.0005212128162384033, 0.0005862712860107422, 0.0006513297557830811, 0.0007163882255554199, 0.0007814466953277588, 0.0008465051651000977, 0.0009115636348724365, 0.0009766221046447754, 0.0010416805744171143, 0.0011067390441894531, 0.001171797513961792, 0.0012368559837341309, 0.0013019144535064697, 0.0013669729232788086, 0.0014320313930511475, 0.0014970898628234863, 0.0015621483325958252, 0.001627206802368164, 0.001692265272140503, 0.0017573237419128418, 0.0018223822116851807, 0.0018874406814575195, 0.0019524991512298584, 0.0020175576210021973, 0.002082616090774536, 0.002147674560546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 13.0, 13.0, 22.0, 29.0, 39.0, 45.0, 49.0, 74.0, 103.0, 141.0, 137.0, 191.0, 344.0, 716.0, 5486.0, 1028896.0, 9972.0, 807.0, 412.0, 256.0, 158.0, 129.0, 107.0, 78.0, 45.0, 49.0, 28.0, 30.0, 20.0, 27.0, 28.0, 12.0, 6.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0401611328125, -0.038999080657958984, -0.03783702850341797, -0.03667497634887695, -0.03551292419433594, -0.03435087203979492, -0.033188819885253906, -0.03202676773071289, -0.030864715576171875, -0.02970266342163086, -0.028540611267089844, -0.027378559112548828, -0.026216506958007812, -0.025054454803466797, -0.02389240264892578, -0.022730350494384766, -0.02156829833984375, -0.020406246185302734, -0.01924419403076172, -0.018082141876220703, -0.016920089721679688, -0.015758037567138672, -0.014595985412597656, -0.01343393325805664, -0.012271881103515625, -0.01110982894897461, -0.009947776794433594, -0.008785724639892578, -0.0076236724853515625, -0.006461620330810547, -0.005299568176269531, -0.004137516021728516, -0.0029754638671875, -0.0018134117126464844, -0.0006513595581054688, 0.0005106925964355469, 0.0016727447509765625, 0.002834796905517578, 0.003996849060058594, 0.005158901214599609, 0.006320953369140625, 0.007483005523681641, 0.008645057678222656, 0.009807109832763672, 0.010969161987304688, 0.012131214141845703, 0.013293266296386719, 0.014455318450927734, 0.01561737060546875, 0.016779422760009766, 0.01794147491455078, 0.019103527069091797, 0.020265579223632812, 0.021427631378173828, 0.022589683532714844, 0.02375173568725586, 0.024913787841796875, 0.02607583999633789, 0.027237892150878906, 0.028399944305419922, 0.029561996459960938, 0.030724048614501953, 0.03188610076904297, 0.033048152923583984, 0.034210205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 979.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028607146814465523, -0.027993997558951378, -0.027380848303437233, -0.026767700910568237, -0.026154551655054092, -0.025541402399539948, -0.024928253144025803, -0.024315103888511658, -0.023701954632997513, -0.023088805377483368, -0.022475656121969223, -0.021862506866455078, -0.021249359473586082, -0.020636210218071938, -0.020023060962557793, -0.019409911707043648, -0.018796764314174652, -0.018183615058660507, -0.017570465803146362, -0.016957316547632217, -0.016344169154763222, -0.015731019899249077, -0.015117870643734932, -0.014504721388220787, -0.013891572132706642, -0.013278422877192497, -0.012665274553000927, -0.012052125297486782, -0.011438976041972637, -0.010825827717781067, -0.010212678462266922, -0.009599529206752777, -0.008986380882561207, -0.008373231627047062, -0.007760082837194204, -0.007146934047341347, -0.006533784791827202, -0.005920636001974344, -0.005307487212121487, -0.004694337956607342, -0.004081189166754484, -0.003468040144070983, -0.0028548911213874817, -0.002241742331534624, -0.0016285933088511229, -0.0010154442861676216, -0.000402295496314764, 0.00021085375919938087, 0.0008240025490522385, 0.0014371515717357397, 0.002050300594419241, 0.0026634493842720985, 0.0032765984069556, 0.003889747429639101, 0.004502896219491959, 0.0051160454750061035, 0.005729194264858961, 0.006342343054711819, 0.006955492310225964, 0.007568641100078821, 0.008181789889931679, 0.008794939145445824, 0.009408088400959969, 0.010021237656474113, 0.010634385980665684]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 11.0, 10.0, 20.0, 25.0, 26.0, 53.0, 35.0, 36.0, 55.0, 59.0, 55.0, 68.0, 55.0, 69.0, 66.0, 62.0, 52.0, 51.0, 43.0, 37.0, 16.0, 22.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011274218559265137, -0.0010774759575724602, -0.0010275300592184067, -0.0009775841608643532, -0.0009276382625102997, -0.0008776923641562462, -0.0008277464658021927, -0.0007778005674481392, -0.0007278546690940857, -0.0006779087707400322, -0.0006279628723859787, -0.0005780169740319252, -0.0005280710756778717, -0.0004781251773238182, -0.0004281792789697647, -0.0003782333806157112, -0.0003282874822616577, -0.0002783415839076042, -0.00022839568555355072, -0.00017844978719949722, -0.00012850388884544373, -7.855799049139023e-05, -2.861209213733673e-05, 2.1333806216716766e-05, 7.127970457077026e-05, 0.00012122560292482376, 0.00017117150127887726, 0.00022111739963293076, 0.00027106329798698425, 0.00032100919634103775, 0.00037095509469509125, 0.00042090099304914474, 0.00047084689140319824, 0.0005207927897572517, 0.0005707386881113052, 0.0006206845864653587, 0.0006706304848194122, 0.0007205763831734657, 0.0007705222815275192, 0.0008204681798815727, 0.0008704140782356262, 0.0009203599765896797, 0.0009703058749437332, 0.0010202517732977867, 0.0010701976716518402, 0.0011201435700058937, 0.0011700894683599472, 0.0012200353667140007, 0.0012699812650680542, 0.0013199271634221077, 0.0013698730617761612, 0.0014198189601302147, 0.0014697648584842682, 0.0015197107568383217, 0.0015696566551923752, 0.0016196025535464287, 0.0016695484519004822, 0.0017194943502545357, 0.0017694402486085892, 0.0018193861469626427, 0.0018693320453166962, 0.0019192779436707497, 0.001969223842024803, 0.0020191697403788567, 0.00206911563873291]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 13.0, 5.0, 13.0, 26.0, 29.0, 33.0, 64.0, 62.0, 131.0, 181.0, 224.0, 401.0, 512.0, 884.0, 1401.0, 2391.0, 3829.0, 6746.0, 13246.0, 34029.0, 348266.0, 559734.0, 42755.0, 15040.0, 7447.0, 4349.0, 2382.0, 1483.0, 962.0, 613.0, 397.0, 273.0, 188.0, 137.0, 84.0, 57.0, 46.0, 27.0, 29.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.07470703125, -17.4931640625, -16.91162109375, -16.330078125, -15.74853515625, -15.1669921875, -14.58544921875, -14.00390625, -13.42236328125, -12.8408203125, -12.25927734375, -11.677734375, -11.09619140625, -10.5146484375, -9.93310546875, -9.3515625, -8.77001953125, -8.1884765625, -7.60693359375, -7.025390625, -6.44384765625, -5.8623046875, -5.28076171875, -4.69921875, -4.11767578125, -3.5361328125, -2.95458984375, -2.373046875, -1.79150390625, -1.2099609375, -0.62841796875, -0.046875, 0.53466796875, 1.1162109375, 1.69775390625, 2.279296875, 2.86083984375, 3.4423828125, 4.02392578125, 4.60546875, 5.18701171875, 5.7685546875, 6.35009765625, 6.931640625, 7.51318359375, 8.0947265625, 8.67626953125, 9.2578125, 9.83935546875, 10.4208984375, 11.00244140625, 11.583984375, 12.16552734375, 12.7470703125, 13.32861328125, 13.91015625, 14.49169921875, 15.0732421875, 15.65478515625, 16.236328125, 16.81787109375, 17.3994140625, 17.98095703125, 18.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 11.0, 16.0, 24.0, 14.0, 30.0, 32.0, 29.0, 40.0, 37.0, 46.0, 60.0, 56.0, 113.0, 412.0, 1511.0, 162.0, 57.0, 53.0, 49.0, 47.0, 29.0, 47.0, 25.0, 18.0, 19.0, 19.0, 17.0, 9.0, 10.0, 6.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.765625, -15.3408203125, -14.916015625, -14.4912109375, -14.06640625, -13.6416015625, -13.216796875, -12.7919921875, -12.3671875, -11.9423828125, -11.517578125, -11.0927734375, -10.66796875, -10.2431640625, -9.818359375, -9.3935546875, -8.96875, -8.5439453125, -8.119140625, -7.6943359375, -7.26953125, -6.8447265625, -6.419921875, -5.9951171875, -5.5703125, -5.1455078125, -4.720703125, -4.2958984375, -3.87109375, -3.4462890625, -3.021484375, -2.5966796875, -2.171875, -1.7470703125, -1.322265625, -0.8974609375, -0.47265625, -0.0478515625, 0.376953125, 0.8017578125, 1.2265625, 1.6513671875, 2.076171875, 2.5009765625, 2.92578125, 3.3505859375, 3.775390625, 4.2001953125, 4.625, 5.0498046875, 5.474609375, 5.8994140625, 6.32421875, 6.7490234375, 7.173828125, 7.5986328125, 8.0234375, 8.4482421875, 8.873046875, 9.2978515625, 9.72265625, 10.1474609375, 10.572265625, 10.9970703125, 11.421875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 7.0, 21.0, 13.0, 31.0, 18.0, 39.0, 31.0, 62.0, 62.0, 130.0, 273.0, 1353.0, 2075228.0, 1066373.0, 1222.0, 291.0, 141.0, 86.0, 59.0, 36.0, 35.0, 25.0, 21.0, 22.0, 14.0, 17.0, 19.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.69580078125, -45.8603515625, -44.02490234375, -42.189453125, -40.35400390625, -38.5185546875, -36.68310546875, -34.84765625, -33.01220703125, -31.1767578125, -29.34130859375, -27.505859375, -25.67041015625, -23.8349609375, -21.99951171875, -20.1640625, -18.32861328125, -16.4931640625, -14.65771484375, -12.822265625, -10.98681640625, -9.1513671875, -7.31591796875, -5.48046875, -3.64501953125, -1.8095703125, 0.02587890625, 1.861328125, 3.69677734375, 5.5322265625, 7.36767578125, 9.203125, 11.03857421875, 12.8740234375, 14.70947265625, 16.544921875, 18.38037109375, 20.2158203125, 22.05126953125, 23.88671875, 25.72216796875, 27.5576171875, 29.39306640625, 31.228515625, 33.06396484375, 34.8994140625, 36.73486328125, 38.5703125, 40.40576171875, 42.2412109375, 44.07666015625, 45.912109375, 47.74755859375, 49.5830078125, 51.41845703125, 53.25390625, 55.08935546875, 56.9248046875, 58.76025390625, 60.595703125, 62.43115234375, 64.2666015625, 66.10205078125, 67.9375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 94.0, 612.0, 286.0, 18.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.560911178588867, -9.121329307556152, -6.6817474365234375, -4.242165565490723, -1.8025836944580078, 0.636998176574707, 3.076580047607422, 5.51616096496582, 7.955743789672852, 10.395325660705566, 12.834907531738281, 15.274489402770996, 17.71407127380371, 20.15365219116211, 22.59323501586914, 25.03281593322754, 27.47239875793457, 29.91197967529297, 32.3515625, 34.79114532470703, 37.23072814941406, 39.67030715942383, 42.10988998413086, 44.549468994140625, 46.989051818847656, 49.42863464355469, 51.86821746826172, 54.307796478271484, 56.747379302978516, 59.18696212768555, 61.62654113769531, 64.06612396240234, 66.50570678710938, 68.9452896118164, 71.38487243652344, 73.82445526123047, 76.2640380859375, 78.70361328125, 81.14319610595703, 83.58277893066406, 86.0223617553711, 88.46194458007812, 90.90152740478516, 93.34111022949219, 95.78068542480469, 98.22026824951172, 100.65985107421875, 103.09943389892578, 105.53901672363281, 107.97859954833984, 110.41818237304688, 112.8577651977539, 115.29734802246094, 117.73692321777344, 120.17650604248047, 122.6160888671875, 125.05567169189453, 127.49525451660156, 129.93482971191406, 132.37442016601562, 134.81399536132812, 137.2535858154297, 139.6931610107422, 142.13275146484375, 144.57232666015625]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 2.0, 9.0, 10.0, 9.0, 16.0, 12.0, 14.0, 19.0, 18.0, 24.0, 26.0, 29.0, 21.0, 35.0, 32.0, 33.0, 36.0, 41.0, 35.0, 40.0, 44.0, 53.0, 38.0, 41.0, 34.0, 32.0, 38.0, 47.0, 37.0, 26.0, 22.0, 18.0, 22.0, 15.0, 11.0, 12.0, 12.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-46.899314880371094, -45.650611877441406, -44.40190505981445, -43.153202056884766, -41.90449905395508, -40.655792236328125, -39.40708923339844, -38.15838623046875, -36.9096794128418, -35.66097640991211, -34.412269592285156, -33.16356658935547, -31.91486167907715, -30.666156768798828, -29.41745376586914, -28.16874885559082, -26.920045852661133, -25.671340942382812, -24.422637939453125, -23.173933029174805, -21.925228118896484, -20.676525115966797, -19.427820205688477, -18.179115295410156, -16.93041229248047, -15.681708335876465, -14.433003425598145, -13.18429946899414, -11.93559455871582, -10.686890602111816, -9.438186645507812, -8.189481735229492, -6.940776824951172, -5.69207239151001, -4.443367958068848, -3.1946640014648438, -1.9459595680236816, -0.6972551345825195, 0.5514488220214844, 1.8001537322998047, 3.0488576889038086, 4.297562122344971, 5.546266555786133, 6.794970512390137, 8.04367446899414, 9.292379379272461, 10.541083335876465, 11.789788246154785, 13.038492202758789, 14.287196159362793, 15.535901069641113, 16.784605026245117, 18.033309936523438, 19.282012939453125, 20.530717849731445, 21.779422760009766, 23.028125762939453, 24.276830673217773, 25.52553367614746, 26.77423858642578, 28.0229434967041, 29.271648406982422, 30.52035140991211, 31.76905632019043, 33.01776123046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 40.0, 35.0, 36.0, 51.0, 49.0, 49.0, 35.0, 61.0, 72.0, 49.0, 55.0, 53.0, 37.0, 45.0, 52.0, 28.0, 35.0, 32.0, 34.0, 22.0, 16.0, 7.0, 3.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2210693359375, -6.051513671875, -5.8819580078125, -5.71240234375, -5.5428466796875, -5.373291015625, -5.2037353515625, -5.0341796875, -4.8646240234375, -4.695068359375, -4.5255126953125, -4.35595703125, -4.1864013671875, -4.016845703125, -3.8472900390625, -3.677734375, -3.5081787109375, -3.338623046875, -3.1690673828125, -2.99951171875, -2.8299560546875, -2.660400390625, -2.4908447265625, -2.3212890625, -2.1517333984375, -1.982177734375, -1.8126220703125, -1.64306640625, -1.4735107421875, -1.303955078125, -1.1343994140625, -0.96484375, -0.7952880859375, -0.625732421875, -0.4561767578125, -0.28662109375, -0.1170654296875, 0.052490234375, 0.2220458984375, 0.3916015625, 0.5611572265625, 0.730712890625, 0.9002685546875, 1.06982421875, 1.2393798828125, 1.408935546875, 1.5784912109375, 1.748046875, 1.9176025390625, 2.087158203125, 2.2567138671875, 2.42626953125, 2.5958251953125, 2.765380859375, 2.9349365234375, 3.1044921875, 3.2740478515625, 3.443603515625, 3.6131591796875, 3.78271484375, 3.9522705078125, 4.121826171875, 4.2913818359375, 4.4609375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 14.0, 20.0, 40.0, 78.0, 90.0, 179.0, 303.0, 581.0, 1442.0, 4561.0, 24196.0, 390990.0, 3632661.0, 120839.0, 13014.0, 3091.0, 1052.0, 488.0, 227.0, 145.0, 89.0, 70.0, 35.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-40.375, -39.46435546875, -38.5537109375, -37.64306640625, -36.732421875, -35.82177734375, -34.9111328125, -34.00048828125, -33.08984375, -32.17919921875, -31.2685546875, -30.35791015625, -29.447265625, -28.53662109375, -27.6259765625, -26.71533203125, -25.8046875, -24.89404296875, -23.9833984375, -23.07275390625, -22.162109375, -21.25146484375, -20.3408203125, -19.43017578125, -18.51953125, -17.60888671875, -16.6982421875, -15.78759765625, -14.876953125, -13.96630859375, -13.0556640625, -12.14501953125, -11.234375, -10.32373046875, -9.4130859375, -8.50244140625, -7.591796875, -6.68115234375, -5.7705078125, -4.85986328125, -3.94921875, -3.03857421875, -2.1279296875, -1.21728515625, -0.306640625, 0.60400390625, 1.5146484375, 2.42529296875, 3.3359375, 4.24658203125, 5.1572265625, 6.06787109375, 6.978515625, 7.88916015625, 8.7998046875, 9.71044921875, 10.62109375, 11.53173828125, 12.4423828125, 13.35302734375, 14.263671875, 15.17431640625, 16.0849609375, 16.99560546875, 17.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 1.0, 10.0, 9.0, 30.0, 37.0, 71.0, 116.0, 154.0, 259.0, 422.0, 640.0, 763.0, 603.0, 369.0, 234.0, 130.0, 73.0, 61.0, 41.0, 23.0, 9.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.6533203125, -17.947265625, -17.2412109375, -16.53515625, -15.8291015625, -15.123046875, -14.4169921875, -13.7109375, -13.0048828125, -12.298828125, -11.5927734375, -10.88671875, -10.1806640625, -9.474609375, -8.7685546875, -8.0625, -7.3564453125, -6.650390625, -5.9443359375, -5.23828125, -4.5322265625, -3.826171875, -3.1201171875, -2.4140625, -1.7080078125, -1.001953125, -0.2958984375, 0.41015625, 1.1162109375, 1.822265625, 2.5283203125, 3.234375, 3.9404296875, 4.646484375, 5.3525390625, 6.05859375, 6.7646484375, 7.470703125, 8.1767578125, 8.8828125, 9.5888671875, 10.294921875, 11.0009765625, 11.70703125, 12.4130859375, 13.119140625, 13.8251953125, 14.53125, 15.2373046875, 15.943359375, 16.6494140625, 17.35546875, 18.0615234375, 18.767578125, 19.4736328125, 20.1796875, 20.8857421875, 21.591796875, 22.2978515625, 23.00390625, 23.7099609375, 24.416015625, 25.1220703125, 25.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 12.0, 7.0, 8.0, 25.0, 18.0, 45.0, 56.0, 105.0, 176.0, 377.0, 1285.0, 16107.0, 3893395.0, 277834.0, 3443.0, 669.0, 327.0, 142.0, 76.0, 61.0, 17.0, 30.0, 18.0, 13.0, 12.0, 6.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -44.40869140625, -42.1611328125, -39.91357421875, -37.666015625, -35.41845703125, -33.1708984375, -30.92333984375, -28.67578125, -26.42822265625, -24.1806640625, -21.93310546875, -19.685546875, -17.43798828125, -15.1904296875, -12.94287109375, -10.6953125, -8.44775390625, -6.2001953125, -3.95263671875, -1.705078125, 0.54248046875, 2.7900390625, 5.03759765625, 7.28515625, 9.53271484375, 11.7802734375, 14.02783203125, 16.275390625, 18.52294921875, 20.7705078125, 23.01806640625, 25.265625, 27.51318359375, 29.7607421875, 32.00830078125, 34.255859375, 36.50341796875, 38.7509765625, 40.99853515625, 43.24609375, 45.49365234375, 47.7412109375, 49.98876953125, 52.236328125, 54.48388671875, 56.7314453125, 58.97900390625, 61.2265625, 63.47412109375, 65.7216796875, 67.96923828125, 70.216796875, 72.46435546875, 74.7119140625, 76.95947265625, 79.20703125, 81.45458984375, 83.7021484375, 85.94970703125, 88.197265625, 90.44482421875, 92.6923828125, 94.93994140625, 97.1875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 36.0, 151.0, 460.0, 280.0, 77.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.6538848876953, -163.9443359375, -158.23477172851562, -152.5252227783203, -146.815673828125, -141.10610961914062, -135.3965606689453, -129.68701171875, -123.97745513916016, -118.26789855957031, -112.558349609375, -106.84879302978516, -101.13923645019531, -95.4296875, -89.72013092041016, -84.01057434082031, -78.301025390625, -72.59146881103516, -66.88191986083984, -61.17236328125, -55.46281051635742, -49.753257751464844, -44.043701171875, -38.33414840698242, -32.624595642089844, -26.915042877197266, -21.205488204956055, -15.495933532714844, -9.786380767822266, -4.0768280029296875, 1.6327285766601562, 7.342281341552734, 13.051849365234375, 18.761402130126953, 24.470956802368164, 30.180511474609375, 35.89006423950195, 41.59961700439453, 47.309173583984375, 53.01872634887695, 58.72827911376953, 64.43783569335938, 70.14738464355469, 75.85694122314453, 81.56649780273438, 87.27604675292969, 92.98560333251953, 98.69515991210938, 104.40470886230469, 110.11426544189453, 115.82381439208984, 121.53337097167969, 127.242919921875, 132.95248413085938, 138.6620330810547, 144.37158203125, 150.08114624023438, 155.7906951904297, 161.50025939941406, 167.20980834960938, 172.9193572998047, 178.62890625, 184.33847045898438, 190.0480194091797, 195.757568359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 20.0, 14.0, 24.0, 19.0, 18.0, 19.0, 35.0, 44.0, 42.0, 42.0, 53.0, 51.0, 48.0, 38.0, 44.0, 48.0, 47.0, 32.0, 43.0, 23.0, 41.0, 29.0, 32.0, 24.0, 38.0, 21.0, 16.0, 13.0, 15.0, 2.0, 9.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.267303466796875, -51.675743103027344, -50.08417892456055, -48.492618560791016, -46.90105438232422, -45.30949401855469, -43.717933654785156, -42.126373291015625, -40.53480911254883, -38.9432487487793, -37.3516845703125, -35.76012420654297, -34.16856384277344, -32.57699966430664, -30.98543930053711, -29.393877029418945, -27.80231475830078, -26.210752487182617, -24.619190216064453, -23.027629852294922, -21.436067581176758, -19.844505310058594, -18.252944946289062, -16.6613826751709, -15.069820404052734, -13.47825813293457, -11.886696815490723, -10.295135498046875, -8.703573226928711, -7.112011432647705, -5.520449638366699, -3.9288883209228516, -2.3373260498046875, -0.7457642555236816, 0.8457975387573242, 2.43735933303833, 4.028921127319336, 5.620482921600342, 7.212044715881348, 8.803606033325195, 10.39516830444336, 11.986730575561523, 13.578291893005371, 15.169853210449219, 16.761415481567383, 18.352977752685547, 19.944538116455078, 21.536100387573242, 23.127662658691406, 24.71922492980957, 26.310787200927734, 27.902347564697266, 29.49390983581543, 31.085472106933594, 32.677032470703125, 34.268592834472656, 35.86015701293945, 37.451717376708984, 39.04328155517578, 40.63484191894531, 42.226402282714844, 43.81796646118164, 45.40952682495117, 47.00109100341797, 48.5926513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 23.0, 25.0, 37.0, 63.0, 99.0, 149.0, 189.0, 300.0, 470.0, 723.0, 1155.0, 1642.0, 2769.0, 4415.0, 6930.0, 11315.0, 18100.0, 29291.0, 48200.0, 79185.0, 126807.0, 179916.0, 186340.0, 133353.0, 84004.0, 50657.0, 31157.0, 19255.0, 11853.0, 7508.0, 4510.0, 2835.0, 1842.0, 1213.0, 736.0, 518.0, 313.0, 173.0, 175.0, 102.0, 70.0, 32.0, 27.0, 21.0, 16.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3854179382324219, -0.37215423583984375, -0.3588905334472656, -0.3456268310546875, -0.3323631286621094, -0.31909942626953125, -0.3058357238769531, -0.292572021484375, -0.2793083190917969, -0.26604461669921875, -0.2527809143066406, -0.2395172119140625, -0.22625350952148438, -0.21298980712890625, -0.19972610473632812, -0.18646240234375, -0.17319869995117188, -0.15993499755859375, -0.14667129516601562, -0.1334075927734375, -0.12014389038085938, -0.10688018798828125, -0.09361648559570312, -0.080352783203125, -0.06708908081054688, -0.05382537841796875, -0.040561676025390625, -0.0272979736328125, -0.014034271240234375, -0.00077056884765625, 0.012493133544921875, 0.0257568359375, 0.039020538330078125, 0.05228424072265625, 0.06554794311523438, 0.0788116455078125, 0.09207534790039062, 0.10533905029296875, 0.11860275268554688, 0.131866455078125, 0.14513015747070312, 0.15839385986328125, 0.17165756225585938, 0.1849212646484375, 0.19818496704101562, 0.21144866943359375, 0.22471237182617188, 0.23797607421875, 0.2512397766113281, 0.26450347900390625, 0.2777671813964844, 0.2910308837890625, 0.3042945861816406, 0.31755828857421875, 0.3308219909667969, 0.344085693359375, 0.3573493957519531, 0.37061309814453125, 0.3838768005371094, 0.3971405029296875, 0.4104042053222656, 0.42366790771484375, 0.4369316101074219, 0.4501953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 7.0, 12.0, 11.0, 12.0, 21.0, 13.0, 16.0, 20.0, 28.0, 48.0, 36.0, 35.0, 49.0, 57.0, 51.0, 41.0, 1070.0, 53.0, 56.0, 53.0, 45.0, 32.0, 30.0, 38.0, 30.0, 27.0, 28.0, 23.0, 24.0, 7.0, 10.0, 9.0, 9.0, 17.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.231353759765625, -3.13458251953125, -3.037811279296875, -2.9410400390625, -2.844268798828125, -2.74749755859375, -2.650726318359375, -2.553955078125, -2.457183837890625, -2.36041259765625, -2.263641357421875, -2.1668701171875, -2.070098876953125, -1.97332763671875, -1.876556396484375, -1.77978515625, -1.683013916015625, -1.58624267578125, -1.489471435546875, -1.3927001953125, -1.295928955078125, -1.19915771484375, -1.102386474609375, -1.005615234375, -0.908843994140625, -0.81207275390625, -0.715301513671875, -0.6185302734375, -0.521759033203125, -0.42498779296875, -0.328216552734375, -0.2314453125, -0.134674072265625, -0.03790283203125, 0.058868408203125, 0.1556396484375, 0.252410888671875, 0.34918212890625, 0.445953369140625, 0.542724609375, 0.639495849609375, 0.73626708984375, 0.833038330078125, 0.9298095703125, 1.026580810546875, 1.12335205078125, 1.220123291015625, 1.31689453125, 1.413665771484375, 1.51043701171875, 1.607208251953125, 1.7039794921875, 1.800750732421875, 1.89752197265625, 1.994293212890625, 2.091064453125, 2.187835693359375, 2.28460693359375, 2.381378173828125, 2.4781494140625, 2.574920654296875, 2.67169189453125, 2.768463134765625, 2.865234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 26.0, 31.0, 55.0, 90.0, 164.0, 262.0, 417.0, 658.0, 1018.0, 1716.0, 2793.0, 4563.0, 7677.0, 12990.0, 21925.0, 37430.0, 63105.0, 101756.0, 151310.0, 1231360.0, 164621.0, 115425.0, 71977.0, 43097.0, 25598.0, 14868.0, 8677.0, 5322.0, 3220.0, 1934.0, 1150.0, 706.0, 417.0, 262.0, 194.0, 93.0, 49.0, 50.0, 29.0, 21.0, 15.0, 13.0, 9.0, 3.0, 3.0, 5.0, 0.0, 4.0], "bins": [-0.363037109375, -0.35285186767578125, -0.3426666259765625, -0.33248138427734375, -0.322296142578125, -0.31211090087890625, -0.3019256591796875, -0.29174041748046875, -0.28155517578125, -0.27136993408203125, -0.2611846923828125, -0.25099945068359375, -0.240814208984375, -0.23062896728515625, -0.2204437255859375, -0.21025848388671875, -0.2000732421875, -0.18988800048828125, -0.1797027587890625, -0.16951751708984375, -0.159332275390625, -0.14914703369140625, -0.1389617919921875, -0.12877655029296875, -0.11859130859375, -0.10840606689453125, -0.0982208251953125, -0.08803558349609375, -0.077850341796875, -0.06766510009765625, -0.0574798583984375, -0.04729461669921875, -0.037109375, -0.02692413330078125, -0.0167388916015625, -0.00655364990234375, 0.003631591796875, 0.01381683349609375, 0.0240020751953125, 0.03418731689453125, 0.04437255859375, 0.05455780029296875, 0.0647430419921875, 0.07492828369140625, 0.085113525390625, 0.09529876708984375, 0.1054840087890625, 0.11566925048828125, 0.1258544921875, 0.13603973388671875, 0.1462249755859375, 0.15641021728515625, 0.166595458984375, 0.17678070068359375, 0.1869659423828125, 0.19715118408203125, 0.20733642578125, 0.21752166748046875, 0.2277069091796875, 0.23789215087890625, 0.248077392578125, 0.25826263427734375, 0.2684478759765625, 0.27863311767578125, 0.288818359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 3.0, 7.0, 4.0, 12.0, 17.0, 18.0, 19.0, 25.0, 29.0, 34.0, 44.0, 39.0, 56.0, 48.0, 58.0, 75.0, 64.0, 67.0, 52.0, 47.0, 44.0, 38.0, 29.0, 33.0, 25.0, 24.0, 28.0, 16.0, 13.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023345947265625, -0.0022717267274856567, -0.0022088587284088135, -0.00214599072933197, -0.002083122730255127, -0.0020202547311782837, -0.0019573867321014404, -0.0018945187330245972, -0.001831650733947754, -0.0017687827348709106, -0.0017059147357940674, -0.0016430467367172241, -0.0015801787376403809, -0.0015173107385635376, -0.0014544427394866943, -0.001391574740409851, -0.0013287067413330078, -0.0012658387422561646, -0.0012029707431793213, -0.001140102744102478, -0.0010772347450256348, -0.0010143667459487915, -0.0009514987468719482, -0.000888630747795105, -0.0008257627487182617, -0.0007628947496414185, -0.0007000267505645752, -0.0006371587514877319, -0.0005742907524108887, -0.0005114227533340454, -0.00044855475425720215, -0.0003856867551803589, -0.0003228187561035156, -0.00025995075702667236, -0.0001970827579498291, -0.00013421475887298584, -7.134675979614258e-05, -8.478760719299316e-06, 5.4389238357543945e-05, 0.00011725723743438721, 0.00018012523651123047, 0.00024299323558807373, 0.000305861234664917, 0.00036872923374176025, 0.0004315972328186035, 0.0004944652318954468, 0.00055733323097229, 0.0006202012300491333, 0.0006830692291259766, 0.0007459372282028198, 0.0008088052272796631, 0.0008716732263565063, 0.0009345412254333496, 0.0009974092245101929, 0.0010602772235870361, 0.0011231452226638794, 0.0011860132217407227, 0.001248881220817566, 0.0013117492198944092, 0.0013746172189712524, 0.0014374852180480957, 0.001500353217124939, 0.0015632212162017822, 0.0016260892152786255, 0.0016889572143554688]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 12.0, 17.0, 27.0, 34.0, 41.0, 47.0, 70.0, 72.0, 95.0, 130.0, 187.0, 300.0, 598.0, 3586.0, 1026557.0, 14843.0, 751.0, 329.0, 230.0, 129.0, 109.0, 102.0, 82.0, 47.0, 38.0, 24.0, 25.0, 16.0, 7.0, 10.0, 12.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042236328125, -0.04085731506347656, -0.039478302001953125, -0.03809928894042969, -0.03672027587890625, -0.03534126281738281, -0.033962249755859375, -0.03258323669433594, -0.0312042236328125, -0.029825210571289062, -0.028446197509765625, -0.027067184448242188, -0.02568817138671875, -0.024309158325195312, -0.022930145263671875, -0.021551132202148438, -0.020172119140625, -0.018793106079101562, -0.017414093017578125, -0.016035079956054688, -0.01465606689453125, -0.013277053833007812, -0.011898040771484375, -0.010519027709960938, -0.0091400146484375, -0.0077610015869140625, -0.006381988525390625, -0.0050029754638671875, -0.00362396240234375, -0.0022449493408203125, -0.000865936279296875, 0.0005130767822265625, 0.00189208984375, 0.0032711029052734375, 0.004650115966796875, 0.0060291290283203125, 0.00740814208984375, 0.008787155151367188, 0.010166168212890625, 0.011545181274414062, 0.0129241943359375, 0.014303207397460938, 0.015682220458984375, 0.017061233520507812, 0.01844024658203125, 0.019819259643554688, 0.021198272705078125, 0.022577285766601562, 0.023956298828125, 0.025335311889648438, 0.026714324951171875, 0.028093338012695312, 0.02947235107421875, 0.030851364135742188, 0.032230377197265625, 0.03360939025878906, 0.0349884033203125, 0.03636741638183594, 0.037746429443359375, 0.03912544250488281, 0.04050445556640625, 0.04188346862792969, 0.043262481689453125, 0.04464149475097656, 0.0460205078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 524.0, 492.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02187264710664749, -0.02111779898405075, -0.02036294899880886, -0.01960810087621212, -0.01885325089097023, -0.01809840276837349, -0.01734355464577675, -0.01658870466053486, -0.01583385467529297, -0.015079005621373653, -0.014324156567454338, -0.013569308444857597, -0.012814458459615707, -0.012059610337018967, -0.011304761283099651, -0.010549912229180336, -0.009795064106583595, -0.00904021505266428, -0.008285365998744965, -0.007530517410486937, -0.006775668356567621, -0.006020819302648306, -0.005265970714390278, -0.0045111216604709625, -0.003756272606551647, -0.003001423552632332, -0.00224657473154366, -0.0014917259104549885, -0.0007368768565356731, 1.7972197383642197e-05, 0.0007728207856416702, 0.0015276698395609856, 0.00228252075612545, 0.0030373698100447655, 0.003792218631133437, 0.004547067452222109, 0.005301916506141424, 0.0060567655600607395, 0.0068116141483187675, 0.007566463202238083, 0.008321312256157398, 0.009076161310076714, 0.009831010363996029, 0.010585859417915344, 0.011340707540512085, 0.012095557525753975, 0.012850405648350716, 0.013605254702270031, 0.014360103756189346, 0.015114952810108662, 0.015869801864027977, 0.016624649986624718, 0.017379499971866608, 0.01813434809446335, 0.01888919621706009, 0.01964404620230198, 0.02039889618754387, 0.02115374431014061, 0.0219085942953825, 0.02266344241797924, 0.02341829240322113, 0.02417314052581787, 0.024927988648414612, 0.025682838633656502, 0.026437686756253242]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 13.0, 9.0, 13.0, 16.0, 22.0, 33.0, 19.0, 32.0, 35.0, 48.0, 59.0, 52.0, 38.0, 50.0, 47.0, 50.0, 68.0, 54.0, 51.0, 31.0, 33.0, 30.0, 37.0, 29.0, 22.0, 18.0, 15.0, 11.0, 15.0, 8.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000983893871307373, -0.0009442325681447983, -0.0009045712649822235, -0.0008649099618196487, -0.000825248658657074, -0.0007855873554944992, -0.0007459260523319244, -0.0007062647491693497, -0.0006666034460067749, -0.0006269421428442001, -0.0005872808396816254, -0.0005476195365190506, -0.0005079582333564758, -0.00046829693019390106, -0.0004286356270313263, -0.0003889743238687515, -0.00034931302070617676, -0.000309651717543602, -0.0002699904143810272, -0.00023032911121845245, -0.00019066780805587769, -0.00015100650489330292, -0.00011134520173072815, -7.168389856815338e-05, -3.202259540557861e-05, 7.638707756996155e-06, 4.730001091957092e-05, 8.696131408214569e-05, 0.00012662261724472046, 0.00016628392040729523, 0.00020594522356987, 0.00024560652673244476, 0.00028526782989501953, 0.0003249291330575943, 0.00036459043622016907, 0.00040425173938274384, 0.0004439130425453186, 0.00048357434570789337, 0.0005232356488704681, 0.0005628969520330429, 0.0006025582551956177, 0.0006422195583581924, 0.0006818808615207672, 0.000721542164683342, 0.0007612034678459167, 0.0008008647710084915, 0.0008405260741710663, 0.000880187377333641, 0.0009198486804962158, 0.0009595099836587906, 0.0009991712868213654, 0.0010388325899839401, 0.001078493893146515, 0.0011181551963090897, 0.0011578164994716644, 0.0011974778026342392, 0.001237139105796814, 0.0012768004089593887, 0.0013164617121219635, 0.0013561230152845383, 0.001395784318447113, 0.0014354456216096878, 0.0014751069247722626, 0.0015147682279348373, 0.0015544295310974121]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 25.0, 26.0, 38.0, 69.0, 112.0, 131.0, 231.0, 328.0, 602.0, 1074.0, 2405.0, 6356.0, 23466.0, 104769.0, 502465.0, 320371.0, 62366.0, 14984.0, 4629.0, 1797.0, 882.0, 460.0, 344.0, 225.0, 131.0, 74.0, 57.0, 34.0, 32.0, 13.0, 12.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.05224609375, -4.8935546875, -4.73486328125, -4.576171875, -4.41748046875, -4.2587890625, -4.10009765625, -3.94140625, -3.78271484375, -3.6240234375, -3.46533203125, -3.306640625, -3.14794921875, -2.9892578125, -2.83056640625, -2.671875, -2.51318359375, -2.3544921875, -2.19580078125, -2.037109375, -1.87841796875, -1.7197265625, -1.56103515625, -1.40234375, -1.24365234375, -1.0849609375, -0.92626953125, -0.767578125, -0.60888671875, -0.4501953125, -0.29150390625, -0.1328125, 0.02587890625, 0.1845703125, 0.34326171875, 0.501953125, 0.66064453125, 0.8193359375, 0.97802734375, 1.13671875, 1.29541015625, 1.4541015625, 1.61279296875, 1.771484375, 1.93017578125, 2.0888671875, 2.24755859375, 2.40625, 2.56494140625, 2.7236328125, 2.88232421875, 3.041015625, 3.19970703125, 3.3583984375, 3.51708984375, 3.67578125, 3.83447265625, 3.9931640625, 4.15185546875, 4.310546875, 4.46923828125, 4.6279296875, 4.78662109375, 4.9453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 16.0, 16.0, 13.0, 9.0, 18.0, 21.0, 25.0, 26.0, 34.0, 39.0, 28.0, 37.0, 42.0, 52.0, 60.0, 147.0, 1772.0, 196.0, 75.0, 50.0, 36.0, 28.0, 31.0, 30.0, 35.0, 30.0, 32.0, 18.0, 12.0, 20.0, 16.0, 8.0, 13.0, 6.0, 8.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-16.265625, -15.8212890625, -15.376953125, -14.9326171875, -14.48828125, -14.0439453125, -13.599609375, -13.1552734375, -12.7109375, -12.2666015625, -11.822265625, -11.3779296875, -10.93359375, -10.4892578125, -10.044921875, -9.6005859375, -9.15625, -8.7119140625, -8.267578125, -7.8232421875, -7.37890625, -6.9345703125, -6.490234375, -6.0458984375, -5.6015625, -5.1572265625, -4.712890625, -4.2685546875, -3.82421875, -3.3798828125, -2.935546875, -2.4912109375, -2.046875, -1.6025390625, -1.158203125, -0.7138671875, -0.26953125, 0.1748046875, 0.619140625, 1.0634765625, 1.5078125, 1.9521484375, 2.396484375, 2.8408203125, 3.28515625, 3.7294921875, 4.173828125, 4.6181640625, 5.0625, 5.5068359375, 5.951171875, 6.3955078125, 6.83984375, 7.2841796875, 7.728515625, 8.1728515625, 8.6171875, 9.0615234375, 9.505859375, 9.9501953125, 10.39453125, 10.8388671875, 11.283203125, 11.7275390625, 12.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 3.0, 5.0, 10.0, 14.0, 11.0, 10.0, 19.0, 9.0, 21.0, 28.0, 34.0, 30.0, 48.0, 45.0, 71.0, 110.0, 205.0, 430.0, 1472.0, 29980.0, 3098407.0, 12455.0, 1182.0, 415.0, 178.0, 103.0, 69.0, 51.0, 53.0, 34.0, 24.0, 32.0, 19.0, 17.0, 14.0, 16.0, 8.0, 12.0, 15.0, 8.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.296875, -24.374267578125, -23.45166015625, -22.529052734375, -21.6064453125, -20.683837890625, -19.76123046875, -18.838623046875, -17.916015625, -16.993408203125, -16.07080078125, -15.148193359375, -14.2255859375, -13.302978515625, -12.38037109375, -11.457763671875, -10.53515625, -9.612548828125, -8.68994140625, -7.767333984375, -6.8447265625, -5.922119140625, -4.99951171875, -4.076904296875, -3.154296875, -2.231689453125, -1.30908203125, -0.386474609375, 0.5361328125, 1.458740234375, 2.38134765625, 3.303955078125, 4.2265625, 5.149169921875, 6.07177734375, 6.994384765625, 7.9169921875, 8.839599609375, 9.76220703125, 10.684814453125, 11.607421875, 12.530029296875, 13.45263671875, 14.375244140625, 15.2978515625, 16.220458984375, 17.14306640625, 18.065673828125, 18.98828125, 19.910888671875, 20.83349609375, 21.756103515625, 22.6787109375, 23.601318359375, 24.52392578125, 25.446533203125, 26.369140625, 27.291748046875, 28.21435546875, 29.136962890625, 30.0595703125, 30.982177734375, 31.90478515625, 32.827392578125, 33.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [19.0, 408.0, 574.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.012465476989746, -2.6173341274261475, -0.22220277786254883, 2.172928810119629, 4.568059921264648, 6.963191032409668, 9.358323097229004, 11.753453254699707, 14.148585319519043, 16.543716430664062, 18.9388484954834, 21.333980560302734, 23.729110717773438, 26.12424087524414, 28.51937484741211, 30.914505004882812, 33.309635162353516, 35.70476531982422, 38.09989929199219, 40.49502944946289, 42.890159606933594, 45.28529357910156, 47.680423736572266, 50.07555389404297, 52.47068786621094, 54.86581802368164, 57.26095199584961, 59.65608215332031, 62.051212310791016, 64.44634246826172, 66.84147644042969, 69.23660278320312, 71.6317367553711, 74.02687072753906, 76.4219970703125, 78.81713104248047, 81.21226501464844, 83.60739135742188, 86.00252532958984, 88.39765930175781, 90.79278564453125, 93.18791961669922, 95.58304595947266, 97.97817993164062, 100.3733139038086, 102.76844024658203, 105.16357421875, 107.55870056152344, 109.95384216308594, 112.3489761352539, 114.74410247802734, 117.13923645019531, 119.53437042236328, 121.92949676513672, 124.32463073730469, 126.71975708007812, 129.11488342285156, 131.510009765625, 133.9051513671875, 136.30027770996094, 138.69540405273438, 141.09054565429688, 143.4856719970703, 145.88079833984375, 148.27593994140625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 14.0, 9.0, 7.0, 12.0, 17.0, 21.0, 21.0, 28.0, 29.0, 28.0, 27.0, 26.0, 46.0, 42.0, 62.0, 48.0, 38.0, 47.0, 49.0, 52.0, 51.0, 43.0, 35.0, 35.0, 39.0, 31.0, 27.0, 15.0, 16.0, 16.0, 9.0, 14.0, 13.0, 12.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.16040802001953, -45.56102752685547, -43.961647033691406, -42.362266540527344, -40.76288604736328, -39.16350555419922, -37.564125061035156, -35.964744567871094, -34.36536407470703, -32.76598358154297, -31.166603088378906, -29.567222595214844, -27.96784210205078, -26.36846160888672, -24.769079208374023, -23.16969871520996, -21.570316314697266, -19.970935821533203, -18.37155532836914, -16.772174835205078, -15.1727933883667, -13.573412895202637, -11.974031448364258, -10.374650955200195, -8.775270462036133, -7.17588996887207, -5.57650899887085, -3.977128028869629, -2.3777475357055664, -0.7783670425415039, 0.821014404296875, 2.4203948974609375, 4.019775390625, 5.6191558837890625, 7.218536853790283, 8.817917823791504, 10.417298316955566, 12.016678810119629, 13.616060256958008, 15.21544075012207, 16.814821243286133, 18.414201736450195, 20.013582229614258, 21.612964630126953, 23.212345123291016, 24.811725616455078, 26.41110610961914, 28.010486602783203, 29.609867095947266, 31.209247589111328, 32.80862808227539, 34.40800857543945, 36.007389068603516, 37.60676956176758, 39.206153869628906, 40.80553436279297, 42.40491485595703, 44.004295349121094, 45.603675842285156, 47.20305633544922, 48.80243682861328, 50.401817321777344, 52.001197814941406, 53.60057830810547, 55.19995880126953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 8.0, 16.0, 9.0, 14.0, 24.0, 25.0, 34.0, 31.0, 47.0, 42.0, 49.0, 34.0, 46.0, 54.0, 59.0, 41.0, 66.0, 61.0, 36.0, 40.0, 46.0, 34.0, 32.0, 32.0, 18.0, 22.0, 27.0, 19.0, 12.0, 5.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.122802734375, -4.95654296875, -4.790283203125, -4.6240234375, -4.457763671875, -4.29150390625, -4.125244140625, -3.958984375, -3.792724609375, -3.62646484375, -3.460205078125, -3.2939453125, -3.127685546875, -2.96142578125, -2.795166015625, -2.62890625, -2.462646484375, -2.29638671875, -2.130126953125, -1.9638671875, -1.797607421875, -1.63134765625, -1.465087890625, -1.298828125, -1.132568359375, -0.96630859375, -0.800048828125, -0.6337890625, -0.467529296875, -0.30126953125, -0.135009765625, 0.03125, 0.197509765625, 0.36376953125, 0.530029296875, 0.6962890625, 0.862548828125, 1.02880859375, 1.195068359375, 1.361328125, 1.527587890625, 1.69384765625, 1.860107421875, 2.0263671875, 2.192626953125, 2.35888671875, 2.525146484375, 2.69140625, 2.857666015625, 3.02392578125, 3.190185546875, 3.3564453125, 3.522705078125, 3.68896484375, 3.855224609375, 4.021484375, 4.187744140625, 4.35400390625, 4.520263671875, 4.6865234375, 4.852783203125, 5.01904296875, 5.185302734375, 5.3515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 2.0, 3.0, 10.0, 5.0, 13.0, 12.0, 19.0, 25.0, 39.0, 49.0, 52.0, 94.0, 138.0, 298.0, 832.0, 3017.0, 19772.0, 366154.0, 3563850.0, 221603.0, 14459.0, 2437.0, 708.0, 260.0, 143.0, 67.0, 54.0, 48.0, 32.0, 20.0, 21.0, 20.0, 6.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.801025390625, -21.14892578125, -20.496826171875, -19.8447265625, -19.192626953125, -18.54052734375, -17.888427734375, -17.236328125, -16.584228515625, -15.93212890625, -15.280029296875, -14.6279296875, -13.975830078125, -13.32373046875, -12.671630859375, -12.01953125, -11.367431640625, -10.71533203125, -10.063232421875, -9.4111328125, -8.759033203125, -8.10693359375, -7.454833984375, -6.802734375, -6.150634765625, -5.49853515625, -4.846435546875, -4.1943359375, -3.542236328125, -2.89013671875, -2.238037109375, -1.5859375, -0.933837890625, -0.28173828125, 0.370361328125, 1.0224609375, 1.674560546875, 2.32666015625, 2.978759765625, 3.630859375, 4.282958984375, 4.93505859375, 5.587158203125, 6.2392578125, 6.891357421875, 7.54345703125, 8.195556640625, 8.84765625, 9.499755859375, 10.15185546875, 10.803955078125, 11.4560546875, 12.108154296875, 12.76025390625, 13.412353515625, 14.064453125, 14.716552734375, 15.36865234375, 16.020751953125, 16.6728515625, 17.324951171875, 17.97705078125, 18.629150390625, 19.28125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 10.0, 8.0, 11.0, 25.0, 29.0, 51.0, 99.0, 138.0, 198.0, 332.0, 473.0, 606.0, 659.0, 485.0, 361.0, 221.0, 118.0, 98.0, 56.0, 36.0, 26.0, 16.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.44677734375, -16.8466796875, -16.24658203125, -15.646484375, -15.04638671875, -14.4462890625, -13.84619140625, -13.24609375, -12.64599609375, -12.0458984375, -11.44580078125, -10.845703125, -10.24560546875, -9.6455078125, -9.04541015625, -8.4453125, -7.84521484375, -7.2451171875, -6.64501953125, -6.044921875, -5.44482421875, -4.8447265625, -4.24462890625, -3.64453125, -3.04443359375, -2.4443359375, -1.84423828125, -1.244140625, -0.64404296875, -0.0439453125, 0.55615234375, 1.15625, 1.75634765625, 2.3564453125, 2.95654296875, 3.556640625, 4.15673828125, 4.7568359375, 5.35693359375, 5.95703125, 6.55712890625, 7.1572265625, 7.75732421875, 8.357421875, 8.95751953125, 9.5576171875, 10.15771484375, 10.7578125, 11.35791015625, 11.9580078125, 12.55810546875, 13.158203125, 13.75830078125, 14.3583984375, 14.95849609375, 15.55859375, 16.15869140625, 16.7587890625, 17.35888671875, 17.958984375, 18.55908203125, 19.1591796875, 19.75927734375, 20.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 23.0, 22.0, 41.0, 83.0, 120.0, 231.0, 383.0, 985.0, 4300.0, 70229.0, 3707947.0, 396397.0, 10611.0, 1601.0, 596.0, 304.0, 135.0, 84.0, 63.0, 32.0, 34.0, 14.0, 7.0, 8.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.44580078125, -31.0166015625, -29.58740234375, -28.158203125, -26.72900390625, -25.2998046875, -23.87060546875, -22.44140625, -21.01220703125, -19.5830078125, -18.15380859375, -16.724609375, -15.29541015625, -13.8662109375, -12.43701171875, -11.0078125, -9.57861328125, -8.1494140625, -6.72021484375, -5.291015625, -3.86181640625, -2.4326171875, -1.00341796875, 0.42578125, 1.85498046875, 3.2841796875, 4.71337890625, 6.142578125, 7.57177734375, 9.0009765625, 10.43017578125, 11.859375, 13.28857421875, 14.7177734375, 16.14697265625, 17.576171875, 19.00537109375, 20.4345703125, 21.86376953125, 23.29296875, 24.72216796875, 26.1513671875, 27.58056640625, 29.009765625, 30.43896484375, 31.8681640625, 33.29736328125, 34.7265625, 36.15576171875, 37.5849609375, 39.01416015625, 40.443359375, 41.87255859375, 43.3017578125, 44.73095703125, 46.16015625, 47.58935546875, 49.0185546875, 50.44775390625, 51.876953125, 53.30615234375, 54.7353515625, 56.16455078125, 57.59375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 31.0, 232.0, 461.0, 243.0, 42.0, 6.0, 0.0, 1.0], "bins": [-401.98382568359375, -395.11151123046875, -388.2391662597656, -381.3668518066406, -374.4945068359375, -367.6221923828125, -360.7498779296875, -353.8775329589844, -347.0052185058594, -340.1329040527344, -333.26055908203125, -326.38824462890625, -319.5158996582031, -312.6435852050781, -305.771240234375, -298.89892578125, -292.026611328125, -285.154296875, -278.2819519042969, -271.4096374511719, -264.53729248046875, -257.66497802734375, -250.7926483154297, -243.92031860351562, -237.0479736328125, -230.17564392089844, -223.30331420898438, -216.43099975585938, -209.5586700439453, -202.68634033203125, -195.8140106201172, -188.94168090820312, -182.06936645507812, -175.19703674316406, -168.32470703125, -161.452392578125, -154.58006286621094, -147.70773315429688, -140.8354034423828, -133.96307373046875, -127.09074401855469, -120.21841430664062, -113.3460922241211, -106.47376251220703, -99.6014404296875, -92.72911071777344, -85.85678100585938, -78.98445129394531, -72.11212921142578, -65.23979949951172, -58.36747741699219, -51.495147705078125, -44.62282180786133, -37.75049591064453, -30.87816619873047, -24.005840301513672, -17.133514404296875, -10.261187553405762, -3.3888607025146484, 3.4834671020507812, 10.355792999267578, 17.228118896484375, 24.100448608398438, 30.972774505615234, 37.84510040283203]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 6.0, 4.0, 8.0, 10.0, 9.0, 15.0, 4.0, 10.0, 12.0, 9.0, 18.0, 13.0, 26.0, 26.0, 17.0, 26.0, 25.0, 42.0, 28.0, 33.0, 34.0, 16.0, 44.0, 32.0, 25.0, 34.0, 44.0, 33.0, 42.0, 22.0, 36.0, 32.0, 18.0, 25.0, 25.0, 21.0, 22.0, 21.0, 22.0, 12.0, 13.0, 12.0, 6.0, 8.0, 10.0, 13.0, 11.0, 5.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-35.4333381652832, -34.29182434082031, -33.150306701660156, -32.008792877197266, -30.867279052734375, -29.72576332092285, -28.584247589111328, -27.442733764648438, -26.301218032836914, -25.15970230102539, -24.0181884765625, -22.876672744750977, -21.735157012939453, -20.593643188476562, -19.45212745666504, -18.310611724853516, -17.169097900390625, -16.0275821685791, -14.886068344116211, -13.744552612304688, -12.60303783416748, -11.461523056030273, -10.32000732421875, -9.178492546081543, -8.036977767944336, -6.895462989807129, -5.753947734832764, -4.612432479858398, -3.4709177017211914, -2.3294029235839844, -1.1878876686096191, -0.046372413635253906, 1.0951461791992188, 2.236661195755005, 3.378176212310791, 4.519691467285156, 5.661206245422363, 6.80272102355957, 7.9442362785339355, 9.0857515335083, 10.227266311645508, 11.368781089782715, 12.510295867919922, 13.651811599731445, 14.793326377868652, 15.93484115600586, 17.076356887817383, 18.217872619628906, 19.359386444091797, 20.50090217590332, 21.64241600036621, 22.783931732177734, 23.925445556640625, 25.06696128845215, 26.208477020263672, 27.349990844726562, 28.491506576538086, 29.63302230834961, 30.7745361328125, 31.916051864624023, 33.05756759643555, 34.19908142089844, 35.34059524536133, 36.482112884521484, 37.623626708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 8.0, 14.0, 21.0, 29.0, 49.0, 66.0, 86.0, 160.0, 175.0, 274.0, 420.0, 599.0, 855.0, 1381.0, 1958.0, 2964.0, 4537.0, 6884.0, 10491.0, 16619.0, 26619.0, 42629.0, 70017.0, 114301.0, 170342.0, 193117.0, 143829.0, 90858.0, 55500.0, 34051.0, 20778.0, 13464.0, 8534.0, 5580.0, 3717.0, 2494.0, 1644.0, 1079.0, 687.0, 526.0, 397.0, 209.0, 170.0, 130.0, 97.0, 74.0, 29.0, 18.0, 15.0, 30.0, 12.0, 13.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.453369140625, -0.4397392272949219, -0.42610931396484375, -0.4124794006347656, -0.3988494873046875, -0.3852195739746094, -0.37158966064453125, -0.3579597473144531, -0.344329833984375, -0.3306999206542969, -0.31707000732421875, -0.3034400939941406, -0.2898101806640625, -0.2761802673339844, -0.26255035400390625, -0.24892044067382812, -0.23529052734375, -0.22166061401367188, -0.20803070068359375, -0.19440078735351562, -0.1807708740234375, -0.16714096069335938, -0.15351104736328125, -0.13988113403320312, -0.126251220703125, -0.11262130737304688, -0.09899139404296875, -0.08536148071289062, -0.0717315673828125, -0.058101654052734375, -0.04447174072265625, -0.030841827392578125, -0.0172119140625, -0.003582000732421875, 0.01004791259765625, 0.023677825927734375, 0.0373077392578125, 0.050937652587890625, 0.06456756591796875, 0.07819747924804688, 0.091827392578125, 0.10545730590820312, 0.11908721923828125, 0.13271713256835938, 0.1463470458984375, 0.15997695922851562, 0.17360687255859375, 0.18723678588867188, 0.20086669921875, 0.21449661254882812, 0.22812652587890625, 0.24175643920898438, 0.2553863525390625, 0.2690162658691406, 0.28264617919921875, 0.2962760925292969, 0.309906005859375, 0.3235359191894531, 0.33716583251953125, 0.3507957458496094, 0.3644256591796875, 0.3780555725097656, 0.39168548583984375, 0.4053153991699219, 0.4189453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 14.0, 12.0, 16.0, 11.0, 11.0, 24.0, 23.0, 16.0, 25.0, 32.0, 32.0, 25.0, 25.0, 38.0, 40.0, 52.0, 35.0, 1069.0, 34.0, 37.0, 33.0, 34.0, 34.0, 42.0, 34.0, 27.0, 43.0, 30.0, 21.0, 23.0, 10.0, 12.0, 8.0, 11.0, 18.0, 4.0, 4.0, 10.0, 8.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-2.74609375, -2.667266845703125, -2.58843994140625, -2.509613037109375, -2.4307861328125, -2.351959228515625, -2.27313232421875, -2.194305419921875, -2.115478515625, -2.036651611328125, -1.95782470703125, -1.878997802734375, -1.8001708984375, -1.721343994140625, -1.64251708984375, -1.563690185546875, -1.48486328125, -1.406036376953125, -1.32720947265625, -1.248382568359375, -1.1695556640625, -1.090728759765625, -1.01190185546875, -0.933074951171875, -0.854248046875, -0.775421142578125, -0.69659423828125, -0.617767333984375, -0.5389404296875, -0.460113525390625, -0.38128662109375, -0.302459716796875, -0.2236328125, -0.144805908203125, -0.06597900390625, 0.012847900390625, 0.0916748046875, 0.170501708984375, 0.24932861328125, 0.328155517578125, 0.406982421875, 0.485809326171875, 0.56463623046875, 0.643463134765625, 0.7222900390625, 0.801116943359375, 0.87994384765625, 0.958770751953125, 1.03759765625, 1.116424560546875, 1.19525146484375, 1.274078369140625, 1.3529052734375, 1.431732177734375, 1.51055908203125, 1.589385986328125, 1.668212890625, 1.747039794921875, 1.82586669921875, 1.904693603515625, 1.9835205078125, 2.062347412109375, 2.14117431640625, 2.220001220703125, 2.298828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 5.0, 18.0, 30.0, 25.0, 50.0, 90.0, 137.0, 195.0, 330.0, 588.0, 820.0, 1293.0, 2125.0, 3356.0, 4986.0, 8003.0, 12510.0, 19494.0, 30383.0, 46139.0, 70379.0, 102728.0, 138598.0, 1205070.0, 140136.0, 104518.0, 72107.0, 46951.0, 30606.0, 19909.0, 12559.0, 8246.0, 5247.0, 3467.0, 2195.0, 1386.0, 918.0, 541.0, 365.0, 211.0, 146.0, 103.0, 45.0, 35.0, 34.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.332275390625, -0.3226509094238281, -0.31302642822265625, -0.3034019470214844, -0.2937774658203125, -0.2841529846191406, -0.27452850341796875, -0.2649040222167969, -0.255279541015625, -0.24565505981445312, -0.23603057861328125, -0.22640609741210938, -0.2167816162109375, -0.20715713500976562, -0.19753265380859375, -0.18790817260742188, -0.17828369140625, -0.16865921020507812, -0.15903472900390625, -0.14941024780273438, -0.1397857666015625, -0.13016128540039062, -0.12053680419921875, -0.11091232299804688, -0.101287841796875, -0.09166336059570312, -0.08203887939453125, -0.07241439819335938, -0.0627899169921875, -0.053165435791015625, -0.04354095458984375, -0.033916473388671875, -0.0242919921875, -0.014667510986328125, -0.00504302978515625, 0.004581451416015625, 0.0142059326171875, 0.023830413818359375, 0.03345489501953125, 0.043079376220703125, 0.052703857421875, 0.062328338623046875, 0.07195281982421875, 0.08157730102539062, 0.0912017822265625, 0.10082626342773438, 0.11045074462890625, 0.12007522583007812, 0.12969970703125, 0.13932418823242188, 0.14894866943359375, 0.15857315063476562, 0.1681976318359375, 0.17782211303710938, 0.18744659423828125, 0.19707107543945312, 0.206695556640625, 0.21632003784179688, 0.22594451904296875, 0.23556900024414062, 0.2451934814453125, 0.2548179626464844, 0.26444244384765625, 0.2740669250488281, 0.28369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 12.0, 12.0, 19.0, 18.0, 37.0, 41.0, 51.0, 55.0, 81.0, 99.0, 94.0, 81.0, 83.0, 71.0, 52.0, 48.0, 38.0, 18.0, 11.0, 15.0, 13.0, 6.0, 7.0, 4.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00237274169921875, -0.0022725462913513184, -0.0021723508834838867, -0.002072155475616455, -0.0019719600677490234, -0.0018717646598815918, -0.0017715692520141602, -0.0016713738441467285, -0.0015711784362792969, -0.0014709830284118652, -0.0013707876205444336, -0.001270592212677002, -0.0011703968048095703, -0.0010702013969421387, -0.000970005989074707, -0.0008698105812072754, -0.0007696151733398438, -0.0006694197654724121, -0.0005692243576049805, -0.00046902894973754883, -0.0003688335418701172, -0.00026863813400268555, -0.0001684427261352539, -6.824731826782227e-05, 3.1948089599609375e-05, 0.00013214349746704102, 0.00023233890533447266, 0.0003325343132019043, 0.00043272972106933594, 0.0005329251289367676, 0.0006331205368041992, 0.0007333159446716309, 0.0008335113525390625, 0.0009337067604064941, 0.0010339021682739258, 0.0011340975761413574, 0.001234292984008789, 0.0013344883918762207, 0.0014346837997436523, 0.001534879207611084, 0.0016350746154785156, 0.0017352700233459473, 0.001835465431213379, 0.0019356608390808105, 0.002035856246948242, 0.002136051654815674, 0.0022362470626831055, 0.002336442470550537, 0.0024366378784179688, 0.0025368332862854004, 0.002637028694152832, 0.0027372241020202637, 0.0028374195098876953, 0.002937614917755127, 0.0030378103256225586, 0.0031380057334899902, 0.003238201141357422, 0.0033383965492248535, 0.003438591957092285, 0.003538787364959717, 0.0036389827728271484, 0.00373917818069458, 0.0038393735885620117, 0.003939568996429443, 0.004039764404296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 6.0, 14.0, 35.0, 41.0, 34.0, 72.0, 101.0, 141.0, 260.0, 411.0, 1099.0, 904138.0, 140365.0, 791.0, 351.0, 246.0, 132.0, 88.0, 43.0, 45.0, 44.0, 20.0, 11.0, 11.0, 10.0, 7.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.08294677734375, -0.08091878890991211, -0.07889080047607422, -0.07686281204223633, -0.07483482360839844, -0.07280683517456055, -0.07077884674072266, -0.06875085830688477, -0.06672286987304688, -0.06469488143920898, -0.0626668930053711, -0.0606389045715332, -0.05861091613769531, -0.05658292770385742, -0.05455493927001953, -0.05252695083618164, -0.05049896240234375, -0.04847097396850586, -0.04644298553466797, -0.04441499710083008, -0.04238700866699219, -0.0403590202331543, -0.038331031799316406, -0.036303043365478516, -0.034275054931640625, -0.032247066497802734, -0.030219078063964844, -0.028191089630126953, -0.026163101196289062, -0.024135112762451172, -0.02210712432861328, -0.02007913589477539, -0.0180511474609375, -0.01602315902709961, -0.013995170593261719, -0.011967182159423828, -0.009939193725585938, -0.007911205291748047, -0.005883216857910156, -0.0038552284240722656, -0.001827239990234375, 0.00020074844360351562, 0.0022287368774414062, 0.004256725311279297, 0.0062847137451171875, 0.008312702178955078, 0.010340690612792969, 0.01236867904663086, 0.01439666748046875, 0.01642465591430664, 0.01845264434814453, 0.020480632781982422, 0.022508621215820312, 0.024536609649658203, 0.026564598083496094, 0.028592586517333984, 0.030620574951171875, 0.032648563385009766, 0.034676551818847656, 0.03670454025268555, 0.03873252868652344, 0.04076051712036133, 0.04278850555419922, 0.04481649398803711, 0.046844482421875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1008.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051476843655109406, -0.05020083114504814, -0.04892481863498688, -0.04764880612492561, -0.04637279361486435, -0.04509677737951279, -0.04382076486945152, -0.04254475235939026, -0.041268739849328995, -0.03999272733926773, -0.03871671482920647, -0.0374407023191452, -0.03616468608379364, -0.034888673573732376, -0.03361266106367111, -0.03233664855360985, -0.031060636043548584, -0.02978462353348732, -0.028508611023426056, -0.027232596650719643, -0.02595658414065838, -0.024680571630597115, -0.0234045572578907, -0.022128544747829437, -0.020852532237768173, -0.01957651972770691, -0.018300507217645645, -0.017024492844939232, -0.015748480334877968, -0.014472467824816704, -0.013196454383432865, -0.011920440942049026, -0.010644424706697464, -0.0093684121966362, -0.008092398755252361, -0.00681638577952981, -0.005540372803807259, -0.004264359828084707, -0.002988346852362156, -0.0017123334109783173, -0.0004363209009170532, 0.0008396920748054981, 0.0021157050505280495, 0.003391718026250601, 0.004667731001973152, 0.0059437439776957035, 0.007219756953418255, 0.008495770394802094, 0.009771782904863358, 0.011047795414924622, 0.01232380885630846, 0.013599822297692299, 0.014875834807753563, 0.016151847317814827, 0.01742786169052124, 0.018703874200582504, 0.01997988671064377, 0.021255899220705032, 0.022531911730766296, 0.02380792610347271, 0.025083938613533974, 0.026359951123595238, 0.02763596549630165, 0.028911978006362915, 0.03018799051642418]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 8.0, 12.0, 15.0, 20.0, 19.0, 32.0, 25.0, 44.0, 45.0, 57.0, 55.0, 51.0, 64.0, 71.0, 76.0, 81.0, 66.0, 52.0, 45.0, 36.0, 24.0, 30.0, 17.0, 29.0, 15.0, 7.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015898346900939941, -0.0015199529007077217, -0.0014500711113214493, -0.0013801893219351768, -0.0013103075325489044, -0.001240425743162632, -0.0011705439537763596, -0.0011006621643900871, -0.0010307803750038147, -0.0009608985856175423, -0.0008910167962312698, -0.0008211350068449974, -0.000751253217458725, -0.0006813714280724525, -0.0006114896386861801, -0.0005416078492999077, -0.00047172605991363525, -0.0004018442705273628, -0.0003319624811410904, -0.00026208069175481796, -0.00019219890236854553, -0.0001223171129822731, -5.243532359600067e-05, 1.744646579027176e-05, 8.732825517654419e-05, 0.00015721004456281662, 0.00022709183394908905, 0.0002969736233353615, 0.0003668554127216339, 0.00043673720210790634, 0.0005066189914941788, 0.0005765007808804512, 0.0006463825702667236, 0.0007162643596529961, 0.0007861461490392685, 0.0008560279384255409, 0.0009259097278118134, 0.0009957915171980858, 0.0010656733065843582, 0.0011355550959706306, 0.001205436885356903, 0.0012753186747431755, 0.001345200464129448, 0.0014150822535157204, 0.0014849640429019928, 0.0015548458322882652, 0.0016247276216745377, 0.00169460941106081, 0.0017644912004470825, 0.001834372989833355, 0.0019042547792196274, 0.0019741365686059, 0.0020440183579921722, 0.0021139001473784447, 0.002183781936764717, 0.0022536637261509895, 0.002323545515537262, 0.0023934273049235344, 0.002463309094309807, 0.0025331908836960793, 0.0026030726730823517, 0.002672954462468624, 0.0027428362518548965, 0.002812718041241169, 0.0028825998306274414]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 21.0, 37.0, 43.0, 63.0, 109.0, 177.0, 330.0, 525.0, 966.0, 1787.0, 3128.0, 5823.0, 12117.0, 28929.0, 91019.0, 440442.0, 341067.0, 74438.0, 25067.0, 10568.0, 5298.0, 2769.0, 1603.0, 942.0, 530.0, 313.0, 179.0, 99.0, 57.0, 37.0, 20.0, 14.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-4.94140625, -4.817626953125, -4.69384765625, -4.570068359375, -4.4462890625, -4.322509765625, -4.19873046875, -4.074951171875, -3.951171875, -3.827392578125, -3.70361328125, -3.579833984375, -3.4560546875, -3.332275390625, -3.20849609375, -3.084716796875, -2.9609375, -2.837158203125, -2.71337890625, -2.589599609375, -2.4658203125, -2.342041015625, -2.21826171875, -2.094482421875, -1.970703125, -1.846923828125, -1.72314453125, -1.599365234375, -1.4755859375, -1.351806640625, -1.22802734375, -1.104248046875, -0.98046875, -0.856689453125, -0.73291015625, -0.609130859375, -0.4853515625, -0.361572265625, -0.23779296875, -0.114013671875, 0.009765625, 0.133544921875, 0.25732421875, 0.381103515625, 0.5048828125, 0.628662109375, 0.75244140625, 0.876220703125, 1.0, 1.123779296875, 1.24755859375, 1.371337890625, 1.4951171875, 1.618896484375, 1.74267578125, 1.866455078125, 1.990234375, 2.114013671875, 2.23779296875, 2.361572265625, 2.4853515625, 2.609130859375, 2.73291015625, 2.856689453125, 2.98046875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 7.0, 14.0, 13.0, 14.0, 16.0, 24.0, 25.0, 28.0, 43.0, 43.0, 44.0, 52.0, 61.0, 71.0, 306.0, 1725.0, 105.0, 57.0, 46.0, 48.0, 43.0, 39.0, 26.0, 29.0, 33.0, 30.0, 20.0, 20.0, 10.0, 15.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.58740234375, -16.0185546875, -15.44970703125, -14.880859375, -14.31201171875, -13.7431640625, -13.17431640625, -12.60546875, -12.03662109375, -11.4677734375, -10.89892578125, -10.330078125, -9.76123046875, -9.1923828125, -8.62353515625, -8.0546875, -7.48583984375, -6.9169921875, -6.34814453125, -5.779296875, -5.21044921875, -4.6416015625, -4.07275390625, -3.50390625, -2.93505859375, -2.3662109375, -1.79736328125, -1.228515625, -0.65966796875, -0.0908203125, 0.47802734375, 1.046875, 1.61572265625, 2.1845703125, 2.75341796875, 3.322265625, 3.89111328125, 4.4599609375, 5.02880859375, 5.59765625, 6.16650390625, 6.7353515625, 7.30419921875, 7.873046875, 8.44189453125, 9.0107421875, 9.57958984375, 10.1484375, 10.71728515625, 11.2861328125, 11.85498046875, 12.423828125, 12.99267578125, 13.5615234375, 14.13037109375, 14.69921875, 15.26806640625, 15.8369140625, 16.40576171875, 16.974609375, 17.54345703125, 18.1123046875, 18.68115234375, 19.25]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 11.0, 14.0, 22.0, 29.0, 29.0, 38.0, 40.0, 48.0, 72.0, 118.0, 176.0, 372.0, 1234.0, 11390.0, 2969667.0, 157545.0, 3473.0, 667.0, 269.0, 133.0, 73.0, 65.0, 40.0, 39.0, 29.0, 15.0, 14.0, 11.0, 16.0, 13.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.20458984375, -30.2529296875, -29.30126953125, -28.349609375, -27.39794921875, -26.4462890625, -25.49462890625, -24.54296875, -23.59130859375, -22.6396484375, -21.68798828125, -20.736328125, -19.78466796875, -18.8330078125, -17.88134765625, -16.9296875, -15.97802734375, -15.0263671875, -14.07470703125, -13.123046875, -12.17138671875, -11.2197265625, -10.26806640625, -9.31640625, -8.36474609375, -7.4130859375, -6.46142578125, -5.509765625, -4.55810546875, -3.6064453125, -2.65478515625, -1.703125, -0.75146484375, 0.2001953125, 1.15185546875, 2.103515625, 3.05517578125, 4.0068359375, 4.95849609375, 5.91015625, 6.86181640625, 7.8134765625, 8.76513671875, 9.716796875, 10.66845703125, 11.6201171875, 12.57177734375, 13.5234375, 14.47509765625, 15.4267578125, 16.37841796875, 17.330078125, 18.28173828125, 19.2333984375, 20.18505859375, 21.13671875, 22.08837890625, 23.0400390625, 23.99169921875, 24.943359375, 25.89501953125, 26.8466796875, 27.79833984375, 28.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [18.0, 218.0, 684.0, 92.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.627401351928711, -4.445851802825928, -1.2643022537231445, 1.9172477722167969, 5.098796844482422, 8.280345916748047, 11.461896896362305, 14.64344596862793, 17.824995040893555, 21.00654411315918, 24.188095092773438, 27.369644165039062, 30.551193237304688, 33.73274230957031, 36.91429138183594, 40.09584045410156, 43.27738952636719, 46.45893859863281, 49.64048767089844, 52.82203674316406, 56.00358581542969, 59.18513488769531, 62.3666877746582, 65.54823303222656, 68.72978973388672, 71.91133880615234, 75.09288787841797, 78.2744369506836, 81.45598602294922, 84.63753509521484, 87.819091796875, 91.00064086914062, 94.18218994140625, 97.36373901367188, 100.5452880859375, 103.72683715820312, 106.90838623046875, 110.08993530273438, 113.271484375, 116.45303344726562, 119.63458251953125, 122.81613159179688, 125.9976806640625, 129.17922973632812, 132.36077880859375, 135.54232788085938, 138.723876953125, 141.90542602539062, 145.08697509765625, 148.26852416992188, 151.4500732421875, 154.63162231445312, 157.81317138671875, 160.99472045898438, 164.17626953125, 167.35781860351562, 170.5393829345703, 173.72093200683594, 176.90248107910156, 180.0840301513672, 183.2655792236328, 186.44712829589844, 189.62867736816406, 192.8102264404297, 195.9917755126953]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 10.0, 5.0, 12.0, 9.0, 12.0, 20.0, 18.0, 22.0, 23.0, 18.0, 18.0, 20.0, 27.0, 27.0, 36.0, 34.0, 39.0, 38.0, 46.0, 31.0, 35.0, 45.0, 39.0, 46.0, 38.0, 36.0, 33.0, 26.0, 40.0, 24.0, 21.0, 19.0, 22.0, 17.0, 13.0, 20.0, 20.0, 13.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.74734115600586, -49.18922424316406, -47.631107330322266, -46.07299041748047, -44.51487350463867, -42.956756591796875, -41.39863967895508, -39.84052276611328, -38.282405853271484, -36.72428894042969, -35.16617202758789, -33.608055114746094, -32.0499382019043, -30.4918212890625, -28.933704376220703, -27.375587463378906, -25.817468643188477, -24.25935173034668, -22.701234817504883, -21.143117904663086, -19.58500099182129, -18.026884078979492, -16.468765258789062, -14.910649299621582, -13.352532386779785, -11.794415473937988, -10.236298561096191, -8.678180694580078, -7.1200642585754395, -5.561947345733643, -4.0038299560546875, -2.4457130432128906, -0.8875961303710938, 0.6705209016799927, 2.228637933731079, 3.786755084991455, 5.344871997833252, 6.902988910675049, 8.461106300354004, 10.0192232131958, 11.577340126037598, 13.135457038879395, 14.693573951721191, 16.251691818237305, 17.8098087310791, 19.3679256439209, 20.926042556762695, 22.484159469604492, 24.04227638244629, 25.600393295288086, 27.158510208129883, 28.71662712097168, 30.274744033813477, 31.832860946655273, 33.3909797668457, 34.9490966796875, 36.5072135925293, 38.065330505371094, 39.62344741821289, 41.18156433105469, 42.739681243896484, 44.29779815673828, 45.85591506958008, 47.414031982421875, 48.97214889526367]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 4.0, 11.0, 14.0, 17.0, 17.0, 23.0, 28.0, 22.0, 27.0, 35.0, 39.0, 40.0, 30.0, 52.0, 42.0, 49.0, 48.0, 44.0, 38.0, 52.0, 35.0, 47.0, 30.0, 33.0, 24.0, 40.0, 26.0, 24.0, 12.0, 10.0, 15.0, 14.0, 7.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.17340087890625, -4.0264892578125, -3.87957763671875, -3.732666015625, -3.58575439453125, -3.4388427734375, -3.29193115234375, -3.14501953125, -2.99810791015625, -2.8511962890625, -2.70428466796875, -2.557373046875, -2.41046142578125, -2.2635498046875, -2.11663818359375, -1.9697265625, -1.82281494140625, -1.6759033203125, -1.52899169921875, -1.382080078125, -1.23516845703125, -1.0882568359375, -0.94134521484375, -0.79443359375, -0.64752197265625, -0.5006103515625, -0.35369873046875, -0.206787109375, -0.05987548828125, 0.0870361328125, 0.23394775390625, 0.380859375, 0.52777099609375, 0.6746826171875, 0.82159423828125, 0.968505859375, 1.11541748046875, 1.2623291015625, 1.40924072265625, 1.55615234375, 1.70306396484375, 1.8499755859375, 1.99688720703125, 2.143798828125, 2.29071044921875, 2.4376220703125, 2.58453369140625, 2.7314453125, 2.87835693359375, 3.0252685546875, 3.17218017578125, 3.319091796875, 3.46600341796875, 3.6129150390625, 3.75982666015625, 3.90673828125, 4.05364990234375, 4.2005615234375, 4.34747314453125, 4.494384765625, 4.64129638671875, 4.7882080078125, 4.93511962890625, 5.08203125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 7.0, 10.0, 15.0, 8.0, 26.0, 19.0, 28.0, 28.0, 43.0, 42.0, 55.0, 91.0, 212.0, 1000.0, 8653.0, 242223.0, 3808525.0, 126582.0, 5577.0, 649.0, 141.0, 75.0, 43.0, 40.0, 31.0, 24.0, 25.0, 24.0, 17.0, 17.0, 6.0, 10.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.80322265625, -22.9658203125, -22.12841796875, -21.291015625, -20.45361328125, -19.6162109375, -18.77880859375, -17.94140625, -17.10400390625, -16.2666015625, -15.42919921875, -14.591796875, -13.75439453125, -12.9169921875, -12.07958984375, -11.2421875, -10.40478515625, -9.5673828125, -8.72998046875, -7.892578125, -7.05517578125, -6.2177734375, -5.38037109375, -4.54296875, -3.70556640625, -2.8681640625, -2.03076171875, -1.193359375, -0.35595703125, 0.4814453125, 1.31884765625, 2.15625, 2.99365234375, 3.8310546875, 4.66845703125, 5.505859375, 6.34326171875, 7.1806640625, 8.01806640625, 8.85546875, 9.69287109375, 10.5302734375, 11.36767578125, 12.205078125, 13.04248046875, 13.8798828125, 14.71728515625, 15.5546875, 16.39208984375, 17.2294921875, 18.06689453125, 18.904296875, 19.74169921875, 20.5791015625, 21.41650390625, 22.25390625, 23.09130859375, 23.9287109375, 24.76611328125, 25.603515625, 26.44091796875, 27.2783203125, 28.11572265625, 28.953125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 8.0, 22.0, 45.0, 66.0, 83.0, 116.0, 202.0, 207.0, 329.0, 476.0, 573.0, 552.0, 447.0, 304.0, 210.0, 144.0, 86.0, 57.0, 40.0, 23.0, 15.0, 14.0, 10.0, 5.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.802001953125, -20.29150390625, -19.781005859375, -19.2705078125, -18.760009765625, -18.24951171875, -17.739013671875, -17.228515625, -16.718017578125, -16.20751953125, -15.697021484375, -15.1865234375, -14.676025390625, -14.16552734375, -13.655029296875, -13.14453125, -12.634033203125, -12.12353515625, -11.613037109375, -11.1025390625, -10.592041015625, -10.08154296875, -9.571044921875, -9.060546875, -8.550048828125, -8.03955078125, -7.529052734375, -7.0185546875, -6.508056640625, -5.99755859375, -5.487060546875, -4.9765625, -4.466064453125, -3.95556640625, -3.445068359375, -2.9345703125, -2.424072265625, -1.91357421875, -1.403076171875, -0.892578125, -0.382080078125, 0.12841796875, 0.638916015625, 1.1494140625, 1.659912109375, 2.17041015625, 2.680908203125, 3.19140625, 3.701904296875, 4.21240234375, 4.722900390625, 5.2333984375, 5.743896484375, 6.25439453125, 6.764892578125, 7.275390625, 7.785888671875, 8.29638671875, 8.806884765625, 9.3173828125, 9.827880859375, 10.33837890625, 10.848876953125, 11.359375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 7.0, 0.0, 16.0, 9.0, 27.0, 39.0, 70.0, 88.0, 183.0, 359.0, 1026.0, 10520.0, 1109813.0, 3051089.0, 18770.0, 1358.0, 392.0, 197.0, 133.0, 68.0, 44.0, 37.0, 16.0, 14.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.296875, -23.501220703125, -21.70556640625, -19.909912109375, -18.1142578125, -16.318603515625, -14.52294921875, -12.727294921875, -10.931640625, -9.135986328125, -7.34033203125, -5.544677734375, -3.7490234375, -1.953369140625, -0.15771484375, 1.637939453125, 3.43359375, 5.229248046875, 7.02490234375, 8.820556640625, 10.6162109375, 12.411865234375, 14.20751953125, 16.003173828125, 17.798828125, 19.594482421875, 21.39013671875, 23.185791015625, 24.9814453125, 26.777099609375, 28.57275390625, 30.368408203125, 32.1640625, 33.959716796875, 35.75537109375, 37.551025390625, 39.3466796875, 41.142333984375, 42.93798828125, 44.733642578125, 46.529296875, 48.324951171875, 50.12060546875, 51.916259765625, 53.7119140625, 55.507568359375, 57.30322265625, 59.098876953125, 60.89453125, 62.690185546875, 64.48583984375, 66.281494140625, 68.0771484375, 69.872802734375, 71.66845703125, 73.464111328125, 75.259765625, 77.055419921875, 78.85107421875, 80.646728515625, 82.4423828125, 84.238037109375, 86.03369140625, 87.829345703125, 89.625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 15.0, 48.0, 80.0, 145.0, 229.0, 213.0, 149.0, 61.0, 36.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.05523681640625, -156.84902954101562, -153.642822265625, -150.4365997314453, -147.2303924560547, -144.02418518066406, -140.81796264648438, -137.61175537109375, -134.40554809570312, -131.1993408203125, -127.99312591552734, -124.78691101074219, -121.58070373535156, -118.37449645996094, -115.16828155517578, -111.96206665039062, -108.755859375, -105.54965209960938, -102.34343719482422, -99.13722229003906, -95.93101501464844, -92.72480773925781, -89.51859283447266, -86.3123779296875, -83.10617065429688, -79.89996337890625, -76.6937484741211, -73.48753356933594, -70.28132629394531, -67.07511901855469, -63.86890411376953, -60.66269302368164, -57.45648956298828, -54.25027847290039, -51.0440673828125, -47.83785629272461, -44.63164520263672, -41.42543411254883, -38.21922302246094, -35.01301193237305, -31.806800842285156, -28.600589752197266, -25.394378662109375, -22.188167572021484, -18.981956481933594, -15.775745391845703, -12.569534301757812, -9.363323211669922, -6.157112121582031, -2.9509010314941406, 0.25531005859375, 3.4615211486816406, 6.667732238769531, 9.873943328857422, 13.080154418945312, 16.286365509033203, 19.492576599121094, 22.698787689208984, 25.904998779296875, 29.111209869384766, 32.317420959472656, 35.52363204956055, 38.72984313964844, 41.93605422973633, 45.14226531982422]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 14.0, 18.0, 18.0, 32.0, 26.0, 16.0, 44.0, 25.0, 35.0, 34.0, 32.0, 34.0, 38.0, 44.0, 44.0, 37.0, 29.0, 38.0, 42.0, 39.0, 34.0, 19.0, 35.0, 29.0, 33.0, 20.0, 28.0, 20.0, 23.0, 6.0, 12.0, 10.0, 12.0, 15.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.816436767578125, -41.521385192871094, -40.22633743286133, -38.9312858581543, -37.63623809814453, -36.3411865234375, -35.04613494873047, -33.75108337402344, -32.45603561401367, -31.160985946655273, -29.865936279296875, -28.570884704589844, -27.275835037231445, -25.980785369873047, -24.685733795166016, -23.390684127807617, -22.09563446044922, -20.80058479309082, -19.505535125732422, -18.21048355102539, -16.915433883666992, -15.620384216308594, -14.325333595275879, -13.030282974243164, -11.735233306884766, -10.440183639526367, -9.145133018493652, -7.850082874298096, -6.555032730102539, -5.259982585906982, -3.964932441711426, -2.669881820678711, -1.3748321533203125, -0.07978200912475586, 1.2152681350708008, 2.5103182792663574, 3.805368423461914, 5.100418567657471, 6.395468711853027, 7.690519332885742, 8.98556900024414, 10.280618667602539, 11.575669288635254, 12.870719909667969, 14.165769577026367, 15.460819244384766, 16.755870819091797, 18.050920486450195, 19.345970153808594, 20.641019821166992, 21.93606948852539, 23.231121063232422, 24.52617073059082, 25.82122039794922, 27.11627197265625, 28.41132164001465, 29.706371307373047, 31.001420974731445, 32.296470642089844, 33.591522216796875, 34.886573791503906, 36.18162155151367, 37.4766731262207, 38.77172088623047, 40.0667724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 4.0, 21.0, 29.0, 53.0, 53.0, 72.0, 130.0, 175.0, 252.0, 346.0, 519.0, 815.0, 1139.0, 1628.0, 2554.0, 3779.0, 5670.0, 8623.0, 13245.0, 20505.0, 32040.0, 50265.0, 80100.0, 123032.0, 169697.0, 172929.0, 127988.0, 84170.0, 52745.0, 33635.0, 21554.0, 13888.0, 8875.0, 5919.0, 3922.0, 2610.0, 1747.0, 1201.0, 825.0, 558.0, 375.0, 286.0, 170.0, 138.0, 88.0, 63.0, 40.0, 24.0, 16.0, 12.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.419677734375, -0.4061622619628906, -0.39264678955078125, -0.3791313171386719, -0.3656158447265625, -0.3521003723144531, -0.33858489990234375, -0.3250694274902344, -0.311553955078125, -0.2980384826660156, -0.28452301025390625, -0.2710075378417969, -0.2574920654296875, -0.24397659301757812, -0.23046112060546875, -0.21694564819335938, -0.20343017578125, -0.18991470336914062, -0.17639923095703125, -0.16288375854492188, -0.1493682861328125, -0.13585281372070312, -0.12233734130859375, -0.10882186889648438, -0.095306396484375, -0.08179092407226562, -0.06827545166015625, -0.054759979248046875, -0.0412445068359375, -0.027729034423828125, -0.01421356201171875, -0.000698089599609375, 0.0128173828125, 0.026332855224609375, 0.03984832763671875, 0.053363800048828125, 0.0668792724609375, 0.08039474487304688, 0.09391021728515625, 0.10742568969726562, 0.120941162109375, 0.13445663452148438, 0.14797210693359375, 0.16148757934570312, 0.1750030517578125, 0.18851852416992188, 0.20203399658203125, 0.21554946899414062, 0.22906494140625, 0.24258041381835938, 0.25609588623046875, 0.2696113586425781, 0.2831268310546875, 0.2966423034667969, 0.31015777587890625, 0.3236732482910156, 0.337188720703125, 0.3507041931152344, 0.36421966552734375, 0.3777351379394531, 0.3912506103515625, 0.4047660827636719, 0.41828155517578125, 0.4317970275878906, 0.4453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 13.0, 15.0, 13.0, 22.0, 18.0, 21.0, 26.0, 32.0, 33.0, 33.0, 38.0, 29.0, 35.0, 47.0, 38.0, 47.0, 1063.0, 39.0, 45.0, 38.0, 33.0, 37.0, 44.0, 39.0, 31.0, 25.0, 20.0, 23.0, 19.0, 17.0, 10.0, 16.0, 8.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.59228515625, -2.5009765625, -2.40966796875, -2.318359375, -2.22705078125, -2.1357421875, -2.04443359375, -1.953125, -1.86181640625, -1.7705078125, -1.67919921875, -1.587890625, -1.49658203125, -1.4052734375, -1.31396484375, -1.22265625, -1.13134765625, -1.0400390625, -0.94873046875, -0.857421875, -0.76611328125, -0.6748046875, -0.58349609375, -0.4921875, -0.40087890625, -0.3095703125, -0.21826171875, -0.126953125, -0.03564453125, 0.0556640625, 0.14697265625, 0.23828125, 0.32958984375, 0.4208984375, 0.51220703125, 0.603515625, 0.69482421875, 0.7861328125, 0.87744140625, 0.96875, 1.06005859375, 1.1513671875, 1.24267578125, 1.333984375, 1.42529296875, 1.5166015625, 1.60791015625, 1.69921875, 1.79052734375, 1.8818359375, 1.97314453125, 2.064453125, 2.15576171875, 2.2470703125, 2.33837890625, 2.4296875, 2.52099609375, 2.6123046875, 2.70361328125, 2.794921875, 2.88623046875, 2.9775390625, 3.06884765625, 3.16015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 10.0, 11.0, 16.0, 32.0, 60.0, 93.0, 149.0, 220.0, 444.0, 741.0, 1259.0, 2210.0, 3875.0, 6876.0, 11823.0, 20662.0, 35539.0, 60717.0, 100157.0, 152237.0, 1236607.0, 170079.0, 118305.0, 72792.0, 42961.0, 25182.0, 14531.0, 8331.0, 4729.0, 2736.0, 1624.0, 896.0, 495.0, 324.0, 160.0, 113.0, 58.0, 30.0, 18.0, 13.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.430908203125, -0.41883087158203125, -0.4067535400390625, -0.39467620849609375, -0.382598876953125, -0.37052154541015625, -0.3584442138671875, -0.34636688232421875, -0.33428955078125, -0.32221221923828125, -0.3101348876953125, -0.29805755615234375, -0.285980224609375, -0.27390289306640625, -0.2618255615234375, -0.24974822998046875, -0.2376708984375, -0.22559356689453125, -0.2135162353515625, -0.20143890380859375, -0.189361572265625, -0.17728424072265625, -0.1652069091796875, -0.15312957763671875, -0.14105224609375, -0.12897491455078125, -0.1168975830078125, -0.10482025146484375, -0.092742919921875, -0.08066558837890625, -0.0685882568359375, -0.05651092529296875, -0.04443359375, -0.03235626220703125, -0.0202789306640625, -0.00820159912109375, 0.003875732421875, 0.01595306396484375, 0.0280303955078125, 0.04010772705078125, 0.05218505859375, 0.06426239013671875, 0.0763397216796875, 0.08841705322265625, 0.100494384765625, 0.11257171630859375, 0.1246490478515625, 0.13672637939453125, 0.1488037109375, 0.16088104248046875, 0.1729583740234375, 0.18503570556640625, 0.197113037109375, 0.20919036865234375, 0.2212677001953125, 0.23334503173828125, 0.24542236328125, 0.25749969482421875, 0.2695770263671875, 0.28165435791015625, 0.293731689453125, 0.30580902099609375, 0.3178863525390625, 0.32996368408203125, 0.342041015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 5.0, 10.0, 14.0, 17.0, 10.0, 18.0, 16.0, 14.0, 23.0, 41.0, 48.0, 51.0, 56.0, 58.0, 69.0, 67.0, 66.0, 72.0, 67.0, 43.0, 46.0, 41.0, 35.0, 20.0, 22.0, 15.0, 8.0, 14.0, 6.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411285400390625, -0.0035358965396881104, -0.003430664539337158, -0.003325432538986206, -0.003220200538635254, -0.0031149685382843018, -0.0030097365379333496, -0.0029045045375823975, -0.0027992725372314453, -0.002694040536880493, -0.002588808536529541, -0.002483576536178589, -0.0023783445358276367, -0.0022731125354766846, -0.0021678805351257324, -0.0020626485347747803, -0.001957416534423828, -0.001852184534072876, -0.0017469525337219238, -0.0016417205333709717, -0.0015364885330200195, -0.0014312565326690674, -0.0013260245323181152, -0.001220792531967163, -0.001115560531616211, -0.0010103285312652588, -0.0009050965309143066, -0.0007998645305633545, -0.0006946325302124023, -0.0005894005298614502, -0.00048416852951049805, -0.0003789365291595459, -0.00027370452880859375, -0.0001684725284576416, -6.324052810668945e-05, 4.1991472244262695e-05, 0.00014722347259521484, 0.000252455472946167, 0.00035768747329711914, 0.0004629194736480713, 0.0005681514739990234, 0.0006733834743499756, 0.0007786154747009277, 0.0008838474750518799, 0.000989079475402832, 0.0010943114757537842, 0.0011995434761047363, 0.0013047754764556885, 0.0014100074768066406, 0.0015152394771575928, 0.001620471477508545, 0.001725703477859497, 0.0018309354782104492, 0.0019361674785614014, 0.0020413994789123535, 0.0021466314792633057, 0.002251863479614258, 0.00235709547996521, 0.002462327480316162, 0.0025675594806671143, 0.0026727914810180664, 0.0027780234813690186, 0.0028832554817199707, 0.002988487482070923, 0.003093719482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 18.0, 30.0, 39.0, 44.0, 57.0, 71.0, 81.0, 84.0, 143.0, 204.0, 391.0, 770.0, 17784.0, 1021439.0, 5634.0, 619.0, 292.0, 227.0, 152.0, 103.0, 81.0, 55.0, 49.0, 36.0, 21.0, 25.0, 9.0, 14.0, 10.0, 4.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058502197265625, -0.05663871765136719, -0.054775238037109375, -0.05291175842285156, -0.05104827880859375, -0.04918479919433594, -0.047321319580078125, -0.04545783996582031, -0.0435943603515625, -0.04173088073730469, -0.039867401123046875, -0.03800392150878906, -0.03614044189453125, -0.03427696228027344, -0.032413482666015625, -0.030550003051757812, -0.0286865234375, -0.026823043823242188, -0.024959564208984375, -0.023096084594726562, -0.02123260498046875, -0.019369125366210938, -0.017505645751953125, -0.015642166137695312, -0.0137786865234375, -0.011915206909179688, -0.010051727294921875, -0.008188247680664062, -0.00632476806640625, -0.0044612884521484375, -0.002597808837890625, -0.0007343292236328125, 0.001129150390625, 0.0029926300048828125, 0.004856109619140625, 0.0067195892333984375, 0.00858306884765625, 0.010446548461914062, 0.012310028076171875, 0.014173507690429688, 0.0160369873046875, 0.017900466918945312, 0.019763946533203125, 0.021627426147460938, 0.02349090576171875, 0.025354385375976562, 0.027217864990234375, 0.029081344604492188, 0.03094482421875, 0.03280830383300781, 0.034671783447265625, 0.03653526306152344, 0.03839874267578125, 0.04026222229003906, 0.042125701904296875, 0.04398918151855469, 0.0458526611328125, 0.04771614074707031, 0.049579620361328125, 0.05144309997558594, 0.05330657958984375, 0.05517005920410156, 0.057033538818359375, 0.05889701843261719, 0.060760498046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1005.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037998151034116745, -0.036793846637010574, -0.035589538514614105, -0.034385234117507935, -0.033180929720401764, -0.03197662532329559, -0.030772319063544273, -0.029568012803792953, -0.028363708406686783, -0.027159404009580612, -0.025955097749829292, -0.024750791490077972, -0.023546487092971802, -0.02234218269586563, -0.02113787643611431, -0.01993357017636299, -0.01872926577925682, -0.01752496138215065, -0.01632065512239933, -0.015116349793970585, -0.01391204446554184, -0.012707739137113094, -0.011503433808684349, -0.010299128480255604, -0.009094823151826859, -0.007890517823398113, -0.006686212494969368, -0.005481907166540623, -0.0042776018381118774, -0.003073296509683132, -0.001868991181254387, -0.0006646858528256416, 0.0005396232008934021, 0.0017439285293221474, 0.0029482338577508926, 0.004152539186179638, 0.005356844514608383, 0.0065611498430371284, 0.007765455171465874, 0.008969760499894619, 0.010174065828323364, 0.01137837115675211, 0.012582676485180855, 0.0137869818136096, 0.014991287142038345, 0.016195591539144516, 0.017399897798895836, 0.018604204058647156, 0.019808508455753326, 0.021012812852859497, 0.022217119112610817, 0.023421425372362137, 0.024625729769468307, 0.025830034166574478, 0.027034340426325798, 0.028238646686077118, 0.02944295108318329, 0.03064725548028946, 0.03185155987739563, 0.0330558679997921, 0.03426017239689827, 0.03546447679400444, 0.03666878491640091, 0.03787308931350708, 0.03907739371061325]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 7.0, 14.0, 18.0, 12.0, 32.0, 23.0, 26.0, 32.0, 35.0, 51.0, 58.0, 44.0, 44.0, 62.0, 52.0, 52.0, 63.0, 47.0, 64.0, 41.0, 39.0, 32.0, 22.0, 22.0, 28.0, 16.0, 21.0, 4.0, 13.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018758773803710938, -0.001799331046640873, -0.0017227847129106522, -0.0016462383791804314, -0.0015696920454502106, -0.0014931457117199898, -0.001416599377989769, -0.0013400530442595482, -0.0012635067105293274, -0.0011869603767991066, -0.0011104140430688858, -0.001033867709338665, -0.0009573213756084442, -0.0008807750418782234, -0.0008042287081480026, -0.0007276823744177818, -0.000651136040687561, -0.0005745897069573402, -0.0004980433732271194, -0.00042149703949689865, -0.00034495070576667786, -0.00026840437203645706, -0.00019185803830623627, -0.00011531170457601547, -3.876537084579468e-05, 3.778096288442612e-05, 0.00011432729661464691, 0.0001908736303448677, 0.0002674199640750885, 0.0003439662978053093, 0.0004205126315355301, 0.0004970589652657509, 0.0005736052989959717, 0.0006501516327261925, 0.0007266979664564133, 0.0008032443001866341, 0.0008797906339168549, 0.0009563369676470757, 0.0010328833013772964, 0.0011094296351075172, 0.001185975968837738, 0.0012625223025679588, 0.0013390686362981796, 0.0014156149700284004, 0.0014921613037586212, 0.001568707637488842, 0.0016452539712190628, 0.0017218003049492836, 0.0017983466386795044, 0.0018748929724097252, 0.001951439306139946, 0.0020279856398701668, 0.0021045319736003876, 0.0021810783073306084, 0.002257624641060829, 0.00233417097479105, 0.0024107173085212708, 0.0024872636422514915, 0.0025638099759817123, 0.002640356309711933, 0.002716902643442154, 0.0027934489771723747, 0.0028699953109025955, 0.0029465416446328163, 0.003023087978363037]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 19.0, 26.0, 21.0, 42.0, 72.0, 92.0, 119.0, 163.0, 315.0, 436.0, 793.0, 1325.0, 2596.0, 5159.0, 10176.0, 23638.0, 66454.0, 252070.0, 480102.0, 133026.0, 40169.0, 15739.0, 7454.0, 3741.0, 1938.0, 1057.0, 622.0, 398.0, 244.0, 136.0, 115.0, 91.0, 53.0, 36.0, 31.0, 20.0, 18.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.390625, -3.288726806640625, -3.18682861328125, -3.084930419921875, -2.9830322265625, -2.881134033203125, -2.77923583984375, -2.677337646484375, -2.575439453125, -2.473541259765625, -2.37164306640625, -2.269744873046875, -2.1678466796875, -2.065948486328125, -1.96405029296875, -1.862152099609375, -1.76025390625, -1.658355712890625, -1.55645751953125, -1.454559326171875, -1.3526611328125, -1.250762939453125, -1.14886474609375, -1.046966552734375, -0.945068359375, -0.843170166015625, -0.74127197265625, -0.639373779296875, -0.5374755859375, -0.435577392578125, -0.33367919921875, -0.231781005859375, -0.1298828125, -0.027984619140625, 0.07391357421875, 0.175811767578125, 0.2777099609375, 0.379608154296875, 0.48150634765625, 0.583404541015625, 0.685302734375, 0.787200927734375, 0.88909912109375, 0.990997314453125, 1.0928955078125, 1.194793701171875, 1.29669189453125, 1.398590087890625, 1.50048828125, 1.602386474609375, 1.70428466796875, 1.806182861328125, 1.9080810546875, 2.009979248046875, 2.11187744140625, 2.213775634765625, 2.315673828125, 2.417572021484375, 2.51947021484375, 2.621368408203125, 2.7232666015625, 2.825164794921875, 2.92706298828125, 3.028961181640625, 3.130859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 6.0, 19.0, 17.0, 16.0, 24.0, 23.0, 25.0, 37.0, 28.0, 32.0, 45.0, 46.0, 44.0, 64.0, 77.0, 1697.0, 313.0, 75.0, 62.0, 50.0, 53.0, 49.0, 37.0, 33.0, 29.0, 26.0, 22.0, 22.0, 12.0, 15.0, 10.0, 10.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.34375, -17.8177490234375, -17.291748046875, -16.7657470703125, -16.23974609375, -15.7137451171875, -15.187744140625, -14.6617431640625, -14.1357421875, -13.6097412109375, -13.083740234375, -12.5577392578125, -12.03173828125, -11.5057373046875, -10.979736328125, -10.4537353515625, -9.927734375, -9.4017333984375, -8.875732421875, -8.3497314453125, -7.82373046875, -7.2977294921875, -6.771728515625, -6.2457275390625, -5.7197265625, -5.1937255859375, -4.667724609375, -4.1417236328125, -3.61572265625, -3.0897216796875, -2.563720703125, -2.0377197265625, -1.51171875, -0.9857177734375, -0.459716796875, 0.0662841796875, 0.59228515625, 1.1182861328125, 1.644287109375, 2.1702880859375, 2.6962890625, 3.2222900390625, 3.748291015625, 4.2742919921875, 4.80029296875, 5.3262939453125, 5.852294921875, 6.3782958984375, 6.904296875, 7.4302978515625, 7.956298828125, 8.4822998046875, 9.00830078125, 9.5343017578125, 10.060302734375, 10.5863037109375, 11.1123046875, 11.6383056640625, 12.164306640625, 12.6903076171875, 13.21630859375, 13.7423095703125, 14.268310546875, 14.7943115234375, 15.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 12.0, 13.0, 8.0, 5.0, 15.0, 25.0, 18.0, 29.0, 36.0, 33.0, 52.0, 95.0, 114.0, 191.0, 376.0, 934.0, 3434.0, 76101.0, 3043765.0, 16947.0, 2014.0, 640.0, 267.0, 156.0, 111.0, 56.0, 41.0, 50.0, 24.0, 26.0, 24.0, 20.0, 18.0, 13.0, 13.0, 2.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.914306640625, -23.12548828125, -22.336669921875, -21.5478515625, -20.759033203125, -19.97021484375, -19.181396484375, -18.392578125, -17.603759765625, -16.81494140625, -16.026123046875, -15.2373046875, -14.448486328125, -13.65966796875, -12.870849609375, -12.08203125, -11.293212890625, -10.50439453125, -9.715576171875, -8.9267578125, -8.137939453125, -7.34912109375, -6.560302734375, -5.771484375, -4.982666015625, -4.19384765625, -3.405029296875, -2.6162109375, -1.827392578125, -1.03857421875, -0.249755859375, 0.5390625, 1.327880859375, 2.11669921875, 2.905517578125, 3.6943359375, 4.483154296875, 5.27197265625, 6.060791015625, 6.849609375, 7.638427734375, 8.42724609375, 9.216064453125, 10.0048828125, 10.793701171875, 11.58251953125, 12.371337890625, 13.16015625, 13.948974609375, 14.73779296875, 15.526611328125, 16.3154296875, 17.104248046875, 17.89306640625, 18.681884765625, 19.470703125, 20.259521484375, 21.04833984375, 21.837158203125, 22.6259765625, 23.414794921875, 24.20361328125, 24.992431640625, 25.78125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 126.0, 715.0, 159.0, 8.0], "bins": [-174.2695770263672, -171.43614196777344, -168.60269165039062, -165.76925659179688, -162.93580627441406, -160.1023712158203, -157.2689208984375, -154.43548583984375, -151.60205078125, -148.76861572265625, -145.93516540527344, -143.1017303466797, -140.26828002929688, -137.43484497070312, -134.60140991210938, -131.76795959472656, -128.93450927734375, -126.10106658935547, -123.26762390136719, -120.43418884277344, -117.60074615478516, -114.76730346679688, -111.9338607788086, -109.10041809082031, -106.26698303222656, -103.43354034423828, -100.60009765625, -97.76666259765625, -94.93321990966797, -92.09977722167969, -89.2663345336914, -86.43289184570312, -83.59944915771484, -80.76600646972656, -77.93256378173828, -75.09912109375, -72.26568603515625, -69.43224334716797, -66.59880065917969, -63.765357971191406, -60.93191909790039, -58.09847640991211, -55.265037536621094, -52.43159484863281, -49.59815216064453, -46.76470947265625, -43.931270599365234, -41.09782791137695, -38.26438903808594, -35.430946350097656, -32.59750747680664, -29.76406478881836, -26.930622100830078, -24.09718132019043, -21.26374053955078, -18.4302978515625, -15.596856117248535, -12.76341438293457, -9.929973602294922, -7.096531867980957, -4.263090133666992, -1.4296483993530273, 1.403792381286621, 4.237235069274902, 7.070675849914551]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 12.0, 22.0, 20.0, 26.0, 17.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 28.0, 27.0, 38.0, 31.0, 40.0, 31.0, 46.0, 38.0, 40.0, 33.0, 33.0, 34.0, 25.0, 32.0, 20.0, 19.0, 19.0, 20.0, 21.0, 17.0, 12.0, 20.0, 19.0, 11.0, 10.0, 11.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-44.84918212890625, -43.43840789794922, -42.02763748168945, -40.61686325073242, -39.206092834472656, -37.795318603515625, -36.384544372558594, -34.97377014160156, -33.5629997253418, -32.152225494384766, -30.741455078125, -29.33068084716797, -27.91990852355957, -26.509136199951172, -25.09836196899414, -23.687589645385742, -22.276817321777344, -20.866044998168945, -19.455272674560547, -18.044498443603516, -16.633726119995117, -15.222953796386719, -13.812180519104004, -12.401407241821289, -10.99063491821289, -9.579862594604492, -8.169089317321777, -6.758316516876221, -5.347543716430664, -3.9367709159851074, -2.525998115539551, -1.115224838256836, 0.2955513000488281, 1.7063241004943848, 3.1170969009399414, 4.527869701385498, 5.938642501831055, 7.349415302276611, 8.760188102722168, 10.170961380004883, 11.581733703613281, 12.99250602722168, 14.403279304504395, 15.81405258178711, 17.224824905395508, 18.635597229003906, 20.046371459960938, 21.457143783569336, 22.867916107177734, 24.278688430786133, 25.68946075439453, 27.100234985351562, 28.51100730895996, 29.92177963256836, 31.33255386352539, 32.743324279785156, 34.15409851074219, 35.56487274169922, 36.975643157958984, 38.386417388916016, 39.79718780517578, 41.20796203613281, 42.618736267089844, 44.029510498046875, 45.44028091430664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 13.0, 10.0, 7.0, 17.0, 19.0, 12.0, 22.0, 32.0, 21.0, 36.0, 42.0, 31.0, 35.0, 40.0, 45.0, 41.0, 34.0, 47.0, 44.0, 43.0, 44.0, 44.0, 33.0, 36.0, 26.0, 33.0, 26.0, 24.0, 18.0, 9.0, 18.0, 18.0, 16.0, 10.0, 11.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48858642578125, -4.3404541015625, -4.19232177734375, -4.044189453125, -3.89605712890625, -3.7479248046875, -3.59979248046875, -3.45166015625, -3.30352783203125, -3.1553955078125, -3.00726318359375, -2.859130859375, -2.71099853515625, -2.5628662109375, -2.41473388671875, -2.2666015625, -2.11846923828125, -1.9703369140625, -1.82220458984375, -1.674072265625, -1.52593994140625, -1.3778076171875, -1.22967529296875, -1.08154296875, -0.93341064453125, -0.7852783203125, -0.63714599609375, -0.489013671875, -0.34088134765625, -0.1927490234375, -0.04461669921875, 0.103515625, 0.25164794921875, 0.3997802734375, 0.54791259765625, 0.696044921875, 0.84417724609375, 0.9923095703125, 1.14044189453125, 1.28857421875, 1.43670654296875, 1.5848388671875, 1.73297119140625, 1.881103515625, 2.02923583984375, 2.1773681640625, 2.32550048828125, 2.4736328125, 2.62176513671875, 2.7698974609375, 2.91802978515625, 3.066162109375, 3.21429443359375, 3.3624267578125, 3.51055908203125, 3.65869140625, 3.80682373046875, 3.9549560546875, 4.10308837890625, 4.251220703125, 4.39935302734375, 4.5474853515625, 4.69561767578125, 4.84375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 6.0, 10.0, 17.0, 25.0, 28.0, 36.0, 45.0, 82.0, 131.0, 204.0, 382.0, 822.0, 1605.0, 3658.0, 9587.0, 28481.0, 109746.0, 721311.0, 2282006.0, 857762.0, 129653.0, 31958.0, 9862.0, 3672.0, 1545.0, 717.0, 363.0, 170.0, 111.0, 68.0, 41.0, 34.0, 21.0, 21.0, 19.0, 15.0, 12.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3104248046875, -8.019287109375, -7.7281494140625, -7.43701171875, -7.1458740234375, -6.854736328125, -6.5635986328125, -6.2724609375, -5.9813232421875, -5.690185546875, -5.3990478515625, -5.10791015625, -4.8167724609375, -4.525634765625, -4.2344970703125, -3.943359375, -3.6522216796875, -3.361083984375, -3.0699462890625, -2.77880859375, -2.4876708984375, -2.196533203125, -1.9053955078125, -1.6142578125, -1.3231201171875, -1.031982421875, -0.7408447265625, -0.44970703125, -0.1585693359375, 0.132568359375, 0.4237060546875, 0.71484375, 1.0059814453125, 1.297119140625, 1.5882568359375, 1.87939453125, 2.1705322265625, 2.461669921875, 2.7528076171875, 3.0439453125, 3.3350830078125, 3.626220703125, 3.9173583984375, 4.20849609375, 4.4996337890625, 4.790771484375, 5.0819091796875, 5.373046875, 5.6641845703125, 5.955322265625, 6.2464599609375, 6.53759765625, 6.8287353515625, 7.119873046875, 7.4110107421875, 7.7021484375, 7.9932861328125, 8.284423828125, 8.5755615234375, 8.86669921875, 9.1578369140625, 9.448974609375, 9.7401123046875, 10.03125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 21.0, 22.0, 41.0, 60.0, 55.0, 107.0, 141.0, 205.0, 328.0, 422.0, 543.0, 616.0, 461.0, 325.0, 235.0, 164.0, 102.0, 71.0, 48.0, 29.0, 21.0, 13.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.607666015625, -16.10595703125, -15.604248046875, -15.1025390625, -14.600830078125, -14.09912109375, -13.597412109375, -13.095703125, -12.593994140625, -12.09228515625, -11.590576171875, -11.0888671875, -10.587158203125, -10.08544921875, -9.583740234375, -9.08203125, -8.580322265625, -8.07861328125, -7.576904296875, -7.0751953125, -6.573486328125, -6.07177734375, -5.570068359375, -5.068359375, -4.566650390625, -4.06494140625, -3.563232421875, -3.0615234375, -2.559814453125, -2.05810546875, -1.556396484375, -1.0546875, -0.552978515625, -0.05126953125, 0.450439453125, 0.9521484375, 1.453857421875, 1.95556640625, 2.457275390625, 2.958984375, 3.460693359375, 3.96240234375, 4.464111328125, 4.9658203125, 5.467529296875, 5.96923828125, 6.470947265625, 6.97265625, 7.474365234375, 7.97607421875, 8.477783203125, 8.9794921875, 9.481201171875, 9.98291015625, 10.484619140625, 10.986328125, 11.488037109375, 11.98974609375, 12.491455078125, 12.9931640625, 13.494873046875, 13.99658203125, 14.498291015625, 15.0]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 2.0, 1.0, 7.0, 11.0, 15.0, 9.0, 18.0, 20.0, 25.0, 37.0, 43.0, 82.0, 88.0, 101.0, 194.0, 339.0, 556.0, 1379.0, 5073.0, 35135.0, 580777.0, 3369238.0, 179804.0, 16087.0, 2990.0, 920.0, 431.0, 251.0, 180.0, 113.0, 88.0, 53.0, 48.0, 28.0, 34.0, 22.0, 12.0, 11.0, 11.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-29.046875, -28.119384765625, -27.19189453125, -26.264404296875, -25.3369140625, -24.409423828125, -23.48193359375, -22.554443359375, -21.626953125, -20.699462890625, -19.77197265625, -18.844482421875, -17.9169921875, -16.989501953125, -16.06201171875, -15.134521484375, -14.20703125, -13.279541015625, -12.35205078125, -11.424560546875, -10.4970703125, -9.569580078125, -8.64208984375, -7.714599609375, -6.787109375, -5.859619140625, -4.93212890625, -4.004638671875, -3.0771484375, -2.149658203125, -1.22216796875, -0.294677734375, 0.6328125, 1.560302734375, 2.48779296875, 3.415283203125, 4.3427734375, 5.270263671875, 6.19775390625, 7.125244140625, 8.052734375, 8.980224609375, 9.90771484375, 10.835205078125, 11.7626953125, 12.690185546875, 13.61767578125, 14.545166015625, 15.47265625, 16.400146484375, 17.32763671875, 18.255126953125, 19.1826171875, 20.110107421875, 21.03759765625, 21.965087890625, 22.892578125, 23.820068359375, 24.74755859375, 25.675048828125, 26.6025390625, 27.530029296875, 28.45751953125, 29.385009765625, 30.3125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 24.0, 32.0, 69.0, 100.0, 124.0, 140.0, 155.0, 119.0, 108.0, 62.0, 26.0, 14.0, 12.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.81227111816406, -74.55052185058594, -72.28877258300781, -70.02702331542969, -67.76527404785156, -65.50352478027344, -63.24177932739258, -60.98003005981445, -58.71828079223633, -56.4565315246582, -54.19478225708008, -51.93303298950195, -49.671287536621094, -47.40953826904297, -45.147789001464844, -42.88603973388672, -40.624290466308594, -38.36254119873047, -36.100791931152344, -33.83904266357422, -31.577295303344727, -29.3155460357666, -27.05379867553711, -24.792049407958984, -22.53030014038086, -20.268550872802734, -18.00680160522461, -15.745054244995117, -13.483304977416992, -11.221555709838867, -8.959807395935059, -6.69805908203125, -4.436309814453125, -2.174561023712158, 0.0871877670288086, 2.3489365577697754, 4.610685348510742, 6.872434616088867, 9.134182929992676, 11.395931243896484, 13.65768051147461, 15.919429779052734, 18.18117904663086, 20.44292640686035, 22.704675674438477, 24.9664249420166, 27.228172302246094, 29.48992156982422, 31.751670837402344, 34.01342010498047, 36.275169372558594, 38.53691864013672, 40.798667907714844, 43.06041717529297, 45.32216262817383, 47.58391189575195, 49.84566116333008, 52.1074104309082, 54.36915969848633, 56.63090896606445, 58.89265441894531, 61.15440368652344, 63.41615295410156, 65.67790222167969, 67.93965148925781]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 8.0, 16.0, 13.0, 26.0, 20.0, 22.0, 30.0, 35.0, 34.0, 33.0, 37.0, 39.0, 37.0, 38.0, 51.0, 39.0, 46.0, 42.0, 57.0, 53.0, 44.0, 28.0, 42.0, 32.0, 32.0, 19.0, 20.0, 13.0, 19.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.31919860839844, -41.86086654663086, -40.402530670166016, -38.94419860839844, -37.485862731933594, -36.027530670166016, -34.56919860839844, -33.110862731933594, -31.652528762817383, -30.194194793701172, -28.73586082458496, -27.27752685546875, -25.819194793701172, -24.360858917236328, -22.90252685546875, -21.44419288635254, -19.985858917236328, -18.527524948120117, -17.069190979003906, -15.610857963562012, -14.1525239944458, -12.69419002532959, -11.235857009887695, -9.777523040771484, -8.319189071655273, -6.8608551025390625, -5.40252161026001, -3.944188117980957, -2.485854148864746, -1.0275201797485352, 0.4308128356933594, 1.8891468048095703, 3.3474807739257812, 4.805814743041992, 6.264148235321045, 7.722481727600098, 9.180815696716309, 10.63914966583252, 12.097482681274414, 13.555816650390625, 15.014150619506836, 16.472484588623047, 17.930818557739258, 19.38915252685547, 20.847484588623047, 22.30582046508789, 23.76415252685547, 25.22248649597168, 26.68082046508789, 28.1391544342041, 29.597488403320312, 31.05582046508789, 32.514156341552734, 33.97248840332031, 35.430824279785156, 36.889156341552734, 38.34748840332031, 39.80582046508789, 41.264156341552734, 42.72248840332031, 44.180824279785156, 45.639156341552734, 47.09748840332031, 48.555824279785156, 50.01416015625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 3.0, 16.0, 18.0, 8.0, 31.0, 34.0, 51.0, 74.0, 88.0, 124.0, 180.0, 267.0, 400.0, 568.0, 803.0, 1150.0, 1713.0, 2478.0, 3857.0, 5902.0, 9038.0, 13980.0, 22122.0, 34545.0, 55387.0, 87665.0, 132525.0, 173248.0, 165699.0, 120940.0, 78440.0, 49300.0, 31134.0, 19910.0, 12512.0, 8047.0, 5270.0, 3525.0, 2342.0, 1578.0, 1068.0, 762.0, 512.0, 346.0, 260.0, 187.0, 137.0, 89.0, 56.0, 47.0, 38.0, 28.0, 21.0, 9.0, 11.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44341278076171875, -0.4285736083984375, -0.41373443603515625, -0.398895263671875, -0.38405609130859375, -0.3692169189453125, -0.35437774658203125, -0.33953857421875, -0.32469940185546875, -0.3098602294921875, -0.29502105712890625, -0.280181884765625, -0.26534271240234375, -0.2505035400390625, -0.23566436767578125, -0.2208251953125, -0.20598602294921875, -0.1911468505859375, -0.17630767822265625, -0.161468505859375, -0.14662933349609375, -0.1317901611328125, -0.11695098876953125, -0.10211181640625, -0.08727264404296875, -0.0724334716796875, -0.05759429931640625, -0.042755126953125, -0.02791595458984375, -0.0130767822265625, 0.00176239013671875, 0.0166015625, 0.03144073486328125, 0.0462799072265625, 0.06111907958984375, 0.075958251953125, 0.09079742431640625, 0.1056365966796875, 0.12047576904296875, 0.13531494140625, 0.15015411376953125, 0.1649932861328125, 0.17983245849609375, 0.194671630859375, 0.20951080322265625, 0.2243499755859375, 0.23918914794921875, 0.2540283203125, 0.26886749267578125, 0.2837066650390625, 0.29854583740234375, 0.313385009765625, 0.32822418212890625, 0.3430633544921875, 0.35790252685546875, 0.37274169921875, 0.38758087158203125, 0.4024200439453125, 0.41725921630859375, 0.432098388671875, 0.44693756103515625, 0.4617767333984375, 0.47661590576171875, 0.491455078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 10.0, 5.0, 6.0, 7.0, 12.0, 15.0, 20.0, 24.0, 31.0, 26.0, 32.0, 37.0, 42.0, 45.0, 39.0, 56.0, 48.0, 1065.0, 51.0, 63.0, 57.0, 55.0, 41.0, 39.0, 30.0, 25.0, 36.0, 29.0, 29.0, 18.0, 13.0, 15.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.923858642578125, -3.80084228515625, -3.677825927734375, -3.5548095703125, -3.431793212890625, -3.30877685546875, -3.185760498046875, -3.062744140625, -2.939727783203125, -2.81671142578125, -2.693695068359375, -2.5706787109375, -2.447662353515625, -2.32464599609375, -2.201629638671875, -2.07861328125, -1.955596923828125, -1.83258056640625, -1.709564208984375, -1.5865478515625, -1.463531494140625, -1.34051513671875, -1.217498779296875, -1.094482421875, -0.971466064453125, -0.84844970703125, -0.725433349609375, -0.6024169921875, -0.479400634765625, -0.35638427734375, -0.233367919921875, -0.1103515625, 0.012664794921875, 0.13568115234375, 0.258697509765625, 0.3817138671875, 0.504730224609375, 0.62774658203125, 0.750762939453125, 0.873779296875, 0.996795654296875, 1.11981201171875, 1.242828369140625, 1.3658447265625, 1.488861083984375, 1.61187744140625, 1.734893798828125, 1.85791015625, 1.980926513671875, 2.10394287109375, 2.226959228515625, 2.3499755859375, 2.472991943359375, 2.59600830078125, 2.719024658203125, 2.842041015625, 2.965057373046875, 3.08807373046875, 3.211090087890625, 3.3341064453125, 3.457122802734375, 3.58013916015625, 3.703155517578125, 3.826171875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 17.0, 25.0, 32.0, 47.0, 114.0, 174.0, 258.0, 438.0, 731.0, 1217.0, 2052.0, 3395.0, 5520.0, 9215.0, 15369.0, 25379.0, 42081.0, 68286.0, 107979.0, 155898.0, 1228516.0, 153608.0, 105608.0, 66709.0, 41099.0, 24865.0, 15166.0, 9175.0, 5618.0, 3322.0, 2081.0, 1217.0, 730.0, 478.0, 242.0, 199.0, 102.0, 55.0, 30.0, 18.0, 15.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.368408203125, -0.3563232421875, -0.34423828125, -0.3321533203125, -0.320068359375, -0.3079833984375, -0.2958984375, -0.2838134765625, -0.271728515625, -0.2596435546875, -0.24755859375, -0.2354736328125, -0.223388671875, -0.2113037109375, -0.19921875, -0.1871337890625, -0.175048828125, -0.1629638671875, -0.15087890625, -0.1387939453125, -0.126708984375, -0.1146240234375, -0.1025390625, -0.0904541015625, -0.078369140625, -0.0662841796875, -0.05419921875, -0.0421142578125, -0.030029296875, -0.0179443359375, -0.005859375, 0.0062255859375, 0.018310546875, 0.0303955078125, 0.04248046875, 0.0545654296875, 0.066650390625, 0.0787353515625, 0.0908203125, 0.1029052734375, 0.114990234375, 0.1270751953125, 0.13916015625, 0.1512451171875, 0.163330078125, 0.1754150390625, 0.1875, 0.1995849609375, 0.211669921875, 0.2237548828125, 0.23583984375, 0.2479248046875, 0.260009765625, 0.2720947265625, 0.2841796875, 0.2962646484375, 0.308349609375, 0.3204345703125, 0.33251953125, 0.3446044921875, 0.356689453125, 0.3687744140625, 0.380859375, 0.3929443359375, 0.405029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 11.0, 14.0, 18.0, 21.0, 21.0, 24.0, 34.0, 53.0, 57.0, 59.0, 69.0, 67.0, 56.0, 73.0, 51.0, 50.0, 63.0, 41.0, 32.0, 22.0, 31.0, 20.0, 19.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0033111572265625, -0.003223031759262085, -0.00313490629196167, -0.003046780824661255, -0.00295865535736084, -0.002870529890060425, -0.0027824044227600098, -0.0026942789554595947, -0.0026061534881591797, -0.0025180280208587646, -0.0024299025535583496, -0.0023417770862579346, -0.0022536516189575195, -0.0021655261516571045, -0.0020774006843566895, -0.0019892752170562744, -0.0019011497497558594, -0.0018130242824554443, -0.0017248988151550293, -0.0016367733478546143, -0.0015486478805541992, -0.0014605224132537842, -0.0013723969459533691, -0.001284271478652954, -0.001196146011352539, -0.001108020544052124, -0.001019895076751709, -0.0009317696094512939, -0.0008436441421508789, -0.0007555186748504639, -0.0006673932075500488, -0.0005792677402496338, -0.0004911422729492188, -0.0004030168056488037, -0.00031489133834838867, -0.00022676587104797363, -0.0001386404037475586, -5.0514936447143555e-05, 3.7610530853271484e-05, 0.00012573599815368652, 0.00021386146545410156, 0.0003019869327545166, 0.00039011240005493164, 0.0004782378673553467, 0.0005663633346557617, 0.0006544888019561768, 0.0007426142692565918, 0.0008307397365570068, 0.0009188652038574219, 0.001006990671157837, 0.001095116138458252, 0.001183241605758667, 0.001271367073059082, 0.001359492540359497, 0.0014476180076599121, 0.0015357434749603271, 0.0016238689422607422, 0.0017119944095611572, 0.0018001198768615723, 0.0018882453441619873, 0.0019763708114624023, 0.0020644962787628174, 0.0021526217460632324, 0.0022407472133636475, 0.0023288726806640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 13.0, 10.0, 11.0, 11.0, 19.0, 25.0, 42.0, 55.0, 78.0, 99.0, 123.0, 202.0, 283.0, 535.0, 3627.0, 953122.0, 87945.0, 1095.0, 403.0, 239.0, 148.0, 121.0, 100.0, 57.0, 49.0, 44.0, 22.0, 19.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047515869140625, -0.04574155807495117, -0.043967247009277344, -0.042192935943603516, -0.04041862487792969, -0.03864431381225586, -0.03687000274658203, -0.0350956916809082, -0.033321380615234375, -0.03154706954956055, -0.02977275848388672, -0.02799844741821289, -0.026224136352539062, -0.024449825286865234, -0.022675514221191406, -0.020901203155517578, -0.01912689208984375, -0.017352581024169922, -0.015578269958496094, -0.013803958892822266, -0.012029647827148438, -0.01025533676147461, -0.008481025695800781, -0.006706714630126953, -0.004932403564453125, -0.003158092498779297, -0.0013837814331054688, 0.0003905296325683594, 0.0021648406982421875, 0.003939151763916016, 0.005713462829589844, 0.007487773895263672, 0.0092620849609375, 0.011036396026611328, 0.012810707092285156, 0.014585018157958984, 0.016359329223632812, 0.01813364028930664, 0.01990795135498047, 0.021682262420654297, 0.023456573486328125, 0.025230884552001953, 0.02700519561767578, 0.02877950668334961, 0.030553817749023438, 0.032328128814697266, 0.034102439880371094, 0.03587675094604492, 0.03765106201171875, 0.03942537307739258, 0.041199684143066406, 0.042973995208740234, 0.04474830627441406, 0.04652261734008789, 0.04829692840576172, 0.05007123947143555, 0.051845550537109375, 0.0536198616027832, 0.05539417266845703, 0.05716848373413086, 0.05894279479980469, 0.060717105865478516, 0.062491416931152344, 0.06426572799682617, 0.0660400390625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 443.0, 531.0, 31.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016857799142599106, -0.016347317025065422, -0.015836836770176888, -0.015326354652643204, -0.014815873466432095, -0.014305392280220985, -0.013794910162687302, -0.013284428976476192, -0.012773947790265083, -0.012263466604053974, -0.011752985417842865, -0.011242503300309181, -0.010732022114098072, -0.010221540927886963, -0.009711058810353279, -0.00920057762414217, -0.00869009643793106, -0.008179615251719952, -0.007669133599847555, -0.007158651947975159, -0.0066481707617640495, -0.00613768957555294, -0.005627207923680544, -0.005116726271808147, -0.004606245085597038, -0.004095763899385929, -0.0035852822475135326, -0.00307480082847178, -0.002564319409430027, -0.002053837990388274, -0.0015433565713465214, -0.0010328751523047686, -0.000522395595908165, -1.1914176866412163e-05, 0.0004985672421753407, 0.0010090486612170935, 0.0015195300802588463, 0.002030011499300599, 0.002540492918342352, 0.0030509743373841047, 0.0035614557564258575, 0.004071936942636967, 0.004582418594509363, 0.00509290024638176, 0.005603381432592869, 0.006113862618803978, 0.0066243442706763744, 0.007134825922548771, 0.00764530710875988, 0.00815578829497099, 0.008666269481182098, 0.009176751598715782, 0.009687232784926891, 0.010197713971138, 0.010708196088671684, 0.011218677274882793, 0.011729158461093903, 0.012239639647305012, 0.012750120833516121, 0.013260602951049805, 0.013771084137260914, 0.014281565323472023, 0.014792047441005707, 0.015302528627216816, 0.015813009813427925]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 5.0, 8.0, 9.0, 10.0, 22.0, 25.0, 13.0, 20.0, 24.0, 26.0, 32.0, 23.0, 37.0, 31.0, 33.0, 31.0, 24.0, 36.0, 45.0, 52.0, 47.0, 45.0, 34.0, 36.0, 28.0, 42.0, 23.0, 31.0, 24.0, 20.0, 29.0, 12.0, 17.0, 14.0, 10.0, 17.0, 13.0, 13.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013415217399597168, -0.0012950357049703598, -0.0012485496699810028, -0.0012020636349916458, -0.0011555776000022888, -0.0011090915650129318, -0.0010626055300235748, -0.0010161194950342178, -0.0009696334600448608, -0.0009231474250555038, -0.0008766613900661469, -0.0008301753550767899, -0.0007836893200874329, -0.0007372032850980759, -0.0006907172501087189, -0.0006442312151193619, -0.0005977451801300049, -0.0005512591451406479, -0.0005047731101512909, -0.0004582870751619339, -0.0004118010401725769, -0.0003653150051832199, -0.0003188289701938629, -0.0002723429352045059, -0.00022585690021514893, -0.00017937086522579193, -0.00013288483023643494, -8.639879524707794e-05, -3.991276025772095e-05, 6.573274731636047e-06, 5.305930972099304e-05, 9.954534471035004e-05, 0.00014603137969970703, 0.00019251741468906403, 0.00023900344967842102, 0.000285489484667778, 0.000331975519657135, 0.000378461554646492, 0.000424947589635849, 0.000471433624625206, 0.000517919659614563, 0.00056440569460392, 0.000610891729593277, 0.000657377764582634, 0.000703863799571991, 0.000750349834561348, 0.000796835869550705, 0.000843321904540062, 0.0008898079395294189, 0.0009362939745187759, 0.000982780009508133, 0.00102926604449749, 0.001075752079486847, 0.001122238114476204, 0.001168724149465561, 0.001215210184454918, 0.001261696219444275, 0.001308182254433632, 0.001354668289422989, 0.0014011543244123459, 0.0014476403594017029, 0.0014941263943910599, 0.0015406124293804169, 0.0015870984643697739, 0.0016335844993591309]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 16.0, 12.0, 17.0, 33.0, 47.0, 64.0, 100.0, 127.0, 189.0, 265.0, 413.0, 626.0, 964.0, 1428.0, 2303.0, 4158.0, 8233.0, 19779.0, 63299.0, 265849.0, 489946.0, 129315.0, 34752.0, 12404.0, 5773.0, 3169.0, 1792.0, 1121.0, 749.0, 535.0, 315.0, 231.0, 159.0, 110.0, 75.0, 46.0, 42.0, 25.0, 15.0, 17.0, 6.0, 4.0, 4.0, 8.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0390625, -3.913848876953125, -3.78863525390625, -3.663421630859375, -3.5382080078125, -3.412994384765625, -3.28778076171875, -3.162567138671875, -3.037353515625, -2.912139892578125, -2.78692626953125, -2.661712646484375, -2.5364990234375, -2.411285400390625, -2.28607177734375, -2.160858154296875, -2.03564453125, -1.910430908203125, -1.78521728515625, -1.660003662109375, -1.5347900390625, -1.409576416015625, -1.28436279296875, -1.159149169921875, -1.033935546875, -0.908721923828125, -0.78350830078125, -0.658294677734375, -0.5330810546875, -0.407867431640625, -0.28265380859375, -0.157440185546875, -0.0322265625, 0.092987060546875, 0.21820068359375, 0.343414306640625, 0.4686279296875, 0.593841552734375, 0.71905517578125, 0.844268798828125, 0.969482421875, 1.094696044921875, 1.21990966796875, 1.345123291015625, 1.4703369140625, 1.595550537109375, 1.72076416015625, 1.845977783203125, 1.97119140625, 2.096405029296875, 2.22161865234375, 2.346832275390625, 2.4720458984375, 2.597259521484375, 2.72247314453125, 2.847686767578125, 2.972900390625, 3.098114013671875, 3.22332763671875, 3.348541259765625, 3.4737548828125, 3.598968505859375, 3.72418212890625, 3.849395751953125, 3.974609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 1.0, 4.0, 8.0, 12.0, 9.0, 9.0, 15.0, 16.0, 26.0, 24.0, 26.0, 34.0, 31.0, 51.0, 54.0, 49.0, 62.0, 113.0, 1731.0, 276.0, 77.0, 55.0, 49.0, 48.0, 39.0, 37.0, 37.0, 21.0, 29.0, 27.0, 17.0, 11.0, 12.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.25244140625, -15.6455078125, -15.03857421875, -14.431640625, -13.82470703125, -13.2177734375, -12.61083984375, -12.00390625, -11.39697265625, -10.7900390625, -10.18310546875, -9.576171875, -8.96923828125, -8.3623046875, -7.75537109375, -7.1484375, -6.54150390625, -5.9345703125, -5.32763671875, -4.720703125, -4.11376953125, -3.5068359375, -2.89990234375, -2.29296875, -1.68603515625, -1.0791015625, -0.47216796875, 0.134765625, 0.74169921875, 1.3486328125, 1.95556640625, 2.5625, 3.16943359375, 3.7763671875, 4.38330078125, 4.990234375, 5.59716796875, 6.2041015625, 6.81103515625, 7.41796875, 8.02490234375, 8.6318359375, 9.23876953125, 9.845703125, 10.45263671875, 11.0595703125, 11.66650390625, 12.2734375, 12.88037109375, 13.4873046875, 14.09423828125, 14.701171875, 15.30810546875, 15.9150390625, 16.52197265625, 17.12890625, 17.73583984375, 18.3427734375, 18.94970703125, 19.556640625, 20.16357421875, 20.7705078125, 21.37744140625, 21.984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 13.0, 4.0, 3.0, 14.0, 12.0, 11.0, 19.0, 24.0, 31.0, 42.0, 49.0, 69.0, 76.0, 126.0, 218.0, 460.0, 1378.0, 18918.0, 3061004.0, 59624.0, 2330.0, 491.0, 243.0, 153.0, 97.0, 72.0, 51.0, 42.0, 26.0, 23.0, 16.0, 19.0, 7.0, 11.0, 12.0, 5.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.875, -34.895751953125, -33.91650390625, -32.937255859375, -31.9580078125, -30.978759765625, -29.99951171875, -29.020263671875, -28.041015625, -27.061767578125, -26.08251953125, -25.103271484375, -24.1240234375, -23.144775390625, -22.16552734375, -21.186279296875, -20.20703125, -19.227783203125, -18.24853515625, -17.269287109375, -16.2900390625, -15.310791015625, -14.33154296875, -13.352294921875, -12.373046875, -11.393798828125, -10.41455078125, -9.435302734375, -8.4560546875, -7.476806640625, -6.49755859375, -5.518310546875, -4.5390625, -3.559814453125, -2.58056640625, -1.601318359375, -0.6220703125, 0.357177734375, 1.33642578125, 2.315673828125, 3.294921875, 4.274169921875, 5.25341796875, 6.232666015625, 7.2119140625, 8.191162109375, 9.17041015625, 10.149658203125, 11.12890625, 12.108154296875, 13.08740234375, 14.066650390625, 15.0458984375, 16.025146484375, 17.00439453125, 17.983642578125, 18.962890625, 19.942138671875, 20.92138671875, 21.900634765625, 22.8798828125, 23.859130859375, 24.83837890625, 25.817626953125, 26.796875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 42.0, 330.0, 538.0, 97.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.038566589355469, -11.344952583312988, -8.651338577270508, -5.957724571228027, -3.264110565185547, -0.5704965591430664, 2.123117446899414, 4.816730499267578, 7.510345458984375, 10.203959465026855, 12.897573471069336, 15.591187477111816, 18.284801483154297, 20.978416442871094, 23.672029495239258, 26.365642547607422, 29.05925750732422, 31.752872467041016, 34.44648742675781, 37.140098571777344, 39.83371353149414, 42.52732849121094, 45.22093963623047, 47.914554595947266, 50.60816955566406, 53.30178451538086, 55.995399475097656, 58.68901062011719, 61.382625579833984, 64.07624053955078, 66.76985168457031, 69.46347045898438, 72.15708923339844, 74.85070037841797, 77.54431915283203, 80.23793029785156, 82.93154907226562, 85.62516021728516, 88.31877136230469, 91.01239013671875, 93.70600128173828, 96.39961242675781, 99.09323120117188, 101.7868423461914, 104.48045349121094, 107.174072265625, 109.86768341064453, 112.56129455566406, 115.25491333007812, 117.94852447509766, 120.64214324951172, 123.33575439453125, 126.02937316894531, 128.7229766845703, 131.41659545898438, 134.11021423339844, 136.8038330078125, 139.49745178222656, 142.19105529785156, 144.88467407226562, 147.5782928466797, 150.2718963623047, 152.96551513671875, 155.6591339111328, 158.3527374267578]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 16.0, 14.0, 16.0, 20.0, 24.0, 14.0, 35.0, 29.0, 26.0, 39.0, 45.0, 28.0, 31.0, 36.0, 29.0, 36.0, 36.0, 33.0, 28.0, 53.0, 36.0, 38.0, 25.0, 29.0, 18.0, 17.0, 24.0, 19.0, 15.0, 16.0, 12.0, 15.0, 13.0, 7.0, 14.0, 4.0, 13.0, 4.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-50.27008819580078, -48.72826385498047, -47.186439514160156, -45.64461898803711, -44.1027946472168, -42.560970306396484, -41.01914978027344, -39.477325439453125, -37.93550109863281, -36.3936767578125, -34.85185241699219, -33.31003189086914, -31.768207550048828, -30.226383209228516, -28.684560775756836, -27.142738342285156, -25.600914001464844, -24.05908966064453, -22.51726722717285, -20.975444793701172, -19.43362045288086, -17.891796112060547, -16.349973678588867, -14.808150291442871, -13.266326904296875, -11.724503517150879, -10.182680130004883, -8.640856742858887, -7.099033355712891, -5.5572099685668945, -4.015386581420898, -2.4735631942749023, -0.9317359924316406, 0.6100873947143555, 2.1519107818603516, 3.6937341690063477, 5.235557556152344, 6.77738094329834, 8.319204330444336, 9.861027717590332, 11.402851104736328, 12.944674491882324, 14.48649787902832, 16.0283203125, 17.570144653320312, 19.111968994140625, 20.653791427612305, 22.195613861083984, 23.737438201904297, 25.27926254272461, 26.82108497619629, 28.36290740966797, 29.90473175048828, 31.446556091308594, 32.988380432128906, 34.53020095825195, 36.072025299072266, 37.61384963989258, 39.155670166015625, 40.69749450683594, 42.23931884765625, 43.78114318847656, 45.322967529296875, 46.86478805541992, 48.406612396240234]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 7.0, 22.0, 15.0, 13.0, 25.0, 25.0, 26.0, 25.0, 32.0, 32.0, 32.0, 37.0, 51.0, 51.0, 34.0, 45.0, 47.0, 38.0, 35.0, 39.0, 42.0, 36.0, 33.0, 32.0, 29.0, 37.0, 26.0, 15.0, 17.0, 18.0, 10.0, 11.0, 6.0, 8.0, 8.0, 10.0, 0.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.350830078125, -5.19384765625, -5.036865234375, -4.8798828125, -4.722900390625, -4.56591796875, -4.408935546875, -4.251953125, -4.094970703125, -3.93798828125, -3.781005859375, -3.6240234375, -3.467041015625, -3.31005859375, -3.153076171875, -2.99609375, -2.839111328125, -2.68212890625, -2.525146484375, -2.3681640625, -2.211181640625, -2.05419921875, -1.897216796875, -1.740234375, -1.583251953125, -1.42626953125, -1.269287109375, -1.1123046875, -0.955322265625, -0.79833984375, -0.641357421875, -0.484375, -0.327392578125, -0.17041015625, -0.013427734375, 0.1435546875, 0.300537109375, 0.45751953125, 0.614501953125, 0.771484375, 0.928466796875, 1.08544921875, 1.242431640625, 1.3994140625, 1.556396484375, 1.71337890625, 1.870361328125, 2.02734375, 2.184326171875, 2.34130859375, 2.498291015625, 2.6552734375, 2.812255859375, 2.96923828125, 3.126220703125, 3.283203125, 3.440185546875, 3.59716796875, 3.754150390625, 3.9111328125, 4.068115234375, 4.22509765625, 4.382080078125, 4.5390625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 5.0, 15.0, 17.0, 21.0, 15.0, 17.0, 31.0, 33.0, 42.0, 104.0, 161.0, 360.0, 851.0, 3031.0, 14341.0, 103183.0, 1710362.0, 2196482.0, 142218.0, 17737.0, 3441.0, 952.0, 354.0, 167.0, 91.0, 49.0, 42.0, 21.0, 23.0, 17.0, 18.0, 14.0, 10.0, 7.0, 7.0, 8.0, 7.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.8336181640625, -15.354736328125, -14.8758544921875, -14.39697265625, -13.9180908203125, -13.439208984375, -12.9603271484375, -12.4814453125, -12.0025634765625, -11.523681640625, -11.0447998046875, -10.56591796875, -10.0870361328125, -9.608154296875, -9.1292724609375, -8.650390625, -8.1715087890625, -7.692626953125, -7.2137451171875, -6.73486328125, -6.2559814453125, -5.777099609375, -5.2982177734375, -4.8193359375, -4.3404541015625, -3.861572265625, -3.3826904296875, -2.90380859375, -2.4249267578125, -1.946044921875, -1.4671630859375, -0.98828125, -0.5093994140625, -0.030517578125, 0.4483642578125, 0.92724609375, 1.4061279296875, 1.885009765625, 2.3638916015625, 2.8427734375, 3.3216552734375, 3.800537109375, 4.2794189453125, 4.75830078125, 5.2371826171875, 5.716064453125, 6.1949462890625, 6.673828125, 7.1527099609375, 7.631591796875, 8.1104736328125, 8.58935546875, 9.0682373046875, 9.547119140625, 10.0260009765625, 10.5048828125, 10.9837646484375, 11.462646484375, 11.9415283203125, 12.42041015625, 12.8992919921875, 13.378173828125, 13.8570556640625, 14.3359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 11.0, 16.0, 20.0, 28.0, 53.0, 79.0, 88.0, 156.0, 193.0, 326.0, 461.0, 586.0, 553.0, 468.0, 319.0, 262.0, 139.0, 101.0, 72.0, 47.0, 29.0, 19.0, 15.0, 14.0, 4.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-20.328125, -19.8197021484375, -19.311279296875, -18.8028564453125, -18.29443359375, -17.7860107421875, -17.277587890625, -16.7691650390625, -16.2607421875, -15.7523193359375, -15.243896484375, -14.7354736328125, -14.22705078125, -13.7186279296875, -13.210205078125, -12.7017822265625, -12.193359375, -11.6849365234375, -11.176513671875, -10.6680908203125, -10.15966796875, -9.6512451171875, -9.142822265625, -8.6343994140625, -8.1259765625, -7.6175537109375, -7.109130859375, -6.6007080078125, -6.09228515625, -5.5838623046875, -5.075439453125, -4.5670166015625, -4.05859375, -3.5501708984375, -3.041748046875, -2.5333251953125, -2.02490234375, -1.5164794921875, -1.008056640625, -0.4996337890625, 0.0087890625, 0.5172119140625, 1.025634765625, 1.5340576171875, 2.04248046875, 2.5509033203125, 3.059326171875, 3.5677490234375, 4.076171875, 4.5845947265625, 5.093017578125, 5.6014404296875, 6.10986328125, 6.6182861328125, 7.126708984375, 7.6351318359375, 8.1435546875, 8.6519775390625, 9.160400390625, 9.6688232421875, 10.17724609375, 10.6856689453125, 11.194091796875, 11.7025146484375, 12.2109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 17.0, 19.0, 25.0, 29.0, 43.0, 62.0, 97.0, 126.0, 197.0, 388.0, 877.0, 3427.0, 33745.0, 1341233.0, 2747850.0, 59150.0, 4779.0, 1047.0, 451.0, 211.0, 152.0, 79.0, 71.0, 52.0, 38.0, 23.0, 18.0, 16.0, 5.0, 8.0, 13.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.404296875, -28.27734375, -27.150390625, -26.0234375, -24.896484375, -23.76953125, -22.642578125, -21.515625, -20.388671875, -19.26171875, -18.134765625, -17.0078125, -15.880859375, -14.75390625, -13.626953125, -12.5, -11.373046875, -10.24609375, -9.119140625, -7.9921875, -6.865234375, -5.73828125, -4.611328125, -3.484375, -2.357421875, -1.23046875, -0.103515625, 1.0234375, 2.150390625, 3.27734375, 4.404296875, 5.53125, 6.658203125, 7.78515625, 8.912109375, 10.0390625, 11.166015625, 12.29296875, 13.419921875, 14.546875, 15.673828125, 16.80078125, 17.927734375, 19.0546875, 20.181640625, 21.30859375, 22.435546875, 23.5625, 24.689453125, 25.81640625, 26.943359375, 28.0703125, 29.197265625, 30.32421875, 31.451171875, 32.578125, 33.705078125, 34.83203125, 35.958984375, 37.0859375, 38.212890625, 39.33984375, 40.466796875, 41.59375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 30.0, 142.0, 363.0, 322.0, 132.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.1250305175781, -283.5070495605469, -276.8890686035156, -270.2710876464844, -263.6531066894531, -257.03515625, -250.4171600341797, -243.79917907714844, -237.18121337890625, -230.563232421875, -223.94525146484375, -217.3272705078125, -210.7093048095703, -204.09132385253906, -197.4733428955078, -190.85536193847656, -184.2373809814453, -177.61940002441406, -171.0014190673828, -164.38345336914062, -157.76547241210938, -151.14749145507812, -144.52951049804688, -137.91152954101562, -131.29354858398438, -124.67556762695312, -118.0575942993164, -111.43961334228516, -104.82164001464844, -98.20365905761719, -91.58567810058594, -84.96769714355469, -78.34971618652344, -71.73173522949219, -65.11376190185547, -58.49578094482422, -51.877803802490234, -45.25982666015625, -38.641845703125, -32.023868560791016, -25.40589141845703, -18.787914276123047, -12.16993522644043, -5.5519561767578125, 1.0660209655761719, 7.683998107910156, 14.301979064941406, 20.91995620727539, 27.537933349609375, 34.15591049194336, 40.773887634277344, 47.391868591308594, 54.00984573364258, 60.62782287597656, 67.24580383300781, 73.86378479003906, 80.48175811767578, 87.09973907470703, 93.71771240234375, 100.335693359375, 106.95367431640625, 113.57164764404297, 120.18962860107422, 126.80760192871094, 133.4255828857422]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 15.0, 8.0, 6.0, 13.0, 13.0, 22.0, 22.0, 26.0, 26.0, 23.0, 30.0, 32.0, 32.0, 38.0, 28.0, 34.0, 46.0, 47.0, 31.0, 46.0, 41.0, 43.0, 40.0, 30.0, 39.0, 37.0, 31.0, 33.0, 21.0, 20.0, 18.0, 16.0, 19.0, 15.0, 13.0, 6.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.915924072265625, -41.523773193359375, -40.131622314453125, -38.739471435546875, -37.347320556640625, -35.95517349243164, -34.56302261352539, -33.17087173461914, -31.77872085571289, -30.38656997680664, -28.99441909790039, -27.602270126342773, -26.210119247436523, -24.817968368530273, -23.425819396972656, -22.033668518066406, -20.641517639160156, -19.249366760253906, -17.857215881347656, -16.46506690979004, -15.072916030883789, -13.680765151977539, -12.288615226745605, -10.896465301513672, -9.504314422607422, -8.112163543701172, -6.720013618469238, -5.3278632164001465, -3.9357128143310547, -2.543562412261963, -1.151412010192871, 0.2407379150390625, 1.6328887939453125, 3.0250391960144043, 4.417189598083496, 5.809340000152588, 7.20149040222168, 8.59364128112793, 9.985791206359863, 11.377941131591797, 12.770092010498047, 14.162242889404297, 15.55439281463623, 16.946542739868164, 18.338693618774414, 19.730844497680664, 21.12299346923828, 22.51514434814453, 23.90729522705078, 25.29944610595703, 26.69159698486328, 28.0837459564209, 29.47589683532715, 30.8680477142334, 32.260196685791016, 33.652347564697266, 35.044498443603516, 36.436649322509766, 37.828800201416016, 39.220951080322266, 40.61309814453125, 42.0052490234375, 43.39739990234375, 44.78955078125, 46.18170166015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 38.0, 29.0, 27.0, 24.0, 27.0, 22.0, 12.0, 16.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 21.0, 31.0, 55.0, 77.0, 113.0, 190.0, 257.0, 354.0, 530.0, 762.0, 1239.0, 1750.0, 2666.0, 4017.0, 5923.0, 8961.0, 13594.0, 20748.0, 31690.0, 49608.0, 76277.0, 113127.0, 152441.0, 164121.0, 132015.0, 93086.0, 60885.0, 39174.0, 25624.0, 16589.0, 10822.0, 7201.0, 4867.0, 3185.0, 2163.0, 1411.0, 977.0, 668.0, 415.0, 291.0, 201.0, 126.0, 98.0, 64.0, 49.0, 30.0, 11.0, 12.0, 7.0, 13.0, 2.0, 4.0], "bins": [-0.51025390625, -0.4957733154296875, -0.481292724609375, -0.4668121337890625, -0.45233154296875, -0.4378509521484375, -0.423370361328125, -0.4088897705078125, -0.3944091796875, -0.3799285888671875, -0.365447998046875, -0.3509674072265625, -0.33648681640625, -0.3220062255859375, -0.307525634765625, -0.2930450439453125, -0.278564453125, -0.2640838623046875, -0.249603271484375, -0.2351226806640625, -0.22064208984375, -0.2061614990234375, -0.191680908203125, -0.1772003173828125, -0.1627197265625, -0.1482391357421875, -0.133758544921875, -0.1192779541015625, -0.10479736328125, -0.0903167724609375, -0.075836181640625, -0.0613555908203125, -0.046875, -0.0323944091796875, -0.017913818359375, -0.0034332275390625, 0.01104736328125, 0.0255279541015625, 0.040008544921875, 0.0544891357421875, 0.0689697265625, 0.0834503173828125, 0.097930908203125, 0.1124114990234375, 0.12689208984375, 0.1413726806640625, 0.155853271484375, 0.1703338623046875, 0.184814453125, 0.1992950439453125, 0.213775634765625, 0.2282562255859375, 0.24273681640625, 0.2572174072265625, 0.271697998046875, 0.2861785888671875, 0.3006591796875, 0.3151397705078125, 0.329620361328125, 0.3441009521484375, 0.35858154296875, 0.3730621337890625, 0.387542724609375, 0.4020233154296875, 0.41650390625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 17.0, 7.0, 11.0, 17.0, 22.0, 17.0, 29.0, 30.0, 29.0, 30.0, 34.0, 42.0, 50.0, 33.0, 47.0, 40.0, 1065.0, 33.0, 37.0, 34.0, 43.0, 37.0, 31.0, 37.0, 31.0, 26.0, 28.0, 18.0, 31.0, 11.0, 13.0, 19.0, 9.0, 7.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-3.93359375, -3.8292236328125, -3.724853515625, -3.6204833984375, -3.51611328125, -3.4117431640625, -3.307373046875, -3.2030029296875, -3.0986328125, -2.9942626953125, -2.889892578125, -2.7855224609375, -2.68115234375, -2.5767822265625, -2.472412109375, -2.3680419921875, -2.263671875, -2.1593017578125, -2.054931640625, -1.9505615234375, -1.84619140625, -1.7418212890625, -1.637451171875, -1.5330810546875, -1.4287109375, -1.3243408203125, -1.219970703125, -1.1156005859375, -1.01123046875, -0.9068603515625, -0.802490234375, -0.6981201171875, -0.59375, -0.4893798828125, -0.385009765625, -0.2806396484375, -0.17626953125, -0.0718994140625, 0.032470703125, 0.1368408203125, 0.2412109375, 0.3455810546875, 0.449951171875, 0.5543212890625, 0.65869140625, 0.7630615234375, 0.867431640625, 0.9718017578125, 1.076171875, 1.1805419921875, 1.284912109375, 1.3892822265625, 1.49365234375, 1.5980224609375, 1.702392578125, 1.8067626953125, 1.9111328125, 2.0155029296875, 2.119873046875, 2.2242431640625, 2.32861328125, 2.4329833984375, 2.537353515625, 2.6417236328125, 2.74609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 12.0, 10.0, 31.0, 34.0, 83.0, 106.0, 166.0, 276.0, 434.0, 701.0, 1065.0, 1837.0, 2882.0, 4471.0, 7062.0, 10878.0, 16859.0, 25970.0, 40017.0, 61382.0, 92321.0, 130035.0, 1200742.0, 154481.0, 116473.0, 79995.0, 52644.0, 34136.0, 22217.0, 14269.0, 9221.0, 5895.0, 3897.0, 2435.0, 1528.0, 995.0, 567.0, 357.0, 233.0, 138.0, 103.0, 55.0, 43.0, 26.0, 17.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3671875, -0.3559989929199219, -0.34481048583984375, -0.3336219787597656, -0.3224334716796875, -0.3112449645996094, -0.30005645751953125, -0.2888679504394531, -0.277679443359375, -0.2664909362792969, -0.25530242919921875, -0.24411392211914062, -0.2329254150390625, -0.22173690795898438, -0.21054840087890625, -0.19935989379882812, -0.18817138671875, -0.17698287963867188, -0.16579437255859375, -0.15460586547851562, -0.1434173583984375, -0.13222885131835938, -0.12104034423828125, -0.10985183715820312, -0.098663330078125, -0.08747482299804688, -0.07628631591796875, -0.06509780883789062, -0.0539093017578125, -0.042720794677734375, -0.03153228759765625, -0.020343780517578125, -0.0091552734375, 0.002033233642578125, 0.01322174072265625, 0.024410247802734375, 0.0355987548828125, 0.046787261962890625, 0.05797576904296875, 0.06916427612304688, 0.080352783203125, 0.09154129028320312, 0.10272979736328125, 0.11391830444335938, 0.1251068115234375, 0.13629531860351562, 0.14748382568359375, 0.15867233276367188, 0.16986083984375, 0.18104934692382812, 0.19223785400390625, 0.20342636108398438, 0.2146148681640625, 0.22580337524414062, 0.23699188232421875, 0.24818038940429688, 0.259368896484375, 0.2705574035644531, 0.28174591064453125, 0.2929344177246094, 0.3041229248046875, 0.3153114318847656, 0.32649993896484375, 0.3376884460449219, 0.348876953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 2.0, 5.0, 3.0, 7.0, 10.0, 14.0, 16.0, 20.0, 23.0, 21.0, 25.0, 37.0, 42.0, 50.0, 76.0, 82.0, 78.0, 73.0, 68.0, 53.0, 43.0, 50.0, 32.0, 29.0, 32.0, 14.0, 19.0, 10.0, 9.0, 11.0, 8.0, 6.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029582977294921875, -0.0028679370880126953, -0.002777576446533203, -0.002687215805053711, -0.0025968551635742188, -0.0025064945220947266, -0.0024161338806152344, -0.002325773239135742, -0.00223541259765625, -0.002145051956176758, -0.0020546913146972656, -0.0019643306732177734, -0.0018739700317382812, -0.001783609390258789, -0.0016932487487792969, -0.0016028881072998047, -0.0015125274658203125, -0.0014221668243408203, -0.0013318061828613281, -0.001241445541381836, -0.0011510848999023438, -0.0010607242584228516, -0.0009703636169433594, -0.0008800029754638672, -0.000789642333984375, -0.0006992816925048828, -0.0006089210510253906, -0.0005185604095458984, -0.00042819976806640625, -0.00033783912658691406, -0.0002474784851074219, -0.0001571178436279297, -6.67572021484375e-05, 2.3603439331054688e-05, 0.00011396408081054688, 0.00020432472229003906, 0.00029468536376953125, 0.00038504600524902344, 0.0004754066467285156, 0.0005657672882080078, 0.0006561279296875, 0.0007464885711669922, 0.0008368492126464844, 0.0009272098541259766, 0.0010175704956054688, 0.001107931137084961, 0.0011982917785644531, 0.0012886524200439453, 0.0013790130615234375, 0.0014693737030029297, 0.0015597343444824219, 0.001650094985961914, 0.0017404556274414062, 0.0018308162689208984, 0.0019211769104003906, 0.002011537551879883, 0.002101898193359375, 0.002192258834838867, 0.0022826194763183594, 0.0023729801177978516, 0.0024633407592773438, 0.002553701400756836, 0.002644062042236328, 0.0027344226837158203, 0.0028247833251953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 7.0, 12.0, 11.0, 6.0, 19.0, 31.0, 41.0, 49.0, 62.0, 107.0, 167.0, 263.0, 470.0, 1367.0, 215607.0, 826420.0, 2439.0, 550.0, 293.0, 187.0, 133.0, 74.0, 48.0, 43.0, 26.0, 24.0, 16.0, 15.0, 8.0, 5.0, 10.0, 6.0, 6.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05712890625, -0.055350303649902344, -0.05357170104980469, -0.05179309844970703, -0.050014495849609375, -0.04823589324951172, -0.04645729064941406, -0.044678688049316406, -0.04290008544921875, -0.041121482849121094, -0.03934288024902344, -0.03756427764892578, -0.035785675048828125, -0.03400707244873047, -0.03222846984863281, -0.030449867248535156, -0.0286712646484375, -0.026892662048339844, -0.025114059448242188, -0.02333545684814453, -0.021556854248046875, -0.01977825164794922, -0.017999649047851562, -0.016221046447753906, -0.01444244384765625, -0.012663841247558594, -0.010885238647460938, -0.009106636047363281, -0.007328033447265625, -0.005549430847167969, -0.0037708282470703125, -0.0019922256469726562, -0.000213623046875, 0.0015649795532226562, 0.0033435821533203125, 0.005122184753417969, 0.006900787353515625, 0.008679389953613281, 0.010457992553710938, 0.012236595153808594, 0.01401519775390625, 0.015793800354003906, 0.017572402954101562, 0.01935100555419922, 0.021129608154296875, 0.02290821075439453, 0.024686813354492188, 0.026465415954589844, 0.0282440185546875, 0.030022621154785156, 0.03180122375488281, 0.03357982635498047, 0.035358428955078125, 0.03713703155517578, 0.03891563415527344, 0.040694236755371094, 0.04247283935546875, 0.044251441955566406, 0.04603004455566406, 0.04780864715576172, 0.049587249755859375, 0.05136585235595703, 0.05314445495605469, 0.054923057556152344, 0.05670166015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 167.0, 644.0, 180.0, 14.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006655517499893904, -0.006295669823884964, -0.005935822147876024, -0.0055759744718670845, -0.005216127261519432, -0.004856279119849205, -0.004496431909501553, -0.004136584233492613, -0.003776736557483673, -0.0034168888814747334, -0.0030570412054657936, -0.0026971937622874975, -0.0023373460862785578, -0.001977498410269618, -0.001617650967091322, -0.0012578032910823822, -0.0008979556150734425, -0.0005381079972721636, -0.0001782603794708848, 0.00018158718012273312, 0.0005414348561316729, 0.0009012825321406126, 0.0012611299753189087, 0.0016209776513278484, 0.001980825327336788, 0.002340673003345728, 0.0027005206793546677, 0.0030603681225329638, 0.0034202157985419035, 0.0037800634745508432, 0.004139910917729139, 0.004499758593738079, 0.0048596058040857315, 0.005219453480094671, 0.005579301156103611, 0.005939148366451263, 0.0062989965081214905, 0.006658843718469143, 0.007018691394478083, 0.007378539070487022, 0.007738386746495962, 0.008098234422504902, 0.008458081632852554, 0.008817929774522781, 0.009177776984870434, 0.00953762512654066, 0.009897472336888313, 0.01025732047855854, 0.010617167688906193, 0.010977014899253845, 0.011336863040924072, 0.011696710251271725, 0.012056558392941952, 0.012416405603289604, 0.012776253744959831, 0.013136100955307484, 0.013495948165655136, 0.013855795376002789, 0.014215643517673016, 0.014575490728020668, 0.014935338869690895, 0.015295186080038548, 0.0156550332903862, 0.016014881432056427, 0.016374729573726654]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 14.0, 16.0, 17.0, 30.0, 44.0, 39.0, 34.0, 60.0, 53.0, 32.0, 53.0, 47.0, 48.0, 52.0, 53.0, 45.0, 44.0, 31.0, 38.0, 33.0, 31.0, 27.0, 17.0, 17.0, 22.0, 8.0, 14.0, 11.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020488500595092773, -0.0019908715039491653, -0.0019328929483890533, -0.0018749143928289413, -0.0018169358372688293, -0.0017589572817087173, -0.0017009787261486053, -0.0016430001705884933, -0.0015850216150283813, -0.0015270430594682693, -0.0014690645039081573, -0.0014110859483480453, -0.0013531073927879333, -0.0012951288372278214, -0.0012371502816677094, -0.0011791717261075974, -0.0011211931705474854, -0.0010632146149873734, -0.0010052360594272614, -0.0009472575038671494, -0.0008892789483070374, -0.0008313003927469254, -0.0007733218371868134, -0.0007153432816267014, -0.0006573647260665894, -0.0005993861705064774, -0.0005414076149463654, -0.00048342905938625336, -0.00042545050382614136, -0.00036747194826602936, -0.00030949339270591736, -0.00025151483714580536, -0.00019353628158569336, -0.00013555772602558136, -7.757917046546936e-05, -1.960061490535736e-05, 3.837794065475464e-05, 9.635649621486664e-05, 0.00015433505177497864, 0.00021231360733509064, 0.00027029216289520264, 0.00032827071845531464, 0.00038624927401542664, 0.00044422782957553864, 0.0005022063851356506, 0.0005601849406957626, 0.0006181634962558746, 0.0006761420518159866, 0.0007341206073760986, 0.0007920991629362106, 0.0008500777184963226, 0.0009080562740564346, 0.0009660348296165466, 0.0010240133851766586, 0.0010819919407367706, 0.0011399704962968826, 0.0011979490518569946, 0.0012559276074171066, 0.0013139061629772186, 0.0013718847185373306, 0.0014298632740974426, 0.0014878418296575546, 0.0015458203852176666, 0.0016037989407777786, 0.0016617774963378906]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 37.0, 30.0, 27.0, 24.0, 27.0, 22.0, 13.0, 15.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 18.0, 35.0, 50.0, 72.0, 117.0, 164.0, 243.0, 340.0, 527.0, 783.0, 1165.0, 1789.0, 2696.0, 4143.0, 6642.0, 12243.0, 26342.0, 74168.0, 315040.0, 438492.0, 96693.0, 31905.0, 14274.0, 7476.0, 4440.0, 2865.0, 1891.0, 1257.0, 781.0, 585.0, 404.0, 290.0, 180.0, 130.0, 73.0, 59.0, 41.0, 34.0, 28.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.2032470703125, -4.058837890625, -3.9144287109375, -3.77001953125, -3.6256103515625, -3.481201171875, -3.3367919921875, -3.1923828125, -3.0479736328125, -2.903564453125, -2.7591552734375, -2.61474609375, -2.4703369140625, -2.325927734375, -2.1815185546875, -2.037109375, -1.8927001953125, -1.748291015625, -1.6038818359375, -1.45947265625, -1.3150634765625, -1.170654296875, -1.0262451171875, -0.8818359375, -0.7374267578125, -0.593017578125, -0.4486083984375, -0.30419921875, -0.1597900390625, -0.015380859375, 0.1290283203125, 0.2734375, 0.4178466796875, 0.562255859375, 0.7066650390625, 0.85107421875, 0.9954833984375, 1.139892578125, 1.2843017578125, 1.4287109375, 1.5731201171875, 1.717529296875, 1.8619384765625, 2.00634765625, 2.1507568359375, 2.295166015625, 2.4395751953125, 2.583984375, 2.7283935546875, 2.872802734375, 3.0172119140625, 3.16162109375, 3.3060302734375, 3.450439453125, 3.5948486328125, 3.7392578125, 3.8836669921875, 4.028076171875, 4.1724853515625, 4.31689453125, 4.4613037109375, 4.605712890625, 4.7501220703125, 4.89453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 11.0, 5.0, 10.0, 16.0, 24.0, 23.0, 25.0, 24.0, 40.0, 30.0, 35.0, 36.0, 37.0, 52.0, 85.0, 176.0, 1699.0, 210.0, 79.0, 53.0, 41.0, 40.0, 34.0, 30.0, 24.0, 36.0, 26.0, 25.0, 15.0, 23.0, 12.0, 15.0, 6.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-21.859375, -21.27783203125, -20.6962890625, -20.11474609375, -19.533203125, -18.95166015625, -18.3701171875, -17.78857421875, -17.20703125, -16.62548828125, -16.0439453125, -15.46240234375, -14.880859375, -14.29931640625, -13.7177734375, -13.13623046875, -12.5546875, -11.97314453125, -11.3916015625, -10.81005859375, -10.228515625, -9.64697265625, -9.0654296875, -8.48388671875, -7.90234375, -7.32080078125, -6.7392578125, -6.15771484375, -5.576171875, -4.99462890625, -4.4130859375, -3.83154296875, -3.25, -2.66845703125, -2.0869140625, -1.50537109375, -0.923828125, -0.34228515625, 0.2392578125, 0.82080078125, 1.40234375, 1.98388671875, 2.5654296875, 3.14697265625, 3.728515625, 4.31005859375, 4.8916015625, 5.47314453125, 6.0546875, 6.63623046875, 7.2177734375, 7.79931640625, 8.380859375, 8.96240234375, 9.5439453125, 10.12548828125, 10.70703125, 11.28857421875, 11.8701171875, 12.45166015625, 13.033203125, 13.61474609375, 14.1962890625, 14.77783203125, 15.359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 12.0, 13.0, 13.0, 24.0, 28.0, 39.0, 57.0, 97.0, 113.0, 204.0, 374.0, 1153.0, 18679.0, 3091759.0, 30707.0, 1394.0, 366.0, 218.0, 122.0, 94.0, 63.0, 43.0, 36.0, 22.0, 12.0, 16.0, 8.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.28125, -40.8505859375, -39.419921875, -37.9892578125, -36.55859375, -35.1279296875, -33.697265625, -32.2666015625, -30.8359375, -29.4052734375, -27.974609375, -26.5439453125, -25.11328125, -23.6826171875, -22.251953125, -20.8212890625, -19.390625, -17.9599609375, -16.529296875, -15.0986328125, -13.66796875, -12.2373046875, -10.806640625, -9.3759765625, -7.9453125, -6.5146484375, -5.083984375, -3.6533203125, -2.22265625, -0.7919921875, 0.638671875, 2.0693359375, 3.5, 4.9306640625, 6.361328125, 7.7919921875, 9.22265625, 10.6533203125, 12.083984375, 13.5146484375, 14.9453125, 16.3759765625, 17.806640625, 19.2373046875, 20.66796875, 22.0986328125, 23.529296875, 24.9599609375, 26.390625, 27.8212890625, 29.251953125, 30.6826171875, 32.11328125, 33.5439453125, 34.974609375, 36.4052734375, 37.8359375, 39.2666015625, 40.697265625, 42.1279296875, 43.55859375, 44.9892578125, 46.419921875, 47.8505859375, 49.28125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 59.0, 307.0, 457.0, 161.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.2296371459961, -80.72634887695312, -78.22306823730469, -75.71977996826172, -73.21649932861328, -70.71321105957031, -68.20993041992188, -65.7066421508789, -63.2033576965332, -60.7000732421875, -58.1967887878418, -55.693504333496094, -53.190216064453125, -50.68693542480469, -48.18364715576172, -45.680362701416016, -43.17707824707031, -40.67379379272461, -38.170509338378906, -35.6672248840332, -33.1639404296875, -30.660654067993164, -28.157367706298828, -25.654083251953125, -23.150798797607422, -20.64751434326172, -18.144229888916016, -15.64094352722168, -13.137659072875977, -10.634374618530273, -8.131089210510254, -5.627803802490234, -3.1245193481445312, -0.6212344169616699, 1.8820505142211914, 4.385335445404053, 6.888620376586914, 9.391904830932617, 11.895190238952637, 14.398475646972656, 16.90176010131836, 19.405044555664062, 21.908329010009766, 24.4116153717041, 26.914899826049805, 29.418184280395508, 31.921470642089844, 34.42475509643555, 36.92803955078125, 39.43132400512695, 41.934608459472656, 44.43789291381836, 46.94117736816406, 49.44446563720703, 51.947750091552734, 54.45103454589844, 56.95431900024414, 59.457603454589844, 61.96088790893555, 64.46417236328125, 66.96746063232422, 69.47074127197266, 71.97402954101562, 74.47731018066406, 76.98059844970703]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 8.0, 10.0, 6.0, 17.0, 16.0, 20.0, 24.0, 16.0, 27.0, 23.0, 34.0, 32.0, 39.0, 44.0, 32.0, 38.0, 31.0, 31.0, 43.0, 52.0, 44.0, 32.0, 29.0, 41.0, 31.0, 42.0, 33.0, 28.0, 19.0, 17.0, 26.0, 24.0, 12.0, 9.0, 13.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.48713302612305, -49.892730712890625, -48.29833221435547, -46.70392990112305, -45.10953140258789, -43.51512908935547, -41.92073059082031, -40.32632827758789, -38.73192596435547, -37.13752365112305, -35.54312515258789, -33.94872283935547, -32.35432434082031, -30.75992202758789, -29.1655216217041, -27.571121215820312, -25.976722717285156, -24.382322311401367, -22.787921905517578, -21.193519592285156, -19.59912109375, -18.004718780517578, -16.41031837463379, -14.81591796875, -13.221517562866211, -11.627117156982422, -10.032716751098633, -8.438315391540527, -6.843914985656738, -5.249514579772949, -3.6551132202148438, -2.0607128143310547, -0.46631622314453125, 1.128084421157837, 2.722485065460205, 4.316885948181152, 5.911286354064941, 7.5056867599487305, 9.100088119506836, 10.694488525390625, 12.288888931274414, 13.883289337158203, 15.477689743041992, 17.07209014892578, 18.666492462158203, 20.26089096069336, 21.85529327392578, 23.44969367980957, 25.04409408569336, 26.63849449157715, 28.232894897460938, 29.82729721069336, 31.421695709228516, 33.01609802246094, 34.610496520996094, 36.204898834228516, 37.79930114746094, 39.39370346069336, 40.988101959228516, 42.58250427246094, 44.176902770996094, 45.771305084228516, 47.36570739746094, 48.960105895996094, 50.55450439453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 1.0, 8.0, 1.0, 5.0, 8.0, 7.0, 11.0, 15.0, 17.0, 18.0, 24.0, 20.0, 22.0, 19.0, 27.0, 27.0, 38.0, 41.0, 34.0, 35.0, 42.0, 47.0, 42.0, 30.0, 38.0, 35.0, 36.0, 38.0, 41.0, 26.0, 29.0, 31.0, 23.0, 29.0, 18.0, 20.0, 17.0, 13.0, 13.0, 13.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.3515625, -5.19842529296875, -5.0452880859375, -4.89215087890625, -4.739013671875, -4.58587646484375, -4.4327392578125, -4.27960205078125, -4.12646484375, -3.97332763671875, -3.8201904296875, -3.66705322265625, -3.513916015625, -3.36077880859375, -3.2076416015625, -3.05450439453125, -2.9013671875, -2.74822998046875, -2.5950927734375, -2.44195556640625, -2.288818359375, -2.13568115234375, -1.9825439453125, -1.82940673828125, -1.67626953125, -1.52313232421875, -1.3699951171875, -1.21685791015625, -1.063720703125, -0.91058349609375, -0.7574462890625, -0.60430908203125, -0.451171875, -0.29803466796875, -0.1448974609375, 0.00823974609375, 0.161376953125, 0.31451416015625, 0.4676513671875, 0.62078857421875, 0.77392578125, 0.92706298828125, 1.0802001953125, 1.23333740234375, 1.386474609375, 1.53961181640625, 1.6927490234375, 1.84588623046875, 1.9990234375, 2.15216064453125, 2.3052978515625, 2.45843505859375, 2.611572265625, 2.76470947265625, 2.9178466796875, 3.07098388671875, 3.22412109375, 3.37725830078125, 3.5303955078125, 3.68353271484375, 3.836669921875, 3.98980712890625, 4.1429443359375, 4.29608154296875, 4.44921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 12.0, 17.0, 22.0, 30.0, 24.0, 43.0, 75.0, 98.0, 162.0, 214.0, 379.0, 527.0, 935.0, 1569.0, 2748.0, 5162.0, 10019.0, 21319.0, 50931.0, 151626.0, 528431.0, 1302299.0, 1321608.0, 542995.0, 157475.0, 52142.0, 21543.0, 10013.0, 5059.0, 2756.0, 1562.0, 946.0, 528.0, 336.0, 214.0, 145.0, 83.0, 56.0, 53.0, 22.0, 29.0, 24.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.25, -6.0606689453125, -5.871337890625, -5.6820068359375, -5.49267578125, -5.3033447265625, -5.114013671875, -4.9246826171875, -4.7353515625, -4.5460205078125, -4.356689453125, -4.1673583984375, -3.97802734375, -3.7886962890625, -3.599365234375, -3.4100341796875, -3.220703125, -3.0313720703125, -2.842041015625, -2.6527099609375, -2.46337890625, -2.2740478515625, -2.084716796875, -1.8953857421875, -1.7060546875, -1.5167236328125, -1.327392578125, -1.1380615234375, -0.94873046875, -0.7593994140625, -0.570068359375, -0.3807373046875, -0.19140625, -0.0020751953125, 0.187255859375, 0.3765869140625, 0.56591796875, 0.7552490234375, 0.944580078125, 1.1339111328125, 1.3232421875, 1.5125732421875, 1.701904296875, 1.8912353515625, 2.08056640625, 2.2698974609375, 2.459228515625, 2.6485595703125, 2.837890625, 3.0272216796875, 3.216552734375, 3.4058837890625, 3.59521484375, 3.7845458984375, 3.973876953125, 4.1632080078125, 4.3525390625, 4.5418701171875, 4.731201171875, 4.9205322265625, 5.10986328125, 5.2991943359375, 5.488525390625, 5.6778564453125, 5.8671875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 18.0, 29.0, 37.0, 54.0, 63.0, 105.0, 119.0, 181.0, 228.0, 274.0, 450.0, 502.0, 471.0, 423.0, 291.0, 214.0, 171.0, 134.0, 87.0, 56.0, 41.0, 32.0, 26.0, 13.0, 11.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.2310791015625, -10.798095703125, -10.3651123046875, -9.93212890625, -9.4991455078125, -9.066162109375, -8.6331787109375, -8.2001953125, -7.7672119140625, -7.334228515625, -6.9012451171875, -6.46826171875, -6.0352783203125, -5.602294921875, -5.1693115234375, -4.736328125, -4.3033447265625, -3.870361328125, -3.4373779296875, -3.00439453125, -2.5714111328125, -2.138427734375, -1.7054443359375, -1.2724609375, -0.8394775390625, -0.406494140625, 0.0264892578125, 0.45947265625, 0.8924560546875, 1.325439453125, 1.7584228515625, 2.19140625, 2.6243896484375, 3.057373046875, 3.4903564453125, 3.92333984375, 4.3563232421875, 4.789306640625, 5.2222900390625, 5.6552734375, 6.0882568359375, 6.521240234375, 6.9542236328125, 7.38720703125, 7.8201904296875, 8.253173828125, 8.6861572265625, 9.119140625, 9.5521240234375, 9.985107421875, 10.4180908203125, 10.85107421875, 11.2840576171875, 11.717041015625, 12.1500244140625, 12.5830078125, 13.0159912109375, 13.448974609375, 13.8819580078125, 14.31494140625, 14.7479248046875, 15.180908203125, 15.6138916015625, 16.046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 12.0, 18.0, 24.0, 49.0, 46.0, 70.0, 96.0, 145.0, 244.0, 405.0, 1084.0, 5460.0, 107353.0, 3670372.0, 393710.0, 12117.0, 1648.0, 558.0, 283.0, 177.0, 112.0, 82.0, 62.0, 39.0, 28.0, 22.0, 15.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.5625, -26.34619140625, -25.1298828125, -23.91357421875, -22.697265625, -21.48095703125, -20.2646484375, -19.04833984375, -17.83203125, -16.61572265625, -15.3994140625, -14.18310546875, -12.966796875, -11.75048828125, -10.5341796875, -9.31787109375, -8.1015625, -6.88525390625, -5.6689453125, -4.45263671875, -3.236328125, -2.02001953125, -0.8037109375, 0.41259765625, 1.62890625, 2.84521484375, 4.0615234375, 5.27783203125, 6.494140625, 7.71044921875, 8.9267578125, 10.14306640625, 11.359375, 12.57568359375, 13.7919921875, 15.00830078125, 16.224609375, 17.44091796875, 18.6572265625, 19.87353515625, 21.08984375, 22.30615234375, 23.5224609375, 24.73876953125, 25.955078125, 27.17138671875, 28.3876953125, 29.60400390625, 30.8203125, 32.03662109375, 33.2529296875, 34.46923828125, 35.685546875, 36.90185546875, 38.1181640625, 39.33447265625, 40.55078125, 41.76708984375, 42.9833984375, 44.19970703125, 45.416015625, 46.63232421875, 47.8486328125, 49.06494140625, 50.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 20.0, 27.0, 45.0, 72.0, 108.0, 152.0, 153.0, 152.0, 113.0, 61.0, 44.0, 30.0, 19.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.60558319091797, -121.05137634277344, -118.49716186523438, -115.94295501708984, -113.38874816894531, -110.83454132080078, -108.28033447265625, -105.72611999511719, -103.17191314697266, -100.61770629882812, -98.06349182128906, -95.50928497314453, -92.955078125, -90.40087127685547, -87.84666442871094, -85.29244995117188, -82.73824310302734, -80.18403625488281, -77.62982177734375, -75.07561492919922, -72.52140808105469, -69.96720123291016, -67.41299438476562, -64.85877990722656, -62.30457305908203, -59.7503662109375, -57.1961555480957, -54.641944885253906, -52.087738037109375, -49.533531188964844, -46.97932052612305, -44.42510986328125, -41.87089538574219, -39.316688537597656, -36.76247787475586, -34.20826721191406, -31.65406036376953, -29.099851608276367, -26.545642852783203, -23.99143409729004, -21.437225341796875, -18.88301658630371, -16.328807830810547, -13.774599075317383, -11.220390319824219, -8.666181564331055, -6.111972808837891, -3.5577640533447266, -1.0035552978515625, 1.5506534576416016, 4.104862213134766, 6.65907096862793, 9.213279724121094, 11.767488479614258, 14.321697235107422, 16.875905990600586, 19.43011474609375, 21.984323501586914, 24.538532257080078, 27.092741012573242, 29.646949768066406, 32.20115661621094, 34.755367279052734, 37.30957794189453, 39.86378479003906]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 6.0, 2.0, 9.0, 8.0, 10.0, 6.0, 16.0, 14.0, 14.0, 23.0, 26.0, 14.0, 21.0, 24.0, 24.0, 29.0, 23.0, 35.0, 41.0, 36.0, 29.0, 46.0, 43.0, 36.0, 44.0, 37.0, 38.0, 41.0, 30.0, 34.0, 34.0, 20.0, 16.0, 21.0, 23.0, 15.0, 13.0, 16.0, 11.0, 7.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.10260009765625, -36.93830108642578, -35.77400207519531, -34.60970687866211, -33.44540786743164, -32.28110885620117, -31.116811752319336, -29.9525146484375, -28.78821563720703, -27.623916625976562, -26.459619522094727, -25.29532241821289, -24.131023406982422, -22.966724395751953, -21.802427291870117, -20.63813018798828, -19.473831176757812, -18.309532165527344, -17.145235061645508, -15.980937004089355, -14.816638946533203, -13.65234088897705, -12.488042831420898, -11.323744773864746, -10.159446716308594, -8.995148658752441, -7.830850601196289, -6.666552543640137, -5.502254486083984, -4.337956428527832, -3.1736583709716797, -2.0093603134155273, -0.845062255859375, 0.31923580169677734, 1.4835338592529297, 2.647831916809082, 3.8121299743652344, 4.976428031921387, 6.140726089477539, 7.305024147033691, 8.469322204589844, 9.633620262145996, 10.797918319702148, 11.9622163772583, 13.126514434814453, 14.290812492370605, 15.455110549926758, 16.619407653808594, 17.783706665039062, 18.94800567626953, 20.112302780151367, 21.276599884033203, 22.440898895263672, 23.60519790649414, 24.769495010375977, 25.933792114257812, 27.09809112548828, 28.26239013671875, 29.426687240600586, 30.590984344482422, 31.75528335571289, 32.91958236694336, 34.08387756347656, 35.24817657470703, 36.4124755859375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 42.0, 40.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 13.0, 16.0, 27.0, 39.0, 75.0, 85.0, 144.0, 220.0, 343.0, 562.0, 782.0, 1267.0, 1957.0, 2976.0, 4636.0, 7105.0, 11002.0, 17378.0, 27069.0, 42489.0, 66520.0, 102655.0, 150531.0, 180080.0, 148493.0, 100888.0, 65226.0, 41673.0, 26689.0, 16766.0, 10982.0, 7044.0, 4481.0, 2994.0, 1812.0, 1261.0, 778.0, 521.0, 333.0, 221.0, 145.0, 92.0, 70.0, 39.0, 28.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.54736328125, -0.5305099487304688, -0.5136566162109375, -0.49680328369140625, -0.479949951171875, -0.46309661865234375, -0.4462432861328125, -0.42938995361328125, -0.41253662109375, -0.39568328857421875, -0.3788299560546875, -0.36197662353515625, -0.345123291015625, -0.32826995849609375, -0.3114166259765625, -0.29456329345703125, -0.2777099609375, -0.26085662841796875, -0.2440032958984375, -0.22714996337890625, -0.210296630859375, -0.19344329833984375, -0.1765899658203125, -0.15973663330078125, -0.14288330078125, -0.12602996826171875, -0.1091766357421875, -0.09232330322265625, -0.075469970703125, -0.05861663818359375, -0.0417633056640625, -0.02490997314453125, -0.008056640625, 0.00879669189453125, 0.0256500244140625, 0.04250335693359375, 0.059356689453125, 0.07621002197265625, 0.0930633544921875, 0.10991668701171875, 0.12677001953125, 0.14362335205078125, 0.1604766845703125, 0.17733001708984375, 0.194183349609375, 0.21103668212890625, 0.2278900146484375, 0.24474334716796875, 0.2615966796875, 0.27845001220703125, 0.2953033447265625, 0.31215667724609375, 0.329010009765625, 0.34586334228515625, 0.3627166748046875, 0.37957000732421875, 0.39642333984375, 0.41327667236328125, 0.4301300048828125, 0.44698333740234375, 0.463836669921875, 0.48069000244140625, 0.4975433349609375, 0.5143966674804688, 0.53125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 11.0, 10.0, 10.0, 15.0, 14.0, 12.0, 19.0, 22.0, 19.0, 21.0, 25.0, 33.0, 26.0, 33.0, 48.0, 40.0, 42.0, 36.0, 1066.0, 49.0, 35.0, 54.0, 44.0, 41.0, 36.0, 23.0, 28.0, 35.0, 28.0, 19.0, 23.0, 18.0, 23.0, 9.0, 16.0, 8.0, 5.0, 6.0, 8.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-3.892578125, -3.78668212890625, -3.6807861328125, -3.57489013671875, -3.468994140625, -3.36309814453125, -3.2572021484375, -3.15130615234375, -3.04541015625, -2.93951416015625, -2.8336181640625, -2.72772216796875, -2.621826171875, -2.51593017578125, -2.4100341796875, -2.30413818359375, -2.1982421875, -2.09234619140625, -1.9864501953125, -1.88055419921875, -1.774658203125, -1.66876220703125, -1.5628662109375, -1.45697021484375, -1.35107421875, -1.24517822265625, -1.1392822265625, -1.03338623046875, -0.927490234375, -0.82159423828125, -0.7156982421875, -0.60980224609375, -0.50390625, -0.39801025390625, -0.2921142578125, -0.18621826171875, -0.080322265625, 0.02557373046875, 0.1314697265625, 0.23736572265625, 0.34326171875, 0.44915771484375, 0.5550537109375, 0.66094970703125, 0.766845703125, 0.87274169921875, 0.9786376953125, 1.08453369140625, 1.1904296875, 1.29632568359375, 1.4022216796875, 1.50811767578125, 1.614013671875, 1.71990966796875, 1.8258056640625, 1.93170166015625, 2.03759765625, 2.14349365234375, 2.2493896484375, 2.35528564453125, 2.461181640625, 2.56707763671875, 2.6729736328125, 2.77886962890625, 2.884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 5.0, 13.0, 8.0, 29.0, 47.0, 44.0, 79.0, 94.0, 188.0, 245.0, 372.0, 552.0, 904.0, 1288.0, 2064.0, 3070.0, 4614.0, 6891.0, 10818.0, 16144.0, 25087.0, 37506.0, 56598.0, 83411.0, 116957.0, 223890.0, 1117129.0, 122062.0, 88863.0, 60573.0, 40381.0, 26397.0, 17427.0, 11332.0, 7484.0, 4846.0, 3329.0, 2184.0, 1436.0, 969.0, 578.0, 390.0, 278.0, 189.0, 119.0, 85.0, 63.0, 34.0, 23.0, 23.0, 14.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.34415435791015625, -0.3330841064453125, -0.32201385498046875, -0.310943603515625, -0.29987335205078125, -0.2888031005859375, -0.27773284912109375, -0.26666259765625, -0.25559234619140625, -0.2445220947265625, -0.23345184326171875, -0.222381591796875, -0.21131134033203125, -0.2002410888671875, -0.18917083740234375, -0.1781005859375, -0.16703033447265625, -0.1559600830078125, -0.14488983154296875, -0.133819580078125, -0.12274932861328125, -0.1116790771484375, -0.10060882568359375, -0.08953857421875, -0.07846832275390625, -0.0673980712890625, -0.05632781982421875, -0.045257568359375, -0.03418731689453125, -0.0231170654296875, -0.01204681396484375, -0.0009765625, 0.01009368896484375, 0.0211639404296875, 0.03223419189453125, 0.043304443359375, 0.05437469482421875, 0.0654449462890625, 0.07651519775390625, 0.08758544921875, 0.09865570068359375, 0.1097259521484375, 0.12079620361328125, 0.131866455078125, 0.14293670654296875, 0.1540069580078125, 0.16507720947265625, 0.1761474609375, 0.18721771240234375, 0.1982879638671875, 0.20935821533203125, 0.220428466796875, 0.23149871826171875, 0.2425689697265625, 0.25363922119140625, 0.26470947265625, 0.27577972412109375, 0.2868499755859375, 0.29792022705078125, 0.308990478515625, 0.32006072998046875, 0.3311309814453125, 0.34220123291015625, 0.353271484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 16.0, 19.0, 11.0, 17.0, 12.0, 24.0, 21.0, 25.0, 38.0, 45.0, 53.0, 73.0, 66.0, 66.0, 75.0, 69.0, 66.0, 54.0, 38.0, 35.0, 31.0, 35.0, 16.0, 11.0, 12.0, 14.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003917694091796875, -0.003775477409362793, -0.003633260726928711, -0.003491044044494629, -0.003348827362060547, -0.003206610679626465, -0.003064393997192383, -0.0029221773147583008, -0.0027799606323242188, -0.0026377439498901367, -0.0024955272674560547, -0.0023533105850219727, -0.0022110939025878906, -0.0020688772201538086, -0.0019266605377197266, -0.0017844438552856445, -0.0016422271728515625, -0.0015000104904174805, -0.0013577938079833984, -0.0012155771255493164, -0.0010733604431152344, -0.0009311437606811523, -0.0007889270782470703, -0.0006467103958129883, -0.0005044937133789062, -0.0003622770309448242, -0.0002200603485107422, -7.784366607666016e-05, 6.437301635742188e-05, 0.0002065896987915039, 0.00034880638122558594, 0.000491023063659668, 0.00063323974609375, 0.000775456428527832, 0.0009176731109619141, 0.001059889793395996, 0.0012021064758300781, 0.0013443231582641602, 0.0014865398406982422, 0.0016287565231323242, 0.0017709732055664062, 0.0019131898880004883, 0.0020554065704345703, 0.0021976232528686523, 0.0023398399353027344, 0.0024820566177368164, 0.0026242733001708984, 0.0027664899826049805, 0.0029087066650390625, 0.0030509233474731445, 0.0031931400299072266, 0.0033353567123413086, 0.0034775733947753906, 0.0036197900772094727, 0.0037620067596435547, 0.0039042234420776367, 0.004046440124511719, 0.004188656806945801, 0.004330873489379883, 0.004473090171813965, 0.004615306854248047, 0.004757523536682129, 0.004899740219116211, 0.005041956901550293, 0.005184173583984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 19.0, 18.0, 24.0, 28.0, 47.0, 66.0, 93.0, 136.0, 178.0, 296.0, 521.0, 2716.0, 823777.0, 217757.0, 1543.0, 449.0, 282.0, 157.0, 127.0, 70.0, 55.0, 34.0, 37.0, 25.0, 21.0, 14.0, 14.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.1013631820678711, -0.09853935241699219, -0.09571552276611328, -0.09289169311523438, -0.09006786346435547, -0.08724403381347656, -0.08442020416259766, -0.08159637451171875, -0.07877254486083984, -0.07594871520996094, -0.07312488555908203, -0.07030105590820312, -0.06747722625732422, -0.06465339660644531, -0.061829566955566406, -0.0590057373046875, -0.056181907653808594, -0.05335807800292969, -0.05053424835205078, -0.047710418701171875, -0.04488658905029297, -0.04206275939941406, -0.039238929748535156, -0.03641510009765625, -0.033591270446777344, -0.030767440795898438, -0.02794361114501953, -0.025119781494140625, -0.02229595184326172, -0.019472122192382812, -0.016648292541503906, -0.013824462890625, -0.011000633239746094, -0.008176803588867188, -0.005352973937988281, -0.002529144287109375, 0.00029468536376953125, 0.0031185150146484375, 0.005942344665527344, 0.00876617431640625, 0.011590003967285156, 0.014413833618164062, 0.01723766326904297, 0.020061492919921875, 0.02288532257080078, 0.025709152221679688, 0.028532981872558594, 0.0313568115234375, 0.034180641174316406, 0.03700447082519531, 0.03982830047607422, 0.042652130126953125, 0.04547595977783203, 0.04829978942871094, 0.051123619079589844, 0.05394744873046875, 0.056771278381347656, 0.05959510803222656, 0.06241893768310547, 0.06524276733398438, 0.06806659698486328, 0.07089042663574219, 0.0737142562866211, 0.0765380859375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 850.0, 151.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0566568598151207, -0.05529935285449028, -0.05394184589385986, -0.052584342658519745, -0.05122683569788933, -0.04986932873725891, -0.048511821776628494, -0.04715431481599808, -0.04579680785536766, -0.044439300894737244, -0.04308179393410683, -0.04172428697347641, -0.04036678373813629, -0.039009276777505875, -0.03765176981687546, -0.03629426285624504, -0.034936755895614624, -0.03357924893498421, -0.03222174197435379, -0.030864236876368523, -0.029506729915738106, -0.028149224817752838, -0.02679171785712242, -0.025434210896492004, -0.024076707661151886, -0.02271920070052147, -0.0213616956025362, -0.020004188641905785, -0.018646681681275368, -0.0172891765832901, -0.015931669622659683, -0.014574162662029266, -0.013216657564043999, -0.011859151534736156, -0.01050164457410574, -0.009144138544797897, -0.007786632049828768, -0.006429125554859638, -0.005071619525551796, -0.003714112564921379, -0.002356606535613537, -0.000999100157059729, 0.00035840622149407864, 0.0017159124836325645, 0.003073418978601694, 0.004430925473570824, 0.005788431502878666, 0.007145938463509083, 0.008503444492816925, 0.009860950522124767, 0.011218457482755184, 0.012575963512063026, 0.013933470472693443, 0.015290976502001286, 0.016648482531309128, 0.018005989491939545, 0.01936349645256996, 0.02072100341320038, 0.022078508511185646, 0.023436015471816063, 0.02479352243244648, 0.026151027530431747, 0.027508534491062164, 0.02886604145169258, 0.03022354654967785]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 21.0, 23.0, 19.0, 35.0, 32.0, 34.0, 43.0, 45.0, 45.0, 42.0, 58.0, 37.0, 53.0, 44.0, 42.0, 42.0, 42.0, 42.0, 41.0, 35.0, 33.0, 27.0, 15.0, 23.0, 20.0, 7.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031978487968444824, -0.0031014643609523773, -0.003005079925060272, -0.002908695489168167, -0.002812311053276062, -0.002715926617383957, -0.002619542181491852, -0.0025231577455997467, -0.0024267733097076416, -0.0023303888738155365, -0.0022340044379234314, -0.0021376200020313263, -0.002041235566139221, -0.001944851130247116, -0.001848466694355011, -0.0017520822584629059, -0.0016556978225708008, -0.0015593133866786957, -0.0014629289507865906, -0.0013665445148944855, -0.0012701600790023804, -0.0011737756431102753, -0.0010773912072181702, -0.000981006771326065, -0.00088462233543396, -0.0007882378995418549, -0.0006918534636497498, -0.0005954690277576447, -0.0004990845918655396, -0.00040270015597343445, -0.00030631572008132935, -0.00020993128418922424, -0.00011354684829711914, -1.7162412405014038e-05, 7.922202348709106e-05, 0.00017560645937919617, 0.00027199089527130127, 0.00036837533116340637, 0.0004647597670555115, 0.0005611442029476166, 0.0006575286388397217, 0.0007539130747318268, 0.0008502975106239319, 0.000946681946516037, 0.001043066382408142, 0.0011394508183002472, 0.0012358352541923523, 0.0013322196900844574, 0.0014286041259765625, 0.0015249885618686676, 0.0016213729977607727, 0.0017177574336528778, 0.001814141869544983, 0.001910526305437088, 0.002006910741329193, 0.0021032951772212982, 0.0021996796131134033, 0.0022960640490055084, 0.0023924484848976135, 0.0024888329207897186, 0.0025852173566818237, 0.002681601792573929, 0.002777986228466034, 0.002874370664358139, 0.002970755100250244]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 41.0, 41.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 4.0, 6.0, 13.0, 24.0, 35.0, 33.0, 79.0, 91.0, 129.0, 187.0, 282.0, 410.0, 537.0, 849.0, 1288.0, 1938.0, 3205.0, 5699.0, 11385.0, 26710.0, 78535.0, 295515.0, 427141.0, 123202.0, 38021.0, 15156.0, 7294.0, 3963.0, 2262.0, 1478.0, 935.0, 651.0, 451.0, 357.0, 225.0, 136.0, 97.0, 71.0, 57.0, 29.0, 27.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.91949462890625, -3.7803955078125, -3.64129638671875, -3.502197265625, -3.36309814453125, -3.2239990234375, -3.08489990234375, -2.94580078125, -2.80670166015625, -2.6676025390625, -2.52850341796875, -2.389404296875, -2.25030517578125, -2.1112060546875, -1.97210693359375, -1.8330078125, -1.69390869140625, -1.5548095703125, -1.41571044921875, -1.276611328125, -1.13751220703125, -0.9984130859375, -0.85931396484375, -0.72021484375, -0.58111572265625, -0.4420166015625, -0.30291748046875, -0.163818359375, -0.02471923828125, 0.1143798828125, 0.25347900390625, 0.392578125, 0.53167724609375, 0.6707763671875, 0.80987548828125, 0.948974609375, 1.08807373046875, 1.2271728515625, 1.36627197265625, 1.50537109375, 1.64447021484375, 1.7835693359375, 1.92266845703125, 2.061767578125, 2.20086669921875, 2.3399658203125, 2.47906494140625, 2.6181640625, 2.75726318359375, 2.8963623046875, 3.03546142578125, 3.174560546875, 3.31365966796875, 3.4527587890625, 3.59185791015625, 3.73095703125, 3.87005615234375, 4.0091552734375, 4.14825439453125, 4.287353515625, 4.42645263671875, 4.5655517578125, 4.70465087890625, 4.84375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 14.0, 15.0, 21.0, 26.0, 28.0, 26.0, 35.0, 33.0, 32.0, 37.0, 43.0, 60.0, 105.0, 345.0, 1569.0, 127.0, 72.0, 42.0, 43.0, 28.0, 34.0, 37.0, 32.0, 22.0, 26.0, 17.0, 19.0, 21.0, 14.0, 11.0, 6.0, 11.0, 6.0, 11.0, 3.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.393310546875, -15.84912109375, -15.304931640625, -14.7607421875, -14.216552734375, -13.67236328125, -13.128173828125, -12.583984375, -12.039794921875, -11.49560546875, -10.951416015625, -10.4072265625, -9.863037109375, -9.31884765625, -8.774658203125, -8.23046875, -7.686279296875, -7.14208984375, -6.597900390625, -6.0537109375, -5.509521484375, -4.96533203125, -4.421142578125, -3.876953125, -3.332763671875, -2.78857421875, -2.244384765625, -1.7001953125, -1.156005859375, -0.61181640625, -0.067626953125, 0.4765625, 1.020751953125, 1.56494140625, 2.109130859375, 2.6533203125, 3.197509765625, 3.74169921875, 4.285888671875, 4.830078125, 5.374267578125, 5.91845703125, 6.462646484375, 7.0068359375, 7.551025390625, 8.09521484375, 8.639404296875, 9.18359375, 9.727783203125, 10.27197265625, 10.816162109375, 11.3603515625, 11.904541015625, 12.44873046875, 12.992919921875, 13.537109375, 14.081298828125, 14.62548828125, 15.169677734375, 15.7138671875, 16.258056640625, 16.80224609375, 17.346435546875, 17.890625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 6.0, 11.0, 12.0, 7.0, 9.0, 19.0, 14.0, 21.0, 35.0, 25.0, 42.0, 55.0, 85.0, 97.0, 107.0, 167.0, 218.0, 376.0, 1278.0, 17145.0, 3054831.0, 67267.0, 2312.0, 523.0, 286.0, 185.0, 118.0, 92.0, 76.0, 52.0, 45.0, 34.0, 25.0, 20.0, 22.0, 10.0, 8.0, 10.0, 5.0, 8.0, 6.0, 8.0, 10.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.84375, -34.74609375, -33.6484375, -32.55078125, -31.453125, -30.35546875, -29.2578125, -28.16015625, -27.0625, -25.96484375, -24.8671875, -23.76953125, -22.671875, -21.57421875, -20.4765625, -19.37890625, -18.28125, -17.18359375, -16.0859375, -14.98828125, -13.890625, -12.79296875, -11.6953125, -10.59765625, -9.5, -8.40234375, -7.3046875, -6.20703125, -5.109375, -4.01171875, -2.9140625, -1.81640625, -0.71875, 0.37890625, 1.4765625, 2.57421875, 3.671875, 4.76953125, 5.8671875, 6.96484375, 8.0625, 9.16015625, 10.2578125, 11.35546875, 12.453125, 13.55078125, 14.6484375, 15.74609375, 16.84375, 17.94140625, 19.0390625, 20.13671875, 21.234375, 22.33203125, 23.4296875, 24.52734375, 25.625, 26.72265625, 27.8203125, 28.91796875, 30.015625, 31.11328125, 32.2109375, 33.30859375, 34.40625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [37.0, 929.0, 49.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.242090225219727, -3.6338396072387695, 2.9744110107421875, 9.582662582397461, 16.1909122467041, 22.799161911010742, 29.40741539001465, 36.015663146972656, 42.62391662597656, 49.2321662902832, 55.840415954589844, 62.44866943359375, 69.05691528320312, 75.66516876220703, 82.27342224121094, 88.88166809082031, 95.48992156982422, 102.09817504882812, 108.7064208984375, 115.3146743774414, 121.92292785644531, 128.5311737060547, 135.13943481445312, 141.7476806640625, 148.35592651367188, 154.96417236328125, 161.5724334716797, 168.18067932128906, 174.78892517089844, 181.39718627929688, 188.00543212890625, 194.61367797851562, 201.221923828125, 207.83016967773438, 214.4384307861328, 221.0466766357422, 227.65492248535156, 234.26318359375, 240.87142944335938, 247.47967529296875, 254.08792114257812, 260.6961669921875, 267.3044128417969, 273.91265869140625, 280.52093505859375, 287.1291809082031, 293.7374267578125, 300.3456726074219, 306.95391845703125, 313.5621643066406, 320.17041015625, 326.7786865234375, 333.3869323730469, 339.99517822265625, 346.6034240722656, 353.211669921875, 359.8199462890625, 366.4281921386719, 373.03643798828125, 379.64471435546875, 386.2529602050781, 392.8612060546875, 399.4694519042969, 406.07769775390625, 412.6859436035156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 9.0, 5.0, 11.0, 7.0, 18.0, 17.0, 21.0, 22.0, 20.0, 17.0, 25.0, 36.0, 38.0, 27.0, 37.0, 45.0, 43.0, 28.0, 37.0, 43.0, 47.0, 35.0, 35.0, 28.0, 36.0, 44.0, 39.0, 31.0, 26.0, 26.0, 24.0, 17.0, 22.0, 15.0, 13.0, 7.0, 10.0, 5.0, 9.0, 5.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-51.54712677001953, -50.032745361328125, -48.51836013793945, -47.00397872924805, -45.489593505859375, -43.97521209716797, -42.46083068847656, -40.94644546508789, -39.43206024169922, -37.91767883300781, -36.40329360961914, -34.888912200927734, -33.37452697753906, -31.860145568847656, -30.345762252807617, -28.831378936767578, -27.316997528076172, -25.802614212036133, -24.288230895996094, -22.773849487304688, -21.259464263916016, -19.74508285522461, -18.23069953918457, -16.71631622314453, -15.201932907104492, -13.687549591064453, -12.173166275024414, -10.658783912658691, -9.144400596618652, -7.630017280578613, -6.115634918212891, -4.601251602172852, -3.0868682861328125, -1.5724852085113525, -0.05810213088989258, 1.4562807083129883, 2.9706640243530273, 4.485047340393066, 5.999429702758789, 7.513813018798828, 9.028196334838867, 10.542579650878906, 12.056962966918945, 13.571345329284668, 15.085728645324707, 16.600112915039062, 18.11449432373047, 19.628877639770508, 21.143260955810547, 22.657644271850586, 24.172027587890625, 25.68640899658203, 27.200794219970703, 28.71517562866211, 30.22955894470215, 31.743942260742188, 33.258323669433594, 34.772705078125, 36.28709030151367, 37.80147171020508, 39.31585693359375, 40.830238342285156, 42.34461975097656, 43.859004974365234, 45.373390197753906]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 8.0, 8.0, 7.0, 8.0, 12.0, 21.0, 24.0, 18.0, 25.0, 27.0, 34.0, 40.0, 39.0, 33.0, 39.0, 53.0, 41.0, 43.0, 34.0, 40.0, 36.0, 37.0, 42.0, 27.0, 46.0, 29.0, 27.0, 20.0, 33.0, 25.0, 19.0, 20.0, 16.0, 12.0, 7.0, 8.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.9609375, -5.78814697265625, -5.6153564453125, -5.44256591796875, -5.269775390625, -5.09698486328125, -4.9241943359375, -4.75140380859375, -4.57861328125, -4.40582275390625, -4.2330322265625, -4.06024169921875, -3.887451171875, -3.71466064453125, -3.5418701171875, -3.36907958984375, -3.1962890625, -3.02349853515625, -2.8507080078125, -2.67791748046875, -2.505126953125, -2.33233642578125, -2.1595458984375, -1.98675537109375, -1.81396484375, -1.64117431640625, -1.4683837890625, -1.29559326171875, -1.122802734375, -0.95001220703125, -0.7772216796875, -0.60443115234375, -0.431640625, -0.25885009765625, -0.0860595703125, 0.08673095703125, 0.259521484375, 0.43231201171875, 0.6051025390625, 0.77789306640625, 0.95068359375, 1.12347412109375, 1.2962646484375, 1.46905517578125, 1.641845703125, 1.81463623046875, 1.9874267578125, 2.16021728515625, 2.3330078125, 2.50579833984375, 2.6785888671875, 2.85137939453125, 3.024169921875, 3.19696044921875, 3.3697509765625, 3.54254150390625, 3.71533203125, 3.88812255859375, 4.0609130859375, 4.23370361328125, 4.406494140625, 4.57928466796875, 4.7520751953125, 4.92486572265625, 5.09765625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 11.0, 16.0, 21.0, 13.0, 21.0, 29.0, 29.0, 45.0, 52.0, 67.0, 96.0, 159.0, 369.0, 2157.0, 26198.0, 1786726.0, 2340829.0, 34047.0, 2370.0, 402.0, 133.0, 107.0, 72.0, 50.0, 46.0, 26.0, 26.0, 28.0, 16.0, 19.0, 14.0, 11.0, 10.0, 8.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-30.796875, -29.9423828125, -29.087890625, -28.2333984375, -27.37890625, -26.5244140625, -25.669921875, -24.8154296875, -23.9609375, -23.1064453125, -22.251953125, -21.3974609375, -20.54296875, -19.6884765625, -18.833984375, -17.9794921875, -17.125, -16.2705078125, -15.416015625, -14.5615234375, -13.70703125, -12.8525390625, -11.998046875, -11.1435546875, -10.2890625, -9.4345703125, -8.580078125, -7.7255859375, -6.87109375, -6.0166015625, -5.162109375, -4.3076171875, -3.453125, -2.5986328125, -1.744140625, -0.8896484375, -0.03515625, 0.8193359375, 1.673828125, 2.5283203125, 3.3828125, 4.2373046875, 5.091796875, 5.9462890625, 6.80078125, 7.6552734375, 8.509765625, 9.3642578125, 10.21875, 11.0732421875, 11.927734375, 12.7822265625, 13.63671875, 14.4912109375, 15.345703125, 16.2001953125, 17.0546875, 17.9091796875, 18.763671875, 19.6181640625, 20.47265625, 21.3271484375, 22.181640625, 23.0361328125, 23.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 12.0, 8.0, 18.0, 23.0, 37.0, 42.0, 54.0, 91.0, 134.0, 161.0, 226.0, 327.0, 405.0, 513.0, 489.0, 427.0, 330.0, 229.0, 155.0, 131.0, 82.0, 59.0, 28.0, 31.0, 14.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.924072265625, -11.49658203125, -11.069091796875, -10.6416015625, -10.214111328125, -9.78662109375, -9.359130859375, -8.931640625, -8.504150390625, -8.07666015625, -7.649169921875, -7.2216796875, -6.794189453125, -6.36669921875, -5.939208984375, -5.51171875, -5.084228515625, -4.65673828125, -4.229248046875, -3.8017578125, -3.374267578125, -2.94677734375, -2.519287109375, -2.091796875, -1.664306640625, -1.23681640625, -0.809326171875, -0.3818359375, 0.045654296875, 0.47314453125, 0.900634765625, 1.328125, 1.755615234375, 2.18310546875, 2.610595703125, 3.0380859375, 3.465576171875, 3.89306640625, 4.320556640625, 4.748046875, 5.175537109375, 5.60302734375, 6.030517578125, 6.4580078125, 6.885498046875, 7.31298828125, 7.740478515625, 8.16796875, 8.595458984375, 9.02294921875, 9.450439453125, 9.8779296875, 10.305419921875, 10.73291015625, 11.160400390625, 11.587890625, 12.015380859375, 12.44287109375, 12.870361328125, 13.2978515625, 13.725341796875, 14.15283203125, 14.580322265625, 15.0078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 12.0, 13.0, 12.0, 21.0, 31.0, 42.0, 54.0, 62.0, 98.0, 139.0, 186.0, 296.0, 547.0, 1692.0, 21048.0, 1729504.0, 2410485.0, 26489.0, 1977.0, 526.0, 315.0, 188.0, 132.0, 104.0, 83.0, 56.0, 45.0, 18.0, 26.0, 16.0, 20.0, 6.0, 8.0, 11.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.53125, -41.20361328125, -39.8759765625, -38.54833984375, -37.220703125, -35.89306640625, -34.5654296875, -33.23779296875, -31.91015625, -30.58251953125, -29.2548828125, -27.92724609375, -26.599609375, -25.27197265625, -23.9443359375, -22.61669921875, -21.2890625, -19.96142578125, -18.6337890625, -17.30615234375, -15.978515625, -14.65087890625, -13.3232421875, -11.99560546875, -10.66796875, -9.34033203125, -8.0126953125, -6.68505859375, -5.357421875, -4.02978515625, -2.7021484375, -1.37451171875, -0.046875, 1.28076171875, 2.6083984375, 3.93603515625, 5.263671875, 6.59130859375, 7.9189453125, 9.24658203125, 10.57421875, 11.90185546875, 13.2294921875, 14.55712890625, 15.884765625, 17.21240234375, 18.5400390625, 19.86767578125, 21.1953125, 22.52294921875, 23.8505859375, 25.17822265625, 26.505859375, 27.83349609375, 29.1611328125, 30.48876953125, 31.81640625, 33.14404296875, 34.4716796875, 35.79931640625, 37.126953125, 38.45458984375, 39.7822265625, 41.10986328125, 42.4375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 26.0, 67.0, 90.0, 142.0, 225.0, 167.0, 140.0, 71.0, 45.0, 17.0, 8.0, 1.0, 3.0], "bins": [-175.13687133789062, -171.99627685546875, -168.85569763183594, -165.71511840820312, -162.57452392578125, -159.43392944335938, -156.29335021972656, -153.15277099609375, -150.01217651367188, -146.87158203125, -143.7310028076172, -140.59042358398438, -137.4498291015625, -134.30923461914062, -131.1686553955078, -128.028076171875, -124.88748168945312, -121.74689483642578, -118.60630798339844, -115.4657211303711, -112.32513427734375, -109.1845474243164, -106.04396057128906, -102.90337371826172, -99.76278686523438, -96.62220001220703, -93.48161315917969, -90.34102630615234, -87.200439453125, -84.05985260009766, -80.91926574707031, -77.77867889404297, -74.63809204101562, -71.49750518798828, -68.35691833496094, -65.2163314819336, -62.07574462890625, -58.935157775878906, -55.79457092285156, -52.65398406982422, -49.513397216796875, -46.37281036376953, -43.23222351074219, -40.091636657714844, -36.9510498046875, -33.810462951660156, -30.669876098632812, -27.52928924560547, -24.388702392578125, -21.24811553955078, -18.107528686523438, -14.966941833496094, -11.82635498046875, -8.685768127441406, -5.5451812744140625, -2.4045944213867188, 0.735992431640625, 3.8765792846679688, 7.0171661376953125, 10.157752990722656, 13.29833984375, 16.438926696777344, 19.579513549804688, 22.72010040283203, 25.860687255859375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 10.0, 1.0, 12.0, 15.0, 6.0, 11.0, 10.0, 18.0, 21.0, 25.0, 21.0, 29.0, 28.0, 27.0, 26.0, 25.0, 37.0, 51.0, 31.0, 43.0, 27.0, 50.0, 39.0, 37.0, 36.0, 36.0, 34.0, 35.0, 28.0, 27.0, 30.0, 21.0, 18.0, 24.0, 24.0, 19.0, 15.0, 11.0, 5.0, 4.0, 5.0, 8.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.52217102050781, -34.38365936279297, -33.245147705078125, -32.10663604736328, -30.968124389648438, -29.829612731933594, -28.691099166870117, -27.552587509155273, -26.41407585144043, -25.275564193725586, -24.137052536010742, -22.9985408782959, -21.860027313232422, -20.721515655517578, -19.583003997802734, -18.44449234008789, -17.305980682373047, -16.167469024658203, -15.02895736694336, -13.8904447555542, -12.751933097839355, -11.613421440124512, -10.474908828735352, -9.336397171020508, -8.197885513305664, -7.05937385559082, -5.920861721038818, -4.782349586486816, -3.6438379287719727, -2.505326271057129, -1.366814136505127, -0.228302001953125, 0.9102096557617188, 2.0487215518951416, 3.1872334480285645, 4.325745582580566, 5.46425724029541, 6.602768898010254, 7.741281032562256, 8.879793167114258, 10.018304824829102, 11.156816482543945, 12.295328140258789, 13.43384075164795, 14.572352409362793, 15.710864067077637, 16.849376678466797, 17.98788833618164, 19.126399993896484, 20.264911651611328, 21.403423309326172, 22.541934967041016, 23.68044662475586, 24.818958282470703, 25.95747184753418, 27.095983505249023, 28.234495162963867, 29.37300682067871, 30.511518478393555, 31.6500301361084, 32.788543701171875, 33.92705535888672, 35.06556701660156, 36.204078674316406, 37.34259033203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 33.0, 45.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 5.0, 17.0, 39.0, 34.0, 78.0, 118.0, 198.0, 333.0, 597.0, 936.0, 1558.0, 2614.0, 4113.0, 7081.0, 11535.0, 19185.0, 33461.0, 57909.0, 100157.0, 161772.0, 208330.0, 173416.0, 110378.0, 64576.0, 36757.0, 21404.0, 12731.0, 7497.0, 4664.0, 2830.0, 1668.0, 984.0, 656.0, 358.0, 213.0, 138.0, 69.0, 59.0, 37.0, 19.0, 12.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6212921142578125, -0.600982666015625, -0.5806732177734375, -0.56036376953125, -0.5400543212890625, -0.519744873046875, -0.4994354248046875, -0.4791259765625, -0.4588165283203125, -0.438507080078125, -0.4181976318359375, -0.39788818359375, -0.3775787353515625, -0.357269287109375, -0.3369598388671875, -0.316650390625, -0.2963409423828125, -0.276031494140625, -0.2557220458984375, -0.23541259765625, -0.2151031494140625, -0.194793701171875, -0.1744842529296875, -0.1541748046875, -0.1338653564453125, -0.113555908203125, -0.0932464599609375, -0.07293701171875, -0.0526275634765625, -0.032318115234375, -0.0120086669921875, 0.00830078125, 0.0286102294921875, 0.048919677734375, 0.0692291259765625, 0.08953857421875, 0.1098480224609375, 0.130157470703125, 0.1504669189453125, 0.1707763671875, 0.1910858154296875, 0.211395263671875, 0.2317047119140625, 0.25201416015625, 0.2723236083984375, 0.292633056640625, 0.3129425048828125, 0.333251953125, 0.3535614013671875, 0.373870849609375, 0.3941802978515625, 0.41448974609375, 0.4347991943359375, 0.455108642578125, 0.4754180908203125, 0.4957275390625, 0.5160369873046875, 0.536346435546875, 0.5566558837890625, 0.57696533203125, 0.5972747802734375, 0.617584228515625, 0.6378936767578125, 0.658203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 23.0, 15.0, 18.0, 18.0, 27.0, 25.0, 32.0, 17.0, 38.0, 36.0, 34.0, 32.0, 42.0, 23.0, 39.0, 1063.0, 38.0, 29.0, 51.0, 34.0, 35.0, 33.0, 31.0, 31.0, 30.0, 26.0, 24.0, 28.0, 8.0, 14.0, 16.0, 12.0, 12.0, 4.0, 13.0, 8.0, 6.0, 4.0, 1.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3671875, -3.26776123046875, -3.1683349609375, -3.06890869140625, -2.969482421875, -2.87005615234375, -2.7706298828125, -2.67120361328125, -2.57177734375, -2.47235107421875, -2.3729248046875, -2.27349853515625, -2.174072265625, -2.07464599609375, -1.9752197265625, -1.87579345703125, -1.7763671875, -1.67694091796875, -1.5775146484375, -1.47808837890625, -1.378662109375, -1.27923583984375, -1.1798095703125, -1.08038330078125, -0.98095703125, -0.88153076171875, -0.7821044921875, -0.68267822265625, -0.583251953125, -0.48382568359375, -0.3843994140625, -0.28497314453125, -0.185546875, -0.08612060546875, 0.0133056640625, 0.11273193359375, 0.212158203125, 0.31158447265625, 0.4110107421875, 0.51043701171875, 0.60986328125, 0.70928955078125, 0.8087158203125, 0.90814208984375, 1.007568359375, 1.10699462890625, 1.2064208984375, 1.30584716796875, 1.4052734375, 1.50469970703125, 1.6041259765625, 1.70355224609375, 1.802978515625, 1.90240478515625, 2.0018310546875, 2.10125732421875, 2.20068359375, 2.30010986328125, 2.3995361328125, 2.49896240234375, 2.598388671875, 2.69781494140625, 2.7972412109375, 2.89666748046875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 8.0, 2.0, 8.0, 13.0, 19.0, 34.0, 40.0, 67.0, 112.0, 182.0, 332.0, 508.0, 807.0, 1373.0, 2168.0, 3775.0, 5909.0, 9830.0, 16190.0, 26735.0, 43580.0, 70906.0, 110714.0, 155703.0, 1224796.0, 149971.0, 103778.0, 65905.0, 40903.0, 24510.0, 14910.0, 8999.0, 5554.0, 3455.0, 2085.0, 1244.0, 755.0, 479.0, 289.0, 182.0, 114.0, 72.0, 44.0, 27.0, 15.0, 12.0, 9.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4067955017089844, -0.39342498779296875, -0.3800544738769531, -0.3666839599609375, -0.3533134460449219, -0.33994293212890625, -0.3265724182128906, -0.313201904296875, -0.2998313903808594, -0.28646087646484375, -0.2730903625488281, -0.2597198486328125, -0.24634933471679688, -0.23297882080078125, -0.21960830688476562, -0.20623779296875, -0.19286727905273438, -0.17949676513671875, -0.16612625122070312, -0.1527557373046875, -0.13938522338867188, -0.12601470947265625, -0.11264419555664062, -0.099273681640625, -0.08590316772460938, -0.07253265380859375, -0.059162139892578125, -0.0457916259765625, -0.032421112060546875, -0.01905059814453125, -0.005680084228515625, 0.0076904296875, 0.021060943603515625, 0.03443145751953125, 0.047801971435546875, 0.0611724853515625, 0.07454299926757812, 0.08791351318359375, 0.10128402709960938, 0.114654541015625, 0.12802505493164062, 0.14139556884765625, 0.15476608276367188, 0.1681365966796875, 0.18150711059570312, 0.19487762451171875, 0.20824813842773438, 0.22161865234375, 0.23498916625976562, 0.24835968017578125, 0.2617301940917969, 0.2751007080078125, 0.2884712219238281, 0.30184173583984375, 0.3152122497558594, 0.328582763671875, 0.3419532775878906, 0.35532379150390625, 0.3686943054199219, 0.3820648193359375, 0.3954353332519531, 0.40880584716796875, 0.4221763610839844, 0.435546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 10.0, 11.0, 12.0, 19.0, 24.0, 29.0, 28.0, 46.0, 47.0, 50.0, 52.0, 64.0, 86.0, 74.0, 67.0, 52.0, 56.0, 35.0, 31.0, 25.0, 24.0, 27.0, 15.0, 15.0, 12.0, 7.0, 7.0, 5.0, 4.0, 6.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.005229949951171875, -0.005082249641418457, -0.004934549331665039, -0.004786849021911621, -0.004639148712158203, -0.004491448402404785, -0.004343748092651367, -0.004196047782897949, -0.004048347473144531, -0.0039006471633911133, -0.0037529468536376953, -0.0036052465438842773, -0.0034575462341308594, -0.0033098459243774414, -0.0031621456146240234, -0.0030144453048706055, -0.0028667449951171875, -0.0027190446853637695, -0.0025713443756103516, -0.0024236440658569336, -0.0022759437561035156, -0.0021282434463500977, -0.0019805431365966797, -0.0018328428268432617, -0.0016851425170898438, -0.0015374422073364258, -0.0013897418975830078, -0.0012420415878295898, -0.0010943412780761719, -0.0009466409683227539, -0.0007989406585693359, -0.000651240348815918, -0.0005035400390625, -0.00035583972930908203, -0.00020813941955566406, -6.0439109802246094e-05, 8.726119995117188e-05, 0.00023496150970458984, 0.0003826618194580078, 0.0005303621292114258, 0.0006780624389648438, 0.0008257627487182617, 0.0009734630584716797, 0.0011211633682250977, 0.0012688636779785156, 0.0014165639877319336, 0.0015642642974853516, 0.0017119646072387695, 0.0018596649169921875, 0.0020073652267456055, 0.0021550655364990234, 0.0023027658462524414, 0.0024504661560058594, 0.0025981664657592773, 0.0027458667755126953, 0.0028935670852661133, 0.0030412673950195312, 0.0031889677047729492, 0.003336668014526367, 0.003484368324279785, 0.003632068634033203, 0.003779768943786621, 0.003927469253540039, 0.004075169563293457, 0.004222869873046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 2.0, 6.0, 10.0, 6.0, 3.0, 4.0, 11.0, 21.0, 29.0, 38.0, 55.0, 63.0, 71.0, 105.0, 182.0, 289.0, 599.0, 4284.0, 990878.0, 49860.0, 895.0, 413.0, 225.0, 143.0, 99.0, 70.0, 49.0, 35.0, 18.0, 18.0, 14.0, 4.0, 6.0, 6.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08699798583984375, -0.0839691162109375, -0.08094024658203125, -0.077911376953125, -0.07488250732421875, -0.0718536376953125, -0.06882476806640625, -0.0657958984375, -0.06276702880859375, -0.0597381591796875, -0.05670928955078125, -0.053680419921875, -0.05065155029296875, -0.0476226806640625, -0.04459381103515625, -0.04156494140625, -0.03853607177734375, -0.0355072021484375, -0.03247833251953125, -0.029449462890625, -0.02642059326171875, -0.0233917236328125, -0.02036285400390625, -0.017333984375, -0.01430511474609375, -0.0112762451171875, -0.00824737548828125, -0.005218505859375, -0.00218963623046875, 0.0008392333984375, 0.00386810302734375, 0.00689697265625, 0.00992584228515625, 0.0129547119140625, 0.01598358154296875, 0.019012451171875, 0.02204132080078125, 0.0250701904296875, 0.02809906005859375, 0.0311279296875, 0.03415679931640625, 0.0371856689453125, 0.04021453857421875, 0.043243408203125, 0.04627227783203125, 0.0493011474609375, 0.05233001708984375, 0.05535888671875, 0.05838775634765625, 0.0614166259765625, 0.06444549560546875, 0.067474365234375, 0.07050323486328125, 0.0735321044921875, 0.07656097412109375, 0.07958984375, 0.08261871337890625, 0.0856475830078125, 0.08867645263671875, 0.091705322265625, 0.09473419189453125, 0.0977630615234375, 0.10079193115234375, 0.10382080078125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 165.0, 762.0, 71.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00869666412472725, -0.007854385301470757, -0.007012106012552977, -0.006169827189296484, -0.005327547900378704, -0.0044852690771222115, -0.003642990253865719, -0.002800710964947939, -0.0019584321416914463, -0.00111615308560431, -0.0002738741459324956, 0.0005684047937393188, 0.0014106838498264551, 0.0022529629059135914, 0.003095241729170084, 0.003937521018087864, 0.0047797998413443565, 0.005622078664600849, 0.006464357953518629, 0.007306636776775122, 0.008148916065692902, 0.008991194888949394, 0.009833473712205887, 0.01067575253546238, 0.011518031358718872, 0.012360310181975365, 0.013202589005231857, 0.01404486782848835, 0.014887147583067417, 0.015729427337646484, 0.016571704298257828, 0.01741398498415947, 0.018256263807415962, 0.019098542630672455, 0.019940821453928947, 0.02078310027718544, 0.021625379100441933, 0.022467657923698425, 0.023309938609600067, 0.02415221743285656, 0.024994496256113052, 0.025836775079369545, 0.026679053902626038, 0.02752133272588253, 0.028363611549139023, 0.029205892235040665, 0.030048169195652008, 0.03089044988155365, 0.03173272684216499, 0.032575007528066635, 0.03341728448867798, 0.03425956517457962, 0.035101842135190964, 0.035944122821092606, 0.03678639978170395, 0.03762868046760559, 0.03847096115350723, 0.039313241839408875, 0.04015551880002022, 0.04099779948592186, 0.0418400764465332, 0.042682357132434845, 0.04352463409304619, 0.04436691477894783, 0.045209191739559174]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 15.0, 23.0, 19.0, 32.0, 42.0, 43.0, 42.0, 53.0, 51.0, 64.0, 52.0, 47.0, 51.0, 56.0, 64.0, 36.0, 55.0, 41.0, 38.0, 25.0, 34.0, 21.0, 18.0, 12.0, 13.0, 7.0, 8.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004752993583679199, -0.004619834013283253, -0.004486674442887306, -0.00435351487249136, -0.004220355302095413, -0.004087195731699467, -0.00395403616130352, -0.0038208765909075737, -0.003687717020511627, -0.0035545574501156807, -0.003421397879719734, -0.0032882383093237877, -0.003155078738927841, -0.0030219191685318947, -0.002888759598135948, -0.0027556000277400017, -0.002622440457344055, -0.0024892808869481087, -0.002356121316552162, -0.0022229617461562157, -0.002089802175760269, -0.0019566426053643227, -0.0018234830349683762, -0.0016903234645724297, -0.0015571638941764832, -0.0014240043237805367, -0.0012908447533845901, -0.0011576851829886436, -0.0010245256125926971, -0.0008913660421967506, -0.0007582064718008041, -0.0006250469014048576, -0.0004918873310089111, -0.00035872776061296463, -0.00022556819021701813, -9.240861982107162e-05, 4.075095057487488e-05, 0.00017391052097082138, 0.0003070700913667679, 0.0004402296617627144, 0.0005733892321586609, 0.0007065488025546074, 0.0008397083729505539, 0.0009728679433465004, 0.001106027513742447, 0.0012391870841383934, 0.00137234665453434, 0.0015055062249302864, 0.001638665795326233, 0.0017718253657221794, 0.001904984936118126, 0.0020381445065140724, 0.002171304076910019, 0.0023044636473059654, 0.002437623217701912, 0.0025707827880978584, 0.002703942358493805, 0.0028371019288897514, 0.002970261499285698, 0.0031034210696816444, 0.003236580640077591, 0.0033697402104735374, 0.003502899780869484, 0.0036360593512654305, 0.003769218921661377]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 34.0, 44.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 2.0, 9.0, 11.0, 21.0, 37.0, 38.0, 54.0, 104.0, 178.0, 280.0, 424.0, 625.0, 1100.0, 1748.0, 2775.0, 4643.0, 8018.0, 13800.0, 25276.0, 52256.0, 147238.0, 443603.0, 209615.0, 66886.0, 30397.0, 16296.0, 9358.0, 5364.0, 3232.0, 1940.0, 1187.0, 749.0, 435.0, 314.0, 188.0, 127.0, 69.0, 48.0, 37.0, 29.0, 23.0, 13.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.4669189453125, -3.353759765625, -3.2406005859375, -3.12744140625, -3.0142822265625, -2.901123046875, -2.7879638671875, -2.6748046875, -2.5616455078125, -2.448486328125, -2.3353271484375, -2.22216796875, -2.1090087890625, -1.995849609375, -1.8826904296875, -1.76953125, -1.6563720703125, -1.543212890625, -1.4300537109375, -1.31689453125, -1.2037353515625, -1.090576171875, -0.9774169921875, -0.8642578125, -0.7510986328125, -0.637939453125, -0.5247802734375, -0.41162109375, -0.2984619140625, -0.185302734375, -0.0721435546875, 0.041015625, 0.1541748046875, 0.267333984375, 0.3804931640625, 0.49365234375, 0.6068115234375, 0.719970703125, 0.8331298828125, 0.9462890625, 1.0594482421875, 1.172607421875, 1.2857666015625, 1.39892578125, 1.5120849609375, 1.625244140625, 1.7384033203125, 1.8515625, 1.9647216796875, 2.077880859375, 2.1910400390625, 2.30419921875, 2.4173583984375, 2.530517578125, 2.6436767578125, 2.7568359375, 2.8699951171875, 2.983154296875, 3.0963134765625, 3.20947265625, 3.3226318359375, 3.435791015625, 3.5489501953125, 3.662109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 19.0, 12.0, 18.0, 29.0, 29.0, 32.0, 29.0, 33.0, 49.0, 46.0, 64.0, 129.0, 1681.0, 304.0, 95.0, 58.0, 40.0, 46.0, 46.0, 32.0, 34.0, 29.0, 24.0, 31.0, 19.0, 17.0, 9.0, 16.0, 8.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.674560546875, -16.98974609375, -16.304931640625, -15.6201171875, -14.935302734375, -14.25048828125, -13.565673828125, -12.880859375, -12.196044921875, -11.51123046875, -10.826416015625, -10.1416015625, -9.456787109375, -8.77197265625, -8.087158203125, -7.40234375, -6.717529296875, -6.03271484375, -5.347900390625, -4.6630859375, -3.978271484375, -3.29345703125, -2.608642578125, -1.923828125, -1.239013671875, -0.55419921875, 0.130615234375, 0.8154296875, 1.500244140625, 2.18505859375, 2.869873046875, 3.5546875, 4.239501953125, 4.92431640625, 5.609130859375, 6.2939453125, 6.978759765625, 7.66357421875, 8.348388671875, 9.033203125, 9.718017578125, 10.40283203125, 11.087646484375, 11.7724609375, 12.457275390625, 13.14208984375, 13.826904296875, 14.51171875, 15.196533203125, 15.88134765625, 16.566162109375, 17.2509765625, 17.935791015625, 18.62060546875, 19.305419921875, 19.990234375, 20.675048828125, 21.35986328125, 22.044677734375, 22.7294921875, 23.414306640625, 24.09912109375, 24.783935546875, 25.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 12.0, 17.0, 18.0, 26.0, 43.0, 49.0, 63.0, 87.0, 108.0, 218.0, 401.0, 1089.0, 19032.0, 3106433.0, 16107.0, 973.0, 377.0, 210.0, 120.0, 85.0, 49.0, 37.0, 32.0, 23.0, 19.0, 18.0, 13.0, 9.0, 6.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.1875, -65.39501953125, -63.6025390625, -61.81005859375, -60.017578125, -58.22509765625, -56.4326171875, -54.64013671875, -52.84765625, -51.05517578125, -49.2626953125, -47.47021484375, -45.677734375, -43.88525390625, -42.0927734375, -40.30029296875, -38.5078125, -36.71533203125, -34.9228515625, -33.13037109375, -31.337890625, -29.54541015625, -27.7529296875, -25.96044921875, -24.16796875, -22.37548828125, -20.5830078125, -18.79052734375, -16.998046875, -15.20556640625, -13.4130859375, -11.62060546875, -9.828125, -8.03564453125, -6.2431640625, -4.45068359375, -2.658203125, -0.86572265625, 0.9267578125, 2.71923828125, 4.51171875, 6.30419921875, 8.0966796875, 9.88916015625, 11.681640625, 13.47412109375, 15.2666015625, 17.05908203125, 18.8515625, 20.64404296875, 22.4365234375, 24.22900390625, 26.021484375, 27.81396484375, 29.6064453125, 31.39892578125, 33.19140625, 34.98388671875, 36.7763671875, 38.56884765625, 40.361328125, 42.15380859375, 43.9462890625, 45.73876953125, 47.53125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 14.0, 35.0, 59.0, 101.0, 152.0, 187.0, 168.0, 145.0, 75.0, 40.0, 22.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.403079986572266, -46.38817596435547, -45.373268127441406, -44.35836410522461, -43.34346008300781, -42.32855224609375, -41.31364822387695, -40.298744201660156, -39.283836364746094, -38.2689323425293, -37.254024505615234, -36.23912048339844, -35.22421646118164, -34.209312438964844, -33.19440460205078, -32.179500579833984, -31.164596557617188, -30.149690628051758, -29.13478660583496, -28.11988067626953, -27.104976654052734, -26.090070724487305, -25.075164794921875, -24.060260772705078, -23.04535484313965, -22.03044891357422, -21.015544891357422, -20.000638961791992, -18.985733032226562, -17.970829010009766, -16.955923080444336, -15.941018104553223, -14.926109313964844, -13.91120433807373, -12.896299362182617, -11.881393432617188, -10.866488456726074, -9.851583480834961, -8.836677551269531, -7.821772575378418, -6.806867599487305, -5.791962623596191, -4.77705717086792, -3.7621519565582275, -2.747246742248535, -1.7323417663574219, -0.7174363136291504, 0.2974691390991211, 1.3123741149902344, 2.3272793292999268, 3.342184543609619, 4.357089996337891, 5.371994972229004, 6.386899948120117, 7.401805400848389, 8.41671085357666, 9.431615829467773, 10.446520805358887, 11.46142578125, 12.47633171081543, 13.491236686706543, 14.506141662597656, 15.521047592163086, 16.535953521728516, 17.550857543945312]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 4.0, 11.0, 6.0, 18.0, 15.0, 16.0, 24.0, 20.0, 25.0, 25.0, 25.0, 34.0, 40.0, 35.0, 35.0, 45.0, 24.0, 46.0, 43.0, 40.0, 36.0, 55.0, 29.0, 47.0, 35.0, 34.0, 27.0, 27.0, 21.0, 32.0, 16.0, 17.0, 8.0, 17.0, 15.0, 9.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.996826171875, -48.29018783569336, -46.58354568481445, -44.87690734863281, -43.170265197753906, -41.463626861572266, -39.756988525390625, -38.05034637451172, -36.34370803833008, -34.63706970214844, -32.93042755126953, -31.22378921508789, -29.517148971557617, -27.810508728027344, -26.10386848449707, -24.397228240966797, -22.690587997436523, -20.98394775390625, -19.277307510375977, -17.570667266845703, -15.864028930664062, -14.157388687133789, -12.450748443603516, -10.744109153747559, -9.037468910217285, -7.33082914352417, -5.624189376831055, -3.9175491333007812, -2.210909366607666, -0.5042695999145508, 1.2023706436157227, 2.9090099334716797, 4.615650177001953, 6.322289943695068, 8.028929710388184, 9.735569953918457, 11.442209243774414, 13.148849487304688, 14.855489730834961, 16.562129974365234, 18.268768310546875, 19.97540855407715, 21.682048797607422, 23.388687133789062, 25.095327377319336, 26.80196762084961, 28.508607864379883, 30.215248107910156, 31.92188835144043, 33.6285285949707, 35.335166931152344, 37.04180908203125, 38.74844741821289, 40.45508575439453, 42.16172790527344, 43.86836624145508, 45.575008392333984, 47.281646728515625, 48.98828887939453, 50.69492721557617, 52.40156936645508, 54.10820770263672, 55.814849853515625, 57.521488189697266, 59.228126525878906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 10.0, 7.0, 8.0, 11.0, 16.0, 9.0, 15.0, 20.0, 26.0, 41.0, 30.0, 34.0, 33.0, 26.0, 23.0, 32.0, 35.0, 33.0, 49.0, 39.0, 39.0, 38.0, 27.0, 36.0, 32.0, 32.0, 35.0, 26.0, 28.0, 23.0, 20.0, 25.0, 18.0, 9.0, 19.0, 13.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.7607421875, -4.595703125, -4.4306640625, -4.265625, -4.1005859375, -3.935546875, -3.7705078125, -3.60546875, -3.4404296875, -3.275390625, -3.1103515625, -2.9453125, -2.7802734375, -2.615234375, -2.4501953125, -2.28515625, -2.1201171875, -1.955078125, -1.7900390625, -1.625, -1.4599609375, -1.294921875, -1.1298828125, -0.96484375, -0.7998046875, -0.634765625, -0.4697265625, -0.3046875, -0.1396484375, 0.025390625, 0.1904296875, 0.35546875, 0.5205078125, 0.685546875, 0.8505859375, 1.015625, 1.1806640625, 1.345703125, 1.5107421875, 1.67578125, 1.8408203125, 2.005859375, 2.1708984375, 2.3359375, 2.5009765625, 2.666015625, 2.8310546875, 2.99609375, 3.1611328125, 3.326171875, 3.4912109375, 3.65625, 3.8212890625, 3.986328125, 4.1513671875, 4.31640625, 4.4814453125, 4.646484375, 4.8115234375, 4.9765625, 5.1416015625, 5.306640625, 5.4716796875, 5.63671875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 14.0, 19.0, 31.0, 64.0, 59.0, 100.0, 154.0, 215.0, 326.0, 573.0, 1010.0, 1970.0, 4168.0, 10138.0, 30960.0, 128332.0, 675938.0, 1841519.0, 1180792.0, 241944.0, 49560.0, 14997.0, 5709.0, 2466.0, 1262.0, 699.0, 384.0, 255.0, 172.0, 120.0, 82.0, 47.0, 33.0, 29.0, 29.0, 23.0, 19.0, 13.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.171875, -8.891357421875, -8.61083984375, -8.330322265625, -8.0498046875, -7.769287109375, -7.48876953125, -7.208251953125, -6.927734375, -6.647216796875, -6.36669921875, -6.086181640625, -5.8056640625, -5.525146484375, -5.24462890625, -4.964111328125, -4.68359375, -4.403076171875, -4.12255859375, -3.842041015625, -3.5615234375, -3.281005859375, -3.00048828125, -2.719970703125, -2.439453125, -2.158935546875, -1.87841796875, -1.597900390625, -1.3173828125, -1.036865234375, -0.75634765625, -0.475830078125, -0.1953125, 0.085205078125, 0.36572265625, 0.646240234375, 0.9267578125, 1.207275390625, 1.48779296875, 1.768310546875, 2.048828125, 2.329345703125, 2.60986328125, 2.890380859375, 3.1708984375, 3.451416015625, 3.73193359375, 4.012451171875, 4.29296875, 4.573486328125, 4.85400390625, 5.134521484375, 5.4150390625, 5.695556640625, 5.97607421875, 6.256591796875, 6.537109375, 6.817626953125, 7.09814453125, 7.378662109375, 7.6591796875, 7.939697265625, 8.22021484375, 8.500732421875, 8.78125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 10.0, 20.0, 16.0, 18.0, 23.0, 23.0, 54.0, 60.0, 78.0, 106.0, 144.0, 200.0, 216.0, 338.0, 386.0, 412.0, 431.0, 328.0, 311.0, 188.0, 176.0, 128.0, 103.0, 66.0, 59.0, 28.0, 43.0, 30.0, 19.0, 11.0, 11.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -9.979736328125, -9.60791015625, -9.236083984375, -8.8642578125, -8.492431640625, -8.12060546875, -7.748779296875, -7.376953125, -7.005126953125, -6.63330078125, -6.261474609375, -5.8896484375, -5.517822265625, -5.14599609375, -4.774169921875, -4.40234375, -4.030517578125, -3.65869140625, -3.286865234375, -2.9150390625, -2.543212890625, -2.17138671875, -1.799560546875, -1.427734375, -1.055908203125, -0.68408203125, -0.312255859375, 0.0595703125, 0.431396484375, 0.80322265625, 1.175048828125, 1.546875, 1.918701171875, 2.29052734375, 2.662353515625, 3.0341796875, 3.406005859375, 3.77783203125, 4.149658203125, 4.521484375, 4.893310546875, 5.26513671875, 5.636962890625, 6.0087890625, 6.380615234375, 6.75244140625, 7.124267578125, 7.49609375, 7.867919921875, 8.23974609375, 8.611572265625, 8.9833984375, 9.355224609375, 9.72705078125, 10.098876953125, 10.470703125, 10.842529296875, 11.21435546875, 11.586181640625, 11.9580078125, 12.329833984375, 12.70166015625, 13.073486328125, 13.4453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 12.0, 9.0, 6.0, 15.0, 18.0, 19.0, 23.0, 27.0, 47.0, 68.0, 71.0, 100.0, 146.0, 214.0, 393.0, 1128.0, 5364.0, 91694.0, 3452386.0, 621605.0, 17212.0, 2115.0, 573.0, 311.0, 182.0, 106.0, 102.0, 66.0, 69.0, 45.0, 34.0, 26.0, 18.0, 13.0, 10.0, 13.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-40.15625, -39.03271484375, -37.9091796875, -36.78564453125, -35.662109375, -34.53857421875, -33.4150390625, -32.29150390625, -31.16796875, -30.04443359375, -28.9208984375, -27.79736328125, -26.673828125, -25.55029296875, -24.4267578125, -23.30322265625, -22.1796875, -21.05615234375, -19.9326171875, -18.80908203125, -17.685546875, -16.56201171875, -15.4384765625, -14.31494140625, -13.19140625, -12.06787109375, -10.9443359375, -9.82080078125, -8.697265625, -7.57373046875, -6.4501953125, -5.32666015625, -4.203125, -3.07958984375, -1.9560546875, -0.83251953125, 0.291015625, 1.41455078125, 2.5380859375, 3.66162109375, 4.78515625, 5.90869140625, 7.0322265625, 8.15576171875, 9.279296875, 10.40283203125, 11.5263671875, 12.64990234375, 13.7734375, 14.89697265625, 16.0205078125, 17.14404296875, 18.267578125, 19.39111328125, 20.5146484375, 21.63818359375, 22.76171875, 23.88525390625, 25.0087890625, 26.13232421875, 27.255859375, 28.37939453125, 29.5029296875, 30.62646484375, 31.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 18.0, 25.0, 42.0, 107.0, 138.0, 162.0, 192.0, 132.0, 92.0, 50.0, 27.0, 15.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.44627380371094, -91.58157348632812, -88.71688079833984, -85.85218048095703, -82.98748779296875, -80.12278747558594, -77.25808715820312, -74.39339447021484, -71.52870178222656, -68.66400146484375, -65.79930877685547, -62.934608459472656, -60.069915771484375, -57.20521545410156, -54.340518951416016, -51.47582244873047, -48.611122131347656, -45.74642562866211, -42.88172912597656, -40.01702880859375, -37.15233612060547, -34.287635803222656, -31.42293930053711, -28.558242797851562, -25.693546295166016, -22.82884979248047, -19.964153289794922, -17.099454879760742, -14.234758377075195, -11.370061874389648, -8.505363464355469, -5.640666961669922, -2.7759628295898438, 0.08873414993286133, 2.9534311294555664, 5.81812858581543, 8.682825088500977, 11.547521591186523, 14.412220001220703, 17.27691650390625, 20.141613006591797, 23.006309509277344, 25.87100601196289, 28.73570442199707, 31.600400924682617, 34.46509552001953, 37.329795837402344, 40.19449234008789, 43.05918884277344, 45.923885345458984, 48.78858184814453, 51.653282165527344, 54.517974853515625, 57.38267517089844, 60.247371673583984, 63.11206817626953, 65.97676086425781, 68.84146118164062, 71.7061538696289, 74.57085418701172, 77.435546875, 80.30024719238281, 83.16494750976562, 86.0296401977539, 88.89434051513672]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 12.0, 7.0, 6.0, 13.0, 14.0, 17.0, 18.0, 22.0, 34.0, 31.0, 25.0, 37.0, 32.0, 38.0, 35.0, 54.0, 35.0, 50.0, 43.0, 32.0, 28.0, 33.0, 39.0, 38.0, 34.0, 31.0, 38.0, 22.0, 23.0, 27.0, 13.0, 17.0, 22.0, 13.0, 12.0, 15.0, 14.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-44.685394287109375, -43.43315124511719, -42.180912017822266, -40.92866897583008, -39.676429748535156, -38.42418670654297, -37.17194366455078, -35.91970443725586, -34.66746139526367, -33.415218353271484, -32.16297912597656, -30.910736083984375, -29.65849494934082, -28.406253814697266, -27.15401268005371, -25.901771545410156, -24.6495304107666, -23.397289276123047, -22.145048141479492, -20.892807006835938, -19.64056396484375, -18.388322830200195, -17.13608169555664, -15.88383960723877, -14.631598472595215, -13.37935733795166, -12.127115249633789, -10.874874114990234, -9.62263298034668, -8.370390892028809, -7.118149757385254, -5.865907669067383, -4.613666534423828, -3.3614249229431152, -2.1091835498809814, -0.8569421768188477, 0.39529943466186523, 1.6475410461425781, 2.899782180786133, 4.152024269104004, 5.404265403747559, 6.6565070152282715, 7.908748626708984, 9.160989761352539, 10.413230895996094, 11.665472984313965, 12.91771411895752, 14.16995620727539, 15.422197341918945, 16.6744384765625, 17.926679611206055, 19.17892074584961, 20.431163787841797, 21.68340492248535, 22.935646057128906, 24.187889099121094, 25.440128326416016, 26.69236946105957, 27.944610595703125, 29.196853637695312, 30.449094772338867, 31.701335906982422, 32.953575134277344, 34.20581817626953, 35.45806121826172]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 26.0, 48.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 9.0, 8.0, 28.0, 39.0, 65.0, 88.0, 137.0, 193.0, 336.0, 483.0, 722.0, 1060.0, 1651.0, 2494.0, 3855.0, 6064.0, 9302.0, 14522.0, 23202.0, 35901.0, 56899.0, 88645.0, 132188.0, 173355.0, 163855.0, 118451.0, 77679.0, 49606.0, 31397.0, 20249.0, 12904.0, 8124.0, 5314.0, 3309.0, 2267.0, 1438.0, 892.0, 593.0, 429.0, 259.0, 184.0, 115.0, 70.0, 52.0, 36.0, 35.0, 18.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5703125, -0.5524063110351562, -0.5345001220703125, -0.5165939331054688, -0.498687744140625, -0.48078155517578125, -0.4628753662109375, -0.44496917724609375, -0.42706298828125, -0.40915679931640625, -0.3912506103515625, -0.37334442138671875, -0.355438232421875, -0.33753204345703125, -0.3196258544921875, -0.30171966552734375, -0.2838134765625, -0.26590728759765625, -0.2480010986328125, -0.23009490966796875, -0.212188720703125, -0.19428253173828125, -0.1763763427734375, -0.15847015380859375, -0.14056396484375, -0.12265777587890625, -0.1047515869140625, -0.08684539794921875, -0.068939208984375, -0.05103302001953125, -0.0331268310546875, -0.01522064208984375, 0.002685546875, 0.02059173583984375, 0.0384979248046875, 0.05640411376953125, 0.074310302734375, 0.09221649169921875, 0.1101226806640625, 0.12802886962890625, 0.14593505859375, 0.16384124755859375, 0.1817474365234375, 0.19965362548828125, 0.217559814453125, 0.23546600341796875, 0.2533721923828125, 0.27127838134765625, 0.2891845703125, 0.30709075927734375, 0.3249969482421875, 0.34290313720703125, 0.360809326171875, 0.37871551513671875, 0.3966217041015625, 0.41452789306640625, 0.43243408203125, 0.45034027099609375, 0.4682464599609375, 0.48615264892578125, 0.504058837890625, 0.5219650268554688, 0.5398712158203125, 0.5577774047851562, 0.57568359375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 7.0, 13.0, 15.0, 11.0, 25.0, 27.0, 36.0, 37.0, 24.0, 48.0, 42.0, 48.0, 41.0, 35.0, 48.0, 1074.0, 44.0, 55.0, 45.0, 52.0, 35.0, 43.0, 31.0, 35.0, 23.0, 17.0, 17.0, 17.0, 18.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.7744140625, -3.638671875, -3.5029296875, -3.3671875, -3.2314453125, -3.095703125, -2.9599609375, -2.82421875, -2.6884765625, -2.552734375, -2.4169921875, -2.28125, -2.1455078125, -2.009765625, -1.8740234375, -1.73828125, -1.6025390625, -1.466796875, -1.3310546875, -1.1953125, -1.0595703125, -0.923828125, -0.7880859375, -0.65234375, -0.5166015625, -0.380859375, -0.2451171875, -0.109375, 0.0263671875, 0.162109375, 0.2978515625, 0.43359375, 0.5693359375, 0.705078125, 0.8408203125, 0.9765625, 1.1123046875, 1.248046875, 1.3837890625, 1.51953125, 1.6552734375, 1.791015625, 1.9267578125, 2.0625, 2.1982421875, 2.333984375, 2.4697265625, 2.60546875, 2.7412109375, 2.876953125, 3.0126953125, 3.1484375, 3.2841796875, 3.419921875, 3.5556640625, 3.69140625, 3.8271484375, 3.962890625, 4.0986328125, 4.234375, 4.3701171875, 4.505859375, 4.6416015625, 4.77734375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 14.0, 15.0, 23.0, 34.0, 49.0, 82.0, 162.0, 212.0, 396.0, 646.0, 1139.0, 1927.0, 3183.0, 5130.0, 8602.0, 14507.0, 24499.0, 40960.0, 67843.0, 108318.0, 156442.0, 1229716.0, 156428.0, 107360.0, 67558.0, 40941.0, 24308.0, 14851.0, 8730.0, 5288.0, 3131.0, 1861.0, 1128.0, 712.0, 358.0, 234.0, 162.0, 71.0, 37.0, 24.0, 12.0, 18.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.492919921875, -0.47820281982421875, -0.4634857177734375, -0.44876861572265625, -0.434051513671875, -0.41933441162109375, -0.4046173095703125, -0.38990020751953125, -0.37518310546875, -0.36046600341796875, -0.3457489013671875, -0.33103179931640625, -0.316314697265625, -0.30159759521484375, -0.2868804931640625, -0.27216339111328125, -0.2574462890625, -0.24272918701171875, -0.2280120849609375, -0.21329498291015625, -0.198577880859375, -0.18386077880859375, -0.1691436767578125, -0.15442657470703125, -0.13970947265625, -0.12499237060546875, -0.1102752685546875, -0.09555816650390625, -0.080841064453125, -0.06612396240234375, -0.0514068603515625, -0.03668975830078125, -0.02197265625, -0.00725555419921875, 0.0074615478515625, 0.02217864990234375, 0.036895751953125, 0.05161285400390625, 0.0663299560546875, 0.08104705810546875, 0.09576416015625, 0.11048126220703125, 0.1251983642578125, 0.13991546630859375, 0.154632568359375, 0.16934967041015625, 0.1840667724609375, 0.19878387451171875, 0.2135009765625, 0.22821807861328125, 0.2429351806640625, 0.25765228271484375, 0.272369384765625, 0.28708648681640625, 0.3018035888671875, 0.31652069091796875, 0.33123779296875, 0.34595489501953125, 0.3606719970703125, 0.37538909912109375, 0.390106201171875, 0.40482330322265625, 0.4195404052734375, 0.43425750732421875, 0.448974609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 13.0, 6.0, 11.0, 20.0, 25.0, 29.0, 39.0, 44.0, 64.0, 81.0, 89.0, 90.0, 98.0, 76.0, 75.0, 58.0, 37.0, 26.0, 27.0, 17.0, 15.0, 9.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.006439208984375, -0.0062631964683532715, -0.006087183952331543, -0.0059111714363098145, -0.005735158920288086, -0.005559146404266357, -0.005383133888244629, -0.0052071213722229, -0.005031108856201172, -0.004855096340179443, -0.004679083824157715, -0.004503071308135986, -0.004327058792114258, -0.004151046276092529, -0.003975033760070801, -0.0037990212440490723, -0.0036230087280273438, -0.0034469962120056152, -0.0032709836959838867, -0.003094971179962158, -0.0029189586639404297, -0.002742946147918701, -0.0025669336318969727, -0.002390921115875244, -0.0022149085998535156, -0.002038896083831787, -0.0018628835678100586, -0.00168687105178833, -0.0015108585357666016, -0.001334846019744873, -0.0011588335037231445, -0.000982820987701416, -0.0008068084716796875, -0.000630795955657959, -0.00045478343963623047, -0.00027877092361450195, -0.00010275840759277344, 7.325410842895508e-05, 0.0002492666244506836, 0.0004252791404724121, 0.0006012916564941406, 0.0007773041725158691, 0.0009533166885375977, 0.0011293292045593262, 0.0013053417205810547, 0.0014813542366027832, 0.0016573667526245117, 0.0018333792686462402, 0.0020093917846679688, 0.0021854043006896973, 0.0023614168167114258, 0.0025374293327331543, 0.002713441848754883, 0.0028894543647766113, 0.00306546688079834, 0.0032414793968200684, 0.003417491912841797, 0.0035935044288635254, 0.003769516944885254, 0.003945529460906982, 0.004121541976928711, 0.0042975544929504395, 0.004473567008972168, 0.0046495795249938965, 0.004825592041015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 11.0, 15.0, 16.0, 36.0, 53.0, 76.0, 133.0, 225.0, 501.0, 2850.0, 1018335.0, 24836.0, 750.0, 289.0, 144.0, 97.0, 50.0, 40.0, 18.0, 15.0, 9.0, 12.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.10495376586914062, -0.10102081298828125, -0.09708786010742188, -0.0931549072265625, -0.08922195434570312, -0.08528900146484375, -0.08135604858398438, -0.077423095703125, -0.07349014282226562, -0.06955718994140625, -0.06562423706054688, -0.0616912841796875, -0.057758331298828125, -0.05382537841796875, -0.049892425537109375, -0.04595947265625, -0.042026519775390625, -0.03809356689453125, -0.034160614013671875, -0.0302276611328125, -0.026294708251953125, -0.02236175537109375, -0.018428802490234375, -0.014495849609375, -0.010562896728515625, -0.00662994384765625, -0.002696990966796875, 0.0012359619140625, 0.005168914794921875, 0.00910186767578125, 0.013034820556640625, 0.0169677734375, 0.020900726318359375, 0.02483367919921875, 0.028766632080078125, 0.0326995849609375, 0.036632537841796875, 0.04056549072265625, 0.044498443603515625, 0.048431396484375, 0.052364349365234375, 0.05629730224609375, 0.060230255126953125, 0.0641632080078125, 0.06809616088867188, 0.07202911376953125, 0.07596206665039062, 0.07989501953125, 0.08382797241210938, 0.08776092529296875, 0.09169387817382812, 0.0956268310546875, 0.09955978393554688, 0.10349273681640625, 0.10742568969726562, 0.111358642578125, 0.11529159545898438, 0.11922454833984375, 0.12315750122070312, 0.1270904541015625, 0.13102340698242188, 0.13495635986328125, 0.13888931274414062, 0.142822265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 48.0, 807.0, 148.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026813577860593796, -0.0016594692133367062, -0.0006375806406140327, 0.00038430793210864067, 0.001406196504831314, 0.0024280850775539875, 0.003449973650276661, 0.004471862222999334, 0.005493750795722008, 0.006515639368444681, 0.007537527941167355, 0.008559416979551315, 0.009581305086612701, 0.010603193193674088, 0.011625082232058048, 0.012646971270442009, 0.013668859377503395, 0.014690747484564781, 0.015712637454271317, 0.016734525561332703, 0.01775641366839409, 0.018778301775455475, 0.01980018988251686, 0.020822079852223396, 0.021843967959284782, 0.02286585606634617, 0.023887746036052704, 0.02490963414311409, 0.025931522250175476, 0.026953410357236862, 0.02797529846429825, 0.028997188434004784, 0.03001907467842102, 0.031040962785482407, 0.03206285089254379, 0.03308473899960518, 0.034106627106666565, 0.03512851893901825, 0.036150407046079636, 0.03717229515314102, 0.03819418326020241, 0.039216071367263794, 0.04023795947432518, 0.041259847581386566, 0.04228173941373825, 0.04330362752079964, 0.04432551562786102, 0.04534740373492241, 0.046369291841983795, 0.04739117994904518, 0.04841306805610657, 0.049434956163167953, 0.05045684427022934, 0.051478736102581024, 0.05250062420964241, 0.053522512316703796, 0.05454440042376518, 0.05556628853082657, 0.056588176637887955, 0.05761006474494934, 0.058631956577301025, 0.05965384468436241, 0.0606757327914238, 0.061697620898485184, 0.06271950900554657]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 10.0, 15.0, 24.0, 26.0, 24.0, 30.0, 45.0, 42.0, 46.0, 74.0, 80.0, 68.0, 63.0, 69.0, 63.0, 50.0, 46.0, 51.0, 29.0, 28.0, 29.0, 23.0, 16.0, 10.0, 13.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00514751672744751, -0.005015549249947071, -0.004883581772446632, -0.004751614294946194, -0.004619646817445755, -0.004487679339945316, -0.004355711862444878, -0.004223744384944439, -0.004091776907444, -0.0039598094299435616, -0.003827841952443123, -0.003695874474942684, -0.0035639069974422455, -0.003431939519941807, -0.003299972042441368, -0.0031680045649409294, -0.0030360370874404907, -0.002904069609940052, -0.0027721021324396133, -0.0026401346549391747, -0.002508167177438736, -0.0023761996999382973, -0.0022442322224378586, -0.00211226474493742, -0.001980297267436981, -0.0018483297899365425, -0.0017163623124361038, -0.0015843948349356651, -0.0014524273574352264, -0.0013204598799347878, -0.001188492402434349, -0.0010565249249339104, -0.0009245574474334717, -0.000792589969933033, -0.0006606224924325943, -0.0005286550149321556, -0.0003966875374317169, -0.00026472005993127823, -0.00013275258243083954, -7.851049304008484e-07, 0.00013118237257003784, 0.00026314985007047653, 0.0003951173275709152, 0.0005270848050713539, 0.0006590522825717926, 0.0007910197600722313, 0.00092298723757267, 0.0010549547150731087, 0.0011869221925735474, 0.001318889670073986, 0.0014508571475744247, 0.0015828246250748634, 0.0017147921025753021, 0.0018467595800757408, 0.0019787270575761795, 0.002110694535076618, 0.002242662012577057, 0.0023746294900774956, 0.0025065969675779343, 0.002638564445078373, 0.0027705319225788116, 0.0029024994000792503, 0.003034466877579689, 0.0031664343550801277, 0.0032984018325805664]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 27.0, 47.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 15.0, 27.0, 34.0, 77.0, 117.0, 209.0, 289.0, 513.0, 922.0, 1688.0, 3437.0, 7373.0, 16888.0, 39932.0, 100964.0, 305161.0, 366589.0, 121406.0, 46459.0, 19404.0, 8679.0, 3902.0, 1952.0, 1035.0, 575.0, 327.0, 175.0, 123.0, 96.0, 63.0, 36.0, 24.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.72308349609375, -4.5711669921875, -4.41925048828125, -4.267333984375, -4.11541748046875, -3.9635009765625, -3.81158447265625, -3.65966796875, -3.50775146484375, -3.3558349609375, -3.20391845703125, -3.052001953125, -2.90008544921875, -2.7481689453125, -2.59625244140625, -2.4443359375, -2.29241943359375, -2.1405029296875, -1.98858642578125, -1.836669921875, -1.68475341796875, -1.5328369140625, -1.38092041015625, -1.22900390625, -1.07708740234375, -0.9251708984375, -0.77325439453125, -0.621337890625, -0.46942138671875, -0.3175048828125, -0.16558837890625, -0.013671875, 0.13824462890625, 0.2901611328125, 0.44207763671875, 0.593994140625, 0.74591064453125, 0.8978271484375, 1.04974365234375, 1.20166015625, 1.35357666015625, 1.5054931640625, 1.65740966796875, 1.809326171875, 1.96124267578125, 2.1131591796875, 2.26507568359375, 2.4169921875, 2.56890869140625, 2.7208251953125, 2.87274169921875, 3.024658203125, 3.17657470703125, 3.3284912109375, 3.48040771484375, 3.63232421875, 3.78424072265625, 3.9361572265625, 4.08807373046875, 4.239990234375, 4.39190673828125, 4.5438232421875, 4.69573974609375, 4.84765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 25.0, 27.0, 18.0, 33.0, 27.0, 36.0, 30.0, 64.0, 58.0, 94.0, 168.0, 1645.0, 269.0, 90.0, 60.0, 47.0, 49.0, 40.0, 29.0, 32.0, 31.0, 17.0, 25.0, 12.0, 14.0, 6.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.34375, -25.584228515625, -24.82470703125, -24.065185546875, -23.3056640625, -22.546142578125, -21.78662109375, -21.027099609375, -20.267578125, -19.508056640625, -18.74853515625, -17.989013671875, -17.2294921875, -16.469970703125, -15.71044921875, -14.950927734375, -14.19140625, -13.431884765625, -12.67236328125, -11.912841796875, -11.1533203125, -10.393798828125, -9.63427734375, -8.874755859375, -8.115234375, -7.355712890625, -6.59619140625, -5.836669921875, -5.0771484375, -4.317626953125, -3.55810546875, -2.798583984375, -2.0390625, -1.279541015625, -0.52001953125, 0.239501953125, 0.9990234375, 1.758544921875, 2.51806640625, 3.277587890625, 4.037109375, 4.796630859375, 5.55615234375, 6.315673828125, 7.0751953125, 7.834716796875, 8.59423828125, 9.353759765625, 10.11328125, 10.872802734375, 11.63232421875, 12.391845703125, 13.1513671875, 13.910888671875, 14.67041015625, 15.429931640625, 16.189453125, 16.948974609375, 17.70849609375, 18.468017578125, 19.2275390625, 19.987060546875, 20.74658203125, 21.506103515625, 22.265625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 8.0, 14.0, 19.0, 13.0, 15.0, 15.0, 45.0, 38.0, 65.0, 67.0, 109.0, 128.0, 209.0, 261.0, 480.0, 2146.0, 231901.0, 2903542.0, 4781.0, 721.0, 331.0, 213.0, 165.0, 88.0, 67.0, 63.0, 32.0, 41.0, 33.0, 20.0, 22.0, 10.0, 8.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -48.0732421875, -46.365234375, -44.6572265625, -42.94921875, -41.2412109375, -39.533203125, -37.8251953125, -36.1171875, -34.4091796875, -32.701171875, -30.9931640625, -29.28515625, -27.5771484375, -25.869140625, -24.1611328125, -22.453125, -20.7451171875, -19.037109375, -17.3291015625, -15.62109375, -13.9130859375, -12.205078125, -10.4970703125, -8.7890625, -7.0810546875, -5.373046875, -3.6650390625, -1.95703125, -0.2490234375, 1.458984375, 3.1669921875, 4.875, 6.5830078125, 8.291015625, 9.9990234375, 11.70703125, 13.4150390625, 15.123046875, 16.8310546875, 18.5390625, 20.2470703125, 21.955078125, 23.6630859375, 25.37109375, 27.0791015625, 28.787109375, 30.4951171875, 32.203125, 33.9111328125, 35.619140625, 37.3271484375, 39.03515625, 40.7431640625, 42.451171875, 44.1591796875, 45.8671875, 47.5751953125, 49.283203125, 50.9912109375, 52.69921875, 54.4072265625, 56.115234375, 57.8232421875, 59.53125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 156.0, 584.0, 250.0, 13.0, 6.0], "bins": [-253.69003295898438, -249.50735473632812, -245.32469177246094, -241.1420135498047, -236.9593505859375, -232.77667236328125, -228.59400939941406, -224.4113311767578, -220.22866821289062, -216.04598999023438, -211.8633270263672, -207.68064880371094, -203.49798583984375, -199.3153076171875, -195.1326446533203, -190.94996643066406, -186.76730346679688, -182.58462524414062, -178.40196228027344, -174.2192840576172, -170.03662109375, -165.85394287109375, -161.67127990722656, -157.4886016845703, -153.30592346191406, -149.1232452392578, -144.94058227539062, -140.75790405273438, -136.5752410888672, -132.39256286621094, -128.20989990234375, -124.0272216796875, -119.84456634521484, -115.66189575195312, -111.4792251586914, -107.29655456542969, -103.11388397216797, -98.93121337890625, -94.74853515625, -90.56587219238281, -86.38319396972656, -82.20052337646484, -78.01785278320312, -73.8351821899414, -69.65251159667969, -65.46984100341797, -61.287166595458984, -57.104496002197266, -52.92182922363281, -48.739158630371094, -44.556488037109375, -40.373817443847656, -36.19114685058594, -32.00847625732422, -27.825801849365234, -23.643131256103516, -19.460460662841797, -15.277790069580078, -11.095118522644043, -6.912446975708008, -2.729776382446289, 1.4528942108154297, 5.635566711425781, 9.8182373046875, 14.000907897949219]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 11.0, 1.0, 5.0, 5.0, 7.0, 12.0, 11.0, 7.0, 12.0, 11.0, 17.0, 18.0, 22.0, 20.0, 27.0, 28.0, 27.0, 44.0, 33.0, 46.0, 44.0, 48.0, 48.0, 40.0, 47.0, 44.0, 47.0, 42.0, 40.0, 23.0, 25.0, 33.0, 21.0, 24.0, 17.0, 16.0, 15.0, 15.0, 12.0, 11.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.866756439208984, -47.237186431884766, -45.60762023925781, -43.978050231933594, -42.34848403930664, -40.71891403198242, -39.08934783935547, -37.45977783203125, -35.83020782470703, -34.20063781738281, -32.57107162475586, -30.94150161743164, -29.311935424804688, -27.68236541748047, -26.052797317504883, -24.423229217529297, -22.793663024902344, -21.164094924926758, -19.534526824951172, -17.904956817626953, -16.275390625, -14.645821571350098, -13.016252517700195, -11.38668441772461, -9.757116317749023, -8.127548217773438, -6.497979640960693, -4.868411064147949, -3.2388429641723633, -1.6092748641967773, 0.020294189453125, 1.649862289428711, 3.2794342041015625, 4.909002304077148, 6.538570880889893, 8.168139457702637, 9.797707557678223, 11.427275657653809, 13.056844711303711, 14.686412811279297, 16.315980911254883, 17.94554901123047, 19.575117111206055, 21.20468521118164, 22.83425521850586, 24.463821411132812, 26.09339141845703, 27.722959518432617, 29.352527618408203, 30.98209571838379, 32.611663818359375, 34.241233825683594, 35.87080001831055, 37.500370025634766, 39.12993621826172, 40.75950622558594, 42.389076232910156, 44.018646240234375, 45.64821243286133, 47.27778244018555, 48.9073486328125, 50.53691864013672, 52.16648864746094, 53.79605484008789, 55.425621032714844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 10.0, 9.0, 16.0, 12.0, 11.0, 22.0, 24.0, 31.0, 23.0, 29.0, 22.0, 34.0, 30.0, 39.0, 43.0, 58.0, 42.0, 42.0, 34.0, 43.0, 38.0, 37.0, 37.0, 39.0, 32.0, 46.0, 31.0, 22.0, 21.0, 19.0, 15.0, 14.0, 13.0, 11.0, 13.0, 6.0, 4.0, 9.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.4361572265625, -5.243408203125, -5.0506591796875, -4.85791015625, -4.6651611328125, -4.472412109375, -4.2796630859375, -4.0869140625, -3.8941650390625, -3.701416015625, -3.5086669921875, -3.31591796875, -3.1231689453125, -2.930419921875, -2.7376708984375, -2.544921875, -2.3521728515625, -2.159423828125, -1.9666748046875, -1.77392578125, -1.5811767578125, -1.388427734375, -1.1956787109375, -1.0029296875, -0.8101806640625, -0.617431640625, -0.4246826171875, -0.23193359375, -0.0391845703125, 0.153564453125, 0.3463134765625, 0.5390625, 0.7318115234375, 0.924560546875, 1.1173095703125, 1.31005859375, 1.5028076171875, 1.695556640625, 1.8883056640625, 2.0810546875, 2.2738037109375, 2.466552734375, 2.6593017578125, 2.85205078125, 3.0447998046875, 3.237548828125, 3.4302978515625, 3.623046875, 3.8157958984375, 4.008544921875, 4.2012939453125, 4.39404296875, 4.5867919921875, 4.779541015625, 4.9722900390625, 5.1650390625, 5.3577880859375, 5.550537109375, 5.7432861328125, 5.93603515625, 6.1287841796875, 6.321533203125, 6.5142822265625, 6.70703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 9.0, 8.0, 10.0, 17.0, 21.0, 23.0, 26.0, 20.0, 23.0, 27.0, 19.0, 52.0, 84.0, 229.0, 941.0, 5483.0, 97002.0, 3231045.0, 838919.0, 17329.0, 2066.0, 426.0, 147.0, 69.0, 43.0, 41.0, 28.0, 28.0, 17.0, 19.0, 16.0, 19.0, 15.0, 7.0, 8.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.177001953125, -20.38525390625, -19.593505859375, -18.8017578125, -18.010009765625, -17.21826171875, -16.426513671875, -15.634765625, -14.843017578125, -14.05126953125, -13.259521484375, -12.4677734375, -11.676025390625, -10.88427734375, -10.092529296875, -9.30078125, -8.509033203125, -7.71728515625, -6.925537109375, -6.1337890625, -5.342041015625, -4.55029296875, -3.758544921875, -2.966796875, -2.175048828125, -1.38330078125, -0.591552734375, 0.2001953125, 0.991943359375, 1.78369140625, 2.575439453125, 3.3671875, 4.158935546875, 4.95068359375, 5.742431640625, 6.5341796875, 7.325927734375, 8.11767578125, 8.909423828125, 9.701171875, 10.492919921875, 11.28466796875, 12.076416015625, 12.8681640625, 13.659912109375, 14.45166015625, 15.243408203125, 16.03515625, 16.826904296875, 17.61865234375, 18.410400390625, 19.2021484375, 19.993896484375, 20.78564453125, 21.577392578125, 22.369140625, 23.160888671875, 23.95263671875, 24.744384765625, 25.5361328125, 26.327880859375, 27.11962890625, 27.911376953125, 28.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 2.0, 8.0, 15.0, 12.0, 12.0, 17.0, 24.0, 30.0, 24.0, 50.0, 55.0, 67.0, 95.0, 97.0, 117.0, 164.0, 217.0, 255.0, 319.0, 358.0, 352.0, 345.0, 298.0, 235.0, 203.0, 152.0, 114.0, 102.0, 71.0, 68.0, 46.0, 31.0, 33.0, 19.0, 17.0, 14.0, 5.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.625, -10.3140869140625, -10.003173828125, -9.6922607421875, -9.38134765625, -9.0704345703125, -8.759521484375, -8.4486083984375, -8.1376953125, -7.8267822265625, -7.515869140625, -7.2049560546875, -6.89404296875, -6.5831298828125, -6.272216796875, -5.9613037109375, -5.650390625, -5.3394775390625, -5.028564453125, -4.7176513671875, -4.40673828125, -4.0958251953125, -3.784912109375, -3.4739990234375, -3.1630859375, -2.8521728515625, -2.541259765625, -2.2303466796875, -1.91943359375, -1.6085205078125, -1.297607421875, -0.9866943359375, -0.67578125, -0.3648681640625, -0.053955078125, 0.2569580078125, 0.56787109375, 0.8787841796875, 1.189697265625, 1.5006103515625, 1.8115234375, 2.1224365234375, 2.433349609375, 2.7442626953125, 3.05517578125, 3.3660888671875, 3.677001953125, 3.9879150390625, 4.298828125, 4.6097412109375, 4.920654296875, 5.2315673828125, 5.54248046875, 5.8533935546875, 6.164306640625, 6.4752197265625, 6.7861328125, 7.0970458984375, 7.407958984375, 7.7188720703125, 8.02978515625, 8.3406982421875, 8.651611328125, 8.9625244140625, 9.2734375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 11.0, 26.0, 28.0, 26.0, 46.0, 63.0, 101.0, 149.0, 218.0, 312.0, 807.0, 6086.0, 371188.0, 3763225.0, 48539.0, 2017.0, 543.0, 266.0, 156.0, 118.0, 76.0, 67.0, 44.0, 41.0, 27.0, 25.0, 10.0, 9.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.3837890625, -36.923828125, -35.4638671875, -34.00390625, -32.5439453125, -31.083984375, -29.6240234375, -28.1640625, -26.7041015625, -25.244140625, -23.7841796875, -22.32421875, -20.8642578125, -19.404296875, -17.9443359375, -16.484375, -15.0244140625, -13.564453125, -12.1044921875, -10.64453125, -9.1845703125, -7.724609375, -6.2646484375, -4.8046875, -3.3447265625, -1.884765625, -0.4248046875, 1.03515625, 2.4951171875, 3.955078125, 5.4150390625, 6.875, 8.3349609375, 9.794921875, 11.2548828125, 12.71484375, 14.1748046875, 15.634765625, 17.0947265625, 18.5546875, 20.0146484375, 21.474609375, 22.9345703125, 24.39453125, 25.8544921875, 27.314453125, 28.7744140625, 30.234375, 31.6943359375, 33.154296875, 34.6142578125, 36.07421875, 37.5341796875, 38.994140625, 40.4541015625, 41.9140625, 43.3740234375, 44.833984375, 46.2939453125, 47.75390625, 49.2138671875, 50.673828125, 52.1337890625, 53.59375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 59.0, 173.0, 295.0, 310.0, 127.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.20521545410156, -181.99156188964844, -176.77792358398438, -171.56427001953125, -166.35061645507812, -161.136962890625, -155.92330932617188, -150.7096710205078, -145.4960174560547, -140.28236389160156, -135.0687255859375, -129.85507202148438, -124.64141845703125, -119.42776489257812, -114.21411895751953, -109.00047302246094, -103.78681945800781, -98.57316589355469, -93.3595199584961, -88.1458740234375, -82.93222045898438, -77.71856689453125, -72.50492095947266, -67.29127502441406, -62.07762145996094, -56.86397171020508, -51.65032196044922, -46.43667221069336, -41.2230224609375, -36.00937271118164, -30.79572296142578, -25.582073211669922, -20.368423461914062, -15.154773712158203, -9.941123962402344, -4.727474212646484, 0.486175537109375, 5.699825286865234, 10.913475036621094, 16.127124786376953, 21.340774536132812, 26.554424285888672, 31.76807403564453, 36.98172378540039, 42.19537353515625, 47.40902328491211, 52.62267303466797, 57.83632278442383, 63.04997253417969, 68.26362609863281, 73.4772720336914, 78.69091796875, 83.90457153320312, 89.11822509765625, 94.33187103271484, 99.54551696777344, 104.75917053222656, 109.97282409667969, 115.18647003173828, 120.40011596679688, 125.61376953125, 130.82742309570312, 136.04107666015625, 141.2547149658203, 146.46836853027344]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 9.0, 2.0, 6.0, 5.0, 8.0, 9.0, 17.0, 14.0, 15.0, 27.0, 21.0, 26.0, 46.0, 29.0, 35.0, 39.0, 39.0, 38.0, 43.0, 38.0, 38.0, 40.0, 31.0, 41.0, 35.0, 40.0, 33.0, 25.0, 43.0, 36.0, 25.0, 30.0, 22.0, 15.0, 24.0, 17.0, 5.0, 11.0, 7.0, 1.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.928253173828125, -39.651458740234375, -38.374664306640625, -37.09787368774414, -35.82107925415039, -34.54428482055664, -33.26749038696289, -31.99069595336914, -30.713903427124023, -29.437108993530273, -28.160316467285156, -26.883522033691406, -25.606727600097656, -24.32993507385254, -23.05314064025879, -21.776348114013672, -20.499553680419922, -19.222759246826172, -17.945966720581055, -16.669172286987305, -15.392378807067871, -14.115585327148438, -12.838790893554688, -11.561997413635254, -10.28520393371582, -9.008410453796387, -7.731616497039795, -6.454822540283203, -5.1780290603637695, -3.901235580444336, -2.624441623687744, -1.3476476669311523, -0.07085800170898438, 1.2059357166290283, 2.482729434967041, 3.7595231533050537, 5.036316871643066, 6.3131103515625, 7.589904308319092, 8.866698265075684, 10.143491744995117, 11.42028522491455, 12.697078704833984, 13.973873138427734, 15.250666618347168, 16.5274600982666, 17.80425453186035, 19.08104705810547, 20.35784149169922, 21.63463592529297, 22.911428451538086, 24.188222885131836, 25.465015411376953, 26.741809844970703, 28.018604278564453, 29.295398712158203, 30.57219123840332, 31.84898567199707, 33.12577819824219, 34.40257263183594, 35.67936706542969, 36.95616149902344, 38.23295211791992, 39.50974655151367, 40.78654098510742]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 45.0, 20.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 8.0, 23.0, 44.0, 58.0, 93.0, 140.0, 249.0, 402.0, 639.0, 1037.0, 1647.0, 2623.0, 4221.0, 6869.0, 11272.0, 19178.0, 32383.0, 56394.0, 97039.0, 159933.0, 213022.0, 175589.0, 109701.0, 64459.0, 36964.0, 21565.0, 12881.0, 7626.0, 4764.0, 2869.0, 1835.0, 1111.0, 689.0, 447.0, 285.0, 168.0, 121.0, 59.0, 40.0, 38.0, 15.0, 15.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.7861328125, -0.7640609741210938, -0.7419891357421875, -0.7199172973632812, -0.697845458984375, -0.6757736206054688, -0.6537017822265625, -0.6316299438476562, -0.60955810546875, -0.5874862670898438, -0.5654144287109375, -0.5433425903320312, -0.521270751953125, -0.49919891357421875, -0.4771270751953125, -0.45505523681640625, -0.4329833984375, -0.41091156005859375, -0.3888397216796875, -0.36676788330078125, -0.344696044921875, -0.32262420654296875, -0.3005523681640625, -0.27848052978515625, -0.25640869140625, -0.23433685302734375, -0.2122650146484375, -0.19019317626953125, -0.168121337890625, -0.14604949951171875, -0.1239776611328125, -0.10190582275390625, -0.079833984375, -0.05776214599609375, -0.0356903076171875, -0.01361846923828125, 0.008453369140625, 0.03052520751953125, 0.0525970458984375, 0.07466888427734375, 0.09674072265625, 0.11881256103515625, 0.1408843994140625, 0.16295623779296875, 0.185028076171875, 0.20709991455078125, 0.2291717529296875, 0.25124359130859375, 0.2733154296875, 0.29538726806640625, 0.3174591064453125, 0.33953094482421875, 0.361602783203125, 0.38367462158203125, 0.4057464599609375, 0.42781829833984375, 0.44989013671875, 0.47196197509765625, 0.4940338134765625, 0.5161056518554688, 0.538177490234375, 0.5602493286132812, 0.5823211669921875, 0.6043930053710938, 0.62646484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 12.0, 10.0, 11.0, 10.0, 19.0, 21.0, 20.0, 28.0, 28.0, 20.0, 31.0, 39.0, 33.0, 58.0, 44.0, 38.0, 1080.0, 51.0, 35.0, 42.0, 44.0, 31.0, 53.0, 35.0, 37.0, 38.0, 27.0, 26.0, 13.0, 15.0, 8.0, 13.0, 9.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.40118408203125, -4.2633056640625, -4.12542724609375, -3.987548828125, -3.84967041015625, -3.7117919921875, -3.57391357421875, -3.43603515625, -3.29815673828125, -3.1602783203125, -3.02239990234375, -2.884521484375, -2.74664306640625, -2.6087646484375, -2.47088623046875, -2.3330078125, -2.19512939453125, -2.0572509765625, -1.91937255859375, -1.781494140625, -1.64361572265625, -1.5057373046875, -1.36785888671875, -1.22998046875, -1.09210205078125, -0.9542236328125, -0.81634521484375, -0.678466796875, -0.54058837890625, -0.4027099609375, -0.26483154296875, -0.126953125, 0.01092529296875, 0.1488037109375, 0.28668212890625, 0.424560546875, 0.56243896484375, 0.7003173828125, 0.83819580078125, 0.97607421875, 1.11395263671875, 1.2518310546875, 1.38970947265625, 1.527587890625, 1.66546630859375, 1.8033447265625, 1.94122314453125, 2.0791015625, 2.21697998046875, 2.3548583984375, 2.49273681640625, 2.630615234375, 2.76849365234375, 2.9063720703125, 3.04425048828125, 3.18212890625, 3.32000732421875, 3.4578857421875, 3.59576416015625, 3.733642578125, 3.87152099609375, 4.0093994140625, 4.14727783203125, 4.28515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 17.0, 25.0, 32.0, 55.0, 69.0, 86.0, 172.0, 274.0, 424.0, 635.0, 1094.0, 1689.0, 2528.0, 3986.0, 6246.0, 9811.0, 15546.0, 24074.0, 37630.0, 58271.0, 87229.0, 121375.0, 506172.0, 843562.0, 122644.0, 87970.0, 58836.0, 38234.0, 24604.0, 15843.0, 10051.0, 6532.0, 4094.0, 2677.0, 1686.0, 1028.0, 650.0, 444.0, 297.0, 207.0, 115.0, 81.0, 49.0, 30.0, 15.0, 12.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.409423828125, -0.395782470703125, -0.38214111328125, -0.368499755859375, -0.3548583984375, -0.341217041015625, -0.32757568359375, -0.313934326171875, -0.30029296875, -0.286651611328125, -0.27301025390625, -0.259368896484375, -0.2457275390625, -0.232086181640625, -0.21844482421875, -0.204803466796875, -0.191162109375, -0.177520751953125, -0.16387939453125, -0.150238037109375, -0.1365966796875, -0.122955322265625, -0.10931396484375, -0.095672607421875, -0.08203125, -0.068389892578125, -0.05474853515625, -0.041107177734375, -0.0274658203125, -0.013824462890625, -0.00018310546875, 0.013458251953125, 0.027099609375, 0.040740966796875, 0.05438232421875, 0.068023681640625, 0.0816650390625, 0.095306396484375, 0.10894775390625, 0.122589111328125, 0.13623046875, 0.149871826171875, 0.16351318359375, 0.177154541015625, 0.1907958984375, 0.204437255859375, 0.21807861328125, 0.231719970703125, 0.245361328125, 0.259002685546875, 0.27264404296875, 0.286285400390625, 0.2999267578125, 0.313568115234375, 0.32720947265625, 0.340850830078125, 0.3544921875, 0.368133544921875, 0.38177490234375, 0.395416259765625, 0.4090576171875, 0.422698974609375, 0.43634033203125, 0.449981689453125, 0.463623046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 6.0, 3.0, 7.0, 6.0, 8.0, 13.0, 12.0, 21.0, 26.0, 17.0, 32.0, 35.0, 46.0, 41.0, 58.0, 79.0, 74.0, 64.0, 65.0, 52.0, 61.0, 49.0, 36.0, 29.0, 27.0, 19.0, 19.0, 18.0, 8.0, 11.0, 11.0, 7.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004188179969787598, -0.004065752029418945, -0.003943324089050293, -0.0038208961486816406, -0.0036984682083129883, -0.003576040267944336, -0.0034536123275756836, -0.0033311843872070312, -0.003208756446838379, -0.0030863285064697266, -0.0029639005661010742, -0.002841472625732422, -0.0027190446853637695, -0.002596616744995117, -0.002474188804626465, -0.0023517608642578125, -0.00222933292388916, -0.002106904983520508, -0.0019844770431518555, -0.0018620491027832031, -0.0017396211624145508, -0.0016171932220458984, -0.001494765281677246, -0.0013723373413085938, -0.0012499094009399414, -0.001127481460571289, -0.0010050535202026367, -0.0008826255798339844, -0.000760197639465332, -0.0006377696990966797, -0.0005153417587280273, -0.000392913818359375, -0.00027048587799072266, -0.0001480579376220703, -2.562999725341797e-05, 9.679794311523438e-05, 0.00021922588348388672, 0.00034165382385253906, 0.0004640817642211914, 0.0005865097045898438, 0.0007089376449584961, 0.0008313655853271484, 0.0009537935256958008, 0.0010762214660644531, 0.0011986494064331055, 0.0013210773468017578, 0.0014435052871704102, 0.0015659332275390625, 0.0016883611679077148, 0.0018107891082763672, 0.0019332170486450195, 0.002055644989013672, 0.0021780729293823242, 0.0023005008697509766, 0.002422928810119629, 0.0025453567504882812, 0.0026677846908569336, 0.002790212631225586, 0.0029126405715942383, 0.0030350685119628906, 0.003157496452331543, 0.0032799243927001953, 0.0034023523330688477, 0.0035247802734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 7.0, 11.0, 6.0, 12.0, 18.0, 17.0, 23.0, 22.0, 35.0, 57.0, 63.0, 126.0, 183.0, 316.0, 885.0, 34974.0, 1003709.0, 6674.0, 590.0, 279.0, 171.0, 107.0, 69.0, 28.0, 38.0, 29.0, 19.0, 14.0, 15.0, 18.0, 8.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08575439453125, -0.08301925659179688, -0.08028411865234375, -0.07754898071289062, -0.0748138427734375, -0.07207870483398438, -0.06934356689453125, -0.06660842895507812, -0.063873291015625, -0.061138153076171875, -0.05840301513671875, -0.055667877197265625, -0.0529327392578125, -0.050197601318359375, -0.04746246337890625, -0.044727325439453125, -0.0419921875, -0.039257049560546875, -0.03652191162109375, -0.033786773681640625, -0.0310516357421875, -0.028316497802734375, -0.02558135986328125, -0.022846221923828125, -0.020111083984375, -0.017375946044921875, -0.01464080810546875, -0.011905670166015625, -0.0091705322265625, -0.006435394287109375, -0.00370025634765625, -0.000965118408203125, 0.00177001953125, 0.004505157470703125, 0.00724029541015625, 0.009975433349609375, 0.0127105712890625, 0.015445709228515625, 0.01818084716796875, 0.020915985107421875, 0.023651123046875, 0.026386260986328125, 0.02912139892578125, 0.031856536865234375, 0.0345916748046875, 0.037326812744140625, 0.04006195068359375, 0.042797088623046875, 0.0455322265625, 0.048267364501953125, 0.05100250244140625, 0.053737640380859375, 0.0564727783203125, 0.059207916259765625, 0.06194305419921875, 0.06467819213867188, 0.067413330078125, 0.07014846801757812, 0.07288360595703125, 0.07561874389648438, 0.0783538818359375, 0.08108901977539062, 0.08382415771484375, 0.08655929565429688, 0.08929443359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 10.0, 174.0, 731.0, 93.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030269038397818804, -0.002339038299396634, -0.001651172642596066, -0.0009633069857954979, -0.0002754414454102516, 0.00041242409497499466, 0.0011002898681908846, 0.0017881554085761309, 0.002476020948961377, 0.0031638864893466234, 0.0038517522625625134, 0.00453961780294776, 0.005227483343333006, 0.005915348883718252, 0.006603214889764786, 0.007291080430150032, 0.007978945970535278, 0.008666811510920525, 0.009354677051305771, 0.010042542591691017, 0.010730408132076263, 0.01141827367246151, 0.012106139212846756, 0.012794004753232002, 0.013481870293617249, 0.014169735834002495, 0.014857601374387741, 0.015545466914772987, 0.016233332455158234, 0.01692119799554348, 0.017609063535928726, 0.018296929076313972, 0.018984796479344368, 0.019672662019729614, 0.02036052756011486, 0.021048393100500107, 0.021736258640885353, 0.0224241241812706, 0.023111989721655846, 0.023799855262041092, 0.024487720802426338, 0.025175586342811584, 0.02586345188319683, 0.026551317423582077, 0.027239182963967323, 0.02792704850435257, 0.028614914044737816, 0.029302779585123062, 0.029990646988153458, 0.030678512528538704, 0.03136637806892395, 0.032054245471954346, 0.03274210914969444, 0.03342997655272484, 0.034117840230464935, 0.03480570763349533, 0.03549357131123543, 0.03618143871426582, 0.03686930239200592, 0.037557169795036316, 0.03824503347277641, 0.03893290087580681, 0.039620764553546906, 0.0403086319565773, 0.0409964956343174]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 8.0, 12.0, 15.0, 17.0, 25.0, 28.0, 30.0, 35.0, 35.0, 50.0, 35.0, 38.0, 53.0, 41.0, 39.0, 39.0, 47.0, 51.0, 53.0, 45.0, 52.0, 37.0, 30.0, 26.0, 29.0, 21.0, 21.0, 14.0, 11.0, 16.0, 12.0, 14.0, 7.0, 1.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028460025787353516, -0.002757125534117222, -0.002668248489499092, -0.0025793714448809624, -0.0024904944002628326, -0.002401617355644703, -0.002312740311026573, -0.0022238632664084435, -0.0021349862217903137, -0.002046109177172184, -0.0019572321325540543, -0.0018683550879359245, -0.0017794780433177948, -0.001690600998699665, -0.0016017239540815353, -0.0015128469094634056, -0.0014239698648452759, -0.0013350928202271461, -0.0012462157756090164, -0.0011573387309908867, -0.001068461686372757, -0.0009795846417546272, -0.0008907075971364975, -0.0008018305525183678, -0.000712953507900238, -0.0006240764632821083, -0.0005351994186639786, -0.00044632237404584885, -0.0003574453294277191, -0.0002685682848095894, -0.00017969124019145966, -9.081419557332993e-05, -1.9371509552001953e-06, 8.693989366292953e-05, 0.00017581693828105927, 0.000264693982899189, 0.0003535710275173187, 0.00044244807213544846, 0.0005313251167535782, 0.0006202021613717079, 0.0007090792059898376, 0.0007979562506079674, 0.0008868332952260971, 0.0009757103398442268, 0.0010645873844623566, 0.0011534644290804863, 0.001242341473698616, 0.0013312185183167458, 0.0014200955629348755, 0.0015089726075530052, 0.001597849652171135, 0.0016867266967892647, 0.0017756037414073944, 0.0018644807860255241, 0.001953357830643654, 0.0020422348752617836, 0.0021311119198799133, 0.002219988964498043, 0.002308866009116173, 0.0023977430537343025, 0.0024866200983524323, 0.002575497142970562, 0.0026643741875886917, 0.0027532512322068214, 0.002842128276824951]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 46.0, 19.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 10.0, 16.0, 14.0, 20.0, 31.0, 59.0, 79.0, 115.0, 183.0, 341.0, 550.0, 965.0, 1789.0, 3440.0, 6680.0, 14493.0, 39002.0, 123582.0, 447300.0, 279982.0, 80562.0, 27073.0, 10958.0, 5087.0, 2693.0, 1473.0, 821.0, 484.0, 276.0, 153.0, 98.0, 61.0, 42.0, 26.0, 27.0, 19.0, 7.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.438720703125, -5.25634765625, -5.073974609375, -4.8916015625, -4.709228515625, -4.52685546875, -4.344482421875, -4.162109375, -3.979736328125, -3.79736328125, -3.614990234375, -3.4326171875, -3.250244140625, -3.06787109375, -2.885498046875, -2.703125, -2.520751953125, -2.33837890625, -2.156005859375, -1.9736328125, -1.791259765625, -1.60888671875, -1.426513671875, -1.244140625, -1.061767578125, -0.87939453125, -0.697021484375, -0.5146484375, -0.332275390625, -0.14990234375, 0.032470703125, 0.21484375, 0.397216796875, 0.57958984375, 0.761962890625, 0.9443359375, 1.126708984375, 1.30908203125, 1.491455078125, 1.673828125, 1.856201171875, 2.03857421875, 2.220947265625, 2.4033203125, 2.585693359375, 2.76806640625, 2.950439453125, 3.1328125, 3.315185546875, 3.49755859375, 3.679931640625, 3.8623046875, 4.044677734375, 4.22705078125, 4.409423828125, 4.591796875, 4.774169921875, 4.95654296875, 5.138916015625, 5.3212890625, 5.503662109375, 5.68603515625, 5.868408203125, 6.05078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 7.0, 15.0, 13.0, 13.0, 10.0, 24.0, 18.0, 27.0, 30.0, 35.0, 36.0, 32.0, 41.0, 61.0, 51.0, 69.0, 140.0, 1481.0, 322.0, 125.0, 80.0, 46.0, 38.0, 43.0, 32.0, 31.0, 31.0, 23.0, 28.0, 23.0, 16.0, 16.0, 15.0, 11.0, 9.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.09375, -18.49560546875, -17.8974609375, -17.29931640625, -16.701171875, -16.10302734375, -15.5048828125, -14.90673828125, -14.30859375, -13.71044921875, -13.1123046875, -12.51416015625, -11.916015625, -11.31787109375, -10.7197265625, -10.12158203125, -9.5234375, -8.92529296875, -8.3271484375, -7.72900390625, -7.130859375, -6.53271484375, -5.9345703125, -5.33642578125, -4.73828125, -4.14013671875, -3.5419921875, -2.94384765625, -2.345703125, -1.74755859375, -1.1494140625, -0.55126953125, 0.046875, 0.64501953125, 1.2431640625, 1.84130859375, 2.439453125, 3.03759765625, 3.6357421875, 4.23388671875, 4.83203125, 5.43017578125, 6.0283203125, 6.62646484375, 7.224609375, 7.82275390625, 8.4208984375, 9.01904296875, 9.6171875, 10.21533203125, 10.8134765625, 11.41162109375, 12.009765625, 12.60791015625, 13.2060546875, 13.80419921875, 14.40234375, 15.00048828125, 15.5986328125, 16.19677734375, 16.794921875, 17.39306640625, 17.9912109375, 18.58935546875, 19.1875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 21.0, 22.0, 48.0, 50.0, 94.0, 138.0, 198.0, 355.0, 845.0, 17680.0, 3120232.0, 4380.0, 695.0, 342.0, 194.0, 135.0, 77.0, 58.0, 31.0, 36.0, 14.0, 14.0, 8.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.1875, -95.75537109375, -93.3232421875, -90.89111328125, -88.458984375, -86.02685546875, -83.5947265625, -81.16259765625, -78.73046875, -76.29833984375, -73.8662109375, -71.43408203125, -69.001953125, -66.56982421875, -64.1376953125, -61.70556640625, -59.2734375, -56.84130859375, -54.4091796875, -51.97705078125, -49.544921875, -47.11279296875, -44.6806640625, -42.24853515625, -39.81640625, -37.38427734375, -34.9521484375, -32.52001953125, -30.087890625, -27.65576171875, -25.2236328125, -22.79150390625, -20.359375, -17.92724609375, -15.4951171875, -13.06298828125, -10.630859375, -8.19873046875, -5.7666015625, -3.33447265625, -0.90234375, 1.52978515625, 3.9619140625, 6.39404296875, 8.826171875, 11.25830078125, 13.6904296875, 16.12255859375, 18.5546875, 20.98681640625, 23.4189453125, 25.85107421875, 28.283203125, 30.71533203125, 33.1474609375, 35.57958984375, 38.01171875, 40.44384765625, 42.8759765625, 45.30810546875, 47.740234375, 50.17236328125, 52.6044921875, 55.03662109375, 57.46875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 29.0, 165.0, 345.0, 291.0, 139.0, 30.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.14201354980469, -51.978763580322266, -49.815513610839844, -47.652259826660156, -45.489009857177734, -43.32575988769531, -41.16250991821289, -38.99925994873047, -36.83600616455078, -34.67275619506836, -32.50950622558594, -30.346254348754883, -28.183002471923828, -26.019752502441406, -23.856502532958984, -21.693252563476562, -19.53000259399414, -17.36675262451172, -15.203500747680664, -13.040250778198242, -10.876999855041504, -8.713748931884766, -6.550498962402344, -4.3872480392456055, -2.223997116088867, -0.06074643135070801, 2.102504253387451, 4.265754699707031, 6.4290056228637695, 8.592256546020508, 10.75550651550293, 12.918757438659668, 15.082008361816406, 17.245258331298828, 19.408510208129883, 21.571760177612305, 23.73501205444336, 25.89826202392578, 28.061511993408203, 30.224761962890625, 32.38801574707031, 34.551265716552734, 36.714515686035156, 38.877769470214844, 41.041019439697266, 43.20426940917969, 45.36751937866211, 47.53076934814453, 49.69401931762695, 51.857269287109375, 54.0205192565918, 56.18376922607422, 58.347023010253906, 60.51027297973633, 62.67352294921875, 64.83677673339844, 67.0000228881836, 69.16327667236328, 71.32652282714844, 73.48977661132812, 75.65302276611328, 77.81627655029297, 79.97952270507812, 82.14277648925781, 84.3060302734375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 3.0, 6.0, 9.0, 5.0, 16.0, 15.0, 13.0, 18.0, 17.0, 21.0, 20.0, 24.0, 25.0, 23.0, 28.0, 40.0, 42.0, 31.0, 42.0, 50.0, 33.0, 47.0, 35.0, 29.0, 41.0, 35.0, 38.0, 27.0, 36.0, 27.0, 33.0, 24.0, 19.0, 16.0, 11.0, 12.0, 14.0, 9.0, 7.0, 11.0, 9.0, 10.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-53.2945556640625, -51.62506866455078, -49.95558166503906, -48.286094665527344, -46.616607666015625, -44.947120666503906, -43.27763748168945, -41.608150482177734, -39.938663482666016, -38.2691764831543, -36.59968948364258, -34.93020248413086, -33.260719299316406, -31.591230392456055, -29.92174530029297, -28.25225830078125, -26.58277130126953, -24.913284301757812, -23.243797302246094, -21.574312210083008, -19.90482521057129, -18.23533821105957, -16.565853118896484, -14.896366119384766, -13.226879119873047, -11.557392120361328, -9.887906074523926, -8.218420028686523, -6.548933029174805, -4.879446029663086, -3.2099599838256836, -1.5404739379882812, 0.1290130615234375, 1.798499584197998, 3.4679861068725586, 5.137472629547119, 6.80695915222168, 8.476446151733398, 10.1459321975708, 11.815418243408203, 13.484905242919922, 15.15439224243164, 16.82387924194336, 18.493364334106445, 20.162851333618164, 21.832338333129883, 23.50182342529297, 25.171310424804688, 26.840797424316406, 28.510284423828125, 30.179771423339844, 31.84925651550293, 33.51874542236328, 35.188232421875, 36.85771560668945, 38.52720260620117, 40.19668960571289, 41.86617660522461, 43.53566360473633, 45.20515060424805, 46.8746337890625, 48.54412078857422, 50.21360778808594, 51.883094787597656, 53.552581787109375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 12.0, 23.0, 17.0, 20.0, 24.0, 18.0, 34.0, 40.0, 33.0, 34.0, 48.0, 35.0, 34.0, 36.0, 44.0, 46.0, 48.0, 51.0, 43.0, 39.0, 38.0, 44.0, 24.0, 34.0, 17.0, 29.0, 14.0, 26.0, 16.0, 8.0, 7.0, 2.0, 11.0, 6.0, 6.0, 2.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.880126953125, -5.66259765625, -5.445068359375, -5.2275390625, -5.010009765625, -4.79248046875, -4.574951171875, -4.357421875, -4.139892578125, -3.92236328125, -3.704833984375, -3.4873046875, -3.269775390625, -3.05224609375, -2.834716796875, -2.6171875, -2.399658203125, -2.18212890625, -1.964599609375, -1.7470703125, -1.529541015625, -1.31201171875, -1.094482421875, -0.876953125, -0.659423828125, -0.44189453125, -0.224365234375, -0.0068359375, 0.210693359375, 0.42822265625, 0.645751953125, 0.86328125, 1.080810546875, 1.29833984375, 1.515869140625, 1.7333984375, 1.950927734375, 2.16845703125, 2.385986328125, 2.603515625, 2.821044921875, 3.03857421875, 3.256103515625, 3.4736328125, 3.691162109375, 3.90869140625, 4.126220703125, 4.34375, 4.561279296875, 4.77880859375, 4.996337890625, 5.2138671875, 5.431396484375, 5.64892578125, 5.866455078125, 6.083984375, 6.301513671875, 6.51904296875, 6.736572265625, 6.9541015625, 7.171630859375, 7.38916015625, 7.606689453125, 7.82421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 2.0, 7.0, 11.0, 12.0, 16.0, 22.0, 23.0, 24.0, 24.0, 31.0, 37.0, 45.0, 65.0, 139.0, 476.0, 2103.0, 16446.0, 531872.0, 3454642.0, 177468.0, 8556.0, 1462.0, 357.0, 129.0, 73.0, 45.0, 36.0, 29.0, 24.0, 23.0, 17.0, 16.0, 8.0, 11.0, 5.0, 9.0, 2.0, 7.0, 9.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.661865234375, -20.87060546875, -20.079345703125, -19.2880859375, -18.496826171875, -17.70556640625, -16.914306640625, -16.123046875, -15.331787109375, -14.54052734375, -13.749267578125, -12.9580078125, -12.166748046875, -11.37548828125, -10.584228515625, -9.79296875, -9.001708984375, -8.21044921875, -7.419189453125, -6.6279296875, -5.836669921875, -5.04541015625, -4.254150390625, -3.462890625, -2.671630859375, -1.88037109375, -1.089111328125, -0.2978515625, 0.493408203125, 1.28466796875, 2.075927734375, 2.8671875, 3.658447265625, 4.44970703125, 5.240966796875, 6.0322265625, 6.823486328125, 7.61474609375, 8.406005859375, 9.197265625, 9.988525390625, 10.77978515625, 11.571044921875, 12.3623046875, 13.153564453125, 13.94482421875, 14.736083984375, 15.52734375, 16.318603515625, 17.10986328125, 17.901123046875, 18.6923828125, 19.483642578125, 20.27490234375, 21.066162109375, 21.857421875, 22.648681640625, 23.43994140625, 24.231201171875, 25.0224609375, 25.813720703125, 26.60498046875, 27.396240234375, 28.1875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 6.0, 12.0, 23.0, 17.0, 28.0, 28.0, 50.0, 53.0, 78.0, 100.0, 138.0, 170.0, 278.0, 350.0, 404.0, 497.0, 435.0, 359.0, 251.0, 196.0, 161.0, 122.0, 79.0, 74.0, 49.0, 25.0, 22.0, 18.0, 10.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.5859375, -11.1800537109375, -10.774169921875, -10.3682861328125, -9.96240234375, -9.5565185546875, -9.150634765625, -8.7447509765625, -8.3388671875, -7.9329833984375, -7.527099609375, -7.1212158203125, -6.71533203125, -6.3094482421875, -5.903564453125, -5.4976806640625, -5.091796875, -4.6859130859375, -4.280029296875, -3.8741455078125, -3.46826171875, -3.0623779296875, -2.656494140625, -2.2506103515625, -1.8447265625, -1.4388427734375, -1.032958984375, -0.6270751953125, -0.22119140625, 0.1846923828125, 0.590576171875, 0.9964599609375, 1.40234375, 1.8082275390625, 2.214111328125, 2.6199951171875, 3.02587890625, 3.4317626953125, 3.837646484375, 4.2435302734375, 4.6494140625, 5.0552978515625, 5.461181640625, 5.8670654296875, 6.27294921875, 6.6788330078125, 7.084716796875, 7.4906005859375, 7.896484375, 8.3023681640625, 8.708251953125, 9.1141357421875, 9.52001953125, 9.9259033203125, 10.331787109375, 10.7376708984375, 11.1435546875, 11.5494384765625, 11.955322265625, 12.3612060546875, 12.76708984375, 13.1729736328125, 13.578857421875, 13.9847412109375, 14.390625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 14.0, 10.0, 16.0, 33.0, 26.0, 35.0, 51.0, 99.0, 98.0, 148.0, 171.0, 234.0, 312.0, 706.0, 3268.0, 134564.0, 3938568.0, 111124.0, 2926.0, 636.0, 301.0, 215.0, 164.0, 108.0, 103.0, 62.0, 59.0, 62.0, 37.0, 36.0, 21.0, 18.0, 10.0, 19.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-54.0625, -52.58056640625, -51.0986328125, -49.61669921875, -48.134765625, -46.65283203125, -45.1708984375, -43.68896484375, -42.20703125, -40.72509765625, -39.2431640625, -37.76123046875, -36.279296875, -34.79736328125, -33.3154296875, -31.83349609375, -30.3515625, -28.86962890625, -27.3876953125, -25.90576171875, -24.423828125, -22.94189453125, -21.4599609375, -19.97802734375, -18.49609375, -17.01416015625, -15.5322265625, -14.05029296875, -12.568359375, -11.08642578125, -9.6044921875, -8.12255859375, -6.640625, -5.15869140625, -3.6767578125, -2.19482421875, -0.712890625, 0.76904296875, 2.2509765625, 3.73291015625, 5.21484375, 6.69677734375, 8.1787109375, 9.66064453125, 11.142578125, 12.62451171875, 14.1064453125, 15.58837890625, 17.0703125, 18.55224609375, 20.0341796875, 21.51611328125, 22.998046875, 24.47998046875, 25.9619140625, 27.44384765625, 28.92578125, 30.40771484375, 31.8896484375, 33.37158203125, 34.853515625, 36.33544921875, 37.8173828125, 39.29931640625, 40.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 7.0, 17.0, 25.0, 59.0, 83.0, 119.0, 158.0, 128.0, 137.0, 107.0, 67.0, 50.0, 21.0, 10.0, 11.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-115.23910522460938, -112.9880599975586, -110.73701477050781, -108.48597717285156, -106.23493194580078, -103.98388671875, -101.73284912109375, -99.48180389404297, -97.23075866699219, -94.9797134399414, -92.72866821289062, -90.47763061523438, -88.2265853881836, -85.97554016113281, -83.72450256347656, -81.47345733642578, -79.222412109375, -76.97136688232422, -74.72032165527344, -72.46928405761719, -70.2182388305664, -67.96719360351562, -65.71615600585938, -63.465110778808594, -61.21406555175781, -58.96302032470703, -56.711978912353516, -54.4609375, -52.20989227294922, -49.95884704589844, -47.70780563354492, -45.456764221191406, -43.205718994140625, -40.954673767089844, -38.70363235473633, -36.45259094238281, -34.20154571533203, -31.950502395629883, -29.699459075927734, -27.448415756225586, -25.197372436523438, -22.94632911682129, -20.69528579711914, -18.444242477416992, -16.193199157714844, -13.942155838012695, -11.691112518310547, -9.440069198608398, -7.18902587890625, -4.937982559204102, -2.686939239501953, -0.4358959197998047, 1.8151473999023438, 4.066190719604492, 6.317234039306641, 8.568277359008789, 10.819320678710938, 13.070363998413086, 15.321407318115234, 17.572450637817383, 19.82349395751953, 22.07453727722168, 24.325580596923828, 26.576623916625977, 28.827667236328125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 10.0, 5.0, 13.0, 13.0, 13.0, 23.0, 24.0, 20.0, 32.0, 32.0, 28.0, 28.0, 34.0, 32.0, 32.0, 41.0, 39.0, 33.0, 50.0, 38.0, 40.0, 44.0, 35.0, 38.0, 30.0, 30.0, 33.0, 20.0, 21.0, 19.0, 22.0, 20.0, 9.0, 19.0, 12.0, 7.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0], "bins": [-43.00483703613281, -41.735206604003906, -40.465576171875, -39.195945739746094, -37.92631530761719, -36.65668487548828, -35.387054443359375, -34.11742401123047, -32.84779357910156, -31.578163146972656, -30.30853271484375, -29.038902282714844, -27.769271850585938, -26.49964141845703, -25.230010986328125, -23.96038055419922, -22.69074821472168, -21.421117782592773, -20.151487350463867, -18.88185691833496, -17.612226486206055, -16.34259605407715, -15.072964668273926, -13.80333423614502, -12.533703804016113, -11.264073371887207, -9.9944429397583, -8.724811553955078, -7.45518159866333, -6.185551166534424, -4.915920257568359, -3.646289825439453, -2.376659393310547, -1.107028841972351, 0.16260170936584473, 1.43223237991333, 2.7018628120422363, 3.9714932441711426, 5.241124153137207, 6.510754585266113, 7.7803850173950195, 9.050015449523926, 10.319645881652832, 11.589277267456055, 12.858907699584961, 14.128538131713867, 15.398168563842773, 16.66779899597168, 17.937429428100586, 19.207059860229492, 20.4766902923584, 21.746320724487305, 23.01595115661621, 24.285581588745117, 25.555213928222656, 26.824844360351562, 28.09447479248047, 29.364105224609375, 30.63373565673828, 31.903366088867188, 33.172996520996094, 34.442626953125, 35.712257385253906, 36.98188781738281, 38.25151824951172]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 35.0, 33.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 26.0, 21.0, 30.0, 67.0, 69.0, 115.0, 162.0, 273.0, 385.0, 583.0, 1000.0, 1649.0, 2700.0, 4519.0, 7448.0, 12728.0, 22059.0, 38313.0, 68366.0, 120543.0, 193181.0, 217486.0, 151132.0, 88146.0, 49291.0, 28197.0, 16300.0, 9444.0, 5595.0, 3291.0, 2009.0, 1240.0, 783.0, 490.0, 303.0, 209.0, 141.0, 69.0, 63.0, 27.0, 25.0, 20.0, 9.0, 15.0, 10.0, 3.0, 2.0, 1.0, 8.0, 1.0, 2.0], "bins": [-0.8544921875, -0.8295211791992188, -0.8045501708984375, -0.7795791625976562, -0.754608154296875, -0.7296371459960938, -0.7046661376953125, -0.6796951293945312, -0.65472412109375, -0.6297531127929688, -0.6047821044921875, -0.5798110961914062, -0.554840087890625, -0.5298690795898438, -0.5048980712890625, -0.47992706298828125, -0.4549560546875, -0.42998504638671875, -0.4050140380859375, -0.38004302978515625, -0.355072021484375, -0.33010101318359375, -0.3051300048828125, -0.28015899658203125, -0.25518798828125, -0.23021697998046875, -0.2052459716796875, -0.18027496337890625, -0.155303955078125, -0.13033294677734375, -0.1053619384765625, -0.08039093017578125, -0.055419921875, -0.03044891357421875, -0.0054779052734375, 0.01949310302734375, 0.044464111328125, 0.06943511962890625, 0.0944061279296875, 0.11937713623046875, 0.14434814453125, 0.16931915283203125, 0.1942901611328125, 0.21926116943359375, 0.244232177734375, 0.26920318603515625, 0.2941741943359375, 0.31914520263671875, 0.3441162109375, 0.36908721923828125, 0.3940582275390625, 0.41902923583984375, 0.444000244140625, 0.46897125244140625, 0.4939422607421875, 0.5189132690429688, 0.54388427734375, 0.5688552856445312, 0.5938262939453125, 0.6187973022460938, 0.643768310546875, 0.6687393188476562, 0.6937103271484375, 0.7186813354492188, 0.74365234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 2.0, 4.0, 11.0, 13.0, 13.0, 14.0, 11.0, 13.0, 19.0, 26.0, 21.0, 32.0, 28.0, 30.0, 36.0, 31.0, 32.0, 32.0, 37.0, 36.0, 32.0, 1066.0, 37.0, 36.0, 38.0, 31.0, 38.0, 26.0, 36.0, 25.0, 23.0, 26.0, 26.0, 19.0, 16.0, 7.0, 17.0, 11.0, 16.0, 14.0, 8.0, 4.0, 6.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.509765625, -3.39788818359375, -3.2860107421875, -3.17413330078125, -3.062255859375, -2.95037841796875, -2.8385009765625, -2.72662353515625, -2.61474609375, -2.50286865234375, -2.3909912109375, -2.27911376953125, -2.167236328125, -2.05535888671875, -1.9434814453125, -1.83160400390625, -1.7197265625, -1.60784912109375, -1.4959716796875, -1.38409423828125, -1.272216796875, -1.16033935546875, -1.0484619140625, -0.93658447265625, -0.82470703125, -0.71282958984375, -0.6009521484375, -0.48907470703125, -0.377197265625, -0.26531982421875, -0.1534423828125, -0.04156494140625, 0.0703125, 0.18218994140625, 0.2940673828125, 0.40594482421875, 0.517822265625, 0.62969970703125, 0.7415771484375, 0.85345458984375, 0.96533203125, 1.07720947265625, 1.1890869140625, 1.30096435546875, 1.412841796875, 1.52471923828125, 1.6365966796875, 1.74847412109375, 1.8603515625, 1.97222900390625, 2.0841064453125, 2.19598388671875, 2.307861328125, 2.41973876953125, 2.5316162109375, 2.64349365234375, 2.75537109375, 2.86724853515625, 2.9791259765625, 3.09100341796875, 3.202880859375, 3.31475830078125, 3.4266357421875, 3.53851318359375, 3.650390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 19.0, 31.0, 78.0, 96.0, 215.0, 277.0, 446.0, 685.0, 1219.0, 1887.0, 2982.0, 4802.0, 7588.0, 11936.0, 19156.0, 30000.0, 47377.0, 73601.0, 110181.0, 148516.0, 1211482.0, 140107.0, 100719.0, 67169.0, 43015.0, 27496.0, 16985.0, 10812.0, 6888.0, 4241.0, 2692.0, 1684.0, 1054.0, 648.0, 403.0, 252.0, 144.0, 79.0, 57.0, 36.0, 16.0, 23.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46044921875, -0.4457817077636719, -0.43111419677734375, -0.4164466857910156, -0.4017791748046875, -0.3871116638183594, -0.37244415283203125, -0.3577766418457031, -0.343109130859375, -0.3284416198730469, -0.31377410888671875, -0.2991065979003906, -0.2844390869140625, -0.2697715759277344, -0.25510406494140625, -0.24043655395507812, -0.22576904296875, -0.21110153198242188, -0.19643402099609375, -0.18176651000976562, -0.1670989990234375, -0.15243148803710938, -0.13776397705078125, -0.12309646606445312, -0.108428955078125, -0.09376144409179688, -0.07909393310546875, -0.06442642211914062, -0.0497589111328125, -0.035091400146484375, -0.02042388916015625, -0.005756378173828125, 0.0089111328125, 0.023578643798828125, 0.03824615478515625, 0.052913665771484375, 0.0675811767578125, 0.08224868774414062, 0.09691619873046875, 0.11158370971679688, 0.126251220703125, 0.14091873168945312, 0.15558624267578125, 0.17025375366210938, 0.1849212646484375, 0.19958877563476562, 0.21425628662109375, 0.22892379760742188, 0.24359130859375, 0.2582588195800781, 0.27292633056640625, 0.2875938415527344, 0.3022613525390625, 0.3169288635253906, 0.33159637451171875, 0.3462638854980469, 0.360931396484375, 0.3755989074707031, 0.39026641845703125, 0.4049339294433594, 0.4196014404296875, 0.4342689514160156, 0.44893646240234375, 0.4636039733886719, 0.478271484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 15.0, 19.0, 21.0, 20.0, 17.0, 34.0, 32.0, 34.0, 45.0, 51.0, 67.0, 84.0, 72.0, 68.0, 56.0, 53.0, 37.0, 46.0, 39.0, 36.0, 27.0, 11.0, 12.0, 18.0, 10.0, 11.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042572021484375, -0.004100680351257324, -0.0039441585540771484, -0.0037876367568969727, -0.003631114959716797, -0.003474593162536621, -0.0033180713653564453, -0.0031615495681762695, -0.0030050277709960938, -0.002848505973815918, -0.002691984176635742, -0.0025354623794555664, -0.0023789405822753906, -0.002222418785095215, -0.002065896987915039, -0.0019093751907348633, -0.0017528533935546875, -0.0015963315963745117, -0.001439809799194336, -0.0012832880020141602, -0.0011267662048339844, -0.0009702444076538086, -0.0008137226104736328, -0.000657200813293457, -0.0005006790161132812, -0.00034415721893310547, -0.0001876354217529297, -3.1113624572753906e-05, 0.00012540817260742188, 0.00028192996978759766, 0.00043845176696777344, 0.0005949735641479492, 0.000751495361328125, 0.0009080171585083008, 0.0010645389556884766, 0.0012210607528686523, 0.0013775825500488281, 0.001534104347229004, 0.0016906261444091797, 0.0018471479415893555, 0.0020036697387695312, 0.002160191535949707, 0.002316713333129883, 0.0024732351303100586, 0.0026297569274902344, 0.00278627872467041, 0.002942800521850586, 0.0030993223190307617, 0.0032558441162109375, 0.0034123659133911133, 0.003568887710571289, 0.003725409507751465, 0.0038819313049316406, 0.004038453102111816, 0.004194974899291992, 0.004351496696472168, 0.004508018493652344, 0.0046645402908325195, 0.004821062088012695, 0.004977583885192871, 0.005134105682373047, 0.005290627479553223, 0.0054471492767333984, 0.005603671073913574, 0.00576019287109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 8.0, 3.0, 1.0, 10.0, 14.0, 12.0, 16.0, 20.0, 23.0, 27.0, 47.0, 64.0, 61.0, 95.0, 151.0, 230.0, 536.0, 4533.0, 844770.0, 194827.0, 2039.0, 414.0, 163.0, 109.0, 66.0, 62.0, 60.0, 28.0, 23.0, 38.0, 28.0, 15.0, 8.0, 15.0, 6.0, 5.0, 7.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.11370849609375, -0.11062431335449219, -0.10754013061523438, -0.10445594787597656, -0.10137176513671875, -0.09828758239746094, -0.09520339965820312, -0.09211921691894531, -0.0890350341796875, -0.08595085144042969, -0.08286666870117188, -0.07978248596191406, -0.07669830322265625, -0.07361412048339844, -0.07052993774414062, -0.06744575500488281, -0.064361572265625, -0.06127738952636719, -0.058193206787109375, -0.05510902404785156, -0.05202484130859375, -0.04894065856933594, -0.045856475830078125, -0.04277229309082031, -0.0396881103515625, -0.03660392761230469, -0.033519744873046875, -0.030435562133789062, -0.02735137939453125, -0.024267196655273438, -0.021183013916015625, -0.018098831176757812, -0.0150146484375, -0.011930465698242188, -0.008846282958984375, -0.0057621002197265625, -0.00267791748046875, 0.0004062652587890625, 0.003490447998046875, 0.0065746307373046875, 0.0096588134765625, 0.012742996215820312, 0.015827178955078125, 0.018911361694335938, 0.02199554443359375, 0.025079727172851562, 0.028163909912109375, 0.031248092651367188, 0.034332275390625, 0.03741645812988281, 0.040500640869140625, 0.04358482360839844, 0.04666900634765625, 0.04975318908691406, 0.052837371826171875, 0.05592155456542969, 0.0590057373046875, 0.06208992004394531, 0.06517410278320312, 0.06825828552246094, 0.07134246826171875, 0.07442665100097656, 0.07751083374023438, 0.08059501647949219, 0.08367919921875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 85.0, 678.0, 219.0, 25.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032518741209059954, -0.002353122690692544, -0.0014543713768944144, -0.0005556200630962849, 0.0003431313671171665, 0.0012418825644999743, 0.0021406339947134256, 0.003039385424926877, 0.003938136622309685, 0.004836888052523136, 0.0057356394827365875, 0.006634390912950039, 0.00753314234316349, 0.008431892842054367, 0.009330645203590393, 0.01022939570248127, 0.011128148064017296, 0.012026899494230747, 0.012925650924444199, 0.01382440235465765, 0.014723153784871101, 0.015621904283761978, 0.016520656645298004, 0.01741940714418888, 0.018318159505724907, 0.019216910004615784, 0.02011566236615181, 0.021014412865042686, 0.021913165226578712, 0.02281191572546959, 0.023710668087005615, 0.024609418585896492, 0.025508170947432518, 0.026406921446323395, 0.02730567380785942, 0.028204424306750298, 0.029103176668286324, 0.0300019271671772, 0.030900679528713226, 0.03179943189024925, 0.03269818052649498, 0.033596932888031006, 0.03449568152427673, 0.03539443388581276, 0.036293186247348785, 0.03719193860888481, 0.03809068724513054, 0.038989439606666565, 0.03988819196820259, 0.04078694432973862, 0.041685692965984344, 0.04258444532752037, 0.043483197689056396, 0.04438195005059242, 0.04528069868683815, 0.046179451048374176, 0.0470782034099102, 0.04797695577144623, 0.048875704407691956, 0.04977445676922798, 0.05067320913076401, 0.051571961492300034, 0.05247071012854576, 0.05336946249008179, 0.05426821485161781]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 5.0, 14.0, 15.0, 12.0, 23.0, 26.0, 31.0, 32.0, 42.0, 38.0, 31.0, 37.0, 47.0, 54.0, 64.0, 55.0, 57.0, 54.0, 57.0, 47.0, 46.0, 36.0, 34.0, 23.0, 23.0, 26.0, 10.0, 8.0, 15.0, 7.0, 9.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004744350910186768, -0.004613455384969711, -0.004482559859752655, -0.004351664334535599, -0.0042207688093185425, -0.004089873284101486, -0.00395897775888443, -0.0038280822336673737, -0.0036971867084503174, -0.003566291183233261, -0.003435395658016205, -0.0033045001327991486, -0.0031736046075820923, -0.003042709082365036, -0.0029118135571479797, -0.0027809180319309235, -0.002650022506713867, -0.002519126981496811, -0.0023882314562797546, -0.0022573359310626984, -0.002126440405845642, -0.001995544880628586, -0.0018646493554115295, -0.0017337538301944733, -0.001602858304977417, -0.0014719627797603607, -0.0013410672545433044, -0.0012101717293262482, -0.001079276204109192, -0.0009483806788921356, -0.0008174851536750793, -0.0006865896284580231, -0.0005556941032409668, -0.0004247985780239105, -0.00029390305280685425, -0.00016300752758979797, -3.21120023727417e-05, 9.878352284431458e-05, 0.00022967904806137085, 0.0003605745732784271, 0.0004914700984954834, 0.0006223656237125397, 0.000753261148929596, 0.0008841566741466522, 0.0010150521993637085, 0.0011459477245807648, 0.001276843249797821, 0.0014077387750148773, 0.0015386343002319336, 0.0016695298254489899, 0.0018004253506660461, 0.0019313208758831024, 0.0020622164011001587, 0.002193111926317215, 0.0023240074515342712, 0.0024549029767513275, 0.002585798501968384, 0.00271669402718544, 0.0028475895524024963, 0.0029784850776195526, 0.003109380602836609, 0.003240276128053665, 0.0033711716532707214, 0.0035020671784877777, 0.003632962703704834]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 34.0, 34.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 7.0, 7.0, 9.0, 18.0, 23.0, 37.0, 43.0, 51.0, 85.0, 112.0, 200.0, 268.0, 480.0, 791.0, 1395.0, 2436.0, 4623.0, 8854.0, 18548.0, 43427.0, 120629.0, 387109.0, 298168.0, 93773.0, 35318.0, 15425.0, 7420.0, 3983.0, 2167.0, 1195.0, 722.0, 429.0, 251.0, 183.0, 111.0, 72.0, 58.0, 37.0, 28.0, 16.0, 17.0, 9.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.50421142578125, -4.3482666015625, -4.19232177734375, -4.036376953125, -3.88043212890625, -3.7244873046875, -3.56854248046875, -3.41259765625, -3.25665283203125, -3.1007080078125, -2.94476318359375, -2.788818359375, -2.63287353515625, -2.4769287109375, -2.32098388671875, -2.1650390625, -2.00909423828125, -1.8531494140625, -1.69720458984375, -1.541259765625, -1.38531494140625, -1.2293701171875, -1.07342529296875, -0.91748046875, -0.76153564453125, -0.6055908203125, -0.44964599609375, -0.293701171875, -0.13775634765625, 0.0181884765625, 0.17413330078125, 0.330078125, 0.48602294921875, 0.6419677734375, 0.79791259765625, 0.953857421875, 1.10980224609375, 1.2657470703125, 1.42169189453125, 1.57763671875, 1.73358154296875, 1.8895263671875, 2.04547119140625, 2.201416015625, 2.35736083984375, 2.5133056640625, 2.66925048828125, 2.8251953125, 2.98114013671875, 3.1370849609375, 3.29302978515625, 3.448974609375, 3.60491943359375, 3.7608642578125, 3.91680908203125, 4.07275390625, 4.22869873046875, 4.3846435546875, 4.54058837890625, 4.696533203125, 4.85247802734375, 5.0084228515625, 5.16436767578125, 5.3203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 4.0, 12.0, 14.0, 17.0, 12.0, 15.0, 14.0, 21.0, 22.0, 20.0, 29.0, 34.0, 25.0, 43.0, 30.0, 54.0, 83.0, 235.0, 1648.0, 194.0, 67.0, 54.0, 48.0, 38.0, 39.0, 28.0, 30.0, 24.0, 32.0, 22.0, 17.0, 18.0, 11.0, 11.0, 18.0, 12.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.59375, -19.008056640625, -18.42236328125, -17.836669921875, -17.2509765625, -16.665283203125, -16.07958984375, -15.493896484375, -14.908203125, -14.322509765625, -13.73681640625, -13.151123046875, -12.5654296875, -11.979736328125, -11.39404296875, -10.808349609375, -10.22265625, -9.636962890625, -9.05126953125, -8.465576171875, -7.8798828125, -7.294189453125, -6.70849609375, -6.122802734375, -5.537109375, -4.951416015625, -4.36572265625, -3.780029296875, -3.1943359375, -2.608642578125, -2.02294921875, -1.437255859375, -0.8515625, -0.265869140625, 0.31982421875, 0.905517578125, 1.4912109375, 2.076904296875, 2.66259765625, 3.248291015625, 3.833984375, 4.419677734375, 5.00537109375, 5.591064453125, 6.1767578125, 6.762451171875, 7.34814453125, 7.933837890625, 8.51953125, 9.105224609375, 9.69091796875, 10.276611328125, 10.8623046875, 11.447998046875, 12.03369140625, 12.619384765625, 13.205078125, 13.790771484375, 14.37646484375, 14.962158203125, 15.5478515625, 16.133544921875, 16.71923828125, 17.304931640625, 17.890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 5.0, 13.0, 11.0, 16.0, 28.0, 35.0, 43.0, 59.0, 87.0, 122.0, 172.0, 236.0, 362.0, 653.0, 7978.0, 3091226.0, 42388.0, 932.0, 392.0, 246.0, 181.0, 128.0, 86.0, 64.0, 50.0, 42.0, 30.0, 28.0, 15.0, 16.0, 13.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-64.1875, -62.3876953125, -60.587890625, -58.7880859375, -56.98828125, -55.1884765625, -53.388671875, -51.5888671875, -49.7890625, -47.9892578125, -46.189453125, -44.3896484375, -42.58984375, -40.7900390625, -38.990234375, -37.1904296875, -35.390625, -33.5908203125, -31.791015625, -29.9912109375, -28.19140625, -26.3916015625, -24.591796875, -22.7919921875, -20.9921875, -19.1923828125, -17.392578125, -15.5927734375, -13.79296875, -11.9931640625, -10.193359375, -8.3935546875, -6.59375, -4.7939453125, -2.994140625, -1.1943359375, 0.60546875, 2.4052734375, 4.205078125, 6.0048828125, 7.8046875, 9.6044921875, 11.404296875, 13.2041015625, 15.00390625, 16.8037109375, 18.603515625, 20.4033203125, 22.203125, 24.0029296875, 25.802734375, 27.6025390625, 29.40234375, 31.2021484375, 33.001953125, 34.8017578125, 36.6015625, 38.4013671875, 40.201171875, 42.0009765625, 43.80078125, 45.6005859375, 47.400390625, 49.2001953125, 51.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [3.0, 4.0, 41.0, 400.0, 483.0, 82.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.019357681274414, -9.892585754394531, -6.76581335067749, -3.639040946960449, -0.5122690200805664, 2.6145029067993164, 5.741275787353516, 8.868047714233398, 11.994819641113281, 15.121591567993164, 18.248363494873047, 21.375137329101562, 24.501907348632812, 27.628681182861328, 30.75545310974121, 33.882225036621094, 37.008995056152344, 40.13576889038086, 43.26253890991211, 46.389312744140625, 49.516082763671875, 52.64285659790039, 55.769630432128906, 58.896400451660156, 62.02317428588867, 65.14994812011719, 68.27671813964844, 71.40348815917969, 74.53026580810547, 77.65703582763672, 80.78380584716797, 83.91058349609375, 87.03734588623047, 90.16411590576172, 93.2908935546875, 96.41766357421875, 99.54443359375, 102.67120361328125, 105.79798126220703, 108.92475128173828, 112.05152130126953, 115.17829132080078, 118.30506896972656, 121.43183898925781, 124.55860900878906, 127.68537902832031, 130.81214904785156, 133.93893432617188, 137.06570434570312, 140.19247436523438, 143.31924438476562, 146.44601440429688, 149.5727996826172, 152.69956970214844, 155.8263397216797, 158.95310974121094, 162.0798797607422, 165.20664978027344, 168.3334197998047, 171.46018981933594, 174.58697509765625, 177.7137451171875, 180.84051513671875, 183.96728515625, 187.09405517578125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 14.0, 4.0, 12.0, 14.0, 12.0, 16.0, 22.0, 22.0, 28.0, 27.0, 32.0, 32.0, 33.0, 54.0, 44.0, 40.0, 55.0, 34.0, 66.0, 52.0, 44.0, 43.0, 31.0, 41.0, 34.0, 24.0, 38.0, 33.0, 23.0, 17.0, 14.0, 10.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.58349609375, -51.70321273803711, -49.82292556762695, -47.94264221191406, -46.062355041503906, -44.182071685791016, -42.301788330078125, -40.42150115966797, -38.54121780395508, -36.66093444824219, -34.78064727783203, -32.90036392211914, -31.020078659057617, -29.139793395996094, -27.25950813293457, -25.379222869873047, -23.498937606811523, -21.61865234375, -19.738367080688477, -17.858081817626953, -15.977798461914062, -14.097513198852539, -12.217227935791016, -10.336943626403809, -8.456658363342285, -6.57637357711792, -4.696088790893555, -2.8158035278320312, -0.935518741607666, 0.9447660446166992, 2.8250513076782227, 4.70533561706543, 6.585620880126953, 8.465906143188477, 10.346190452575684, 12.226475715637207, 14.106760025024414, 15.987045288085938, 17.86733055114746, 19.747615814208984, 21.627899169921875, 23.5081844329834, 25.388469696044922, 27.268753051757812, 29.149038314819336, 31.02932357788086, 32.90960693359375, 34.789894104003906, 36.67018127441406, 38.55046463012695, 40.43075180053711, 42.31103515625, 44.191322326660156, 46.07160568237305, 47.95188903808594, 49.832176208496094, 51.712459564208984, 53.592742919921875, 55.47303009033203, 57.35331344604492, 59.23360061645508, 61.11388397216797, 62.994171142578125, 64.87445068359375, 66.7547378540039]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 9.0, 11.0, 10.0, 6.0, 10.0, 20.0, 27.0, 19.0, 17.0, 23.0, 25.0, 40.0, 36.0, 38.0, 34.0, 35.0, 40.0, 44.0, 38.0, 50.0, 40.0, 38.0, 33.0, 34.0, 40.0, 36.0, 24.0, 25.0, 30.0, 21.0, 19.0, 15.0, 21.0, 15.0, 9.0, 12.0, 6.0, 9.0, 2.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.37542724609375, -5.1766357421875, -4.97784423828125, -4.779052734375, -4.58026123046875, -4.3814697265625, -4.18267822265625, -3.98388671875, -3.78509521484375, -3.5863037109375, -3.38751220703125, -3.188720703125, -2.98992919921875, -2.7911376953125, -2.59234619140625, -2.3935546875, -2.19476318359375, -1.9959716796875, -1.79718017578125, -1.598388671875, -1.39959716796875, -1.2008056640625, -1.00201416015625, -0.80322265625, -0.60443115234375, -0.4056396484375, -0.20684814453125, -0.008056640625, 0.19073486328125, 0.3895263671875, 0.58831787109375, 0.787109375, 0.98590087890625, 1.1846923828125, 1.38348388671875, 1.582275390625, 1.78106689453125, 1.9798583984375, 2.17864990234375, 2.37744140625, 2.57623291015625, 2.7750244140625, 2.97381591796875, 3.172607421875, 3.37139892578125, 3.5701904296875, 3.76898193359375, 3.9677734375, 4.16656494140625, 4.3653564453125, 4.56414794921875, 4.762939453125, 4.96173095703125, 5.1605224609375, 5.35931396484375, 5.55810546875, 5.75689697265625, 5.9556884765625, 6.15447998046875, 6.353271484375, 6.55206298828125, 6.7508544921875, 6.94964599609375, 7.1484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 14.0, 8.0, 10.0, 4.0, 16.0, 18.0, 15.0, 19.0, 32.0, 28.0, 55.0, 97.0, 199.0, 411.0, 836.0, 2198.0, 7793.0, 50624.0, 836289.0, 2848255.0, 411251.0, 27704.0, 5316.0, 1644.0, 659.0, 297.0, 139.0, 97.0, 60.0, 39.0, 31.0, 34.0, 13.0, 9.0, 11.0, 9.0, 6.0, 7.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.6044921875, -13.068359375, -12.5322265625, -11.99609375, -11.4599609375, -10.923828125, -10.3876953125, -9.8515625, -9.3154296875, -8.779296875, -8.2431640625, -7.70703125, -7.1708984375, -6.634765625, -6.0986328125, -5.5625, -5.0263671875, -4.490234375, -3.9541015625, -3.41796875, -2.8818359375, -2.345703125, -1.8095703125, -1.2734375, -0.7373046875, -0.201171875, 0.3349609375, 0.87109375, 1.4072265625, 1.943359375, 2.4794921875, 3.015625, 3.5517578125, 4.087890625, 4.6240234375, 5.16015625, 5.6962890625, 6.232421875, 6.7685546875, 7.3046875, 7.8408203125, 8.376953125, 8.9130859375, 9.44921875, 9.9853515625, 10.521484375, 11.0576171875, 11.59375, 12.1298828125, 12.666015625, 13.2021484375, 13.73828125, 14.2744140625, 14.810546875, 15.3466796875, 15.8828125, 16.4189453125, 16.955078125, 17.4912109375, 18.02734375, 18.5634765625, 19.099609375, 19.6357421875, 20.171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 7.0, 13.0, 14.0, 29.0, 24.0, 43.0, 37.0, 57.0, 69.0, 102.0, 145.0, 135.0, 216.0, 295.0, 341.0, 403.0, 413.0, 393.0, 311.0, 251.0, 166.0, 145.0, 109.0, 86.0, 52.0, 51.0, 33.0, 35.0, 20.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -8.9642333984375, -8.608154296875, -8.2520751953125, -7.89599609375, -7.5399169921875, -7.183837890625, -6.8277587890625, -6.4716796875, -6.1156005859375, -5.759521484375, -5.4034423828125, -5.04736328125, -4.6912841796875, -4.335205078125, -3.9791259765625, -3.623046875, -3.2669677734375, -2.910888671875, -2.5548095703125, -2.19873046875, -1.8426513671875, -1.486572265625, -1.1304931640625, -0.7744140625, -0.4183349609375, -0.062255859375, 0.2938232421875, 0.64990234375, 1.0059814453125, 1.362060546875, 1.7181396484375, 2.07421875, 2.4302978515625, 2.786376953125, 3.1424560546875, 3.49853515625, 3.8546142578125, 4.210693359375, 4.5667724609375, 4.9228515625, 5.2789306640625, 5.635009765625, 5.9910888671875, 6.34716796875, 6.7032470703125, 7.059326171875, 7.4154052734375, 7.771484375, 8.1275634765625, 8.483642578125, 8.8397216796875, 9.19580078125, 9.5518798828125, 9.907958984375, 10.2640380859375, 10.6201171875, 10.9761962890625, 11.332275390625, 11.6883544921875, 12.04443359375, 12.4005126953125, 12.756591796875, 13.1126708984375, 13.46875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 7.0, 7.0, 7.0, 16.0, 25.0, 24.0, 34.0, 55.0, 67.0, 55.0, 90.0, 101.0, 131.0, 169.0, 250.0, 329.0, 617.0, 4472.0, 229493.0, 3860920.0, 92858.0, 2607.0, 558.0, 300.0, 234.0, 178.0, 149.0, 93.0, 90.0, 77.0, 56.0, 40.0, 28.0, 35.0, 19.0, 21.0, 14.0, 10.0, 9.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-46.28125, -44.93603515625, -43.5908203125, -42.24560546875, -40.900390625, -39.55517578125, -38.2099609375, -36.86474609375, -35.51953125, -34.17431640625, -32.8291015625, -31.48388671875, -30.138671875, -28.79345703125, -27.4482421875, -26.10302734375, -24.7578125, -23.41259765625, -22.0673828125, -20.72216796875, -19.376953125, -18.03173828125, -16.6865234375, -15.34130859375, -13.99609375, -12.65087890625, -11.3056640625, -9.96044921875, -8.615234375, -7.27001953125, -5.9248046875, -4.57958984375, -3.234375, -1.88916015625, -0.5439453125, 0.80126953125, 2.146484375, 3.49169921875, 4.8369140625, 6.18212890625, 7.52734375, 8.87255859375, 10.2177734375, 11.56298828125, 12.908203125, 14.25341796875, 15.5986328125, 16.94384765625, 18.2890625, 19.63427734375, 20.9794921875, 22.32470703125, 23.669921875, 25.01513671875, 26.3603515625, 27.70556640625, 29.05078125, 30.39599609375, 31.7412109375, 33.08642578125, 34.431640625, 35.77685546875, 37.1220703125, 38.46728515625, 39.8125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 14.0, 27.0, 47.0, 74.0, 132.0, 157.0, 147.0, 126.0, 129.0, 76.0, 42.0, 20.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3076171875, -63.020355224609375, -60.73309326171875, -58.445831298828125, -56.1585693359375, -53.871307373046875, -51.58404541015625, -49.296783447265625, -47.009521484375, -44.722259521484375, -42.43499755859375, -40.147735595703125, -37.8604736328125, -35.573211669921875, -33.28594970703125, -30.998687744140625, -28.71142578125, -26.424163818359375, -24.13690185546875, -21.849639892578125, -19.5623779296875, -17.275115966796875, -14.98785400390625, -12.700592041015625, -10.413330078125, -8.126068115234375, -5.83880615234375, -3.551544189453125, -1.2642822265625, 1.022979736328125, 3.31024169921875, 5.597503662109375, 7.884765625, 10.172027587890625, 12.45928955078125, 14.746551513671875, 17.0338134765625, 19.321075439453125, 21.60833740234375, 23.895599365234375, 26.182861328125, 28.470123291015625, 30.75738525390625, 33.044647216796875, 35.3319091796875, 37.619171142578125, 39.90643310546875, 42.193695068359375, 44.48095703125, 46.768218994140625, 49.05548095703125, 51.342742919921875, 53.6300048828125, 55.917266845703125, 58.20452880859375, 60.491790771484375, 62.779052734375, 65.06631469726562, 67.35357666015625, 69.64083862304688, 71.9281005859375, 74.21536254882812, 76.50262451171875, 78.78988647460938, 81.0771484375]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 15.0, 23.0, 21.0, 17.0, 15.0, 24.0, 28.0, 20.0, 48.0, 27.0, 34.0, 36.0, 41.0, 50.0, 40.0, 38.0, 40.0, 36.0, 43.0, 38.0, 40.0, 31.0, 36.0, 37.0, 31.0, 27.0, 17.0, 19.0, 18.0, 18.0, 7.0, 12.0, 12.0, 5.0, 5.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.99188232421875, -38.7181282043457, -37.44437026977539, -36.170616149902344, -34.89685821533203, -33.623104095458984, -32.34934997558594, -31.075593948364258, -29.801837921142578, -28.5280818939209, -27.25432586669922, -25.980571746826172, -24.706815719604492, -23.433059692382812, -22.159305572509766, -20.885549545288086, -19.611793518066406, -18.338037490844727, -17.064281463623047, -15.79052734375, -14.51677131652832, -13.24301528930664, -11.969260215759277, -10.695505142211914, -9.421749114990234, -8.147993087768555, -6.874238014221191, -5.60048246383667, -4.326726913452148, -3.052971363067627, -1.7792158126831055, -0.5054607391357422, 0.7682952880859375, 2.042050838470459, 3.3158063888549805, 4.589561939239502, 5.863317489624023, 7.137073040008545, 8.410828590393066, 9.68458366394043, 10.95833969116211, 12.232095718383789, 13.505850791931152, 14.779605865478516, 16.053361892700195, 17.327117919921875, 18.600872039794922, 19.8746280670166, 21.14838409423828, 22.42214012145996, 23.69589614868164, 24.969650268554688, 26.243406295776367, 27.517162322998047, 28.790916442871094, 30.064672470092773, 31.338428497314453, 32.6121826171875, 33.88594055175781, 35.15969467163086, 36.433448791503906, 37.70720672607422, 38.980960845947266, 40.25471496582031, 41.528472900390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 48.0, 42.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 19.0, 26.0, 31.0, 70.0, 78.0, 110.0, 144.0, 218.0, 341.0, 498.0, 766.0, 1303.0, 1857.0, 2991.0, 4596.0, 7614.0, 11941.0, 19602.0, 32285.0, 52291.0, 85690.0, 137511.0, 189870.0, 179952.0, 122308.0, 76040.0, 46355.0, 27897.0, 17194.0, 10700.0, 6607.0, 4202.0, 2504.0, 1657.0, 1151.0, 701.0, 440.0, 302.0, 210.0, 147.0, 108.0, 62.0, 48.0, 27.0, 22.0, 21.0, 3.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6435546875, -0.62200927734375, -0.6004638671875, -0.57891845703125, -0.557373046875, -0.53582763671875, -0.5142822265625, -0.49273681640625, -0.47119140625, -0.44964599609375, -0.4281005859375, -0.40655517578125, -0.385009765625, -0.36346435546875, -0.3419189453125, -0.32037353515625, -0.298828125, -0.27728271484375, -0.2557373046875, -0.23419189453125, -0.212646484375, -0.19110107421875, -0.1695556640625, -0.14801025390625, -0.12646484375, -0.10491943359375, -0.0833740234375, -0.06182861328125, -0.040283203125, -0.01873779296875, 0.0028076171875, 0.02435302734375, 0.0458984375, 0.06744384765625, 0.0889892578125, 0.11053466796875, 0.132080078125, 0.15362548828125, 0.1751708984375, 0.19671630859375, 0.21826171875, 0.23980712890625, 0.2613525390625, 0.28289794921875, 0.304443359375, 0.32598876953125, 0.3475341796875, 0.36907958984375, 0.390625, 0.41217041015625, 0.4337158203125, 0.45526123046875, 0.476806640625, 0.49835205078125, 0.5198974609375, 0.54144287109375, 0.56298828125, 0.58453369140625, 0.6060791015625, 0.62762451171875, 0.649169921875, 0.67071533203125, 0.6922607421875, 0.71380615234375, 0.7353515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 11.0, 10.0, 5.0, 5.0, 7.0, 14.0, 19.0, 20.0, 13.0, 21.0, 13.0, 22.0, 29.0, 25.0, 22.0, 34.0, 34.0, 38.0, 29.0, 32.0, 36.0, 43.0, 1058.0, 38.0, 32.0, 33.0, 27.0, 39.0, 41.0, 27.0, 27.0, 23.0, 26.0, 16.0, 28.0, 13.0, 22.0, 13.0, 11.0, 10.0, 6.0, 13.0, 12.0, 4.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.955078125, -3.83673095703125, -3.7183837890625, -3.60003662109375, -3.481689453125, -3.36334228515625, -3.2449951171875, -3.12664794921875, -3.00830078125, -2.88995361328125, -2.7716064453125, -2.65325927734375, -2.534912109375, -2.41656494140625, -2.2982177734375, -2.17987060546875, -2.0615234375, -1.94317626953125, -1.8248291015625, -1.70648193359375, -1.588134765625, -1.46978759765625, -1.3514404296875, -1.23309326171875, -1.11474609375, -0.99639892578125, -0.8780517578125, -0.75970458984375, -0.641357421875, -0.52301025390625, -0.4046630859375, -0.28631591796875, -0.16796875, -0.04962158203125, 0.0687255859375, 0.18707275390625, 0.305419921875, 0.42376708984375, 0.5421142578125, 0.66046142578125, 0.77880859375, 0.89715576171875, 1.0155029296875, 1.13385009765625, 1.252197265625, 1.37054443359375, 1.4888916015625, 1.60723876953125, 1.7255859375, 1.84393310546875, 1.9622802734375, 2.08062744140625, 2.198974609375, 2.31732177734375, 2.4356689453125, 2.55401611328125, 2.67236328125, 2.79071044921875, 2.9090576171875, 3.02740478515625, 3.145751953125, 3.26409912109375, 3.3824462890625, 3.50079345703125, 3.619140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 11.0, 12.0, 26.0, 26.0, 54.0, 83.0, 121.0, 236.0, 364.0, 551.0, 990.0, 1532.0, 2555.0, 4221.0, 6958.0, 11293.0, 18404.0, 29953.0, 48489.0, 77285.0, 117860.0, 162251.0, 1220772.0, 139291.0, 94775.0, 61097.0, 37769.0, 23318.0, 14570.0, 8713.0, 5330.0, 3175.0, 1972.0, 1229.0, 747.0, 390.0, 260.0, 167.0, 88.0, 63.0, 44.0, 28.0, 16.0, 18.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.5322265625, -0.515716552734375, -0.49920654296875, -0.482696533203125, -0.4661865234375, -0.449676513671875, -0.43316650390625, -0.416656494140625, -0.400146484375, -0.383636474609375, -0.36712646484375, -0.350616455078125, -0.3341064453125, -0.317596435546875, -0.30108642578125, -0.284576416015625, -0.26806640625, -0.251556396484375, -0.23504638671875, -0.218536376953125, -0.2020263671875, -0.185516357421875, -0.16900634765625, -0.152496337890625, -0.135986328125, -0.119476318359375, -0.10296630859375, -0.086456298828125, -0.0699462890625, -0.053436279296875, -0.03692626953125, -0.020416259765625, -0.00390625, 0.012603759765625, 0.02911376953125, 0.045623779296875, 0.0621337890625, 0.078643798828125, 0.09515380859375, 0.111663818359375, 0.128173828125, 0.144683837890625, 0.16119384765625, 0.177703857421875, 0.1942138671875, 0.210723876953125, 0.22723388671875, 0.243743896484375, 0.26025390625, 0.276763916015625, 0.29327392578125, 0.309783935546875, 0.3262939453125, 0.342803955078125, 0.35931396484375, 0.375823974609375, 0.392333984375, 0.408843994140625, 0.42535400390625, 0.441864013671875, 0.4583740234375, 0.474884033203125, 0.49139404296875, 0.507904052734375, 0.5244140625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 14.0, 6.0, 4.0, 12.0, 8.0, 14.0, 32.0, 30.0, 21.0, 55.0, 48.0, 71.0, 81.0, 83.0, 77.0, 78.0, 81.0, 53.0, 57.0, 45.0, 30.0, 25.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005512237548828125, -0.005355119705200195, -0.005198001861572266, -0.005040884017944336, -0.004883766174316406, -0.0047266483306884766, -0.004569530487060547, -0.004412412643432617, -0.0042552947998046875, -0.004098176956176758, -0.003941059112548828, -0.0037839412689208984, -0.0036268234252929688, -0.003469705581665039, -0.0033125877380371094, -0.0031554698944091797, -0.00299835205078125, -0.0028412342071533203, -0.0026841163635253906, -0.002526998519897461, -0.0023698806762695312, -0.0022127628326416016, -0.002055644989013672, -0.0018985271453857422, -0.0017414093017578125, -0.0015842914581298828, -0.0014271736145019531, -0.0012700557708740234, -0.0011129379272460938, -0.0009558200836181641, -0.0007987022399902344, -0.0006415843963623047, -0.000484466552734375, -0.0003273487091064453, -0.00017023086547851562, -1.3113021850585938e-05, 0.00014400482177734375, 0.00030112266540527344, 0.0004582405090332031, 0.0006153583526611328, 0.0007724761962890625, 0.0009295940399169922, 0.0010867118835449219, 0.0012438297271728516, 0.0014009475708007812, 0.001558065414428711, 0.0017151832580566406, 0.0018723011016845703, 0.0020294189453125, 0.0021865367889404297, 0.0023436546325683594, 0.002500772476196289, 0.0026578903198242188, 0.0028150081634521484, 0.002972126007080078, 0.003129243850708008, 0.0032863616943359375, 0.003443479537963867, 0.003600597381591797, 0.0037577152252197266, 0.003914833068847656, 0.004071950912475586, 0.004229068756103516, 0.004386186599731445, 0.004543304443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 9.0, 3.0, 8.0, 6.0, 5.0, 15.0, 19.0, 24.0, 35.0, 42.0, 76.0, 106.0, 164.0, 375.0, 3955.0, 1030283.0, 12376.0, 473.0, 190.0, 119.0, 77.0, 45.0, 41.0, 27.0, 16.0, 10.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1015625, -0.09801101684570312, -0.09445953369140625, -0.09090805053710938, -0.0873565673828125, -0.08380508422851562, -0.08025360107421875, -0.07670211791992188, -0.073150634765625, -0.06959915161132812, -0.06604766845703125, -0.062496185302734375, -0.0589447021484375, -0.055393218994140625, -0.05184173583984375, -0.048290252685546875, -0.04473876953125, -0.041187286376953125, -0.03763580322265625, -0.034084320068359375, -0.0305328369140625, -0.026981353759765625, -0.02342987060546875, -0.019878387451171875, -0.016326904296875, -0.012775421142578125, -0.00922393798828125, -0.005672454833984375, -0.0021209716796875, 0.001430511474609375, 0.00498199462890625, 0.008533477783203125, 0.0120849609375, 0.015636444091796875, 0.01918792724609375, 0.022739410400390625, 0.0262908935546875, 0.029842376708984375, 0.03339385986328125, 0.036945343017578125, 0.040496826171875, 0.044048309326171875, 0.04759979248046875, 0.051151275634765625, 0.0547027587890625, 0.058254241943359375, 0.06180572509765625, 0.06535720825195312, 0.06890869140625, 0.07246017456054688, 0.07601165771484375, 0.07956314086914062, 0.0831146240234375, 0.08666610717773438, 0.09021759033203125, 0.09376907348632812, 0.097320556640625, 0.10087203979492188, 0.10442352294921875, 0.10797500610351562, 0.1115264892578125, 0.11507797241210938, 0.11862945556640625, 0.12218093872070312, 0.125732421875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [33.0, 727.0, 244.0, 13.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015578450402244925, -0.0006737327785231173, 0.00021037948317825794, 0.001094491803087294, 0.0019786041229963303, 0.002862716093659401, 0.003746828529983759, 0.00463094050064683, 0.005515052936971188, 0.006399165373295546, 0.007283277343958616, 0.008167389780282974, 0.009051501750946045, 0.009935613721609116, 0.010819726623594761, 0.011703838594257832, 0.012587951496243477, 0.013472063466906548, 0.014356176368892193, 0.015240288339555264, 0.01612440124154091, 0.01700851321220398, 0.01789262518286705, 0.01877673715353012, 0.01966084912419319, 0.020544961094856262, 0.021429073065519333, 0.022313185036182404, 0.023197298869490623, 0.024081410840153694, 0.024965522810816765, 0.025849634781479836, 0.026733746752142906, 0.027617858722805977, 0.028501970693469048, 0.029386084526777267, 0.030270196497440338, 0.03115430846810341, 0.03203842043876648, 0.03292253240942955, 0.03380664438009262, 0.03469075635075569, 0.03557486832141876, 0.03645898029208183, 0.037343092262744904, 0.038227204233407974, 0.039111316204071045, 0.039995431900024414, 0.040879543870687485, 0.041763655841350555, 0.042647767812013626, 0.0435318797826767, 0.04441599175333977, 0.04530010372400284, 0.04618421941995621, 0.04706832766532898, 0.04795243963599205, 0.04883655160665512, 0.04972066357731819, 0.05060477554798126, 0.05148888751864433, 0.052372999489307404, 0.05325711518526077, 0.054141223430633545, 0.055025339126586914]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 6.0, 10.0, 13.0, 25.0, 27.0, 25.0, 36.0, 31.0, 44.0, 32.0, 38.0, 64.0, 59.0, 47.0, 48.0, 59.0, 58.0, 55.0, 45.0, 44.0, 39.0, 32.0, 24.0, 24.0, 20.0, 21.0, 19.0, 21.0, 15.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031934380531311035, -0.0031006978824734688, -0.003007957711815834, -0.0029152175411581993, -0.0028224773705005646, -0.00272973719984293, -0.002636997029185295, -0.0025442568585276604, -0.0024515166878700256, -0.002358776517212391, -0.002266036346554756, -0.0021732961758971214, -0.0020805560052394867, -0.001987815834581852, -0.0018950756639242172, -0.0018023354932665825, -0.0017095953226089478, -0.001616855151951313, -0.0015241149812936783, -0.0014313748106360435, -0.0013386346399784088, -0.001245894469320774, -0.0011531542986631393, -0.0010604141280055046, -0.0009676739573478699, -0.0008749337866902351, -0.0007821936160326004, -0.0006894534453749657, -0.0005967132747173309, -0.0005039731040596962, -0.00041123293340206146, -0.00031849276274442673, -0.000225752592086792, -0.00013301242142915726, -4.027225077152252e-05, 5.246791988611221e-05, 0.00014520809054374695, 0.00023794826120138168, 0.0003306884318590164, 0.00042342860251665115, 0.0005161687731742859, 0.0006089089438319206, 0.0007016491144895554, 0.0007943892851471901, 0.0008871294558048248, 0.0009798696264624596, 0.0010726097971200943, 0.001165349967777729, 0.0012580901384353638, 0.0013508303090929985, 0.0014435704797506332, 0.001536310650408268, 0.0016290508210659027, 0.0017217909917235374, 0.0018145311623811722, 0.001907271333038807, 0.0020000115036964417, 0.0020927516743540764, 0.002185491845011711, 0.002278232015669346, 0.0023709721863269806, 0.0024637123569846153, 0.00255645252764225, 0.002649192698299885, 0.0027419328689575195]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 47.0, 43.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 16.0, 15.0, 21.0, 24.0, 44.0, 39.0, 73.0, 128.0, 152.0, 252.0, 432.0, 787.0, 1481.0, 3160.0, 7529.0, 20845.0, 80455.0, 371038.0, 431717.0, 91772.0, 23355.0, 8045.0, 3340.0, 1693.0, 842.0, 446.0, 282.0, 168.0, 105.0, 68.0, 51.0, 37.0, 36.0, 22.0, 12.0, 16.0, 9.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.4124755859375, -5.219482421875, -5.0264892578125, -4.83349609375, -4.6405029296875, -4.447509765625, -4.2545166015625, -4.0615234375, -3.8685302734375, -3.675537109375, -3.4825439453125, -3.28955078125, -3.0965576171875, -2.903564453125, -2.7105712890625, -2.517578125, -2.3245849609375, -2.131591796875, -1.9385986328125, -1.74560546875, -1.5526123046875, -1.359619140625, -1.1666259765625, -0.9736328125, -0.7806396484375, -0.587646484375, -0.3946533203125, -0.20166015625, -0.0086669921875, 0.184326171875, 0.3773193359375, 0.5703125, 0.7633056640625, 0.956298828125, 1.1492919921875, 1.34228515625, 1.5352783203125, 1.728271484375, 1.9212646484375, 2.1142578125, 2.3072509765625, 2.500244140625, 2.6932373046875, 2.88623046875, 3.0792236328125, 3.272216796875, 3.4652099609375, 3.658203125, 3.8511962890625, 4.044189453125, 4.2371826171875, 4.43017578125, 4.6231689453125, 4.816162109375, 5.0091552734375, 5.2021484375, 5.3951416015625, 5.588134765625, 5.7811279296875, 5.97412109375, 6.1671142578125, 6.360107421875, 6.5531005859375, 6.74609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 10.0, 8.0, 9.0, 11.0, 20.0, 17.0, 14.0, 19.0, 17.0, 31.0, 28.0, 29.0, 26.0, 38.0, 32.0, 52.0, 47.0, 89.0, 347.0, 1567.0, 139.0, 69.0, 41.0, 38.0, 35.0, 33.0, 30.0, 29.0, 40.0, 18.0, 22.0, 25.0, 22.0, 6.0, 10.0, 9.0, 5.0, 5.0, 11.0, 7.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-19.421875, -18.818359375, -18.21484375, -17.611328125, -17.0078125, -16.404296875, -15.80078125, -15.197265625, -14.59375, -13.990234375, -13.38671875, -12.783203125, -12.1796875, -11.576171875, -10.97265625, -10.369140625, -9.765625, -9.162109375, -8.55859375, -7.955078125, -7.3515625, -6.748046875, -6.14453125, -5.541015625, -4.9375, -4.333984375, -3.73046875, -3.126953125, -2.5234375, -1.919921875, -1.31640625, -0.712890625, -0.109375, 0.494140625, 1.09765625, 1.701171875, 2.3046875, 2.908203125, 3.51171875, 4.115234375, 4.71875, 5.322265625, 5.92578125, 6.529296875, 7.1328125, 7.736328125, 8.33984375, 8.943359375, 9.546875, 10.150390625, 10.75390625, 11.357421875, 11.9609375, 12.564453125, 13.16796875, 13.771484375, 14.375, 14.978515625, 15.58203125, 16.185546875, 16.7890625, 17.392578125, 17.99609375, 18.599609375, 19.203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 11.0, 16.0, 17.0, 19.0, 22.0, 36.0, 68.0, 105.0, 166.0, 266.0, 504.0, 1878.0, 2726368.0, 413560.0, 1536.0, 440.0, 246.0, 163.0, 87.0, 54.0, 41.0, 31.0, 21.0, 15.0, 13.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.25, -73.7041015625, -71.158203125, -68.6123046875, -66.06640625, -63.5205078125, -60.974609375, -58.4287109375, -55.8828125, -53.3369140625, -50.791015625, -48.2451171875, -45.69921875, -43.1533203125, -40.607421875, -38.0615234375, -35.515625, -32.9697265625, -30.423828125, -27.8779296875, -25.33203125, -22.7861328125, -20.240234375, -17.6943359375, -15.1484375, -12.6025390625, -10.056640625, -7.5107421875, -4.96484375, -2.4189453125, 0.126953125, 2.6728515625, 5.21875, 7.7646484375, 10.310546875, 12.8564453125, 15.40234375, 17.9482421875, 20.494140625, 23.0400390625, 25.5859375, 28.1318359375, 30.677734375, 33.2236328125, 35.76953125, 38.3154296875, 40.861328125, 43.4072265625, 45.953125, 48.4990234375, 51.044921875, 53.5908203125, 56.13671875, 58.6826171875, 61.228515625, 63.7744140625, 66.3203125, 68.8662109375, 71.412109375, 73.9580078125, 76.50390625, 79.0498046875, 81.595703125, 84.1416015625, 86.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 26.0, 163.0, 310.0, 317.0, 137.0, 41.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.58265686035156, -36.074092864990234, -34.56553268432617, -33.056968688964844, -31.54840850830078, -30.039846420288086, -28.53128433227539, -27.022720336914062, -25.51416015625, -24.005598068237305, -22.49703598022461, -20.988473892211914, -19.47991180419922, -17.971349716186523, -16.462787628173828, -14.954224586486816, -13.445661544799805, -11.93709945678711, -10.428537368774414, -8.919975280761719, -7.411412715911865, -5.90285062789917, -4.394288063049316, -2.885725975036621, -1.3771638870239258, 0.13139832019805908, 1.639960527420044, 3.1485228538513184, 4.657084941864014, 6.165647029876709, 7.6742095947265625, 9.182771682739258, 10.691333770751953, 12.199895858764648, 13.708457946777344, 15.217020034790039, 16.725582122802734, 18.23414421081543, 19.742706298828125, 21.251270294189453, 22.759830474853516, 24.26839256286621, 25.776954650878906, 27.2855167388916, 28.794078826904297, 30.302640914916992, 31.811203002929688, 33.319766998291016, 34.828330993652344, 36.33689498901367, 37.845455169677734, 39.35401916503906, 40.862579345703125, 42.37114334106445, 43.879703521728516, 45.388267517089844, 46.896827697753906, 48.405391693115234, 49.9139518737793, 51.422515869140625, 52.93107604980469, 54.439640045166016, 55.94820022583008, 57.456764221191406, 58.96532440185547]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 20.0, 15.0, 16.0, 16.0, 27.0, 28.0, 26.0, 44.0, 27.0, 38.0, 38.0, 46.0, 43.0, 44.0, 36.0, 53.0, 49.0, 40.0, 39.0, 43.0, 35.0, 26.0, 30.0, 24.0, 18.0, 24.0, 19.0, 18.0, 11.0, 12.0, 16.0, 6.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.525245666503906, -54.71100616455078, -52.896766662597656, -51.08252716064453, -49.268287658691406, -47.45404815673828, -45.63980484008789, -43.825565338134766, -42.01132583618164, -40.197086334228516, -38.38284683227539, -36.568607330322266, -34.754364013671875, -32.94012451171875, -31.125885009765625, -29.3116455078125, -27.497406005859375, -25.68316650390625, -23.868927001953125, -22.054685592651367, -20.240446090698242, -18.426206588745117, -16.61196517944336, -14.797725677490234, -12.98348617553711, -11.169246673583984, -9.355006217956543, -7.54076623916626, -5.726526260375977, -3.9122867584228516, -2.09804630279541, -0.28380584716796875, 1.5304336547851562, 3.3446736335754395, 5.158913612365723, 6.973153591156006, 8.787393569946289, 10.601633071899414, 12.415873527526855, 14.230113983154297, 16.044353485107422, 17.858592987060547, 19.672832489013672, 21.48707389831543, 23.301313400268555, 25.11555290222168, 26.929794311523438, 28.744033813476562, 30.558273315429688, 32.37251281738281, 34.18675231933594, 36.00099182128906, 37.81523132324219, 39.62947082519531, 41.4437141418457, 43.25795364379883, 45.07219314575195, 46.88643264770508, 48.7006721496582, 50.51491165161133, 52.32915496826172, 54.143394470214844, 55.95763397216797, 57.771873474121094, 59.58611297607422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 9.0, 9.0, 11.0, 9.0, 20.0, 8.0, 14.0, 19.0, 25.0, 36.0, 23.0, 31.0, 32.0, 30.0, 43.0, 31.0, 61.0, 41.0, 41.0, 45.0, 52.0, 30.0, 39.0, 36.0, 33.0, 40.0, 25.0, 31.0, 28.0, 20.0, 24.0, 13.0, 17.0, 16.0, 13.0, 10.0, 5.0, 1.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0859375, -5.8760986328125, -5.666259765625, -5.4564208984375, -5.24658203125, -5.0367431640625, -4.826904296875, -4.6170654296875, -4.4072265625, -4.1973876953125, -3.987548828125, -3.7777099609375, -3.56787109375, -3.3580322265625, -3.148193359375, -2.9383544921875, -2.728515625, -2.5186767578125, -2.308837890625, -2.0989990234375, -1.88916015625, -1.6793212890625, -1.469482421875, -1.2596435546875, -1.0498046875, -0.8399658203125, -0.630126953125, -0.4202880859375, -0.21044921875, -0.0006103515625, 0.209228515625, 0.4190673828125, 0.62890625, 0.8387451171875, 1.048583984375, 1.2584228515625, 1.46826171875, 1.6781005859375, 1.887939453125, 2.0977783203125, 2.3076171875, 2.5174560546875, 2.727294921875, 2.9371337890625, 3.14697265625, 3.3568115234375, 3.566650390625, 3.7764892578125, 3.986328125, 4.1961669921875, 4.406005859375, 4.6158447265625, 4.82568359375, 5.0355224609375, 5.245361328125, 5.4552001953125, 5.6650390625, 5.8748779296875, 6.084716796875, 6.2945556640625, 6.50439453125, 6.7142333984375, 6.924072265625, 7.1339111328125, 7.34375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 14.0, 5.0, 10.0, 14.0, 17.0, 28.0, 22.0, 26.0, 39.0, 42.0, 48.0, 59.0, 79.0, 111.0, 175.0, 280.0, 718.0, 2210.0, 11054.0, 103648.0, 1550228.0, 2300031.0, 203154.0, 17149.0, 3107.0, 904.0, 361.0, 180.0, 129.0, 97.0, 81.0, 50.0, 40.0, 34.0, 27.0, 32.0, 19.0, 10.0, 11.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8125, -13.28369140625, -12.7548828125, -12.22607421875, -11.697265625, -11.16845703125, -10.6396484375, -10.11083984375, -9.58203125, -9.05322265625, -8.5244140625, -7.99560546875, -7.466796875, -6.93798828125, -6.4091796875, -5.88037109375, -5.3515625, -4.82275390625, -4.2939453125, -3.76513671875, -3.236328125, -2.70751953125, -2.1787109375, -1.64990234375, -1.12109375, -0.59228515625, -0.0634765625, 0.46533203125, 0.994140625, 1.52294921875, 2.0517578125, 2.58056640625, 3.109375, 3.63818359375, 4.1669921875, 4.69580078125, 5.224609375, 5.75341796875, 6.2822265625, 6.81103515625, 7.33984375, 7.86865234375, 8.3974609375, 8.92626953125, 9.455078125, 9.98388671875, 10.5126953125, 11.04150390625, 11.5703125, 12.09912109375, 12.6279296875, 13.15673828125, 13.685546875, 14.21435546875, 14.7431640625, 15.27197265625, 15.80078125, 16.32958984375, 16.8583984375, 17.38720703125, 17.916015625, 18.44482421875, 18.9736328125, 19.50244140625, 20.03125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 13.0, 12.0, 12.0, 19.0, 26.0, 51.0, 52.0, 56.0, 88.0, 98.0, 136.0, 166.0, 208.0, 292.0, 390.0, 456.0, 442.0, 378.0, 290.0, 225.0, 160.0, 128.0, 98.0, 62.0, 60.0, 34.0, 28.0, 33.0, 20.0, 10.0, 10.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.086181640625, -12.71142578125, -12.336669921875, -11.9619140625, -11.587158203125, -11.21240234375, -10.837646484375, -10.462890625, -10.088134765625, -9.71337890625, -9.338623046875, -8.9638671875, -8.589111328125, -8.21435546875, -7.839599609375, -7.46484375, -7.090087890625, -6.71533203125, -6.340576171875, -5.9658203125, -5.591064453125, -5.21630859375, -4.841552734375, -4.466796875, -4.092041015625, -3.71728515625, -3.342529296875, -2.9677734375, -2.593017578125, -2.21826171875, -1.843505859375, -1.46875, -1.093994140625, -0.71923828125, -0.344482421875, 0.0302734375, 0.405029296875, 0.77978515625, 1.154541015625, 1.529296875, 1.904052734375, 2.27880859375, 2.653564453125, 3.0283203125, 3.403076171875, 3.77783203125, 4.152587890625, 4.52734375, 4.902099609375, 5.27685546875, 5.651611328125, 6.0263671875, 6.401123046875, 6.77587890625, 7.150634765625, 7.525390625, 7.900146484375, 8.27490234375, 8.649658203125, 9.0244140625, 9.399169921875, 9.77392578125, 10.148681640625, 10.5234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 31.0, 39.0, 32.0, 46.0, 71.0, 97.0, 102.0, 143.0, 160.0, 255.0, 303.0, 543.0, 2324.0, 153659.0, 3984583.0, 48541.0, 1483.0, 479.0, 292.0, 209.0, 198.0, 135.0, 116.0, 96.0, 64.0, 54.0, 52.0, 34.0, 25.0, 19.0, 10.0, 16.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.71875, -43.08642578125, -41.4541015625, -39.82177734375, -38.189453125, -36.55712890625, -34.9248046875, -33.29248046875, -31.66015625, -30.02783203125, -28.3955078125, -26.76318359375, -25.130859375, -23.49853515625, -21.8662109375, -20.23388671875, -18.6015625, -16.96923828125, -15.3369140625, -13.70458984375, -12.072265625, -10.43994140625, -8.8076171875, -7.17529296875, -5.54296875, -3.91064453125, -2.2783203125, -0.64599609375, 0.986328125, 2.61865234375, 4.2509765625, 5.88330078125, 7.515625, 9.14794921875, 10.7802734375, 12.41259765625, 14.044921875, 15.67724609375, 17.3095703125, 18.94189453125, 20.57421875, 22.20654296875, 23.8388671875, 25.47119140625, 27.103515625, 28.73583984375, 30.3681640625, 32.00048828125, 33.6328125, 35.26513671875, 36.8974609375, 38.52978515625, 40.162109375, 41.79443359375, 43.4267578125, 45.05908203125, 46.69140625, 48.32373046875, 49.9560546875, 51.58837890625, 53.220703125, 54.85302734375, 56.4853515625, 58.11767578125, 59.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 16.0, 127.0, 353.0, 378.0, 117.0, 20.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.40177154541016, -113.42817687988281, -107.45457458496094, -101.4809799194336, -95.50738525390625, -89.53378295898438, -83.56018829345703, -77.58659362792969, -71.61299133300781, -65.63939666748047, -59.66579818725586, -53.69219970703125, -47.718605041503906, -41.7450065612793, -35.77140808105469, -29.797813415527344, -23.82421875, -17.850622177124023, -11.87702465057373, -5.9034271240234375, 0.07016944885253906, 6.043766021728516, 12.017364501953125, 17.99095916748047, 23.964557647705078, 29.938154220581055, 35.91175079345703, 41.88534927368164, 47.85894775390625, 53.832542419433594, 59.8061408996582, 65.77973937988281, 71.75334167480469, 77.72693634033203, 83.7005386352539, 89.67413330078125, 95.6477279663086, 101.62132263183594, 107.59492492675781, 113.56851959228516, 119.5421142578125, 125.51570892333984, 131.4893035888672, 137.46290588378906, 143.43650817871094, 149.41009521484375, 155.38369750976562, 161.3572998046875, 167.33090209960938, 173.30450439453125, 179.27809143066406, 185.25169372558594, 191.2252960205078, 197.19888305664062, 203.1724853515625, 209.14608764648438, 215.1196746826172, 221.09327697753906, 227.06686401367188, 233.04046630859375, 239.01406860351562, 244.98765563964844, 250.9612579345703, 256.9348449707031, 262.908447265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 13.0, 14.0, 15.0, 11.0, 19.0, 26.0, 27.0, 28.0, 24.0, 38.0, 32.0, 38.0, 51.0, 50.0, 42.0, 45.0, 42.0, 54.0, 42.0, 42.0, 35.0, 31.0, 40.0, 34.0, 30.0, 28.0, 21.0, 24.0, 16.0, 18.0, 7.0, 10.0, 13.0, 4.0, 5.0, 3.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.3616943359375, -47.98292541503906, -46.60416030883789, -45.22539138793945, -43.84662628173828, -42.467857360839844, -41.089088439941406, -39.71031951904297, -38.3315544128418, -36.95278549194336, -35.57402038574219, -34.19525146484375, -32.81648254394531, -31.43771743774414, -30.058948516845703, -28.6801815032959, -27.301414489746094, -25.92264747619629, -24.543880462646484, -23.165111541748047, -21.786344528198242, -20.407577514648438, -19.02880859375, -17.650041580200195, -16.27127456665039, -14.892507553100586, -13.513739585876465, -12.134971618652344, -10.756204605102539, -9.377437591552734, -7.998669624328613, -6.619901657104492, -5.2411346435546875, -3.8623671531677246, -2.4835996627807617, -1.1048321723937988, 0.27393531799316406, 1.652702808380127, 3.03147029876709, 4.410238265991211, 5.789005279541016, 7.1677727699279785, 8.546540260314941, 9.925308227539062, 11.304075241088867, 12.682842254638672, 14.061610221862793, 15.440378189086914, 16.81914520263672, 18.197912216186523, 19.576679229736328, 20.955448150634766, 22.33421516418457, 23.712982177734375, 25.091751098632812, 26.470518112182617, 27.849285125732422, 29.228052139282227, 30.60681915283203, 31.98558807373047, 33.364356994628906, 34.74312210083008, 36.121891021728516, 37.50065612792969, 38.879425048828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 44.0, 49.0, 37.0, 29.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 8.0, 7.0, 9.0, 17.0, 13.0, 41.0, 57.0, 58.0, 101.0, 155.0, 226.0, 282.0, 479.0, 760.0, 1077.0, 1703.0, 2625.0, 4058.0, 6268.0, 10183.0, 16396.0, 26203.0, 42071.0, 68373.0, 106964.0, 154932.0, 181413.0, 149102.0, 101952.0, 64911.0, 40696.0, 25227.0, 15575.0, 9709.0, 5865.0, 3936.0, 2393.0, 1551.0, 1005.0, 681.0, 501.0, 311.0, 211.0, 136.0, 84.0, 79.0, 45.0, 33.0, 27.0, 20.0, 10.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.63916015625, -0.61883544921875, -0.5985107421875, -0.57818603515625, -0.557861328125, -0.53753662109375, -0.5172119140625, -0.49688720703125, -0.4765625, -0.45623779296875, -0.4359130859375, -0.41558837890625, -0.395263671875, -0.37493896484375, -0.3546142578125, -0.33428955078125, -0.31396484375, -0.29364013671875, -0.2733154296875, -0.25299072265625, -0.232666015625, -0.21234130859375, -0.1920166015625, -0.17169189453125, -0.1513671875, -0.13104248046875, -0.1107177734375, -0.09039306640625, -0.070068359375, -0.04974365234375, -0.0294189453125, -0.00909423828125, 0.01123046875, 0.03155517578125, 0.0518798828125, 0.07220458984375, 0.092529296875, 0.11285400390625, 0.1331787109375, 0.15350341796875, 0.173828125, 0.19415283203125, 0.2144775390625, 0.23480224609375, 0.255126953125, 0.27545166015625, 0.2957763671875, 0.31610107421875, 0.33642578125, 0.35675048828125, 0.3770751953125, 0.39739990234375, 0.417724609375, 0.43804931640625, 0.4583740234375, 0.47869873046875, 0.4990234375, 0.51934814453125, 0.5396728515625, 0.55999755859375, 0.580322265625, 0.60064697265625, 0.6209716796875, 0.64129638671875, 0.66162109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 3.0, 14.0, 19.0, 12.0, 12.0, 14.0, 24.0, 27.0, 29.0, 24.0, 32.0, 42.0, 40.0, 37.0, 60.0, 43.0, 47.0, 1067.0, 52.0, 47.0, 35.0, 42.0, 40.0, 45.0, 41.0, 33.0, 21.0, 14.0, 25.0, 20.0, 16.0, 8.0, 2.0, 7.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.0546875, -4.91143798828125, -4.7681884765625, -4.62493896484375, -4.481689453125, -4.33843994140625, -4.1951904296875, -4.05194091796875, -3.90869140625, -3.76544189453125, -3.6221923828125, -3.47894287109375, -3.335693359375, -3.19244384765625, -3.0491943359375, -2.90594482421875, -2.7626953125, -2.61944580078125, -2.4761962890625, -2.33294677734375, -2.189697265625, -2.04644775390625, -1.9031982421875, -1.75994873046875, -1.61669921875, -1.47344970703125, -1.3302001953125, -1.18695068359375, -1.043701171875, -0.90045166015625, -0.7572021484375, -0.61395263671875, -0.470703125, -0.32745361328125, -0.1842041015625, -0.04095458984375, 0.102294921875, 0.24554443359375, 0.3887939453125, 0.53204345703125, 0.67529296875, 0.81854248046875, 0.9617919921875, 1.10504150390625, 1.248291015625, 1.39154052734375, 1.5347900390625, 1.67803955078125, 1.8212890625, 1.96453857421875, 2.1077880859375, 2.25103759765625, 2.394287109375, 2.53753662109375, 2.6807861328125, 2.82403564453125, 2.96728515625, 3.11053466796875, 3.2537841796875, 3.39703369140625, 3.540283203125, 3.68353271484375, 3.8267822265625, 3.97003173828125, 4.11328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 10.0, 15.0, 19.0, 59.0, 74.0, 135.0, 184.0, 333.0, 512.0, 909.0, 1331.0, 2290.0, 3638.0, 5870.0, 9420.0, 15302.0, 24481.0, 38759.0, 62394.0, 95587.0, 135797.0, 1212029.0, 157605.0, 117736.0, 78735.0, 50538.0, 31765.0, 19473.0, 12232.0, 7448.0, 4716.0, 2938.0, 1830.0, 1152.0, 681.0, 444.0, 249.0, 170.0, 97.0, 60.0, 37.0, 23.0, 15.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4797706604003906, -0.46417999267578125, -0.4485893249511719, -0.4329986572265625, -0.4174079895019531, -0.40181732177734375, -0.3862266540527344, -0.370635986328125, -0.3550453186035156, -0.33945465087890625, -0.3238639831542969, -0.3082733154296875, -0.2926826477050781, -0.27709197998046875, -0.2615013122558594, -0.24591064453125, -0.23031997680664062, -0.21472930908203125, -0.19913864135742188, -0.1835479736328125, -0.16795730590820312, -0.15236663818359375, -0.13677597045898438, -0.121185302734375, -0.10559463500976562, -0.09000396728515625, -0.07441329956054688, -0.0588226318359375, -0.043231964111328125, -0.02764129638671875, -0.012050628662109375, 0.0035400390625, 0.019130706787109375, 0.03472137451171875, 0.050312042236328125, 0.0659027099609375, 0.08149337768554688, 0.09708404541015625, 0.11267471313476562, 0.128265380859375, 0.14385604858398438, 0.15944671630859375, 0.17503738403320312, 0.1906280517578125, 0.20621871948242188, 0.22180938720703125, 0.23740005493164062, 0.25299072265625, 0.2685813903808594, 0.28417205810546875, 0.2997627258300781, 0.3153533935546875, 0.3309440612792969, 0.34653472900390625, 0.3621253967285156, 0.377716064453125, 0.3933067321777344, 0.40889739990234375, 0.4244880676269531, 0.4400787353515625, 0.4556694030761719, 0.47126007080078125, 0.4868507385253906, 0.50244140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 2.0, 13.0, 13.0, 19.0, 21.0, 19.0, 20.0, 34.0, 48.0, 64.0, 69.0, 85.0, 78.0, 95.0, 67.0, 83.0, 40.0, 47.0, 38.0, 20.0, 23.0, 16.0, 11.0, 13.0, 11.0, 4.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004192352294921875, -0.0040648579597473145, -0.003937363624572754, -0.0038098692893981934, -0.003682374954223633, -0.0035548806190490723, -0.0034273862838745117, -0.003299891948699951, -0.0031723976135253906, -0.00304490327835083, -0.0029174089431762695, -0.002789914608001709, -0.0026624202728271484, -0.002534925937652588, -0.0024074316024780273, -0.002279937267303467, -0.0021524429321289062, -0.0020249485969543457, -0.0018974542617797852, -0.0017699599266052246, -0.001642465591430664, -0.0015149712562561035, -0.001387476921081543, -0.0012599825859069824, -0.0011324882507324219, -0.0010049939155578613, -0.0008774995803833008, -0.0007500052452087402, -0.0006225109100341797, -0.0004950165748596191, -0.0003675222396850586, -0.00024002790451049805, -0.0001125335693359375, 1.4960765838623047e-05, 0.0001424551010131836, 0.00026994943618774414, 0.0003974437713623047, 0.0005249381065368652, 0.0006524324417114258, 0.0007799267768859863, 0.0009074211120605469, 0.0010349154472351074, 0.001162409782409668, 0.0012899041175842285, 0.001417398452758789, 0.0015448927879333496, 0.0016723871231079102, 0.0017998814582824707, 0.0019273757934570312, 0.002054870128631592, 0.0021823644638061523, 0.002309858798980713, 0.0024373531341552734, 0.002564847469329834, 0.0026923418045043945, 0.002819836139678955, 0.0029473304748535156, 0.003074824810028076, 0.0032023191452026367, 0.0033298134803771973, 0.003457307815551758, 0.0035848021507263184, 0.003712296485900879, 0.0038397908210754395, 0.00396728515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 6.0, 11.0, 11.0, 17.0, 21.0, 27.0, 32.0, 45.0, 63.0, 90.0, 135.0, 251.0, 993.0, 70357.0, 972484.0, 3038.0, 363.0, 203.0, 121.0, 76.0, 41.0, 32.0, 26.0, 24.0, 12.0, 14.0, 15.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083740234375, -0.08087348937988281, -0.07800674438476562, -0.07513999938964844, -0.07227325439453125, -0.06940650939941406, -0.06653976440429688, -0.06367301940917969, -0.0608062744140625, -0.05793952941894531, -0.055072784423828125, -0.05220603942871094, -0.04933929443359375, -0.04647254943847656, -0.043605804443359375, -0.04073905944824219, -0.037872314453125, -0.03500556945800781, -0.032138824462890625, -0.029272079467773438, -0.02640533447265625, -0.023538589477539062, -0.020671844482421875, -0.017805099487304688, -0.0149383544921875, -0.012071609497070312, -0.009204864501953125, -0.0063381195068359375, -0.00347137451171875, -0.0006046295166015625, 0.002262115478515625, 0.0051288604736328125, 0.00799560546875, 0.010862350463867188, 0.013729095458984375, 0.016595840454101562, 0.01946258544921875, 0.022329330444335938, 0.025196075439453125, 0.028062820434570312, 0.0309295654296875, 0.03379631042480469, 0.036663055419921875, 0.03952980041503906, 0.04239654541015625, 0.04526329040527344, 0.048130035400390625, 0.05099678039550781, 0.053863525390625, 0.05673027038574219, 0.059597015380859375, 0.06246376037597656, 0.06533050537109375, 0.06819725036621094, 0.07106399536132812, 0.07393074035644531, 0.0767974853515625, 0.07966423034667969, 0.08253097534179688, 0.08539772033691406, 0.08826446533203125, 0.09113121032714844, 0.09399795532226562, 0.09686470031738281, 0.0997314453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 10.0, 15.0, 29.0, 61.0, 104.0, 203.0, 230.0, 169.0, 85.0, 50.0, 28.0, 15.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018103704787790775, -0.0016513746231794357, -0.0014923788839951158, -0.0013333831448107958, -0.001174387289211154, -0.0010153914336115122, -0.0008563956944271922, -0.0006973999552428722, -0.0005384040996432304, -0.00037940830225124955, -0.00022041250485926867, -6.141670746728778e-05, 9.757908992469311e-05, 0.000256574887316674, 0.0004155706847086549, 0.0005745664238929749, 0.0007335622794926167, 0.0008925580768845975, 0.0010515538742765784, 0.0012105496134608984, 0.0013695454690605402, 0.001528541324660182, 0.001687537063844502, 0.001846532803028822, 0.0020055286586284637, 0.0021645245142281055, 0.0023235203698277473, 0.0024825159925967455, 0.0026415118481963873, 0.002800507703796029, 0.0029595033265650272, 0.003118499182164669, 0.003277495503425598, 0.00343649135902524, 0.0035954872146248817, 0.00375448283739388, 0.003913478925824165, 0.00407247431576252, 0.004231470171362162, 0.0043904660269618034, 0.004549461882561445, 0.004708457738161087, 0.004867453593760729, 0.005026449449360371, 0.005185444839298725, 0.005344440694898367, 0.005503436550498009, 0.0056624324060976505, 0.005821428261697292, 0.005980424117296934, 0.006139419972896576, 0.006298415828496218, 0.0064574116840958595, 0.006616407074034214, 0.006775402929633856, 0.006934398785233498, 0.007093394640833139, 0.007252390496432781, 0.007411386352032423, 0.007570382207632065, 0.007729377597570419, 0.007888373918831348, 0.008047369308769703, 0.008206365630030632, 0.008365361019968987]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 11.0, 12.0, 12.0, 13.0, 22.0, 35.0, 36.0, 24.0, 38.0, 42.0, 23.0, 43.0, 46.0, 43.0, 35.0, 41.0, 40.0, 29.0, 46.0, 31.0, 37.0, 34.0, 35.0, 30.0, 30.0, 34.0, 28.0, 15.0, 19.0, 9.0, 19.0, 14.0, 9.0, 4.0, 9.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0019698143005371094, -0.0019105495885014534, -0.0018512848764657974, -0.0017920201644301414, -0.0017327554523944855, -0.0016734907403588295, -0.0016142260283231735, -0.0015549613162875175, -0.0014956966042518616, -0.0014364318922162056, -0.0013771671801805496, -0.0013179024681448936, -0.0012586377561092377, -0.0011993730440735817, -0.0011401083320379257, -0.0010808436200022697, -0.0010215789079666138, -0.0009623141959309578, -0.0009030494838953018, -0.0008437847718596458, -0.0007845200598239899, -0.0007252553477883339, -0.0006659906357526779, -0.0006067259237170219, -0.000547461211681366, -0.00048819649964571, -0.000428931787610054, -0.00036966707557439804, -0.00031040236353874207, -0.0002511376515030861, -0.00019187293946743011, -0.00013260822743177414, -7.334351539611816e-05, -1.4078803360462189e-05, 4.518590867519379e-05, 0.00010445062071084976, 0.00016371533274650574, 0.0002229800447821617, 0.0002822447568178177, 0.00034150946885347366, 0.00040077418088912964, 0.0004600388929247856, 0.0005193036049604416, 0.0005785683169960976, 0.0006378330290317535, 0.0006970977410674095, 0.0007563624531030655, 0.0008156271651387215, 0.0008748918771743774, 0.0009341565892100334, 0.0009934213012456894, 0.0010526860132813454, 0.0011119507253170013, 0.0011712154373526573, 0.0012304801493883133, 0.0012897448614239693, 0.0013490095734596252, 0.0014082742854952812, 0.0014675389975309372, 0.0015268037095665932, 0.0015860684216022491, 0.0016453331336379051, 0.001704597845673561, 0.001763862557709217, 0.001823127269744873]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 45.0, 48.0, 38.0, 28.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 13.0, 20.0, 21.0, 31.0, 38.0, 72.0, 113.0, 203.0, 313.0, 485.0, 798.0, 1393.0, 2177.0, 3882.0, 7034.0, 13261.0, 28969.0, 74106.0, 223881.0, 434586.0, 155868.0, 54069.0, 22348.0, 10878.0, 5764.0, 3230.0, 1928.0, 1196.0, 664.0, 444.0, 250.0, 193.0, 109.0, 63.0, 43.0, 32.0, 22.0, 12.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -4.9930419921875, -4.833740234375, -4.6744384765625, -4.51513671875, -4.3558349609375, -4.196533203125, -4.0372314453125, -3.8779296875, -3.7186279296875, -3.559326171875, -3.4000244140625, -3.24072265625, -3.0814208984375, -2.922119140625, -2.7628173828125, -2.603515625, -2.4442138671875, -2.284912109375, -2.1256103515625, -1.96630859375, -1.8070068359375, -1.647705078125, -1.4884033203125, -1.3291015625, -1.1697998046875, -1.010498046875, -0.8511962890625, -0.69189453125, -0.5325927734375, -0.373291015625, -0.2139892578125, -0.0546875, 0.1046142578125, 0.263916015625, 0.4232177734375, 0.58251953125, 0.7418212890625, 0.901123046875, 1.0604248046875, 1.2197265625, 1.3790283203125, 1.538330078125, 1.6976318359375, 1.85693359375, 2.0162353515625, 2.175537109375, 2.3348388671875, 2.494140625, 2.6534423828125, 2.812744140625, 2.9720458984375, 3.13134765625, 3.2906494140625, 3.449951171875, 3.6092529296875, 3.7685546875, 3.9278564453125, 4.087158203125, 4.2464599609375, 4.40576171875, 4.5650634765625, 4.724365234375, 4.8836669921875, 5.04296875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 15.0, 19.0, 12.0, 14.0, 19.0, 25.0, 30.0, 38.0, 32.0, 41.0, 51.0, 52.0, 73.0, 97.0, 286.0, 1617.0, 145.0, 66.0, 58.0, 58.0, 35.0, 35.0, 28.0, 30.0, 28.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.80908203125, -21.0869140625, -20.36474609375, -19.642578125, -18.92041015625, -18.1982421875, -17.47607421875, -16.75390625, -16.03173828125, -15.3095703125, -14.58740234375, -13.865234375, -13.14306640625, -12.4208984375, -11.69873046875, -10.9765625, -10.25439453125, -9.5322265625, -8.81005859375, -8.087890625, -7.36572265625, -6.6435546875, -5.92138671875, -5.19921875, -4.47705078125, -3.7548828125, -3.03271484375, -2.310546875, -1.58837890625, -0.8662109375, -0.14404296875, 0.578125, 1.30029296875, 2.0224609375, 2.74462890625, 3.466796875, 4.18896484375, 4.9111328125, 5.63330078125, 6.35546875, 7.07763671875, 7.7998046875, 8.52197265625, 9.244140625, 9.96630859375, 10.6884765625, 11.41064453125, 12.1328125, 12.85498046875, 13.5771484375, 14.29931640625, 15.021484375, 15.74365234375, 16.4658203125, 17.18798828125, 17.91015625, 18.63232421875, 19.3544921875, 20.07666015625, 20.798828125, 21.52099609375, 22.2431640625, 22.96533203125, 23.6875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 5.0, 3.0, 7.0, 12.0, 7.0, 12.0, 18.0, 19.0, 23.0, 22.0, 32.0, 39.0, 61.0, 74.0, 120.0, 133.0, 212.0, 301.0, 560.0, 3099.0, 855099.0, 2280285.0, 3778.0, 567.0, 329.0, 222.0, 148.0, 132.0, 91.0, 57.0, 39.0, 35.0, 38.0, 22.0, 29.0, 16.0, 16.0, 7.0, 12.0, 3.0, 3.0, 6.0, 2.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.40625, -54.69873046875, -52.9912109375, -51.28369140625, -49.576171875, -47.86865234375, -46.1611328125, -44.45361328125, -42.74609375, -41.03857421875, -39.3310546875, -37.62353515625, -35.916015625, -34.20849609375, -32.5009765625, -30.79345703125, -29.0859375, -27.37841796875, -25.6708984375, -23.96337890625, -22.255859375, -20.54833984375, -18.8408203125, -17.13330078125, -15.42578125, -13.71826171875, -12.0107421875, -10.30322265625, -8.595703125, -6.88818359375, -5.1806640625, -3.47314453125, -1.765625, -0.05810546875, 1.6494140625, 3.35693359375, 5.064453125, 6.77197265625, 8.4794921875, 10.18701171875, 11.89453125, 13.60205078125, 15.3095703125, 17.01708984375, 18.724609375, 20.43212890625, 22.1396484375, 23.84716796875, 25.5546875, 27.26220703125, 28.9697265625, 30.67724609375, 32.384765625, 34.09228515625, 35.7998046875, 37.50732421875, 39.21484375, 40.92236328125, 42.6298828125, 44.33740234375, 46.044921875, 47.75244140625, 49.4599609375, 51.16748046875, 52.875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 153.0, 806.0, 55.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.01434326171875, -22.866750717163086, -17.719158172607422, -12.571565628051758, -7.423973083496094, -2.2763805389404297, 2.8712120056152344, 8.018806457519531, 13.166397094726562, 18.313989639282227, 23.46158218383789, 28.609174728393555, 33.75676727294922, 38.90435791015625, 44.05195236206055, 49.199546813964844, 54.347137451171875, 59.494728088378906, 64.64231872558594, 69.7899169921875, 74.93750762939453, 80.08509826660156, 85.23269653320312, 90.38028717041016, 95.52787780761719, 100.67546844482422, 105.82305908203125, 110.97065734863281, 116.11824798583984, 121.26583862304688, 126.41343688964844, 131.56103515625, 136.7086181640625, 141.85621643066406, 147.00379943847656, 152.15139770507812, 157.29898071289062, 162.4465789794922, 167.59417724609375, 172.74176025390625, 177.8893585205078, 183.03695678710938, 188.18453979492188, 193.33213806152344, 198.479736328125, 203.6273193359375, 208.77491760253906, 213.92251586914062, 219.07009887695312, 224.2176971435547, 229.3652801513672, 234.51287841796875, 239.66046142578125, 244.8080596923828, 249.95565795898438, 255.10324096679688, 260.2508544921875, 265.3984375, 270.5460510253906, 275.6936340332031, 280.8412170410156, 285.98883056640625, 291.13641357421875, 296.28399658203125, 301.43157958984375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 5.0, 9.0, 12.0, 18.0, 9.0, 18.0, 14.0, 27.0, 23.0, 24.0, 29.0, 29.0, 32.0, 29.0, 42.0, 33.0, 36.0, 42.0, 39.0, 46.0, 41.0, 32.0, 33.0, 42.0, 29.0, 37.0, 28.0, 24.0, 23.0, 22.0, 16.0, 12.0, 12.0, 12.0, 11.0, 12.0, 8.0, 8.0, 9.0, 3.0, 7.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-43.49616241455078, -42.049827575683594, -40.603492736816406, -39.15715789794922, -37.71082305908203, -36.26448440551758, -34.81814956665039, -33.3718147277832, -31.925479888916016, -30.479145050048828, -29.03281021118164, -27.58647346496582, -26.140138626098633, -24.693803787231445, -23.247467041015625, -21.801132202148438, -20.35479736328125, -18.908462524414062, -17.462127685546875, -16.015790939331055, -14.569456100463867, -13.12312126159668, -11.676785469055176, -10.230449676513672, -8.784114837646484, -7.337779521942139, -5.891444206237793, -4.445108890533447, -2.9987735748291016, -1.5524382591247559, -0.10610294342041016, 1.3402328491210938, 2.7865676879882812, 4.232903003692627, 5.679238319396973, 7.125573635101318, 8.571908950805664, 10.018243789672852, 11.464579582214355, 12.91091537475586, 14.357250213623047, 15.803585052490234, 17.249919891357422, 18.696256637573242, 20.14259147644043, 21.588926315307617, 23.035263061523438, 24.481597900390625, 25.927932739257812, 27.374267578125, 28.820602416992188, 30.266939163208008, 31.713274002075195, 33.159610748291016, 34.6059455871582, 36.05228042602539, 37.49861526489258, 38.944950103759766, 40.39128494262695, 41.83761978149414, 43.283958435058594, 44.73029327392578, 46.17662811279297, 47.622962951660156, 49.069297790527344]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 13.0, 5.0, 10.0, 10.0, 15.0, 18.0, 16.0, 17.0, 29.0, 30.0, 22.0, 30.0, 35.0, 36.0, 32.0, 34.0, 34.0, 38.0, 47.0, 44.0, 45.0, 35.0, 33.0, 29.0, 44.0, 33.0, 28.0, 34.0, 27.0, 26.0, 16.0, 24.0, 17.0, 18.0, 12.0, 11.0, 11.0, 9.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.63201904296875, -5.4281005859375, -5.22418212890625, -5.020263671875, -4.81634521484375, -4.6124267578125, -4.40850830078125, -4.20458984375, -4.00067138671875, -3.7967529296875, -3.59283447265625, -3.388916015625, -3.18499755859375, -2.9810791015625, -2.77716064453125, -2.5732421875, -2.36932373046875, -2.1654052734375, -1.96148681640625, -1.757568359375, -1.55364990234375, -1.3497314453125, -1.14581298828125, -0.94189453125, -0.73797607421875, -0.5340576171875, -0.33013916015625, -0.126220703125, 0.07769775390625, 0.2816162109375, 0.48553466796875, 0.689453125, 0.89337158203125, 1.0972900390625, 1.30120849609375, 1.505126953125, 1.70904541015625, 1.9129638671875, 2.11688232421875, 2.32080078125, 2.52471923828125, 2.7286376953125, 2.93255615234375, 3.136474609375, 3.34039306640625, 3.5443115234375, 3.74822998046875, 3.9521484375, 4.15606689453125, 4.3599853515625, 4.56390380859375, 4.767822265625, 4.97174072265625, 5.1756591796875, 5.37957763671875, 5.58349609375, 5.78741455078125, 5.9913330078125, 6.19525146484375, 6.399169921875, 6.60308837890625, 6.8070068359375, 7.01092529296875, 7.21484375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 0.0, 5.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 12.0, 12.0, 33.0, 26.0, 32.0, 46.0, 56.0, 93.0, 205.0, 436.0, 1288.0, 4578.0, 27088.0, 519366.0, 3174116.0, 436548.0, 23766.0, 4187.0, 1221.0, 489.0, 215.0, 105.0, 59.0, 52.0, 37.0, 19.0, 28.0, 20.0, 17.0, 14.0, 14.0, 12.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.921875, -15.296875, -14.671875, -14.046875, -13.421875, -12.796875, -12.171875, -11.546875, -10.921875, -10.296875, -9.671875, -9.046875, -8.421875, -7.796875, -7.171875, -6.546875, -5.921875, -5.296875, -4.671875, -4.046875, -3.421875, -2.796875, -2.171875, -1.546875, -0.921875, -0.296875, 0.328125, 0.953125, 1.578125, 2.203125, 2.828125, 3.453125, 4.078125, 4.703125, 5.328125, 5.953125, 6.578125, 7.203125, 7.828125, 8.453125, 9.078125, 9.703125, 10.328125, 10.953125, 11.578125, 12.203125, 12.828125, 13.453125, 14.078125, 14.703125, 15.328125, 15.953125, 16.578125, 17.203125, 17.828125, 18.453125, 19.078125, 19.703125, 20.328125, 20.953125, 21.578125, 22.203125, 22.828125, 23.453125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 4.0, 11.0, 12.0, 9.0, 16.0, 13.0, 32.0, 35.0, 32.0, 39.0, 56.0, 86.0, 87.0, 115.0, 152.0, 187.0, 251.0, 333.0, 392.0, 407.0, 387.0, 323.0, 224.0, 202.0, 149.0, 114.0, 97.0, 52.0, 60.0, 35.0, 31.0, 22.0, 20.0, 14.0, 17.0, 10.0, 12.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.921875, -10.594482421875, -10.26708984375, -9.939697265625, -9.6123046875, -9.284912109375, -8.95751953125, -8.630126953125, -8.302734375, -7.975341796875, -7.64794921875, -7.320556640625, -6.9931640625, -6.665771484375, -6.33837890625, -6.010986328125, -5.68359375, -5.356201171875, -5.02880859375, -4.701416015625, -4.3740234375, -4.046630859375, -3.71923828125, -3.391845703125, -3.064453125, -2.737060546875, -2.40966796875, -2.082275390625, -1.7548828125, -1.427490234375, -1.10009765625, -0.772705078125, -0.4453125, -0.117919921875, 0.20947265625, 0.536865234375, 0.8642578125, 1.191650390625, 1.51904296875, 1.846435546875, 2.173828125, 2.501220703125, 2.82861328125, 3.156005859375, 3.4833984375, 3.810791015625, 4.13818359375, 4.465576171875, 4.79296875, 5.120361328125, 5.44775390625, 5.775146484375, 6.1025390625, 6.429931640625, 6.75732421875, 7.084716796875, 7.412109375, 7.739501953125, 8.06689453125, 8.394287109375, 8.7216796875, 9.049072265625, 9.37646484375, 9.703857421875, 10.03125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 9.0, 16.0, 15.0, 15.0, 19.0, 25.0, 31.0, 47.0, 58.0, 65.0, 78.0, 105.0, 125.0, 182.0, 219.0, 305.0, 402.0, 1587.0, 41038.0, 3824102.0, 319366.0, 4392.0, 592.0, 311.0, 219.0, 191.0, 159.0, 107.0, 98.0, 81.0, 65.0, 61.0, 39.0, 36.0, 32.0, 17.0, 21.0, 7.0, 11.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.84375, -47.30322265625, -45.7626953125, -44.22216796875, -42.681640625, -41.14111328125, -39.6005859375, -38.06005859375, -36.51953125, -34.97900390625, -33.4384765625, -31.89794921875, -30.357421875, -28.81689453125, -27.2763671875, -25.73583984375, -24.1953125, -22.65478515625, -21.1142578125, -19.57373046875, -18.033203125, -16.49267578125, -14.9521484375, -13.41162109375, -11.87109375, -10.33056640625, -8.7900390625, -7.24951171875, -5.708984375, -4.16845703125, -2.6279296875, -1.08740234375, 0.453125, 1.99365234375, 3.5341796875, 5.07470703125, 6.615234375, 8.15576171875, 9.6962890625, 11.23681640625, 12.77734375, 14.31787109375, 15.8583984375, 17.39892578125, 18.939453125, 20.47998046875, 22.0205078125, 23.56103515625, 25.1015625, 26.64208984375, 28.1826171875, 29.72314453125, 31.263671875, 32.80419921875, 34.3447265625, 35.88525390625, 37.42578125, 38.96630859375, 40.5068359375, 42.04736328125, 43.587890625, 45.12841796875, 46.6689453125, 48.20947265625, 49.75]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 12.0, 43.0, 81.0, 157.0, 204.0, 213.0, 153.0, 89.0, 36.0, 14.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.66555786132812, -93.73625183105469, -90.80694580078125, -87.87764739990234, -84.9483413696289, -82.01903533935547, -79.08973693847656, -76.16043090820312, -73.23112487792969, -70.30181884765625, -67.37251281738281, -64.4432144165039, -61.51390838623047, -58.58460235595703, -55.65530014038086, -52.72599792480469, -49.79669189453125, -46.86738586425781, -43.93808364868164, -41.00878143310547, -38.07947540283203, -35.150169372558594, -32.22086715698242, -29.291563034057617, -26.362258911132812, -23.432954788208008, -20.503650665283203, -17.5743465423584, -14.645042419433594, -11.715738296508789, -8.786434173583984, -5.85713005065918, -2.9278182983398438, 0.0014858245849609375, 2.9307899475097656, 5.86009407043457, 8.789398193359375, 11.71870231628418, 14.648006439208984, 17.57731056213379, 20.506614685058594, 23.4359188079834, 26.365222930908203, 29.294527053833008, 32.22383117675781, 35.15313720703125, 38.08243942260742, 41.011741638183594, 43.94104766845703, 46.87035369873047, 49.79965591430664, 52.72895812988281, 55.65826416015625, 58.58757019042969, 61.51687240600586, 64.44617462158203, 67.37548065185547, 70.3047866821289, 73.23408508300781, 76.16339111328125, 79.09269714355469, 82.02200317382812, 84.95130920410156, 87.88060760498047, 90.8099136352539]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 8.0, 6.0, 11.0, 16.0, 15.0, 20.0, 19.0, 29.0, 26.0, 33.0, 32.0, 35.0, 34.0, 43.0, 30.0, 43.0, 42.0, 30.0, 51.0, 29.0, 55.0, 36.0, 31.0, 34.0, 30.0, 31.0, 32.0, 22.0, 26.0, 19.0, 14.0, 21.0, 18.0, 17.0, 11.0, 12.0, 6.0, 3.0, 6.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.440338134765625, -39.168846130371094, -37.8973503112793, -36.625858306884766, -35.35436248779297, -34.08287048339844, -32.811378479003906, -31.539884567260742, -30.268390655517578, -28.996896743774414, -27.72540283203125, -26.45391082763672, -25.182416915893555, -23.91092300415039, -22.63943099975586, -21.367937088012695, -20.09644317626953, -18.824949264526367, -17.553455352783203, -16.281963348388672, -15.010469436645508, -13.738975524902344, -12.467482566833496, -11.195989608764648, -9.924495697021484, -8.65300178527832, -7.381508827209473, -6.110015392303467, -4.838521957397461, -3.567028522491455, -2.295535087585449, -1.0240421295166016, 0.2474517822265625, 1.5189452171325684, 2.790438652038574, 4.06193208694458, 5.333425521850586, 6.604918956756592, 7.876412391662598, 9.147905349731445, 10.41939926147461, 11.690893173217773, 12.962386131286621, 14.233879089355469, 15.505373001098633, 16.776866912841797, 18.048358917236328, 19.319852828979492, 20.591346740722656, 21.86284065246582, 23.134334564208984, 24.405826568603516, 25.67732048034668, 26.948814392089844, 28.220306396484375, 29.49180030822754, 30.763294219970703, 32.034786224365234, 33.30628204345703, 34.57777404785156, 35.849266052246094, 37.12076187133789, 38.39225387573242, 39.66374969482422, 40.93524169921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 33.0, 23.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 10.0, 22.0, 24.0, 52.0, 81.0, 118.0, 156.0, 279.0, 438.0, 682.0, 953.0, 1517.0, 2365.0, 3675.0, 5810.0, 9203.0, 14509.0, 23276.0, 37834.0, 61601.0, 98723.0, 147986.0, 184909.0, 159820.0, 111352.0, 69369.0, 42787.0, 26219.0, 16148.0, 10262.0, 6518.0, 4285.0, 2613.0, 1772.0, 1082.0, 724.0, 473.0, 305.0, 204.0, 138.0, 87.0, 53.0, 39.0, 21.0, 14.0, 16.0, 10.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.72900390625, -0.7085418701171875, -0.688079833984375, -0.6676177978515625, -0.64715576171875, -0.6266937255859375, -0.606231689453125, -0.5857696533203125, -0.5653076171875, -0.5448455810546875, -0.524383544921875, -0.5039215087890625, -0.48345947265625, -0.4629974365234375, -0.442535400390625, -0.4220733642578125, -0.401611328125, -0.3811492919921875, -0.360687255859375, -0.3402252197265625, -0.31976318359375, -0.2993011474609375, -0.278839111328125, -0.2583770751953125, -0.2379150390625, -0.2174530029296875, -0.196990966796875, -0.1765289306640625, -0.15606689453125, -0.1356048583984375, -0.115142822265625, -0.0946807861328125, -0.07421875, -0.0537567138671875, -0.033294677734375, -0.0128326416015625, 0.00762939453125, 0.0280914306640625, 0.048553466796875, 0.0690155029296875, 0.0894775390625, 0.1099395751953125, 0.130401611328125, 0.1508636474609375, 0.17132568359375, 0.1917877197265625, 0.212249755859375, 0.2327117919921875, 0.253173828125, 0.2736358642578125, 0.294097900390625, 0.3145599365234375, 0.33502197265625, 0.3554840087890625, 0.375946044921875, 0.3964080810546875, 0.4168701171875, 0.4373321533203125, 0.457794189453125, 0.4782562255859375, 0.49871826171875, 0.5191802978515625, 0.539642333984375, 0.5601043701171875, 0.58056640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 4.0, 6.0, 14.0, 15.0, 11.0, 11.0, 17.0, 23.0, 25.0, 26.0, 25.0, 22.0, 21.0, 33.0, 26.0, 39.0, 45.0, 40.0, 35.0, 27.0, 1084.0, 27.0, 33.0, 46.0, 34.0, 27.0, 28.0, 30.0, 19.0, 22.0, 24.0, 25.0, 27.0, 17.0, 15.0, 17.0, 11.0, 14.0, 13.0, 12.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4765625, -3.36114501953125, -3.2457275390625, -3.13031005859375, -3.014892578125, -2.89947509765625, -2.7840576171875, -2.66864013671875, -2.55322265625, -2.43780517578125, -2.3223876953125, -2.20697021484375, -2.091552734375, -1.97613525390625, -1.8607177734375, -1.74530029296875, -1.6298828125, -1.51446533203125, -1.3990478515625, -1.28363037109375, -1.168212890625, -1.05279541015625, -0.9373779296875, -0.82196044921875, -0.70654296875, -0.59112548828125, -0.4757080078125, -0.36029052734375, -0.244873046875, -0.12945556640625, -0.0140380859375, 0.10137939453125, 0.216796875, 0.33221435546875, 0.4476318359375, 0.56304931640625, 0.678466796875, 0.79388427734375, 0.9093017578125, 1.02471923828125, 1.14013671875, 1.25555419921875, 1.3709716796875, 1.48638916015625, 1.601806640625, 1.71722412109375, 1.8326416015625, 1.94805908203125, 2.0634765625, 2.17889404296875, 2.2943115234375, 2.40972900390625, 2.525146484375, 2.64056396484375, 2.7559814453125, 2.87139892578125, 2.98681640625, 3.10223388671875, 3.2176513671875, 3.33306884765625, 3.448486328125, 3.56390380859375, 3.6793212890625, 3.79473876953125, 3.91015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 16.0, 27.0, 31.0, 53.0, 110.0, 177.0, 299.0, 533.0, 946.0, 1620.0, 2911.0, 4782.0, 8338.0, 13508.0, 22538.0, 37024.0, 60519.0, 97000.0, 143703.0, 1224228.0, 164383.0, 118833.0, 76963.0, 47148.0, 28668.0, 17491.0, 10565.0, 6140.0, 3560.0, 2031.0, 1282.0, 699.0, 411.0, 214.0, 161.0, 92.0, 31.0, 32.0, 17.0, 19.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5201873779296875, -0.503265380859375, -0.4863433837890625, -0.46942138671875, -0.4524993896484375, -0.435577392578125, -0.4186553955078125, -0.4017333984375, -0.3848114013671875, -0.367889404296875, -0.3509674072265625, -0.33404541015625, -0.3171234130859375, -0.300201416015625, -0.2832794189453125, -0.266357421875, -0.2494354248046875, -0.232513427734375, -0.2155914306640625, -0.19866943359375, -0.1817474365234375, -0.164825439453125, -0.1479034423828125, -0.1309814453125, -0.1140594482421875, -0.097137451171875, -0.0802154541015625, -0.06329345703125, -0.0463714599609375, -0.029449462890625, -0.0125274658203125, 0.00439453125, 0.0213165283203125, 0.038238525390625, 0.0551605224609375, 0.07208251953125, 0.0890045166015625, 0.105926513671875, 0.1228485107421875, 0.1397705078125, 0.1566925048828125, 0.173614501953125, 0.1905364990234375, 0.20745849609375, 0.2243804931640625, 0.241302490234375, 0.2582244873046875, 0.275146484375, 0.2920684814453125, 0.308990478515625, 0.3259124755859375, 0.34283447265625, 0.3597564697265625, 0.376678466796875, 0.3936004638671875, 0.4105224609375, 0.4274444580078125, 0.444366455078125, 0.4612884521484375, 0.47821044921875, 0.4951324462890625, 0.512054443359375, 0.5289764404296875, 0.5458984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 5.0, 9.0, 7.0, 13.0, 17.0, 21.0, 15.0, 20.0, 25.0, 43.0, 53.0, 67.0, 56.0, 68.0, 75.0, 66.0, 61.0, 62.0, 60.0, 34.0, 28.0, 31.0, 21.0, 24.0, 15.0, 16.0, 16.0, 9.0, 16.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.003993988037109375, -0.0038833022117614746, -0.0037726163864135742, -0.003661930561065674, -0.0035512447357177734, -0.003440558910369873, -0.0033298730850219727, -0.0032191872596740723, -0.003108501434326172, -0.0029978156089782715, -0.002887129783630371, -0.0027764439582824707, -0.0026657581329345703, -0.00255507230758667, -0.0024443864822387695, -0.002333700656890869, -0.0022230148315429688, -0.0021123290061950684, -0.002001643180847168, -0.0018909573554992676, -0.0017802715301513672, -0.0016695857048034668, -0.0015588998794555664, -0.001448214054107666, -0.0013375282287597656, -0.0012268424034118652, -0.0011161565780639648, -0.0010054707527160645, -0.0008947849273681641, -0.0007840991020202637, -0.0006734132766723633, -0.0005627274513244629, -0.0004520416259765625, -0.0003413558006286621, -0.00023066997528076172, -0.00011998414993286133, -9.298324584960938e-06, 0.00010138750076293945, 0.00021207332611083984, 0.00032275915145874023, 0.0004334449768066406, 0.000544130802154541, 0.0006548166275024414, 0.0007655024528503418, 0.0008761882781982422, 0.0009868741035461426, 0.001097559928894043, 0.0012082457542419434, 0.0013189315795898438, 0.0014296174049377441, 0.0015403032302856445, 0.001650989055633545, 0.0017616748809814453, 0.0018723607063293457, 0.001983046531677246, 0.0020937323570251465, 0.002204418182373047, 0.0023151040077209473, 0.0024257898330688477, 0.002536475658416748, 0.0026471614837646484, 0.002757847309112549, 0.0028685331344604492, 0.0029792189598083496, 0.00308990478515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 16.0, 16.0, 14.0, 21.0, 28.0, 46.0, 40.0, 68.0, 80.0, 107.0, 238.0, 1016.0, 47103.0, 990464.0, 8096.0, 524.0, 197.0, 116.0, 96.0, 51.0, 43.0, 24.0, 27.0, 12.0, 17.0, 14.0, 12.0, 6.0, 7.0, 8.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06951904296875, -0.0668783187866211, -0.06423759460449219, -0.06159687042236328, -0.058956146240234375, -0.05631542205810547, -0.05367469787597656, -0.051033973693847656, -0.04839324951171875, -0.045752525329589844, -0.04311180114746094, -0.04047107696533203, -0.037830352783203125, -0.03518962860107422, -0.03254890441894531, -0.029908180236816406, -0.0272674560546875, -0.024626731872558594, -0.021986007690429688, -0.01934528350830078, -0.016704559326171875, -0.014063835144042969, -0.011423110961914062, -0.008782386779785156, -0.00614166259765625, -0.0035009384155273438, -0.0008602142333984375, 0.0017805099487304688, 0.004421234130859375, 0.007061958312988281, 0.009702682495117188, 0.012343406677246094, 0.014984130859375, 0.017624855041503906, 0.020265579223632812, 0.02290630340576172, 0.025547027587890625, 0.02818775177001953, 0.030828475952148438, 0.033469200134277344, 0.03610992431640625, 0.038750648498535156, 0.04139137268066406, 0.04403209686279297, 0.046672821044921875, 0.04931354522705078, 0.05195426940917969, 0.054594993591308594, 0.0572357177734375, 0.059876441955566406, 0.06251716613769531, 0.06515789031982422, 0.06779861450195312, 0.07043933868408203, 0.07308006286621094, 0.07572078704833984, 0.07836151123046875, 0.08100223541259766, 0.08364295959472656, 0.08628368377685547, 0.08892440795898438, 0.09156513214111328, 0.09420585632324219, 0.0968465805053711, 0.0994873046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 38.0, 518.0, 418.0, 34.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002878597006201744, -0.0021503595635294914, -0.0014221223536878824, -0.0006938851438462734, 3.435229882597923e-05, 0.0007625897414982319, 0.0014908267185091972, 0.00221906416118145, 0.0029473016038537025, 0.003675539046525955, 0.004403776489198208, 0.005132013466209173, 0.005860250908881426, 0.0065884883515536785, 0.007316725328564644, 0.008044962771236897, 0.00877320021390915, 0.009501437656581402, 0.010229675099253654, 0.010957911610603333, 0.01168614998459816, 0.012414386495947838, 0.01314262393862009, 0.013870861381292343, 0.014599098823964596, 0.015327336266636848, 0.016055572777986526, 0.016783811151981354, 0.017512047663331032, 0.01824028603732586, 0.018968522548675537, 0.019696760922670364, 0.02042499929666519, 0.02115323580801487, 0.021881474182009697, 0.022609710693359375, 0.023337949067354202, 0.02406618557870388, 0.02479442209005356, 0.025522660464048386, 0.026250898838043213, 0.02697913534939289, 0.027707373723387718, 0.028435610234737396, 0.029163848608732224, 0.0298920851200819, 0.03062032163143158, 0.03134856000542641, 0.032076798379421234, 0.03280503675341606, 0.03353327140212059, 0.03426150977611542, 0.034989748150110245, 0.03571798652410507, 0.0364462211728096, 0.03717445954680443, 0.03790269419550896, 0.038630932569503784, 0.03935916721820831, 0.04008740559220314, 0.04081564396619797, 0.041543882340192795, 0.042272116988897324, 0.04300035536289215, 0.04372859373688698]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 16.0, 15.0, 26.0, 28.0, 33.0, 37.0, 39.0, 56.0, 63.0, 63.0, 62.0, 61.0, 76.0, 70.0, 67.0, 42.0, 45.0, 57.0, 26.0, 19.0, 21.0, 15.0, 17.0, 9.0, 8.0, 8.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00315779447555542, -0.0030496595427393913, -0.0029415246099233627, -0.002833389677107334, -0.0027252547442913055, -0.002617119811475277, -0.0025089848786592484, -0.0024008499458432198, -0.002292715013027191, -0.0021845800802111626, -0.002076445147395134, -0.0019683102145791054, -0.0018601752817630768, -0.0017520403489470482, -0.0016439054161310196, -0.001535770483314991, -0.0014276355504989624, -0.0013195006176829338, -0.0012113656848669052, -0.0011032307520508766, -0.000995095819234848, -0.0008869608864188194, -0.0007788259536027908, -0.0006706910207867622, -0.0005625560879707336, -0.00045442115515470505, -0.00034628622233867645, -0.00023815128952264786, -0.00013001635670661926, -2.1881423890590668e-05, 8.625350892543793e-05, 0.00019438844174146652, 0.0003025233745574951, 0.0004106583073735237, 0.0005187932401895523, 0.0006269281730055809, 0.0007350631058216095, 0.0008431980386376381, 0.0009513329714536667, 0.0010594679042696953, 0.0011676028370857239, 0.0012757377699017525, 0.001383872702717781, 0.0014920076355338097, 0.0016001425683498383, 0.0017082775011658669, 0.0018164124339818954, 0.001924547366797924, 0.0020326822996139526, 0.0021408172324299812, 0.00224895216524601, 0.0023570870980620384, 0.002465222030878067, 0.0025733569636940956, 0.002681491896510124, 0.002789626829326153, 0.0028977617621421814, 0.00300589669495821, 0.0031140316277742386, 0.003222166560590267, 0.0033303014934062958, 0.0034384364262223244, 0.003546571359038353, 0.0036547062918543816, 0.00376284122467041]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 32.0, 24.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 18.0, 23.0, 34.0, 32.0, 53.0, 57.0, 81.0, 125.0, 171.0, 283.0, 430.0, 882.0, 1753.0, 3752.0, 8442.0, 20365.0, 53640.0, 156912.0, 488872.0, 202755.0, 65841.0, 24978.0, 10138.0, 4431.0, 2025.0, 934.0, 495.0, 320.0, 203.0, 132.0, 81.0, 57.0, 50.0, 40.0, 29.0, 27.0, 17.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.208251953125, -5.99853515625, -5.788818359375, -5.5791015625, -5.369384765625, -5.15966796875, -4.949951171875, -4.740234375, -4.530517578125, -4.32080078125, -4.111083984375, -3.9013671875, -3.691650390625, -3.48193359375, -3.272216796875, -3.0625, -2.852783203125, -2.64306640625, -2.433349609375, -2.2236328125, -2.013916015625, -1.80419921875, -1.594482421875, -1.384765625, -1.175048828125, -0.96533203125, -0.755615234375, -0.5458984375, -0.336181640625, -0.12646484375, 0.083251953125, 0.29296875, 0.502685546875, 0.71240234375, 0.922119140625, 1.1318359375, 1.341552734375, 1.55126953125, 1.760986328125, 1.970703125, 2.180419921875, 2.39013671875, 2.599853515625, 2.8095703125, 3.019287109375, 3.22900390625, 3.438720703125, 3.6484375, 3.858154296875, 4.06787109375, 4.277587890625, 4.4873046875, 4.697021484375, 4.90673828125, 5.116455078125, 5.326171875, 5.535888671875, 5.74560546875, 5.955322265625, 6.1650390625, 6.374755859375, 6.58447265625, 6.794189453125, 7.00390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 10.0, 10.0, 7.0, 7.0, 6.0, 8.0, 15.0, 16.0, 19.0, 14.0, 33.0, 30.0, 30.0, 31.0, 39.0, 34.0, 56.0, 50.0, 109.0, 384.0, 1582.0, 110.0, 59.0, 55.0, 42.0, 36.0, 42.0, 25.0, 23.0, 24.0, 16.0, 14.0, 13.0, 25.0, 14.0, 13.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.22216796875, -17.6162109375, -17.01025390625, -16.404296875, -15.79833984375, -15.1923828125, -14.58642578125, -13.98046875, -13.37451171875, -12.7685546875, -12.16259765625, -11.556640625, -10.95068359375, -10.3447265625, -9.73876953125, -9.1328125, -8.52685546875, -7.9208984375, -7.31494140625, -6.708984375, -6.10302734375, -5.4970703125, -4.89111328125, -4.28515625, -3.67919921875, -3.0732421875, -2.46728515625, -1.861328125, -1.25537109375, -0.6494140625, -0.04345703125, 0.5625, 1.16845703125, 1.7744140625, 2.38037109375, 2.986328125, 3.59228515625, 4.1982421875, 4.80419921875, 5.41015625, 6.01611328125, 6.6220703125, 7.22802734375, 7.833984375, 8.43994140625, 9.0458984375, 9.65185546875, 10.2578125, 10.86376953125, 11.4697265625, 12.07568359375, 12.681640625, 13.28759765625, 13.8935546875, 14.49951171875, 15.10546875, 15.71142578125, 16.3173828125, 16.92333984375, 17.529296875, 18.13525390625, 18.7412109375, 19.34716796875, 19.953125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 8.0, 7.0, 16.0, 11.0, 17.0, 19.0, 26.0, 31.0, 30.0, 35.0, 45.0, 72.0, 90.0, 143.0, 218.0, 326.0, 663.0, 1176.0, 6112.0, 2706212.0, 424309.0, 3461.0, 1071.0, 562.0, 300.0, 182.0, 141.0, 87.0, 68.0, 35.0, 42.0, 42.0, 24.0, 8.0, 23.0, 22.0, 13.0, 10.0, 4.0, 8.0, 8.0, 4.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-45.71875, -44.28564453125, -42.8525390625, -41.41943359375, -39.986328125, -38.55322265625, -37.1201171875, -35.68701171875, -34.25390625, -32.82080078125, -31.3876953125, -29.95458984375, -28.521484375, -27.08837890625, -25.6552734375, -24.22216796875, -22.7890625, -21.35595703125, -19.9228515625, -18.48974609375, -17.056640625, -15.62353515625, -14.1904296875, -12.75732421875, -11.32421875, -9.89111328125, -8.4580078125, -7.02490234375, -5.591796875, -4.15869140625, -2.7255859375, -1.29248046875, 0.140625, 1.57373046875, 3.0068359375, 4.43994140625, 5.873046875, 7.30615234375, 8.7392578125, 10.17236328125, 11.60546875, 13.03857421875, 14.4716796875, 15.90478515625, 17.337890625, 18.77099609375, 20.2041015625, 21.63720703125, 23.0703125, 24.50341796875, 25.9365234375, 27.36962890625, 28.802734375, 30.23583984375, 31.6689453125, 33.10205078125, 34.53515625, 35.96826171875, 37.4013671875, 38.83447265625, 40.267578125, 41.70068359375, 43.1337890625, 44.56689453125, 46.0]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 22.0, 42.0, 62.0, 84.0, 107.0, 155.0, 175.0, 126.0, 85.0, 69.0, 38.0, 20.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.023704528808594, -35.27062225341797, -34.51754379272461, -33.764461517333984, -33.011383056640625, -32.25830078125, -31.505218505859375, -30.752138137817383, -29.99905776977539, -29.2459774017334, -28.492897033691406, -27.73981475830078, -26.98673439025879, -26.233654022216797, -25.480571746826172, -24.72749137878418, -23.974411010742188, -23.221330642700195, -22.468250274658203, -21.715167999267578, -20.962087631225586, -20.209007263183594, -19.45592498779297, -18.702844619750977, -17.949764251708984, -17.196683883666992, -16.443603515625, -15.690521240234375, -14.937440872192383, -14.18436050415039, -13.431279182434082, -12.678197860717773, -11.925118446350098, -11.172037124633789, -10.418956756591797, -9.665876388549805, -8.912795066833496, -8.159713745117188, -7.406633377075195, -6.653552532196045, -5.9004716873168945, -5.147390842437744, -4.394309997558594, -3.6412291526794434, -2.888148307800293, -2.1350674629211426, -1.3819866180419922, -0.6289057731628418, 0.1241750717163086, 0.877255916595459, 1.6303367614746094, 2.3834176063537598, 3.13649845123291, 3.8895792961120605, 4.642660140991211, 5.395740985870361, 6.148821830749512, 6.901902675628662, 7.6549835205078125, 8.408063888549805, 9.161145210266113, 9.914226531982422, 10.667306900024414, 11.420387268066406, 12.173468589782715]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 5.0, 15.0, 9.0, 11.0, 18.0, 14.0, 10.0, 11.0, 23.0, 19.0, 19.0, 29.0, 21.0, 24.0, 42.0, 29.0, 32.0, 45.0, 43.0, 33.0, 31.0, 36.0, 34.0, 38.0, 30.0, 40.0, 33.0, 36.0, 26.0, 26.0, 23.0, 17.0, 17.0, 18.0, 20.0, 14.0, 22.0, 15.0, 16.0, 11.0, 6.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-46.38966751098633, -44.90962600708008, -43.42958450317383, -41.94954299926758, -40.46950149536133, -38.98945999145508, -37.50941848754883, -36.02937698364258, -34.54933547973633, -33.06929397583008, -31.589252471923828, -30.109210968017578, -28.629169464111328, -27.149127960205078, -25.669086456298828, -24.189044952392578, -22.709001541137695, -21.228960037231445, -19.748918533325195, -18.268877029418945, -16.788835525512695, -15.308794021606445, -13.828751564025879, -12.348710060119629, -10.868668556213379, -9.388627052307129, -7.908585548400879, -6.428543567657471, -4.948502063751221, -3.4684605598449707, -1.9884185791015625, -0.5083770751953125, 0.9716644287109375, 2.4517059326171875, 3.9317476749420166, 5.411789417266846, 6.891830921173096, 8.371871948242188, 9.851914405822754, 11.331955909729004, 12.811997413635254, 14.292038917541504, 15.772080421447754, 17.25212287902832, 18.73216438293457, 20.21220588684082, 21.69224739074707, 23.17228889465332, 24.65233039855957, 26.13237190246582, 27.61241340637207, 29.09245491027832, 30.57249641418457, 32.05253982543945, 33.5325813293457, 35.01262283325195, 36.4926643371582, 37.97270584106445, 39.4527473449707, 40.93278884887695, 42.4128303527832, 43.89287185668945, 45.3729133605957, 46.85295486450195, 48.3329963684082]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 7.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 20.0, 19.0, 16.0, 28.0, 27.0, 19.0, 35.0, 23.0, 30.0, 40.0, 42.0, 43.0, 65.0, 37.0, 39.0, 47.0, 45.0, 50.0, 34.0, 36.0, 33.0, 29.0, 25.0, 17.0, 21.0, 23.0, 22.0, 13.0, 20.0, 8.0, 8.0, 15.0, 3.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.87109375, -5.6484375, -5.42578125, -5.203125, -4.98046875, -4.7578125, -4.53515625, -4.3125, -4.08984375, -3.8671875, -3.64453125, -3.421875, -3.19921875, -2.9765625, -2.75390625, -2.53125, -2.30859375, -2.0859375, -1.86328125, -1.640625, -1.41796875, -1.1953125, -0.97265625, -0.75, -0.52734375, -0.3046875, -0.08203125, 0.140625, 0.36328125, 0.5859375, 0.80859375, 1.03125, 1.25390625, 1.4765625, 1.69921875, 1.921875, 2.14453125, 2.3671875, 2.58984375, 2.8125, 3.03515625, 3.2578125, 3.48046875, 3.703125, 3.92578125, 4.1484375, 4.37109375, 4.59375, 4.81640625, 5.0390625, 5.26171875, 5.484375, 5.70703125, 5.9296875, 6.15234375, 6.375, 6.59765625, 6.8203125, 7.04296875, 7.265625, 7.48828125, 7.7109375, 7.93359375, 8.15625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 2.0, 13.0, 12.0, 18.0, 12.0, 35.0, 29.0, 43.0, 29.0, 57.0, 95.0, 120.0, 246.0, 557.0, 1970.0, 11276.0, 205060.0, 3335625.0, 613287.0, 20985.0, 3108.0, 824.0, 296.0, 169.0, 97.0, 73.0, 43.0, 30.0, 31.0, 24.0, 26.0, 16.0, 12.0, 13.0, 4.0, 8.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -18.828125, -18.09375, -17.359375, -16.625, -15.890625, -15.15625, -14.421875, -13.6875, -12.953125, -12.21875, -11.484375, -10.75, -10.015625, -9.28125, -8.546875, -7.8125, -7.078125, -6.34375, -5.609375, -4.875, -4.140625, -3.40625, -2.671875, -1.9375, -1.203125, -0.46875, 0.265625, 1.0, 1.734375, 2.46875, 3.203125, 3.9375, 4.671875, 5.40625, 6.140625, 6.875, 7.609375, 8.34375, 9.078125, 9.8125, 10.546875, 11.28125, 12.015625, 12.75, 13.484375, 14.21875, 14.953125, 15.6875, 16.421875, 17.15625, 17.890625, 18.625, 19.359375, 20.09375, 20.828125, 21.5625, 22.296875, 23.03125, 23.765625, 24.5, 25.234375, 25.96875, 26.703125, 27.4375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 8.0, 7.0, 7.0, 7.0, 13.0, 14.0, 16.0, 38.0, 35.0, 55.0, 76.0, 91.0, 140.0, 197.0, 271.0, 377.0, 507.0, 531.0, 475.0, 380.0, 262.0, 146.0, 125.0, 88.0, 46.0, 40.0, 38.0, 30.0, 17.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7578125, -13.3326416015625, -12.907470703125, -12.4822998046875, -12.05712890625, -11.6319580078125, -11.206787109375, -10.7816162109375, -10.3564453125, -9.9312744140625, -9.506103515625, -9.0809326171875, -8.65576171875, -8.2305908203125, -7.805419921875, -7.3802490234375, -6.955078125, -6.5299072265625, -6.104736328125, -5.6795654296875, -5.25439453125, -4.8292236328125, -4.404052734375, -3.9788818359375, -3.5537109375, -3.1285400390625, -2.703369140625, -2.2781982421875, -1.85302734375, -1.4278564453125, -1.002685546875, -0.5775146484375, -0.15234375, 0.2728271484375, 0.697998046875, 1.1231689453125, 1.54833984375, 1.9735107421875, 2.398681640625, 2.8238525390625, 3.2490234375, 3.6741943359375, 4.099365234375, 4.5245361328125, 4.94970703125, 5.3748779296875, 5.800048828125, 6.2252197265625, 6.650390625, 7.0755615234375, 7.500732421875, 7.9259033203125, 8.35107421875, 8.7762451171875, 9.201416015625, 9.6265869140625, 10.0517578125, 10.4769287109375, 10.902099609375, 11.3272705078125, 11.75244140625, 12.1776123046875, 12.602783203125, 13.0279541015625, 13.453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 13.0, 14.0, 25.0, 32.0, 46.0, 50.0, 74.0, 117.0, 156.0, 257.0, 317.0, 623.0, 5154.0, 3121429.0, 1061055.0, 3227.0, 495.0, 302.0, 248.0, 165.0, 120.0, 114.0, 68.0, 52.0, 38.0, 22.0, 11.0, 10.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -72.0458984375, -69.716796875, -67.3876953125, -65.05859375, -62.7294921875, -60.400390625, -58.0712890625, -55.7421875, -53.4130859375, -51.083984375, -48.7548828125, -46.42578125, -44.0966796875, -41.767578125, -39.4384765625, -37.109375, -34.7802734375, -32.451171875, -30.1220703125, -27.79296875, -25.4638671875, -23.134765625, -20.8056640625, -18.4765625, -16.1474609375, -13.818359375, -11.4892578125, -9.16015625, -6.8310546875, -4.501953125, -2.1728515625, 0.15625, 2.4853515625, 4.814453125, 7.1435546875, 9.47265625, 11.8017578125, 14.130859375, 16.4599609375, 18.7890625, 21.1181640625, 23.447265625, 25.7763671875, 28.10546875, 30.4345703125, 32.763671875, 35.0927734375, 37.421875, 39.7509765625, 42.080078125, 44.4091796875, 46.73828125, 49.0673828125, 51.396484375, 53.7255859375, 56.0546875, 58.3837890625, 60.712890625, 63.0419921875, 65.37109375, 67.7001953125, 70.029296875, 72.3583984375, 74.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 11.0, 30.0, 92.0, 202.0, 281.0, 206.0, 116.0, 45.0, 19.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.51287841796875, -168.0595703125, -164.60626220703125, -161.15296936035156, -157.6996612548828, -154.24635314941406, -150.7930450439453, -147.33973693847656, -143.88644409179688, -140.43313598632812, -136.97982788085938, -133.5265350341797, -130.07322692871094, -126.61991882324219, -123.16661071777344, -119.71331024169922, -116.25999450683594, -112.80668640136719, -109.35338592529297, -105.90007781982422, -102.44677734375, -98.99346923828125, -95.5401611328125, -92.08686065673828, -88.63356018066406, -85.18025207519531, -81.7269515991211, -78.27364349365234, -74.82034301757812, -71.36703491210938, -67.91372680664062, -64.4604263305664, -61.007118225097656, -57.55381393432617, -54.10050964355469, -50.64720153808594, -47.19389724731445, -43.74059295654297, -40.287288665771484, -36.833984375, -33.38067626953125, -29.927371978759766, -26.47406578063965, -23.020761489868164, -19.567455291748047, -16.114151000976562, -12.660846710205078, -9.207540512084961, -5.754238128662109, -2.3009331226348877, 1.152371883392334, 4.605676651000977, 8.058981895446777, 11.512287139892578, 14.965591430664062, 18.41889762878418, 21.872201919555664, 25.32550621032715, 28.778812408447266, 32.23211669921875, 35.685420989990234, 39.13872528076172, 42.59203338623047, 46.04533767700195, 49.49864196777344]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 5.0, 2.0, 11.0, 15.0, 17.0, 13.0, 17.0, 18.0, 19.0, 15.0, 20.0, 24.0, 28.0, 33.0, 31.0, 31.0, 39.0, 45.0, 37.0, 54.0, 38.0, 47.0, 51.0, 36.0, 38.0, 37.0, 24.0, 30.0, 31.0, 19.0, 20.0, 22.0, 13.0, 23.0, 14.0, 18.0, 17.0, 10.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.41998291015625, -37.218482971191406, -36.01698303222656, -34.81548309326172, -33.613983154296875, -32.412479400634766, -31.210979461669922, -30.009479522705078, -28.807979583740234, -27.60647964477539, -26.404979705810547, -25.20347785949707, -24.001977920532227, -22.800477981567383, -21.598976135253906, -20.397476196289062, -19.19597625732422, -17.994476318359375, -16.79297637939453, -15.591474533081055, -14.389974594116211, -13.188474655151367, -11.986973762512207, -10.785472869873047, -9.583972930908203, -8.38247299194336, -7.180972099304199, -5.979471683502197, -4.777971267700195, -3.5764708518981934, -2.3749704360961914, -1.1734695434570312, 0.0280303955078125, 1.2295308113098145, 2.4310312271118164, 3.6325316429138184, 4.83403205871582, 6.035532474517822, 7.237032890319824, 8.438533782958984, 9.640033721923828, 10.841533660888672, 12.043034553527832, 13.244535446166992, 14.446035385131836, 15.64753532409668, 16.849037170410156, 18.050537109375, 19.252037048339844, 20.453536987304688, 21.65503692626953, 22.856538772583008, 24.05803871154785, 25.259538650512695, 26.461040496826172, 27.662540435791016, 28.86404037475586, 30.065540313720703, 31.267040252685547, 32.46854019165039, 33.6700439453125, 34.871543884277344, 36.07304382324219, 37.27454376220703, 38.476043701171875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 48.0, 41.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 16.0, 26.0, 26.0, 52.0, 67.0, 100.0, 174.0, 260.0, 418.0, 710.0, 1189.0, 1977.0, 3160.0, 5145.0, 8273.0, 12600.0, 20089.0, 31966.0, 52147.0, 85864.0, 137606.0, 187584.0, 177016.0, 122884.0, 76292.0, 45968.0, 28269.0, 17873.0, 11415.0, 7367.0, 4664.0, 2928.0, 1660.0, 1098.0, 649.0, 414.0, 232.0, 141.0, 76.0, 53.0, 35.0, 30.0, 16.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7509765625, -0.7281341552734375, -0.705291748046875, -0.6824493408203125, -0.65960693359375, -0.6367645263671875, -0.613922119140625, -0.5910797119140625, -0.5682373046875, -0.5453948974609375, -0.522552490234375, -0.4997100830078125, -0.47686767578125, -0.4540252685546875, -0.431182861328125, -0.4083404541015625, -0.385498046875, -0.3626556396484375, -0.339813232421875, -0.3169708251953125, -0.29412841796875, -0.2712860107421875, -0.248443603515625, -0.2256011962890625, -0.2027587890625, -0.1799163818359375, -0.157073974609375, -0.1342315673828125, -0.11138916015625, -0.0885467529296875, -0.065704345703125, -0.0428619384765625, -0.02001953125, 0.0028228759765625, 0.025665283203125, 0.0485076904296875, 0.07135009765625, 0.0941925048828125, 0.117034912109375, 0.1398773193359375, 0.1627197265625, 0.1855621337890625, 0.208404541015625, 0.2312469482421875, 0.25408935546875, 0.2769317626953125, 0.299774169921875, 0.3226165771484375, 0.345458984375, 0.3683013916015625, 0.391143798828125, 0.4139862060546875, 0.43682861328125, 0.4596710205078125, 0.482513427734375, 0.5053558349609375, 0.5281982421875, 0.5510406494140625, 0.573883056640625, 0.5967254638671875, 0.61956787109375, 0.6424102783203125, 0.665252685546875, 0.6880950927734375, 0.7109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 12.0, 14.0, 18.0, 17.0, 21.0, 20.0, 23.0, 28.0, 45.0, 35.0, 29.0, 35.0, 34.0, 55.0, 48.0, 1061.0, 39.0, 45.0, 47.0, 38.0, 43.0, 33.0, 31.0, 32.0, 23.0, 21.0, 21.0, 12.0, 17.0, 7.0, 12.0, 12.0, 11.0, 13.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.98590087890625, -3.8507080078125, -3.71551513671875, -3.580322265625, -3.44512939453125, -3.3099365234375, -3.17474365234375, -3.03955078125, -2.90435791015625, -2.7691650390625, -2.63397216796875, -2.498779296875, -2.36358642578125, -2.2283935546875, -2.09320068359375, -1.9580078125, -1.82281494140625, -1.6876220703125, -1.55242919921875, -1.417236328125, -1.28204345703125, -1.1468505859375, -1.01165771484375, -0.87646484375, -0.74127197265625, -0.6060791015625, -0.47088623046875, -0.335693359375, -0.20050048828125, -0.0653076171875, 0.06988525390625, 0.205078125, 0.34027099609375, 0.4754638671875, 0.61065673828125, 0.745849609375, 0.88104248046875, 1.0162353515625, 1.15142822265625, 1.28662109375, 1.42181396484375, 1.5570068359375, 1.69219970703125, 1.827392578125, 1.96258544921875, 2.0977783203125, 2.23297119140625, 2.3681640625, 2.50335693359375, 2.6385498046875, 2.77374267578125, 2.908935546875, 3.04412841796875, 3.1793212890625, 3.31451416015625, 3.44970703125, 3.58489990234375, 3.7200927734375, 3.85528564453125, 3.990478515625, 4.12567138671875, 4.2608642578125, 4.39605712890625, 4.53125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 9.0, 18.0, 19.0, 25.0, 66.0, 97.0, 153.0, 249.0, 440.0, 731.0, 1157.0, 1952.0, 3181.0, 5565.0, 9110.0, 15496.0, 25759.0, 43715.0, 71316.0, 112372.0, 159275.0, 1227935.0, 151684.0, 104017.0, 65222.0, 39335.0, 23240.0, 14023.0, 8394.0, 5032.0, 3048.0, 1811.0, 1042.0, 643.0, 376.0, 218.0, 165.0, 83.0, 49.0, 46.0, 23.0, 21.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5597152709960938, -0.5413055419921875, -0.5228958129882812, -0.504486083984375, -0.48607635498046875, -0.4676666259765625, -0.44925689697265625, -0.43084716796875, -0.41243743896484375, -0.3940277099609375, -0.37561798095703125, -0.357208251953125, -0.33879852294921875, -0.3203887939453125, -0.30197906494140625, -0.2835693359375, -0.26515960693359375, -0.2467498779296875, -0.22834014892578125, -0.209930419921875, -0.19152069091796875, -0.1731109619140625, -0.15470123291015625, -0.13629150390625, -0.11788177490234375, -0.0994720458984375, -0.08106231689453125, -0.062652587890625, -0.04424285888671875, -0.0258331298828125, -0.00742340087890625, 0.010986328125, 0.02939605712890625, 0.0478057861328125, 0.06621551513671875, 0.084625244140625, 0.10303497314453125, 0.1214447021484375, 0.13985443115234375, 0.15826416015625, 0.17667388916015625, 0.1950836181640625, 0.21349334716796875, 0.231903076171875, 0.25031280517578125, 0.2687225341796875, 0.28713226318359375, 0.3055419921875, 0.32395172119140625, 0.3423614501953125, 0.36077117919921875, 0.379180908203125, 0.39759063720703125, 0.4160003662109375, 0.43441009521484375, 0.45281982421875, 0.47122955322265625, 0.4896392822265625, 0.5080490112304688, 0.526458740234375, 0.5448684692382812, 0.5632781982421875, 0.5816879272460938, 0.60009765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 8.0, 5.0, 11.0, 10.0, 20.0, 21.0, 22.0, 32.0, 29.0, 38.0, 39.0, 43.0, 45.0, 43.0, 62.0, 68.0, 74.0, 69.0, 50.0, 35.0, 36.0, 39.0, 34.0, 28.0, 27.0, 21.0, 18.0, 15.0, 5.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.003307342529296875, -0.0032024383544921875, -0.0030975341796875, -0.0029926300048828125, -0.002887725830078125, -0.0027828216552734375, -0.00267791748046875, -0.0025730133056640625, -0.002468109130859375, -0.0023632049560546875, -0.00225830078125, -0.0021533966064453125, -0.002048492431640625, -0.0019435882568359375, -0.00183868408203125, -0.0017337799072265625, -0.001628875732421875, -0.0015239715576171875, -0.0014190673828125, -0.0013141632080078125, -0.001209259033203125, -0.0011043548583984375, -0.00099945068359375, -0.0008945465087890625, -0.000789642333984375, -0.0006847381591796875, -0.000579833984375, -0.0004749298095703125, -0.000370025634765625, -0.0002651214599609375, -0.00016021728515625, -5.53131103515625e-05, 4.9591064453125e-05, 0.0001544952392578125, 0.0002593994140625, 0.0003643035888671875, 0.000469207763671875, 0.0005741119384765625, 0.00067901611328125, 0.0007839202880859375, 0.000888824462890625, 0.0009937286376953125, 0.0010986328125, 0.0012035369873046875, 0.001308441162109375, 0.0014133453369140625, 0.00151824951171875, 0.0016231536865234375, 0.001728057861328125, 0.0018329620361328125, 0.0019378662109375, 0.0020427703857421875, 0.002147674560546875, 0.0022525787353515625, 0.00235748291015625, 0.0024623870849609375, 0.002567291259765625, 0.0026721954345703125, 0.002777099609375, 0.0028820037841796875, 0.002986907958984375, 0.0030918121337890625, 0.00319671630859375, 0.0033016204833984375, 0.003406524658203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 8.0, 8.0, 12.0, 14.0, 27.0, 29.0, 28.0, 44.0, 56.0, 83.0, 100.0, 139.0, 265.0, 619.0, 9037.0, 936400.0, 99086.0, 1547.0, 355.0, 190.0, 128.0, 71.0, 72.0, 48.0, 37.0, 33.0, 22.0, 19.0, 14.0, 9.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07609367370605469, -0.07369613647460938, -0.07129859924316406, -0.06890106201171875, -0.06650352478027344, -0.06410598754882812, -0.06170845031738281, -0.0593109130859375, -0.05691337585449219, -0.054515838623046875, -0.05211830139160156, -0.04972076416015625, -0.04732322692871094, -0.044925689697265625, -0.04252815246582031, -0.040130615234375, -0.03773307800292969, -0.035335540771484375, -0.03293800354003906, -0.03054046630859375, -0.028142929077148438, -0.025745391845703125, -0.023347854614257812, -0.0209503173828125, -0.018552780151367188, -0.016155242919921875, -0.013757705688476562, -0.01136016845703125, -0.008962631225585938, -0.006565093994140625, -0.0041675567626953125, -0.00177001953125, 0.0006275177001953125, 0.003025054931640625, 0.0054225921630859375, 0.00782012939453125, 0.010217666625976562, 0.012615203857421875, 0.015012741088867188, 0.0174102783203125, 0.019807815551757812, 0.022205352783203125, 0.024602890014648438, 0.02700042724609375, 0.029397964477539062, 0.031795501708984375, 0.03419303894042969, 0.036590576171875, 0.03898811340332031, 0.041385650634765625, 0.04378318786621094, 0.04618072509765625, 0.04857826232910156, 0.050975799560546875, 0.05337333679199219, 0.0557708740234375, 0.05816841125488281, 0.060565948486328125, 0.06296348571777344, 0.06536102294921875, 0.06775856018066406, 0.07015609741210938, 0.07255363464355469, 0.074951171875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 20.0, 140.0, 533.0, 246.0, 58.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028252651914954185, -0.027736257761716843, -0.0272198636084795, -0.026703469455242157, -0.026187075302004814, -0.02567068114876747, -0.02515428699553013, -0.024637892842292786, -0.024121496826410294, -0.02360510267317295, -0.023088708519935608, -0.022572314366698265, -0.022055920213460922, -0.02153952606022358, -0.021023131906986237, -0.020506735891103745, -0.01999034360051155, -0.019473949447274208, -0.018957555294036865, -0.018441161140799522, -0.01792476698756218, -0.017408372834324837, -0.016891978681087494, -0.016375582665205002, -0.015859190374612808, -0.015342796221375465, -0.014826402068138123, -0.01431000791490078, -0.013793613761663437, -0.013277219608426094, -0.012760824523866177, -0.012244430370628834, -0.011728035286068916, -0.011211641132831573, -0.01069524697959423, -0.010178852826356888, -0.009662458673119545, -0.009146064519882202, -0.008629669435322285, -0.008113275282084942, -0.007596881128847599, -0.007080486975610256, -0.006564092822372913, -0.006047698203474283, -0.00553130405023694, -0.0050149098969995975, -0.004498515278100967, -0.003982121124863625, -0.0034657269716262817, -0.002949332818388939, -0.0024329384323209524, -0.0019165441626682878, -0.001400149893015623, -0.0008837557397782803, -0.00036736135371029377, 0.00014903303235769272, 0.0006654271855950356, 0.0011818214552477002, 0.0016982157249003649, 0.0022146101109683514, 0.002731004264205694, 0.003247398417443037, 0.0037637928035110235, 0.00428018718957901, 0.004796581342816353]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 11.0, 14.0, 15.0, 27.0, 20.0, 35.0, 23.0, 26.0, 35.0, 37.0, 31.0, 44.0, 50.0, 36.0, 40.0, 49.0, 46.0, 51.0, 52.0, 38.0, 45.0, 30.0, 22.0, 34.0, 41.0, 17.0, 22.0, 20.0, 21.0, 11.0, 11.0, 9.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024050474166870117, -0.002334785647690296, -0.0022645238786935806, -0.002194262109696865, -0.0021240003407001495, -0.002053738571703434, -0.0019834768027067184, -0.001913215033710003, -0.0018429532647132874, -0.0017726914957165718, -0.0017024297267198563, -0.0016321679577231407, -0.0015619061887264252, -0.0014916444197297096, -0.001421382650732994, -0.0013511208817362785, -0.001280859112739563, -0.0012105973437428474, -0.001140335574746132, -0.0010700738057494164, -0.0009998120367527008, -0.0009295502677559853, -0.0008592884987592697, -0.0007890267297625542, -0.0007187649607658386, -0.0006485031917691231, -0.0005782414227724075, -0.000507979653775692, -0.00043771788477897644, -0.0003674561157822609, -0.00029719434678554535, -0.0002269325777888298, -0.00015667080879211426, -8.640903979539871e-05, -1.6147270798683167e-05, 5.411449819803238e-05, 0.00012437626719474792, 0.00019463803619146347, 0.000264899805188179, 0.00033516157418489456, 0.0004054233431816101, 0.00047568511217832565, 0.0005459468811750412, 0.0006162086501717567, 0.0006864704191684723, 0.0007567321881651878, 0.0008269939571619034, 0.0008972557261586189, 0.0009675174951553345, 0.00103777926415205, 0.0011080410331487656, 0.0011783028021454811, 0.0012485645711421967, 0.0013188263401389122, 0.0013890881091356277, 0.0014593498781323433, 0.0015296116471290588, 0.0015998734161257744, 0.00167013518512249, 0.0017403969541192055, 0.001810658723115921, 0.0018809204921126366, 0.0019511822611093521, 0.0020214440301060677, 0.002091705799102783]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 47.0, 42.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 11.0, 11.0, 10.0, 15.0, 15.0, 11.0, 37.0, 30.0, 41.0, 60.0, 75.0, 114.0, 130.0, 232.0, 344.0, 633.0, 1336.0, 3459.0, 13149.0, 74670.0, 747616.0, 174254.0, 22854.0, 5562.0, 1778.0, 786.0, 421.0, 260.0, 168.0, 114.0, 69.0, 61.0, 51.0, 40.0, 27.0, 24.0, 12.0, 14.0, 18.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -10.999267578125, -10.61572265625, -10.232177734375, -9.8486328125, -9.465087890625, -9.08154296875, -8.697998046875, -8.314453125, -7.930908203125, -7.54736328125, -7.163818359375, -6.7802734375, -6.396728515625, -6.01318359375, -5.629638671875, -5.24609375, -4.862548828125, -4.47900390625, -4.095458984375, -3.7119140625, -3.328369140625, -2.94482421875, -2.561279296875, -2.177734375, -1.794189453125, -1.41064453125, -1.027099609375, -0.6435546875, -0.260009765625, 0.12353515625, 0.507080078125, 0.890625, 1.274169921875, 1.65771484375, 2.041259765625, 2.4248046875, 2.808349609375, 3.19189453125, 3.575439453125, 3.958984375, 4.342529296875, 4.72607421875, 5.109619140625, 5.4931640625, 5.876708984375, 6.26025390625, 6.643798828125, 7.02734375, 7.410888671875, 7.79443359375, 8.177978515625, 8.5615234375, 8.945068359375, 9.32861328125, 9.712158203125, 10.095703125, 10.479248046875, 10.86279296875, 11.246337890625, 11.6298828125, 12.013427734375, 12.39697265625, 12.780517578125, 13.1640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 8.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 20.0, 20.0, 25.0, 33.0, 33.0, 24.0, 22.0, 35.0, 41.0, 44.0, 63.0, 155.0, 1776.0, 204.0, 59.0, 45.0, 52.0, 49.0, 47.0, 35.0, 38.0, 29.0, 29.0, 12.0, 26.0, 19.0, 11.0, 10.0, 11.0, 8.0, 3.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.457275390625, -17.78955078125, -17.121826171875, -16.4541015625, -15.786376953125, -15.11865234375, -14.450927734375, -13.783203125, -13.115478515625, -12.44775390625, -11.780029296875, -11.1123046875, -10.444580078125, -9.77685546875, -9.109130859375, -8.44140625, -7.773681640625, -7.10595703125, -6.438232421875, -5.7705078125, -5.102783203125, -4.43505859375, -3.767333984375, -3.099609375, -2.431884765625, -1.76416015625, -1.096435546875, -0.4287109375, 0.239013671875, 0.90673828125, 1.574462890625, 2.2421875, 2.909912109375, 3.57763671875, 4.245361328125, 4.9130859375, 5.580810546875, 6.24853515625, 6.916259765625, 7.583984375, 8.251708984375, 8.91943359375, 9.587158203125, 10.2548828125, 10.922607421875, 11.59033203125, 12.258056640625, 12.92578125, 13.593505859375, 14.26123046875, 14.928955078125, 15.5966796875, 16.264404296875, 16.93212890625, 17.599853515625, 18.267578125, 18.935302734375, 19.60302734375, 20.270751953125, 20.9384765625, 21.606201171875, 22.27392578125, 22.941650390625, 23.609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 12.0, 11.0, 27.0, 24.0, 30.0, 44.0, 48.0, 67.0, 65.0, 115.0, 177.0, 313.0, 801.0, 14052.0, 3121063.0, 7328.0, 636.0, 304.0, 141.0, 87.0, 59.0, 47.0, 43.0, 33.0, 31.0, 24.0, 18.0, 7.0, 15.0, 10.0, 7.0, 6.0, 7.0, 7.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-71.125, -69.0595703125, -66.994140625, -64.9287109375, -62.86328125, -60.7978515625, -58.732421875, -56.6669921875, -54.6015625, -52.5361328125, -50.470703125, -48.4052734375, -46.33984375, -44.2744140625, -42.208984375, -40.1435546875, -38.078125, -36.0126953125, -33.947265625, -31.8818359375, -29.81640625, -27.7509765625, -25.685546875, -23.6201171875, -21.5546875, -19.4892578125, -17.423828125, -15.3583984375, -13.29296875, -11.2275390625, -9.162109375, -7.0966796875, -5.03125, -2.9658203125, -0.900390625, 1.1650390625, 3.23046875, 5.2958984375, 7.361328125, 9.4267578125, 11.4921875, 13.5576171875, 15.623046875, 17.6884765625, 19.75390625, 21.8193359375, 23.884765625, 25.9501953125, 28.015625, 30.0810546875, 32.146484375, 34.2119140625, 36.27734375, 38.3427734375, 40.408203125, 42.4736328125, 44.5390625, 46.6044921875, 48.669921875, 50.7353515625, 52.80078125, 54.8662109375, 56.931640625, 58.9970703125, 61.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 110.0, 746.0, 157.0, 5.0], "bins": [-245.0657196044922, -241.08157348632812, -237.09744262695312, -233.11329650878906, -229.129150390625, -225.14500427246094, -221.16085815429688, -217.17672729492188, -213.1925811767578, -209.20843505859375, -205.22430419921875, -201.2401580810547, -197.25601196289062, -193.27186584472656, -189.2877197265625, -185.3035888671875, -181.31944274902344, -177.33529663085938, -173.35116577148438, -169.3670196533203, -165.38287353515625, -161.3987274169922, -157.41458129882812, -153.43045043945312, -149.44630432128906, -145.462158203125, -141.47802734375, -137.49388122558594, -133.50973510742188, -129.5255889892578, -125.54145050048828, -121.55731201171875, -117.57316589355469, -113.58901977539062, -109.6048812866211, -105.62074279785156, -101.6365966796875, -97.65245056152344, -93.6683120727539, -89.68417358398438, -85.70002746582031, -81.71588134765625, -77.73174285888672, -73.74760437011719, -69.76345825195312, -65.77931213378906, -61.79517364501953, -57.811031341552734, -53.82688522338867, -49.842742919921875, -45.85860061645508, -41.87445831298828, -37.890316009521484, -33.90617370605469, -29.92203140258789, -25.937889099121094, -21.953746795654297, -17.9696044921875, -13.985462188720703, -10.001319885253906, -6.017177581787109, -2.0330352783203125, 1.9511070251464844, 5.935249328613281, 9.919390678405762]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 8.0, 11.0, 7.0, 6.0, 12.0, 17.0, 16.0, 16.0, 19.0, 17.0, 30.0, 28.0, 18.0, 40.0, 34.0, 32.0, 33.0, 36.0, 35.0, 39.0, 41.0, 40.0, 33.0, 45.0, 40.0, 31.0, 38.0, 27.0, 21.0, 32.0, 27.0, 17.0, 20.0, 19.0, 16.0, 19.0, 10.0, 12.0, 11.0, 8.0, 7.0, 3.0, 7.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-62.56318664550781, -60.72850036621094, -58.89381408691406, -57.05912780761719, -55.22444152832031, -53.38975524902344, -51.55506896972656, -49.72038269042969, -47.88569641113281, -46.05101013183594, -44.21632385253906, -42.38163757324219, -40.54695129394531, -38.71226501464844, -36.87757873535156, -35.04289245605469, -33.20820236206055, -31.373516082763672, -29.538829803466797, -27.704143524169922, -25.869457244873047, -24.034770965576172, -22.200082778930664, -20.36539649963379, -18.530710220336914, -16.69602394104004, -14.861337661743164, -13.026650428771973, -11.191964149475098, -9.357277870178223, -7.522590637207031, -5.687904357910156, -3.8532180786132812, -2.018531560897827, -0.18384504318237305, 1.6508417129516602, 3.485527992248535, 5.32021427154541, 7.154901504516602, 8.989587783813477, 10.824274063110352, 12.658960342407227, 14.493646621704102, 16.32833480834961, 18.163021087646484, 19.99770736694336, 21.832393646240234, 23.66707992553711, 25.501766204833984, 27.33645248413086, 29.171138763427734, 31.00582504272461, 32.840511322021484, 34.67519760131836, 36.5098876953125, 38.344573974609375, 40.17926025390625, 42.013946533203125, 43.8486328125, 45.683319091796875, 47.51800537109375, 49.352691650390625, 51.1873779296875, 53.022064208984375, 54.85675048828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 2.0, 11.0, 6.0, 10.0, 13.0, 7.0, 22.0, 22.0, 21.0, 26.0, 24.0, 32.0, 36.0, 30.0, 48.0, 42.0, 48.0, 41.0, 50.0, 36.0, 44.0, 37.0, 48.0, 42.0, 36.0, 38.0, 30.0, 23.0, 24.0, 21.0, 19.0, 16.0, 20.0, 5.0, 6.0, 14.0, 10.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.98614501953125, -6.7535400390625, -6.52093505859375, -6.288330078125, -6.05572509765625, -5.8231201171875, -5.59051513671875, -5.35791015625, -5.12530517578125, -4.8927001953125, -4.66009521484375, -4.427490234375, -4.19488525390625, -3.9622802734375, -3.72967529296875, -3.4970703125, -3.26446533203125, -3.0318603515625, -2.79925537109375, -2.566650390625, -2.33404541015625, -2.1014404296875, -1.86883544921875, -1.63623046875, -1.40362548828125, -1.1710205078125, -0.93841552734375, -0.705810546875, -0.47320556640625, -0.2406005859375, -0.00799560546875, 0.224609375, 0.45721435546875, 0.6898193359375, 0.92242431640625, 1.155029296875, 1.38763427734375, 1.6202392578125, 1.85284423828125, 2.08544921875, 2.31805419921875, 2.5506591796875, 2.78326416015625, 3.015869140625, 3.24847412109375, 3.4810791015625, 3.71368408203125, 3.9462890625, 4.17889404296875, 4.4114990234375, 4.64410400390625, 4.876708984375, 5.10931396484375, 5.3419189453125, 5.57452392578125, 5.80712890625, 6.03973388671875, 6.2723388671875, 6.50494384765625, 6.737548828125, 6.97015380859375, 7.2027587890625, 7.43536376953125, 7.66796875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 4.0, 11.0, 10.0, 17.0, 23.0, 38.0, 34.0, 56.0, 79.0, 136.0, 203.0, 287.0, 466.0, 763.0, 1361.0, 2472.0, 4900.0, 10476.0, 26248.0, 86239.0, 331269.0, 1018546.0, 1557390.0, 808837.0, 239734.0, 64975.0, 21212.0, 8755.0, 4182.0, 2266.0, 1186.0, 713.0, 471.0, 277.0, 172.0, 119.0, 103.0, 65.0, 45.0, 36.0, 26.0, 19.0, 13.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.328125, -8.062744140625, -7.79736328125, -7.531982421875, -7.2666015625, -7.001220703125, -6.73583984375, -6.470458984375, -6.205078125, -5.939697265625, -5.67431640625, -5.408935546875, -5.1435546875, -4.878173828125, -4.61279296875, -4.347412109375, -4.08203125, -3.816650390625, -3.55126953125, -3.285888671875, -3.0205078125, -2.755126953125, -2.48974609375, -2.224365234375, -1.958984375, -1.693603515625, -1.42822265625, -1.162841796875, -0.8974609375, -0.632080078125, -0.36669921875, -0.101318359375, 0.1640625, 0.429443359375, 0.69482421875, 0.960205078125, 1.2255859375, 1.490966796875, 1.75634765625, 2.021728515625, 2.287109375, 2.552490234375, 2.81787109375, 3.083251953125, 3.3486328125, 3.614013671875, 3.87939453125, 4.144775390625, 4.41015625, 4.675537109375, 4.94091796875, 5.206298828125, 5.4716796875, 5.737060546875, 6.00244140625, 6.267822265625, 6.533203125, 6.798583984375, 7.06396484375, 7.329345703125, 7.5947265625, 7.860107421875, 8.12548828125, 8.390869140625, 8.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 12.0, 5.0, 22.0, 36.0, 50.0, 100.0, 113.0, 179.0, 268.0, 408.0, 621.0, 687.0, 532.0, 366.0, 258.0, 144.0, 97.0, 60.0, 52.0, 23.0, 19.0, 8.0, 6.0, 8.0, 7.0, 1.0, 1.0], "bins": [-29.265625, -28.6602783203125, -28.054931640625, -27.4495849609375, -26.84423828125, -26.2388916015625, -25.633544921875, -25.0281982421875, -24.4228515625, -23.8175048828125, -23.212158203125, -22.6068115234375, -22.00146484375, -21.3961181640625, -20.790771484375, -20.1854248046875, -19.580078125, -18.9747314453125, -18.369384765625, -17.7640380859375, -17.15869140625, -16.5533447265625, -15.947998046875, -15.3426513671875, -14.7373046875, -14.1319580078125, -13.526611328125, -12.9212646484375, -12.31591796875, -11.7105712890625, -11.105224609375, -10.4998779296875, -9.89453125, -9.2891845703125, -8.683837890625, -8.0784912109375, -7.47314453125, -6.8677978515625, -6.262451171875, -5.6571044921875, -5.0517578125, -4.4464111328125, -3.841064453125, -3.2357177734375, -2.63037109375, -2.0250244140625, -1.419677734375, -0.8143310546875, -0.208984375, 0.3963623046875, 1.001708984375, 1.6070556640625, 2.21240234375, 2.8177490234375, 3.423095703125, 4.0284423828125, 4.6337890625, 5.2391357421875, 5.844482421875, 6.4498291015625, 7.05517578125, 7.6605224609375, 8.265869140625, 8.8712158203125, 9.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 15.0, 17.0, 32.0, 65.0, 103.0, 158.0, 282.0, 440.0, 1007.0, 7899.0, 4055565.0, 125536.0, 1680.0, 608.0, 357.0, 223.0, 125.0, 72.0, 44.0, 29.0, 16.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.9375, -60.2841796875, -57.630859375, -54.9775390625, -52.32421875, -49.6708984375, -47.017578125, -44.3642578125, -41.7109375, -39.0576171875, -36.404296875, -33.7509765625, -31.09765625, -28.4443359375, -25.791015625, -23.1376953125, -20.484375, -17.8310546875, -15.177734375, -12.5244140625, -9.87109375, -7.2177734375, -4.564453125, -1.9111328125, 0.7421875, 3.3955078125, 6.048828125, 8.7021484375, 11.35546875, 14.0087890625, 16.662109375, 19.3154296875, 21.96875, 24.6220703125, 27.275390625, 29.9287109375, 32.58203125, 35.2353515625, 37.888671875, 40.5419921875, 43.1953125, 45.8486328125, 48.501953125, 51.1552734375, 53.80859375, 56.4619140625, 59.115234375, 61.7685546875, 64.421875, 67.0751953125, 69.728515625, 72.3818359375, 75.03515625, 77.6884765625, 80.341796875, 82.9951171875, 85.6484375, 88.3017578125, 90.955078125, 93.6083984375, 96.26171875, 98.9150390625, 101.568359375, 104.2216796875, 106.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 342.0, 676.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1392.4459228515625, -1367.169921875, -1341.89404296875, -1316.6180419921875, -1291.3421630859375, -1266.066162109375, -1240.790283203125, -1215.5142822265625, -1190.2384033203125, -1164.96240234375, -1139.6865234375, -1114.4105224609375, -1089.1346435546875, -1063.858642578125, -1038.582763671875, -1013.3067626953125, -988.0308227539062, -962.7548828125, -937.4789428710938, -912.2030029296875, -886.9270629882812, -861.651123046875, -836.3751220703125, -811.0992431640625, -785.8232421875, -760.5473022460938, -735.2713623046875, -709.9954223632812, -684.719482421875, -659.4435424804688, -634.1676025390625, -608.8916015625, -583.61572265625, -558.3397827148438, -533.0638427734375, -507.78790283203125, -482.511962890625, -457.23602294921875, -431.9600524902344, -406.6841125488281, -381.408203125, -356.13226318359375, -330.8563232421875, -305.58038330078125, -280.304443359375, -255.0284881591797, -229.75253295898438, -204.47659301757812, -179.2006378173828, -153.92469787597656, -128.64874267578125, -103.372802734375, -78.09686279296875, -52.8209228515625, -27.544967651367188, -2.2690277099609375, 23.006912231445312, 48.28285598754883, 73.55879974365234, 98.83474731445312, 124.11068725585938, 149.38662719726562, 174.66258239746094, 199.9385223388672, 225.21446228027344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 9.0, 15.0, 18.0, 12.0, 26.0, 31.0, 27.0, 43.0, 48.0, 51.0, 50.0, 58.0, 58.0, 62.0, 62.0, 47.0, 55.0, 50.0, 56.0, 45.0, 33.0, 40.0, 26.0, 20.0, 23.0, 14.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.742645263671875, -43.7707633972168, -41.79888153076172, -39.82699966430664, -37.85511779785156, -35.88323974609375, -33.91135787963867, -31.939476013183594, -29.967594146728516, -27.995712280273438, -26.02383041381836, -24.051950454711914, -22.080068588256836, -20.108186721801758, -18.136306762695312, -16.164424896240234, -14.192543029785156, -12.220661163330078, -10.248780250549316, -8.276899337768555, -6.305017471313477, -4.333135604858398, -2.3612546920776367, -0.389373779296875, 1.5825080871582031, 3.554389476776123, 5.526270866394043, 7.498152256011963, 9.470033645629883, 11.441915512084961, 13.413796424865723, 15.385677337646484, 17.357559204101562, 19.32944107055664, 21.30132293701172, 23.273202896118164, 25.245084762573242, 27.21696662902832, 29.188846588134766, 31.160728454589844, 33.13261032104492, 35.1044921875, 37.07637405395508, 39.048255920410156, 41.02013397216797, 42.99201965332031, 44.963897705078125, 46.9357795715332, 48.90766143798828, 50.87954330444336, 52.85142517089844, 54.823307037353516, 56.795188903808594, 58.767066955566406, 60.738948822021484, 62.71083068847656, 64.68270874023438, 66.65458679199219, 68.62647247314453, 70.59835052490234, 72.57023620605469, 74.5421142578125, 76.51399993896484, 78.48587799072266, 80.457763671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 40.0, 46.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 21.0, 39.0, 51.0, 69.0, 94.0, 170.0, 248.0, 358.0, 501.0, 679.0, 1040.0, 1590.0, 2242.0, 3376.0, 4780.0, 7045.0, 10458.0, 15408.0, 22632.0, 34583.0, 51116.0, 77387.0, 110941.0, 147149.0, 157669.0, 126405.0, 89143.0, 60510.0, 39794.0, 26825.0, 18041.0, 12245.0, 8298.0, 5520.0, 3900.0, 2583.0, 1810.0, 1204.0, 821.0, 591.0, 381.0, 282.0, 180.0, 128.0, 81.0, 52.0, 41.0, 22.0, 18.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.6103515625, -0.5919647216796875, -0.573577880859375, -0.5551910400390625, -0.53680419921875, -0.5184173583984375, -0.500030517578125, -0.4816436767578125, -0.4632568359375, -0.4448699951171875, -0.426483154296875, -0.4080963134765625, -0.38970947265625, -0.3713226318359375, -0.352935791015625, -0.3345489501953125, -0.316162109375, -0.2977752685546875, -0.279388427734375, -0.2610015869140625, -0.24261474609375, -0.2242279052734375, -0.205841064453125, -0.1874542236328125, -0.1690673828125, -0.1506805419921875, -0.132293701171875, -0.1139068603515625, -0.09552001953125, -0.0771331787109375, -0.058746337890625, -0.0403594970703125, -0.02197265625, -0.0035858154296875, 0.014801025390625, 0.0331878662109375, 0.05157470703125, 0.0699615478515625, 0.088348388671875, 0.1067352294921875, 0.1251220703125, 0.1435089111328125, 0.161895751953125, 0.1802825927734375, 0.19866943359375, 0.2170562744140625, 0.235443115234375, 0.2538299560546875, 0.272216796875, 0.2906036376953125, 0.308990478515625, 0.3273773193359375, 0.34576416015625, 0.3641510009765625, 0.382537841796875, 0.4009246826171875, 0.4193115234375, 0.4376983642578125, 0.456085205078125, 0.4744720458984375, 0.49285888671875, 0.5112457275390625, 0.529632568359375, 0.5480194091796875, 0.56640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 4.0, 5.0, 15.0, 14.0, 18.0, 23.0, 27.0, 15.0, 24.0, 31.0, 38.0, 32.0, 30.0, 48.0, 36.0, 44.0, 42.0, 1065.0, 38.0, 44.0, 39.0, 32.0, 35.0, 29.0, 37.0, 23.0, 25.0, 21.0, 35.0, 23.0, 21.0, 15.0, 12.0, 12.0, 8.0, 7.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.4183349609375, -4.281982421875, -4.1456298828125, -4.00927734375, -3.8729248046875, -3.736572265625, -3.6002197265625, -3.4638671875, -3.3275146484375, -3.191162109375, -3.0548095703125, -2.91845703125, -2.7821044921875, -2.645751953125, -2.5093994140625, -2.373046875, -2.2366943359375, -2.100341796875, -1.9639892578125, -1.82763671875, -1.6912841796875, -1.554931640625, -1.4185791015625, -1.2822265625, -1.1458740234375, -1.009521484375, -0.8731689453125, -0.73681640625, -0.6004638671875, -0.464111328125, -0.3277587890625, -0.19140625, -0.0550537109375, 0.081298828125, 0.2176513671875, 0.35400390625, 0.4903564453125, 0.626708984375, 0.7630615234375, 0.8994140625, 1.0357666015625, 1.172119140625, 1.3084716796875, 1.44482421875, 1.5811767578125, 1.717529296875, 1.8538818359375, 1.990234375, 2.1265869140625, 2.262939453125, 2.3992919921875, 2.53564453125, 2.6719970703125, 2.808349609375, 2.9447021484375, 3.0810546875, 3.2174072265625, 3.353759765625, 3.4901123046875, 3.62646484375, 3.7628173828125, 3.899169921875, 4.0355224609375, 4.171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 18.0, 24.0, 35.0, 52.0, 72.0, 128.0, 202.0, 290.0, 498.0, 827.0, 1311.0, 1945.0, 3292.0, 5429.0, 8747.0, 13987.0, 22692.0, 36774.0, 58017.0, 89471.0, 127933.0, 1047659.0, 316026.0, 125412.0, 86720.0, 56909.0, 35565.0, 21751.0, 13566.0, 8385.0, 5147.0, 3148.0, 1857.0, 1184.0, 735.0, 478.0, 281.0, 180.0, 131.0, 85.0, 57.0, 32.0, 21.0, 19.0, 16.0, 11.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.58447265625, -0.5677566528320312, -0.5510406494140625, -0.5343246459960938, -0.517608642578125, -0.5008926391601562, -0.4841766357421875, -0.46746063232421875, -0.45074462890625, -0.43402862548828125, -0.4173126220703125, -0.40059661865234375, -0.383880615234375, -0.36716461181640625, -0.3504486083984375, -0.33373260498046875, -0.3170166015625, -0.30030059814453125, -0.2835845947265625, -0.26686859130859375, -0.250152587890625, -0.23343658447265625, -0.2167205810546875, -0.20000457763671875, -0.18328857421875, -0.16657257080078125, -0.1498565673828125, -0.13314056396484375, -0.116424560546875, -0.09970855712890625, -0.0829925537109375, -0.06627655029296875, -0.049560546875, -0.03284454345703125, -0.0161285400390625, 0.00058746337890625, 0.017303466796875, 0.03401947021484375, 0.0507354736328125, 0.06745147705078125, 0.08416748046875, 0.10088348388671875, 0.1175994873046875, 0.13431549072265625, 0.151031494140625, 0.16774749755859375, 0.1844635009765625, 0.20117950439453125, 0.2178955078125, 0.23461151123046875, 0.2513275146484375, 0.26804351806640625, 0.284759521484375, 0.30147552490234375, 0.3181915283203125, 0.33490753173828125, 0.35162353515625, 0.36833953857421875, 0.3850555419921875, 0.40177154541015625, 0.418487548828125, 0.43520355224609375, 0.4519195556640625, 0.46863555908203125, 0.4853515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 16.0, 14.0, 27.0, 25.0, 36.0, 47.0, 54.0, 63.0, 60.0, 65.0, 74.0, 78.0, 80.0, 44.0, 53.0, 41.0, 47.0, 39.0, 22.0, 18.0, 13.0, 24.0, 11.0, 2.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037250518798828125, -0.0035968124866485596, -0.0034685730934143066, -0.0033403337001800537, -0.0032120943069458008, -0.003083854913711548, -0.002955615520477295, -0.002827376127243042, -0.002699136734008789, -0.002570897340774536, -0.002442657947540283, -0.0023144185543060303, -0.0021861791610717773, -0.0020579397678375244, -0.0019297003746032715, -0.0018014609813690186, -0.0016732215881347656, -0.0015449821949005127, -0.0014167428016662598, -0.0012885034084320068, -0.001160264015197754, -0.001032024621963501, -0.000903785228729248, -0.0007755458354949951, -0.0006473064422607422, -0.0005190670490264893, -0.00039082765579223633, -0.0002625882625579834, -0.00013434886932373047, -6.109476089477539e-06, 0.0001221299171447754, 0.0002503693103790283, 0.00037860870361328125, 0.0005068480968475342, 0.0006350874900817871, 0.00076332688331604, 0.000891566276550293, 0.001019805669784546, 0.0011480450630187988, 0.0012762844562530518, 0.0014045238494873047, 0.0015327632427215576, 0.0016610026359558105, 0.0017892420291900635, 0.0019174814224243164, 0.0020457208156585693, 0.0021739602088928223, 0.002302199602127075, 0.002430438995361328, 0.002558678388595581, 0.002686917781829834, 0.002815157175064087, 0.00294339656829834, 0.0030716359615325928, 0.0031998753547668457, 0.0033281147480010986, 0.0034563541412353516, 0.0035845935344696045, 0.0037128329277038574, 0.0038410723209381104, 0.003969311714172363, 0.004097551107406616, 0.004225790500640869, 0.004354029893875122, 0.004482269287109375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 7.0, 18.0, 25.0, 36.0, 25.0, 56.0, 76.0, 115.0, 183.0, 351.0, 3169.0, 955740.0, 87006.0, 978.0, 267.0, 156.0, 108.0, 69.0, 45.0, 31.0, 30.0, 16.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.1115407943725586, -0.10833549499511719, -0.10513019561767578, -0.10192489624023438, -0.09871959686279297, -0.09551429748535156, -0.09230899810791016, -0.08910369873046875, -0.08589839935302734, -0.08269309997558594, -0.07948780059814453, -0.07628250122070312, -0.07307720184326172, -0.06987190246582031, -0.0666666030883789, -0.0634613037109375, -0.060256004333496094, -0.05705070495605469, -0.05384540557861328, -0.050640106201171875, -0.04743480682373047, -0.04422950744628906, -0.041024208068847656, -0.03781890869140625, -0.034613609313964844, -0.03140830993652344, -0.02820301055908203, -0.024997711181640625, -0.02179241180419922, -0.018587112426757812, -0.015381813049316406, -0.012176513671875, -0.008971214294433594, -0.0057659149169921875, -0.0025606155395507812, 0.000644683837890625, 0.0038499832153320312, 0.0070552825927734375, 0.010260581970214844, 0.01346588134765625, 0.016671180725097656, 0.019876480102539062, 0.02308177947998047, 0.026287078857421875, 0.02949237823486328, 0.03269767761230469, 0.035902976989746094, 0.0391082763671875, 0.042313575744628906, 0.04551887512207031, 0.04872417449951172, 0.051929473876953125, 0.05513477325439453, 0.05834007263183594, 0.061545372009277344, 0.06475067138671875, 0.06795597076416016, 0.07116127014160156, 0.07436656951904297, 0.07757186889648438, 0.08077716827392578, 0.08398246765136719, 0.0871877670288086, 0.09039306640625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 180.0, 805.0, 29.0, 4.0], "bins": [-0.06408385932445526, -0.06303854286670685, -0.061993226408958435, -0.06094790995121002, -0.05990259349346161, -0.058857280761003494, -0.05781196430325508, -0.05676664784550667, -0.055721331387758255, -0.05467601493000984, -0.05363069847226143, -0.052585382014513016, -0.0515400692820549, -0.05049475282430649, -0.049449436366558075, -0.04840411990880966, -0.04735880345106125, -0.046313486993312836, -0.04526817053556442, -0.04422285407781601, -0.043177537620067596, -0.04213222488760948, -0.04108690842986107, -0.040041591972112656, -0.03899627551436424, -0.03795095905661583, -0.036905642598867416, -0.035860326141119, -0.03481501340866089, -0.033769696950912476, -0.03272438049316406, -0.03167906403541565, -0.030633747577667236, -0.029588431119918823, -0.02854311466217041, -0.027497800067067146, -0.026452483609318733, -0.02540716715157032, -0.024361852556467056, -0.023316536098718643, -0.02227121964097023, -0.021225903183221817, -0.020180586725473404, -0.01913527213037014, -0.018089955672621727, -0.017044639214873314, -0.01599932461977005, -0.014954008162021637, -0.01390869077295065, -0.01286337524652481, -0.011818058788776398, -0.010772742331027985, -0.009727426804602146, -0.008682111278176308, -0.007636794820427895, -0.006591478828340769, -0.005546162836253643, -0.004500846844166517, -0.0034555308520793915, -0.0024102148599922657, -0.00136489886790514, -0.00031958287581801414, 0.0007257331162691116, 0.0017710491083562374, 0.0028163648676127195]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 14.0, 16.0, 10.0, 20.0, 23.0, 30.0, 30.0, 40.0, 43.0, 39.0, 46.0, 52.0, 52.0, 73.0, 50.0, 55.0, 41.0, 35.0, 49.0, 40.0, 40.0, 31.0, 35.0, 22.0, 18.0, 14.0, 11.0, 13.0, 12.0, 3.0, 4.0, 8.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001860976219177246, -0.0017893752083182335, -0.0017177741974592209, -0.0016461731866002083, -0.0015745721757411957, -0.001502971164882183, -0.0014313701540231705, -0.0013597691431641579, -0.0012881681323051453, -0.0012165671214461327, -0.00114496611058712, -0.0010733650997281075, -0.0010017640888690948, -0.0009301630780100822, -0.0008585620671510696, -0.000786961056292057, -0.0007153600454330444, -0.0006437590345740318, -0.0005721580237150192, -0.0005005570128560066, -0.000428956001996994, -0.0003573549911379814, -0.0002857539802789688, -0.0002141529694199562, -0.0001425519585609436, -7.0950947701931e-05, 6.50063157081604e-07, 7.225107401609421e-05, 0.0001438520848751068, 0.00021545309573411942, 0.000287054106593132, 0.0003586551174521446, 0.0004302561283111572, 0.0005018571391701698, 0.0005734581500291824, 0.000645059160888195, 0.0007166601717472076, 0.0007882611826062202, 0.0008598621934652328, 0.0009314632043242455, 0.001003064215183258, 0.0010746652260422707, 0.0011462662369012833, 0.0012178672477602959, 0.0012894682586193085, 0.001361069269478321, 0.0014326702803373337, 0.0015042712911963463, 0.0015758723020553589, 0.0016474733129143715, 0.001719074323773384, 0.0017906753346323967, 0.0018622763454914093, 0.001933877356350422, 0.0020054783672094345, 0.002077079378068447, 0.0021486803889274597, 0.0022202813997864723, 0.002291882410645485, 0.0023634834215044975, 0.00243508443236351, 0.0025066854432225227, 0.0025782864540815353, 0.002649887464940548, 0.0027214884757995605]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 41.0, 45.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 10.0, 17.0, 23.0, 35.0, 31.0, 61.0, 107.0, 158.0, 281.0, 513.0, 916.0, 1770.0, 3797.0, 7901.0, 17252.0, 39542.0, 98640.0, 309182.0, 369647.0, 115727.0, 45733.0, 19661.0, 8954.0, 4176.0, 2034.0, 986.0, 553.0, 294.0, 182.0, 110.0, 67.0, 44.0, 37.0, 12.0, 15.0, 15.0, 15.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05859375, -5.857177734375, -5.65576171875, -5.454345703125, -5.2529296875, -5.051513671875, -4.85009765625, -4.648681640625, -4.447265625, -4.245849609375, -4.04443359375, -3.843017578125, -3.6416015625, -3.440185546875, -3.23876953125, -3.037353515625, -2.8359375, -2.634521484375, -2.43310546875, -2.231689453125, -2.0302734375, -1.828857421875, -1.62744140625, -1.426025390625, -1.224609375, -1.023193359375, -0.82177734375, -0.620361328125, -0.4189453125, -0.217529296875, -0.01611328125, 0.185302734375, 0.38671875, 0.588134765625, 0.78955078125, 0.990966796875, 1.1923828125, 1.393798828125, 1.59521484375, 1.796630859375, 1.998046875, 2.199462890625, 2.40087890625, 2.602294921875, 2.8037109375, 3.005126953125, 3.20654296875, 3.407958984375, 3.609375, 3.810791015625, 4.01220703125, 4.213623046875, 4.4150390625, 4.616455078125, 4.81787109375, 5.019287109375, 5.220703125, 5.422119140625, 5.62353515625, 5.824951171875, 6.0263671875, 6.227783203125, 6.42919921875, 6.630615234375, 6.83203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 4.0, 13.0, 17.0, 22.0, 18.0, 23.0, 24.0, 30.0, 27.0, 33.0, 39.0, 40.0, 47.0, 50.0, 75.0, 246.0, 1605.0, 190.0, 83.0, 53.0, 43.0, 47.0, 44.0, 39.0, 28.0, 33.0, 26.0, 20.0, 23.0, 18.0, 14.0, 6.0, 16.0, 6.0, 8.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-23.078125, -22.40673828125, -21.7353515625, -21.06396484375, -20.392578125, -19.72119140625, -19.0498046875, -18.37841796875, -17.70703125, -17.03564453125, -16.3642578125, -15.69287109375, -15.021484375, -14.35009765625, -13.6787109375, -13.00732421875, -12.3359375, -11.66455078125, -10.9931640625, -10.32177734375, -9.650390625, -8.97900390625, -8.3076171875, -7.63623046875, -6.96484375, -6.29345703125, -5.6220703125, -4.95068359375, -4.279296875, -3.60791015625, -2.9365234375, -2.26513671875, -1.59375, -0.92236328125, -0.2509765625, 0.42041015625, 1.091796875, 1.76318359375, 2.4345703125, 3.10595703125, 3.77734375, 4.44873046875, 5.1201171875, 5.79150390625, 6.462890625, 7.13427734375, 7.8056640625, 8.47705078125, 9.1484375, 9.81982421875, 10.4912109375, 11.16259765625, 11.833984375, 12.50537109375, 13.1767578125, 13.84814453125, 14.51953125, 15.19091796875, 15.8623046875, 16.53369140625, 17.205078125, 17.87646484375, 18.5478515625, 19.21923828125, 19.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 12.0, 11.0, 9.0, 10.0, 14.0, 15.0, 28.0, 27.0, 28.0, 48.0, 46.0, 88.0, 87.0, 145.0, 170.0, 193.0, 348.0, 631.0, 2735.0, 78505.0, 3007643.0, 50891.0, 2279.0, 578.0, 311.0, 201.0, 149.0, 124.0, 63.0, 62.0, 53.0, 40.0, 31.0, 29.0, 28.0, 12.0, 7.0, 10.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.0, -31.87939453125, -30.7587890625, -29.63818359375, -28.517578125, -27.39697265625, -26.2763671875, -25.15576171875, -24.03515625, -22.91455078125, -21.7939453125, -20.67333984375, -19.552734375, -18.43212890625, -17.3115234375, -16.19091796875, -15.0703125, -13.94970703125, -12.8291015625, -11.70849609375, -10.587890625, -9.46728515625, -8.3466796875, -7.22607421875, -6.10546875, -4.98486328125, -3.8642578125, -2.74365234375, -1.623046875, -0.50244140625, 0.6181640625, 1.73876953125, 2.859375, 3.97998046875, 5.1005859375, 6.22119140625, 7.341796875, 8.46240234375, 9.5830078125, 10.70361328125, 11.82421875, 12.94482421875, 14.0654296875, 15.18603515625, 16.306640625, 17.42724609375, 18.5478515625, 19.66845703125, 20.7890625, 21.90966796875, 23.0302734375, 24.15087890625, 25.271484375, 26.39208984375, 27.5126953125, 28.63330078125, 29.75390625, 30.87451171875, 31.9951171875, 33.11572265625, 34.236328125, 35.35693359375, 36.4775390625, 37.59814453125, 38.71875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 171.0, 722.0, 119.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.3849792480469, -263.5423583984375, -258.6997375488281, -253.8571014404297, -249.01446533203125, -244.17184448242188, -239.32920837402344, -234.48658752441406, -229.64395141601562, -224.80133056640625, -219.9586944580078, -215.11607360839844, -210.2734375, -205.43081665039062, -200.5881805419922, -195.7455596923828, -190.90293884277344, -186.06031799316406, -181.21768188476562, -176.37506103515625, -171.5324249267578, -166.68980407714844, -161.84716796875, -157.00454711914062, -152.16192626953125, -147.31930541992188, -142.47666931152344, -137.63404846191406, -132.79141235351562, -127.94879150390625, -123.10616302490234, -118.26353454589844, -113.42090606689453, -108.57827758789062, -103.73564910888672, -98.89302062988281, -94.05039978027344, -89.207763671875, -84.36514282226562, -79.52251434326172, -74.67988586425781, -69.8372573852539, -64.99462890625, -60.15200424194336, -55.30937576293945, -50.46674728393555, -45.624122619628906, -40.781494140625, -35.938865661621094, -31.096237182617188, -26.253610610961914, -21.41098403930664, -16.568355560302734, -11.725727081298828, -6.883100509643555, -2.0404739379882812, 2.802154541015625, 7.644782066345215, 12.487409591674805, 17.330036163330078, 22.172664642333984, 27.01529312133789, 31.857919692993164, 36.70054626464844, 41.543174743652344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 10.0, 10.0, 11.0, 5.0, 11.0, 12.0, 19.0, 21.0, 16.0, 18.0, 25.0, 29.0, 37.0, 20.0, 35.0, 33.0, 33.0, 34.0, 48.0, 36.0, 41.0, 43.0, 33.0, 36.0, 41.0, 38.0, 30.0, 34.0, 22.0, 21.0, 32.0, 22.0, 13.0, 22.0, 14.0, 14.0, 10.0, 12.0, 11.0, 14.0, 15.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.861915588378906, -49.33371353149414, -47.80550765991211, -46.277305603027344, -44.74910354614258, -43.22089767456055, -41.69269561767578, -40.16448974609375, -38.636287689208984, -37.10808563232422, -35.57987976074219, -34.05167770385742, -32.523475646972656, -30.995269775390625, -29.46706771850586, -27.93886375427246, -26.410661697387695, -24.882457733154297, -23.35425567626953, -21.826051712036133, -20.297847747802734, -18.76964569091797, -17.24144172668457, -15.713237762451172, -14.18503475189209, -12.656831741333008, -11.12862777709961, -9.600424766540527, -8.072221755981445, -6.544017791748047, -5.015814781188965, -3.4876108169555664, -1.9594078063964844, -0.4312044382095337, 1.096998929977417, 2.625202178955078, 4.153405666351318, 5.681609153747559, 7.209812164306641, 8.738016128540039, 10.266219139099121, 11.794422149658203, 13.322626113891602, 14.850829124450684, 16.379032135009766, 17.907236099243164, 19.435440063476562, 20.963642120361328, 22.491846084594727, 24.020050048828125, 25.54825210571289, 27.07645606994629, 28.604660034179688, 30.132862091064453, 31.66106605529785, 33.18927001953125, 34.717472076416016, 36.24567413330078, 37.77388000488281, 39.30208206176758, 40.830284118652344, 42.358489990234375, 43.88669204711914, 45.414894104003906, 46.94309997558594]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 9.0, 3.0, 9.0, 5.0, 9.0, 18.0, 8.0, 17.0, 25.0, 24.0, 22.0, 23.0, 30.0, 30.0, 45.0, 36.0, 35.0, 52.0, 41.0, 47.0, 45.0, 50.0, 34.0, 40.0, 39.0, 31.0, 33.0, 29.0, 25.0, 34.0, 16.0, 17.0, 15.0, 15.0, 11.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.47265625, -6.2568359375, -6.041015625, -5.8251953125, -5.609375, -5.3935546875, -5.177734375, -4.9619140625, -4.74609375, -4.5302734375, -4.314453125, -4.0986328125, -3.8828125, -3.6669921875, -3.451171875, -3.2353515625, -3.01953125, -2.8037109375, -2.587890625, -2.3720703125, -2.15625, -1.9404296875, -1.724609375, -1.5087890625, -1.29296875, -1.0771484375, -0.861328125, -0.6455078125, -0.4296875, -0.2138671875, 0.001953125, 0.2177734375, 0.43359375, 0.6494140625, 0.865234375, 1.0810546875, 1.296875, 1.5126953125, 1.728515625, 1.9443359375, 2.16015625, 2.3759765625, 2.591796875, 2.8076171875, 3.0234375, 3.2392578125, 3.455078125, 3.6708984375, 3.88671875, 4.1025390625, 4.318359375, 4.5341796875, 4.75, 4.9658203125, 5.181640625, 5.3974609375, 5.61328125, 5.8291015625, 6.044921875, 6.2607421875, 6.4765625, 6.6923828125, 6.908203125, 7.1240234375, 7.33984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 7.0, 15.0, 15.0, 21.0, 24.0, 18.0, 35.0, 41.0, 47.0, 79.0, 129.0, 274.0, 619.0, 1559.0, 6461.0, 37763.0, 524763.0, 3077826.0, 499595.0, 35799.0, 6166.0, 1636.0, 615.0, 252.0, 138.0, 91.0, 38.0, 36.0, 44.0, 27.0, 24.0, 18.0, 18.0, 11.0, 8.0, 10.0, 2.0, 7.0, 4.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.133056640625, -16.53173828125, -15.930419921875, -15.3291015625, -14.727783203125, -14.12646484375, -13.525146484375, -12.923828125, -12.322509765625, -11.72119140625, -11.119873046875, -10.5185546875, -9.917236328125, -9.31591796875, -8.714599609375, -8.11328125, -7.511962890625, -6.91064453125, -6.309326171875, -5.7080078125, -5.106689453125, -4.50537109375, -3.904052734375, -3.302734375, -2.701416015625, -2.10009765625, -1.498779296875, -0.8974609375, -0.296142578125, 0.30517578125, 0.906494140625, 1.5078125, 2.109130859375, 2.71044921875, 3.311767578125, 3.9130859375, 4.514404296875, 5.11572265625, 5.717041015625, 6.318359375, 6.919677734375, 7.52099609375, 8.122314453125, 8.7236328125, 9.324951171875, 9.92626953125, 10.527587890625, 11.12890625, 11.730224609375, 12.33154296875, 12.932861328125, 13.5341796875, 14.135498046875, 14.73681640625, 15.338134765625, 15.939453125, 16.540771484375, 17.14208984375, 17.743408203125, 18.3447265625, 18.946044921875, 19.54736328125, 20.148681640625, 20.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 10.0, 13.0, 18.0, 23.0, 24.0, 31.0, 47.0, 67.0, 78.0, 88.0, 122.0, 163.0, 206.0, 272.0, 287.0, 380.0, 397.0, 346.0, 339.0, 269.0, 180.0, 138.0, 114.0, 76.0, 67.0, 69.0, 44.0, 42.0, 29.0, 28.0, 19.0, 15.0, 7.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5361328125, -9.212890625, -8.8896484375, -8.56640625, -8.2431640625, -7.919921875, -7.5966796875, -7.2734375, -6.9501953125, -6.626953125, -6.3037109375, -5.98046875, -5.6572265625, -5.333984375, -5.0107421875, -4.6875, -4.3642578125, -4.041015625, -3.7177734375, -3.39453125, -3.0712890625, -2.748046875, -2.4248046875, -2.1015625, -1.7783203125, -1.455078125, -1.1318359375, -0.80859375, -0.4853515625, -0.162109375, 0.1611328125, 0.484375, 0.8076171875, 1.130859375, 1.4541015625, 1.77734375, 2.1005859375, 2.423828125, 2.7470703125, 3.0703125, 3.3935546875, 3.716796875, 4.0400390625, 4.36328125, 4.6865234375, 5.009765625, 5.3330078125, 5.65625, 5.9794921875, 6.302734375, 6.6259765625, 6.94921875, 7.2724609375, 7.595703125, 7.9189453125, 8.2421875, 8.5654296875, 8.888671875, 9.2119140625, 9.53515625, 9.8583984375, 10.181640625, 10.5048828125, 10.828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 11.0, 15.0, 14.0, 38.0, 44.0, 70.0, 79.0, 105.0, 143.0, 176.0, 265.0, 354.0, 1115.0, 13381.0, 2391994.0, 1772393.0, 11662.0, 983.0, 379.0, 296.0, 178.0, 147.0, 105.0, 75.0, 64.0, 53.0, 34.0, 22.0, 17.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.75, -61.005859375, -59.26171875, -57.517578125, -55.7734375, -54.029296875, -52.28515625, -50.541015625, -48.796875, -47.052734375, -45.30859375, -43.564453125, -41.8203125, -40.076171875, -38.33203125, -36.587890625, -34.84375, -33.099609375, -31.35546875, -29.611328125, -27.8671875, -26.123046875, -24.37890625, -22.634765625, -20.890625, -19.146484375, -17.40234375, -15.658203125, -13.9140625, -12.169921875, -10.42578125, -8.681640625, -6.9375, -5.193359375, -3.44921875, -1.705078125, 0.0390625, 1.783203125, 3.52734375, 5.271484375, 7.015625, 8.759765625, 10.50390625, 12.248046875, 13.9921875, 15.736328125, 17.48046875, 19.224609375, 20.96875, 22.712890625, 24.45703125, 26.201171875, 27.9453125, 29.689453125, 31.43359375, 33.177734375, 34.921875, 36.666015625, 38.41015625, 40.154296875, 41.8984375, 43.642578125, 45.38671875, 47.130859375, 48.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 210.0, 500.0, 243.0, 37.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-323.2208557128906, -316.421630859375, -309.6224060058594, -302.82318115234375, -296.02398681640625, -289.2247619628906, -282.425537109375, -275.6263122558594, -268.82708740234375, -262.0278625488281, -255.22865295410156, -248.42942810058594, -241.6302032470703, -234.83099365234375, -228.03176879882812, -221.2325439453125, -214.433349609375, -207.63412475585938, -200.8349151611328, -194.0356903076172, -187.23646545410156, -180.437255859375, -173.63803100585938, -166.83880615234375, -160.03958129882812, -153.2403564453125, -146.44114685058594, -139.6419219970703, -132.8426971435547, -126.04348754882812, -119.2442626953125, -112.4450454711914, -105.64582061767578, -98.84660339355469, -92.04737854003906, -85.24816131591797, -78.44894409179688, -71.64971923828125, -64.85050201416016, -58.05128479003906, -51.2520637512207, -44.452842712402344, -37.65362548828125, -30.85440444946289, -24.055185317993164, -17.255966186523438, -10.456745147705078, -3.6575279235839844, 3.141693115234375, 9.940912246704102, 16.740131378173828, 23.539352416992188, 30.338571548461914, 37.13779067993164, 43.93701171875, 50.736228942871094, 57.53544998168945, 64.33467102050781, 71.1338882446289, 77.93310546875, 84.73233032226562, 91.53154754638672, 98.33076477050781, 105.12998962402344, 111.92920684814453]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 7.0, 15.0, 14.0, 11.0, 21.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 31.0, 39.0, 26.0, 33.0, 33.0, 32.0, 45.0, 37.0, 54.0, 38.0, 48.0, 35.0, 21.0, 31.0, 37.0, 28.0, 29.0, 20.0, 25.0, 20.0, 17.0, 20.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.93975830078125, -38.61375427246094, -37.287750244140625, -35.96174621582031, -34.6357421875, -33.30973434448242, -31.98373031616211, -30.657726287841797, -29.331722259521484, -28.005718231201172, -26.67971420288086, -25.353708267211914, -24.0277042388916, -22.70170021057129, -21.375694274902344, -20.04969024658203, -18.72368621826172, -17.397682189941406, -16.071678161621094, -14.745672225952148, -13.419668197631836, -12.093664169311523, -10.767659187316895, -9.441654205322266, -8.115650177001953, -6.789645671844482, -5.463641166687012, -4.137636661529541, -2.8116321563720703, -1.4856276512145996, -0.1596231460571289, 1.1663818359375, 2.4923858642578125, 3.818390369415283, 5.144394874572754, 6.470399379730225, 7.796403884887695, 9.122407913208008, 10.448412895202637, 11.774417877197266, 13.100421905517578, 14.42642593383789, 15.75243091583252, 17.07843589782715, 18.40443992614746, 19.730443954467773, 21.05644989013672, 22.38245391845703, 23.708457946777344, 25.034461975097656, 26.36046600341797, 27.686471939086914, 29.012475967407227, 30.33847999572754, 31.664485931396484, 32.9904899597168, 34.31649398803711, 35.64249801635742, 36.968502044677734, 38.29450607299805, 39.620513916015625, 40.94651794433594, 42.27252197265625, 43.59852600097656, 44.924530029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 42.0, 37.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 7.0, 19.0, 20.0, 29.0, 47.0, 75.0, 97.0, 160.0, 221.0, 346.0, 565.0, 846.0, 1405.0, 2005.0, 3142.0, 4988.0, 7669.0, 11979.0, 18687.0, 29086.0, 45537.0, 71464.0, 109937.0, 154187.0, 173919.0, 141053.0, 97030.0, 62404.0, 40440.0, 25604.0, 16204.0, 10365.0, 6839.0, 4295.0, 2744.0, 1812.0, 1166.0, 739.0, 496.0, 315.0, 197.0, 147.0, 89.0, 64.0, 30.0, 28.0, 13.0, 16.0, 5.0, 9.0, 6.0, 8.0], "bins": [-0.76904296875, -0.7478866577148438, -0.7267303466796875, -0.7055740356445312, -0.684417724609375, -0.6632614135742188, -0.6421051025390625, -0.6209487915039062, -0.59979248046875, -0.5786361694335938, -0.5574798583984375, -0.5363235473632812, -0.515167236328125, -0.49401092529296875, -0.4728546142578125, -0.45169830322265625, -0.4305419921875, -0.40938568115234375, -0.3882293701171875, -0.36707305908203125, -0.345916748046875, -0.32476043701171875, -0.3036041259765625, -0.28244781494140625, -0.26129150390625, -0.24013519287109375, -0.2189788818359375, -0.19782257080078125, -0.176666259765625, -0.15550994873046875, -0.1343536376953125, -0.11319732666015625, -0.092041015625, -0.07088470458984375, -0.0497283935546875, -0.02857208251953125, -0.007415771484375, 0.01374053955078125, 0.0348968505859375, 0.05605316162109375, 0.07720947265625, 0.09836578369140625, 0.1195220947265625, 0.14067840576171875, 0.161834716796875, 0.18299102783203125, 0.2041473388671875, 0.22530364990234375, 0.2464599609375, 0.26761627197265625, 0.2887725830078125, 0.30992889404296875, 0.331085205078125, 0.35224151611328125, 0.3733978271484375, 0.39455413818359375, 0.41571044921875, 0.43686676025390625, 0.4580230712890625, 0.47917938232421875, 0.500335693359375, 0.5214920043945312, 0.5426483154296875, 0.5638046264648438, 0.5849609375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 3.0, 10.0, 6.0, 8.0, 11.0, 12.0, 17.0, 17.0, 26.0, 26.0, 20.0, 39.0, 31.0, 37.0, 36.0, 46.0, 37.0, 43.0, 34.0, 41.0, 1064.0, 47.0, 42.0, 39.0, 45.0, 34.0, 30.0, 30.0, 30.0, 21.0, 12.0, 23.0, 15.0, 19.0, 14.0, 16.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.864013671875, -4.71240234375, -4.560791015625, -4.4091796875, -4.257568359375, -4.10595703125, -3.954345703125, -3.802734375, -3.651123046875, -3.49951171875, -3.347900390625, -3.1962890625, -3.044677734375, -2.89306640625, -2.741455078125, -2.58984375, -2.438232421875, -2.28662109375, -2.135009765625, -1.9833984375, -1.831787109375, -1.68017578125, -1.528564453125, -1.376953125, -1.225341796875, -1.07373046875, -0.922119140625, -0.7705078125, -0.618896484375, -0.46728515625, -0.315673828125, -0.1640625, -0.012451171875, 0.13916015625, 0.290771484375, 0.4423828125, 0.593994140625, 0.74560546875, 0.897216796875, 1.048828125, 1.200439453125, 1.35205078125, 1.503662109375, 1.6552734375, 1.806884765625, 1.95849609375, 2.110107421875, 2.26171875, 2.413330078125, 2.56494140625, 2.716552734375, 2.8681640625, 3.019775390625, 3.17138671875, 3.322998046875, 3.474609375, 3.626220703125, 3.77783203125, 3.929443359375, 4.0810546875, 4.232666015625, 4.38427734375, 4.535888671875, 4.6875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 16.0, 36.0, 44.0, 78.0, 128.0, 196.0, 337.0, 638.0, 1046.0, 1929.0, 3436.0, 5730.0, 9936.0, 16706.0, 29097.0, 48792.0, 80270.0, 126686.0, 184959.0, 1219194.0, 140062.0, 92006.0, 56130.0, 33060.0, 19352.0, 11491.0, 6638.0, 3877.0, 2155.0, 1279.0, 766.0, 448.0, 214.0, 164.0, 94.0, 54.0, 31.0, 21.0, 9.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5530929565429688, -0.5334320068359375, -0.5137710571289062, -0.494110107421875, -0.47444915771484375, -0.4547882080078125, -0.43512725830078125, -0.41546630859375, -0.39580535888671875, -0.3761444091796875, -0.35648345947265625, -0.336822509765625, -0.31716156005859375, -0.2975006103515625, -0.27783966064453125, -0.2581787109375, -0.23851776123046875, -0.2188568115234375, -0.19919586181640625, -0.179534912109375, -0.15987396240234375, -0.1402130126953125, -0.12055206298828125, -0.10089111328125, -0.08123016357421875, -0.0615692138671875, -0.04190826416015625, -0.022247314453125, -0.00258636474609375, 0.0170745849609375, 0.03673553466796875, 0.056396484375, 0.07605743408203125, 0.0957183837890625, 0.11537933349609375, 0.135040283203125, 0.15470123291015625, 0.1743621826171875, 0.19402313232421875, 0.21368408203125, 0.23334503173828125, 0.2530059814453125, 0.27266693115234375, 0.292327880859375, 0.31198883056640625, 0.3316497802734375, 0.35131072998046875, 0.3709716796875, 0.39063262939453125, 0.4102935791015625, 0.42995452880859375, 0.449615478515625, 0.46927642822265625, 0.4889373779296875, 0.5085983276367188, 0.52825927734375, 0.5479202270507812, 0.5675811767578125, 0.5872421264648438, 0.606903076171875, 0.6265640258789062, 0.6462249755859375, 0.6658859252929688, 0.685546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 20.0, 18.0, 24.0, 23.0, 43.0, 47.0, 66.0, 61.0, 60.0, 85.0, 109.0, 88.0, 61.0, 71.0, 40.0, 31.0, 29.0, 33.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0063018798828125, -0.006111621856689453, -0.005921363830566406, -0.005731105804443359, -0.0055408477783203125, -0.005350589752197266, -0.005160331726074219, -0.004970073699951172, -0.004779815673828125, -0.004589557647705078, -0.004399299621582031, -0.004209041595458984, -0.0040187835693359375, -0.0038285255432128906, -0.0036382675170898438, -0.003448009490966797, -0.00325775146484375, -0.003067493438720703, -0.0028772354125976562, -0.0026869773864746094, -0.0024967193603515625, -0.0023064613342285156, -0.0021162033081054688, -0.0019259452819824219, -0.001735687255859375, -0.0015454292297363281, -0.0013551712036132812, -0.0011649131774902344, -0.0009746551513671875, -0.0007843971252441406, -0.0005941390991210938, -0.0004038810729980469, -0.000213623046875, -2.3365020751953125e-05, 0.00016689300537109375, 0.0003571510314941406, 0.0005474090576171875, 0.0007376670837402344, 0.0009279251098632812, 0.0011181831359863281, 0.001308441162109375, 0.0014986991882324219, 0.0016889572143554688, 0.0018792152404785156, 0.0020694732666015625, 0.0022597312927246094, 0.0024499893188476562, 0.002640247344970703, 0.00283050537109375, 0.003020763397216797, 0.0032110214233398438, 0.0034012794494628906, 0.0035915374755859375, 0.0037817955017089844, 0.003972053527832031, 0.004162311553955078, 0.004352569580078125, 0.004542827606201172, 0.004733085632324219, 0.004923343658447266, 0.0051136016845703125, 0.005303859710693359, 0.005494117736816406, 0.005684375762939453, 0.0058746337890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 3.0, 12.0, 13.0, 16.0, 28.0, 46.0, 56.0, 60.0, 89.0, 178.0, 323.0, 939.0, 416175.0, 628706.0, 983.0, 339.0, 164.0, 120.0, 83.0, 59.0, 38.0, 23.0, 24.0, 14.0, 10.0, 5.0, 4.0, 4.0, 7.0, 6.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1258544921875, -0.12179756164550781, -0.11774063110351562, -0.11368370056152344, -0.10962677001953125, -0.10556983947753906, -0.10151290893554688, -0.09745597839355469, -0.0933990478515625, -0.08934211730957031, -0.08528518676757812, -0.08122825622558594, -0.07717132568359375, -0.07311439514160156, -0.06905746459960938, -0.06500053405761719, -0.060943603515625, -0.05688667297363281, -0.052829742431640625, -0.04877281188964844, -0.04471588134765625, -0.04065895080566406, -0.036602020263671875, -0.03254508972167969, -0.0284881591796875, -0.024431228637695312, -0.020374298095703125, -0.016317367553710938, -0.01226043701171875, -0.008203506469726562, -0.004146575927734375, -8.96453857421875e-05, 0.00396728515625, 0.008024215698242188, 0.012081146240234375, 0.016138076782226562, 0.02019500732421875, 0.024251937866210938, 0.028308868408203125, 0.03236579895019531, 0.0364227294921875, 0.04047966003417969, 0.044536590576171875, 0.04859352111816406, 0.05265045166015625, 0.05670738220214844, 0.060764312744140625, 0.06482124328613281, 0.068878173828125, 0.07293510437011719, 0.07699203491210938, 0.08104896545410156, 0.08510589599609375, 0.08916282653808594, 0.09321975708007812, 0.09727668762207031, 0.1013336181640625, 0.10539054870605469, 0.10944747924804688, 0.11350440979003906, 0.11756134033203125, 0.12161827087402344, 0.12567520141601562, 0.1297321319580078, 0.1337890625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 31.0, 195.0, 519.0, 215.0, 39.0, 12.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.024682270362973213, -0.02424539066851139, -0.023808512836694717, -0.023371633142232895, -0.022934753447771072, -0.02249787375330925, -0.022060995921492577, -0.021624116227030754, -0.02118723839521408, -0.02075035870075226, -0.020313480868935585, -0.019876601174473763, -0.01943972148001194, -0.019002843648195267, -0.018565963953733444, -0.01812908425927162, -0.0176922045648098, -0.017255324870347977, -0.016818447038531303, -0.01638156734406948, -0.01594468764960766, -0.01550780888646841, -0.015070930123329163, -0.01463405042886734, -0.014197171665728092, -0.013760292902588844, -0.013323413208127022, -0.012886534444987774, -0.012449655681848526, -0.012012775987386703, -0.011575897224247456, -0.011139018461108208, -0.01070213969796896, -0.010265260934829712, -0.00982838124036789, -0.009391502477228642, -0.008954623714089394, -0.008517744019627571, -0.008080865256488323, -0.007643986027687788, -0.007207106798887253, -0.006770227570086718, -0.006333348341286182, -0.0058964695781469345, -0.005459590349346399, -0.005022711120545864, -0.004585832357406616, -0.004148953128606081, -0.003712073899805546, -0.0032751946710050106, -0.002838315675035119, -0.0024014366790652275, -0.0019645574502646923, -0.001527678221464157, -0.0010907992254942656, -0.000653920229524374, -0.0002170410007238388, 0.00021983811166137457, 0.0006567172240465879, 0.0010935963364318013, 0.0015304754488170147, 0.00196735467761755, 0.0024042336735874414, 0.002841112669557333, 0.003277991898357868]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 12.0, 20.0, 21.0, 24.0, 27.0, 24.0, 32.0, 51.0, 50.0, 50.0, 53.0, 70.0, 58.0, 60.0, 55.0, 56.0, 48.0, 40.0, 43.0, 33.0, 35.0, 26.0, 16.0, 25.0, 9.0, 10.0, 13.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003043830394744873, -0.0029310202226042747, -0.0028182100504636765, -0.002705399878323078, -0.00259258970618248, -0.0024797795340418816, -0.0023669693619012833, -0.002254159189760685, -0.0021413490176200867, -0.0020285388454794884, -0.00191572867333889, -0.0018029185011982918, -0.0016901083290576935, -0.0015772981569170952, -0.0014644879847764969, -0.0013516778126358986, -0.0012388676404953003, -0.001126057468354702, -0.0010132472962141037, -0.0009004371240735054, -0.0007876269519329071, -0.0006748167797923088, -0.0005620066076517105, -0.0004491964355111122, -0.0003363862633705139, -0.00022357609122991562, -0.00011076591908931732, 2.0442530512809753e-06, 0.00011485442519187927, 0.00022766459733247757, 0.00034047476947307587, 0.00045328494161367416, 0.0005660951137542725, 0.0006789052858948708, 0.0007917154580354691, 0.0009045256301760674, 0.0010173358023166656, 0.001130145974457264, 0.0012429561465978622, 0.0013557663187384605, 0.0014685764908790588, 0.0015813866630196571, 0.0016941968351602554, 0.0018070070073008537, 0.001919817179441452, 0.0020326273515820503, 0.0021454375237226486, 0.002258247695863247, 0.002371057868003845, 0.0024838680401444435, 0.002596678212285042, 0.00270948838442564, 0.0028222985565662384, 0.0029351087287068367, 0.003047918900847435, 0.0031607290729880333, 0.0032735392451286316, 0.00338634941726923, 0.003499159589409828, 0.0036119697615504265, 0.0037247799336910248, 0.003837590105831623, 0.003950400277972221, 0.00406321045011282, 0.004176020622253418]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 43.0, 36.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 10.0, 11.0, 6.0, 11.0, 20.0, 21.0, 20.0, 17.0, 46.0, 51.0, 56.0, 78.0, 129.0, 190.0, 270.0, 510.0, 1322.0, 4434.0, 18351.0, 111371.0, 774742.0, 111073.0, 18458.0, 4495.0, 1354.0, 564.0, 299.0, 160.0, 111.0, 87.0, 66.0, 56.0, 30.0, 31.0, 21.0, 19.0, 12.0, 16.0, 10.0, 8.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-15.1796875, -14.7265625, -14.2734375, -13.8203125, -13.3671875, -12.9140625, -12.4609375, -12.0078125, -11.5546875, -11.1015625, -10.6484375, -10.1953125, -9.7421875, -9.2890625, -8.8359375, -8.3828125, -7.9296875, -7.4765625, -7.0234375, -6.5703125, -6.1171875, -5.6640625, -5.2109375, -4.7578125, -4.3046875, -3.8515625, -3.3984375, -2.9453125, -2.4921875, -2.0390625, -1.5859375, -1.1328125, -0.6796875, -0.2265625, 0.2265625, 0.6796875, 1.1328125, 1.5859375, 2.0390625, 2.4921875, 2.9453125, 3.3984375, 3.8515625, 4.3046875, 4.7578125, 5.2109375, 5.6640625, 6.1171875, 6.5703125, 7.0234375, 7.4765625, 7.9296875, 8.3828125, 8.8359375, 9.2890625, 9.7421875, 10.1953125, 10.6484375, 11.1015625, 11.5546875, 12.0078125, 12.4609375, 12.9140625, 13.3671875, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 4.0, 7.0, 5.0, 12.0, 14.0, 14.0, 18.0, 18.0, 23.0, 33.0, 30.0, 48.0, 41.0, 44.0, 53.0, 51.0, 79.0, 227.0, 1699.0, 158.0, 76.0, 64.0, 40.0, 36.0, 37.0, 35.0, 28.0, 23.0, 24.0, 25.0, 20.0, 9.0, 7.0, 13.0, 5.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.109375, -22.375244140625, -21.64111328125, -20.906982421875, -20.1728515625, -19.438720703125, -18.70458984375, -17.970458984375, -17.236328125, -16.502197265625, -15.76806640625, -15.033935546875, -14.2998046875, -13.565673828125, -12.83154296875, -12.097412109375, -11.36328125, -10.629150390625, -9.89501953125, -9.160888671875, -8.4267578125, -7.692626953125, -6.95849609375, -6.224365234375, -5.490234375, -4.756103515625, -4.02197265625, -3.287841796875, -2.5537109375, -1.819580078125, -1.08544921875, -0.351318359375, 0.3828125, 1.116943359375, 1.85107421875, 2.585205078125, 3.3193359375, 4.053466796875, 4.78759765625, 5.521728515625, 6.255859375, 6.989990234375, 7.72412109375, 8.458251953125, 9.1923828125, 9.926513671875, 10.66064453125, 11.394775390625, 12.12890625, 12.863037109375, 13.59716796875, 14.331298828125, 15.0654296875, 15.799560546875, 16.53369140625, 17.267822265625, 18.001953125, 18.736083984375, 19.47021484375, 20.204345703125, 20.9384765625, 21.672607421875, 22.40673828125, 23.140869140625, 23.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 10.0, 6.0, 8.0, 24.0, 28.0, 24.0, 53.0, 47.0, 55.0, 71.0, 120.0, 183.0, 371.0, 1139.0, 27149.0, 3096117.0, 18180.0, 1026.0, 374.0, 178.0, 133.0, 94.0, 62.0, 45.0, 36.0, 32.0, 22.0, 25.0, 15.0, 16.0, 7.0, 7.0, 7.0, 3.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -54.0625, -52.34375, -50.625, -48.90625, -47.1875, -45.46875, -43.75, -42.03125, -40.3125, -38.59375, -36.875, -35.15625, -33.4375, -31.71875, -30.0, -28.28125, -26.5625, -24.84375, -23.125, -21.40625, -19.6875, -17.96875, -16.25, -14.53125, -12.8125, -11.09375, -9.375, -7.65625, -5.9375, -4.21875, -2.5, -0.78125, 0.9375, 2.65625, 4.375, 6.09375, 7.8125, 9.53125, 11.25, 12.96875, 14.6875, 16.40625, 18.125, 19.84375, 21.5625, 23.28125, 25.0, 26.71875, 28.4375, 30.15625, 31.875, 33.59375, 35.3125, 37.03125, 38.75, 40.46875, 42.1875, 43.90625, 45.625, 47.34375, 49.0625, 50.78125, 52.5, 54.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 14.0, 24.0, 38.0, 64.0, 113.0, 136.0, 149.0, 166.0, 103.0, 83.0, 47.0, 32.0, 16.0, 9.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.8138370513916, -28.0267391204834, -27.239639282226562, -26.45254135131836, -25.665443420410156, -24.878345489501953, -24.091245651245117, -23.304147720336914, -22.517047882080078, -21.729949951171875, -20.94285011291504, -20.155752182006836, -19.368654251098633, -18.581554412841797, -17.794456481933594, -17.00735855102539, -16.220260620117188, -15.433161735534668, -14.646063804626465, -13.858964920043945, -13.071866989135742, -12.284768104553223, -11.497669219970703, -10.7105712890625, -9.92347240447998, -9.136373519897461, -8.349275588989258, -7.562176704406738, -6.775078296661377, -5.987979888916016, -5.200881004333496, -4.413782596588135, -3.6266841888427734, -2.839585781097412, -2.0524871349334717, -1.2653884887695312, -0.4782900810241699, 0.3088083267211914, 1.095907211303711, 1.8830056190490723, 2.6701040267944336, 3.457202434539795, 4.244300842285156, 5.031399726867676, 5.818498134613037, 6.605596542358398, 7.392695426940918, 8.179794311523438, 8.96689224243164, 9.75399112701416, 10.541089057922363, 11.328187942504883, 12.115285873413086, 12.902384757995605, 13.689483642578125, 14.476581573486328, 15.263680458068848, 16.050779342651367, 16.83787727355957, 17.624977111816406, 18.41207504272461, 19.199172973632812, 19.986270904541016, 20.77337074279785, 21.560468673706055]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 8.0, 8.0, 10.0, 6.0, 12.0, 14.0, 16.0, 19.0, 22.0, 21.0, 29.0, 24.0, 34.0, 25.0, 30.0, 34.0, 24.0, 34.0, 36.0, 34.0, 35.0, 27.0, 36.0, 41.0, 34.0, 29.0, 30.0, 33.0, 23.0, 27.0, 27.0, 13.0, 26.0, 18.0, 22.0, 14.0, 22.0, 15.0, 13.0, 8.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-47.50079345703125, -46.00641632080078, -44.51204299926758, -43.017669677734375, -41.523292541503906, -40.02891540527344, -38.534542083740234, -37.04016876220703, -35.54579162597656, -34.051414489746094, -32.55704116821289, -31.062665939331055, -29.56829071044922, -28.073915481567383, -26.579540252685547, -25.08516502380371, -23.590789794921875, -22.09641456604004, -20.602039337158203, -19.107664108276367, -17.61328887939453, -16.118913650512695, -14.62453842163086, -13.130163192749023, -11.635787963867188, -10.141412734985352, -8.647037506103516, -7.15266227722168, -5.658287048339844, -4.163911819458008, -2.669536590576172, -1.175161361694336, 0.3192138671875, 1.813589096069336, 3.307964324951172, 4.802339553833008, 6.296714782714844, 7.79109001159668, 9.285465240478516, 10.779840469360352, 12.274215698242188, 13.768590927124023, 15.26296615600586, 16.757341384887695, 18.25171661376953, 19.746091842651367, 21.240467071533203, 22.73484230041504, 24.229217529296875, 25.72359275817871, 27.217967987060547, 28.712343215942383, 30.20671844482422, 31.701093673706055, 33.19546890258789, 34.689842224121094, 36.18421936035156, 37.67859649658203, 39.172969818115234, 40.66734313964844, 42.161720275878906, 43.656097412109375, 45.15047073364258, 46.64484405517578, 48.13922119140625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 7.0, 8.0, 12.0, 14.0, 13.0, 21.0, 14.0, 17.0, 27.0, 19.0, 25.0, 23.0, 26.0, 28.0, 46.0, 41.0, 42.0, 45.0, 48.0, 38.0, 50.0, 37.0, 38.0, 30.0, 32.0, 31.0, 28.0, 30.0, 25.0, 26.0, 22.0, 22.0, 16.0, 19.0, 7.0, 16.0, 9.0, 5.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-7.4375, -7.214599609375, -6.99169921875, -6.768798828125, -6.5458984375, -6.322998046875, -6.10009765625, -5.877197265625, -5.654296875, -5.431396484375, -5.20849609375, -4.985595703125, -4.7626953125, -4.539794921875, -4.31689453125, -4.093994140625, -3.87109375, -3.648193359375, -3.42529296875, -3.202392578125, -2.9794921875, -2.756591796875, -2.53369140625, -2.310791015625, -2.087890625, -1.864990234375, -1.64208984375, -1.419189453125, -1.1962890625, -0.973388671875, -0.75048828125, -0.527587890625, -0.3046875, -0.081787109375, 0.14111328125, 0.364013671875, 0.5869140625, 0.809814453125, 1.03271484375, 1.255615234375, 1.478515625, 1.701416015625, 1.92431640625, 2.147216796875, 2.3701171875, 2.593017578125, 2.81591796875, 3.038818359375, 3.26171875, 3.484619140625, 3.70751953125, 3.930419921875, 4.1533203125, 4.376220703125, 4.59912109375, 4.822021484375, 5.044921875, 5.267822265625, 5.49072265625, 5.713623046875, 5.9365234375, 6.159423828125, 6.38232421875, 6.605224609375, 6.828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 7.0, 7.0, 12.0, 16.0, 15.0, 23.0, 23.0, 33.0, 60.0, 88.0, 175.0, 381.0, 860.0, 2049.0, 5765.0, 18413.0, 98842.0, 1260143.0, 2498718.0, 261025.0, 33046.0, 8837.0, 3244.0, 1261.0, 538.0, 274.0, 126.0, 66.0, 40.0, 35.0, 24.0, 29.0, 17.0, 17.0, 11.0, 6.0, 8.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.618408203125, -16.04931640625, -15.480224609375, -14.9111328125, -14.342041015625, -13.77294921875, -13.203857421875, -12.634765625, -12.065673828125, -11.49658203125, -10.927490234375, -10.3583984375, -9.789306640625, -9.22021484375, -8.651123046875, -8.08203125, -7.512939453125, -6.94384765625, -6.374755859375, -5.8056640625, -5.236572265625, -4.66748046875, -4.098388671875, -3.529296875, -2.960205078125, -2.39111328125, -1.822021484375, -1.2529296875, -0.683837890625, -0.11474609375, 0.454345703125, 1.0234375, 1.592529296875, 2.16162109375, 2.730712890625, 3.2998046875, 3.868896484375, 4.43798828125, 5.007080078125, 5.576171875, 6.145263671875, 6.71435546875, 7.283447265625, 7.8525390625, 8.421630859375, 8.99072265625, 9.559814453125, 10.12890625, 10.697998046875, 11.26708984375, 11.836181640625, 12.4052734375, 12.974365234375, 13.54345703125, 14.112548828125, 14.681640625, 15.250732421875, 15.81982421875, 16.388916015625, 16.9580078125, 17.527099609375, 18.09619140625, 18.665283203125, 19.234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 26.0, 24.0, 27.0, 28.0, 56.0, 72.0, 80.0, 108.0, 137.0, 217.0, 293.0, 365.0, 440.0, 484.0, 435.0, 323.0, 222.0, 176.0, 132.0, 101.0, 76.0, 65.0, 40.0, 26.0, 19.0, 10.0, 16.0, 11.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8671875, -11.48779296875, -11.1083984375, -10.72900390625, -10.349609375, -9.97021484375, -9.5908203125, -9.21142578125, -8.83203125, -8.45263671875, -8.0732421875, -7.69384765625, -7.314453125, -6.93505859375, -6.5556640625, -6.17626953125, -5.796875, -5.41748046875, -5.0380859375, -4.65869140625, -4.279296875, -3.89990234375, -3.5205078125, -3.14111328125, -2.76171875, -2.38232421875, -2.0029296875, -1.62353515625, -1.244140625, -0.86474609375, -0.4853515625, -0.10595703125, 0.2734375, 0.65283203125, 1.0322265625, 1.41162109375, 1.791015625, 2.17041015625, 2.5498046875, 2.92919921875, 3.30859375, 3.68798828125, 4.0673828125, 4.44677734375, 4.826171875, 5.20556640625, 5.5849609375, 5.96435546875, 6.34375, 6.72314453125, 7.1025390625, 7.48193359375, 7.861328125, 8.24072265625, 8.6201171875, 8.99951171875, 9.37890625, 9.75830078125, 10.1376953125, 10.51708984375, 10.896484375, 11.27587890625, 11.6552734375, 12.03466796875, 12.4140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 6.0, 10.0, 14.0, 20.0, 29.0, 33.0, 56.0, 57.0, 81.0, 87.0, 142.0, 219.0, 375.0, 776.0, 2893.0, 23831.0, 688139.0, 3395488.0, 73070.0, 6282.0, 1250.0, 477.0, 249.0, 173.0, 127.0, 89.0, 79.0, 49.0, 42.0, 25.0, 27.0, 19.0, 14.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-48.5, -47.23046875, -45.9609375, -44.69140625, -43.421875, -42.15234375, -40.8828125, -39.61328125, -38.34375, -37.07421875, -35.8046875, -34.53515625, -33.265625, -31.99609375, -30.7265625, -29.45703125, -28.1875, -26.91796875, -25.6484375, -24.37890625, -23.109375, -21.83984375, -20.5703125, -19.30078125, -18.03125, -16.76171875, -15.4921875, -14.22265625, -12.953125, -11.68359375, -10.4140625, -9.14453125, -7.875, -6.60546875, -5.3359375, -4.06640625, -2.796875, -1.52734375, -0.2578125, 1.01171875, 2.28125, 3.55078125, 4.8203125, 6.08984375, 7.359375, 8.62890625, 9.8984375, 11.16796875, 12.4375, 13.70703125, 14.9765625, 16.24609375, 17.515625, 18.78515625, 20.0546875, 21.32421875, 22.59375, 23.86328125, 25.1328125, 26.40234375, 27.671875, 28.94140625, 30.2109375, 31.48046875, 32.75]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 15.0, 29.0, 37.0, 75.0, 138.0, 190.0, 196.0, 134.0, 80.0, 59.0, 26.0, 8.0, 9.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.93444061279297, -103.53251647949219, -101.13058471679688, -98.7286605834961, -96.32673645019531, -93.9248046875, -91.52288055419922, -89.12095642089844, -86.71902465820312, -84.31710052490234, -81.91516876220703, -79.51324462890625, -77.11131286621094, -74.70938873291016, -72.30746459960938, -69.90553283691406, -67.50360870361328, -65.1016845703125, -62.69975280761719, -60.297828674316406, -57.89590072631836, -55.49397277832031, -53.09204864501953, -50.690120697021484, -48.28819274902344, -45.88626480102539, -43.484336853027344, -41.08241271972656, -38.680484771728516, -36.27855682373047, -33.87663269042969, -31.47470474243164, -29.072784423828125, -26.670856475830078, -24.268930435180664, -21.86700439453125, -19.465076446533203, -17.063148498535156, -14.661222457885742, -12.259296417236328, -9.857368469238281, -7.455441474914551, -5.05351448059082, -2.65158748626709, -0.24966049194335938, 2.152266502380371, 4.554193496704102, 6.956119537353516, 9.358047485351562, 11.759974479675293, 14.161901473999023, 16.563827514648438, 18.965755462646484, 21.36768341064453, 23.769609451293945, 26.17153549194336, 28.573463439941406, 30.975391387939453, 33.3773193359375, 35.77924346923828, 38.18117141723633, 40.583099365234375, 42.985023498535156, 45.3869514465332, 47.78887939453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 6.0, 20.0, 17.0, 18.0, 24.0, 16.0, 31.0, 33.0, 31.0, 32.0, 32.0, 41.0, 40.0, 42.0, 38.0, 46.0, 35.0, 40.0, 56.0, 52.0, 35.0, 42.0, 32.0, 33.0, 25.0, 16.0, 19.0, 23.0, 21.0, 13.0, 13.0, 6.0, 9.0, 7.0, 5.0, 3.0, 10.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.097259521484375, -44.75735092163086, -43.41743850708008, -42.07752990722656, -40.73761749267578, -39.397708892822266, -38.05780029296875, -36.71788787841797, -35.37797546386719, -34.03806686401367, -32.69815444946289, -31.358245849609375, -30.018333435058594, -28.678424835205078, -27.33851432800293, -25.99860382080078, -24.658695220947266, -23.318784713745117, -21.97887420654297, -20.638965606689453, -19.299053192138672, -17.959144592285156, -16.619234085083008, -15.27932357788086, -13.939413070678711, -12.599502563476562, -11.259592056274414, -9.919682502746582, -8.579771995544434, -7.239861488342285, -5.899951934814453, -4.560041427612305, -3.2201309204101562, -1.880220651626587, -0.5403103828430176, 0.7995996475219727, 2.139510154724121, 3.4794206619262695, 4.819330215454102, 6.15924072265625, 7.499151229858398, 8.839061737060547, 10.178972244262695, 11.518881797790527, 12.858792304992676, 14.198702812194824, 15.538612365722656, 16.878522872924805, 18.218433380126953, 19.5583438873291, 20.89825439453125, 22.238162994384766, 23.578075408935547, 24.917984008789062, 26.25789451599121, 27.59780502319336, 28.937715530395508, 30.277626037597656, 31.617536544799805, 32.95744705200195, 34.29735565185547, 35.63726806640625, 36.977176666259766, 38.31708526611328, 39.65699768066406]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 8.0, 15.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 33.0, 35.0, 38.0, 40.0, 39.0, 41.0, 32.0, 38.0, 34.0, 42.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 11.0, 4.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.35546875, -7.12518310546875, -6.8948974609375, -6.66461181640625, -6.434326171875, -6.20404052734375, -5.9737548828125, -5.74346923828125, -5.51318359375, -5.28289794921875, -5.0526123046875, -4.82232666015625, -4.592041015625, -4.36175537109375, -4.1314697265625, -3.90118408203125, -3.6708984375, -3.44061279296875, -3.2103271484375, -2.98004150390625, -2.749755859375, -2.51947021484375, -2.2891845703125, -2.05889892578125, -1.82861328125, -1.59832763671875, -1.3680419921875, -1.13775634765625, -0.907470703125, -0.67718505859375, -0.4468994140625, -0.21661376953125, 0.013671875, 0.24395751953125, 0.4742431640625, 0.70452880859375, 0.934814453125, 1.16510009765625, 1.3953857421875, 1.62567138671875, 1.85595703125, 2.08624267578125, 2.3165283203125, 2.54681396484375, 2.777099609375, 3.00738525390625, 3.2376708984375, 3.46795654296875, 3.6982421875, 3.92852783203125, 4.1588134765625, 4.38909912109375, 4.619384765625, 4.84967041015625, 5.0799560546875, 5.31024169921875, 5.54052734375, 5.77081298828125, 6.0010986328125, 6.23138427734375, 6.461669921875, 6.69195556640625, 6.9222412109375, 7.15252685546875, 7.3828125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 13.0, 24.0, 27.0, 43.0, 71.0, 96.0, 125.0, 216.0, 306.0, 429.0, 621.0, 903.0, 1327.0, 1927.0, 2816.0, 4178.0, 5926.0, 8857.0, 12667.0, 19026.0, 27304.0, 40205.0, 58832.0, 85279.0, 118523.0, 148898.0, 144507.0, 112765.0, 80016.0, 54784.0, 37284.0, 25655.0, 17344.0, 11671.0, 8192.0, 5649.0, 3821.0, 2566.0, 1770.0, 1236.0, 793.0, 600.0, 385.0, 273.0, 178.0, 136.0, 86.0, 68.0, 43.0, 35.0, 21.0, 14.0, 6.0, 5.0, 5.0, 4.0, 2.0], "bins": [-0.63134765625, -0.6121597290039062, -0.5929718017578125, -0.5737838745117188, -0.554595947265625, -0.5354080200195312, -0.5162200927734375, -0.49703216552734375, -0.47784423828125, -0.45865631103515625, -0.4394683837890625, -0.42028045654296875, -0.401092529296875, -0.38190460205078125, -0.3627166748046875, -0.34352874755859375, -0.3243408203125, -0.30515289306640625, -0.2859649658203125, -0.26677703857421875, -0.247589111328125, -0.22840118408203125, -0.2092132568359375, -0.19002532958984375, -0.17083740234375, -0.15164947509765625, -0.1324615478515625, -0.11327362060546875, -0.094085693359375, -0.07489776611328125, -0.0557098388671875, -0.03652191162109375, -0.017333984375, 0.00185394287109375, 0.0210418701171875, 0.04022979736328125, 0.059417724609375, 0.07860565185546875, 0.0977935791015625, 0.11698150634765625, 0.13616943359375, 0.15535736083984375, 0.1745452880859375, 0.19373321533203125, 0.212921142578125, 0.23210906982421875, 0.2512969970703125, 0.27048492431640625, 0.2896728515625, 0.30886077880859375, 0.3280487060546875, 0.34723663330078125, 0.366424560546875, 0.38561248779296875, 0.4048004150390625, 0.42398834228515625, 0.44317626953125, 0.46236419677734375, 0.4815521240234375, 0.5007400512695312, 0.519927978515625, 0.5391159057617188, 0.5583038330078125, 0.5774917602539062, 0.5966796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 16.0, 18.0, 22.0, 15.0, 25.0, 29.0, 23.0, 20.0, 29.0, 28.0, 46.0, 38.0, 45.0, 36.0, 33.0, 32.0, 1055.0, 39.0, 46.0, 46.0, 30.0, 25.0, 43.0, 26.0, 22.0, 25.0, 27.0, 21.0, 28.0, 17.0, 13.0, 15.0, 13.0, 11.0, 4.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.68878173828125, -4.5416259765625, -4.39447021484375, -4.247314453125, -4.10015869140625, -3.9530029296875, -3.80584716796875, -3.65869140625, -3.51153564453125, -3.3643798828125, -3.21722412109375, -3.070068359375, -2.92291259765625, -2.7757568359375, -2.62860107421875, -2.4814453125, -2.33428955078125, -2.1871337890625, -2.03997802734375, -1.892822265625, -1.74566650390625, -1.5985107421875, -1.45135498046875, -1.30419921875, -1.15704345703125, -1.0098876953125, -0.86273193359375, -0.715576171875, -0.56842041015625, -0.4212646484375, -0.27410888671875, -0.126953125, 0.02020263671875, 0.1673583984375, 0.31451416015625, 0.461669921875, 0.60882568359375, 0.7559814453125, 0.90313720703125, 1.05029296875, 1.19744873046875, 1.3446044921875, 1.49176025390625, 1.638916015625, 1.78607177734375, 1.9332275390625, 2.08038330078125, 2.2275390625, 2.37469482421875, 2.5218505859375, 2.66900634765625, 2.816162109375, 2.96331787109375, 3.1104736328125, 3.25762939453125, 3.40478515625, 3.55194091796875, 3.6990966796875, 3.84625244140625, 3.993408203125, 4.14056396484375, 4.2877197265625, 4.43487548828125, 4.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 12.0, 10.0, 11.0, 29.0, 43.0, 41.0, 72.0, 120.0, 193.0, 285.0, 465.0, 714.0, 1186.0, 1803.0, 2966.0, 4363.0, 6714.0, 10379.0, 16068.0, 25077.0, 38331.0, 58337.0, 86205.0, 119207.0, 317434.0, 1025026.0, 121630.0, 87719.0, 60397.0, 39616.0, 25724.0, 16723.0, 10650.0, 6950.0, 4502.0, 2854.0, 1886.0, 1204.0, 764.0, 510.0, 336.0, 212.0, 146.0, 79.0, 44.0, 34.0, 23.0, 11.0, 13.0, 6.0, 7.0, 5.0, 1.0, 2.0], "bins": [-0.59814453125, -0.5810699462890625, -0.563995361328125, -0.5469207763671875, -0.52984619140625, -0.5127716064453125, -0.495697021484375, -0.4786224365234375, -0.4615478515625, -0.4444732666015625, -0.427398681640625, -0.4103240966796875, -0.39324951171875, -0.3761749267578125, -0.359100341796875, -0.3420257568359375, -0.324951171875, -0.3078765869140625, -0.290802001953125, -0.2737274169921875, -0.25665283203125, -0.2395782470703125, -0.222503662109375, -0.2054290771484375, -0.1883544921875, -0.1712799072265625, -0.154205322265625, -0.1371307373046875, -0.12005615234375, -0.1029815673828125, -0.085906982421875, -0.0688323974609375, -0.0517578125, -0.0346832275390625, -0.017608642578125, -0.0005340576171875, 0.01654052734375, 0.0336151123046875, 0.050689697265625, 0.0677642822265625, 0.0848388671875, 0.1019134521484375, 0.118988037109375, 0.1360626220703125, 0.15313720703125, 0.1702117919921875, 0.187286376953125, 0.2043609619140625, 0.221435546875, 0.2385101318359375, 0.255584716796875, 0.2726593017578125, 0.28973388671875, 0.3068084716796875, 0.323883056640625, 0.3409576416015625, 0.3580322265625, 0.3751068115234375, 0.392181396484375, 0.4092559814453125, 0.42633056640625, 0.4434051513671875, 0.460479736328125, 0.4775543212890625, 0.49462890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 2.0, 10.0, 7.0, 14.0, 13.0, 29.0, 39.0, 39.0, 44.0, 59.0, 80.0, 101.0, 83.0, 86.0, 85.0, 80.0, 50.0, 41.0, 25.0, 28.0, 17.0, 10.0, 9.0, 6.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005615234375, -0.00545269250869751, -0.0052901506423950195, -0.005127608776092529, -0.004965066909790039, -0.004802525043487549, -0.004639983177185059, -0.004477441310882568, -0.004314899444580078, -0.004152357578277588, -0.003989815711975098, -0.0038272738456726074, -0.003664731979370117, -0.003502190113067627, -0.0033396482467651367, -0.0031771063804626465, -0.0030145645141601562, -0.002852022647857666, -0.0026894807815551758, -0.0025269389152526855, -0.0023643970489501953, -0.002201855182647705, -0.002039313316345215, -0.0018767714500427246, -0.0017142295837402344, -0.0015516877174377441, -0.001389145851135254, -0.0012266039848327637, -0.0010640621185302734, -0.0009015202522277832, -0.000738978385925293, -0.0005764365196228027, -0.0004138946533203125, -0.00025135278701782227, -8.881092071533203e-05, 7.37309455871582e-05, 0.00023627281188964844, 0.00039881467819213867, 0.0005613565444946289, 0.0007238984107971191, 0.0008864402770996094, 0.0010489821434020996, 0.0012115240097045898, 0.00137406587600708, 0.0015366077423095703, 0.0016991496086120605, 0.0018616914749145508, 0.002024233341217041, 0.0021867752075195312, 0.0023493170738220215, 0.0025118589401245117, 0.002674400806427002, 0.002836942672729492, 0.0029994845390319824, 0.0031620264053344727, 0.003324568271636963, 0.003487110137939453, 0.0036496520042419434, 0.0038121938705444336, 0.003974735736846924, 0.004137277603149414, 0.004299819469451904, 0.0044623613357543945, 0.004624903202056885, 0.004787445068359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 8.0, 10.0, 15.0, 28.0, 33.0, 50.0, 73.0, 112.0, 167.0, 338.0, 872.0, 164677.0, 879786.0, 1361.0, 372.0, 207.0, 122.0, 86.0, 59.0, 37.0, 22.0, 29.0, 9.0, 17.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09300422668457031, -0.08957290649414062, -0.08614158630371094, -0.08271026611328125, -0.07927894592285156, -0.07584762573242188, -0.07241630554199219, -0.0689849853515625, -0.06555366516113281, -0.062122344970703125, -0.05869102478027344, -0.05525970458984375, -0.05182838439941406, -0.048397064208984375, -0.04496574401855469, -0.041534423828125, -0.03810310363769531, -0.034671783447265625, -0.031240463256835938, -0.02780914306640625, -0.024377822875976562, -0.020946502685546875, -0.017515182495117188, -0.0140838623046875, -0.010652542114257812, -0.007221221923828125, -0.0037899017333984375, -0.00035858154296875, 0.0030727386474609375, 0.006504058837890625, 0.009935379028320312, 0.01336669921875, 0.016798019409179688, 0.020229339599609375, 0.023660659790039062, 0.02709197998046875, 0.030523300170898438, 0.033954620361328125, 0.03738594055175781, 0.0408172607421875, 0.04424858093261719, 0.047679901123046875, 0.05111122131347656, 0.05454254150390625, 0.05797386169433594, 0.061405181884765625, 0.06483650207519531, 0.068267822265625, 0.07169914245605469, 0.07513046264648438, 0.07856178283691406, 0.08199310302734375, 0.08542442321777344, 0.08885574340820312, 0.09228706359863281, 0.0957183837890625, 0.09914970397949219, 0.10258102416992188, 0.10601234436035156, 0.10944366455078125, 0.11287498474121094, 0.11630630493164062, 0.11973762512207031, 0.1231689453125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 129.0, 702.0, 170.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012886013835668564, -0.012287216261029243, -0.011688417755067348, -0.011089619249105453, -0.010490821674466133, -0.009892024099826813, -0.009293225593864918, -0.008694427087903023, -0.008095629513263702, -0.007496831472963095, -0.006898033432662487, -0.006299235392361879, -0.005700437352061272, -0.005101639311760664, -0.004502841271460056, -0.0039040432311594486, -0.003305245190858841, -0.0027064471505582333, -0.0021076491102576256, -0.001508851069957018, -0.0009100530296564102, -0.00031125498935580254, 0.00028754305094480515, 0.0008863410912454128, 0.0014851391315460205, 0.002083937171846628, 0.002682735212147236, 0.0032815332524478436, 0.0038803312927484512, 0.004479129333049059, 0.005077927373349667, 0.005676725413650274, 0.006275523453950882, 0.00687432149425149, 0.007473119534552097, 0.008071918040513992, 0.008670715615153313, 0.009269513189792633, 0.009868311695754528, 0.010467110201716423, 0.011065907776355743, 0.011664705350995064, 0.012263503856956959, 0.012862302362918854, 0.013461099937558174, 0.014059897512197495, 0.01465869601815939, 0.015257494524121284, 0.015856292098760605, 0.016455089673399925, 0.017053887248039246, 0.017652686685323715, 0.018251484259963036, 0.018850281834602356, 0.019449081271886826, 0.020047878846526146, 0.020646676421165466, 0.021245473995804787, 0.021844271570444107, 0.022443071007728577, 0.023041868582367897, 0.023640666157007217, 0.024239465594291687, 0.024838263168931007, 0.025437060743570328]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 6.0, 8.0, 12.0, 16.0, 22.0, 15.0, 15.0, 19.0, 23.0, 29.0, 28.0, 24.0, 28.0, 34.0, 34.0, 36.0, 33.0, 32.0, 42.0, 36.0, 34.0, 39.0, 47.0, 30.0, 33.0, 32.0, 40.0, 38.0, 30.0, 27.0, 24.0, 18.0, 20.0, 22.0, 16.0, 4.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002066671848297119, -0.002003171481192112, -0.0019396711140871048, -0.0018761707469820976, -0.0018126703798770905, -0.0017491700127720833, -0.0016856696456670761, -0.001622169278562069, -0.0015586689114570618, -0.0014951685443520546, -0.0014316681772470474, -0.0013681678101420403, -0.001304667443037033, -0.001241167075932026, -0.0011776667088270187, -0.0011141663417220116, -0.0010506659746170044, -0.0009871656075119972, -0.00092366524040699, -0.0008601648733019829, -0.0007966645061969757, -0.0007331641390919685, -0.0006696637719869614, -0.0006061634048819542, -0.000542663037776947, -0.00047916267067193985, -0.0004156623035669327, -0.0003521619364619255, -0.00028866156935691833, -0.00022516120225191116, -0.000161660835146904, -9.816046804189682e-05, -3.466010093688965e-05, 2.8840266168117523e-05, 9.23406332731247e-05, 0.00015584100037813187, 0.00021934136748313904, 0.0002828417345881462, 0.0003463421016931534, 0.00040984246879816055, 0.0004733428359031677, 0.0005368432030081749, 0.0006003435701131821, 0.0006638439372181892, 0.0007273443043231964, 0.0007908446714282036, 0.0008543450385332108, 0.0009178454056382179, 0.000981345772743225, 0.0010448461398482323, 0.0011083465069532394, 0.0011718468740582466, 0.0012353472411632538, 0.001298847608268261, 0.0013623479753732681, 0.0014258483424782753, 0.0014893487095832825, 0.0015528490766882896, 0.0016163494437932968, 0.001679849810898304, 0.0017433501780033112, 0.0018068505451083183, 0.0018703509122133255, 0.0019338512793183327, 0.00199735164642334]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 7.0, 16.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 32.0, 36.0, 37.0, 40.0, 40.0, 41.0, 32.0, 38.0, 33.0, 43.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 10.0, 5.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.359375, -7.1290283203125, -6.898681640625, -6.6683349609375, -6.43798828125, -6.2076416015625, -5.977294921875, -5.7469482421875, -5.5166015625, -5.2862548828125, -5.055908203125, -4.8255615234375, -4.59521484375, -4.3648681640625, -4.134521484375, -3.9041748046875, -3.673828125, -3.4434814453125, -3.213134765625, -2.9827880859375, -2.75244140625, -2.5220947265625, -2.291748046875, -2.0614013671875, -1.8310546875, -1.6007080078125, -1.370361328125, -1.1400146484375, -0.90966796875, -0.6793212890625, -0.448974609375, -0.2186279296875, 0.01171875, 0.2420654296875, 0.472412109375, 0.7027587890625, 0.93310546875, 1.1634521484375, 1.393798828125, 1.6241455078125, 1.8544921875, 2.0848388671875, 2.315185546875, 2.5455322265625, 2.77587890625, 3.0062255859375, 3.236572265625, 3.4669189453125, 3.697265625, 3.9276123046875, 4.157958984375, 4.3883056640625, 4.61865234375, 4.8489990234375, 5.079345703125, 5.3096923828125, 5.5400390625, 5.7703857421875, 6.000732421875, 6.2310791015625, 6.46142578125, 6.6917724609375, 6.922119140625, 7.1524658203125, 7.3828125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 10.0, 7.0, 8.0, 14.0, 8.0, 13.0, 26.0, 31.0, 40.0, 39.0, 65.0, 58.0, 81.0, 110.0, 172.0, 216.0, 288.0, 411.0, 547.0, 1196.0, 2805.0, 9197.0, 36095.0, 505895.0, 441567.0, 34762.0, 8871.0, 2699.0, 1095.0, 584.0, 402.0, 293.0, 254.0, 156.0, 126.0, 101.0, 84.0, 58.0, 36.0, 34.0, 23.0, 18.0, 14.0, 14.0, 6.0, 10.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.515625, -17.936767578125, -17.35791015625, -16.779052734375, -16.2001953125, -15.621337890625, -15.04248046875, -14.463623046875, -13.884765625, -13.305908203125, -12.72705078125, -12.148193359375, -11.5693359375, -10.990478515625, -10.41162109375, -9.832763671875, -9.25390625, -8.675048828125, -8.09619140625, -7.517333984375, -6.9384765625, -6.359619140625, -5.78076171875, -5.201904296875, -4.623046875, -4.044189453125, -3.46533203125, -2.886474609375, -2.3076171875, -1.728759765625, -1.14990234375, -0.571044921875, 0.0078125, 0.586669921875, 1.16552734375, 1.744384765625, 2.3232421875, 2.902099609375, 3.48095703125, 4.059814453125, 4.638671875, 5.217529296875, 5.79638671875, 6.375244140625, 6.9541015625, 7.532958984375, 8.11181640625, 8.690673828125, 9.26953125, 9.848388671875, 10.42724609375, 11.006103515625, 11.5849609375, 12.163818359375, 12.74267578125, 13.321533203125, 13.900390625, 14.479248046875, 15.05810546875, 15.636962890625, 16.2158203125, 16.794677734375, 17.37353515625, 17.952392578125, 18.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 10.0, 13.0, 10.0, 21.0, 19.0, 16.0, 25.0, 29.0, 22.0, 33.0, 37.0, 38.0, 42.0, 47.0, 62.0, 99.0, 1701.0, 273.0, 78.0, 63.0, 41.0, 49.0, 38.0, 29.0, 29.0, 35.0, 23.0, 19.0, 23.0, 15.0, 18.0, 5.0, 8.0, 8.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.768798828125, -19.14697265625, -18.525146484375, -17.9033203125, -17.281494140625, -16.65966796875, -16.037841796875, -15.416015625, -14.794189453125, -14.17236328125, -13.550537109375, -12.9287109375, -12.306884765625, -11.68505859375, -11.063232421875, -10.44140625, -9.819580078125, -9.19775390625, -8.575927734375, -7.9541015625, -7.332275390625, -6.71044921875, -6.088623046875, -5.466796875, -4.844970703125, -4.22314453125, -3.601318359375, -2.9794921875, -2.357666015625, -1.73583984375, -1.114013671875, -0.4921875, 0.129638671875, 0.75146484375, 1.373291015625, 1.9951171875, 2.616943359375, 3.23876953125, 3.860595703125, 4.482421875, 5.104248046875, 5.72607421875, 6.347900390625, 6.9697265625, 7.591552734375, 8.21337890625, 8.835205078125, 9.45703125, 10.078857421875, 10.70068359375, 11.322509765625, 11.9443359375, 12.566162109375, 13.18798828125, 13.809814453125, 14.431640625, 15.053466796875, 15.67529296875, 16.297119140625, 16.9189453125, 17.540771484375, 18.16259765625, 18.784423828125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 11.0, 10.0, 6.0, 13.0, 19.0, 23.0, 28.0, 22.0, 25.0, 35.0, 51.0, 67.0, 78.0, 128.0, 225.0, 515.0, 3182.0, 113264.0, 3013563.0, 12496.0, 967.0, 317.0, 174.0, 82.0, 65.0, 52.0, 38.0, 33.0, 37.0, 26.0, 22.0, 20.0, 16.0, 19.0, 10.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.96875, -52.24072265625, -50.5126953125, -48.78466796875, -47.056640625, -45.32861328125, -43.6005859375, -41.87255859375, -40.14453125, -38.41650390625, -36.6884765625, -34.96044921875, -33.232421875, -31.50439453125, -29.7763671875, -28.04833984375, -26.3203125, -24.59228515625, -22.8642578125, -21.13623046875, -19.408203125, -17.68017578125, -15.9521484375, -14.22412109375, -12.49609375, -10.76806640625, -9.0400390625, -7.31201171875, -5.583984375, -3.85595703125, -2.1279296875, -0.39990234375, 1.328125, 3.05615234375, 4.7841796875, 6.51220703125, 8.240234375, 9.96826171875, 11.6962890625, 13.42431640625, 15.15234375, 16.88037109375, 18.6083984375, 20.33642578125, 22.064453125, 23.79248046875, 25.5205078125, 27.24853515625, 28.9765625, 30.70458984375, 32.4326171875, 34.16064453125, 35.888671875, 37.61669921875, 39.3447265625, 41.07275390625, 42.80078125, 44.52880859375, 46.2568359375, 47.98486328125, 49.712890625, 51.44091796875, 53.1689453125, 54.89697265625, 56.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 66.0, 207.0, 353.0, 258.0, 88.0, 19.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.25318908691406, -75.3061752319336, -73.35916900634766, -71.41215515136719, -69.46514892578125, -67.51813507080078, -65.57112884521484, -63.624114990234375, -61.67710876464844, -59.730098724365234, -57.78308868408203, -55.83607864379883, -53.889068603515625, -51.94205856323242, -49.99504852294922, -48.04803466796875, -46.10102462768555, -44.154014587402344, -42.20700454711914, -40.25999450683594, -38.312984466552734, -36.36597442626953, -34.41896057128906, -32.471954345703125, -30.52494239807129, -28.577932357788086, -26.630922317504883, -24.683910369873047, -22.736900329589844, -20.78989028930664, -18.842880249023438, -16.895870208740234, -14.948856353759766, -13.001846313476562, -11.05483627319336, -9.10782527923584, -7.160815238952637, -5.213805198669434, -3.266794204711914, -1.319784164428711, 0.6272258758544922, 2.5742361545562744, 4.521246433258057, 6.468256950378418, 8.415266990661621, 10.362277030944824, 12.309288024902344, 14.256298065185547, 16.20330810546875, 18.150318145751953, 20.097328186035156, 22.04433822631836, 23.991348266601562, 25.938358306884766, 27.8853702545166, 29.832380294799805, 31.779390335083008, 33.726402282714844, 35.67341232299805, 37.62042236328125, 39.56743240356445, 41.514442443847656, 43.46145248413086, 45.40846252441406, 47.355472564697266]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 1.0, 8.0, 7.0, 6.0, 20.0, 14.0, 17.0, 21.0, 26.0, 26.0, 31.0, 41.0, 35.0, 47.0, 37.0, 61.0, 42.0, 47.0, 51.0, 42.0, 32.0, 40.0, 44.0, 44.0, 34.0, 37.0, 37.0, 23.0, 17.0, 15.0, 19.0, 10.0, 19.0, 12.0, 4.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.02687072753906, -59.1953239440918, -57.3637809753418, -55.53223419189453, -53.700687408447266, -51.869140625, -50.03759765625, -48.206050872802734, -46.37450408935547, -44.5429573059082, -42.7114143371582, -40.87986755371094, -39.04832077026367, -37.216773986816406, -35.385231018066406, -33.55368423461914, -31.72214126586914, -29.890596389770508, -28.059049606323242, -26.22750473022461, -24.395957946777344, -22.56441307067871, -20.732868194580078, -18.901321411132812, -17.06977653503418, -15.23823070526123, -13.406684875488281, -11.575139999389648, -9.7435941696167, -7.91204833984375, -6.080503463745117, -4.248957633972168, -2.4174118041992188, -0.5858662128448486, 1.2456793785095215, 3.0772247314453125, 4.908770561218262, 6.740316390991211, 8.571861267089844, 10.403407096862793, 12.234952926635742, 14.066498756408691, 15.89804458618164, 17.729589462280273, 19.561134338378906, 21.392681121826172, 23.224225997924805, 25.055770874023438, 26.887317657470703, 28.718862533569336, 30.5504093170166, 32.381954193115234, 34.2135009765625, 36.0450439453125, 37.876590728759766, 39.70813751220703, 41.53968048095703, 43.3712272644043, 45.2027702331543, 47.03431701660156, 48.86586380004883, 50.697410583496094, 52.528953552246094, 54.36050033569336, 56.192047119140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 8.0, 11.0, 9.0, 12.0, 16.0, 18.0, 16.0, 23.0, 19.0, 22.0, 28.0, 26.0, 20.0, 29.0, 41.0, 34.0, 43.0, 46.0, 39.0, 42.0, 44.0, 34.0, 46.0, 41.0, 38.0, 35.0, 43.0, 34.0, 10.0, 26.0, 24.0, 23.0, 20.0, 17.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.828125, -7.58636474609375, -7.3446044921875, -7.10284423828125, -6.861083984375, -6.61932373046875, -6.3775634765625, -6.13580322265625, -5.89404296875, -5.65228271484375, -5.4105224609375, -5.16876220703125, -4.927001953125, -4.68524169921875, -4.4434814453125, -4.20172119140625, -3.9599609375, -3.71820068359375, -3.4764404296875, -3.23468017578125, -2.992919921875, -2.75115966796875, -2.5093994140625, -2.26763916015625, -2.02587890625, -1.78411865234375, -1.5423583984375, -1.30059814453125, -1.058837890625, -0.81707763671875, -0.5753173828125, -0.33355712890625, -0.091796875, 0.14996337890625, 0.3917236328125, 0.63348388671875, 0.875244140625, 1.11700439453125, 1.3587646484375, 1.60052490234375, 1.84228515625, 2.08404541015625, 2.3258056640625, 2.56756591796875, 2.809326171875, 3.05108642578125, 3.2928466796875, 3.53460693359375, 3.7763671875, 4.01812744140625, 4.2598876953125, 4.50164794921875, 4.743408203125, 4.98516845703125, 5.2269287109375, 5.46868896484375, 5.71044921875, 5.95220947265625, 6.1939697265625, 6.43572998046875, 6.677490234375, 6.91925048828125, 7.1610107421875, 7.40277099609375, 7.64453125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 17.0, 8.0, 16.0, 24.0, 29.0, 44.0, 58.0, 94.0, 104.0, 160.0, 283.0, 433.0, 759.0, 1369.0, 2700.0, 6098.0, 14870.0, 49043.0, 328152.0, 2165501.0, 1399109.0, 172450.0, 32382.0, 10983.0, 4507.0, 2242.0, 1089.0, 643.0, 375.0, 205.0, 145.0, 78.0, 74.0, 52.0, 35.0, 25.0, 22.0, 19.0, 20.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-15.796875, -15.31591796875, -14.8349609375, -14.35400390625, -13.873046875, -13.39208984375, -12.9111328125, -12.43017578125, -11.94921875, -11.46826171875, -10.9873046875, -10.50634765625, -10.025390625, -9.54443359375, -9.0634765625, -8.58251953125, -8.1015625, -7.62060546875, -7.1396484375, -6.65869140625, -6.177734375, -5.69677734375, -5.2158203125, -4.73486328125, -4.25390625, -3.77294921875, -3.2919921875, -2.81103515625, -2.330078125, -1.84912109375, -1.3681640625, -0.88720703125, -0.40625, 0.07470703125, 0.5556640625, 1.03662109375, 1.517578125, 1.99853515625, 2.4794921875, 2.96044921875, 3.44140625, 3.92236328125, 4.4033203125, 4.88427734375, 5.365234375, 5.84619140625, 6.3271484375, 6.80810546875, 7.2890625, 7.77001953125, 8.2509765625, 8.73193359375, 9.212890625, 9.69384765625, 10.1748046875, 10.65576171875, 11.13671875, 11.61767578125, 12.0986328125, 12.57958984375, 13.060546875, 13.54150390625, 14.0224609375, 14.50341796875, 14.984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 5.0, 13.0, 15.0, 29.0, 34.0, 38.0, 81.0, 100.0, 181.0, 244.0, 377.0, 565.0, 653.0, 601.0, 391.0, 229.0, 157.0, 116.0, 91.0, 50.0, 32.0, 21.0, 20.0, 10.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.671875, -15.139892578125, -14.60791015625, -14.075927734375, -13.5439453125, -13.011962890625, -12.47998046875, -11.947998046875, -11.416015625, -10.884033203125, -10.35205078125, -9.820068359375, -9.2880859375, -8.756103515625, -8.22412109375, -7.692138671875, -7.16015625, -6.628173828125, -6.09619140625, -5.564208984375, -5.0322265625, -4.500244140625, -3.96826171875, -3.436279296875, -2.904296875, -2.372314453125, -1.84033203125, -1.308349609375, -0.7763671875, -0.244384765625, 0.28759765625, 0.819580078125, 1.3515625, 1.883544921875, 2.41552734375, 2.947509765625, 3.4794921875, 4.011474609375, 4.54345703125, 5.075439453125, 5.607421875, 6.139404296875, 6.67138671875, 7.203369140625, 7.7353515625, 8.267333984375, 8.79931640625, 9.331298828125, 9.86328125, 10.395263671875, 10.92724609375, 11.459228515625, 11.9912109375, 12.523193359375, 13.05517578125, 13.587158203125, 14.119140625, 14.651123046875, 15.18310546875, 15.715087890625, 16.2470703125, 16.779052734375, 17.31103515625, 17.843017578125, 18.375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 8.0, 8.0, 14.0, 22.0, 35.0, 59.0, 54.0, 74.0, 135.0, 177.0, 264.0, 528.0, 1547.0, 8580.0, 121150.0, 3734941.0, 307272.0, 15544.0, 2288.0, 683.0, 327.0, 177.0, 130.0, 75.0, 53.0, 32.0, 30.0, 26.0, 15.0, 7.0, 10.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.48046875, -43.1171875, -41.75390625, -40.390625, -39.02734375, -37.6640625, -36.30078125, -34.9375, -33.57421875, -32.2109375, -30.84765625, -29.484375, -28.12109375, -26.7578125, -25.39453125, -24.03125, -22.66796875, -21.3046875, -19.94140625, -18.578125, -17.21484375, -15.8515625, -14.48828125, -13.125, -11.76171875, -10.3984375, -9.03515625, -7.671875, -6.30859375, -4.9453125, -3.58203125, -2.21875, -0.85546875, 0.5078125, 1.87109375, 3.234375, 4.59765625, 5.9609375, 7.32421875, 8.6875, 10.05078125, 11.4140625, 12.77734375, 14.140625, 15.50390625, 16.8671875, 18.23046875, 19.59375, 20.95703125, 22.3203125, 23.68359375, 25.046875, 26.41015625, 27.7734375, 29.13671875, 30.5, 31.86328125, 33.2265625, 34.58984375, 35.953125, 37.31640625, 38.6796875, 40.04296875, 41.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 15.0, 67.0, 247.0, 389.0, 209.0, 66.0, 14.0, 1.0, 0.0, 0.0, 1.0], "bins": [-306.80279541015625, -301.35601806640625, -295.90924072265625, -290.46246337890625, -285.01568603515625, -279.56890869140625, -274.12213134765625, -268.67535400390625, -263.22857666015625, -257.78179931640625, -252.33502197265625, -246.88824462890625, -241.44146728515625, -235.9946746826172, -230.5478973388672, -225.1011199951172, -219.65432739257812, -214.20755004882812, -208.76077270507812, -203.31399536132812, -197.86721801757812, -192.42042541503906, -186.97364807128906, -181.52687072753906, -176.08009338378906, -170.63331604003906, -165.18653869628906, -159.73976135253906, -154.29296875, -148.84619140625, -143.3994140625, -137.95263671875, -132.505859375, -127.05908203125, -121.6123046875, -116.16551971435547, -110.71874237060547, -105.27196502685547, -99.82518005371094, -94.37840270996094, -88.9316177368164, -83.4848403930664, -78.03805541992188, -72.59127807617188, -67.14450073242188, -61.697723388671875, -56.25094223022461, -50.804161071777344, -45.357383728027344, -39.910606384277344, -34.46382522583008, -29.017045974731445, -23.570266723632812, -18.12348747253418, -12.676708221435547, -7.229927062988281, -1.7831497192382812, 3.6636295318603516, 9.110408782958984, 14.557188034057617, 20.00396728515625, 25.450746536254883, 30.897525787353516, 36.34430694580078, 41.79108428955078]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 8.0, 2.0, 12.0, 7.0, 13.0, 16.0, 20.0, 17.0, 23.0, 18.0, 20.0, 25.0, 27.0, 36.0, 48.0, 35.0, 30.0, 39.0, 34.0, 44.0, 39.0, 42.0, 27.0, 40.0, 30.0, 31.0, 34.0, 27.0, 33.0, 30.0, 25.0, 31.0, 18.0, 16.0, 11.0, 12.0, 17.0, 5.0, 17.0, 5.0, 13.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.7432861328125, -37.51582336425781, -36.288360595703125, -35.06089782714844, -33.83343505859375, -32.60597229003906, -31.378511428833008, -30.15104866027832, -28.923585891723633, -27.696123123168945, -26.468660354614258, -25.24119758605957, -24.013736724853516, -22.786273956298828, -21.55881118774414, -20.331348419189453, -19.103885650634766, -17.876422882080078, -16.64896011352539, -15.42149829864502, -14.194035530090332, -12.966572761535645, -11.739110946655273, -10.511648178100586, -9.284185409545898, -8.056722640991211, -6.829260349273682, -5.601798057556152, -4.374335289001465, -3.1468725204467773, -1.919410228729248, -0.6919479370117188, 0.5355148315429688, 1.7629773616790771, 2.9904398918151855, 4.217902183532715, 5.445364952087402, 6.67282772064209, 7.900290012359619, 9.127752304077148, 10.355215072631836, 11.582677841186523, 12.810140609741211, 14.037602424621582, 15.26506519317627, 16.49252700805664, 17.719989776611328, 18.947452545166016, 20.174915313720703, 21.40237808227539, 22.629840850830078, 23.857303619384766, 25.084766387939453, 26.31222915649414, 27.539690017700195, 28.767152786254883, 29.99461555480957, 31.222078323364258, 32.44953918457031, 33.677001953125, 34.90446472167969, 36.131927490234375, 37.35939025878906, 38.58685302734375, 39.81431579589844]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 42.0, 44.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 12.0, 9.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 15.0, 26.0, 45.0, 58.0, 78.0, 123.0, 201.0, 297.0, 462.0, 714.0, 1127.0, 1764.0, 2649.0, 4109.0, 6392.0, 9966.0, 15626.0, 24178.0, 37751.0, 58858.0, 89771.0, 130651.0, 166749.0, 158209.0, 117265.0, 78659.0, 51227.0, 32562.0, 21060.0, 13167.0, 8845.0, 5528.0, 3688.0, 2421.0, 1538.0, 967.0, 653.0, 394.0, 248.0, 188.0, 114.0, 79.0, 45.0, 26.0, 24.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.7431640625, -0.7205352783203125, -0.697906494140625, -0.6752777099609375, -0.65264892578125, -0.6300201416015625, -0.607391357421875, -0.5847625732421875, -0.5621337890625, -0.5395050048828125, -0.516876220703125, -0.4942474365234375, -0.47161865234375, -0.4489898681640625, -0.426361083984375, -0.4037322998046875, -0.381103515625, -0.3584747314453125, -0.335845947265625, -0.3132171630859375, -0.29058837890625, -0.2679595947265625, -0.245330810546875, -0.2227020263671875, -0.2000732421875, -0.1774444580078125, -0.154815673828125, -0.1321868896484375, -0.10955810546875, -0.0869293212890625, -0.064300537109375, -0.0416717529296875, -0.01904296875, 0.0035858154296875, 0.026214599609375, 0.0488433837890625, 0.07147216796875, 0.0941009521484375, 0.116729736328125, 0.1393585205078125, 0.1619873046875, 0.1846160888671875, 0.207244873046875, 0.2298736572265625, 0.25250244140625, 0.2751312255859375, 0.297760009765625, 0.3203887939453125, 0.343017578125, 0.3656463623046875, 0.388275146484375, 0.4109039306640625, 0.43353271484375, 0.4561614990234375, 0.478790283203125, 0.5014190673828125, 0.5240478515625, 0.5466766357421875, 0.569305419921875, 0.5919342041015625, 0.61456298828125, 0.6371917724609375, 0.659820556640625, 0.6824493408203125, 0.705078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 13.0, 21.0, 22.0, 23.0, 25.0, 30.0, 26.0, 34.0, 38.0, 39.0, 46.0, 47.0, 43.0, 45.0, 1052.0, 31.0, 41.0, 31.0, 33.0, 35.0, 47.0, 36.0, 26.0, 33.0, 22.0, 19.0, 20.0, 22.0, 16.0, 5.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.08984375, -4.92645263671875, -4.7630615234375, -4.59967041015625, -4.436279296875, -4.27288818359375, -4.1094970703125, -3.94610595703125, -3.78271484375, -3.61932373046875, -3.4559326171875, -3.29254150390625, -3.129150390625, -2.96575927734375, -2.8023681640625, -2.63897705078125, -2.4755859375, -2.31219482421875, -2.1488037109375, -1.98541259765625, -1.822021484375, -1.65863037109375, -1.4952392578125, -1.33184814453125, -1.16845703125, -1.00506591796875, -0.8416748046875, -0.67828369140625, -0.514892578125, -0.35150146484375, -0.1881103515625, -0.02471923828125, 0.138671875, 0.30206298828125, 0.4654541015625, 0.62884521484375, 0.792236328125, 0.95562744140625, 1.1190185546875, 1.28240966796875, 1.44580078125, 1.60919189453125, 1.7725830078125, 1.93597412109375, 2.099365234375, 2.26275634765625, 2.4261474609375, 2.58953857421875, 2.7529296875, 2.91632080078125, 3.0797119140625, 3.24310302734375, 3.406494140625, 3.56988525390625, 3.7332763671875, 3.89666748046875, 4.06005859375, 4.22344970703125, 4.3868408203125, 4.55023193359375, 4.713623046875, 4.87701416015625, 5.0404052734375, 5.20379638671875, 5.3671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 13.0, 18.0, 35.0, 50.0, 75.0, 116.0, 186.0, 310.0, 522.0, 791.0, 1247.0, 1966.0, 3072.0, 4876.0, 7759.0, 12293.0, 19653.0, 30545.0, 48623.0, 74060.0, 109091.0, 145952.0, 1209332.0, 138691.0, 101158.0, 67319.0, 43447.0, 27722.0, 17804.0, 11105.0, 7083.0, 4377.0, 2895.0, 1831.0, 1149.0, 702.0, 469.0, 290.0, 171.0, 123.0, 78.0, 48.0, 27.0, 15.0, 9.0, 9.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.63330078125, -0.6137466430664062, -0.5941925048828125, -0.5746383666992188, -0.555084228515625, -0.5355300903320312, -0.5159759521484375, -0.49642181396484375, -0.47686767578125, -0.45731353759765625, -0.4377593994140625, -0.41820526123046875, -0.398651123046875, -0.37909698486328125, -0.3595428466796875, -0.33998870849609375, -0.3204345703125, -0.30088043212890625, -0.2813262939453125, -0.26177215576171875, -0.242218017578125, -0.22266387939453125, -0.2031097412109375, -0.18355560302734375, -0.16400146484375, -0.14444732666015625, -0.1248931884765625, -0.10533905029296875, -0.085784912109375, -0.06623077392578125, -0.0466766357421875, -0.02712249755859375, -0.007568359375, 0.01198577880859375, 0.0315399169921875, 0.05109405517578125, 0.070648193359375, 0.09020233154296875, 0.1097564697265625, 0.12931060791015625, 0.14886474609375, 0.16841888427734375, 0.1879730224609375, 0.20752716064453125, 0.227081298828125, 0.24663543701171875, 0.2661895751953125, 0.28574371337890625, 0.3052978515625, 0.32485198974609375, 0.3444061279296875, 0.36396026611328125, 0.383514404296875, 0.40306854248046875, 0.4226226806640625, 0.44217681884765625, 0.46173095703125, 0.48128509521484375, 0.5008392333984375, 0.5203933715820312, 0.539947509765625, 0.5595016479492188, 0.5790557861328125, 0.5986099243164062, 0.6181640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 23.0, 32.0, 44.0, 54.0, 60.0, 73.0, 85.0, 91.0, 81.0, 84.0, 58.0, 68.0, 58.0, 36.0, 32.0, 17.0, 17.0, 15.0, 7.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00699615478515625, -0.006795704364776611, -0.006595253944396973, -0.006394803524017334, -0.006194353103637695, -0.005993902683258057, -0.005793452262878418, -0.005593001842498779, -0.005392551422119141, -0.005192101001739502, -0.004991650581359863, -0.004791200160980225, -0.004590749740600586, -0.004390299320220947, -0.004189848899841309, -0.00398939847946167, -0.0037889480590820312, -0.0035884976387023926, -0.003388047218322754, -0.0031875967979431152, -0.0029871463775634766, -0.002786695957183838, -0.0025862455368041992, -0.0023857951164245605, -0.002185344696044922, -0.001984894275665283, -0.0017844438552856445, -0.0015839934349060059, -0.0013835430145263672, -0.0011830925941467285, -0.0009826421737670898, -0.0007821917533874512, -0.0005817413330078125, -0.00038129091262817383, -0.00018084049224853516, 1.9609928131103516e-05, 0.0002200603485107422, 0.00042051076889038086, 0.0006209611892700195, 0.0008214116096496582, 0.0010218620300292969, 0.0012223124504089355, 0.0014227628707885742, 0.0016232132911682129, 0.0018236637115478516, 0.0020241141319274902, 0.002224564552307129, 0.0024250149726867676, 0.0026254653930664062, 0.002825915813446045, 0.0030263662338256836, 0.0032268166542053223, 0.003427267074584961, 0.0036277174949645996, 0.0038281679153442383, 0.004028618335723877, 0.004229068756103516, 0.004429519176483154, 0.004629969596862793, 0.004830420017242432, 0.00503087043762207, 0.005231320858001709, 0.005431771278381348, 0.005632221698760986, 0.005832672119140625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 14.0, 13.0, 7.0, 25.0, 29.0, 34.0, 66.0, 82.0, 149.0, 165.0, 329.0, 803.0, 60574.0, 983653.0, 1463.0, 432.0, 224.0, 149.0, 100.0, 72.0, 36.0, 31.0, 21.0, 14.0, 10.0, 16.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10939979553222656, -0.10551834106445312, -0.10163688659667969, -0.09775543212890625, -0.09387397766113281, -0.08999252319335938, -0.08611106872558594, -0.0822296142578125, -0.07834815979003906, -0.07446670532226562, -0.07058525085449219, -0.06670379638671875, -0.06282234191894531, -0.058940887451171875, -0.05505943298339844, -0.051177978515625, -0.04729652404785156, -0.043415069580078125, -0.03953361511230469, -0.03565216064453125, -0.03177070617675781, -0.027889251708984375, -0.024007797241210938, -0.0201263427734375, -0.016244888305664062, -0.012363433837890625, -0.008481979370117188, -0.00460052490234375, -0.0007190704345703125, 0.003162384033203125, 0.0070438385009765625, 0.01092529296875, 0.014806747436523438, 0.018688201904296875, 0.022569656372070312, 0.02645111083984375, 0.030332565307617188, 0.034214019775390625, 0.03809547424316406, 0.0419769287109375, 0.04585838317871094, 0.049739837646484375, 0.05362129211425781, 0.05750274658203125, 0.06138420104980469, 0.06526565551757812, 0.06914710998535156, 0.073028564453125, 0.07691001892089844, 0.08079147338867188, 0.08467292785644531, 0.08855438232421875, 0.09243583679199219, 0.09631729125976562, 0.10019874572753906, 0.1040802001953125, 0.10796165466308594, 0.11184310913085938, 0.11572456359863281, 0.11960601806640625, 0.12348747253417969, 0.12736892700195312, 0.13125038146972656, 0.1351318359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 268.0, 748.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06338192522525787, -0.061718348413705826, -0.06005476787686348, -0.05839119106531143, -0.056727610528469086, -0.05506403371691704, -0.05340045690536499, -0.051736876368522644, -0.0500732958316803, -0.04840971902012825, -0.046746138483285904, -0.045082561671733856, -0.04341898113489151, -0.04175540432333946, -0.040091827511787415, -0.03842824697494507, -0.03676467016339302, -0.03510109335184097, -0.03343751281499863, -0.03177393600344658, -0.030110355466604233, -0.028446778655052185, -0.026783199980854988, -0.02511962130665779, -0.023456042632460594, -0.021792463958263397, -0.0201288852840662, -0.018465306609869003, -0.016801729798316956, -0.015138150192797184, -0.013474572449922562, -0.011810993775725365, -0.010147418826818466, -0.00848384015262127, -0.00682026194408536, -0.00515668373554945, -0.003493105061352253, -0.001829526387155056, -0.00016594864428043365, 0.0014976300299167633, 0.0031612087041139603, 0.004824787378311157, 0.006488365586847067, 0.008151943795382977, 0.009815522469580173, 0.01147910114377737, 0.013142678886651993, 0.01480625756084919, 0.016469836235046387, 0.018133414909243584, 0.01979699358344078, 0.02146057039499283, 0.023124150931835175, 0.024787727743387222, 0.02645130641758442, 0.028114885091781616, 0.029778463765978813, 0.03144204244017601, 0.03310561925172806, 0.034769199788570404, 0.03643277660012245, 0.0380963571369648, 0.039759933948516846, 0.04142351448535919, 0.04308709129691124]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 10.0, 13.0, 14.0, 13.0, 23.0, 27.0, 28.0, 33.0, 23.0, 26.0, 39.0, 35.0, 37.0, 45.0, 52.0, 52.0, 41.0, 54.0, 51.0, 47.0, 44.0, 49.0, 37.0, 30.0, 33.0, 34.0, 17.0, 19.0, 15.0, 19.0, 13.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024068355560302734, -0.002306555397808552, -0.00220627523958683, -0.0021059950813651085, -0.002005714923143387, -0.0019054347649216652, -0.0018051546066999435, -0.001704874448478222, -0.0016045942902565002, -0.0015043141320347786, -0.001404033973813057, -0.0013037538155913353, -0.0012034736573696136, -0.001103193499147892, -0.0010029133409261703, -0.0009026331827044487, -0.000802353024482727, -0.0007020728662610054, -0.0006017927080392838, -0.0005015125498175621, -0.00040123239159584045, -0.0003009522333741188, -0.00020067207515239716, -0.0001003919169306755, -1.1175870895385742e-07, 0.00010016839951276779, 0.00020044855773448944, 0.0003007287159562111, 0.00040100887417793274, 0.0005012890323996544, 0.000601569190621376, 0.0007018493488430977, 0.0008021295070648193, 0.000902409665286541, 0.0010026898235082626, 0.0011029699817299843, 0.001203250139951706, 0.0013035302981734276, 0.0014038104563951492, 0.0015040906146168709, 0.0016043707728385925, 0.0017046509310603142, 0.0018049310892820358, 0.0019052112475037575, 0.002005491405725479, 0.0021057715639472008, 0.0022060517221689224, 0.002306331880390644, 0.0024066120386123657, 0.0025068921968340874, 0.002607172355055809, 0.0027074525132775307, 0.0028077326714992523, 0.002908012829720974, 0.0030082929879426956, 0.0031085731461644173, 0.003208853304386139, 0.0033091334626078606, 0.003409413620829582, 0.003509693779051304, 0.0036099739372730255, 0.003710254095494747, 0.003810534253716469, 0.0039108144119381905, 0.004011094570159912]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 41.0, 45.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 13.0, 8.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 11.0, 9.0, 13.0, 18.0, 32.0, 29.0, 44.0, 61.0, 66.0, 124.0, 158.0, 272.0, 449.0, 831.0, 1526.0, 3095.0, 6202.0, 13311.0, 29188.0, 69345.0, 198131.0, 457629.0, 160008.0, 59471.0, 25691.0, 11428.0, 5389.0, 2681.0, 1367.0, 733.0, 370.0, 272.0, 172.0, 114.0, 73.0, 50.0, 44.0, 22.0, 31.0, 24.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-11.0859375, -10.7637939453125, -10.441650390625, -10.1195068359375, -9.79736328125, -9.4752197265625, -9.153076171875, -8.8309326171875, -8.5087890625, -8.1866455078125, -7.864501953125, -7.5423583984375, -7.22021484375, -6.8980712890625, -6.575927734375, -6.2537841796875, -5.931640625, -5.6094970703125, -5.287353515625, -4.9652099609375, -4.64306640625, -4.3209228515625, -3.998779296875, -3.6766357421875, -3.3544921875, -3.0323486328125, -2.710205078125, -2.3880615234375, -2.06591796875, -1.7437744140625, -1.421630859375, -1.0994873046875, -0.77734375, -0.4552001953125, -0.133056640625, 0.1890869140625, 0.51123046875, 0.8333740234375, 1.155517578125, 1.4776611328125, 1.7998046875, 2.1219482421875, 2.444091796875, 2.7662353515625, 3.08837890625, 3.4105224609375, 3.732666015625, 4.0548095703125, 4.376953125, 4.6990966796875, 5.021240234375, 5.3433837890625, 5.66552734375, 5.9876708984375, 6.309814453125, 6.6319580078125, 6.9541015625, 7.2762451171875, 7.598388671875, 7.9205322265625, 8.24267578125, 8.5648193359375, 8.886962890625, 9.2091064453125, 9.53125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 10.0, 10.0, 9.0, 16.0, 17.0, 21.0, 27.0, 20.0, 31.0, 22.0, 37.0, 42.0, 43.0, 71.0, 82.0, 138.0, 1518.0, 336.0, 141.0, 70.0, 55.0, 40.0, 28.0, 33.0, 40.0, 21.0, 28.0, 23.0, 20.0, 6.0, 14.0, 11.0, 12.0, 9.0, 10.0, 5.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.6494140625, -21.892578125, -21.1357421875, -20.37890625, -19.6220703125, -18.865234375, -18.1083984375, -17.3515625, -16.5947265625, -15.837890625, -15.0810546875, -14.32421875, -13.5673828125, -12.810546875, -12.0537109375, -11.296875, -10.5400390625, -9.783203125, -9.0263671875, -8.26953125, -7.5126953125, -6.755859375, -5.9990234375, -5.2421875, -4.4853515625, -3.728515625, -2.9716796875, -2.21484375, -1.4580078125, -0.701171875, 0.0556640625, 0.8125, 1.5693359375, 2.326171875, 3.0830078125, 3.83984375, 4.5966796875, 5.353515625, 6.1103515625, 6.8671875, 7.6240234375, 8.380859375, 9.1376953125, 9.89453125, 10.6513671875, 11.408203125, 12.1650390625, 12.921875, 13.6787109375, 14.435546875, 15.1923828125, 15.94921875, 16.7060546875, 17.462890625, 18.2197265625, 18.9765625, 19.7333984375, 20.490234375, 21.2470703125, 22.00390625, 22.7607421875, 23.517578125, 24.2744140625, 25.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 13.0, 19.0, 21.0, 28.0, 44.0, 50.0, 81.0, 102.0, 168.0, 248.0, 467.0, 1680.0, 19162.0, 1968957.0, 1135516.0, 16335.0, 1493.0, 491.0, 229.0, 161.0, 110.0, 79.0, 58.0, 38.0, 34.0, 25.0, 16.0, 15.0, 12.0, 2.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -36.990234375, -35.66796875, -34.345703125, -33.0234375, -31.701171875, -30.37890625, -29.056640625, -27.734375, -26.412109375, -25.08984375, -23.767578125, -22.4453125, -21.123046875, -19.80078125, -18.478515625, -17.15625, -15.833984375, -14.51171875, -13.189453125, -11.8671875, -10.544921875, -9.22265625, -7.900390625, -6.578125, -5.255859375, -3.93359375, -2.611328125, -1.2890625, 0.033203125, 1.35546875, 2.677734375, 4.0, 5.322265625, 6.64453125, 7.966796875, 9.2890625, 10.611328125, 11.93359375, 13.255859375, 14.578125, 15.900390625, 17.22265625, 18.544921875, 19.8671875, 21.189453125, 22.51171875, 23.833984375, 25.15625, 26.478515625, 27.80078125, 29.123046875, 30.4453125, 31.767578125, 33.08984375, 34.412109375, 35.734375, 37.056640625, 38.37890625, 39.701171875, 41.0234375, 42.345703125, 43.66796875, 44.990234375, 46.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 260.0, 748.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.1582641601562, -556.3590087890625, -544.5596923828125, -532.7604370117188, -520.961181640625, -509.1618957519531, -497.36260986328125, -485.5633544921875, -473.76409912109375, -461.9648132324219, -450.1655578613281, -438.36627197265625, -426.5670166015625, -414.7677307128906, -402.96844482421875, -391.169189453125, -379.3699035644531, -367.57061767578125, -355.7713623046875, -343.9720764160156, -332.1728210449219, -320.37353515625, -308.57427978515625, -296.7749938964844, -284.9757080078125, -273.1764221191406, -261.3771667480469, -249.577880859375, -237.77862548828125, -225.97933959960938, -214.18006896972656, -202.38079833984375, -190.58151245117188, -178.78224182128906, -166.98297119140625, -155.18368530273438, -143.38442993164062, -131.58514404296875, -119.78587341308594, -107.98660278320312, -96.18733215332031, -84.3880615234375, -72.58879089355469, -60.789512634277344, -48.99024200439453, -37.19097137451172, -25.391693115234375, -13.592422485351562, -1.79315185546875, 10.006120681762695, 21.80539321899414, 33.60466766357422, 45.40393829345703, 57.203208923339844, 69.00248718261719, 80.8017578125, 92.60102844238281, 104.40029907226562, 116.19956970214844, 127.99884796142578, 139.79812622070312, 151.59738159179688, 163.39666748046875, 175.19593811035156, 186.99520874023438]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 0.0, 9.0, 8.0, 7.0, 17.0, 18.0, 16.0, 12.0, 15.0, 24.0, 21.0, 30.0, 23.0, 27.0, 26.0, 35.0, 28.0, 44.0, 33.0, 38.0, 30.0, 36.0, 30.0, 31.0, 38.0, 37.0, 48.0, 29.0, 23.0, 37.0, 31.0, 22.0, 25.0, 28.0, 14.0, 19.0, 10.0, 15.0, 7.0, 6.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.95530700683594, -40.405799865722656, -38.856292724609375, -37.306785583496094, -35.75727844238281, -34.20777130126953, -32.65826416015625, -31.10875701904297, -29.559249877929688, -28.009742736816406, -26.460235595703125, -24.910728454589844, -23.361221313476562, -21.81171417236328, -20.26220703125, -18.71269989013672, -17.163192749023438, -15.613685607910156, -14.064178466796875, -12.514671325683594, -10.965164184570312, -9.415657043457031, -7.86614990234375, -6.316642761230469, -4.7671356201171875, -3.2176284790039062, -1.668121337890625, -0.11861419677734375, 1.4308929443359375, 2.9804000854492188, 4.5299072265625, 6.079414367675781, 7.6289215087890625, 9.178428649902344, 10.727935791015625, 12.277442932128906, 13.826950073242188, 15.376457214355469, 16.92596435546875, 18.47547149658203, 20.024978637695312, 21.574485778808594, 23.123992919921875, 24.673500061035156, 26.223007202148438, 27.77251434326172, 29.322021484375, 30.87152862548828, 32.42103576660156, 33.970542907714844, 35.520050048828125, 37.069557189941406, 38.61906433105469, 40.16857147216797, 41.71807861328125, 43.26758575439453, 44.81709289550781, 46.366600036621094, 47.916107177734375, 49.465614318847656, 51.01512145996094, 52.56462860107422, 54.1141357421875, 55.66364288330078, 57.21315002441406]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 18.0, 15.0, 10.0, 12.0, 21.0, 24.0, 21.0, 46.0, 34.0, 40.0, 46.0, 40.0, 26.0, 48.0, 28.0, 31.0, 47.0, 47.0, 52.0, 37.0, 36.0, 33.0, 27.0, 31.0, 33.0, 21.0, 30.0, 25.0, 16.0, 11.0, 7.0, 6.0, 6.0, 14.0, 4.0, 4.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.375732421875, -8.10302734375, -7.830322265625, -7.5576171875, -7.284912109375, -7.01220703125, -6.739501953125, -6.466796875, -6.194091796875, -5.92138671875, -5.648681640625, -5.3759765625, -5.103271484375, -4.83056640625, -4.557861328125, -4.28515625, -4.012451171875, -3.73974609375, -3.467041015625, -3.1943359375, -2.921630859375, -2.64892578125, -2.376220703125, -2.103515625, -1.830810546875, -1.55810546875, -1.285400390625, -1.0126953125, -0.739990234375, -0.46728515625, -0.194580078125, 0.078125, 0.350830078125, 0.62353515625, 0.896240234375, 1.1689453125, 1.441650390625, 1.71435546875, 1.987060546875, 2.259765625, 2.532470703125, 2.80517578125, 3.077880859375, 3.3505859375, 3.623291015625, 3.89599609375, 4.168701171875, 4.44140625, 4.714111328125, 4.98681640625, 5.259521484375, 5.5322265625, 5.804931640625, 6.07763671875, 6.350341796875, 6.623046875, 6.895751953125, 7.16845703125, 7.441162109375, 7.7138671875, 7.986572265625, 8.25927734375, 8.531982421875, 8.8046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 9.0, 13.0, 14.0, 18.0, 26.0, 47.0, 73.0, 119.0, 211.0, 379.0, 831.0, 1678.0, 4016.0, 10589.0, 36519.0, 281811.0, 2475834.0, 1247579.0, 101924.0, 20492.0, 6864.0, 2772.0, 1161.0, 576.0, 285.0, 162.0, 69.0, 56.0, 28.0, 28.0, 21.0, 9.0, 5.0, 10.0, 8.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.607177734375, -16.99560546875, -16.384033203125, -15.7724609375, -15.160888671875, -14.54931640625, -13.937744140625, -13.326171875, -12.714599609375, -12.10302734375, -11.491455078125, -10.8798828125, -10.268310546875, -9.65673828125, -9.045166015625, -8.43359375, -7.822021484375, -7.21044921875, -6.598876953125, -5.9873046875, -5.375732421875, -4.76416015625, -4.152587890625, -3.541015625, -2.929443359375, -2.31787109375, -1.706298828125, -1.0947265625, -0.483154296875, 0.12841796875, 0.739990234375, 1.3515625, 1.963134765625, 2.57470703125, 3.186279296875, 3.7978515625, 4.409423828125, 5.02099609375, 5.632568359375, 6.244140625, 6.855712890625, 7.46728515625, 8.078857421875, 8.6904296875, 9.302001953125, 9.91357421875, 10.525146484375, 11.13671875, 11.748291015625, 12.35986328125, 12.971435546875, 13.5830078125, 14.194580078125, 14.80615234375, 15.417724609375, 16.029296875, 16.640869140625, 17.25244140625, 17.864013671875, 18.4755859375, 19.087158203125, 19.69873046875, 20.310302734375, 20.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 13.0, 10.0, 8.0, 19.0, 24.0, 22.0, 21.0, 26.0, 57.0, 59.0, 72.0, 97.0, 139.0, 182.0, 291.0, 385.0, 476.0, 528.0, 484.0, 353.0, 220.0, 149.0, 98.0, 87.0, 59.0, 49.0, 27.0, 32.0, 19.0, 8.0, 13.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.36865234375, -10.9794921875, -10.59033203125, -10.201171875, -9.81201171875, -9.4228515625, -9.03369140625, -8.64453125, -8.25537109375, -7.8662109375, -7.47705078125, -7.087890625, -6.69873046875, -6.3095703125, -5.92041015625, -5.53125, -5.14208984375, -4.7529296875, -4.36376953125, -3.974609375, -3.58544921875, -3.1962890625, -2.80712890625, -2.41796875, -2.02880859375, -1.6396484375, -1.25048828125, -0.861328125, -0.47216796875, -0.0830078125, 0.30615234375, 0.6953125, 1.08447265625, 1.4736328125, 1.86279296875, 2.251953125, 2.64111328125, 3.0302734375, 3.41943359375, 3.80859375, 4.19775390625, 4.5869140625, 4.97607421875, 5.365234375, 5.75439453125, 6.1435546875, 6.53271484375, 6.921875, 7.31103515625, 7.7001953125, 8.08935546875, 8.478515625, 8.86767578125, 9.2568359375, 9.64599609375, 10.03515625, 10.42431640625, 10.8134765625, 11.20263671875, 11.591796875, 11.98095703125, 12.3701171875, 12.75927734375, 13.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 10.0, 6.0, 12.0, 20.0, 30.0, 28.0, 57.0, 63.0, 113.0, 174.0, 333.0, 624.0, 1487.0, 3482.0, 10410.0, 36931.0, 179319.0, 2119541.0, 1646334.0, 149476.0, 31126.0, 8838.0, 3092.0, 1328.0, 572.0, 304.0, 166.0, 105.0, 87.0, 50.0, 36.0, 20.0, 25.0, 17.0, 8.0, 9.0, 12.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.84375, -19.20263671875, -18.5615234375, -17.92041015625, -17.279296875, -16.63818359375, -15.9970703125, -15.35595703125, -14.71484375, -14.07373046875, -13.4326171875, -12.79150390625, -12.150390625, -11.50927734375, -10.8681640625, -10.22705078125, -9.5859375, -8.94482421875, -8.3037109375, -7.66259765625, -7.021484375, -6.38037109375, -5.7392578125, -5.09814453125, -4.45703125, -3.81591796875, -3.1748046875, -2.53369140625, -1.892578125, -1.25146484375, -0.6103515625, 0.03076171875, 0.671875, 1.31298828125, 1.9541015625, 2.59521484375, 3.236328125, 3.87744140625, 4.5185546875, 5.15966796875, 5.80078125, 6.44189453125, 7.0830078125, 7.72412109375, 8.365234375, 9.00634765625, 9.6474609375, 10.28857421875, 10.9296875, 11.57080078125, 12.2119140625, 12.85302734375, 13.494140625, 14.13525390625, 14.7763671875, 15.41748046875, 16.05859375, 16.69970703125, 17.3408203125, 17.98193359375, 18.623046875, 19.26416015625, 19.9052734375, 20.54638671875, 21.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 19.0, 44.0, 139.0, 290.0, 281.0, 151.0, 56.0, 19.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.59783935546875, -122.66924285888672, -118.74064636230469, -114.81204986572266, -110.88345336914062, -106.9548568725586, -103.02626037597656, -99.09766387939453, -95.1690673828125, -91.24047088623047, -87.31187438964844, -83.3832778930664, -79.45468139648438, -75.52608489990234, -71.59748840332031, -67.66889190673828, -63.74029541015625, -59.81169891357422, -55.88310241699219, -51.954505920410156, -48.025909423828125, -44.097312927246094, -40.16871643066406, -36.24011993408203, -32.3115234375, -28.38292694091797, -24.454330444335938, -20.525733947753906, -16.597137451171875, -12.668540954589844, -8.739944458007812, -4.811347961425781, -0.8827438354492188, 3.0458526611328125, 6.974449157714844, 10.903045654296875, 14.831642150878906, 18.760238647460938, 22.68883514404297, 26.617431640625, 30.54602813720703, 34.47462463378906, 38.403221130371094, 42.331817626953125, 46.260414123535156, 50.18901062011719, 54.11760711669922, 58.04620361328125, 61.97480010986328, 65.90339660644531, 69.83199310302734, 73.76058959960938, 77.6891860961914, 81.61778259277344, 85.54637908935547, 89.4749755859375, 93.40357208251953, 97.33216857910156, 101.2607650756836, 105.18936157226562, 109.11795806884766, 113.04655456542969, 116.97515106201172, 120.90374755859375, 124.83234405517578]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 19.0, 15.0, 12.0, 18.0, 27.0, 24.0, 28.0, 19.0, 28.0, 29.0, 31.0, 40.0, 38.0, 35.0, 44.0, 65.0, 36.0, 57.0, 39.0, 44.0, 39.0, 36.0, 31.0, 28.0, 37.0, 24.0, 18.0, 17.0, 18.0, 24.0, 10.0, 15.0, 3.0, 3.0, 10.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.79145812988281, -45.34745788574219, -43.9034538269043, -42.45945358276367, -41.01544952392578, -39.571449279785156, -38.12744903564453, -36.683448791503906, -35.239444732666016, -33.79544448852539, -32.3514404296875, -30.907440185546875, -29.463438034057617, -28.01943588256836, -26.575435638427734, -25.131433486938477, -23.68743133544922, -22.24342918395996, -20.799427032470703, -19.355426788330078, -17.91142463684082, -16.467422485351562, -15.023421287536621, -13.57942008972168, -12.135417938232422, -10.691415786743164, -9.247414588928223, -7.803412914276123, -6.359411239624023, -4.915409564971924, -3.471407890319824, -2.027406692504883, -0.583404541015625, 0.8605971336364746, 2.304598808288574, 3.748600482940674, 5.192602157592773, 6.636603832244873, 8.080605506896973, 9.524606704711914, 10.968608856201172, 12.41261100769043, 13.856612205505371, 15.300613403320312, 16.74461555480957, 18.188617706298828, 19.632617950439453, 21.07662010192871, 22.52062225341797, 23.964624404907227, 25.408626556396484, 26.85262680053711, 28.296628952026367, 29.740631103515625, 31.18463134765625, 32.628631591796875, 34.072635650634766, 35.51663589477539, 36.96063995361328, 38.404640197753906, 39.84864044189453, 41.29264450073242, 42.73664474487305, 44.18064880371094, 45.62464904785156]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 37.0, 32.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 45.0, 76.0, 100.0, 138.0, 287.0, 422.0, 621.0, 975.0, 1593.0, 2414.0, 3662.0, 5509.0, 8398.0, 12881.0, 19744.0, 29915.0, 45489.0, 69748.0, 102557.0, 142764.0, 165714.0, 139976.0, 100131.0, 67459.0, 43936.0, 29116.0, 18868.0, 12353.0, 8225.0, 5373.0, 3490.0, 2308.0, 1507.0, 924.0, 655.0, 433.0, 233.0, 173.0, 115.0, 65.0, 38.0, 25.0, 19.0, 7.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7734375, -0.7496109008789062, -0.7257843017578125, -0.7019577026367188, -0.678131103515625, -0.6543045043945312, -0.6304779052734375, -0.6066513061523438, -0.58282470703125, -0.5589981079101562, -0.5351715087890625, -0.5113449096679688, -0.487518310546875, -0.46369171142578125, -0.4398651123046875, -0.41603851318359375, -0.3922119140625, -0.36838531494140625, -0.3445587158203125, -0.32073211669921875, -0.296905517578125, -0.27307891845703125, -0.2492523193359375, -0.22542572021484375, -0.20159912109375, -0.17777252197265625, -0.1539459228515625, -0.13011932373046875, -0.106292724609375, -0.08246612548828125, -0.0586395263671875, -0.03481292724609375, -0.010986328125, 0.01284027099609375, 0.0366668701171875, 0.06049346923828125, 0.084320068359375, 0.10814666748046875, 0.1319732666015625, 0.15579986572265625, 0.17962646484375, 0.20345306396484375, 0.2272796630859375, 0.25110626220703125, 0.274932861328125, 0.29875946044921875, 0.3225860595703125, 0.34641265869140625, 0.3702392578125, 0.39406585693359375, 0.4178924560546875, 0.44171905517578125, 0.465545654296875, 0.48937225341796875, 0.5131988525390625, 0.5370254516601562, 0.56085205078125, 0.5846786499023438, 0.6085052490234375, 0.6323318481445312, 0.656158447265625, 0.6799850463867188, 0.7038116455078125, 0.7276382446289062, 0.75146484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 14.0, 13.0, 26.0, 22.0, 30.0, 33.0, 30.0, 28.0, 34.0, 40.0, 46.0, 54.0, 47.0, 44.0, 1087.0, 55.0, 54.0, 40.0, 33.0, 46.0, 30.0, 30.0, 29.0, 31.0, 24.0, 17.0, 10.0, 16.0, 13.0, 11.0, 2.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.046875, -6.83404541015625, -6.6212158203125, -6.40838623046875, -6.195556640625, -5.98272705078125, -5.7698974609375, -5.55706787109375, -5.34423828125, -5.13140869140625, -4.9185791015625, -4.70574951171875, -4.492919921875, -4.28009033203125, -4.0672607421875, -3.85443115234375, -3.6416015625, -3.42877197265625, -3.2159423828125, -3.00311279296875, -2.790283203125, -2.57745361328125, -2.3646240234375, -2.15179443359375, -1.93896484375, -1.72613525390625, -1.5133056640625, -1.30047607421875, -1.087646484375, -0.87481689453125, -0.6619873046875, -0.44915771484375, -0.236328125, -0.02349853515625, 0.1893310546875, 0.40216064453125, 0.614990234375, 0.82781982421875, 1.0406494140625, 1.25347900390625, 1.46630859375, 1.67913818359375, 1.8919677734375, 2.10479736328125, 2.317626953125, 2.53045654296875, 2.7432861328125, 2.95611572265625, 3.1689453125, 3.38177490234375, 3.5946044921875, 3.80743408203125, 4.020263671875, 4.23309326171875, 4.4459228515625, 4.65875244140625, 4.87158203125, 5.08441162109375, 5.2972412109375, 5.51007080078125, 5.722900390625, 5.93572998046875, 6.1485595703125, 6.36138916015625, 6.57421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 39.0, 72.0, 74.0, 119.0, 197.0, 319.0, 587.0, 952.0, 1558.0, 2712.0, 4492.0, 7300.0, 12253.0, 20097.0, 33125.0, 53363.0, 84543.0, 127512.0, 233118.0, 1151065.0, 131273.0, 88571.0, 55972.0, 34525.0, 21011.0, 12874.0, 7758.0, 4676.0, 2830.0, 1683.0, 893.0, 634.0, 356.0, 214.0, 140.0, 70.0, 45.0, 35.0, 17.0, 12.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.8037109375, -0.7814178466796875, -0.759124755859375, -0.7368316650390625, -0.71453857421875, -0.6922454833984375, -0.669952392578125, -0.6476593017578125, -0.6253662109375, -0.6030731201171875, -0.580780029296875, -0.5584869384765625, -0.53619384765625, -0.5139007568359375, -0.491607666015625, -0.4693145751953125, -0.447021484375, -0.4247283935546875, -0.402435302734375, -0.3801422119140625, -0.35784912109375, -0.3355560302734375, -0.313262939453125, -0.2909698486328125, -0.2686767578125, -0.2463836669921875, -0.224090576171875, -0.2017974853515625, -0.17950439453125, -0.1572113037109375, -0.134918212890625, -0.1126251220703125, -0.09033203125, -0.0680389404296875, -0.045745849609375, -0.0234527587890625, -0.00115966796875, 0.0211334228515625, 0.043426513671875, 0.0657196044921875, 0.0880126953125, 0.1103057861328125, 0.132598876953125, 0.1548919677734375, 0.17718505859375, 0.1994781494140625, 0.221771240234375, 0.2440643310546875, 0.266357421875, 0.2886505126953125, 0.310943603515625, 0.3332366943359375, 0.35552978515625, 0.3778228759765625, 0.400115966796875, 0.4224090576171875, 0.4447021484375, 0.4669952392578125, 0.489288330078125, 0.5115814208984375, 0.53387451171875, 0.5561676025390625, 0.578460693359375, 0.6007537841796875, 0.623046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 8.0, 25.0, 28.0, 33.0, 50.0, 62.0, 69.0, 90.0, 118.0, 123.0, 79.0, 55.0, 68.0, 50.0, 32.0, 20.0, 14.0, 15.0, 7.0, 5.0, 5.0, 2.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006488800048828125, -0.006296992301940918, -0.006105184555053711, -0.005913376808166504, -0.005721569061279297, -0.00552976131439209, -0.005337953567504883, -0.005146145820617676, -0.004954338073730469, -0.004762530326843262, -0.004570722579956055, -0.004378914833068848, -0.004187107086181641, -0.003995299339294434, -0.0038034915924072266, -0.0036116838455200195, -0.0034198760986328125, -0.0032280683517456055, -0.0030362606048583984, -0.0028444528579711914, -0.0026526451110839844, -0.0024608373641967773, -0.0022690296173095703, -0.0020772218704223633, -0.0018854141235351562, -0.0016936063766479492, -0.0015017986297607422, -0.0013099908828735352, -0.0011181831359863281, -0.0009263753890991211, -0.0007345676422119141, -0.000542759895324707, -0.0003509521484375, -0.00015914440155029297, 3.266334533691406e-05, 0.0002244710922241211, 0.0004162788391113281, 0.0006080865859985352, 0.0007998943328857422, 0.0009917020797729492, 0.0011835098266601562, 0.0013753175735473633, 0.0015671253204345703, 0.0017589330673217773, 0.0019507408142089844, 0.0021425485610961914, 0.0023343563079833984, 0.0025261640548706055, 0.0027179718017578125, 0.0029097795486450195, 0.0031015872955322266, 0.0032933950424194336, 0.0034852027893066406, 0.0036770105361938477, 0.0038688182830810547, 0.004060626029968262, 0.004252433776855469, 0.004444241523742676, 0.004636049270629883, 0.00482785701751709, 0.005019664764404297, 0.005211472511291504, 0.005403280258178711, 0.005595088005065918, 0.005786895751953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 13.0, 10.0, 12.0, 21.0, 30.0, 32.0, 50.0, 78.0, 130.0, 188.0, 325.0, 794.0, 23484.0, 1019948.0, 2174.0, 519.0, 234.0, 156.0, 100.0, 82.0, 44.0, 32.0, 8.0, 12.0, 9.0, 12.0, 3.0, 6.0, 1.0, 5.0, 5.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1087646484375, -0.10517406463623047, -0.10158348083496094, -0.0979928970336914, -0.09440231323242188, -0.09081172943115234, -0.08722114562988281, -0.08363056182861328, -0.08003997802734375, -0.07644939422607422, -0.07285881042480469, -0.06926822662353516, -0.06567764282226562, -0.062087059020996094, -0.05849647521972656, -0.05490589141845703, -0.0513153076171875, -0.04772472381591797, -0.04413414001464844, -0.040543556213378906, -0.036952972412109375, -0.033362388610839844, -0.029771804809570312, -0.02618122100830078, -0.02259063720703125, -0.01900005340576172, -0.015409469604492188, -0.011818885803222656, -0.008228302001953125, -0.004637718200683594, -0.0010471343994140625, 0.0025434494018554688, 0.006134033203125, 0.009724617004394531, 0.013315200805664062, 0.016905784606933594, 0.020496368408203125, 0.024086952209472656, 0.027677536010742188, 0.03126811981201172, 0.03485870361328125, 0.03844928741455078, 0.04203987121582031, 0.045630455017089844, 0.049221038818359375, 0.052811622619628906, 0.05640220642089844, 0.05999279022216797, 0.0635833740234375, 0.06717395782470703, 0.07076454162597656, 0.0743551254272461, 0.07794570922851562, 0.08153629302978516, 0.08512687683105469, 0.08871746063232422, 0.09230804443359375, 0.09589862823486328, 0.09948921203613281, 0.10307979583740234, 0.10667037963867188, 0.1102609634399414, 0.11385154724121094, 0.11744213104248047, 0.12103271484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 63.0, 697.0, 237.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02969544380903244, -0.029085952788591385, -0.02847646363079548, -0.027866972610354424, -0.027257483452558517, -0.026647992432117462, -0.026038503274321556, -0.0254290122538805, -0.024819523096084595, -0.02421003207564354, -0.023600542917847633, -0.022991051897406578, -0.022381562739610672, -0.021772071719169617, -0.02116258256137371, -0.020553091540932655, -0.01994360238313675, -0.019334111362695694, -0.018724622204899788, -0.018115131184458733, -0.017505642026662827, -0.01689615100622177, -0.016286661848425865, -0.01567717082798481, -0.015067679807543755, -0.014458189718425274, -0.013848699629306793, -0.013239209540188313, -0.012629719451069832, -0.012020229361951351, -0.01141073927283287, -0.010801248252391815, -0.010191758163273335, -0.009582268074154854, -0.008972777985036373, -0.008363287895917892, -0.007753797806799412, -0.007144307717680931, -0.006534817162901163, -0.005925327073782682, -0.005315836984664202, -0.004706346895545721, -0.00409685680642724, -0.003487366484478116, -0.0028778763953596354, -0.0022683863062411547, -0.0016588959842920303, -0.0010494058951735497, -0.00043991580605506897, 0.00016957434127107263, 0.0007790644885972142, 0.0013885546941310167, 0.0019980447832494974, 0.002607534872367978, 0.0032170251943171024, 0.003826515283435583, 0.004436005372554064, 0.0050454954616725445, 0.005654985550791025, 0.006264476105570793, 0.006873966194689274, 0.0074834562838077545, 0.008092946372926235, 0.008702436462044716, 0.009311926551163197]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 12.0, 3.0, 7.0, 12.0, 11.0, 8.0, 10.0, 16.0, 16.0, 19.0, 23.0, 25.0, 34.0, 25.0, 31.0, 33.0, 32.0, 38.0, 44.0, 38.0, 46.0, 29.0, 34.0, 43.0, 44.0, 43.0, 35.0, 30.0, 43.0, 33.0, 26.0, 22.0, 21.0, 18.0, 17.0, 16.0, 15.0, 8.0, 6.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020622611045837402, -0.001985718496143818, -0.0019091758877038956, -0.0018326332792639732, -0.001756090670824051, -0.0016795480623841286, -0.0016030054539442062, -0.001526462845504284, -0.0014499202370643616, -0.0013733776286244392, -0.001296835020184517, -0.0012202924117445946, -0.0011437498033046722, -0.00106720719486475, -0.0009906645864248276, -0.0009141219779849052, -0.0008375793695449829, -0.0007610367611050606, -0.0006844941526651382, -0.0006079515442252159, -0.0005314089357852936, -0.00045486632734537125, -0.0003783237189054489, -0.0003017811104655266, -0.00022523850202560425, -0.00014869589358568192, -7.215328514575958e-05, 4.38932329416275e-06, 8.093193173408508e-05, 0.00015747454017400742, 0.00023401714861392975, 0.0003105597570538521, 0.0003871023654937744, 0.00046364497393369675, 0.0005401875823736191, 0.0006167301908135414, 0.0006932727992534637, 0.0007698154076933861, 0.0008463580161333084, 0.0009229006245732307, 0.000999443233013153, 0.0010759858414530754, 0.0011525284498929977, 0.00122907105833292, 0.0013056136667728424, 0.0013821562752127647, 0.001458698883652687, 0.0015352414920926094, 0.0016117841005325317, 0.001688326708972454, 0.0017648693174123764, 0.0018414119258522987, 0.001917954534292221, 0.0019944971427321434, 0.0020710397511720657, 0.002147582359611988, 0.0022241249680519104, 0.0023006675764918327, 0.002377210184931755, 0.0024537527933716774, 0.0025302954018115997, 0.002606838010251522, 0.0026833806186914444, 0.0027599232271313667, 0.002836465835571289]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 36.0, 33.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 9.0, 12.0, 20.0, 24.0, 36.0, 46.0, 63.0, 73.0, 103.0, 152.0, 177.0, 276.0, 378.0, 535.0, 809.0, 1350.0, 2199.0, 4275.0, 8286.0, 17543.0, 39348.0, 94978.0, 310848.0, 370471.0, 111253.0, 44667.0, 19946.0, 9313.0, 4657.0, 2453.0, 1409.0, 865.0, 559.0, 376.0, 250.0, 195.0, 141.0, 96.0, 99.0, 68.0, 59.0, 33.0, 28.0, 19.0, 14.0, 8.0, 11.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.7265625, -9.42333984375, -9.1201171875, -8.81689453125, -8.513671875, -8.21044921875, -7.9072265625, -7.60400390625, -7.30078125, -6.99755859375, -6.6943359375, -6.39111328125, -6.087890625, -5.78466796875, -5.4814453125, -5.17822265625, -4.875, -4.57177734375, -4.2685546875, -3.96533203125, -3.662109375, -3.35888671875, -3.0556640625, -2.75244140625, -2.44921875, -2.14599609375, -1.8427734375, -1.53955078125, -1.236328125, -0.93310546875, -0.6298828125, -0.32666015625, -0.0234375, 0.27978515625, 0.5830078125, 0.88623046875, 1.189453125, 1.49267578125, 1.7958984375, 2.09912109375, 2.40234375, 2.70556640625, 3.0087890625, 3.31201171875, 3.615234375, 3.91845703125, 4.2216796875, 4.52490234375, 4.828125, 5.13134765625, 5.4345703125, 5.73779296875, 6.041015625, 6.34423828125, 6.6474609375, 6.95068359375, 7.25390625, 7.55712890625, 7.8603515625, 8.16357421875, 8.466796875, 8.77001953125, 9.0732421875, 9.37646484375, 9.6796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 5.0, 7.0, 11.0, 17.0, 12.0, 13.0, 24.0, 18.0, 36.0, 35.0, 29.0, 24.0, 49.0, 52.0, 67.0, 80.0, 151.0, 1480.0, 314.0, 124.0, 75.0, 48.0, 40.0, 40.0, 41.0, 33.0, 31.0, 26.0, 24.0, 14.0, 18.0, 24.0, 14.0, 6.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.134521484375, -16.47216796875, -15.809814453125, -15.1474609375, -14.485107421875, -13.82275390625, -13.160400390625, -12.498046875, -11.835693359375, -11.17333984375, -10.510986328125, -9.8486328125, -9.186279296875, -8.52392578125, -7.861572265625, -7.19921875, -6.536865234375, -5.87451171875, -5.212158203125, -4.5498046875, -3.887451171875, -3.22509765625, -2.562744140625, -1.900390625, -1.238037109375, -0.57568359375, 0.086669921875, 0.7490234375, 1.411376953125, 2.07373046875, 2.736083984375, 3.3984375, 4.060791015625, 4.72314453125, 5.385498046875, 6.0478515625, 6.710205078125, 7.37255859375, 8.034912109375, 8.697265625, 9.359619140625, 10.02197265625, 10.684326171875, 11.3466796875, 12.009033203125, 12.67138671875, 13.333740234375, 13.99609375, 14.658447265625, 15.32080078125, 15.983154296875, 16.6455078125, 17.307861328125, 17.97021484375, 18.632568359375, 19.294921875, 19.957275390625, 20.61962890625, 21.281982421875, 21.9443359375, 22.606689453125, 23.26904296875, 23.931396484375, 24.59375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 17.0, 13.0, 21.0, 25.0, 29.0, 41.0, 70.0, 91.0, 165.0, 250.0, 450.0, 1363.0, 18100.0, 2900034.0, 218769.0, 4581.0, 736.0, 316.0, 203.0, 118.0, 72.0, 52.0, 51.0, 39.0, 29.0, 15.0, 11.0, 7.0, 11.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.90625, -41.30419921875, -39.7021484375, -38.10009765625, -36.498046875, -34.89599609375, -33.2939453125, -31.69189453125, -30.08984375, -28.48779296875, -26.8857421875, -25.28369140625, -23.681640625, -22.07958984375, -20.4775390625, -18.87548828125, -17.2734375, -15.67138671875, -14.0693359375, -12.46728515625, -10.865234375, -9.26318359375, -7.6611328125, -6.05908203125, -4.45703125, -2.85498046875, -1.2529296875, 0.34912109375, 1.951171875, 3.55322265625, 5.1552734375, 6.75732421875, 8.359375, 9.96142578125, 11.5634765625, 13.16552734375, 14.767578125, 16.36962890625, 17.9716796875, 19.57373046875, 21.17578125, 22.77783203125, 24.3798828125, 25.98193359375, 27.583984375, 29.18603515625, 30.7880859375, 32.39013671875, 33.9921875, 35.59423828125, 37.1962890625, 38.79833984375, 40.400390625, 42.00244140625, 43.6044921875, 45.20654296875, 46.80859375, 48.41064453125, 50.0126953125, 51.61474609375, 53.216796875, 54.81884765625, 56.4208984375, 58.02294921875, 59.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 33.0, 93.0, 286.0, 353.0, 184.0, 46.0, 14.0, 2.0, 3.0, 1.0], "bins": [-146.693359375, -144.13621520996094, -141.5790557861328, -139.02191162109375, -136.46475219726562, -133.90760803222656, -131.3504638671875, -128.79330444335938, -126.23616027832031, -123.67900848388672, -121.12185668945312, -118.56471252441406, -116.00756072998047, -113.45040893554688, -110.89325714111328, -108.33610534667969, -105.7789535522461, -103.2218017578125, -100.6646499633789, -98.10750579833984, -95.55035400390625, -92.99320220947266, -90.43605041503906, -87.87889862060547, -85.32174682617188, -82.76459503173828, -80.20744323730469, -77.65029907226562, -75.09314727783203, -72.53599548339844, -69.97884368896484, -67.42169189453125, -64.86454010009766, -62.30738830566406, -59.750240325927734, -57.19308853149414, -54.63594055175781, -52.07878875732422, -49.521636962890625, -46.96448516845703, -44.40734100341797, -41.850189208984375, -39.29304122924805, -36.73588943481445, -34.178741455078125, -31.62158966064453, -29.064437866210938, -26.507287979125977, -23.950136184692383, -21.392986297607422, -18.835834503173828, -16.278684616088867, -13.721534729003906, -11.164384841918945, -8.607234001159668, -6.050083160400391, -3.4929332733154297, -0.9357829093933105, 1.6213674545288086, 4.178517818450928, 6.735668182373047, 9.292818069458008, 11.849968910217285, 14.407119750976562, 16.964269638061523]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 11.0, 7.0, 10.0, 9.0, 7.0, 13.0, 16.0, 21.0, 26.0, 25.0, 23.0, 30.0, 40.0, 31.0, 31.0, 37.0, 36.0, 39.0, 47.0, 41.0, 34.0, 41.0, 41.0, 38.0, 31.0, 32.0, 35.0, 33.0, 23.0, 26.0, 23.0, 12.0, 16.0, 14.0, 20.0, 16.0, 8.0, 10.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-48.311767578125, -46.86762237548828, -45.4234733581543, -43.97932434082031, -42.535179138183594, -41.091033935546875, -39.64688491821289, -38.202735900878906, -36.75859069824219, -35.31444549560547, -33.870296478271484, -32.4261474609375, -30.98200225830078, -29.53785514831543, -28.093708038330078, -26.649560928344727, -25.205413818359375, -23.761266708374023, -22.317119598388672, -20.87297248840332, -19.42882537841797, -17.984678268432617, -16.540531158447266, -15.096384048461914, -13.652236938476562, -12.208089828491211, -10.76394271850586, -9.319795608520508, -7.875648498535156, -6.431501388549805, -4.987354278564453, -3.5432071685791016, -2.09906005859375, -0.6549129486083984, 0.7892341613769531, 2.2333812713623047, 3.6775283813476562, 5.121675491333008, 6.565822601318359, 8.009969711303711, 9.454116821289062, 10.898263931274414, 12.342411041259766, 13.786558151245117, 15.230705261230469, 16.67485237121582, 18.118999481201172, 19.563146591186523, 21.007293701171875, 22.451440811157227, 23.895587921142578, 25.33973503112793, 26.78388214111328, 28.228029251098633, 29.672176361083984, 31.116323471069336, 32.56047058105469, 34.004615783691406, 35.44876480102539, 36.892913818359375, 38.337059020996094, 39.78120422363281, 41.2253532409668, 42.66950225830078, 44.1136474609375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 12.0, 11.0, 12.0, 10.0, 3.0, 12.0, 5.0, 21.0, 22.0, 26.0, 30.0, 20.0, 33.0, 39.0, 27.0, 29.0, 38.0, 37.0, 32.0, 42.0, 49.0, 39.0, 54.0, 35.0, 33.0, 31.0, 36.0, 19.0, 29.0, 27.0, 20.0, 18.0, 12.0, 17.0, 16.0, 9.0, 19.0, 9.0, 13.0, 2.0, 6.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.15625, -7.90435791015625, -7.6524658203125, -7.40057373046875, -7.148681640625, -6.89678955078125, -6.6448974609375, -6.39300537109375, -6.14111328125, -5.88922119140625, -5.6373291015625, -5.38543701171875, -5.133544921875, -4.88165283203125, -4.6297607421875, -4.37786865234375, -4.1259765625, -3.87408447265625, -3.6221923828125, -3.37030029296875, -3.118408203125, -2.86651611328125, -2.6146240234375, -2.36273193359375, -2.11083984375, -1.85894775390625, -1.6070556640625, -1.35516357421875, -1.103271484375, -0.85137939453125, -0.5994873046875, -0.34759521484375, -0.095703125, 0.15618896484375, 0.4080810546875, 0.65997314453125, 0.911865234375, 1.16375732421875, 1.4156494140625, 1.66754150390625, 1.91943359375, 2.17132568359375, 2.4232177734375, 2.67510986328125, 2.927001953125, 3.17889404296875, 3.4307861328125, 3.68267822265625, 3.9345703125, 4.18646240234375, 4.4383544921875, 4.69024658203125, 4.942138671875, 5.19403076171875, 5.4459228515625, 5.69781494140625, 5.94970703125, 6.20159912109375, 6.4534912109375, 6.70538330078125, 6.957275390625, 7.20916748046875, 7.4610595703125, 7.71295166015625, 7.96484375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 4.0, 14.0, 14.0, 19.0, 27.0, 44.0, 33.0, 58.0, 73.0, 108.0, 144.0, 179.0, 252.0, 362.0, 416.0, 3142.0, 4176288.0, 11109.0, 553.0, 359.0, 258.0, 198.0, 142.0, 105.0, 76.0, 64.0, 35.0, 42.0, 24.0, 21.0, 21.0, 14.0, 8.0, 9.0, 9.0, 8.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.5, -144.451171875, -139.40234375, -134.353515625, -129.3046875, -124.255859375, -119.20703125, -114.158203125, -109.109375, -104.060546875, -99.01171875, -93.962890625, -88.9140625, -83.865234375, -78.81640625, -73.767578125, -68.71875, -63.669921875, -58.62109375, -53.572265625, -48.5234375, -43.474609375, -38.42578125, -33.376953125, -28.328125, -23.279296875, -18.23046875, -13.181640625, -8.1328125, -3.083984375, 1.96484375, 7.013671875, 12.0625, 17.111328125, 22.16015625, 27.208984375, 32.2578125, 37.306640625, 42.35546875, 47.404296875, 52.453125, 57.501953125, 62.55078125, 67.599609375, 72.6484375, 77.697265625, 82.74609375, 87.794921875, 92.84375, 97.892578125, 102.94140625, 107.990234375, 113.0390625, 118.087890625, 123.13671875, 128.185546875, 133.234375, 138.283203125, 143.33203125, 148.380859375, 153.4296875, 158.478515625, 163.52734375, 168.576171875, 173.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 19.0, 21.0, 24.0, 49.0, 63.0, 94.0, 126.0, 226.0, 384.0, 682.0, 854.0, 585.0, 348.0, 170.0, 129.0, 84.0, 57.0, 32.0, 40.0, 22.0, 12.0, 12.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.990966796875, -18.40380859375, -17.816650390625, -17.2294921875, -16.642333984375, -16.05517578125, -15.468017578125, -14.880859375, -14.293701171875, -13.70654296875, -13.119384765625, -12.5322265625, -11.945068359375, -11.35791015625, -10.770751953125, -10.18359375, -9.596435546875, -9.00927734375, -8.422119140625, -7.8349609375, -7.247802734375, -6.66064453125, -6.073486328125, -5.486328125, -4.899169921875, -4.31201171875, -3.724853515625, -3.1376953125, -2.550537109375, -1.96337890625, -1.376220703125, -0.7890625, -0.201904296875, 0.38525390625, 0.972412109375, 1.5595703125, 2.146728515625, 2.73388671875, 3.321044921875, 3.908203125, 4.495361328125, 5.08251953125, 5.669677734375, 6.2568359375, 6.843994140625, 7.43115234375, 8.018310546875, 8.60546875, 9.192626953125, 9.77978515625, 10.366943359375, 10.9541015625, 11.541259765625, 12.12841796875, 12.715576171875, 13.302734375, 13.889892578125, 14.47705078125, 15.064208984375, 15.6513671875, 16.238525390625, 16.82568359375, 17.412841796875, 18.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 19.0, 16.0, 18.0, 16.0, 16.0, 28.0, 37.0, 45.0, 52.0, 80.0, 148.0, 465.0, 7015.0, 3826648.0, 356646.0, 2273.0, 315.0, 103.0, 51.0, 47.0, 33.0, 37.0, 29.0, 27.0, 19.0, 10.0, 8.0, 12.0, 7.0, 11.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.875, -78.1650390625, -75.455078125, -72.7451171875, -70.03515625, -67.3251953125, -64.615234375, -61.9052734375, -59.1953125, -56.4853515625, -53.775390625, -51.0654296875, -48.35546875, -45.6455078125, -42.935546875, -40.2255859375, -37.515625, -34.8056640625, -32.095703125, -29.3857421875, -26.67578125, -23.9658203125, -21.255859375, -18.5458984375, -15.8359375, -13.1259765625, -10.416015625, -7.7060546875, -4.99609375, -2.2861328125, 0.423828125, 3.1337890625, 5.84375, 8.5537109375, 11.263671875, 13.9736328125, 16.68359375, 19.3935546875, 22.103515625, 24.8134765625, 27.5234375, 30.2333984375, 32.943359375, 35.6533203125, 38.36328125, 41.0732421875, 43.783203125, 46.4931640625, 49.203125, 51.9130859375, 54.623046875, 57.3330078125, 60.04296875, 62.7529296875, 65.462890625, 68.1728515625, 70.8828125, 73.5927734375, 76.302734375, 79.0126953125, 81.72265625, 84.4326171875, 87.142578125, 89.8525390625, 92.5625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 20.0, 52.0, 135.0, 229.0, 230.0, 194.0, 85.0, 50.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.47761535644531, -99.20384216308594, -95.93006896972656, -92.65629577636719, -89.38252258300781, -86.10874938964844, -82.83497619628906, -79.56120300292969, -76.28742980957031, -73.01365661621094, -69.73988342285156, -66.46611022949219, -63.19233703613281, -59.91856384277344, -56.6447868347168, -53.37101364135742, -50.09723663330078, -46.823463439941406, -43.54969024658203, -40.275917053222656, -37.00214385986328, -33.728370666503906, -30.454593658447266, -27.18082046508789, -23.907047271728516, -20.63327407836914, -17.359500885009766, -14.085725784301758, -10.811952590942383, -7.538179397583008, -4.264404296875, -0.990631103515625, 2.2831497192382812, 5.5569233894348145, 8.830697059631348, 12.104471206665039, 15.378244400024414, 18.65201759338379, 21.925792694091797, 25.199565887451172, 28.473339080810547, 31.747112274169922, 35.0208854675293, 38.29466247558594, 41.56843566894531, 44.84220886230469, 48.11598205566406, 51.38975524902344, 54.66352844238281, 57.93730163574219, 61.21107482910156, 64.48484802246094, 67.75862121582031, 71.03239440917969, 74.30616760253906, 77.57994079589844, 80.85371398925781, 84.12748718261719, 87.40126037597656, 90.67503356933594, 93.94880676269531, 97.22257995605469, 100.49635314941406, 103.77012634277344, 107.04390716552734]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 3.0, 4.0, 5.0, 13.0, 13.0, 16.0, 19.0, 17.0, 18.0, 22.0, 23.0, 27.0, 36.0, 42.0, 33.0, 54.0, 41.0, 54.0, 42.0, 42.0, 42.0, 49.0, 51.0, 35.0, 28.0, 31.0, 25.0, 32.0, 24.0, 18.0, 29.0, 15.0, 15.0, 14.0, 15.0, 13.0, 11.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.605979919433594, -45.07762908935547, -43.54928207397461, -42.020931243896484, -40.49258041381836, -38.964229583740234, -37.435882568359375, -35.90753173828125, -34.379180908203125, -32.850830078125, -31.322481155395508, -29.794132232666016, -28.26578140258789, -26.7374324798584, -25.209083557128906, -23.68073272705078, -22.15238380432129, -20.624034881591797, -19.095684051513672, -17.56733512878418, -16.038984298706055, -14.510635375976562, -12.982285499572754, -11.453935623168945, -9.925585746765137, -8.397235870361328, -6.8688859939575195, -5.340536594390869, -3.8121867179870605, -2.283836841583252, -0.7554874420166016, 0.772862434387207, 2.3012123107910156, 3.829562187194824, 5.357912063598633, 6.886261463165283, 8.41461181640625, 9.942960739135742, 11.47131061553955, 12.99966049194336, 14.528010368347168, 16.056360244750977, 17.58470916748047, 19.113059997558594, 20.641408920288086, 22.16975975036621, 23.698108673095703, 25.226459503173828, 26.75480842590332, 28.283157348632812, 29.811508178710938, 31.33985710144043, 32.86820602416992, 34.39655685424805, 35.92490768432617, 37.45325469970703, 38.981605529785156, 40.50995635986328, 42.03830337524414, 43.566654205322266, 45.09500503540039, 46.623355865478516, 48.151702880859375, 49.6800537109375, 51.208404541015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 30.0, 39.0, 56.0, 82.0, 127.0, 220.0, 274.0, 389.0, 586.0, 884.0, 1306.0, 1933.0, 2793.0, 4259.0, 6228.0, 9150.0, 14096.0, 20973.0, 32139.0, 49192.0, 74998.0, 110500.0, 148374.0, 161428.0, 132301.0, 93210.0, 62298.0, 40583.0, 26800.0, 17650.0, 11721.0, 7725.0, 5175.0, 3566.0, 2366.0, 1613.0, 1123.0, 714.0, 519.0, 333.0, 236.0, 159.0, 122.0, 75.0, 51.0, 33.0, 33.0, 15.0, 15.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.72021484375, -0.6971893310546875, -0.674163818359375, -0.6511383056640625, -0.62811279296875, -0.6050872802734375, -0.582061767578125, -0.5590362548828125, -0.5360107421875, -0.5129852294921875, -0.489959716796875, -0.4669342041015625, -0.44390869140625, -0.4208831787109375, -0.397857666015625, -0.3748321533203125, -0.351806640625, -0.3287811279296875, -0.305755615234375, -0.2827301025390625, -0.25970458984375, -0.2366790771484375, -0.213653564453125, -0.1906280517578125, -0.1676025390625, -0.1445770263671875, -0.121551513671875, -0.0985260009765625, -0.07550048828125, -0.0524749755859375, -0.029449462890625, -0.0064239501953125, 0.0166015625, 0.0396270751953125, 0.062652587890625, 0.0856781005859375, 0.10870361328125, 0.1317291259765625, 0.154754638671875, 0.1777801513671875, 0.2008056640625, 0.2238311767578125, 0.246856689453125, 0.2698822021484375, 0.29290771484375, 0.3159332275390625, 0.338958740234375, 0.3619842529296875, 0.385009765625, 0.4080352783203125, 0.431060791015625, 0.4540863037109375, 0.47711181640625, 0.5001373291015625, 0.523162841796875, 0.5461883544921875, 0.5692138671875, 0.5922393798828125, 0.615264892578125, 0.6382904052734375, 0.66131591796875, 0.6843414306640625, 0.707366943359375, 0.7303924560546875, 0.75341796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 16.0, 19.0, 18.0, 24.0, 19.0, 33.0, 43.0, 40.0, 38.0, 46.0, 46.0, 36.0, 52.0, 1063.0, 61.0, 42.0, 44.0, 33.0, 38.0, 34.0, 36.0, 33.0, 24.0, 24.0, 23.0, 18.0, 13.0, 11.0, 10.0, 8.0, 2.0, 11.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-7.29296875, -7.09478759765625, -6.8966064453125, -6.69842529296875, -6.500244140625, -6.30206298828125, -6.1038818359375, -5.90570068359375, -5.70751953125, -5.50933837890625, -5.3111572265625, -5.11297607421875, -4.914794921875, -4.71661376953125, -4.5184326171875, -4.32025146484375, -4.1220703125, -3.92388916015625, -3.7257080078125, -3.52752685546875, -3.329345703125, -3.13116455078125, -2.9329833984375, -2.73480224609375, -2.53662109375, -2.33843994140625, -2.1402587890625, -1.94207763671875, -1.743896484375, -1.54571533203125, -1.3475341796875, -1.14935302734375, -0.951171875, -0.75299072265625, -0.5548095703125, -0.35662841796875, -0.158447265625, 0.03973388671875, 0.2379150390625, 0.43609619140625, 0.63427734375, 0.83245849609375, 1.0306396484375, 1.22882080078125, 1.427001953125, 1.62518310546875, 1.8233642578125, 2.02154541015625, 2.2197265625, 2.41790771484375, 2.6160888671875, 2.81427001953125, 3.012451171875, 3.21063232421875, 3.4088134765625, 3.60699462890625, 3.80517578125, 4.00335693359375, 4.2015380859375, 4.39971923828125, 4.597900390625, 4.79608154296875, 4.9942626953125, 5.19244384765625, 5.390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 22.0, 29.0, 42.0, 91.0, 137.0, 201.0, 328.0, 559.0, 882.0, 1479.0, 2350.0, 3786.0, 6270.0, 9840.0, 15555.0, 24569.0, 38407.0, 60681.0, 92453.0, 130781.0, 1206477.0, 158106.0, 118844.0, 81881.0, 52651.0, 33791.0, 21154.0, 13419.0, 8306.0, 5426.0, 3288.0, 2038.0, 1281.0, 754.0, 502.0, 286.0, 173.0, 115.0, 61.0, 37.0, 26.0, 11.0, 11.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6257095336914062, -0.6054229736328125, -0.5851364135742188, -0.564849853515625, -0.5445632934570312, -0.5242767333984375, -0.5039901733398438, -0.48370361328125, -0.46341705322265625, -0.4431304931640625, -0.42284393310546875, -0.402557373046875, -0.38227081298828125, -0.3619842529296875, -0.34169769287109375, -0.3214111328125, -0.30112457275390625, -0.2808380126953125, -0.26055145263671875, -0.240264892578125, -0.21997833251953125, -0.1996917724609375, -0.17940521240234375, -0.15911865234375, -0.13883209228515625, -0.1185455322265625, -0.09825897216796875, -0.077972412109375, -0.05768585205078125, -0.0373992919921875, -0.01711273193359375, 0.003173828125, 0.02346038818359375, 0.0437469482421875, 0.06403350830078125, 0.084320068359375, 0.10460662841796875, 0.1248931884765625, 0.14517974853515625, 0.16546630859375, 0.18575286865234375, 0.2060394287109375, 0.22632598876953125, 0.246612548828125, 0.26689910888671875, 0.2871856689453125, 0.30747222900390625, 0.3277587890625, 0.34804534912109375, 0.3683319091796875, 0.38861846923828125, 0.408905029296875, 0.42919158935546875, 0.4494781494140625, 0.46976470947265625, 0.49005126953125, 0.5103378295898438, 0.5306243896484375, 0.5509109497070312, 0.571197509765625, 0.5914840698242188, 0.6117706298828125, 0.6320571899414062, 0.65234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 4.0, 3.0, 11.0, 10.0, 12.0, 18.0, 9.0, 18.0, 20.0, 31.0, 33.0, 29.0, 35.0, 27.0, 53.0, 62.0, 59.0, 60.0, 64.0, 53.0, 68.0, 44.0, 38.0, 43.0, 22.0, 26.0, 21.0, 22.0, 18.0, 6.0, 14.0, 8.0, 8.0, 4.0, 1.0, 9.0, 4.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0036296844482421875, -0.0035242438316345215, -0.0034188032150268555, -0.0033133625984191895, -0.0032079219818115234, -0.0031024813652038574, -0.0029970407485961914, -0.0028916001319885254, -0.0027861595153808594, -0.0026807188987731934, -0.0025752782821655273, -0.0024698376655578613, -0.0023643970489501953, -0.0022589564323425293, -0.0021535158157348633, -0.0020480751991271973, -0.0019426345825195312, -0.0018371939659118652, -0.0017317533493041992, -0.0016263127326965332, -0.0015208721160888672, -0.0014154314994812012, -0.0013099908828735352, -0.0012045502662658691, -0.0010991096496582031, -0.0009936690330505371, -0.0008882284164428711, -0.0007827877998352051, -0.0006773471832275391, -0.000571906566619873, -0.00046646595001220703, -0.000361025333404541, -0.000255584716796875, -0.00015014410018920898, -4.470348358154297e-05, 6.073713302612305e-05, 0.00016617774963378906, 0.0002716183662414551, 0.0003770589828491211, 0.0004824995994567871, 0.0005879402160644531, 0.0006933808326721191, 0.0007988214492797852, 0.0009042620658874512, 0.0010097026824951172, 0.0011151432991027832, 0.0012205839157104492, 0.0013260245323181152, 0.0014314651489257812, 0.0015369057655334473, 0.0016423463821411133, 0.0017477869987487793, 0.0018532276153564453, 0.0019586682319641113, 0.0020641088485717773, 0.0021695494651794434, 0.0022749900817871094, 0.0023804306983947754, 0.0024858713150024414, 0.0025913119316101074, 0.0026967525482177734, 0.0028021931648254395, 0.0029076337814331055, 0.0030130743980407715, 0.0031185150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 12.0, 6.0, 8.0, 9.0, 16.0, 17.0, 16.0, 28.0, 49.0, 58.0, 60.0, 95.0, 118.0, 143.0, 209.0, 380.0, 636.0, 2082.0, 183891.0, 852706.0, 5818.0, 755.0, 423.0, 270.0, 159.0, 107.0, 98.0, 68.0, 53.0, 43.0, 32.0, 34.0, 27.0, 18.0, 19.0, 12.0, 8.0, 13.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05596590042114258, -0.053978919982910156, -0.051991939544677734, -0.05000495910644531, -0.04801797866821289, -0.04603099822998047, -0.04404401779174805, -0.042057037353515625, -0.0400700569152832, -0.03808307647705078, -0.03609609603881836, -0.03410911560058594, -0.032122135162353516, -0.030135154724121094, -0.028148174285888672, -0.02616119384765625, -0.024174213409423828, -0.022187232971191406, -0.020200252532958984, -0.018213272094726562, -0.01622629165649414, -0.014239311218261719, -0.012252330780029297, -0.010265350341796875, -0.008278369903564453, -0.006291389465332031, -0.004304409027099609, -0.0023174285888671875, -0.0003304481506347656, 0.0016565322875976562, 0.003643512725830078, 0.0056304931640625, 0.007617473602294922, 0.009604454040527344, 0.011591434478759766, 0.013578414916992188, 0.01556539535522461, 0.01755237579345703, 0.019539356231689453, 0.021526336669921875, 0.023513317108154297, 0.02550029754638672, 0.02748727798461914, 0.029474258422851562, 0.031461238861083984, 0.033448219299316406, 0.03543519973754883, 0.03742218017578125, 0.03940916061401367, 0.041396141052246094, 0.043383121490478516, 0.04537010192871094, 0.04735708236694336, 0.04934406280517578, 0.0513310432434082, 0.053318023681640625, 0.05530500411987305, 0.05729198455810547, 0.05927896499633789, 0.06126594543457031, 0.06325292587280273, 0.06523990631103516, 0.06722688674926758, 0.0692138671875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 56.0, 357.0, 415.0, 129.0, 36.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01804562658071518, -0.01769249700009823, -0.017339367419481277, -0.016986237838864326, -0.016633108258247375, -0.016279976814985275, -0.015926849097013474, -0.015573718585073948, -0.015220588073134422, -0.014867458492517471, -0.01451432891190052, -0.01416119933128357, -0.013808068819344044, -0.013454939238727093, -0.013101809658110142, -0.01274868007749319, -0.01239555049687624, -0.012042420916259289, -0.011689291335642338, -0.011336160823702812, -0.010983031243085861, -0.01062990166246891, -0.01027677208185196, -0.009923642501235008, -0.009570512920618057, -0.009217383340001106, -0.008864253759384155, -0.008511124178767204, -0.008157993666827679, -0.007804864086210728, -0.007451734505593777, -0.007098604924976826, -0.006745473947376013, -0.006392344366759062, -0.0060392143204808235, -0.0056860847398638725, -0.0053329551592469215, -0.004979825112968683, -0.004626695532351732, -0.004273565486073494, -0.003920435905456543, -0.0035673060920089483, -0.0032141762785613537, -0.0028610466979444027, -0.002507916884496808, -0.0021547870710492134, -0.0018016574904322624, -0.0014485276769846678, -0.0010953978635370731, -0.0007422681082971394, -0.0003891383530572057, -3.600865602493286e-05, 0.0003171211574226618, 0.0006702509708702564, 0.0010233805514872074, 0.001376510364934802, 0.0017296401783823967, 0.0020827699918299913, 0.002435899805277586, 0.002789029385894537, 0.0031421591993421316, 0.0034952890127897263, 0.0038484185934066772, 0.004201548174023628, 0.0045546782203018665]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 5.0, 11.0, 15.0, 14.0, 21.0, 15.0, 14.0, 27.0, 10.0, 33.0, 30.0, 29.0, 33.0, 33.0, 23.0, 48.0, 34.0, 39.0, 34.0, 33.0, 35.0, 34.0, 36.0, 44.0, 38.0, 36.0, 25.0, 30.0, 20.0, 20.0, 24.0, 24.0, 15.0, 18.0, 18.0, 11.0, 8.0, 11.0, 5.0, 2.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0018517374992370605, -0.0017941063269972801, -0.0017364751547574997, -0.0016788439825177193, -0.0016212128102779388, -0.0015635816380381584, -0.001505950465798378, -0.0014483192935585976, -0.0013906881213188171, -0.0013330569490790367, -0.0012754257768392563, -0.0012177946045994759, -0.0011601634323596954, -0.001102532260119915, -0.0010449010878801346, -0.0009872699156403542, -0.0009296387434005737, -0.0008720075711607933, -0.0008143763989210129, -0.0007567452266812325, -0.000699114054441452, -0.0006414828822016716, -0.0005838517099618912, -0.0005262205377221107, -0.0004685893654823303, -0.0004109581932425499, -0.00035332702100276947, -0.00029569584876298904, -0.00023806467652320862, -0.0001804335042834282, -0.00012280233204364777, -6.517115980386734e-05, -7.539987564086914e-06, 5.009118467569351e-05, 0.00010772235691547394, 0.00016535352915525436, 0.0002229847013950348, 0.0002806158736348152, 0.00033824704587459564, 0.00039587821811437607, 0.0004535093903541565, 0.0005111405625939369, 0.0005687717348337173, 0.0006264029070734978, 0.0006840340793132782, 0.0007416652515530586, 0.000799296423792839, 0.0008569275960326195, 0.0009145587682723999, 0.0009721899405121803, 0.0010298211127519608, 0.0010874522849917412, 0.0011450834572315216, 0.001202714629471302, 0.0012603458017110825, 0.0013179769739508629, 0.0013756081461906433, 0.0014332393184304237, 0.0014908704906702042, 0.0015485016629099846, 0.001606132835149765, 0.0016637640073895454, 0.0017213951796293259, 0.0017790263518691063, 0.0018366575241088867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 5.0, 15.0, 12.0, 19.0, 19.0, 20.0, 41.0, 50.0, 81.0, 95.0, 148.0, 188.0, 222.0, 262.0, 406.0, 609.0, 756.0, 1159.0, 1853.0, 3643.0, 9085.0, 31994.0, 156486.0, 578455.0, 201604.0, 40311.0, 10594.0, 4043.0, 1997.0, 1270.0, 838.0, 623.0, 433.0, 282.0, 213.0, 177.0, 128.0, 104.0, 86.0, 54.0, 40.0, 35.0, 23.0, 21.0, 8.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.359375, -14.8729248046875, -14.386474609375, -13.9000244140625, -13.41357421875, -12.9271240234375, -12.440673828125, -11.9542236328125, -11.4677734375, -10.9813232421875, -10.494873046875, -10.0084228515625, -9.52197265625, -9.0355224609375, -8.549072265625, -8.0626220703125, -7.576171875, -7.0897216796875, -6.603271484375, -6.1168212890625, -5.63037109375, -5.1439208984375, -4.657470703125, -4.1710205078125, -3.6845703125, -3.1981201171875, -2.711669921875, -2.2252197265625, -1.73876953125, -1.2523193359375, -0.765869140625, -0.2794189453125, 0.20703125, 0.6934814453125, 1.179931640625, 1.6663818359375, 2.15283203125, 2.6392822265625, 3.125732421875, 3.6121826171875, 4.0986328125, 4.5850830078125, 5.071533203125, 5.5579833984375, 6.04443359375, 6.5308837890625, 7.017333984375, 7.5037841796875, 7.990234375, 8.4766845703125, 8.963134765625, 9.4495849609375, 9.93603515625, 10.4224853515625, 10.908935546875, 11.3953857421875, 11.8818359375, 12.3682861328125, 12.854736328125, 13.3411865234375, 13.82763671875, 14.3140869140625, 14.800537109375, 15.2869873046875, 15.7734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 15.0, 5.0, 16.0, 17.0, 25.0, 23.0, 37.0, 34.0, 46.0, 34.0, 66.0, 83.0, 163.0, 1496.0, 371.0, 123.0, 64.0, 53.0, 46.0, 40.0, 28.0, 29.0, 31.0, 33.0, 26.0, 20.0, 21.0, 12.0, 11.0, 12.0, 5.0, 7.0, 10.0, 11.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.28076171875, -20.5927734375, -19.90478515625, -19.216796875, -18.52880859375, -17.8408203125, -17.15283203125, -16.46484375, -15.77685546875, -15.0888671875, -14.40087890625, -13.712890625, -13.02490234375, -12.3369140625, -11.64892578125, -10.9609375, -10.27294921875, -9.5849609375, -8.89697265625, -8.208984375, -7.52099609375, -6.8330078125, -6.14501953125, -5.45703125, -4.76904296875, -4.0810546875, -3.39306640625, -2.705078125, -2.01708984375, -1.3291015625, -0.64111328125, 0.046875, 0.73486328125, 1.4228515625, 2.11083984375, 2.798828125, 3.48681640625, 4.1748046875, 4.86279296875, 5.55078125, 6.23876953125, 6.9267578125, 7.61474609375, 8.302734375, 8.99072265625, 9.6787109375, 10.36669921875, 11.0546875, 11.74267578125, 12.4306640625, 13.11865234375, 13.806640625, 14.49462890625, 15.1826171875, 15.87060546875, 16.55859375, 17.24658203125, 17.9345703125, 18.62255859375, 19.310546875, 19.99853515625, 20.6865234375, 21.37451171875, 22.0625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 6.0, 0.0, 6.0, 7.0, 10.0, 7.0, 12.0, 15.0, 12.0, 29.0, 20.0, 34.0, 33.0, 54.0, 83.0, 131.0, 203.0, 407.0, 788.0, 3044.0, 3091129.0, 47132.0, 1279.0, 506.0, 275.0, 138.0, 102.0, 61.0, 37.0, 38.0, 19.0, 23.0, 11.0, 9.0, 9.0, 5.0, 2.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-102.3125, -99.6015625, -96.890625, -94.1796875, -91.46875, -88.7578125, -86.046875, -83.3359375, -80.625, -77.9140625, -75.203125, -72.4921875, -69.78125, -67.0703125, -64.359375, -61.6484375, -58.9375, -56.2265625, -53.515625, -50.8046875, -48.09375, -45.3828125, -42.671875, -39.9609375, -37.25, -34.5390625, -31.828125, -29.1171875, -26.40625, -23.6953125, -20.984375, -18.2734375, -15.5625, -12.8515625, -10.140625, -7.4296875, -4.71875, -2.0078125, 0.703125, 3.4140625, 6.125, 8.8359375, 11.546875, 14.2578125, 16.96875, 19.6796875, 22.390625, 25.1015625, 27.8125, 30.5234375, 33.234375, 35.9453125, 38.65625, 41.3671875, 44.078125, 46.7890625, 49.5, 52.2109375, 54.921875, 57.6328125, 60.34375, 63.0546875, 65.765625, 68.4765625, 71.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 597.0, 395.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.3544921875, -212.21298217773438, -202.07147216796875, -191.92994689941406, -181.78843688964844, -171.6469268798828, -161.50540161132812, -151.3638916015625, -141.22238159179688, -131.08087158203125, -120.9393539428711, -110.79783630371094, -100.65632629394531, -90.51481628417969, -80.37329864501953, -70.23178100585938, -60.09027099609375, -49.94875717163086, -39.80724334716797, -29.665729522705078, -19.524215698242188, -9.382701873779297, 0.7588119506835938, 10.90032958984375, 21.041839599609375, 31.183353424072266, 41.324867248535156, 51.46638107299805, 61.60789489746094, 71.74940490722656, 81.89092254638672, 92.03244018554688, 102.1739501953125, 112.31546020507812, 122.45697784423828, 132.59849548339844, 142.74000549316406, 152.8815155029297, 163.02304077148438, 173.16455078125, 183.30606079101562, 193.44757080078125, 203.58908081054688, 213.73060607910156, 223.8721160888672, 234.0136260986328, 244.1551513671875, 254.29666137695312, 264.43817138671875, 274.5796813964844, 284.72119140625, 294.8627014160156, 305.00421142578125, 315.145751953125, 325.2872619628906, 335.42877197265625, 345.5702819824219, 355.7117919921875, 365.8533020019531, 375.99481201171875, 386.1363525390625, 396.2778625488281, 406.41937255859375, 416.5608825683594, 426.702392578125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 12.0, 5.0, 9.0, 8.0, 16.0, 16.0, 21.0, 15.0, 22.0, 26.0, 29.0, 32.0, 28.0, 28.0, 40.0, 32.0, 44.0, 41.0, 39.0, 35.0, 47.0, 47.0, 38.0, 50.0, 40.0, 29.0, 33.0, 32.0, 18.0, 27.0, 21.0, 26.0, 6.0, 6.0, 11.0, 21.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.22264862060547, -57.51224899291992, -55.80184555053711, -54.09144592285156, -52.381046295166016, -50.67064666748047, -48.960243225097656, -47.24984359741211, -45.53944396972656, -43.829044342041016, -42.1186408996582, -40.408241271972656, -38.69784164428711, -36.98744201660156, -35.27703857421875, -33.5666389465332, -31.856237411499023, -30.145835876464844, -28.435436248779297, -26.725034713745117, -25.01463508605957, -23.30423355102539, -21.593833923339844, -19.883432388305664, -18.173030853271484, -16.462629318237305, -14.752229690551758, -13.041828155517578, -11.331428527832031, -9.621026992797852, -7.910626411437988, -6.200225830078125, -4.489826202392578, -2.779425621032715, -1.0690248012542725, 0.6413760185241699, 2.351776599884033, 4.062177658081055, 5.772578239440918, 7.482978820800781, 9.193379402160645, 10.903779983520508, 12.614180564880371, 14.324581146240234, 16.034982681274414, 17.745384216308594, 19.45578384399414, 21.166183471679688, 22.876585006713867, 24.586986541748047, 26.297386169433594, 28.007787704467773, 29.71818733215332, 31.4285888671875, 33.13898849487305, 34.849388122558594, 36.559791564941406, 38.27019119262695, 39.980594635009766, 41.69099426269531, 43.40139389038086, 45.111793518066406, 46.82219696044922, 48.532596588134766, 50.24299621582031]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 8.0, 6.0, 5.0, 13.0, 13.0, 19.0, 21.0, 32.0, 28.0, 30.0, 30.0, 38.0, 35.0, 46.0, 37.0, 38.0, 50.0, 43.0, 47.0, 40.0, 43.0, 40.0, 42.0, 38.0, 28.0, 34.0, 27.0, 22.0, 22.0, 33.0, 14.0, 10.0, 14.0, 9.0, 4.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6092529296875, -8.312255859375, -8.0152587890625, -7.71826171875, -7.4212646484375, -7.124267578125, -6.8272705078125, -6.5302734375, -6.2332763671875, -5.936279296875, -5.6392822265625, -5.34228515625, -5.0452880859375, -4.748291015625, -4.4512939453125, -4.154296875, -3.8572998046875, -3.560302734375, -3.2633056640625, -2.96630859375, -2.6693115234375, -2.372314453125, -2.0753173828125, -1.7783203125, -1.4813232421875, -1.184326171875, -0.8873291015625, -0.59033203125, -0.2933349609375, 0.003662109375, 0.3006591796875, 0.59765625, 0.8946533203125, 1.191650390625, 1.4886474609375, 1.78564453125, 2.0826416015625, 2.379638671875, 2.6766357421875, 2.9736328125, 3.2706298828125, 3.567626953125, 3.8646240234375, 4.16162109375, 4.4586181640625, 4.755615234375, 5.0526123046875, 5.349609375, 5.6466064453125, 5.943603515625, 6.2406005859375, 6.53759765625, 6.8345947265625, 7.131591796875, 7.4285888671875, 7.7255859375, 8.0225830078125, 8.319580078125, 8.6165771484375, 8.91357421875, 9.2105712890625, 9.507568359375, 9.8045654296875, 10.1015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 18.0, 21.0, 23.0, 34.0, 35.0, 45.0, 73.0, 86.0, 114.0, 167.0, 271.0, 416.0, 731.0, 1479.0, 3544.0, 9594.0, 43353.0, 379417.0, 2308499.0, 1278850.0, 136095.0, 20314.0, 5980.0, 2284.0, 1134.0, 566.0, 320.0, 221.0, 135.0, 111.0, 76.0, 57.0, 49.0, 33.0, 26.0, 18.0, 19.0, 10.0, 10.0, 8.0, 3.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.96875, -17.420654296875, -16.87255859375, -16.324462890625, -15.7763671875, -15.228271484375, -14.68017578125, -14.132080078125, -13.583984375, -13.035888671875, -12.48779296875, -11.939697265625, -11.3916015625, -10.843505859375, -10.29541015625, -9.747314453125, -9.19921875, -8.651123046875, -8.10302734375, -7.554931640625, -7.0068359375, -6.458740234375, -5.91064453125, -5.362548828125, -4.814453125, -4.266357421875, -3.71826171875, -3.170166015625, -2.6220703125, -2.073974609375, -1.52587890625, -0.977783203125, -0.4296875, 0.118408203125, 0.66650390625, 1.214599609375, 1.7626953125, 2.310791015625, 2.85888671875, 3.406982421875, 3.955078125, 4.503173828125, 5.05126953125, 5.599365234375, 6.1474609375, 6.695556640625, 7.24365234375, 7.791748046875, 8.33984375, 8.887939453125, 9.43603515625, 9.984130859375, 10.5322265625, 11.080322265625, 11.62841796875, 12.176513671875, 12.724609375, 13.272705078125, 13.82080078125, 14.368896484375, 14.9169921875, 15.465087890625, 16.01318359375, 16.561279296875, 17.109375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 23.0, 33.0, 38.0, 66.0, 97.0, 134.0, 191.0, 237.0, 504.0, 648.0, 675.0, 433.0, 292.0, 190.0, 141.0, 105.0, 64.0, 48.0, 35.0, 23.0, 20.0, 22.0, 10.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.03125, -23.4305419921875, -22.829833984375, -22.2291259765625, -21.62841796875, -21.0277099609375, -20.427001953125, -19.8262939453125, -19.2255859375, -18.6248779296875, -18.024169921875, -17.4234619140625, -16.82275390625, -16.2220458984375, -15.621337890625, -15.0206298828125, -14.419921875, -13.8192138671875, -13.218505859375, -12.6177978515625, -12.01708984375, -11.4163818359375, -10.815673828125, -10.2149658203125, -9.6142578125, -9.0135498046875, -8.412841796875, -7.8121337890625, -7.21142578125, -6.6107177734375, -6.010009765625, -5.4093017578125, -4.80859375, -4.2078857421875, -3.607177734375, -3.0064697265625, -2.40576171875, -1.8050537109375, -1.204345703125, -0.6036376953125, -0.0029296875, 0.5977783203125, 1.198486328125, 1.7991943359375, 2.39990234375, 3.0006103515625, 3.601318359375, 4.2020263671875, 4.802734375, 5.4034423828125, 6.004150390625, 6.6048583984375, 7.20556640625, 7.8062744140625, 8.406982421875, 9.0076904296875, 9.6083984375, 10.2091064453125, 10.809814453125, 11.4105224609375, 12.01123046875, 12.6119384765625, 13.212646484375, 13.8133544921875, 14.4140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 8.0, 13.0, 17.0, 40.0, 69.0, 100.0, 177.0, 423.0, 799.0, 2374.0, 15468.0, 619857.0, 3490822.0, 57609.0, 4299.0, 1219.0, 461.0, 225.0, 130.0, 67.0, 45.0, 23.0, 7.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -42.00830078125, -40.7041015625, -39.39990234375, -38.095703125, -36.79150390625, -35.4873046875, -34.18310546875, -32.87890625, -31.57470703125, -30.2705078125, -28.96630859375, -27.662109375, -26.35791015625, -25.0537109375, -23.74951171875, -22.4453125, -21.14111328125, -19.8369140625, -18.53271484375, -17.228515625, -15.92431640625, -14.6201171875, -13.31591796875, -12.01171875, -10.70751953125, -9.4033203125, -8.09912109375, -6.794921875, -5.49072265625, -4.1865234375, -2.88232421875, -1.578125, -0.27392578125, 1.0302734375, 2.33447265625, 3.638671875, 4.94287109375, 6.2470703125, 7.55126953125, 8.85546875, 10.15966796875, 11.4638671875, 12.76806640625, 14.072265625, 15.37646484375, 16.6806640625, 17.98486328125, 19.2890625, 20.59326171875, 21.8974609375, 23.20166015625, 24.505859375, 25.81005859375, 27.1142578125, 28.41845703125, 29.72265625, 31.02685546875, 32.3310546875, 33.63525390625, 34.939453125, 36.24365234375, 37.5478515625, 38.85205078125, 40.15625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 70.0, 849.0, 93.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-848.4249267578125, -831.959228515625, -815.4935302734375, -799.02783203125, -782.5621337890625, -766.096435546875, -749.6307373046875, -733.1650390625, -716.6993408203125, -700.233642578125, -683.7679443359375, -667.30224609375, -650.8365478515625, -634.370849609375, -617.9051513671875, -601.439453125, -584.9736938476562, -568.5079956054688, -552.0422973632812, -535.5765991210938, -519.1109008789062, -502.64520263671875, -486.1794738769531, -469.7137756347656, -453.2480773925781, -436.7823791503906, -420.3166809082031, -403.8509826660156, -387.38525390625, -370.9195556640625, -354.453857421875, -337.9881591796875, -321.5224609375, -305.0567626953125, -288.591064453125, -272.1253662109375, -255.65965270996094, -239.19395446777344, -222.72824096679688, -206.26254272460938, -189.79684448242188, -173.33114624023438, -156.86544799804688, -140.3997344970703, -123.93403625488281, -107.46833801269531, -91.00263214111328, -74.53692626953125, -58.07122802734375, -41.605525970458984, -25.13982391357422, -8.674121856689453, 7.7915802001953125, 24.257278442382812, 40.722984313964844, 57.188690185546875, 73.65438842773438, 90.12008666992188, 106.5857925415039, 123.05149841308594, 139.51719665527344, 155.98289489746094, 172.4486083984375, 188.914306640625, 205.3800048828125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 5.0, 13.0, 16.0, 18.0, 16.0, 18.0, 28.0, 23.0, 28.0, 38.0, 39.0, 37.0, 37.0, 37.0, 40.0, 39.0, 47.0, 52.0, 46.0, 37.0, 32.0, 46.0, 38.0, 39.0, 37.0, 24.0, 25.0, 23.0, 21.0, 16.0, 20.0, 7.0, 7.0, 12.0, 9.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-54.67823028564453, -52.84877395629883, -51.01932144165039, -49.18986511230469, -47.360408782958984, -45.53095626831055, -43.701499938964844, -41.872047424316406, -40.0425910949707, -38.213134765625, -36.38368225097656, -34.55422592163086, -32.724769592285156, -30.89531707763672, -29.065860748291016, -27.236406326293945, -25.406949996948242, -23.577495574951172, -21.74803924560547, -19.9185848236084, -18.089130401611328, -16.259674072265625, -14.430219650268555, -12.600765228271484, -10.771309852600098, -8.941854476928711, -7.112400054931641, -5.282944679260254, -3.4534897804260254, -1.6240348815917969, 0.20542049407958984, 2.03487491607666, 3.864330291748047, 5.693785190582275, 7.523240089416504, 9.35269546508789, 11.182149887084961, 13.011605262756348, 14.841060638427734, 16.670515060424805, 18.499969482421875, 20.329423904418945, 22.15888023376465, 23.98833465576172, 25.81778907775879, 27.64724349975586, 29.476699829101562, 31.306154251098633, 33.13561248779297, 34.96506881713867, 36.79452133178711, 38.62397766113281, 40.453433990478516, 42.28288650512695, 44.112342834472656, 45.941795349121094, 47.7712516784668, 49.6007080078125, 51.43016052246094, 53.25961685180664, 55.089073181152344, 56.91852569580078, 58.747982025146484, 60.57743835449219, 62.406890869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 15.0, 24.0, 15.0, 21.0, 32.0, 26.0, 40.0, 36.0, 43.0, 28.0, 43.0, 41.0, 33.0, 41.0, 31.0, 45.0, 53.0, 46.0, 33.0, 43.0, 41.0, 24.0, 37.0, 40.0, 22.0, 17.0, 14.0, 12.0, 13.0, 11.0, 11.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.3929443359375, -6.160888671875, -5.9288330078125, -5.69677734375, -5.4647216796875, -5.232666015625, -5.0006103515625, -4.7685546875, -4.5364990234375, -4.304443359375, -4.0723876953125, -3.84033203125, -3.6082763671875, -3.376220703125, -3.1441650390625, -2.912109375, -2.6800537109375, -2.447998046875, -2.2159423828125, -1.98388671875, -1.7518310546875, -1.519775390625, -1.2877197265625, -1.0556640625, -0.8236083984375, -0.591552734375, -0.3594970703125, -0.12744140625, 0.1046142578125, 0.336669921875, 0.5687255859375, 0.80078125, 1.0328369140625, 1.264892578125, 1.4969482421875, 1.72900390625, 1.9610595703125, 2.193115234375, 2.4251708984375, 2.6572265625, 2.8892822265625, 3.121337890625, 3.3533935546875, 3.58544921875, 3.8175048828125, 4.049560546875, 4.2816162109375, 4.513671875, 4.7457275390625, 4.977783203125, 5.2098388671875, 5.44189453125, 5.6739501953125, 5.906005859375, 6.1380615234375, 6.3701171875, 6.6021728515625, 6.834228515625, 7.0662841796875, 7.29833984375, 7.5303955078125, 7.762451171875, 7.9945068359375, 8.2265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 19.0, 29.0, 36.0, 53.0, 76.0, 143.0, 215.0, 320.0, 550.0, 879.0, 1376.0, 2149.0, 3522.0, 5771.0, 9553.0, 15674.0, 26178.0, 44056.0, 74336.0, 122980.0, 186681.0, 199791.0, 140671.0, 86098.0, 50774.0, 30443.0, 17992.0, 10947.0, 6560.0, 4122.0, 2444.0, 1525.0, 984.0, 573.0, 333.0, 249.0, 143.0, 108.0, 63.0, 43.0, 28.0, 19.0, 13.0, 11.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7138900756835938, -0.6909637451171875, -0.6680374145507812, -0.645111083984375, -0.6221847534179688, -0.5992584228515625, -0.5763320922851562, -0.55340576171875, -0.5304794311523438, -0.5075531005859375, -0.48462677001953125, -0.461700439453125, -0.43877410888671875, -0.4158477783203125, -0.39292144775390625, -0.3699951171875, -0.34706878662109375, -0.3241424560546875, -0.30121612548828125, -0.278289794921875, -0.25536346435546875, -0.2324371337890625, -0.20951080322265625, -0.18658447265625, -0.16365814208984375, -0.1407318115234375, -0.11780548095703125, -0.094879150390625, -0.07195281982421875, -0.0490264892578125, -0.02610015869140625, -0.003173828125, 0.01975250244140625, 0.0426788330078125, 0.06560516357421875, 0.088531494140625, 0.11145782470703125, 0.1343841552734375, 0.15731048583984375, 0.18023681640625, 0.20316314697265625, 0.2260894775390625, 0.24901580810546875, 0.271942138671875, 0.29486846923828125, 0.3177947998046875, 0.34072113037109375, 0.3636474609375, 0.38657379150390625, 0.4095001220703125, 0.43242645263671875, 0.455352783203125, 0.47827911376953125, 0.5012054443359375, 0.5241317749023438, 0.54705810546875, 0.5699844360351562, 0.5929107666015625, 0.6158370971679688, 0.638763427734375, 0.6616897583007812, 0.6846160888671875, 0.7075424194335938, 0.73046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 0.0, 6.0, 7.0, 9.0, 13.0, 13.0, 13.0, 19.0, 29.0, 23.0, 30.0, 27.0, 27.0, 31.0, 38.0, 23.0, 36.0, 47.0, 43.0, 44.0, 1066.0, 40.0, 36.0, 44.0, 30.0, 45.0, 27.0, 37.0, 26.0, 30.0, 16.0, 23.0, 24.0, 19.0, 15.0, 10.0, 17.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9837646484375, -3.842529296875, -3.7012939453125, -3.56005859375, -3.4188232421875, -3.277587890625, -3.1363525390625, -2.9951171875, -2.8538818359375, -2.712646484375, -2.5714111328125, -2.43017578125, -2.2889404296875, -2.147705078125, -2.0064697265625, -1.865234375, -1.7239990234375, -1.582763671875, -1.4415283203125, -1.30029296875, -1.1590576171875, -1.017822265625, -0.8765869140625, -0.7353515625, -0.5941162109375, -0.452880859375, -0.3116455078125, -0.17041015625, -0.0291748046875, 0.112060546875, 0.2532958984375, 0.39453125, 0.5357666015625, 0.677001953125, 0.8182373046875, 0.95947265625, 1.1007080078125, 1.241943359375, 1.3831787109375, 1.5244140625, 1.6656494140625, 1.806884765625, 1.9481201171875, 2.08935546875, 2.2305908203125, 2.371826171875, 2.5130615234375, 2.654296875, 2.7955322265625, 2.936767578125, 3.0780029296875, 3.21923828125, 3.3604736328125, 3.501708984375, 3.6429443359375, 3.7841796875, 3.9254150390625, 4.066650390625, 4.2078857421875, 4.34912109375, 4.4903564453125, 4.631591796875, 4.7728271484375, 4.9140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 20.0, 15.0, 27.0, 38.0, 97.0, 124.0, 206.0, 362.0, 588.0, 976.0, 1532.0, 2561.0, 4113.0, 6887.0, 11023.0, 17610.0, 28208.0, 44353.0, 70664.0, 105537.0, 146669.0, 1215288.0, 146113.0, 105757.0, 69751.0, 45004.0, 27754.0, 17322.0, 11172.0, 6693.0, 4189.0, 2581.0, 1546.0, 913.0, 575.0, 351.0, 192.0, 118.0, 68.0, 41.0, 28.0, 27.0, 17.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.59619140625, -0.5793952941894531, -0.5625991821289062, -0.5458030700683594, -0.5290069580078125, -0.5122108459472656, -0.49541473388671875, -0.4786186218261719, -0.461822509765625, -0.4450263977050781, -0.42823028564453125, -0.4114341735839844, -0.3946380615234375, -0.3778419494628906, -0.36104583740234375, -0.3442497253417969, -0.32745361328125, -0.3106575012207031, -0.29386138916015625, -0.2770652770996094, -0.2602691650390625, -0.24347305297851562, -0.22667694091796875, -0.20988082885742188, -0.193084716796875, -0.17628860473632812, -0.15949249267578125, -0.14269638061523438, -0.1259002685546875, -0.10910415649414062, -0.09230804443359375, -0.07551193237304688, -0.0587158203125, -0.041919708251953125, -0.02512359619140625, -0.008327484130859375, 0.0084686279296875, 0.025264739990234375, 0.04206085205078125, 0.058856964111328125, 0.075653076171875, 0.09244918823242188, 0.10924530029296875, 0.12604141235351562, 0.1428375244140625, 0.15963363647460938, 0.17642974853515625, 0.19322586059570312, 0.21002197265625, 0.22681808471679688, 0.24361419677734375, 0.2604103088378906, 0.2772064208984375, 0.2940025329589844, 0.31079864501953125, 0.3275947570800781, 0.344390869140625, 0.3611869812011719, 0.37798309326171875, 0.3947792053222656, 0.4115753173828125, 0.4283714294433594, 0.44516754150390625, 0.4619636535644531, 0.478759765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 8.0, 8.0, 9.0, 17.0, 16.0, 20.0, 26.0, 24.0, 22.0, 36.0, 36.0, 39.0, 58.0, 44.0, 46.0, 50.0, 39.0, 36.0, 50.0, 43.0, 46.0, 47.0, 33.0, 39.0, 34.0, 30.0, 22.0, 20.0, 15.0, 14.0, 17.0, 14.0, 10.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002166748046875, -0.0020940005779266357, -0.0020212531089782715, -0.0019485056400299072, -0.001875758171081543, -0.0018030107021331787, -0.0017302632331848145, -0.0016575157642364502, -0.001584768295288086, -0.0015120208263397217, -0.0014392733573913574, -0.0013665258884429932, -0.001293778419494629, -0.0012210309505462646, -0.0011482834815979004, -0.0010755360126495361, -0.0010027885437011719, -0.0009300410747528076, -0.0008572936058044434, -0.0007845461368560791, -0.0007117986679077148, -0.0006390511989593506, -0.0005663037300109863, -0.0004935562610626221, -0.0004208087921142578, -0.00034806132316589355, -0.0002753138542175293, -0.00020256638526916504, -0.00012981891632080078, -5.7071447372436523e-05, 1.5676021575927734e-05, 8.842349052429199e-05, 0.00016117095947265625, 0.0002339184284210205, 0.00030666589736938477, 0.000379413366317749, 0.0004521608352661133, 0.0005249083042144775, 0.0005976557731628418, 0.0006704032421112061, 0.0007431507110595703, 0.0008158981800079346, 0.0008886456489562988, 0.0009613931179046631, 0.0010341405868530273, 0.0011068880558013916, 0.0011796355247497559, 0.0012523829936981201, 0.0013251304626464844, 0.0013978779315948486, 0.0014706254005432129, 0.0015433728694915771, 0.0016161203384399414, 0.0016888678073883057, 0.00176161527633667, 0.0018343627452850342, 0.0019071102142333984, 0.0019798576831817627, 0.002052605152130127, 0.002125352621078491, 0.0021981000900268555, 0.0022708475589752197, 0.002343595027923584, 0.0024163424968719482, 0.0024890899658203125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 20.0, 19.0, 26.0, 26.0, 44.0, 40.0, 67.0, 73.0, 117.0, 158.0, 236.0, 308.0, 559.0, 1183.0, 60846.0, 975846.0, 6702.0, 783.0, 492.0, 289.0, 176.0, 137.0, 89.0, 74.0, 53.0, 50.0, 28.0, 28.0, 12.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.06341552734375, -0.06175994873046875, -0.0601043701171875, -0.05844879150390625, -0.056793212890625, -0.05513763427734375, -0.0534820556640625, -0.05182647705078125, -0.0501708984375, -0.04851531982421875, -0.0468597412109375, -0.04520416259765625, -0.043548583984375, -0.04189300537109375, -0.0402374267578125, -0.03858184814453125, -0.03692626953125, -0.03527069091796875, -0.0336151123046875, -0.03195953369140625, -0.030303955078125, -0.02864837646484375, -0.0269927978515625, -0.02533721923828125, -0.023681640625, -0.02202606201171875, -0.0203704833984375, -0.01871490478515625, -0.017059326171875, -0.01540374755859375, -0.0137481689453125, -0.01209259033203125, -0.01043701171875, -0.00878143310546875, -0.0071258544921875, -0.00547027587890625, -0.003814697265625, -0.00215911865234375, -0.0005035400390625, 0.00115203857421875, 0.0028076171875, 0.00446319580078125, 0.0061187744140625, 0.00777435302734375, 0.009429931640625, 0.01108551025390625, 0.0127410888671875, 0.01439666748046875, 0.01605224609375, 0.01770782470703125, 0.0193634033203125, 0.02101898193359375, 0.022674560546875, 0.02433013916015625, 0.0259857177734375, 0.02764129638671875, 0.029296875, 0.03095245361328125, 0.0326080322265625, 0.03426361083984375, 0.035919189453125, 0.03757476806640625, 0.0392303466796875, 0.04088592529296875, 0.04254150390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 524.0, 468.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03573993593454361, -0.035077761858701706, -0.0344155915081501, -0.0337534174323082, -0.03309124708175659, -0.03242907300591469, -0.03176690265536308, -0.03110472857952118, -0.030442556366324425, -0.02978038415312767, -0.029118211939930916, -0.02845603972673416, -0.027793865650892258, -0.027131693437695503, -0.02646952122449875, -0.025807349011301994, -0.02514517679810524, -0.024483004584908485, -0.02382083237171173, -0.023158660158514977, -0.022496487945318222, -0.02183431386947632, -0.021172141656279564, -0.02050996944308281, -0.019847797229886055, -0.0191856250166893, -0.018523452803492546, -0.01786128059029579, -0.017199106514453888, -0.016536934301257133, -0.01587476208806038, -0.015212589874863625, -0.01455041766166687, -0.013888245448470116, -0.013226073235273361, -0.012563900090754032, -0.011901727877557278, -0.011239555664360523, -0.010577382519841194, -0.00991521030664444, -0.009253038093447685, -0.00859086588025093, -0.007928693667054176, -0.007266520522534847, -0.006604348309338093, -0.005942176096141338, -0.005280003417283297, -0.004617830738425255, -0.0039556585252285, -0.0032934860792011023, -0.002631313633173704, -0.001969141187146306, -0.001306968741118908, -0.0006447962950915098, 1.737615093588829e-05, 0.00067954882979393, 0.0013417210429906845, 0.0020038934890180826, 0.0026660659350454807, 0.003328238381072879, 0.003990410827100277, 0.004652583040297031, 0.005314755719155073, 0.005976928398013115, 0.006639100611209869]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 6.0, 16.0, 11.0, 16.0, 20.0, 24.0, 32.0, 26.0, 34.0, 37.0, 40.0, 43.0, 44.0, 39.0, 45.0, 44.0, 57.0, 27.0, 49.0, 51.0, 40.0, 32.0, 36.0, 26.0, 39.0, 29.0, 24.0, 17.0, 15.0, 11.0, 12.0, 15.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015895962715148926, -0.001541762612760067, -0.0014939289540052414, -0.0014460952952504158, -0.0013982616364955902, -0.0013504279777407646, -0.001302594318985939, -0.0012547606602311134, -0.0012069270014762878, -0.0011590933427214622, -0.0011112596839666367, -0.001063426025211811, -0.0010155923664569855, -0.0009677587077021599, -0.0009199250489473343, -0.0008720913901925087, -0.0008242577314376831, -0.0007764240726828575, -0.0007285904139280319, -0.0006807567551732063, -0.0006329230964183807, -0.0005850894376635551, -0.0005372557789087296, -0.000489422120153904, -0.00044158846139907837, -0.0003937548026442528, -0.0003459211438894272, -0.0002980874851346016, -0.000250253826379776, -0.0002024201676249504, -0.00015458650887012482, -0.00010675285011529922, -5.891919136047363e-05, -1.108553260564804e-05, 3.674812614917755e-05, 8.458178490400314e-05, 0.00013241544365882874, 0.00018024910241365433, 0.00022808276116847992, 0.0002759164199233055, 0.0003237500786781311, 0.0003715837374329567, 0.0004194173961877823, 0.0004672510549426079, 0.0005150847136974335, 0.0005629183724522591, 0.0006107520312070847, 0.0006585856899619102, 0.0007064193487167358, 0.0007542530074715614, 0.000802086666226387, 0.0008499203249812126, 0.0008977539837360382, 0.0009455876424908638, 0.0009934213012456894, 0.001041254960000515, 0.0010890886187553406, 0.0011369222775101662, 0.0011847559362649918, 0.0012325895950198174, 0.001280423253774643, 0.0013282569125294685, 0.0013760905712842941, 0.0014239242300391197, 0.0014717578887939453]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 10.0, 15.0, 25.0, 15.0, 20.0, 32.0, 26.0, 40.0, 38.0, 41.0, 30.0, 42.0, 41.0, 33.0, 41.0, 30.0, 45.0, 53.0, 46.0, 35.0, 42.0, 41.0, 23.0, 38.0, 39.0, 22.0, 17.0, 14.0, 12.0, 13.0, 12.0, 10.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.38909912109375, -6.1571044921875, -5.92510986328125, -5.693115234375, -5.46112060546875, -5.2291259765625, -4.99713134765625, -4.76513671875, -4.53314208984375, -4.3011474609375, -4.06915283203125, -3.837158203125, -3.60516357421875, -3.3731689453125, -3.14117431640625, -2.9091796875, -2.67718505859375, -2.4451904296875, -2.21319580078125, -1.981201171875, -1.74920654296875, -1.5172119140625, -1.28521728515625, -1.05322265625, -0.82122802734375, -0.5892333984375, -0.35723876953125, -0.125244140625, 0.10675048828125, 0.3387451171875, 0.57073974609375, 0.802734375, 1.03472900390625, 1.2667236328125, 1.49871826171875, 1.730712890625, 1.96270751953125, 2.1947021484375, 2.42669677734375, 2.65869140625, 2.89068603515625, 3.1226806640625, 3.35467529296875, 3.586669921875, 3.81866455078125, 4.0506591796875, 4.28265380859375, 4.5146484375, 4.74664306640625, 4.9786376953125, 5.21063232421875, 5.442626953125, 5.67462158203125, 5.9066162109375, 6.13861083984375, 6.37060546875, 6.60260009765625, 6.8345947265625, 7.06658935546875, 7.298583984375, 7.53057861328125, 7.7625732421875, 7.99456787109375, 8.2265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 13.0, 9.0, 21.0, 21.0, 39.0, 40.0, 46.0, 70.0, 117.0, 148.0, 238.0, 379.0, 467.0, 710.0, 1119.0, 1819.0, 3093.0, 6273.0, 18845.0, 153711.0, 733705.0, 99624.0, 15065.0, 5263.0, 2838.0, 1631.0, 1017.0, 646.0, 532.0, 312.0, 218.0, 154.0, 98.0, 59.0, 69.0, 39.0, 33.0, 26.0, 10.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.390625, -20.78662109375, -20.1826171875, -19.57861328125, -18.974609375, -18.37060546875, -17.7666015625, -17.16259765625, -16.55859375, -15.95458984375, -15.3505859375, -14.74658203125, -14.142578125, -13.53857421875, -12.9345703125, -12.33056640625, -11.7265625, -11.12255859375, -10.5185546875, -9.91455078125, -9.310546875, -8.70654296875, -8.1025390625, -7.49853515625, -6.89453125, -6.29052734375, -5.6865234375, -5.08251953125, -4.478515625, -3.87451171875, -3.2705078125, -2.66650390625, -2.0625, -1.45849609375, -0.8544921875, -0.25048828125, 0.353515625, 0.95751953125, 1.5615234375, 2.16552734375, 2.76953125, 3.37353515625, 3.9775390625, 4.58154296875, 5.185546875, 5.78955078125, 6.3935546875, 6.99755859375, 7.6015625, 8.20556640625, 8.8095703125, 9.41357421875, 10.017578125, 10.62158203125, 11.2255859375, 11.82958984375, 12.43359375, 13.03759765625, 13.6416015625, 14.24560546875, 14.849609375, 15.45361328125, 16.0576171875, 16.66162109375, 17.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 4.0, 5.0, 15.0, 9.0, 15.0, 12.0, 21.0, 21.0, 18.0, 22.0, 35.0, 30.0, 37.0, 46.0, 65.0, 77.0, 123.0, 358.0, 1522.0, 186.0, 67.0, 45.0, 49.0, 32.0, 35.0, 30.0, 25.0, 22.0, 15.0, 13.0, 13.0, 13.0, 7.0, 10.0, 9.0, 2.0, 7.0, 6.0, 2.0, 2.0, 9.0, 2.0, 2.0, 2.0], "bins": [-21.671875, -21.1038818359375, -20.535888671875, -19.9678955078125, -19.39990234375, -18.8319091796875, -18.263916015625, -17.6959228515625, -17.1279296875, -16.5599365234375, -15.991943359375, -15.4239501953125, -14.85595703125, -14.2879638671875, -13.719970703125, -13.1519775390625, -12.583984375, -12.0159912109375, -11.447998046875, -10.8800048828125, -10.31201171875, -9.7440185546875, -9.176025390625, -8.6080322265625, -8.0400390625, -7.4720458984375, -6.904052734375, -6.3360595703125, -5.76806640625, -5.2000732421875, -4.632080078125, -4.0640869140625, -3.49609375, -2.9281005859375, -2.360107421875, -1.7921142578125, -1.22412109375, -0.6561279296875, -0.088134765625, 0.4798583984375, 1.0478515625, 1.6158447265625, 2.183837890625, 2.7518310546875, 3.31982421875, 3.8878173828125, 4.455810546875, 5.0238037109375, 5.591796875, 6.1597900390625, 6.727783203125, 7.2957763671875, 7.86376953125, 8.4317626953125, 8.999755859375, 9.5677490234375, 10.1357421875, 10.7037353515625, 11.271728515625, 11.8397216796875, 12.40771484375, 12.9757080078125, 13.543701171875, 14.1116943359375, 14.6796875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 29.0, 37.0, 42.0, 59.0, 86.0, 138.0, 227.0, 448.0, 1158.0, 21152.0, 3116365.0, 4051.0, 794.0, 375.0, 221.0, 135.0, 93.0, 77.0, 44.0, 29.0, 14.0, 13.0, 15.0, 12.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.8125, -76.58203125, -74.3515625, -72.12109375, -69.890625, -67.66015625, -65.4296875, -63.19921875, -60.96875, -58.73828125, -56.5078125, -54.27734375, -52.046875, -49.81640625, -47.5859375, -45.35546875, -43.125, -40.89453125, -38.6640625, -36.43359375, -34.203125, -31.97265625, -29.7421875, -27.51171875, -25.28125, -23.05078125, -20.8203125, -18.58984375, -16.359375, -14.12890625, -11.8984375, -9.66796875, -7.4375, -5.20703125, -2.9765625, -0.74609375, 1.484375, 3.71484375, 5.9453125, 8.17578125, 10.40625, 12.63671875, 14.8671875, 17.09765625, 19.328125, 21.55859375, 23.7890625, 26.01953125, 28.25, 30.48046875, 32.7109375, 34.94140625, 37.171875, 39.40234375, 41.6328125, 43.86328125, 46.09375, 48.32421875, 50.5546875, 52.78515625, 55.015625, 57.24609375, 59.4765625, 61.70703125, 63.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 88.0, 374.0, 434.0, 97.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.78763580322266, -111.15155792236328, -106.51548767089844, -101.87940979003906, -97.24333190917969, -92.60725402832031, -87.97117614746094, -83.3351058959961, -78.69902801513672, -74.06295013427734, -69.4268798828125, -64.79080200195312, -60.15472412109375, -55.518646240234375, -50.882572174072266, -46.246498107910156, -41.61042022705078, -36.974342346191406, -32.3382682800293, -27.702192306518555, -23.066116333007812, -18.43004035949707, -13.793964385986328, -9.157890319824219, -4.521812438964844, 0.11426353454589844, 4.750339508056641, 9.386415481567383, 14.022491455078125, 18.658567428588867, 23.29464340209961, 27.93071746826172, 32.56678771972656, 37.20286560058594, 41.83893966674805, 46.475013732910156, 51.11109161376953, 55.747169494628906, 60.383243560791016, 65.01931762695312, 69.6553955078125, 74.29147338867188, 78.92755126953125, 83.5636215209961, 88.19969940185547, 92.83577728271484, 97.47184753417969, 102.10792541503906, 106.74400329589844, 111.38008117675781, 116.01615905761719, 120.65222930908203, 125.2883071899414, 129.92437744140625, 134.56045532226562, 139.196533203125, 143.83261108398438, 148.46868896484375, 153.10476684570312, 157.7408447265625, 162.37692260742188, 167.0129852294922, 171.64906311035156, 176.28514099121094, 180.9212188720703]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 20.0, 22.0, 24.0, 26.0, 23.0, 41.0, 29.0, 26.0, 34.0, 24.0, 28.0, 43.0, 40.0, 43.0, 41.0, 32.0, 32.0, 40.0, 36.0, 37.0, 21.0, 29.0, 27.0, 16.0, 28.0, 20.0, 24.0, 20.0, 17.0, 7.0, 13.0, 4.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0], "bins": [-44.91546630859375, -43.57817840576172, -42.24089050292969, -40.903602600097656, -39.56631088256836, -38.22902297973633, -36.8917350769043, -35.554447174072266, -34.217159271240234, -32.8798713684082, -31.54258155822754, -30.205293655395508, -28.868005752563477, -27.530715942382812, -26.19342803955078, -24.85614013671875, -23.518850326538086, -22.181562423706055, -20.84427261352539, -19.50698471069336, -18.169696807861328, -16.832408905029297, -15.495119094848633, -14.157831192016602, -12.820542335510254, -11.483253479003906, -10.145965576171875, -8.808676719665527, -7.471388339996338, -6.134099960327148, -4.796811103820801, -3.4595232009887695, -2.122234344482422, -0.7849458456039429, 0.5523426532745361, 1.8896312713623047, 3.226919651031494, 4.564208030700684, 5.901496887207031, 7.2387847900390625, 8.57607364654541, 9.913362503051758, 11.250650405883789, 12.587939262390137, 13.925228118896484, 15.262516021728516, 16.599803924560547, 17.937091827392578, 19.274381637573242, 20.611669540405273, 21.948959350585938, 23.28624725341797, 24.62353515625, 25.96082305908203, 27.298112869262695, 28.635400772094727, 29.97269058227539, 31.309978485107422, 32.64726638793945, 33.98455810546875, 35.32184600830078, 36.65913391113281, 37.996421813964844, 39.333709716796875, 40.670997619628906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 8.0, 10.0, 13.0, 9.0, 12.0, 27.0, 17.0, 21.0, 20.0, 32.0, 27.0, 37.0, 30.0, 29.0, 23.0, 45.0, 37.0, 50.0, 52.0, 30.0, 44.0, 43.0, 43.0, 29.0, 30.0, 32.0, 24.0, 32.0, 20.0, 24.0, 26.0, 18.0, 14.0, 14.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.58984375, -6.369140625, -6.1484375, -5.927734375, -5.70703125, -5.486328125, -5.265625, -5.044921875, -4.82421875, -4.603515625, -4.3828125, -4.162109375, -3.94140625, -3.720703125, -3.5, -3.279296875, -3.05859375, -2.837890625, -2.6171875, -2.396484375, -2.17578125, -1.955078125, -1.734375, -1.513671875, -1.29296875, -1.072265625, -0.8515625, -0.630859375, -0.41015625, -0.189453125, 0.03125, 0.251953125, 0.47265625, 0.693359375, 0.9140625, 1.134765625, 1.35546875, 1.576171875, 1.796875, 2.017578125, 2.23828125, 2.458984375, 2.6796875, 2.900390625, 3.12109375, 3.341796875, 3.5625, 3.783203125, 4.00390625, 4.224609375, 4.4453125, 4.666015625, 4.88671875, 5.107421875, 5.328125, 5.548828125, 5.76953125, 5.990234375, 6.2109375, 6.431640625, 6.65234375, 6.873046875, 7.09375, 7.314453125, 7.53515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 18.0, 18.0, 30.0, 26.0, 31.0, 45.0, 71.0, 68.0, 102.0, 126.0, 178.0, 269.0, 333.0, 514.0, 737.0, 1216.0, 2095.0, 4366.0, 11827.0, 69532.0, 790289.0, 2655722.0, 590392.0, 46702.0, 9946.0, 3952.0, 2065.0, 1168.0, 725.0, 462.0, 316.0, 213.0, 172.0, 116.0, 110.0, 79.0, 54.0, 51.0, 25.0, 33.0, 18.0, 15.0, 10.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.2734375, -13.804443359375, -13.33544921875, -12.866455078125, -12.3974609375, -11.928466796875, -11.45947265625, -10.990478515625, -10.521484375, -10.052490234375, -9.58349609375, -9.114501953125, -8.6455078125, -8.176513671875, -7.70751953125, -7.238525390625, -6.76953125, -6.300537109375, -5.83154296875, -5.362548828125, -4.8935546875, -4.424560546875, -3.95556640625, -3.486572265625, -3.017578125, -2.548583984375, -2.07958984375, -1.610595703125, -1.1416015625, -0.672607421875, -0.20361328125, 0.265380859375, 0.734375, 1.203369140625, 1.67236328125, 2.141357421875, 2.6103515625, 3.079345703125, 3.54833984375, 4.017333984375, 4.486328125, 4.955322265625, 5.42431640625, 5.893310546875, 6.3623046875, 6.831298828125, 7.30029296875, 7.769287109375, 8.23828125, 8.707275390625, 9.17626953125, 9.645263671875, 10.1142578125, 10.583251953125, 11.05224609375, 11.521240234375, 11.990234375, 12.459228515625, 12.92822265625, 13.397216796875, 13.8662109375, 14.335205078125, 14.80419921875, 15.273193359375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 13.0, 19.0, 29.0, 48.0, 79.0, 122.0, 205.0, 314.0, 537.0, 774.0, 718.0, 454.0, 310.0, 184.0, 113.0, 59.0, 32.0, 18.0, 16.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.7659912109375, -13.164794921875, -12.5635986328125, -11.96240234375, -11.3612060546875, -10.760009765625, -10.1588134765625, -9.5576171875, -8.9564208984375, -8.355224609375, -7.7540283203125, -7.15283203125, -6.5516357421875, -5.950439453125, -5.3492431640625, -4.748046875, -4.1468505859375, -3.545654296875, -2.9444580078125, -2.34326171875, -1.7420654296875, -1.140869140625, -0.5396728515625, 0.0615234375, 0.6627197265625, 1.263916015625, 1.8651123046875, 2.46630859375, 3.0675048828125, 3.668701171875, 4.2698974609375, 4.87109375, 5.4722900390625, 6.073486328125, 6.6746826171875, 7.27587890625, 7.8770751953125, 8.478271484375, 9.0794677734375, 9.6806640625, 10.2818603515625, 10.883056640625, 11.4842529296875, 12.08544921875, 12.6866455078125, 13.287841796875, 13.8890380859375, 14.490234375, 15.0914306640625, 15.692626953125, 16.2938232421875, 16.89501953125, 17.4962158203125, 18.097412109375, 18.6986083984375, 19.2998046875, 19.9010009765625, 20.502197265625, 21.1033935546875, 21.70458984375, 22.3057861328125, 22.906982421875, 23.5081787109375, 24.109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 15.0, 20.0, 31.0, 37.0, 85.0, 144.0, 321.0, 704.0, 2021.0, 18326.0, 3935917.0, 230169.0, 4321.0, 1166.0, 472.0, 229.0, 123.0, 77.0, 26.0, 24.0, 18.0, 2.0, 7.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-56.5625, -55.173828125, -53.78515625, -52.396484375, -51.0078125, -49.619140625, -48.23046875, -46.841796875, -45.453125, -44.064453125, -42.67578125, -41.287109375, -39.8984375, -38.509765625, -37.12109375, -35.732421875, -34.34375, -32.955078125, -31.56640625, -30.177734375, -28.7890625, -27.400390625, -26.01171875, -24.623046875, -23.234375, -21.845703125, -20.45703125, -19.068359375, -17.6796875, -16.291015625, -14.90234375, -13.513671875, -12.125, -10.736328125, -9.34765625, -7.958984375, -6.5703125, -5.181640625, -3.79296875, -2.404296875, -1.015625, 0.373046875, 1.76171875, 3.150390625, 4.5390625, 5.927734375, 7.31640625, 8.705078125, 10.09375, 11.482421875, 12.87109375, 14.259765625, 15.6484375, 17.037109375, 18.42578125, 19.814453125, 21.203125, 22.591796875, 23.98046875, 25.369140625, 26.7578125, 28.146484375, 29.53515625, 30.923828125, 32.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 25.0, 137.0, 277.0, 355.0, 164.0, 39.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.05208587646484, -66.65472412109375, -62.257362365722656, -57.86000061035156, -53.46263885498047, -49.065277099609375, -44.66791915893555, -40.27055740356445, -35.87319564819336, -31.475833892822266, -27.078472137451172, -22.68111228942871, -18.283750534057617, -13.886388778686523, -9.489028930664062, -5.091667175292969, -0.694305419921875, 3.7030558586120605, 8.100417137145996, 12.497777938842773, 16.895139694213867, 21.29250144958496, 25.689861297607422, 30.087223052978516, 34.48458480834961, 38.8819465637207, 43.2793083190918, 47.676666259765625, 52.07402801513672, 56.47138977050781, 60.868751525878906, 65.26611328125, 69.66348266601562, 74.06084442138672, 78.45820617675781, 82.8555679321289, 87.2529296875, 91.6502914428711, 96.04765319824219, 100.44500732421875, 104.84237670898438, 109.23973846435547, 113.63710021972656, 118.03446197509766, 122.43182373046875, 126.82918548583984, 131.22654724121094, 135.6239013671875, 140.02127075195312, 144.4186248779297, 148.8159942626953, 153.21334838867188, 157.6107177734375, 162.00807189941406, 166.4054412841797, 170.80279541015625, 175.2001495361328, 179.59750366210938, 183.994873046875, 188.39222717285156, 192.7895965576172, 197.18695068359375, 201.58432006835938, 205.98167419433594, 210.37904357910156]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 5.0, 14.0, 15.0, 11.0, 12.0, 20.0, 22.0, 29.0, 25.0, 22.0, 29.0, 33.0, 36.0, 24.0, 30.0, 44.0, 40.0, 42.0, 46.0, 47.0, 32.0, 42.0, 38.0, 29.0, 35.0, 32.0, 24.0, 28.0, 18.0, 18.0, 27.0, 13.0, 21.0, 13.0, 11.0, 12.0, 14.0, 4.0, 4.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-42.887542724609375, -41.56871795654297, -40.24989318847656, -38.93106460571289, -37.612239837646484, -36.29341506958008, -34.97459030151367, -33.655765533447266, -32.336936950683594, -31.018112182617188, -29.69928550720215, -28.380460739135742, -27.061634063720703, -25.742809295654297, -24.42398452758789, -23.105159759521484, -21.786334991455078, -20.467510223388672, -19.148683547973633, -17.829858779907227, -16.511032104492188, -15.192207336425781, -13.873382568359375, -12.554556846618652, -11.23573112487793, -9.916905403137207, -8.598079681396484, -7.279254913330078, -5.9604291915893555, -4.641603469848633, -3.3227782249450684, -2.003952980041504, -0.6851272583007812, 0.6336982250213623, 1.9525237083435059, 3.2713491916656494, 4.590174674987793, 5.909000396728516, 7.22782564163208, 8.546650886535645, 9.865476608276367, 11.18430233001709, 12.503128051757812, 13.821952819824219, 15.140778541564941, 16.459604263305664, 17.77842903137207, 19.09725570678711, 20.416080474853516, 21.734905242919922, 23.05373191833496, 24.372556686401367, 25.691383361816406, 27.010208129882812, 28.32903289794922, 29.647857666015625, 30.966684341430664, 32.2855110168457, 33.60433578491211, 34.923160552978516, 36.24198532104492, 37.560813903808594, 38.879638671875, 40.198463439941406, 41.51728820800781]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 38.0, 37.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 26.0, 18.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 23.0, 39.0, 60.0, 87.0, 128.0, 216.0, 280.0, 388.0, 570.0, 807.0, 1218.0, 1748.0, 2287.0, 3431.0, 5201.0, 7592.0, 11584.0, 17279.0, 26939.0, 42103.0, 63906.0, 96468.0, 136084.0, 163773.0, 146855.0, 108526.0, 72287.0, 47569.0, 30928.0, 19825.0, 13106.0, 8751.0, 5846.0, 3980.0, 2644.0, 1849.0, 1323.0, 829.0, 641.0, 433.0, 307.0, 215.0, 134.0, 104.0, 68.0, 32.0, 28.0, 15.0, 10.0, 9.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.446533203125, -0.4319648742675781, -0.41739654541015625, -0.4028282165527344, -0.3882598876953125, -0.3736915588378906, -0.35912322998046875, -0.3445549011230469, -0.329986572265625, -0.3154182434082031, -0.30084991455078125, -0.2862815856933594, -0.2717132568359375, -0.2571449279785156, -0.24257659912109375, -0.22800827026367188, -0.21343994140625, -0.19887161254882812, -0.18430328369140625, -0.16973495483398438, -0.1551666259765625, -0.14059829711914062, -0.12602996826171875, -0.11146163940429688, -0.096893310546875, -0.08232498168945312, -0.06775665283203125, -0.053188323974609375, -0.0386199951171875, -0.024051666259765625, -0.00948333740234375, 0.005084991455078125, 0.0196533203125, 0.034221649169921875, 0.04878997802734375, 0.06335830688476562, 0.0779266357421875, 0.09249496459960938, 0.10706329345703125, 0.12163162231445312, 0.136199951171875, 0.15076828002929688, 0.16533660888671875, 0.17990493774414062, 0.1944732666015625, 0.20904159545898438, 0.22360992431640625, 0.23817825317382812, 0.25274658203125, 0.2673149108886719, 0.28188323974609375, 0.2964515686035156, 0.3110198974609375, 0.3255882263183594, 0.34015655517578125, 0.3547248840332031, 0.369293212890625, 0.3838615417480469, 0.39842987060546875, 0.4129981994628906, 0.4275665283203125, 0.4421348571777344, 0.45670318603515625, 0.4712715148925781, 0.48583984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 5.0, 7.0, 13.0, 6.0, 6.0, 7.0, 14.0, 18.0, 11.0, 17.0, 28.0, 29.0, 35.0, 32.0, 29.0, 40.0, 36.0, 36.0, 31.0, 44.0, 1069.0, 43.0, 38.0, 38.0, 33.0, 40.0, 39.0, 33.0, 27.0, 33.0, 21.0, 28.0, 25.0, 30.0, 14.0, 12.0, 8.0, 9.0, 7.0, 4.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.33203125, -3.21734619140625, -3.1026611328125, -2.98797607421875, -2.873291015625, -2.75860595703125, -2.6439208984375, -2.52923583984375, -2.41455078125, -2.29986572265625, -2.1851806640625, -2.07049560546875, -1.955810546875, -1.84112548828125, -1.7264404296875, -1.61175537109375, -1.4970703125, -1.38238525390625, -1.2677001953125, -1.15301513671875, -1.038330078125, -0.92364501953125, -0.8089599609375, -0.69427490234375, -0.57958984375, -0.46490478515625, -0.3502197265625, -0.23553466796875, -0.120849609375, -0.00616455078125, 0.1085205078125, 0.22320556640625, 0.337890625, 0.45257568359375, 0.5672607421875, 0.68194580078125, 0.796630859375, 0.91131591796875, 1.0260009765625, 1.14068603515625, 1.25537109375, 1.37005615234375, 1.4847412109375, 1.59942626953125, 1.714111328125, 1.82879638671875, 1.9434814453125, 2.05816650390625, 2.1728515625, 2.28753662109375, 2.4022216796875, 2.51690673828125, 2.631591796875, 2.74627685546875, 2.8609619140625, 2.97564697265625, 3.09033203125, 3.20501708984375, 3.3197021484375, 3.43438720703125, 3.549072265625, 3.66375732421875, 3.7784423828125, 3.89312744140625, 4.0078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 19.0, 28.0, 54.0, 70.0, 140.0, 230.0, 393.0, 609.0, 1145.0, 1863.0, 3087.0, 5359.0, 8868.0, 15267.0, 25898.0, 44093.0, 73825.0, 119166.0, 168667.0, 1232717.0, 149002.0, 99702.0, 60044.0, 35688.0, 21087.0, 12398.0, 7303.0, 4260.0, 2573.0, 1419.0, 858.0, 502.0, 305.0, 182.0, 131.0, 63.0, 40.0, 27.0, 16.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5124435424804688, -0.4970550537109375, -0.48166656494140625, -0.466278076171875, -0.45088958740234375, -0.4355010986328125, -0.42011260986328125, -0.40472412109375, -0.38933563232421875, -0.3739471435546875, -0.35855865478515625, -0.343170166015625, -0.32778167724609375, -0.3123931884765625, -0.29700469970703125, -0.2816162109375, -0.26622772216796875, -0.2508392333984375, -0.23545074462890625, -0.220062255859375, -0.20467376708984375, -0.1892852783203125, -0.17389678955078125, -0.15850830078125, -0.14311981201171875, -0.1277313232421875, -0.11234283447265625, -0.096954345703125, -0.08156585693359375, -0.0661773681640625, -0.05078887939453125, -0.035400390625, -0.02001190185546875, -0.0046234130859375, 0.01076507568359375, 0.026153564453125, 0.04154205322265625, 0.0569305419921875, 0.07231903076171875, 0.08770751953125, 0.10309600830078125, 0.1184844970703125, 0.13387298583984375, 0.149261474609375, 0.16464996337890625, 0.1800384521484375, 0.19542694091796875, 0.2108154296875, 0.22620391845703125, 0.2415924072265625, 0.25698089599609375, 0.272369384765625, 0.28775787353515625, 0.3031463623046875, 0.31853485107421875, 0.33392333984375, 0.34931182861328125, 0.3647003173828125, 0.38008880615234375, 0.395477294921875, 0.41086578369140625, 0.4262542724609375, 0.44164276123046875, 0.45703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 3.0, 17.0, 18.0, 19.0, 17.0, 25.0, 27.0, 29.0, 37.0, 33.0, 55.0, 49.0, 52.0, 55.0, 50.0, 57.0, 57.0, 65.0, 50.0, 34.0, 38.0, 39.0, 28.0, 31.0, 23.0, 25.0, 9.0, 9.0, 15.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001773834228515625, -0.0017108023166656494, -0.0016477704048156738, -0.0015847384929656982, -0.0015217065811157227, -0.001458674669265747, -0.0013956427574157715, -0.001332610845565796, -0.0012695789337158203, -0.0012065470218658447, -0.0011435151100158691, -0.0010804831981658936, -0.001017451286315918, -0.0009544193744659424, -0.0008913874626159668, -0.0008283555507659912, -0.0007653236389160156, -0.00070229172706604, -0.0006392598152160645, -0.0005762279033660889, -0.0005131959915161133, -0.0004501640796661377, -0.0003871321678161621, -0.0003241002559661865, -0.00026106834411621094, -0.00019803643226623535, -0.00013500452041625977, -7.197260856628418e-05, -8.940696716308594e-06, 5.409121513366699e-05, 0.00011712312698364258, 0.00018015503883361816, 0.00024318695068359375, 0.00030621886253356934, 0.0003692507743835449, 0.0004322826862335205, 0.0004953145980834961, 0.0005583465099334717, 0.0006213784217834473, 0.0006844103336334229, 0.0007474422454833984, 0.000810474157333374, 0.0008735060691833496, 0.0009365379810333252, 0.0009995698928833008, 0.0010626018047332764, 0.001125633716583252, 0.0011886656284332275, 0.0012516975402832031, 0.0013147294521331787, 0.0013777613639831543, 0.0014407932758331299, 0.0015038251876831055, 0.001566857099533081, 0.0016298890113830566, 0.0016929209232330322, 0.0017559528350830078, 0.0018189847469329834, 0.001882016658782959, 0.0019450485706329346, 0.00200808048248291, 0.0020711123943328857, 0.0021341443061828613, 0.002197176218032837, 0.0022602081298828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 7.0, 14.0, 18.0, 19.0, 33.0, 32.0, 40.0, 50.0, 78.0, 99.0, 123.0, 204.0, 261.0, 397.0, 709.0, 2458.0, 891582.0, 149158.0, 1340.0, 603.0, 374.0, 249.0, 171.0, 125.0, 74.0, 60.0, 57.0, 49.0, 39.0, 27.0, 25.0, 14.0, 9.0, 14.0, 6.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.04388427734375, -0.042693138122558594, -0.04150199890136719, -0.04031085968017578, -0.039119720458984375, -0.03792858123779297, -0.03673744201660156, -0.035546302795410156, -0.03435516357421875, -0.033164024353027344, -0.03197288513183594, -0.03078174591064453, -0.029590606689453125, -0.02839946746826172, -0.027208328247070312, -0.026017189025878906, -0.0248260498046875, -0.023634910583496094, -0.022443771362304688, -0.02125263214111328, -0.020061492919921875, -0.01887035369873047, -0.017679214477539062, -0.016488075256347656, -0.01529693603515625, -0.014105796813964844, -0.012914657592773438, -0.011723518371582031, -0.010532379150390625, -0.009341239929199219, -0.008150100708007812, -0.006958961486816406, -0.005767822265625, -0.004576683044433594, -0.0033855438232421875, -0.0021944046020507812, -0.001003265380859375, 0.00018787384033203125, 0.0013790130615234375, 0.0025701522827148438, 0.00376129150390625, 0.004952430725097656, 0.0061435699462890625, 0.007334709167480469, 0.008525848388671875, 0.009716987609863281, 0.010908126831054688, 0.012099266052246094, 0.0132904052734375, 0.014481544494628906, 0.015672683715820312, 0.01686382293701172, 0.018054962158203125, 0.01924610137939453, 0.020437240600585938, 0.021628379821777344, 0.02281951904296875, 0.024010658264160156, 0.025201797485351562, 0.02639293670654297, 0.027584075927734375, 0.02877521514892578, 0.029966354370117188, 0.031157493591308594, 0.0323486328125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 15.0, 170.0, 627.0, 193.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007932843640446663, -0.007702961564064026, -0.007473079487681389, -0.007243197411298752, -0.007013315334916115, -0.006783433258533478, -0.0065535507164895535, -0.006323668640106916, -0.006093786563724279, -0.005863904487341642, -0.005634022410959005, -0.005404140334576368, -0.005174257792532444, -0.004944375716149807, -0.00471449363976717, -0.004484611563384533, -0.004254729487001896, -0.004024847410619259, -0.003794965334236622, -0.003565083025023341, -0.003335200948640704, -0.003105318872258067, -0.0028754365630447865, -0.0026455544866621494, -0.0024156724102795124, -0.0021857903338968754, -0.0019559082575142384, -0.0017260259483009577, -0.0014961438719183207, -0.0012662617955356836, -0.0010363796027377248, -0.0008064974099397659, -0.0005766157992184162, -0.0003467336646281183, -0.00011685153003782034, 0.0001130306045524776, 0.00034291273914277554, 0.0005727948155254126, 0.0008026770083233714, 0.0010325592011213303, 0.0012624412775039673, 0.0014923233538866043, 0.0017222055466845632, 0.001952087739482522, 0.002181969815865159, 0.002411851892247796, 0.0026417342014610767, 0.0028716162778437138, 0.003101498354226351, 0.003331380430608988, 0.003561262506991625, 0.0037911448162049055, 0.004021027125418186, 0.004250909201800823, 0.00448079127818346, 0.004710673354566097, 0.004940555430948734, 0.005170437507331371, 0.005400319583714008, 0.005630201660096645, 0.005860083736479282, 0.006089965812861919, 0.006319848354905844, 0.006549730431288481, 0.006779612507671118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 7.0, 5.0, 7.0, 8.0, 10.0, 12.0, 16.0, 19.0, 24.0, 15.0, 21.0, 33.0, 20.0, 39.0, 32.0, 30.0, 32.0, 39.0, 40.0, 39.0, 46.0, 40.0, 42.0, 42.0, 38.0, 43.0, 48.0, 31.0, 30.0, 30.0, 20.0, 27.0, 31.0, 17.0, 17.0, 10.0, 16.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0011107921600341797, -0.0010784519836306572, -0.0010461118072271347, -0.0010137716308236122, -0.0009814314544200897, -0.0009490912780165672, -0.0009167511016130447, -0.0008844109252095222, -0.0008520707488059998, -0.0008197305724024773, -0.0007873903959989548, -0.0007550502195954323, -0.0007227100431919098, -0.0006903698667883873, -0.0006580296903848648, -0.0006256895139813423, -0.0005933493375778198, -0.0005610091611742973, -0.0005286689847707748, -0.0004963288083672523, -0.00046398863196372986, -0.00043164845556020737, -0.0003993082791566849, -0.0003669681027531624, -0.0003346279263496399, -0.0003022877499461174, -0.0002699475735425949, -0.00023760739713907242, -0.00020526722073554993, -0.00017292704433202744, -0.00014058686792850494, -0.00010824669152498245, -7.590651512145996e-05, -4.356633871793747e-05, -1.1226162314414978e-05, 2.1114014089107513e-05, 5.3454190492630005e-05, 8.57943668961525e-05, 0.00011813454329967499, 0.00015047471970319748, 0.00018281489610671997, 0.00021515507251024246, 0.00024749524891376495, 0.00027983542531728745, 0.00031217560172080994, 0.00034451577812433243, 0.0003768559545278549, 0.0004091961309313774, 0.0004415363073348999, 0.0004738764837384224, 0.0005062166601419449, 0.0005385568365454674, 0.0005708970129489899, 0.0006032371893525124, 0.0006355773657560349, 0.0006679175421595573, 0.0007002577185630798, 0.0007325978949666023, 0.0007649380713701248, 0.0007972782477736473, 0.0008296184241771698, 0.0008619586005806923, 0.0008942987769842148, 0.0009266389533877373, 0.0009589791297912598]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 39.0, 36.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 27.0, 17.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 27.0, 28.0, 17.0, 55.0, 62.0, 72.0, 121.0, 121.0, 201.0, 301.0, 446.0, 648.0, 1095.0, 1856.0, 3906.0, 10705.0, 38054.0, 201413.0, 604108.0, 140026.0, 28655.0, 8510.0, 3444.0, 1691.0, 1009.0, 604.0, 385.0, 279.0, 187.0, 134.0, 98.0, 73.0, 52.0, 33.0, 31.0, 26.0, 13.0, 7.0, 12.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4296875, -9.12939453125, -8.8291015625, -8.52880859375, -8.228515625, -7.92822265625, -7.6279296875, -7.32763671875, -7.02734375, -6.72705078125, -6.4267578125, -6.12646484375, -5.826171875, -5.52587890625, -5.2255859375, -4.92529296875, -4.625, -4.32470703125, -4.0244140625, -3.72412109375, -3.423828125, -3.12353515625, -2.8232421875, -2.52294921875, -2.22265625, -1.92236328125, -1.6220703125, -1.32177734375, -1.021484375, -0.72119140625, -0.4208984375, -0.12060546875, 0.1796875, 0.47998046875, 0.7802734375, 1.08056640625, 1.380859375, 1.68115234375, 1.9814453125, 2.28173828125, 2.58203125, 2.88232421875, 3.1826171875, 3.48291015625, 3.783203125, 4.08349609375, 4.3837890625, 4.68408203125, 4.984375, 5.28466796875, 5.5849609375, 5.88525390625, 6.185546875, 6.48583984375, 6.7861328125, 7.08642578125, 7.38671875, 7.68701171875, 7.9873046875, 8.28759765625, 8.587890625, 8.88818359375, 9.1884765625, 9.48876953125, 9.7890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 20.0, 17.0, 34.0, 35.0, 40.0, 52.0, 57.0, 61.0, 101.0, 282.0, 1688.0, 176.0, 104.0, 63.0, 46.0, 43.0, 46.0, 34.0, 25.0, 11.0, 16.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.49560546875, -15.9130859375, -15.33056640625, -14.748046875, -14.16552734375, -13.5830078125, -13.00048828125, -12.41796875, -11.83544921875, -11.2529296875, -10.67041015625, -10.087890625, -9.50537109375, -8.9228515625, -8.34033203125, -7.7578125, -7.17529296875, -6.5927734375, -6.01025390625, -5.427734375, -4.84521484375, -4.2626953125, -3.68017578125, -3.09765625, -2.51513671875, -1.9326171875, -1.35009765625, -0.767578125, -0.18505859375, 0.3974609375, 0.97998046875, 1.5625, 2.14501953125, 2.7275390625, 3.31005859375, 3.892578125, 4.47509765625, 5.0576171875, 5.64013671875, 6.22265625, 6.80517578125, 7.3876953125, 7.97021484375, 8.552734375, 9.13525390625, 9.7177734375, 10.30029296875, 10.8828125, 11.46533203125, 12.0478515625, 12.63037109375, 13.212890625, 13.79541015625, 14.3779296875, 14.96044921875, 15.54296875, 16.12548828125, 16.7080078125, 17.29052734375, 17.873046875, 18.45556640625, 19.0380859375, 19.62060546875, 20.203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 18.0, 21.0, 24.0, 26.0, 50.0, 82.0, 168.0, 284.0, 630.0, 2392.0, 3122660.0, 17465.0, 959.0, 383.0, 195.0, 117.0, 59.0, 41.0, 29.0, 22.0, 20.0, 7.0, 3.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.25, -59.53466796875, -57.8193359375, -56.10400390625, -54.388671875, -52.67333984375, -50.9580078125, -49.24267578125, -47.52734375, -45.81201171875, -44.0966796875, -42.38134765625, -40.666015625, -38.95068359375, -37.2353515625, -35.52001953125, -33.8046875, -32.08935546875, -30.3740234375, -28.65869140625, -26.943359375, -25.22802734375, -23.5126953125, -21.79736328125, -20.08203125, -18.36669921875, -16.6513671875, -14.93603515625, -13.220703125, -11.50537109375, -9.7900390625, -8.07470703125, -6.359375, -4.64404296875, -2.9287109375, -1.21337890625, 0.501953125, 2.21728515625, 3.9326171875, 5.64794921875, 7.36328125, 9.07861328125, 10.7939453125, 12.50927734375, 14.224609375, 15.93994140625, 17.6552734375, 19.37060546875, 21.0859375, 22.80126953125, 24.5166015625, 26.23193359375, 27.947265625, 29.66259765625, 31.3779296875, 33.09326171875, 34.80859375, 36.52392578125, 38.2392578125, 39.95458984375, 41.669921875, 43.38525390625, 45.1005859375, 46.81591796875, 48.53125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 204.0, 726.0, 76.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.03435516357422, -60.329872131347656, -56.625389099121094, -52.9209098815918, -49.216426849365234, -45.51194381713867, -41.807464599609375, -38.10298156738281, -34.39849853515625, -30.694015502929688, -26.989534378051758, -23.285053253173828, -19.580570220947266, -15.876087188720703, -12.171606063842773, -8.467124938964844, -4.762641906738281, -1.0581598281860352, 2.646322250366211, 6.350804328918457, 10.055286407470703, 13.759769439697266, 17.464250564575195, 21.168731689453125, 24.873214721679688, 28.57769775390625, 32.28218078613281, 35.98666000366211, 39.69114303588867, 43.395626068115234, 47.10010528564453, 50.804588317871094, 54.509063720703125, 58.21354675292969, 61.91802978515625, 65.62251281738281, 69.32699584960938, 73.03147888183594, 76.73595428466797, 80.44043731689453, 84.1449203491211, 87.84940338134766, 91.55388641357422, 95.25836944580078, 98.96284484863281, 102.66732788085938, 106.37181091308594, 110.0762939453125, 113.78077697753906, 117.48526000976562, 121.18974304199219, 124.89422607421875, 128.5987091064453, 132.30319213867188, 136.00767517089844, 139.712158203125, 143.4166259765625, 147.12110900878906, 150.82559204101562, 154.5300750732422, 158.23455810546875, 161.9390411376953, 165.64352416992188, 169.34799194335938, 173.052490234375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 13.0, 18.0, 23.0, 18.0, 22.0, 24.0, 22.0, 28.0, 38.0, 35.0, 46.0, 32.0, 37.0, 42.0, 44.0, 50.0, 43.0, 34.0, 39.0, 35.0, 36.0, 30.0, 36.0, 29.0, 30.0, 30.0, 21.0, 14.0, 15.0, 13.0, 13.0, 11.0, 7.0, 10.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-34.330711364746094, -33.250938415527344, -32.17116928100586, -31.09139633178711, -30.01162338256836, -28.931852340698242, -27.852081298828125, -26.772308349609375, -25.692535400390625, -24.612764358520508, -23.532991409301758, -22.45322036743164, -21.37344741821289, -20.293676376342773, -19.213905334472656, -18.134132385253906, -17.05436134338379, -15.974589347839355, -14.894817352294922, -13.815046310424805, -12.735273361206055, -11.655502319335938, -10.575730323791504, -9.49595832824707, -8.416186332702637, -7.336414337158203, -6.2566423416137695, -5.176870822906494, -4.0970988273620605, -3.017326831817627, -1.9375553131103516, -0.857783317565918, 0.22198867797851562, 1.3017605543136597, 2.3815324306488037, 3.461304187774658, 4.541076183319092, 5.620848178863525, 6.700619697570801, 7.780391693115234, 8.860163688659668, 9.939935684204102, 11.019707679748535, 12.099479675292969, 13.179250717163086, 14.259023666381836, 15.338794708251953, 16.418567657470703, 17.49833869934082, 18.578109741210938, 19.657882690429688, 20.737653732299805, 21.817426681518555, 22.897197723388672, 23.976970672607422, 25.05674171447754, 26.136512756347656, 27.216283798217773, 28.296056747436523, 29.37582778930664, 30.45560073852539, 31.535371780395508, 32.615142822265625, 33.694915771484375, 34.774688720703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 8.0, 16.0, 17.0, 18.0, 24.0, 22.0, 23.0, 18.0, 31.0, 41.0, 36.0, 36.0, 44.0, 37.0, 44.0, 46.0, 48.0, 34.0, 29.0, 57.0, 26.0, 36.0, 43.0, 28.0, 25.0, 23.0, 21.0, 30.0, 14.0, 21.0, 11.0, 18.0, 7.0, 4.0, 5.0, 4.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.1334228515625, -6.923095703125, -6.7127685546875, -6.50244140625, -6.2921142578125, -6.081787109375, -5.8714599609375, -5.6611328125, -5.4508056640625, -5.240478515625, -5.0301513671875, -4.81982421875, -4.6094970703125, -4.399169921875, -4.1888427734375, -3.978515625, -3.7681884765625, -3.557861328125, -3.3475341796875, -3.13720703125, -2.9268798828125, -2.716552734375, -2.5062255859375, -2.2958984375, -2.0855712890625, -1.875244140625, -1.6649169921875, -1.45458984375, -1.2442626953125, -1.033935546875, -0.8236083984375, -0.61328125, -0.4029541015625, -0.192626953125, 0.0177001953125, 0.22802734375, 0.4383544921875, 0.648681640625, 0.8590087890625, 1.0693359375, 1.2796630859375, 1.489990234375, 1.7003173828125, 1.91064453125, 2.1209716796875, 2.331298828125, 2.5416259765625, 2.751953125, 2.9622802734375, 3.172607421875, 3.3829345703125, 3.59326171875, 3.8035888671875, 4.013916015625, 4.2242431640625, 4.4345703125, 4.6448974609375, 4.855224609375, 5.0655517578125, 5.27587890625, 5.4862060546875, 5.696533203125, 5.9068603515625, 6.1171875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 14.0, 11.0, 16.0, 22.0, 26.0, 41.0, 35.0, 44.0, 59.0, 60.0, 77.0, 116.0, 156.0, 202.0, 224.0, 360.0, 490.0, 883.0, 1818.0, 6791.0, 81212.0, 3554881.0, 526849.0, 13834.0, 2762.0, 1058.0, 584.0, 403.0, 253.0, 202.0, 164.0, 126.0, 102.0, 79.0, 62.0, 58.0, 41.0, 34.0, 24.0, 14.0, 17.0, 15.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.0625, -32.01904296875, -30.9755859375, -29.93212890625, -28.888671875, -27.84521484375, -26.8017578125, -25.75830078125, -24.71484375, -23.67138671875, -22.6279296875, -21.58447265625, -20.541015625, -19.49755859375, -18.4541015625, -17.41064453125, -16.3671875, -15.32373046875, -14.2802734375, -13.23681640625, -12.193359375, -11.14990234375, -10.1064453125, -9.06298828125, -8.01953125, -6.97607421875, -5.9326171875, -4.88916015625, -3.845703125, -2.80224609375, -1.7587890625, -0.71533203125, 0.328125, 1.37158203125, 2.4150390625, 3.45849609375, 4.501953125, 5.54541015625, 6.5888671875, 7.63232421875, 8.67578125, 9.71923828125, 10.7626953125, 11.80615234375, 12.849609375, 13.89306640625, 14.9365234375, 15.97998046875, 17.0234375, 18.06689453125, 19.1103515625, 20.15380859375, 21.197265625, 22.24072265625, 23.2841796875, 24.32763671875, 25.37109375, 26.41455078125, 27.4580078125, 28.50146484375, 29.544921875, 30.58837890625, 31.6318359375, 32.67529296875, 33.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 17.0, 25.0, 86.0, 178.0, 488.0, 972.0, 1256.0, 597.0, 245.0, 104.0, 46.0, 16.0, 15.0, 5.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.78125, -36.9447021484375, -36.108154296875, -35.2716064453125, -34.43505859375, -33.5985107421875, -32.761962890625, -31.9254150390625, -31.0888671875, -30.2523193359375, -29.415771484375, -28.5792236328125, -27.74267578125, -26.9061279296875, -26.069580078125, -25.2330322265625, -24.396484375, -23.5599365234375, -22.723388671875, -21.8868408203125, -21.05029296875, -20.2137451171875, -19.377197265625, -18.5406494140625, -17.7041015625, -16.8675537109375, -16.031005859375, -15.1944580078125, -14.35791015625, -13.5213623046875, -12.684814453125, -11.8482666015625, -11.01171875, -10.1751708984375, -9.338623046875, -8.5020751953125, -7.66552734375, -6.8289794921875, -5.992431640625, -5.1558837890625, -4.3193359375, -3.4827880859375, -2.646240234375, -1.8096923828125, -0.97314453125, -0.1365966796875, 0.699951171875, 1.5364990234375, 2.373046875, 3.2095947265625, 4.046142578125, 4.8826904296875, 5.71923828125, 6.5557861328125, 7.392333984375, 8.2288818359375, 9.0654296875, 9.9019775390625, 10.738525390625, 11.5750732421875, 12.41162109375, 13.2481689453125, 14.084716796875, 14.9212646484375, 15.7578125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 8.0, 15.0, 31.0, 43.0, 45.0, 89.0, 178.0, 535.0, 2273.0, 29930.0, 3812218.0, 340758.0, 6612.0, 933.0, 324.0, 117.0, 71.0, 37.0, 27.0, 16.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.0625, -40.9482421875, -39.833984375, -38.7197265625, -37.60546875, -36.4912109375, -35.376953125, -34.2626953125, -33.1484375, -32.0341796875, -30.919921875, -29.8056640625, -28.69140625, -27.5771484375, -26.462890625, -25.3486328125, -24.234375, -23.1201171875, -22.005859375, -20.8916015625, -19.77734375, -18.6630859375, -17.548828125, -16.4345703125, -15.3203125, -14.2060546875, -13.091796875, -11.9775390625, -10.86328125, -9.7490234375, -8.634765625, -7.5205078125, -6.40625, -5.2919921875, -4.177734375, -3.0634765625, -1.94921875, -0.8349609375, 0.279296875, 1.3935546875, 2.5078125, 3.6220703125, 4.736328125, 5.8505859375, 6.96484375, 8.0791015625, 9.193359375, 10.3076171875, 11.421875, 12.5361328125, 13.650390625, 14.7646484375, 15.87890625, 16.9931640625, 18.107421875, 19.2216796875, 20.3359375, 21.4501953125, 22.564453125, 23.6787109375, 24.79296875, 25.9072265625, 27.021484375, 28.1357421875, 29.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 19.0, 26.0, 27.0, 70.0, 103.0, 123.0, 128.0, 137.0, 111.0, 83.0, 68.0, 34.0, 21.0, 21.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.160179138183594, -37.987518310546875, -34.814857482910156, -31.642200469970703, -28.469539642333984, -25.296878814697266, -22.12421989440918, -18.951560974121094, -15.778900146484375, -12.606240272521973, -9.43358039855957, -6.260920524597168, -3.0882606506347656, 0.08439922332763672, 3.257059097290039, 6.429718017578125, 9.602378845214844, 12.775038719177246, 15.947698593139648, 19.120357513427734, 22.293018341064453, 25.465679168701172, 28.638338088989258, 31.810997009277344, 34.98365783691406, 38.15631866455078, 41.3289794921875, 44.50163650512695, 47.67429733276367, 50.84695816040039, 54.019615173339844, 57.19227600097656, 60.36494445800781, 63.53760528564453, 66.71026611328125, 69.88292694091797, 73.05558776855469, 76.22824096679688, 79.4009017944336, 82.57356262207031, 85.74622344970703, 88.91888427734375, 92.09154510498047, 95.26420593261719, 98.43685913085938, 101.6095199584961, 104.78218078613281, 107.95484161376953, 111.12750244140625, 114.30016326904297, 117.47282409667969, 120.6454849243164, 123.81814575195312, 126.99079895019531, 130.16346740722656, 133.33612060546875, 136.5087890625, 139.6814422607422, 142.85411071777344, 146.02676391601562, 149.19943237304688, 152.37208557128906, 155.5447540283203, 158.7174072265625, 161.8900604248047]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 5.0, 4.0, 9.0, 16.0, 20.0, 13.0, 24.0, 18.0, 24.0, 24.0, 34.0, 27.0, 30.0, 31.0, 29.0, 39.0, 34.0, 36.0, 44.0, 44.0, 39.0, 42.0, 35.0, 37.0, 31.0, 28.0, 38.0, 16.0, 31.0, 30.0, 24.0, 18.0, 13.0, 17.0, 13.0, 11.0, 16.0, 6.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.422119140625, -39.09198760986328, -37.76185989379883, -36.43172836303711, -35.101600646972656, -33.77146911621094, -32.44133758544922, -31.111207962036133, -29.781078338623047, -28.45094871520996, -27.120819091796875, -25.790687561035156, -24.46055793762207, -23.130428314208984, -21.800296783447266, -20.47016716003418, -19.140037536621094, -17.809907913208008, -16.479778289794922, -15.149646759033203, -13.819517135620117, -12.489387512207031, -11.159256935119629, -9.829126358032227, -8.49899673461914, -7.1688666343688965, -5.838736534118652, -4.508606433868408, -3.178476333618164, -1.84834623336792, -0.5182161331176758, 0.8119144439697266, 2.1420440673828125, 3.4721741676330566, 4.802304267883301, 6.132434368133545, 7.462564468383789, 8.792694091796875, 10.122824668884277, 11.45295524597168, 12.783084869384766, 14.113214492797852, 15.443345069885254, 16.773475646972656, 18.103605270385742, 19.433734893798828, 20.763866424560547, 22.093996047973633, 23.42412567138672, 24.754255294799805, 26.08438491821289, 27.41451644897461, 28.744646072387695, 30.07477569580078, 31.4049072265625, 32.73503875732422, 34.06516647338867, 35.39529800415039, 36.725425720214844, 38.05555725097656, 39.38568878173828, 40.715816497802734, 42.04594802856445, 43.376075744628906, 44.706207275390625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 7.0, 5.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 19.0, 27.0, 36.0, 33.0, 29.0, 28.0, 42.0, 42.0, 39.0, 29.0, 42.0, 44.0, 50.0, 42.0, 40.0, 27.0, 36.0, 29.0, 27.0, 30.0, 28.0, 24.0, 26.0, 17.0, 9.0, 16.0, 19.0, 12.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-75.125, -72.7626953125, -70.400390625, -68.0380859375, -65.67578125, -63.3134765625, -60.951171875, -58.5888671875, -56.2265625, -53.8642578125, -51.501953125, -49.1396484375, -46.77734375, -44.4150390625, -42.052734375, -39.6904296875, -37.328125, -34.9658203125, -32.603515625, -30.2412109375, -27.87890625, -25.5166015625, -23.154296875, -20.7919921875, -18.4296875, -16.0673828125, -13.705078125, -11.3427734375, -8.98046875, -6.6181640625, -4.255859375, -1.8935546875, 0.46875, 2.8310546875, 5.193359375, 7.5556640625, 9.91796875, 12.2802734375, 14.642578125, 17.0048828125, 19.3671875, 21.7294921875, 24.091796875, 26.4541015625, 28.81640625, 31.1787109375, 33.541015625, 35.9033203125, 38.265625, 40.6279296875, 42.990234375, 45.3525390625, 47.71484375, 50.0771484375, 52.439453125, 54.8017578125, 57.1640625, 59.5263671875, 61.888671875, 64.2509765625, 66.61328125, 68.9755859375, 71.337890625, 73.7001953125, 76.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 13.0, 14.0, 28.0, 37.0, 66.0, 104.0, 159.0, 246.0, 406.0, 572.0, 929.0, 1429.0, 2098.0, 3379.0, 5069.0, 7840.0, 12261.0, 18763.0, 29532.0, 46597.0, 72496.0, 108444.0, 148386.0, 167116.0, 140643.0, 99082.0, 65315.0, 42101.0, 26727.0, 17218.0, 11175.0, 7108.0, 4573.0, 3042.0, 1982.0, 1272.0, 808.0, 547.0, 368.0, 223.0, 152.0, 90.0, 53.0, 36.0, 26.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.0625, -5.88092041015625, -5.6993408203125, -5.51776123046875, -5.336181640625, -5.15460205078125, -4.9730224609375, -4.79144287109375, -4.60986328125, -4.42828369140625, -4.2467041015625, -4.06512451171875, -3.883544921875, -3.70196533203125, -3.5203857421875, -3.33880615234375, -3.1572265625, -2.97564697265625, -2.7940673828125, -2.61248779296875, -2.430908203125, -2.24932861328125, -2.0677490234375, -1.88616943359375, -1.70458984375, -1.52301025390625, -1.3414306640625, -1.15985107421875, -0.978271484375, -0.79669189453125, -0.6151123046875, -0.43353271484375, -0.251953125, -0.07037353515625, 0.1112060546875, 0.29278564453125, 0.474365234375, 0.65594482421875, 0.8375244140625, 1.01910400390625, 1.20068359375, 1.38226318359375, 1.5638427734375, 1.74542236328125, 1.927001953125, 2.10858154296875, 2.2901611328125, 2.47174072265625, 2.6533203125, 2.83489990234375, 3.0164794921875, 3.19805908203125, 3.379638671875, 3.56121826171875, 3.7427978515625, 3.92437744140625, 4.10595703125, 4.28753662109375, 4.4691162109375, 4.65069580078125, 4.832275390625, 5.01385498046875, 5.1954345703125, 5.37701416015625, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 11.0, 9.0, 8.0, 15.0, 27.0, 24.0, 25.0, 25.0, 24.0, 29.0, 26.0, 36.0, 41.0, 55.0, 30.0, 42.0, 49.0, 1066.0, 43.0, 39.0, 35.0, 30.0, 22.0, 46.0, 38.0, 33.0, 24.0, 26.0, 18.0, 11.0, 20.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.875, -51.2802734375, -49.685546875, -48.0908203125, -46.49609375, -44.9013671875, -43.306640625, -41.7119140625, -40.1171875, -38.5224609375, -36.927734375, -35.3330078125, -33.73828125, -32.1435546875, -30.548828125, -28.9541015625, -27.359375, -25.7646484375, -24.169921875, -22.5751953125, -20.98046875, -19.3857421875, -17.791015625, -16.1962890625, -14.6015625, -13.0068359375, -11.412109375, -9.8173828125, -8.22265625, -6.6279296875, -5.033203125, -3.4384765625, -1.84375, -0.2490234375, 1.345703125, 2.9404296875, 4.53515625, 6.1298828125, 7.724609375, 9.3193359375, 10.9140625, 12.5087890625, 14.103515625, 15.6982421875, 17.29296875, 18.8876953125, 20.482421875, 22.0771484375, 23.671875, 25.2666015625, 26.861328125, 28.4560546875, 30.05078125, 31.6455078125, 33.240234375, 34.8349609375, 36.4296875, 38.0244140625, 39.619140625, 41.2138671875, 42.80859375, 44.4033203125, 45.998046875, 47.5927734375, 49.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 7.0, 17.0, 28.0, 35.0, 57.0, 74.0, 119.0, 196.0, 314.0, 503.0, 693.0, 1133.0, 1799.0, 2854.0, 4552.0, 7190.0, 11324.0, 17975.0, 28865.0, 46365.0, 73301.0, 112166.0, 153878.0, 1216529.0, 142627.0, 100577.0, 64647.0, 40615.0, 25373.0, 15975.0, 9990.0, 6432.0, 4018.0, 2628.0, 1563.0, 955.0, 615.0, 380.0, 271.0, 150.0, 114.0, 83.0, 53.0, 34.0, 16.0, 15.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.640625, -5.46075439453125, -5.2808837890625, -5.10101318359375, -4.921142578125, -4.74127197265625, -4.5614013671875, -4.38153076171875, -4.20166015625, -4.02178955078125, -3.8419189453125, -3.66204833984375, -3.482177734375, -3.30230712890625, -3.1224365234375, -2.94256591796875, -2.7626953125, -2.58282470703125, -2.4029541015625, -2.22308349609375, -2.043212890625, -1.86334228515625, -1.6834716796875, -1.50360107421875, -1.32373046875, -1.14385986328125, -0.9639892578125, -0.78411865234375, -0.604248046875, -0.42437744140625, -0.2445068359375, -0.06463623046875, 0.115234375, 0.29510498046875, 0.4749755859375, 0.65484619140625, 0.834716796875, 1.01458740234375, 1.1944580078125, 1.37432861328125, 1.55419921875, 1.73406982421875, 1.9139404296875, 2.09381103515625, 2.273681640625, 2.45355224609375, 2.6334228515625, 2.81329345703125, 2.9931640625, 3.17303466796875, 3.3529052734375, 3.53277587890625, 3.712646484375, 3.89251708984375, 4.0723876953125, 4.25225830078125, 4.43212890625, 4.61199951171875, 4.7918701171875, 4.97174072265625, 5.151611328125, 5.33148193359375, 5.5113525390625, 5.69122314453125, 5.87109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 6.0, 6.0, 6.0, 9.0, 10.0, 10.0, 20.0, 13.0, 22.0, 47.0, 23.0, 37.0, 44.0, 47.0, 70.0, 69.0, 70.0, 74.0, 62.0, 54.0, 52.0, 44.0, 28.0, 28.0, 27.0, 26.0, 14.0, 11.0, 9.0, 13.0, 8.0, 1.0, 5.0, 0.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04443359375, -0.042922019958496094, -0.04141044616699219, -0.03989887237548828, -0.038387298583984375, -0.03687572479248047, -0.03536415100097656, -0.033852577209472656, -0.03234100341796875, -0.030829429626464844, -0.029317855834960938, -0.02780628204345703, -0.026294708251953125, -0.02478313446044922, -0.023271560668945312, -0.021759986877441406, -0.0202484130859375, -0.018736839294433594, -0.017225265502929688, -0.01571369171142578, -0.014202117919921875, -0.012690544128417969, -0.011178970336914062, -0.009667396545410156, -0.00815582275390625, -0.006644248962402344, -0.0051326751708984375, -0.0036211013793945312, -0.002109527587890625, -0.0005979537963867188, 0.0009136199951171875, 0.0024251937866210938, 0.003936767578125, 0.005448341369628906, 0.0069599151611328125, 0.008471488952636719, 0.009983062744140625, 0.011494636535644531, 0.013006210327148438, 0.014517784118652344, 0.01602935791015625, 0.017540931701660156, 0.019052505493164062, 0.02056407928466797, 0.022075653076171875, 0.02358722686767578, 0.025098800659179688, 0.026610374450683594, 0.0281219482421875, 0.029633522033691406, 0.031145095825195312, 0.03265666961669922, 0.034168243408203125, 0.03567981719970703, 0.03719139099121094, 0.038702964782714844, 0.04021453857421875, 0.041726112365722656, 0.04323768615722656, 0.04474925994873047, 0.046260833740234375, 0.04777240753173828, 0.04928398132324219, 0.050795555114746094, 0.05230712890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 11.0, 9.0, 11.0, 18.0, 17.0, 21.0, 31.0, 50.0, 55.0, 70.0, 96.0, 133.0, 171.0, 204.0, 337.0, 590.0, 978.0, 1908.0, 4782.0, 14837.0, 56362.0, 258210.0, 515524.0, 144019.0, 33524.0, 9401.0, 3306.0, 1484.0, 791.0, 458.0, 312.0, 179.0, 145.0, 131.0, 86.0, 68.0, 54.0, 34.0, 36.0, 22.0, 10.0, 16.0, 11.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.31689453125, -0.3076591491699219, -0.29842376708984375, -0.2891883850097656, -0.2799530029296875, -0.2707176208496094, -0.26148223876953125, -0.2522468566894531, -0.243011474609375, -0.23377609252929688, -0.22454071044921875, -0.21530532836914062, -0.2060699462890625, -0.19683456420898438, -0.18759918212890625, -0.17836380004882812, -0.16912841796875, -0.15989303588867188, -0.15065765380859375, -0.14142227172851562, -0.1321868896484375, -0.12295150756835938, -0.11371612548828125, -0.10448074340820312, -0.095245361328125, -0.08600997924804688, -0.07677459716796875, -0.06753921508789062, -0.0583038330078125, -0.049068450927734375, -0.03983306884765625, -0.030597686767578125, -0.0213623046875, -0.012126922607421875, -0.00289154052734375, 0.006343841552734375, 0.0155792236328125, 0.024814605712890625, 0.03404998779296875, 0.043285369873046875, 0.052520751953125, 0.061756134033203125, 0.07099151611328125, 0.08022689819335938, 0.0894622802734375, 0.09869766235351562, 0.10793304443359375, 0.11716842651367188, 0.12640380859375, 0.13563919067382812, 0.14487457275390625, 0.15410995483398438, 0.1633453369140625, 0.17258071899414062, 0.18181610107421875, 0.19105148315429688, 0.200286865234375, 0.20952224731445312, 0.21875762939453125, 0.22799301147460938, 0.2372283935546875, 0.24646377563476562, 0.25569915771484375, 0.2649345397949219, 0.274169921875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 37.0, 55.0, 102.0, 175.0, 196.0, 144.0, 99.0, 70.0, 39.0, 24.0, 12.0, 14.0, 6.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04953237250447273, -0.04664928838610649, -0.04376620054244995, -0.04088311642408371, -0.03800003230571747, -0.03511694818735123, -0.03223386034369469, -0.029350776225328445, -0.026467690244317055, -0.023584604263305664, -0.020701520144939423, -0.017818434163928032, -0.014935349114239216, -0.0120522640645504, -0.009169178083539009, -0.006286093965172768, -0.003403007984161377, -0.0005199227016419172, 0.0023631625808775425, 0.005246248096227646, 0.008129333145916462, 0.011012418195605278, 0.013895504176616669, 0.01677858829498291, 0.0196616742759943, 0.02254476025700569, 0.025427844375371933, 0.028310930356383324, 0.031194016337394714, 0.034077100455760956, 0.0369601845741272, 0.03984326869249344, 0.04272636026144028, 0.04560944437980652, 0.04849253222346306, 0.0513756163418293, 0.05425870046019554, 0.05714178830385208, 0.06002487242221832, 0.06290795654058456, 0.0657910406589508, 0.06867412477731705, 0.07155720889568329, 0.07444030046463013, 0.07732338458299637, 0.08020646870136261, 0.08308955281972885, 0.08597263693809509, 0.08885572850704193, 0.09173881262540817, 0.09462189674377441, 0.09750498831272125, 0.1003880724310875, 0.10327115654945374, 0.10615424066781998, 0.10903732478618622, 0.11192040890455246, 0.1148034930229187, 0.11768657714128494, 0.12056966125965118, 0.12345275282859802, 0.12633582949638367, 0.1292189210653305, 0.13210201263427734, 0.134985089302063]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 10.0, 4.0, 5.0, 10.0, 7.0, 8.0, 12.0, 12.0, 18.0, 23.0, 11.0, 10.0, 27.0, 23.0, 28.0, 38.0, 37.0, 31.0, 40.0, 32.0, 29.0, 51.0, 34.0, 37.0, 44.0, 25.0, 43.0, 47.0, 28.0, 39.0, 30.0, 23.0, 26.0, 22.0, 24.0, 21.0, 17.0, 20.0, 9.0, 12.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03220796585083008, -0.03122302144765854, -0.03023807890713215, -0.02925313636660576, -0.02826819196343422, -0.02728324756026268, -0.02629830501973629, -0.0253133624792099, -0.02432841807603836, -0.02334347367286682, -0.02235853113234043, -0.02137358859181404, -0.020388644188642502, -0.019403699785470963, -0.018418757244944572, -0.017433814704418182, -0.016448870301246643, -0.015463926829397678, -0.014478983357548714, -0.013494039885699749, -0.012509096413850784, -0.01152415294200182, -0.010539209470152855, -0.00955426599830389, -0.008569322526454926, -0.007584379054605961, -0.006599435582756996, -0.0056144921109080315, -0.004629548639059067, -0.003644605167210102, -0.0026596616953611374, -0.0016747182235121727, -0.000689774751663208, 0.0002951687201857567, 0.0012801121920347214, 0.002265055663883686, 0.0032499991357326508, 0.0042349426075816154, 0.00521988607943058, 0.006204829551279545, 0.0071897730231285095, 0.008174716494977474, 0.009159659966826439, 0.010144603438675404, 0.011129546910524368, 0.012114490382373333, 0.013099433854222298, 0.014084377326071262, 0.015069320797920227, 0.016054265201091766, 0.017039207741618156, 0.018024150282144547, 0.019009094685316086, 0.019994039088487625, 0.020978981629014015, 0.021963924169540405, 0.022948868572711945, 0.023933812975883484, 0.024918755516409874, 0.025903698056936264, 0.026888642460107803, 0.027873586863279343, 0.028858529403805733, 0.029843471944332123, 0.030828416347503662]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 6.0, 6.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 20.0, 27.0, 37.0, 30.0, 29.0, 29.0, 41.0, 43.0, 39.0, 30.0, 43.0, 42.0, 49.0, 42.0, 41.0, 26.0, 37.0, 28.0, 29.0, 31.0, 26.0, 24.0, 23.0, 19.0, 10.0, 16.0, 20.0, 11.0, 9.0, 9.0, 10.0, 4.0, 5.0, 3.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-75.0625, -72.7021484375, -70.341796875, -67.9814453125, -65.62109375, -63.2607421875, -60.900390625, -58.5400390625, -56.1796875, -53.8193359375, -51.458984375, -49.0986328125, -46.73828125, -44.3779296875, -42.017578125, -39.6572265625, -37.296875, -34.9365234375, -32.576171875, -30.2158203125, -27.85546875, -25.4951171875, -23.134765625, -20.7744140625, -18.4140625, -16.0537109375, -13.693359375, -11.3330078125, -8.97265625, -6.6123046875, -4.251953125, -1.8916015625, 0.46875, 2.8291015625, 5.189453125, 7.5498046875, 9.91015625, 12.2705078125, 14.630859375, 16.9912109375, 19.3515625, 21.7119140625, 24.072265625, 26.4326171875, 28.79296875, 31.1533203125, 33.513671875, 35.8740234375, 38.234375, 40.5947265625, 42.955078125, 45.3154296875, 47.67578125, 50.0361328125, 52.396484375, 54.7568359375, 57.1171875, 59.4775390625, 61.837890625, 64.1982421875, 66.55859375, 68.9189453125, 71.279296875, 73.6396484375, 76.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 5.0, 11.0, 17.0, 19.0, 24.0, 39.0, 45.0, 77.0, 88.0, 177.0, 253.0, 373.0, 689.0, 1233.0, 2272.0, 4740.0, 11699.0, 37529.0, 180240.0, 593883.0, 160095.0, 34364.0, 11073.0, 4484.0, 2155.0, 1191.0, 621.0, 400.0, 214.0, 161.0, 102.0, 83.0, 52.0, 27.0, 21.0, 26.0, 13.0, 17.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.517578125, -15.95703125, -15.396484375, -14.8359375, -14.275390625, -13.71484375, -13.154296875, -12.59375, -12.033203125, -11.47265625, -10.912109375, -10.3515625, -9.791015625, -9.23046875, -8.669921875, -8.109375, -7.548828125, -6.98828125, -6.427734375, -5.8671875, -5.306640625, -4.74609375, -4.185546875, -3.625, -3.064453125, -2.50390625, -1.943359375, -1.3828125, -0.822265625, -0.26171875, 0.298828125, 0.859375, 1.419921875, 1.98046875, 2.541015625, 3.1015625, 3.662109375, 4.22265625, 4.783203125, 5.34375, 5.904296875, 6.46484375, 7.025390625, 7.5859375, 8.146484375, 8.70703125, 9.267578125, 9.828125, 10.388671875, 10.94921875, 11.509765625, 12.0703125, 12.630859375, 13.19140625, 13.751953125, 14.3125, 14.873046875, 15.43359375, 15.994140625, 16.5546875, 17.115234375, 17.67578125, 18.236328125, 18.796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 11.0, 28.0, 29.0, 28.0, 36.0, 48.0, 56.0, 58.0, 72.0, 87.0, 2128.0, 75.0, 79.0, 54.0, 41.0, 39.0, 26.0, 25.0, 19.0, 15.0, 12.0, 7.0, 9.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.5, -168.85546875, -162.2109375, -155.56640625, -148.921875, -142.27734375, -135.6328125, -128.98828125, -122.34375, -115.69921875, -109.0546875, -102.41015625, -95.765625, -89.12109375, -82.4765625, -75.83203125, -69.1875, -62.54296875, -55.8984375, -49.25390625, -42.609375, -35.96484375, -29.3203125, -22.67578125, -16.03125, -9.38671875, -2.7421875, 3.90234375, 10.546875, 17.19140625, 23.8359375, 30.48046875, 37.125, 43.76953125, 50.4140625, 57.05859375, 63.703125, 70.34765625, 76.9921875, 83.63671875, 90.28125, 96.92578125, 103.5703125, 110.21484375, 116.859375, 123.50390625, 130.1484375, 136.79296875, 143.4375, 150.08203125, 156.7265625, 163.37109375, 170.015625, 176.66015625, 183.3046875, 189.94921875, 196.59375, 203.23828125, 209.8828125, 216.52734375, 223.171875, 229.81640625, 236.4609375, 243.10546875, 249.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 8.0, 8.0, 13.0, 17.0, 11.0, 28.0, 36.0, 52.0, 81.0, 98.0, 194.0, 242.0, 409.0, 872.0, 2214.0, 9776.0, 165203.0, 2922826.0, 36072.0, 4461.0, 1384.0, 683.0, 351.0, 192.0, 143.0, 89.0, 70.0, 41.0, 27.0, 27.0, 22.0, 8.0, 10.0, 4.0, 7.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-50.84375, -49.44189453125, -48.0400390625, -46.63818359375, -45.236328125, -43.83447265625, -42.4326171875, -41.03076171875, -39.62890625, -38.22705078125, -36.8251953125, -35.42333984375, -34.021484375, -32.61962890625, -31.2177734375, -29.81591796875, -28.4140625, -27.01220703125, -25.6103515625, -24.20849609375, -22.806640625, -21.40478515625, -20.0029296875, -18.60107421875, -17.19921875, -15.79736328125, -14.3955078125, -12.99365234375, -11.591796875, -10.18994140625, -8.7880859375, -7.38623046875, -5.984375, -4.58251953125, -3.1806640625, -1.77880859375, -0.376953125, 1.02490234375, 2.4267578125, 3.82861328125, 5.23046875, 6.63232421875, 8.0341796875, 9.43603515625, 10.837890625, 12.23974609375, 13.6416015625, 15.04345703125, 16.4453125, 17.84716796875, 19.2490234375, 20.65087890625, 22.052734375, 23.45458984375, 24.8564453125, 26.25830078125, 27.66015625, 29.06201171875, 30.4638671875, 31.86572265625, 33.267578125, 34.66943359375, 36.0712890625, 37.47314453125, 38.875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 16.0, 31.0, 142.0, 460.0, 242.0, 76.0, 22.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-918.1880493164062, -899.7416381835938, -881.2952270507812, -862.8488159179688, -844.4024658203125, -825.9560546875, -807.5096435546875, -789.063232421875, -770.6168212890625, -752.17041015625, -733.7239990234375, -715.277587890625, -696.8311767578125, -678.3848266601562, -659.9384155273438, -641.4920043945312, -623.0455932617188, -604.5991821289062, -586.1527709960938, -567.7063598632812, -549.260009765625, -530.8135986328125, -512.3671875, -493.9207763671875, -475.474365234375, -457.0279541015625, -438.58154296875, -420.1351623535156, -401.6887512207031, -383.2423400878906, -364.79595947265625, -346.34954833984375, -327.9031677246094, -309.4567565917969, -291.0103759765625, -272.56396484375, -254.1175537109375, -235.671142578125, -217.22474670410156, -198.77835083007812, -180.33193969726562, -161.88552856445312, -143.4391326904297, -124.99272918701172, -106.54632568359375, -88.09992218017578, -69.65351867675781, -51.207122802734375, -32.760711669921875, -14.314308166503906, 4.1320953369140625, 22.57849884033203, 41.02490234375, 59.47130584716797, 77.91770935058594, 96.36410522460938, 114.81051635742188, 133.25692749023438, 151.7033233642578, 170.14971923828125, 188.59613037109375, 207.04254150390625, 225.4889373779297, 243.93533325195312, 262.3817443847656]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 15.0, 8.0, 25.0, 15.0, 22.0, 33.0, 29.0, 30.0, 34.0, 38.0, 49.0, 40.0, 51.0, 61.0, 55.0, 46.0, 62.0, 57.0, 44.0, 37.0, 44.0, 33.0, 24.0, 23.0, 18.0, 14.0, 16.0, 8.0, 13.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-227.23028564453125, -220.158935546875, -213.08758544921875, -206.01622009277344, -198.9448699951172, -191.87351989746094, -184.80215454101562, -177.73080444335938, -170.65945434570312, -163.58810424804688, -156.51675415039062, -149.4453887939453, -142.37403869628906, -135.3026885986328, -128.2313232421875, -121.15997314453125, -114.088623046875, -107.01727294921875, -99.94591522216797, -92.87455749511719, -85.80320739746094, -78.73185729980469, -71.6604995727539, -64.58914184570312, -57.517791748046875, -50.44643783569336, -43.375083923339844, -36.30373001098633, -29.232376098632812, -22.161022186279297, -15.089668273925781, -8.018314361572266, -0.94696044921875, 6.124393463134766, 13.195747375488281, 20.267101287841797, 27.338455200195312, 34.40980911254883, 41.481163024902344, 48.55251693725586, 55.623870849609375, 62.69522476196289, 69.7665786743164, 76.83793640136719, 83.90928649902344, 90.98063659667969, 98.05199432373047, 105.12335205078125, 112.1947021484375, 119.26605224609375, 126.33740997314453, 133.4087677001953, 140.48011779785156, 147.5514678955078, 154.62283325195312, 161.69418334960938, 168.76553344726562, 175.83688354492188, 182.90823364257812, 189.97959899902344, 197.0509490966797, 204.12229919433594, 211.19366455078125, 218.2650146484375, 225.33636474609375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 9.0, 8.0, 9.0, 11.0, 11.0, 22.0, 41.0, 39.0, 61.0, 71.0, 89.0, 122.0, 194.0, 245.0, 342.0, 435.0, 602.0, 744.0, 1239.0, 1040828.0, 802.0, 677.0, 506.0, 347.0, 305.0, 194.0, 146.0, 116.0, 75.0, 61.0, 40.0, 40.0, 24.0, 20.0, 14.0, 18.0, 12.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.662567138671875, -42.0578727722168, -40.453182220458984, -38.848487854003906, -37.243797302246094, -35.639102935791016, -34.03440856933594, -32.429718017578125, -30.82502555847168, -29.220333099365234, -27.61564064025879, -26.010948181152344, -24.406253814697266, -22.801563262939453, -21.196868896484375, -19.59217643737793, -17.987483978271484, -16.38279151916504, -14.778099060058594, -13.173405647277832, -11.568713188171387, -9.964020729064941, -8.35932731628418, -6.754634857177734, -5.149942398071289, -3.5452497005462646, -1.9405570030212402, -0.3358640670776367, 1.2688283920288086, 2.873520851135254, 4.478214263916016, 6.082906723022461, 7.687602996826172, 9.292295455932617, 10.896987915039062, 12.501681327819824, 14.10637378692627, 15.711066246032715, 17.315759658813477, 18.920452117919922, 20.525144577026367, 22.129837036132812, 23.734529495239258, 25.339221954345703, 26.94391632080078, 28.548606872558594, 30.153301239013672, 31.757993698120117, 33.36268615722656, 34.96738052368164, 36.57207107543945, 38.17676544189453, 39.781455993652344, 41.38615036010742, 42.9908447265625, 44.59553527832031, 46.200225830078125, 47.8049201965332, 49.409610748291016, 51.014305114746094, 52.618995666503906, 54.223690032958984, 55.82838439941406, 57.433074951171875, 59.03776931762695]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 14.0, 14.0, 21.0, 63.0, 447.0, 51462376.0, 120.0, 20.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3986.817138671875, -3800.021240234375, -3613.225341796875, -3426.4296875, -3239.6337890625, -3052.837890625, -2866.0419921875, -2679.24609375, -2492.4501953125, -2305.654296875, -2118.8583984375, -1932.0626220703125, -1745.2667236328125, -1558.4708251953125, -1371.675048828125, -1184.879150390625, -998.083251953125, -811.287353515625, -624.4915161132812, -437.6956787109375, -250.8997802734375, -64.1038818359375, 122.69189453125, 309.48779296875, 496.28369140625, 683.07958984375, 869.8754272460938, 1056.6712646484375, 1243.4671630859375, 1430.2630615234375, 1617.058837890625, 1803.854736328125, 1990.650390625, 2177.4462890625, 2364.2421875, 2551.0380859375, 2737.833984375, 2924.6298828125, 3111.425537109375, 3298.221435546875, 3485.017333984375, 3671.813232421875, 3858.609130859375, 4045.40478515625, 4232.20068359375, 4418.99658203125, 4605.79248046875, 4792.58837890625, 4979.38427734375, 5166.18017578125, 5352.97607421875, 5539.77197265625, 5726.56787109375, 5913.36376953125, 6100.1591796875, 6286.955078125, 6473.7509765625, 6660.546875, 6847.3427734375, 7034.138671875, 7220.9345703125, 7407.73046875, 7594.5263671875, 7781.322265625, 7968.1181640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 9.0, 13.0, 27.0, 37.0, 49.0, 70.0, 100.0, 133.0, 213.0, 350.0, 514.0, 769.0, 1206.0, 1771.0, 2622.0, 3765.0, 5422.0, 8543.0, 12433.0, 18256.0, 27801.0, 41151.0, 60176.0, 89086.0, 129959.0, 185002.0, 254876.0, 332189.0, 1713375.0, 2200863.0, 338229.0, 260509.0, 188864.0, 131972.0, 91061.0, 61354.0, 42275.0, 28225.0, 19191.0, 12790.0, 8643.0, 5723.0, 3904.0, 2545.0, 1769.0, 1220.0, 815.0, 558.0, 354.0, 225.0, 157.0, 90.0, 70.0, 46.0, 36.0, 15.0, 11.0, 6.0, 4.0, 2.0, 2.0], "bins": [-1.7490234375, -1.6944122314453125, -1.639801025390625, -1.5851898193359375, -1.53057861328125, -1.4759674072265625, -1.421356201171875, -1.3667449951171875, -1.3121337890625, -1.2575225830078125, -1.202911376953125, -1.1483001708984375, -1.09368896484375, -1.0390777587890625, -0.984466552734375, -0.9298553466796875, -0.875244140625, -0.8206329345703125, -0.766021728515625, -0.7114105224609375, -0.65679931640625, -0.6021881103515625, -0.547576904296875, -0.4929656982421875, -0.4383544921875, -0.3837432861328125, -0.329132080078125, -0.2745208740234375, -0.21990966796875, -0.1652984619140625, -0.110687255859375, -0.0560760498046875, -0.00146484375, 0.0531463623046875, 0.107757568359375, 0.1623687744140625, 0.21697998046875, 0.2715911865234375, 0.326202392578125, 0.3808135986328125, 0.4354248046875, 0.4900360107421875, 0.544647216796875, 0.5992584228515625, 0.65386962890625, 0.7084808349609375, 0.763092041015625, 0.8177032470703125, 0.872314453125, 0.9269256591796875, 0.981536865234375, 1.0361480712890625, 1.09075927734375, 1.1453704833984375, 1.199981689453125, 1.2545928955078125, 1.3092041015625, 1.3638153076171875, 1.418426513671875, 1.4730377197265625, 1.52764892578125, 1.5822601318359375, 1.636871337890625, 1.6914825439453125, 1.74609375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 6.0, 17.0, 16.0, 17.0, 16.0, 24.0, 20.0, 27.0, 33.0, 35.0, 32.0, 28.0, 40.0, 46.0, 50.0, 70.0, 836.0, 231.0, 36.0, 35.0, 39.0, 40.0, 37.0, 31.0, 36.0, 27.0, 25.0, 31.0, 19.0, 11.0, 13.0, 19.0, 11.0, 8.0, 9.0, 9.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2247314453125, -14.676025390625, -14.1273193359375, -13.57861328125, -13.0299072265625, -12.481201171875, -11.9324951171875, -11.3837890625, -10.8350830078125, -10.286376953125, -9.7376708984375, -9.18896484375, -8.6402587890625, -8.091552734375, -7.5428466796875, -6.994140625, -6.4454345703125, -5.896728515625, -5.3480224609375, -4.79931640625, -4.2506103515625, -3.701904296875, -3.1531982421875, -2.6044921875, -2.0557861328125, -1.507080078125, -0.9583740234375, -0.40966796875, 0.1390380859375, 0.687744140625, 1.2364501953125, 1.78515625, 2.3338623046875, 2.882568359375, 3.4312744140625, 3.97998046875, 4.5286865234375, 5.077392578125, 5.6260986328125, 6.1748046875, 6.7235107421875, 7.272216796875, 7.8209228515625, 8.36962890625, 8.9183349609375, 9.467041015625, 10.0157470703125, 10.564453125, 11.1131591796875, 11.661865234375, 12.2105712890625, 12.75927734375, 13.3079833984375, 13.856689453125, 14.4053955078125, 14.9541015625, 15.5028076171875, 16.051513671875, 16.6002197265625, 17.14892578125, 17.6976318359375, 18.246337890625, 18.7950439453125, 19.34375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 12.0, 6.0, 12.0, 22.0, 29.0, 51.0, 78.0, 114.0, 185.0, 254.0, 424.0, 682.0, 989.0, 1596.0, 2346.0, 3884.0, 6258.0, 9752.0, 15404.0, 24459.0, 40082.0, 63522.0, 101047.0, 159392.0, 238721.0, 339788.0, 600532.0, 3405163.0, 412485.0, 300125.0, 204884.0, 134118.0, 84283.0, 52967.0, 32496.0, 20471.0, 12875.0, 7941.0, 5065.0, 3166.0, 1998.0, 1298.0, 838.0, 571.0, 355.0, 250.0, 153.0, 95.0, 70.0, 48.0, 32.0, 18.0, 16.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.9287109375, -1.8650665283203125, -1.801422119140625, -1.7377777099609375, -1.67413330078125, -1.6104888916015625, -1.546844482421875, -1.4832000732421875, -1.4195556640625, -1.3559112548828125, -1.292266845703125, -1.2286224365234375, -1.16497802734375, -1.1013336181640625, -1.037689208984375, -0.9740447998046875, -0.910400390625, -0.8467559814453125, -0.783111572265625, -0.7194671630859375, -0.65582275390625, -0.5921783447265625, -0.528533935546875, -0.4648895263671875, -0.4012451171875, -0.3376007080078125, -0.273956298828125, -0.2103118896484375, -0.14666748046875, -0.0830230712890625, -0.019378662109375, 0.0442657470703125, 0.10791015625, 0.1715545654296875, 0.235198974609375, 0.2988433837890625, 0.36248779296875, 0.4261322021484375, 0.489776611328125, 0.5534210205078125, 0.6170654296875, 0.6807098388671875, 0.744354248046875, 0.8079986572265625, 0.87164306640625, 0.9352874755859375, 0.998931884765625, 1.0625762939453125, 1.126220703125, 1.1898651123046875, 1.253509521484375, 1.3171539306640625, 1.38079833984375, 1.4444427490234375, 1.508087158203125, 1.5717315673828125, 1.6353759765625, 1.6990203857421875, 1.762664794921875, 1.8263092041015625, 1.88995361328125, 1.9535980224609375, 2.017242431640625, 2.0808868408203125, 2.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 9.0, 10.0, 6.0, 12.0, 15.0, 12.0, 25.0, 15.0, 28.0, 20.0, 20.0, 36.0, 31.0, 37.0, 33.0, 33.0, 34.0, 42.0, 68.0, 738.0, 314.0, 40.0, 34.0, 48.0, 35.0, 44.0, 30.0, 30.0, 23.0, 22.0, 18.0, 23.0, 22.0, 14.0, 14.0, 12.0, 10.0, 15.0, 13.0, 5.0, 8.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.7734375, -12.384521484375, -11.99560546875, -11.606689453125, -11.2177734375, -10.828857421875, -10.43994140625, -10.051025390625, -9.662109375, -9.273193359375, -8.88427734375, -8.495361328125, -8.1064453125, -7.717529296875, -7.32861328125, -6.939697265625, -6.55078125, -6.161865234375, -5.77294921875, -5.384033203125, -4.9951171875, -4.606201171875, -4.21728515625, -3.828369140625, -3.439453125, -3.050537109375, -2.66162109375, -2.272705078125, -1.8837890625, -1.494873046875, -1.10595703125, -0.717041015625, -0.328125, 0.060791015625, 0.44970703125, 0.838623046875, 1.2275390625, 1.616455078125, 2.00537109375, 2.394287109375, 2.783203125, 3.172119140625, 3.56103515625, 3.949951171875, 4.3388671875, 4.727783203125, 5.11669921875, 5.505615234375, 5.89453125, 6.283447265625, 6.67236328125, 7.061279296875, 7.4501953125, 7.839111328125, 8.22802734375, 8.616943359375, 9.005859375, 9.394775390625, 9.78369140625, 10.172607421875, 10.5615234375, 10.950439453125, 11.33935546875, 11.728271484375, 12.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 10.0, 8.0, 17.0, 19.0, 13.0, 44.0, 72.0, 102.0, 132.0, 147.0, 232.0, 363.0, 550.0, 820.0, 1268.0, 2252.0, 3857.0, 7165.0, 14495.0, 31165.0, 71220.0, 198695.0, 5734360.0, 125225.0, 51279.0, 23007.0, 10842.0, 5729.0, 3179.0, 1928.0, 1016.0, 715.0, 465.0, 282.0, 189.0, 145.0, 98.0, 86.0, 60.0, 38.0, 31.0, 22.0, 21.0, 6.0, 9.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.484375, -8.21337890625, -7.9423828125, -7.67138671875, -7.400390625, -7.12939453125, -6.8583984375, -6.58740234375, -6.31640625, -6.04541015625, -5.7744140625, -5.50341796875, -5.232421875, -4.96142578125, -4.6904296875, -4.41943359375, -4.1484375, -3.87744140625, -3.6064453125, -3.33544921875, -3.064453125, -2.79345703125, -2.5224609375, -2.25146484375, -1.98046875, -1.70947265625, -1.4384765625, -1.16748046875, -0.896484375, -0.62548828125, -0.3544921875, -0.08349609375, 0.1875, 0.45849609375, 0.7294921875, 1.00048828125, 1.271484375, 1.54248046875, 1.8134765625, 2.08447265625, 2.35546875, 2.62646484375, 2.8974609375, 3.16845703125, 3.439453125, 3.71044921875, 3.9814453125, 4.25244140625, 4.5234375, 4.79443359375, 5.0654296875, 5.33642578125, 5.607421875, 5.87841796875, 6.1494140625, 6.42041015625, 6.69140625, 6.96240234375, 7.2333984375, 7.50439453125, 7.775390625, 8.04638671875, 8.3173828125, 8.58837890625, 8.859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 10.0, 13.0, 13.0, 9.0, 16.0, 20.0, 22.0, 24.0, 26.0, 26.0, 36.0, 36.0, 33.0, 30.0, 38.0, 49.0, 225.0, 786.0, 130.0, 61.0, 47.0, 34.0, 33.0, 37.0, 28.0, 27.0, 23.0, 26.0, 28.0, 26.0, 16.0, 10.0, 9.0, 12.0, 8.0, 11.0, 10.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.546875, -12.1827392578125, -11.818603515625, -11.4544677734375, -11.09033203125, -10.7261962890625, -10.362060546875, -9.9979248046875, -9.6337890625, -9.2696533203125, -8.905517578125, -8.5413818359375, -8.17724609375, -7.8131103515625, -7.448974609375, -7.0848388671875, -6.720703125, -6.3565673828125, -5.992431640625, -5.6282958984375, -5.26416015625, -4.9000244140625, -4.535888671875, -4.1717529296875, -3.8076171875, -3.4434814453125, -3.079345703125, -2.7152099609375, -2.35107421875, -1.9869384765625, -1.622802734375, -1.2586669921875, -0.89453125, -0.5303955078125, -0.166259765625, 0.1978759765625, 0.56201171875, 0.9261474609375, 1.290283203125, 1.6544189453125, 2.0185546875, 2.3826904296875, 2.746826171875, 3.1109619140625, 3.47509765625, 3.8392333984375, 4.203369140625, 4.5675048828125, 4.931640625, 5.2957763671875, 5.659912109375, 6.0240478515625, 6.38818359375, 6.7523193359375, 7.116455078125, 7.4805908203125, 7.8447265625, 8.2088623046875, 8.572998046875, 8.9371337890625, 9.30126953125, 9.6654052734375, 10.029541015625, 10.3936767578125, 10.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 8.0, 11.0, 14.0, 16.0, 29.0, 33.0, 66.0, 72.0, 94.0, 133.0, 130.0, 132.0, 77.0, 48.0, 35.0, 28.0, 17.0, 18.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.085384368896484, -23.286029815673828, -22.486675262451172, -21.68732261657715, -20.887968063354492, -20.088613510131836, -19.289260864257812, -18.489906311035156, -17.6905517578125, -16.891197204589844, -16.091842651367188, -15.292490005493164, -14.493135452270508, -13.693780899047852, -12.894427299499512, -12.095073699951172, -11.295719146728516, -10.49636459350586, -9.69701099395752, -8.89765739440918, -8.098302841186523, -7.298948764801025, -6.499594688415527, -5.700240612030029, -4.900886535644531, -4.101532459259033, -3.302178382873535, -2.502824306488037, -1.703470230102539, -0.904116153717041, -0.10476207733154297, 0.6945919990539551, 1.4939441680908203, 2.2932982444763184, 3.0926523208618164, 3.8920063972473145, 4.6913604736328125, 5.4907145500183105, 6.290068626403809, 7.089422702789307, 7.888776779174805, 8.688131332397461, 9.4874849319458, 10.28683853149414, 11.086193084716797, 11.885547637939453, 12.684901237487793, 13.484254837036133, 14.283609390258789, 15.082963943481445, 15.882317543029785, 16.681671142578125, 17.48102569580078, 18.280380249023438, 19.079734802246094, 19.879087448120117, 20.678442001342773, 21.47779655456543, 22.277149200439453, 23.07650375366211, 23.875858306884766, 24.675212860107422, 25.474567413330078, 26.2739200592041, 27.073274612426758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 9.0, 26.0, 16.0, 21.0, 29.0, 50.0, 61.0, 57.0, 74.0, 94.0, 96.0, 92.0, 91.0, 64.0, 51.0, 34.0, 31.0, 29.0, 22.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.219627380371094, -43.7860107421875, -42.35239791870117, -40.91878128051758, -39.48516845703125, -38.051551818847656, -36.61793518066406, -35.18431854248047, -33.75070571899414, -32.31708908081055, -30.88347625732422, -29.449859619140625, -28.016244888305664, -26.582630157470703, -25.14901351928711, -23.71539878845215, -22.281784057617188, -20.848169326782227, -19.414554595947266, -17.980937957763672, -16.54732322692871, -15.11370849609375, -13.680092811584473, -12.246477127075195, -10.812862396240234, -9.379247665405273, -7.945631980895996, -6.512016773223877, -5.078401565551758, -3.6447863578796387, -2.2111711502075195, -0.7775554656982422, 0.6560592651367188, 2.089674472808838, 3.523289680480957, 4.956904888153076, 6.390520095825195, 7.8241353034973145, 9.257750511169434, 10.691366195678711, 12.124980926513672, 13.558595657348633, 14.99221134185791, 16.425827026367188, 17.85944175720215, 19.29305648803711, 20.726673126220703, 22.160287857055664, 23.593902587890625, 25.027517318725586, 26.461132049560547, 27.89474868774414, 29.3283634185791, 30.761978149414062, 32.195594787597656, 33.62921142578125, 35.06282424926758, 36.49644088745117, 37.9300537109375, 39.363670349121094, 40.79728698730469, 42.230899810791016, 43.66451644897461, 45.09812927246094, 46.53174591064453]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 16.0, 20.0, 14.0, 39.0, 34.0, 52.0, 81.0, 101.0, 159.0, 212.0, 313.0, 457.0, 775.0, 1185.0, 2053.0, 3938.0, 8291.0, 22207.0, 103419.0, 3934269.0, 77218.0, 20115.0, 8370.0, 4210.0, 2318.0, 1406.0, 899.0, 578.0, 440.0, 276.0, 207.0, 154.0, 119.0, 83.0, 67.0, 33.0, 46.0, 16.0, 14.0, 15.0, 12.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.025390625, -0.9937820434570312, -0.9621734619140625, -0.9305648803710938, -0.898956298828125, -0.8673477172851562, -0.8357391357421875, -0.8041305541992188, -0.77252197265625, -0.7409133911132812, -0.7093048095703125, -0.6776962280273438, -0.646087646484375, -0.6144790649414062, -0.5828704833984375, -0.5512619018554688, -0.5196533203125, -0.48804473876953125, -0.4564361572265625, -0.42482757568359375, -0.393218994140625, -0.36161041259765625, -0.3300018310546875, -0.29839324951171875, -0.26678466796875, -0.23517608642578125, -0.2035675048828125, -0.17195892333984375, -0.140350341796875, -0.10874176025390625, -0.0771331787109375, -0.04552459716796875, -0.013916015625, 0.01769256591796875, 0.0493011474609375, 0.08090972900390625, 0.112518310546875, 0.14412689208984375, 0.1757354736328125, 0.20734405517578125, 0.23895263671875, 0.27056121826171875, 0.3021697998046875, 0.33377838134765625, 0.365386962890625, 0.39699554443359375, 0.4286041259765625, 0.46021270751953125, 0.4918212890625, 0.5234298706054688, 0.5550384521484375, 0.5866470336914062, 0.618255615234375, 0.6498641967773438, 0.6814727783203125, 0.7130813598632812, 0.74468994140625, 0.7762985229492188, 0.8079071044921875, 0.8395156860351562, 0.871124267578125, 0.9027328491210938, 0.9343414306640625, 0.9659500122070312, 0.99755859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 6.0, 8.0, 16.0, 10.0, 12.0, 24.0, 134.0, 669.0, 16.0, 11.0, 10.0, 17.0, 8.0, 4.0, 4.0, 5.0, 1.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29450225830078125, -0.2850494384765625, -0.27559661865234375, -0.266143798828125, -0.25669097900390625, -0.2472381591796875, -0.23778533935546875, -0.22833251953125, -0.21887969970703125, -0.2094268798828125, -0.19997406005859375, -0.190521240234375, -0.18106842041015625, -0.1716156005859375, -0.16216278076171875, -0.1527099609375, -0.14325714111328125, -0.1338043212890625, -0.12435150146484375, -0.114898681640625, -0.10544586181640625, -0.0959930419921875, -0.08654022216796875, -0.07708740234375, -0.06763458251953125, -0.0581817626953125, -0.04872894287109375, -0.039276123046875, -0.02982330322265625, -0.0203704833984375, -0.01091766357421875, -0.00146484375, 0.00798797607421875, 0.0174407958984375, 0.02689361572265625, 0.036346435546875, 0.04579925537109375, 0.0552520751953125, 0.06470489501953125, 0.07415771484375, 0.08361053466796875, 0.0930633544921875, 0.10251617431640625, 0.111968994140625, 0.12142181396484375, 0.1308746337890625, 0.14032745361328125, 0.1497802734375, 0.15923309326171875, 0.1686859130859375, 0.17813873291015625, 0.187591552734375, 0.19704437255859375, 0.2064971923828125, 0.21595001220703125, 0.22540283203125, 0.23485565185546875, 0.2443084716796875, 0.25376129150390625, 0.263214111328125, 0.27266693115234375, 0.2821197509765625, 0.29157257080078125, 0.301025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 6.0, 7.0, 17.0, 28.0, 26.0, 59.0, 80.0, 133.0, 205.0, 333.0, 535.0, 807.0, 1414.0, 2539.0, 4896.0, 10233.0, 26102.0, 82879.0, 489448.0, 3179223.0, 298901.0, 60327.0, 19506.0, 7983.0, 3735.0, 2017.0, 1141.0, 648.0, 388.0, 241.0, 136.0, 98.0, 64.0, 48.0, 23.0, 18.0, 12.0, 9.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7017669677734375, -0.679412841796875, -0.6570587158203125, -0.63470458984375, -0.6123504638671875, -0.589996337890625, -0.5676422119140625, -0.5452880859375, -0.5229339599609375, -0.500579833984375, -0.4782257080078125, -0.45587158203125, -0.4335174560546875, -0.411163330078125, -0.3888092041015625, -0.366455078125, -0.3441009521484375, -0.321746826171875, -0.2993927001953125, -0.27703857421875, -0.2546844482421875, -0.232330322265625, -0.2099761962890625, -0.1876220703125, -0.1652679443359375, -0.142913818359375, -0.1205596923828125, -0.09820556640625, -0.0758514404296875, -0.053497314453125, -0.0311431884765625, -0.0087890625, 0.0135650634765625, 0.035919189453125, 0.0582733154296875, 0.08062744140625, 0.1029815673828125, 0.125335693359375, 0.1476898193359375, 0.1700439453125, 0.1923980712890625, 0.214752197265625, 0.2371063232421875, 0.25946044921875, 0.2818145751953125, 0.304168701171875, 0.3265228271484375, 0.348876953125, 0.3712310791015625, 0.393585205078125, 0.4159393310546875, 0.43829345703125, 0.4606475830078125, 0.483001708984375, 0.5053558349609375, 0.5277099609375, 0.5500640869140625, 0.572418212890625, 0.5947723388671875, 0.61712646484375, 0.6394805908203125, 0.661834716796875, 0.6841888427734375, 0.70654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 11.0, 14.0, 26.0, 27.0, 38.0, 55.0, 63.0, 112.0, 220.0, 419.0, 1340.0, 935.0, 321.0, 170.0, 91.0, 61.0, 38.0, 29.0, 25.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.37078857421875, -0.3594970703125, -0.34820556640625, -0.3369140625, -0.32562255859375, -0.3143310546875, -0.30303955078125, -0.291748046875, -0.28045654296875, -0.2691650390625, -0.25787353515625, -0.24658203125, -0.23529052734375, -0.2239990234375, -0.21270751953125, -0.201416015625, -0.19012451171875, -0.1788330078125, -0.16754150390625, -0.15625, -0.14495849609375, -0.1336669921875, -0.12237548828125, -0.111083984375, -0.09979248046875, -0.0885009765625, -0.07720947265625, -0.06591796875, -0.05462646484375, -0.0433349609375, -0.03204345703125, -0.020751953125, -0.00946044921875, 0.0018310546875, 0.01312255859375, 0.0244140625, 0.03570556640625, 0.0469970703125, 0.05828857421875, 0.069580078125, 0.08087158203125, 0.0921630859375, 0.10345458984375, 0.11474609375, 0.12603759765625, 0.1373291015625, 0.14862060546875, 0.159912109375, 0.17120361328125, 0.1824951171875, 0.19378662109375, 0.205078125, 0.21636962890625, 0.2276611328125, 0.23895263671875, 0.250244140625, 0.26153564453125, 0.2728271484375, 0.28411865234375, 0.29541015625, 0.30670166015625, 0.3179931640625, 0.32928466796875, 0.340576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 15.0, 40.0, 61.0, 139.0, 183.0, 221.0, 131.0, 92.0, 53.0, 29.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9518307447433472, -1.8877747058868408, -1.8237186670303345, -1.7596626281738281, -1.6956065893173218, -1.6315505504608154, -1.5674943923950195, -1.5034384727478027, -1.4393823146820068, -1.3753262758255005, -1.3112702369689941, -1.2472141981124878, -1.1831581592559814, -1.119102120399475, -1.0550460815429688, -0.9909899830818176, -0.926934003829956, -0.8628779649734497, -0.7988219261169434, -0.734765887260437, -0.6707098484039307, -0.6066538095474243, -0.5425977110862732, -0.47854167222976685, -0.4144856333732605, -0.35042959451675415, -0.2863735556602478, -0.22231748700141907, -0.15826144814491272, -0.09420540928840637, -0.030149340629577637, 0.03390669822692871, 0.09796285629272461, 0.16201889514923096, 0.2260749489068985, 0.29013100266456604, 0.3541870415210724, 0.41824308037757874, 0.48229914903640747, 0.5463551878929138, 0.6104112267494202, 0.6744672656059265, 0.7385233044624329, 0.802579402923584, 0.8666354417800903, 0.9306914806365967, 0.994747519493103, 1.0588035583496094, 1.1228595972061157, 1.186915636062622, 1.2509716749191284, 1.3150277137756348, 1.3790837526321411, 1.4431397914886475, 1.5071959495544434, 1.5712518692016602, 1.635308027267456, 1.6993640661239624, 1.7634201049804688, 1.827476143836975, 1.8915321826934814, 1.9555882215499878, 2.019644260406494, 2.08370041847229, 2.147756338119507]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 12.0, 11.0, 16.0, 22.0, 22.0, 34.0, 34.0, 47.0, 58.0, 55.0, 59.0, 75.0, 86.0, 71.0, 78.0, 61.0, 55.0, 49.0, 40.0, 29.0, 19.0, 12.0, 15.0, 17.0, 7.0, 5.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5357944965362549, -1.4858287572860718, -1.4358630180358887, -1.3858972787857056, -1.3359315395355225, -1.285965919494629, -1.2360001802444458, -1.1860344409942627, -1.1360687017440796, -1.0861029624938965, -1.0361372232437134, -0.986171543598175, -0.9362058043479919, -0.8862400650978088, -0.8362743854522705, -0.7863086462020874, -0.7363429069519043, -0.6863771677017212, -0.6364114284515381, -0.5864457488059998, -0.5364800095558167, -0.48651427030563354, -0.4365485608577728, -0.3865828514099121, -0.336617112159729, -0.2866513729095459, -0.23668566346168518, -0.18671993911266327, -0.13675421476364136, -0.08678849041461945, -0.036822766065597534, 0.013142943382263184, 0.06310880184173584, 0.11307452619075775, 0.16304025053977966, 0.21300597488880157, 0.2629716992378235, 0.3129374384880066, 0.3629031479358673, 0.412868857383728, 0.46283459663391113, 0.5128003358840942, 0.5627660751342773, 0.6127317547798157, 0.6626974940299988, 0.7126632332801819, 0.7626289129257202, 0.8125946521759033, 0.8625603914260864, 0.9125261306762695, 0.9624918699264526, 1.0124576091766357, 1.0624232292175293, 1.1123889684677124, 1.1623547077178955, 1.2123204469680786, 1.2622861862182617, 1.3122519254684448, 1.362217664718628, 1.412183403968811, 1.4621491432189941, 1.5121147632598877, 1.5620805025100708, 1.612046241760254, 1.662011981010437]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 11.0, 16.0, 23.0, 36.0, 46.0, 66.0, 78.0, 132.0, 180.0, 279.0, 353.0, 531.0, 715.0, 1045.0, 1611.0, 2498.0, 3894.0, 6443.0, 11357.0, 22655.0, 94297.0, 818239.0, 42155.0, 17335.0, 9247.0, 5385.0, 3254.0, 2114.0, 1378.0, 983.0, 657.0, 462.0, 318.0, 230.0, 167.0, 112.0, 81.0, 50.0, 29.0, 22.0, 23.0, 15.0, 12.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9169921875, -0.8886184692382812, -0.8602447509765625, -0.8318710327148438, -0.803497314453125, -0.7751235961914062, -0.7467498779296875, -0.7183761596679688, -0.69000244140625, -0.6616287231445312, -0.6332550048828125, -0.6048812866210938, -0.576507568359375, -0.5481338500976562, -0.5197601318359375, -0.49138641357421875, -0.4630126953125, -0.43463897705078125, -0.4062652587890625, -0.37789154052734375, -0.349517822265625, -0.32114410400390625, -0.2927703857421875, -0.26439666748046875, -0.23602294921875, -0.20764923095703125, -0.1792755126953125, -0.15090179443359375, -0.122528076171875, -0.09415435791015625, -0.0657806396484375, -0.03740692138671875, -0.009033203125, 0.01934051513671875, 0.0477142333984375, 0.07608795166015625, 0.104461669921875, 0.13283538818359375, 0.1612091064453125, 0.18958282470703125, 0.21795654296875, 0.24633026123046875, 0.2747039794921875, 0.30307769775390625, 0.331451416015625, 0.35982513427734375, 0.3881988525390625, 0.41657257080078125, 0.4449462890625, 0.47332000732421875, 0.5016937255859375, 0.5300674438476562, 0.558441162109375, 0.5868148803710938, 0.6151885986328125, 0.6435623168945312, 0.67193603515625, 0.7003097534179688, 0.7286834716796875, 0.7570571899414062, 0.785430908203125, 0.8138046264648438, 0.8421783447265625, 0.8705520629882812, 0.89892578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 3.0, 5.0, 5.0, 11.0, 9.0, 19.0, 20.0, 82.0, 405.0, 299.0, 45.0, 9.0, 10.0, 14.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27338409423828125, -0.2645416259765625, -0.25569915771484375, -0.246856689453125, -0.23801422119140625, -0.2291717529296875, -0.22032928466796875, -0.21148681640625, -0.20264434814453125, -0.1938018798828125, -0.18495941162109375, -0.176116943359375, -0.16727447509765625, -0.1584320068359375, -0.14958953857421875, -0.1407470703125, -0.13190460205078125, -0.1230621337890625, -0.11421966552734375, -0.105377197265625, -0.09653472900390625, -0.0876922607421875, -0.07884979248046875, -0.07000732421875, -0.06116485595703125, -0.0523223876953125, -0.04347991943359375, -0.034637451171875, -0.02579498291015625, -0.0169525146484375, -0.00811004638671875, 0.000732421875, 0.00957489013671875, 0.0184173583984375, 0.02725982666015625, 0.036102294921875, 0.04494476318359375, 0.0537872314453125, 0.06262969970703125, 0.07147216796875, 0.08031463623046875, 0.0891571044921875, 0.09799957275390625, 0.106842041015625, 0.11568450927734375, 0.1245269775390625, 0.13336944580078125, 0.1422119140625, 0.15105438232421875, 0.1598968505859375, 0.16873931884765625, 0.177581787109375, 0.18642425537109375, 0.1952667236328125, 0.20410919189453125, 0.21295166015625, 0.22179412841796875, 0.2306365966796875, 0.23947906494140625, 0.248321533203125, 0.25716400146484375, 0.2660064697265625, 0.27484893798828125, 0.28369140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 11.0, 12.0, 19.0, 28.0, 29.0, 59.0, 78.0, 105.0, 127.0, 187.0, 257.0, 400.0, 629.0, 966.0, 1425.0, 2361.0, 4091.0, 6827.0, 12397.0, 22583.0, 43917.0, 90770.0, 208490.0, 333726.0, 164491.0, 73426.0, 36048.0, 19150.0, 10370.0, 5988.0, 3524.0, 2084.0, 1368.0, 827.0, 555.0, 378.0, 252.0, 177.0, 118.0, 73.0, 65.0, 38.0, 43.0, 22.0, 20.0, 11.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.548828125, -0.5301361083984375, -0.511444091796875, -0.4927520751953125, -0.47406005859375, -0.4553680419921875, -0.436676025390625, -0.4179840087890625, -0.3992919921875, -0.3805999755859375, -0.361907958984375, -0.3432159423828125, -0.32452392578125, -0.3058319091796875, -0.287139892578125, -0.2684478759765625, -0.249755859375, -0.2310638427734375, -0.212371826171875, -0.1936798095703125, -0.17498779296875, -0.1562957763671875, -0.137603759765625, -0.1189117431640625, -0.1002197265625, -0.0815277099609375, -0.062835693359375, -0.0441436767578125, -0.02545166015625, -0.0067596435546875, 0.011932373046875, 0.0306243896484375, 0.04931640625, 0.0680084228515625, 0.086700439453125, 0.1053924560546875, 0.12408447265625, 0.1427764892578125, 0.161468505859375, 0.1801605224609375, 0.1988525390625, 0.2175445556640625, 0.236236572265625, 0.2549285888671875, 0.27362060546875, 0.2923126220703125, 0.311004638671875, 0.3296966552734375, 0.348388671875, 0.3670806884765625, 0.385772705078125, 0.4044647216796875, 0.42315673828125, 0.4418487548828125, 0.460540771484375, 0.4792327880859375, 0.4979248046875, 0.5166168212890625, 0.535308837890625, 0.5540008544921875, 0.57269287109375, 0.5913848876953125, 0.610076904296875, 0.6287689208984375, 0.6474609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 11.0, 16.0, 11.0, 9.0, 21.0, 22.0, 16.0, 25.0, 32.0, 35.0, 31.0, 32.0, 44.0, 34.0, 33.0, 44.0, 48.0, 46.0, 49.0, 48.0, 50.0, 36.0, 42.0, 36.0, 29.0, 28.0, 27.0, 22.0, 17.0, 13.0, 23.0, 11.0, 16.0, 10.0, 7.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.1455078125, -1.1130828857421875, -1.080657958984375, -1.0482330322265625, -1.01580810546875, -0.9833831787109375, -0.950958251953125, -0.9185333251953125, -0.8861083984375, -0.8536834716796875, -0.821258544921875, -0.7888336181640625, -0.75640869140625, -0.7239837646484375, -0.691558837890625, -0.6591339111328125, -0.626708984375, -0.5942840576171875, -0.561859130859375, -0.5294342041015625, -0.49700927734375, -0.4645843505859375, -0.432159423828125, -0.3997344970703125, -0.3673095703125, -0.3348846435546875, -0.302459716796875, -0.2700347900390625, -0.23760986328125, -0.2051849365234375, -0.172760009765625, -0.1403350830078125, -0.10791015625, -0.0754852294921875, -0.043060302734375, -0.0106353759765625, 0.02178955078125, 0.0542144775390625, 0.086639404296875, 0.1190643310546875, 0.1514892578125, 0.1839141845703125, 0.216339111328125, 0.2487640380859375, 0.28118896484375, 0.3136138916015625, 0.346038818359375, 0.3784637451171875, 0.410888671875, 0.4433135986328125, 0.475738525390625, 0.5081634521484375, 0.54058837890625, 0.5730133056640625, 0.605438232421875, 0.6378631591796875, 0.6702880859375, 0.7027130126953125, 0.735137939453125, 0.7675628662109375, 0.79998779296875, 0.8324127197265625, 0.864837646484375, 0.8972625732421875, 0.9296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 10.0, 17.0, 28.0, 37.0, 66.0, 146.0, 383.0, 1507.0, 13761.0, 969298.0, 59222.0, 3063.0, 583.0, 205.0, 93.0, 54.0, 31.0, 14.0, 15.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.3023681640625, -3.204345703125, -3.1063232421875, -3.00830078125, -2.9102783203125, -2.812255859375, -2.7142333984375, -2.6162109375, -2.5181884765625, -2.420166015625, -2.3221435546875, -2.22412109375, -2.1260986328125, -2.028076171875, -1.9300537109375, -1.83203125, -1.7340087890625, -1.635986328125, -1.5379638671875, -1.43994140625, -1.3419189453125, -1.243896484375, -1.1458740234375, -1.0478515625, -0.9498291015625, -0.851806640625, -0.7537841796875, -0.65576171875, -0.5577392578125, -0.459716796875, -0.3616943359375, -0.263671875, -0.1656494140625, -0.067626953125, 0.0303955078125, 0.12841796875, 0.2264404296875, 0.324462890625, 0.4224853515625, 0.5205078125, 0.6185302734375, 0.716552734375, 0.8145751953125, 0.91259765625, 1.0106201171875, 1.108642578125, 1.2066650390625, 1.3046875, 1.4027099609375, 1.500732421875, 1.5987548828125, 1.69677734375, 1.7947998046875, 1.892822265625, 1.9908447265625, 2.0888671875, 2.1868896484375, 2.284912109375, 2.3829345703125, 2.48095703125, 2.5789794921875, 2.677001953125, 2.7750244140625, 2.873046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 23.0, 59.0, 101.0, 170.0, 211.0, 195.0, 90.0, 73.0, 28.0, 14.0, 9.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001780986785888672, -0.00017400365322828293, -0.00016990862786769867, -0.0001658136025071144, -0.00016171857714653015, -0.0001576235517859459, -0.00015352852642536163, -0.00014943350106477737, -0.00014533847570419312, -0.00014124345034360886, -0.0001371484249830246, -0.00013305339962244034, -0.00012895837426185608, -0.00012486334890127182, -0.00012076832354068756, -0.0001166732981801033, -0.00011257827281951904, -0.00010848324745893478, -0.00010438822209835052, -0.00010029319673776627, -9.619817137718201e-05, -9.210314601659775e-05, -8.800812065601349e-05, -8.391309529542923e-05, -7.981806993484497e-05, -7.572304457426071e-05, -7.162801921367645e-05, -6.75329938530922e-05, -6.343796849250793e-05, -5.9342943131923676e-05, -5.5247917771339417e-05, -5.115289241075516e-05, -4.70578670501709e-05, -4.296284168958664e-05, -3.886781632900238e-05, -3.477279096841812e-05, -3.067776560783386e-05, -2.6582740247249603e-05, -2.2487714886665344e-05, -1.8392689526081085e-05, -1.4297664165496826e-05, -1.0202638804912567e-05, -6.107613444328308e-06, -2.012588083744049e-06, 2.08243727684021e-06, 6.177462637424469e-06, 1.0272487998008728e-05, 1.4367513358592987e-05, 1.8462538719177246e-05, 2.2557564079761505e-05, 2.6652589440345764e-05, 3.074761480093002e-05, 3.484264016151428e-05, 3.893766552209854e-05, 4.30326908826828e-05, 4.712771624326706e-05, 5.122274160385132e-05, 5.531776696443558e-05, 5.9412792325019836e-05, 6.35078176856041e-05, 6.760284304618835e-05, 7.169786840677261e-05, 7.579289376735687e-05, 7.988791912794113e-05, 8.398294448852539e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 22.0, 25.0, 40.0, 51.0, 77.0, 118.0, 214.0, 340.0, 652.0, 1574.0, 3997.0, 14091.0, 81610.0, 685396.0, 221721.0, 27545.0, 6560.0, 2275.0, 990.0, 480.0, 299.0, 132.0, 120.0, 58.0, 48.0, 25.0, 22.0, 13.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.987945556640625, -0.94952392578125, -0.911102294921875, -0.8726806640625, -0.834259033203125, -0.79583740234375, -0.757415771484375, -0.718994140625, -0.680572509765625, -0.64215087890625, -0.603729248046875, -0.5653076171875, -0.526885986328125, -0.48846435546875, -0.450042724609375, -0.41162109375, -0.373199462890625, -0.33477783203125, -0.296356201171875, -0.2579345703125, -0.219512939453125, -0.18109130859375, -0.142669677734375, -0.104248046875, -0.065826416015625, -0.02740478515625, 0.011016845703125, 0.0494384765625, 0.087860107421875, 0.12628173828125, 0.164703369140625, 0.203125, 0.241546630859375, 0.27996826171875, 0.318389892578125, 0.3568115234375, 0.395233154296875, 0.43365478515625, 0.472076416015625, 0.510498046875, 0.548919677734375, 0.58734130859375, 0.625762939453125, 0.6641845703125, 0.702606201171875, 0.74102783203125, 0.779449462890625, 0.81787109375, 0.856292724609375, 0.89471435546875, 0.933135986328125, 0.9715576171875, 1.009979248046875, 1.04840087890625, 1.086822509765625, 1.125244140625, 1.163665771484375, 1.20208740234375, 1.240509033203125, 1.2789306640625, 1.317352294921875, 1.35577392578125, 1.394195556640625, 1.4326171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 9.0, 8.0, 11.0, 25.0, 40.0, 43.0, 91.0, 121.0, 121.0, 131.0, 131.0, 105.0, 68.0, 34.0, 21.0, 17.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.899139404296875, -0.85394287109375, -0.808746337890625, -0.7635498046875, -0.718353271484375, -0.67315673828125, -0.627960205078125, -0.582763671875, -0.537567138671875, -0.49237060546875, -0.447174072265625, -0.4019775390625, -0.356781005859375, -0.31158447265625, -0.266387939453125, -0.22119140625, -0.175994873046875, -0.13079833984375, -0.085601806640625, -0.0404052734375, 0.004791259765625, 0.04998779296875, 0.095184326171875, 0.140380859375, 0.185577392578125, 0.23077392578125, 0.275970458984375, 0.3211669921875, 0.366363525390625, 0.41156005859375, 0.456756591796875, 0.501953125, 0.547149658203125, 0.59234619140625, 0.637542724609375, 0.6827392578125, 0.727935791015625, 0.77313232421875, 0.818328857421875, 0.863525390625, 0.908721923828125, 0.95391845703125, 0.999114990234375, 1.0443115234375, 1.089508056640625, 1.13470458984375, 1.179901123046875, 1.22509765625, 1.270294189453125, 1.31549072265625, 1.360687255859375, 1.4058837890625, 1.451080322265625, 1.49627685546875, 1.541473388671875, 1.586669921875, 1.631866455078125, 1.67706298828125, 1.722259521484375, 1.7674560546875, 1.812652587890625, 1.85784912109375, 1.903045654296875, 1.9482421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 14.0, 11.0, 28.0, 45.0, 91.0, 168.0, 233.0, 164.0, 81.0, 53.0, 38.0, 23.0, 14.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.532609939575195, -9.185256004333496, -8.837903022766113, -8.490549087524414, -8.143196105957031, -7.795842170715332, -7.448488235473633, -7.101134777069092, -6.753781318664551, -6.40642786026001, -6.059074401855469, -5.7117204666137695, -5.3643670082092285, -5.0170135498046875, -4.669659614562988, -4.322306156158447, -3.9749526977539062, -3.6275992393493652, -3.280245542526245, -2.932891845703125, -2.585538387298584, -2.238184928894043, -1.8908312320709229, -1.5434775352478027, -1.1961240768432617, -0.8487704992294312, -0.5014169216156006, -0.15406334400177002, 0.19329023361206055, 0.5406438112258911, 0.8879973888397217, 1.2353510856628418, 1.5827054977416992, 1.9300590753555298, 2.2774126529693604, 2.6247663497924805, 2.9721198081970215, 3.3194732666015625, 3.6668269634246826, 4.014180660247803, 4.361534118652344, 4.708887577056885, 5.056241035461426, 5.403594970703125, 5.750948429107666, 6.098301887512207, 6.445655822753906, 6.793009281158447, 7.140362739562988, 7.487716197967529, 7.83506965637207, 8.18242359161377, 8.529777526855469, 8.877130508422852, 9.22448444366455, 9.57183837890625, 9.919191360473633, 10.266545295715332, 10.613898277282715, 10.961252212524414, 11.308605194091797, 11.655959129333496, 12.003313064575195, 12.350666046142578, 12.698019981384277]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 3.0, 8.0, 15.0, 15.0, 13.0, 39.0, 62.0, 106.0, 130.0, 167.0, 140.0, 99.0, 59.0, 30.0, 28.0, 14.0, 10.0, 6.0, 6.0, 5.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.883638381958008, -21.227081298828125, -20.57052230834961, -19.913965225219727, -19.257408142089844, -18.600849151611328, -17.944292068481445, -17.287734985351562, -16.631175994873047, -15.974617958068848, -15.318059921264648, -14.661502838134766, -14.004944801330566, -13.348386764526367, -12.691829681396484, -12.035271644592285, -11.378713607788086, -10.722155570983887, -10.065597534179688, -9.409040451049805, -8.752482414245605, -8.095924377441406, -7.439366817474365, -6.782809257507324, -6.126251220703125, -5.469693183898926, -4.813135623931885, -4.156578063964844, -3.5000200271606445, -2.8434622287750244, -2.1869044303894043, -1.5303468704223633, -0.8737907409667969, -0.21723294258117676, 0.43932485580444336, 1.0958826541900635, 1.7524404525756836, 2.4089982509613037, 3.065556049346924, 3.722113609313965, 4.378671646118164, 5.035229682922363, 5.691787242889404, 6.348344802856445, 7.0049028396606445, 7.661460876464844, 8.318017959594727, 8.974575996398926, 9.631134033203125, 10.287692070007324, 10.944250106811523, 11.600807189941406, 12.257365226745605, 12.913923263549805, 13.570480346679688, 14.227038383483887, 14.883596420288086, 15.540154457092285, 16.196712493896484, 16.853269577026367, 17.50982666015625, 18.166385650634766, 18.82294273376465, 19.47949981689453, 20.136058807373047]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 4.0, 13.0, 16.0, 25.0, 20.0, 33.0, 52.0, 76.0, 104.0, 125.0, 195.0, 255.0, 351.0, 457.0, 609.0, 907.0, 1297.0, 1928.0, 3221.0, 5923.0, 13002.0, 38951.0, 468225.0, 3567649.0, 57537.0, 15798.0, 6954.0, 3611.0, 2226.0, 1443.0, 963.0, 677.0, 466.0, 344.0, 234.0, 151.0, 121.0, 76.0, 73.0, 43.0, 33.0, 24.0, 17.0, 18.0, 13.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.412109375, -2.33929443359375, -2.2664794921875, -2.19366455078125, -2.120849609375, -2.04803466796875, -1.9752197265625, -1.90240478515625, -1.82958984375, -1.75677490234375, -1.6839599609375, -1.61114501953125, -1.538330078125, -1.46551513671875, -1.3927001953125, -1.31988525390625, -1.2470703125, -1.17425537109375, -1.1014404296875, -1.02862548828125, -0.955810546875, -0.88299560546875, -0.8101806640625, -0.73736572265625, -0.66455078125, -0.59173583984375, -0.5189208984375, -0.44610595703125, -0.373291015625, -0.30047607421875, -0.2276611328125, -0.15484619140625, -0.08203125, -0.00921630859375, 0.0635986328125, 0.13641357421875, 0.209228515625, 0.28204345703125, 0.3548583984375, 0.42767333984375, 0.50048828125, 0.57330322265625, 0.6461181640625, 0.71893310546875, 0.791748046875, 0.86456298828125, 0.9373779296875, 1.01019287109375, 1.0830078125, 1.15582275390625, 1.2286376953125, 1.30145263671875, 1.374267578125, 1.44708251953125, 1.5198974609375, 1.59271240234375, 1.66552734375, 1.73834228515625, 1.8111572265625, 1.88397216796875, 1.956787109375, 2.02960205078125, 2.1024169921875, 2.17523193359375, 2.248046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 12.0, 13.0, 18.0, 10.0, 27.0, 54.0, 96.0, 164.0, 219.0, 134.0, 79.0, 27.0, 21.0, 11.0, 10.0, 12.0, 5.0, 7.0, 6.0, 5.0, 8.0, 5.0, 8.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21610069274902344, -0.20917892456054688, -0.2022571563720703, -0.19533538818359375, -0.1884136199951172, -0.18149185180664062, -0.17457008361816406, -0.1676483154296875, -0.16072654724121094, -0.15380477905273438, -0.1468830108642578, -0.13996124267578125, -0.1330394744873047, -0.12611770629882812, -0.11919593811035156, -0.112274169921875, -0.10535240173339844, -0.09843063354492188, -0.09150886535644531, -0.08458709716796875, -0.07766532897949219, -0.07074356079101562, -0.06382179260253906, -0.0569000244140625, -0.04997825622558594, -0.043056488037109375, -0.03613471984863281, -0.02921295166015625, -0.022291183471679688, -0.015369415283203125, -0.008447647094726562, -0.00152587890625, 0.0053958892822265625, 0.012317657470703125, 0.019239425659179688, 0.02616119384765625, 0.03308296203613281, 0.040004730224609375, 0.04692649841308594, 0.0538482666015625, 0.06077003479003906, 0.06769180297851562, 0.07461357116699219, 0.08153533935546875, 0.08845710754394531, 0.09537887573242188, 0.10230064392089844, 0.109222412109375, 0.11614418029785156, 0.12306594848632812, 0.1299877166748047, 0.13690948486328125, 0.1438312530517578, 0.15075302124023438, 0.15767478942871094, 0.1645965576171875, 0.17151832580566406, 0.17844009399414062, 0.1853618621826172, 0.19228363037109375, 0.1992053985595703, 0.20612716674804688, 0.21304893493652344, 0.219970703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 15.0, 23.0, 21.0, 22.0, 43.0, 58.0, 76.0, 129.0, 162.0, 221.0, 385.0, 575.0, 813.0, 1251.0, 1941.0, 3234.0, 5487.0, 10211.0, 21073.0, 55148.0, 263442.0, 3427296.0, 299124.0, 58122.0, 21331.0, 10090.0, 5411.0, 3054.0, 1941.0, 1097.0, 777.0, 505.0, 371.0, 232.0, 161.0, 108.0, 81.0, 75.0, 42.0, 22.0, 25.0, 19.0, 17.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.494140625, -1.4481964111328125, -1.402252197265625, -1.3563079833984375, -1.31036376953125, -1.2644195556640625, -1.218475341796875, -1.1725311279296875, -1.1265869140625, -1.0806427001953125, -1.034698486328125, -0.9887542724609375, -0.94281005859375, -0.8968658447265625, -0.850921630859375, -0.8049774169921875, -0.759033203125, -0.7130889892578125, -0.667144775390625, -0.6212005615234375, -0.57525634765625, -0.5293121337890625, -0.483367919921875, -0.4374237060546875, -0.3914794921875, -0.3455352783203125, -0.299591064453125, -0.2536468505859375, -0.20770263671875, -0.1617584228515625, -0.115814208984375, -0.0698699951171875, -0.02392578125, 0.0220184326171875, 0.067962646484375, 0.1139068603515625, 0.15985107421875, 0.2057952880859375, 0.251739501953125, 0.2976837158203125, 0.3436279296875, 0.3895721435546875, 0.435516357421875, 0.4814605712890625, 0.52740478515625, 0.5733489990234375, 0.619293212890625, 0.6652374267578125, 0.711181640625, 0.7571258544921875, 0.803070068359375, 0.8490142822265625, 0.89495849609375, 0.9409027099609375, 0.986846923828125, 1.0327911376953125, 1.0787353515625, 1.1246795654296875, 1.170623779296875, 1.2165679931640625, 1.26251220703125, 1.3084564208984375, 1.354400634765625, 1.4003448486328125, 1.4462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 8.0, 2.0, 7.0, 12.0, 7.0, 12.0, 15.0, 10.0, 20.0, 25.0, 36.0, 43.0, 82.0, 178.0, 573.0, 2012.0, 483.0, 214.0, 124.0, 62.0, 40.0, 18.0, 17.0, 9.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.453125, -0.4409942626953125, -0.428863525390625, -0.4167327880859375, -0.40460205078125, -0.3924713134765625, -0.380340576171875, -0.3682098388671875, -0.3560791015625, -0.3439483642578125, -0.331817626953125, -0.3196868896484375, -0.30755615234375, -0.2954254150390625, -0.283294677734375, -0.2711639404296875, -0.259033203125, -0.2469024658203125, -0.234771728515625, -0.2226409912109375, -0.21051025390625, -0.1983795166015625, -0.186248779296875, -0.1741180419921875, -0.1619873046875, -0.1498565673828125, -0.137725830078125, -0.1255950927734375, -0.11346435546875, -0.1013336181640625, -0.089202880859375, -0.0770721435546875, -0.06494140625, -0.0528106689453125, -0.040679931640625, -0.0285491943359375, -0.01641845703125, -0.0042877197265625, 0.007843017578125, 0.0199737548828125, 0.0321044921875, 0.0442352294921875, 0.056365966796875, 0.0684967041015625, 0.08062744140625, 0.0927581787109375, 0.104888916015625, 0.1170196533203125, 0.129150390625, 0.1412811279296875, 0.153411865234375, 0.1655426025390625, 0.17767333984375, 0.1898040771484375, 0.201934814453125, 0.2140655517578125, 0.2261962890625, 0.2383270263671875, 0.250457763671875, 0.2625885009765625, 0.27471923828125, 0.2868499755859375, 0.298980712890625, 0.3111114501953125, 0.3232421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 39.0, 93.0, 370.0, 316.0, 83.0, 40.0, 19.0, 15.0, 4.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7284982204437256, -1.5678640604019165, -1.4072299003601074, -1.2465956211090088, -1.0859615802764893, -0.9253273606300354, -0.7646931409835815, -0.6040589809417725, -0.4434248208999634, -0.2827906608581543, -0.12215647101402283, 0.03847771883010864, 0.19911187887191772, 0.3597460389137268, 0.5203802585601807, 0.6810144186019897, 0.8416485786437988, 1.002282738685608, 1.162916898727417, 1.3235511779785156, 1.4841852188110352, 1.6448194980621338, 1.8054536581039429, 1.966087818145752, 2.1267218589782715, 2.28735613822937, 2.4479901790618896, 2.6086244583129883, 2.769258499145508, 2.9298927783966064, 3.090527057647705, 3.2511610984802246, 3.411795139312744, 3.5724294185638428, 3.7330634593963623, 3.893697738647461, 4.0543317794799805, 4.2149658203125, 4.375600337982178, 4.536234378814697, 4.696868419647217, 4.857502460479736, 5.018136978149414, 5.178771018981934, 5.339405059814453, 5.500039100646973, 5.66067361831665, 5.82130765914917, 5.981942176818848, 6.142576217651367, 6.303210735321045, 6.4638447761535645, 6.624478816986084, 6.7851128578186035, 6.945747375488281, 7.106381416320801, 7.26701545715332, 7.42764949798584, 7.588284015655518, 7.748918056488037, 7.909552097320557, 8.070186614990234, 8.230820655822754, 8.391454696655273, 8.552088737487793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 13.0, 24.0, 38.0, 44.0, 49.0, 72.0, 95.0, 82.0, 94.0, 85.0, 80.0, 74.0, 61.0, 37.0, 32.0, 26.0, 15.0, 21.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.585054874420166, -2.4972848892211914, -2.409514904022217, -2.321744918823242, -2.2339749336242676, -2.146204948425293, -2.0584349632263184, -1.9706652164459229, -1.8828952312469482, -1.7951252460479736, -1.707355260848999, -1.6195852756500244, -1.5318154096603394, -1.4440454244613647, -1.3562754392623901, -1.268505573272705, -1.180735468864441, -1.0929654836654663, -1.0051954984664917, -0.9174255728721619, -0.829655647277832, -0.7418856620788574, -0.6541156768798828, -0.566345751285553, -0.47857576608657837, -0.39080581068992615, -0.3030358552932739, -0.21526587009429932, -0.1274959146976471, -0.03972595930099487, 0.048044025897979736, 0.13581395149230957, 0.22358393669128418, 0.3113538920879364, 0.3991238474845886, 0.48689383268356323, 0.5746637582778931, 0.6624337434768677, 0.7502037286758423, 0.8379736542701721, 0.9257436394691467, 1.0135135650634766, 1.1012835502624512, 1.1890535354614258, 1.2768235206604004, 1.364593505859375, 1.4523634910583496, 1.5401333570480347, 1.6279033422470093, 1.7156733274459839, 1.8034433126449585, 1.8912131786346436, 1.9789831638336182, 2.0667531490325928, 2.1545231342315674, 2.242293119430542, 2.3300631046295166, 2.417833089828491, 2.505603075027466, 2.5933730602264404, 2.681143045425415, 2.7689127922058105, 2.856682777404785, 2.9444527626037598, 3.0322227478027344]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 27.0, 30.0, 45.0, 55.0, 88.0, 117.0, 166.0, 246.0, 351.0, 487.0, 761.0, 1073.0, 1659.0, 2739.0, 4374.0, 7843.0, 14667.0, 33647.0, 117876.0, 547799.0, 221257.0, 49483.0, 19535.0, 9669.0, 5390.0, 3179.0, 1980.0, 1326.0, 812.0, 548.0, 353.0, 281.0, 181.0, 150.0, 94.0, 66.0, 50.0, 28.0, 31.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.03369140625, -1.0, -0.96630859375, -0.9326171875, -0.89892578125, -0.865234375, -0.83154296875, -0.7978515625, -0.76416015625, -0.73046875, -0.69677734375, -0.6630859375, -0.62939453125, -0.595703125, -0.56201171875, -0.5283203125, -0.49462890625, -0.4609375, -0.42724609375, -0.3935546875, -0.35986328125, -0.326171875, -0.29248046875, -0.2587890625, -0.22509765625, -0.19140625, -0.15771484375, -0.1240234375, -0.09033203125, -0.056640625, -0.02294921875, 0.0107421875, 0.04443359375, 0.078125, 0.11181640625, 0.1455078125, 0.17919921875, 0.212890625, 0.24658203125, 0.2802734375, 0.31396484375, 0.34765625, 0.38134765625, 0.4150390625, 0.44873046875, 0.482421875, 0.51611328125, 0.5498046875, 0.58349609375, 0.6171875, 0.65087890625, 0.6845703125, 0.71826171875, 0.751953125, 0.78564453125, 0.8193359375, 0.85302734375, 0.88671875, 0.92041015625, 0.9541015625, 0.98779296875, 1.021484375, 1.05517578125, 1.0888671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 3.0, 5.0, 4.0, 15.0, 13.0, 13.0, 37.0, 43.0, 68.0, 94.0, 113.0, 126.0, 126.0, 80.0, 65.0, 43.0, 22.0, 22.0, 14.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.1686725616455078, -0.16315078735351562, -0.15762901306152344, -0.15210723876953125, -0.14658546447753906, -0.14106369018554688, -0.1355419158935547, -0.1300201416015625, -0.12449836730957031, -0.11897659301757812, -0.11345481872558594, -0.10793304443359375, -0.10241127014160156, -0.09688949584960938, -0.09136772155761719, -0.085845947265625, -0.08032417297363281, -0.07480239868164062, -0.06928062438964844, -0.06375885009765625, -0.05823707580566406, -0.052715301513671875, -0.04719352722167969, -0.0416717529296875, -0.03614997863769531, -0.030628204345703125, -0.025106430053710938, -0.01958465576171875, -0.014062881469726562, -0.008541107177734375, -0.0030193328857421875, 0.00250244140625, 0.008024215698242188, 0.013545989990234375, 0.019067764282226562, 0.02458953857421875, 0.030111312866210938, 0.035633087158203125, 0.04115486145019531, 0.0466766357421875, 0.05219841003417969, 0.057720184326171875, 0.06324195861816406, 0.06876373291015625, 0.07428550720214844, 0.07980728149414062, 0.08532905578613281, 0.090850830078125, 0.09637260437011719, 0.10189437866210938, 0.10741615295410156, 0.11293792724609375, 0.11845970153808594, 0.12398147583007812, 0.1295032501220703, 0.1350250244140625, 0.1405467987060547, 0.14606857299804688, 0.15159034729003906, 0.15711212158203125, 0.16263389587402344, 0.16815567016601562, 0.1736774444580078, 0.17919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 17.0, 28.0, 92.0, 193.0, 558.0, 1912.0, 8475.0, 48539.0, 393786.0, 518268.0, 62780.0, 10759.0, 2206.0, 599.0, 169.0, 89.0, 25.0, 10.0, 11.0, 8.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.44921875, -2.3910064697265625, -2.332794189453125, -2.2745819091796875, -2.21636962890625, -2.1581573486328125, -2.099945068359375, -2.0417327880859375, -1.9835205078125, -1.9253082275390625, -1.867095947265625, -1.8088836669921875, -1.75067138671875, -1.6924591064453125, -1.634246826171875, -1.5760345458984375, -1.517822265625, -1.4596099853515625, -1.401397705078125, -1.3431854248046875, -1.28497314453125, -1.2267608642578125, -1.168548583984375, -1.1103363037109375, -1.0521240234375, -0.9939117431640625, -0.935699462890625, -0.8774871826171875, -0.81927490234375, -0.7610626220703125, -0.702850341796875, -0.6446380615234375, -0.58642578125, -0.5282135009765625, -0.470001220703125, -0.4117889404296875, -0.35357666015625, -0.2953643798828125, -0.237152099609375, -0.1789398193359375, -0.1207275390625, -0.0625152587890625, -0.004302978515625, 0.0539093017578125, 0.11212158203125, 0.1703338623046875, 0.228546142578125, 0.2867584228515625, 0.344970703125, 0.4031829833984375, 0.461395263671875, 0.5196075439453125, 0.57781982421875, 0.6360321044921875, 0.694244384765625, 0.7524566650390625, 0.8106689453125, 0.8688812255859375, 0.927093505859375, 0.9853057861328125, 1.04351806640625, 1.1017303466796875, 1.159942626953125, 1.2181549072265625, 1.2763671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 4.0, 12.0, 10.0, 13.0, 15.0, 14.0, 25.0, 26.0, 28.0, 23.0, 37.0, 25.0, 43.0, 45.0, 44.0, 43.0, 45.0, 37.0, 32.0, 45.0, 52.0, 47.0, 39.0, 36.0, 39.0, 30.0, 24.0, 29.0, 17.0, 20.0, 18.0, 19.0, 6.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7307281494140625, -0.708526611328125, -0.6863250732421875, -0.66412353515625, -0.6419219970703125, -0.619720458984375, -0.5975189208984375, -0.5753173828125, -0.5531158447265625, -0.530914306640625, -0.5087127685546875, -0.48651123046875, -0.4643096923828125, -0.442108154296875, -0.4199066162109375, -0.397705078125, -0.3755035400390625, -0.353302001953125, -0.3311004638671875, -0.30889892578125, -0.2866973876953125, -0.264495849609375, -0.2422943115234375, -0.2200927734375, -0.1978912353515625, -0.175689697265625, -0.1534881591796875, -0.13128662109375, -0.1090850830078125, -0.086883544921875, -0.0646820068359375, -0.04248046875, -0.0202789306640625, 0.001922607421875, 0.0241241455078125, 0.04632568359375, 0.0685272216796875, 0.090728759765625, 0.1129302978515625, 0.1351318359375, 0.1573333740234375, 0.179534912109375, 0.2017364501953125, 0.22393798828125, 0.2461395263671875, 0.268341064453125, 0.2905426025390625, 0.312744140625, 0.3349456787109375, 0.357147216796875, 0.3793487548828125, 0.40155029296875, 0.4237518310546875, 0.445953369140625, 0.4681549072265625, 0.4903564453125, 0.5125579833984375, 0.534759521484375, 0.5569610595703125, 0.57916259765625, 0.6013641357421875, 0.623565673828125, 0.6457672119140625, 0.66796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 21.0, 94.0, 569.0, 36103.0, 1009069.0, 2391.0, 212.0, 44.0, 17.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8502197265625, -7.598876953125, -7.3475341796875, -7.09619140625, -6.8448486328125, -6.593505859375, -6.3421630859375, -6.0908203125, -5.8394775390625, -5.588134765625, -5.3367919921875, -5.08544921875, -4.8341064453125, -4.582763671875, -4.3314208984375, -4.080078125, -3.8287353515625, -3.577392578125, -3.3260498046875, -3.07470703125, -2.8233642578125, -2.572021484375, -2.3206787109375, -2.0693359375, -1.8179931640625, -1.566650390625, -1.3153076171875, -1.06396484375, -0.8126220703125, -0.561279296875, -0.3099365234375, -0.05859375, 0.1927490234375, 0.444091796875, 0.6954345703125, 0.94677734375, 1.1981201171875, 1.449462890625, 1.7008056640625, 1.9521484375, 2.2034912109375, 2.454833984375, 2.7061767578125, 2.95751953125, 3.2088623046875, 3.460205078125, 3.7115478515625, 3.962890625, 4.2142333984375, 4.465576171875, 4.7169189453125, 4.96826171875, 5.2196044921875, 5.470947265625, 5.7222900390625, 5.9736328125, 6.2249755859375, 6.476318359375, 6.7276611328125, 6.97900390625, 7.2303466796875, 7.481689453125, 7.7330322265625, 7.984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 7.0, 9.0, 9.0, 17.0, 38.0, 49.0, 71.0, 103.0, 134.0, 114.0, 111.0, 98.0, 64.0, 59.0, 38.0, 19.0, 13.0, 12.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010782480239868164, -0.00010478310286998749, -0.00010174140334129333, -9.869970381259918e-05, -9.565800428390503e-05, -9.261630475521088e-05, -8.957460522651672e-05, -8.653290569782257e-05, -8.349120616912842e-05, -8.044950664043427e-05, -7.740780711174011e-05, -7.436610758304596e-05, -7.13244080543518e-05, -6.828270852565765e-05, -6.52410089969635e-05, -6.219930946826935e-05, -5.9157609939575195e-05, -5.611591041088104e-05, -5.307421088218689e-05, -5.003251135349274e-05, -4.6990811824798584e-05, -4.394911229610443e-05, -4.090741276741028e-05, -3.7865713238716125e-05, -3.482401371002197e-05, -3.178231418132782e-05, -2.8740614652633667e-05, -2.5698915123939514e-05, -2.265721559524536e-05, -1.961551606655121e-05, -1.6573816537857056e-05, -1.3532117009162903e-05, -1.049041748046875e-05, -7.448717951774597e-06, -4.407018423080444e-06, -1.3653188943862915e-06, 1.6763806343078613e-06, 4.718080163002014e-06, 7.759779691696167e-06, 1.080147922039032e-05, 1.3843178749084473e-05, 1.6884878277778625e-05, 1.992657780647278e-05, 2.296827733516693e-05, 2.6009976863861084e-05, 2.9051676392555237e-05, 3.209337592124939e-05, 3.513507544994354e-05, 3.8176774978637695e-05, 4.121847450733185e-05, 4.4260174036026e-05, 4.7301873564720154e-05, 5.034357309341431e-05, 5.338527262210846e-05, 5.642697215080261e-05, 5.9468671679496765e-05, 6.251037120819092e-05, 6.555207073688507e-05, 6.859377026557922e-05, 7.163546979427338e-05, 7.467716932296753e-05, 7.771886885166168e-05, 8.076056838035583e-05, 8.380226790904999e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 38.0, 45.0, 62.0, 105.0, 198.0, 353.0, 675.0, 1488.0, 3448.0, 10119.0, 40093.0, 223842.0, 584376.0, 141574.0, 28359.0, 7979.0, 2989.0, 1319.0, 648.0, 313.0, 164.0, 122.0, 83.0, 46.0, 22.0, 14.0, 13.0, 13.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8389816284179688, -0.8083343505859375, -0.7776870727539062, -0.747039794921875, -0.7163925170898438, -0.6857452392578125, -0.6550979614257812, -0.62445068359375, -0.5938034057617188, -0.5631561279296875, -0.5325088500976562, -0.501861572265625, -0.47121429443359375, -0.4405670166015625, -0.40991973876953125, -0.3792724609375, -0.34862518310546875, -0.3179779052734375, -0.28733062744140625, -0.256683349609375, -0.22603607177734375, -0.1953887939453125, -0.16474151611328125, -0.13409423828125, -0.10344696044921875, -0.0727996826171875, -0.04215240478515625, -0.011505126953125, 0.01914215087890625, 0.0497894287109375, 0.08043670654296875, 0.111083984375, 0.14173126220703125, 0.1723785400390625, 0.20302581787109375, 0.233673095703125, 0.26432037353515625, 0.2949676513671875, 0.32561492919921875, 0.35626220703125, 0.38690948486328125, 0.4175567626953125, 0.44820404052734375, 0.478851318359375, 0.5094985961914062, 0.5401458740234375, 0.5707931518554688, 0.6014404296875, 0.6320877075195312, 0.6627349853515625, 0.6933822631835938, 0.724029541015625, 0.7546768188476562, 0.7853240966796875, 0.8159713745117188, 0.84661865234375, 0.8772659301757812, 0.9079132080078125, 0.9385604858398438, 0.969207763671875, 0.9998550415039062, 1.0305023193359375, 1.0611495971679688, 1.091796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 14.0, 10.0, 15.0, 18.0, 37.0, 55.0, 55.0, 57.0, 95.0, 108.0, 114.0, 107.0, 77.0, 66.0, 42.0, 31.0, 28.0, 19.0, 16.0, 12.0, 6.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6923828125, -0.6668853759765625, -0.641387939453125, -0.6158905029296875, -0.59039306640625, -0.5648956298828125, -0.539398193359375, -0.5139007568359375, -0.4884033203125, -0.4629058837890625, -0.437408447265625, -0.4119110107421875, -0.38641357421875, -0.3609161376953125, -0.335418701171875, -0.3099212646484375, -0.284423828125, -0.2589263916015625, -0.233428955078125, -0.2079315185546875, -0.18243408203125, -0.1569366455078125, -0.131439208984375, -0.1059417724609375, -0.0804443359375, -0.0549468994140625, -0.029449462890625, -0.0039520263671875, 0.02154541015625, 0.0470428466796875, 0.072540283203125, 0.0980377197265625, 0.12353515625, 0.1490325927734375, 0.174530029296875, 0.2000274658203125, 0.22552490234375, 0.2510223388671875, 0.276519775390625, 0.3020172119140625, 0.3275146484375, 0.3530120849609375, 0.378509521484375, 0.4040069580078125, 0.42950439453125, 0.4550018310546875, 0.480499267578125, 0.5059967041015625, 0.531494140625, 0.5569915771484375, 0.582489013671875, 0.6079864501953125, 0.63348388671875, 0.6589813232421875, 0.684478759765625, 0.7099761962890625, 0.7354736328125, 0.7609710693359375, 0.786468505859375, 0.8119659423828125, 0.83746337890625, 0.8629608154296875, 0.888458251953125, 0.9139556884765625, 0.939453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 7.0, 7.0, 34.0, 78.0, 232.0, 359.0, 174.0, 63.0, 24.0, 9.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.288938522338867, -12.865629196166992, -12.442319869995117, -12.019010543823242, -11.595702171325684, -11.172392845153809, -10.749083518981934, -10.325774192810059, -9.902464866638184, -9.479155540466309, -9.055846214294434, -8.632537841796875, -8.209228515625, -7.785919189453125, -7.36260986328125, -6.939300537109375, -6.515991687774658, -6.092682361602783, -5.669373512268066, -5.246064186096191, -4.822754859924316, -4.399445533752441, -3.9761366844177246, -3.5528273582458496, -3.1295182704925537, -2.706209182739258, -2.282899856567383, -1.859590768814087, -1.4362815618515015, -1.012972354888916, -0.5896632671356201, -0.16635394096374512, 0.2569551467895508, 0.6802643537521362, 1.1035735607147217, 1.5268826484680176, 1.950191855430603, 2.3735010623931885, 2.7968101501464844, 3.2201194763183594, 3.6434285640716553, 4.066737651824951, 4.490046977996826, 4.913355827331543, 5.336665153503418, 5.759974479675293, 6.183283805847168, 6.606593132019043, 7.02990198135376, 7.453211307525635, 7.876520156860352, 8.299829483032227, 8.723138809204102, 9.146448135375977, 9.569757461547852, 9.993066787719727, 10.416375160217285, 10.83968448638916, 11.262993812561035, 11.686302185058594, 12.109611511230469, 12.532920837402344, 12.956230163574219, 13.379539489746094, 13.802848815917969]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 21.0, 31.0, 48.0, 63.0, 78.0, 99.0, 126.0, 96.0, 89.0, 80.0, 77.0, 43.0, 25.0, 18.0, 17.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.368463516235352, -11.058740615844727, -10.749017715454102, -10.43929386138916, -10.129570960998535, -9.81984806060791, -9.510124206542969, -9.200401306152344, -8.890678405761719, -8.580955505371094, -8.271232604980469, -7.961508750915527, -7.651785850524902, -7.342062950134277, -7.032339572906494, -6.722616195678711, -6.412893295288086, -6.103170394897461, -5.793447017669678, -5.4837236404418945, -5.1740007400512695, -4.8642778396606445, -4.554554462432861, -4.244831085205078, -3.935108184814453, -3.625385046005249, -3.315661907196045, -3.005938768386841, -2.6962156295776367, -2.3864924907684326, -2.0767693519592285, -1.7670462131500244, -1.4573240280151367, -1.1476008892059326, -0.8378777503967285, -0.5281546115875244, -0.2184314727783203, 0.09129166603088379, 0.4010148048400879, 0.710737943649292, 1.020461082458496, 1.3301842212677002, 1.6399073600769043, 1.9496304988861084, 2.2593536376953125, 2.5690767765045166, 2.8787999153137207, 3.188523054122925, 3.498246192932129, 3.807969331741333, 4.117692470550537, 4.42741584777832, 4.737138748168945, 5.04686164855957, 5.3565850257873535, 5.666308403015137, 5.976031303405762, 6.285754203796387, 6.59547758102417, 6.905200958251953, 7.214923858642578, 7.524646759033203, 7.834370136260986, 8.14409351348877, 8.453816413879395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 15.0, 11.0, 26.0, 30.0, 56.0, 59.0, 89.0, 133.0, 226.0, 287.0, 509.0, 854.0, 1990.0, 4732.0, 18400.0, 533718.0, 3598484.0, 24700.0, 5617.0, 2055.0, 945.0, 476.0, 295.0, 190.0, 108.0, 85.0, 51.0, 38.0, 27.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6171875, -6.43377685546875, -6.2503662109375, -6.06695556640625, -5.883544921875, -5.70013427734375, -5.5167236328125, -5.33331298828125, -5.14990234375, -4.96649169921875, -4.7830810546875, -4.59967041015625, -4.416259765625, -4.23284912109375, -4.0494384765625, -3.86602783203125, -3.6826171875, -3.49920654296875, -3.3157958984375, -3.13238525390625, -2.948974609375, -2.76556396484375, -2.5821533203125, -2.39874267578125, -2.21533203125, -2.03192138671875, -1.8485107421875, -1.66510009765625, -1.481689453125, -1.29827880859375, -1.1148681640625, -0.93145751953125, -0.748046875, -0.56463623046875, -0.3812255859375, -0.19781494140625, -0.014404296875, 0.16900634765625, 0.3524169921875, 0.53582763671875, 0.71923828125, 0.90264892578125, 1.0860595703125, 1.26947021484375, 1.452880859375, 1.63629150390625, 1.8197021484375, 2.00311279296875, 2.1865234375, 2.36993408203125, 2.5533447265625, 2.73675537109375, 2.920166015625, 3.10357666015625, 3.2869873046875, 3.47039794921875, 3.65380859375, 3.83721923828125, 4.0206298828125, 4.20404052734375, 4.387451171875, 4.57086181640625, 4.7542724609375, 4.93768310546875, 5.12109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 9.0, 12.0, 18.0, 20.0, 29.0, 59.0, 76.0, 107.0, 118.0, 121.0, 106.0, 102.0, 57.0, 45.0, 18.0, 24.0, 8.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.2125415802001953, -0.20572280883789062, -0.19890403747558594, -0.19208526611328125, -0.18526649475097656, -0.17844772338867188, -0.1716289520263672, -0.1648101806640625, -0.1579914093017578, -0.15117263793945312, -0.14435386657714844, -0.13753509521484375, -0.13071632385253906, -0.12389755249023438, -0.11707878112792969, -0.110260009765625, -0.10344123840332031, -0.09662246704101562, -0.08980369567871094, -0.08298492431640625, -0.07616615295410156, -0.06934738159179688, -0.06252861022949219, -0.0557098388671875, -0.04889106750488281, -0.042072296142578125, -0.03525352478027344, -0.02843475341796875, -0.021615982055664062, -0.014797210693359375, -0.007978439331054688, -0.00115966796875, 0.0056591033935546875, 0.012477874755859375, 0.019296646118164062, 0.02611541748046875, 0.03293418884277344, 0.039752960205078125, 0.04657173156738281, 0.0533905029296875, 0.06020927429199219, 0.06702804565429688, 0.07384681701660156, 0.08066558837890625, 0.08748435974121094, 0.09430313110351562, 0.10112190246582031, 0.107940673828125, 0.11475944519042969, 0.12157821655273438, 0.12839698791503906, 0.13521575927734375, 0.14203453063964844, 0.14885330200195312, 0.1556720733642578, 0.1624908447265625, 0.1693096160888672, 0.17612838745117188, 0.18294715881347656, 0.18976593017578125, 0.19658470153808594, 0.20340347290039062, 0.2102222442626953, 0.217041015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 19.0, 19.0, 31.0, 31.0, 59.0, 78.0, 158.0, 789.0, 333734.0, 3857683.0, 1167.0, 195.0, 89.0, 68.0, 45.0, 33.0, 19.0, 11.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.541015625, -11.97265625, -11.404296875, -10.8359375, -10.267578125, -9.69921875, -9.130859375, -8.5625, -7.994140625, -7.42578125, -6.857421875, -6.2890625, -5.720703125, -5.15234375, -4.583984375, -4.015625, -3.447265625, -2.87890625, -2.310546875, -1.7421875, -1.173828125, -0.60546875, -0.037109375, 0.53125, 1.099609375, 1.66796875, 2.236328125, 2.8046875, 3.373046875, 3.94140625, 4.509765625, 5.078125, 5.646484375, 6.21484375, 6.783203125, 7.3515625, 7.919921875, 8.48828125, 9.056640625, 9.625, 10.193359375, 10.76171875, 11.330078125, 11.8984375, 12.466796875, 13.03515625, 13.603515625, 14.171875, 14.740234375, 15.30859375, 15.876953125, 16.4453125, 17.013671875, 17.58203125, 18.150390625, 18.71875, 19.287109375, 19.85546875, 20.423828125, 20.9921875, 21.560546875, 22.12890625, 22.697265625, 23.265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 18.0, 7.0, 18.0, 24.0, 32.0, 51.0, 83.0, 129.0, 219.0, 441.0, 1678.0, 713.0, 257.0, 124.0, 75.0, 52.0, 42.0, 32.0, 25.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5732421875, -0.5584335327148438, -0.5436248779296875, -0.5288162231445312, -0.514007568359375, -0.49919891357421875, -0.4843902587890625, -0.46958160400390625, -0.45477294921875, -0.43996429443359375, -0.4251556396484375, -0.41034698486328125, -0.395538330078125, -0.38072967529296875, -0.3659210205078125, -0.35111236572265625, -0.3363037109375, -0.32149505615234375, -0.3066864013671875, -0.29187774658203125, -0.277069091796875, -0.26226043701171875, -0.2474517822265625, -0.23264312744140625, -0.21783447265625, -0.20302581787109375, -0.1882171630859375, -0.17340850830078125, -0.158599853515625, -0.14379119873046875, -0.1289825439453125, -0.11417388916015625, -0.099365234375, -0.08455657958984375, -0.0697479248046875, -0.05493927001953125, -0.040130615234375, -0.02532196044921875, -0.0105133056640625, 0.00429534912109375, 0.01910400390625, 0.03391265869140625, 0.0487213134765625, 0.06352996826171875, 0.078338623046875, 0.09314727783203125, 0.1079559326171875, 0.12276458740234375, 0.1375732421875, 0.15238189697265625, 0.1671905517578125, 0.18199920654296875, 0.196807861328125, 0.21161651611328125, 0.2264251708984375, 0.24123382568359375, 0.25604248046875, 0.27085113525390625, 0.2856597900390625, 0.30046844482421875, 0.315277099609375, 0.33008575439453125, 0.3448944091796875, 0.35970306396484375, 0.37451171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 15.0, 22.0, 19.0, 29.0, 62.0, 88.0, 173.0, 159.0, 143.0, 104.0, 68.0, 34.0, 24.0, 12.0, 10.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378148317337036, -2.3036506175994873, -2.2291531562805176, -2.1546554565429688, -2.08015775680542, -2.00566029548645, -1.9311625957489014, -1.856665015220642, -1.7821674346923828, -1.7076698541641235, -1.6331722736358643, -1.5586745738983154, -1.4841769933700562, -1.4096794128417969, -1.335181713104248, -1.2606841325759888, -1.1861865520477295, -1.1116889715194702, -1.037191390991211, -0.9626936912536621, -0.8881961107254028, -0.8136985301971436, -0.7392008900642395, -0.6647032499313354, -0.5902056694030762, -0.5157080888748169, -0.44121044874191284, -0.3667128384113312, -0.2922152280807495, -0.21771761775016785, -0.14322000741958618, -0.06872236728668213, 0.005774974822998047, 0.08027258515357971, 0.15477019548416138, 0.22926780581474304, 0.3037654161453247, 0.37826302647590637, 0.45276063680648804, 0.5272582769393921, 0.6017558574676514, 0.6762534379959106, 0.7507510781288147, 0.8252487182617188, 0.899746298789978, 0.9742438793182373, 1.0487415790557861, 1.1232391595840454, 1.1977367401123047, 1.272234320640564, 1.3467319011688232, 1.421229600906372, 1.4957271814346313, 1.5702247619628906, 1.6447224617004395, 1.7192200422286987, 1.793717622756958, 1.8682152032852173, 1.9427127838134766, 2.0172104835510254, 2.091708183288574, 2.166205644607544, 2.2407033443450928, 2.3152008056640625, 2.3896985054016113]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 12.0, 19.0, 22.0, 18.0, 26.0, 35.0, 41.0, 38.0, 48.0, 57.0, 67.0, 67.0, 52.0, 66.0, 65.0, 55.0, 51.0, 56.0, 47.0, 30.0, 19.0, 22.0, 16.0, 17.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7533705234527588, -1.6853567361831665, -1.6173430681228638, -1.5493292808532715, -1.4813156127929688, -1.4133018255233765, -1.3452880382537842, -1.2772743701934814, -1.2092607021331787, -1.1412469148635864, -1.0732332468032837, -1.0052194595336914, -0.9372057914733887, -0.8691920042037964, -0.8011782765388489, -0.7331645488739014, -0.6651507616043091, -0.5971370339393616, -0.5291233062744141, -0.46110954880714417, -0.39309582114219666, -0.32508209347724915, -0.25706833600997925, -0.18905460834503174, -0.12104088068008423, -0.05302714556455612, 0.014986589550971985, 0.08300033211708069, 0.1510140597820282, 0.2190277874469757, 0.2870415449142456, 0.3550552725791931, 0.4230690002441406, 0.49108272790908813, 0.5590964555740356, 0.6271102428436279, 0.6951239109039307, 0.763137698173523, 0.8311514258384705, 0.899165153503418, 0.9671788811683655, 1.035192608833313, 1.1032063961029053, 1.171220064163208, 1.2392338514328003, 1.307247519493103, 1.3752613067626953, 1.443274974822998, 1.5112887620925903, 1.5793025493621826, 1.6473162174224854, 1.7153300046920776, 1.7833436727523804, 1.8513574600219727, 1.9193711280822754, 1.9873849153518677, 2.05539870262146, 2.1234123706817627, 2.1914262771606445, 2.2594399452209473, 2.32745361328125, 2.3954672813415527, 2.4634811878204346, 2.5314948558807373, 2.59950852394104]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 10.0, 6.0, 10.0, 14.0, 20.0, 30.0, 41.0, 52.0, 82.0, 131.0, 186.0, 320.0, 461.0, 900.0, 1833.0, 4715.0, 16211.0, 99137.0, 705809.0, 183069.0, 24219.0, 6231.0, 2336.0, 1087.0, 611.0, 349.0, 218.0, 142.0, 107.0, 79.0, 41.0, 22.0, 24.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.478515625, -2.404815673828125, -2.33111572265625, -2.257415771484375, -2.1837158203125, -2.110015869140625, -2.03631591796875, -1.962615966796875, -1.888916015625, -1.815216064453125, -1.74151611328125, -1.667816162109375, -1.5941162109375, -1.520416259765625, -1.44671630859375, -1.373016357421875, -1.29931640625, -1.225616455078125, -1.15191650390625, -1.078216552734375, -1.0045166015625, -0.930816650390625, -0.85711669921875, -0.783416748046875, -0.709716796875, -0.636016845703125, -0.56231689453125, -0.488616943359375, -0.4149169921875, -0.341217041015625, -0.26751708984375, -0.193817138671875, -0.1201171875, -0.046417236328125, 0.02728271484375, 0.100982666015625, 0.1746826171875, 0.248382568359375, 0.32208251953125, 0.395782470703125, 0.469482421875, 0.543182373046875, 0.61688232421875, 0.690582275390625, 0.7642822265625, 0.837982177734375, 0.91168212890625, 0.985382080078125, 1.05908203125, 1.132781982421875, 1.20648193359375, 1.280181884765625, 1.3538818359375, 1.427581787109375, 1.50128173828125, 1.574981689453125, 1.648681640625, 1.722381591796875, 1.79608154296875, 1.869781494140625, 1.9434814453125, 2.017181396484375, 2.09088134765625, 2.164581298828125, 2.23828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 7.0, 14.0, 21.0, 35.0, 67.0, 69.0, 99.0, 116.0, 135.0, 114.0, 103.0, 69.0, 50.0, 26.0, 19.0, 18.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210205078125, -0.20248031616210938, -0.19475555419921875, -0.18703079223632812, -0.1793060302734375, -0.17158126831054688, -0.16385650634765625, -0.15613174438476562, -0.148406982421875, -0.14068222045898438, -0.13295745849609375, -0.12523269653320312, -0.1175079345703125, -0.10978317260742188, -0.10205841064453125, -0.09433364868164062, -0.08660888671875, -0.07888412475585938, -0.07115936279296875, -0.06343460083007812, -0.0557098388671875, -0.047985076904296875, -0.04026031494140625, -0.032535552978515625, -0.024810791015625, -0.017086029052734375, -0.00936126708984375, -0.001636505126953125, 0.0060882568359375, 0.013813018798828125, 0.02153778076171875, 0.029262542724609375, 0.0369873046875, 0.044712066650390625, 0.05243682861328125, 0.060161590576171875, 0.0678863525390625, 0.07561111450195312, 0.08333587646484375, 0.09106063842773438, 0.098785400390625, 0.10651016235351562, 0.11423492431640625, 0.12195968627929688, 0.1296844482421875, 0.13740921020507812, 0.14513397216796875, 0.15285873413085938, 0.16058349609375, 0.16830825805664062, 0.17603302001953125, 0.18375778198242188, 0.1914825439453125, 0.19920730590820312, 0.20693206787109375, 0.21465682983398438, 0.222381591796875, 0.23010635375976562, 0.23783111572265625, 0.24555587768554688, 0.2532806396484375, 0.2610054016113281, 0.26873016357421875, 0.2764549255371094, 0.2841796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 27.0, 37.0, 54.0, 90.0, 110.0, 179.0, 247.0, 421.0, 605.0, 1013.0, 1685.0, 2929.0, 5146.0, 9695.0, 18800.0, 38538.0, 87884.0, 233314.0, 356271.0, 164350.0, 64836.0, 29671.0, 14534.0, 7522.0, 4219.0, 2426.0, 1386.0, 909.0, 567.0, 329.0, 205.0, 158.0, 105.0, 75.0, 51.0, 31.0, 23.0, 17.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.0375823974609375, -1.000946044921875, -0.9643096923828125, -0.92767333984375, -0.8910369873046875, -0.854400634765625, -0.8177642822265625, -0.7811279296875, -0.7444915771484375, -0.707855224609375, -0.6712188720703125, -0.63458251953125, -0.5979461669921875, -0.561309814453125, -0.5246734619140625, -0.488037109375, -0.4514007568359375, -0.414764404296875, -0.3781280517578125, -0.34149169921875, -0.3048553466796875, -0.268218994140625, -0.2315826416015625, -0.1949462890625, -0.1583099365234375, -0.121673583984375, -0.0850372314453125, -0.04840087890625, -0.0117645263671875, 0.024871826171875, 0.0615081787109375, 0.09814453125, 0.1347808837890625, 0.171417236328125, 0.2080535888671875, 0.24468994140625, 0.2813262939453125, 0.317962646484375, 0.3545989990234375, 0.3912353515625, 0.4278717041015625, 0.464508056640625, 0.5011444091796875, 0.53778076171875, 0.5744171142578125, 0.611053466796875, 0.6476898193359375, 0.684326171875, 0.7209625244140625, 0.757598876953125, 0.7942352294921875, 0.83087158203125, 0.8675079345703125, 0.904144287109375, 0.9407806396484375, 0.9774169921875, 1.0140533447265625, 1.050689697265625, 1.0873260498046875, 1.12396240234375, 1.1605987548828125, 1.197235107421875, 1.2338714599609375, 1.2705078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 8.0, 7.0, 8.0, 5.0, 17.0, 21.0, 22.0, 18.0, 24.0, 21.0, 37.0, 41.0, 25.0, 46.0, 46.0, 33.0, 41.0, 55.0, 60.0, 37.0, 53.0, 34.0, 35.0, 39.0, 32.0, 25.0, 28.0, 35.0, 29.0, 24.0, 14.0, 12.0, 16.0, 4.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92138671875, -0.8895187377929688, -0.8576507568359375, -0.8257827758789062, -0.793914794921875, -0.7620468139648438, -0.7301788330078125, -0.6983108520507812, -0.66644287109375, -0.6345748901367188, -0.6027069091796875, -0.5708389282226562, -0.538970947265625, -0.5071029663085938, -0.4752349853515625, -0.44336700439453125, -0.4114990234375, -0.37963104248046875, -0.3477630615234375, -0.31589508056640625, -0.284027099609375, -0.25215911865234375, -0.2202911376953125, -0.18842315673828125, -0.15655517578125, -0.12468719482421875, -0.0928192138671875, -0.06095123291015625, -0.029083251953125, 0.00278472900390625, 0.0346527099609375, 0.06652069091796875, 0.098388671875, 0.13025665283203125, 0.1621246337890625, 0.19399261474609375, 0.225860595703125, 0.25772857666015625, 0.2895965576171875, 0.32146453857421875, 0.35333251953125, 0.38520050048828125, 0.4170684814453125, 0.44893646240234375, 0.480804443359375, 0.5126724243164062, 0.5445404052734375, 0.5764083862304688, 0.6082763671875, 0.6401443481445312, 0.6720123291015625, 0.7038803100585938, 0.735748291015625, 0.7676162719726562, 0.7994842529296875, 0.8313522338867188, 0.86322021484375, 0.8950881958007812, 0.9269561767578125, 0.9588241577148438, 0.990692138671875, 1.0225601196289062, 1.0544281005859375, 1.0862960815429688, 1.1181640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 6.0, 12.0, 13.0, 31.0, 36.0, 52.0, 67.0, 125.0, 199.0, 372.0, 735.0, 1617.0, 4382.0, 16346.0, 108219.0, 674712.0, 206463.0, 25172.0, 5849.0, 2118.0, 894.0, 437.0, 253.0, 148.0, 89.0, 63.0, 31.0, 32.0, 14.0, 18.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.459716796875, -1.41357421875, -1.367431640625, -1.3212890625, -1.275146484375, -1.22900390625, -1.182861328125, -1.13671875, -1.090576171875, -1.04443359375, -0.998291015625, -0.9521484375, -0.906005859375, -0.85986328125, -0.813720703125, -0.767578125, -0.721435546875, -0.67529296875, -0.629150390625, -0.5830078125, -0.536865234375, -0.49072265625, -0.444580078125, -0.3984375, -0.352294921875, -0.30615234375, -0.260009765625, -0.2138671875, -0.167724609375, -0.12158203125, -0.075439453125, -0.029296875, 0.016845703125, 0.06298828125, 0.109130859375, 0.1552734375, 0.201416015625, 0.24755859375, 0.293701171875, 0.33984375, 0.385986328125, 0.43212890625, 0.478271484375, 0.5244140625, 0.570556640625, 0.61669921875, 0.662841796875, 0.708984375, 0.755126953125, 0.80126953125, 0.847412109375, 0.8935546875, 0.939697265625, 0.98583984375, 1.031982421875, 1.078125, 1.124267578125, 1.17041015625, 1.216552734375, 1.2626953125, 1.308837890625, 1.35498046875, 1.401123046875, 1.447265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 12.0, 24.0, 19.0, 34.0, 43.0, 51.0, 64.0, 67.0, 100.0, 110.0, 93.0, 71.0, 59.0, 46.0, 36.0, 31.0, 30.0, 20.0, 17.0, 15.0, 5.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013208389282226562, -0.00012873392552137375, -0.00012538395822048187, -0.00012203399091959, -0.00011868402361869812, -0.00011533405631780624, -0.00011198408901691437, -0.00010863412171602249, -0.00010528415441513062, -0.00010193418711423874, -9.858421981334686e-05, -9.523425251245499e-05, -9.188428521156311e-05, -8.853431791067123e-05, -8.518435060977936e-05, -8.183438330888748e-05, -7.84844160079956e-05, -7.513444870710373e-05, -7.178448140621185e-05, -6.843451410531998e-05, -6.50845468044281e-05, -6.173457950353622e-05, -5.838461220264435e-05, -5.503464490175247e-05, -5.1684677600860596e-05, -4.833471029996872e-05, -4.498474299907684e-05, -4.163477569818497e-05, -3.828480839729309e-05, -3.4934841096401215e-05, -3.158487379550934e-05, -2.8234906494617462e-05, -2.4884939193725586e-05, -2.153497189283371e-05, -1.8185004591941833e-05, -1.4835037291049957e-05, -1.1485069990158081e-05, -8.135102689266205e-06, -4.785135388374329e-06, -1.4351680874824524e-06, 1.914799213409424e-06, 5.2647665143013e-06, 8.614733815193176e-06, 1.1964701116085052e-05, 1.531466841697693e-05, 1.8664635717868805e-05, 2.201460301876068e-05, 2.5364570319652557e-05, 2.8714537620544434e-05, 3.206450492143631e-05, 3.5414472222328186e-05, 3.876443952322006e-05, 4.211440682411194e-05, 4.5464374125003815e-05, 4.881434142589569e-05, 5.216430872678757e-05, 5.551427602767944e-05, 5.886424332857132e-05, 6.22142106294632e-05, 6.556417793035507e-05, 6.891414523124695e-05, 7.226411253213882e-05, 7.56140798330307e-05, 7.896404713392258e-05, 8.231401443481445e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 10.0, 14.0, 24.0, 28.0, 63.0, 98.0, 195.0, 362.0, 912.0, 2739.0, 12808.0, 245221.0, 748810.0, 30382.0, 4399.0, 1324.0, 527.0, 268.0, 132.0, 96.0, 34.0, 26.0, 19.0, 18.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.504241943359375, -2.42645263671875, -2.348663330078125, -2.2708740234375, -2.193084716796875, -2.11529541015625, -2.037506103515625, -1.959716796875, -1.881927490234375, -1.80413818359375, -1.726348876953125, -1.6485595703125, -1.570770263671875, -1.49298095703125, -1.415191650390625, -1.33740234375, -1.259613037109375, -1.18182373046875, -1.104034423828125, -1.0262451171875, -0.948455810546875, -0.87066650390625, -0.792877197265625, -0.715087890625, -0.637298583984375, -0.55950927734375, -0.481719970703125, -0.4039306640625, -0.326141357421875, -0.24835205078125, -0.170562744140625, -0.0927734375, -0.014984130859375, 0.06280517578125, 0.140594482421875, 0.2183837890625, 0.296173095703125, 0.37396240234375, 0.451751708984375, 0.529541015625, 0.607330322265625, 0.68511962890625, 0.762908935546875, 0.8406982421875, 0.918487548828125, 0.99627685546875, 1.074066162109375, 1.15185546875, 1.229644775390625, 1.30743408203125, 1.385223388671875, 1.4630126953125, 1.540802001953125, 1.61859130859375, 1.696380615234375, 1.774169921875, 1.851959228515625, 1.92974853515625, 2.007537841796875, 2.0853271484375, 2.163116455078125, 2.24090576171875, 2.318695068359375, 2.396484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 12.0, 27.0, 42.0, 49.0, 82.0, 102.0, 144.0, 141.0, 138.0, 76.0, 76.0, 44.0, 24.0, 13.0, 5.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6004791259765625, -0.569122314453125, -0.5377655029296875, -0.50640869140625, -0.4750518798828125, -0.443695068359375, -0.4123382568359375, -0.3809814453125, -0.3496246337890625, -0.318267822265625, -0.2869110107421875, -0.25555419921875, -0.2241973876953125, -0.192840576171875, -0.1614837646484375, -0.130126953125, -0.0987701416015625, -0.067413330078125, -0.0360565185546875, -0.00469970703125, 0.0266571044921875, 0.058013916015625, 0.0893707275390625, 0.1207275390625, 0.1520843505859375, 0.183441162109375, 0.2147979736328125, 0.24615478515625, 0.2775115966796875, 0.308868408203125, 0.3402252197265625, 0.37158203125, 0.4029388427734375, 0.434295654296875, 0.4656524658203125, 0.49700927734375, 0.5283660888671875, 0.559722900390625, 0.5910797119140625, 0.6224365234375, 0.6537933349609375, 0.685150146484375, 0.7165069580078125, 0.74786376953125, 0.7792205810546875, 0.810577392578125, 0.8419342041015625, 0.873291015625, 0.9046478271484375, 0.936004638671875, 0.9673614501953125, 0.99871826171875, 1.0300750732421875, 1.061431884765625, 1.0927886962890625, 1.1241455078125, 1.1555023193359375, 1.186859130859375, 1.2182159423828125, 1.24957275390625, 1.2809295654296875, 1.312286376953125, 1.3436431884765625, 1.375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 14.0, 25.0, 53.0, 83.0, 138.0, 201.0, 191.0, 122.0, 57.0, 30.0, 21.0, 13.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.404948234558105, -10.979870796203613, -10.554794311523438, -10.129716873168945, -9.704639434814453, -9.279562950134277, -8.854485511779785, -8.42940902709961, -8.004331588745117, -7.579254627227783, -7.154177665710449, -6.729100227355957, -6.304023265838623, -5.878946304321289, -5.453868865966797, -5.028791904449463, -4.603714942932129, -4.178637981414795, -3.753560781478882, -3.3284835815429688, -2.9034066200256348, -2.478329658508301, -2.0532524585723877, -1.6281752586364746, -1.2030982971191406, -0.7780212163925171, -0.35294413566589355, 0.07213294506072998, 0.4972100257873535, 0.9222869873046875, 1.3473641872406006, 1.7724413871765137, 2.197519302368164, 2.622596263885498, 3.047673463821411, 3.472750663757324, 3.897827625274658, 4.322904586791992, 4.747982025146484, 5.173058986663818, 5.598135948181152, 6.023212909698486, 6.44828987121582, 6.8733673095703125, 7.2984442710876465, 7.7235212326049805, 8.148598670959473, 8.573675155639648, 8.99875259399414, 9.423830032348633, 9.848906517028809, 10.2739839553833, 10.699060440063477, 11.124137878417969, 11.549215316772461, 11.974292755126953, 12.399369239807129, 12.824446678161621, 13.249523162841797, 13.674600601196289, 14.099678039550781, 14.524754524230957, 14.94983196258545, 15.374908447265625, 15.799985885620117]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 15.0, 15.0, 25.0, 40.0, 37.0, 45.0, 85.0, 65.0, 84.0, 83.0, 81.0, 90.0, 82.0, 61.0, 43.0, 40.0, 19.0, 19.0, 14.0, 16.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.438114166259766, -13.978090286254883, -13.518067359924316, -13.058043479919434, -12.598020553588867, -12.137996673583984, -11.677972793579102, -11.217948913574219, -10.757925987243652, -10.29790210723877, -9.837879180908203, -9.37785530090332, -8.917831420898438, -8.457808494567871, -7.997784614562988, -7.537761211395264, -7.077737808227539, -6.6177144050598145, -6.15769100189209, -5.697667121887207, -5.237643718719482, -4.777620315551758, -4.317596435546875, -3.8575730323791504, -3.397549629211426, -2.937526226043701, -2.4775025844573975, -2.0174789428710938, -1.5574555397033691, -1.0974321365356445, -0.6374084949493408, -0.1773848533630371, 0.2826385498046875, 0.7426620721817017, 1.2026855945587158, 1.66270911693573, 2.122732639312744, 2.5827560424804688, 3.0427796840667725, 3.502803325653076, 3.962826728820801, 4.422850131988525, 4.88287353515625, 5.342897415161133, 5.802920818328857, 6.262944221496582, 6.722968101501465, 7.1829915046691895, 7.643014907836914, 8.103038787841797, 8.563061714172363, 9.023085594177246, 9.483108520507812, 9.943132400512695, 10.403156280517578, 10.863180160522461, 11.323203086853027, 11.78322696685791, 12.243249893188477, 12.70327377319336, 13.163297653198242, 13.623320579528809, 14.083344459533691, 14.543367385864258, 15.00339126586914]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 5.0, 16.0, 22.0, 39.0, 96.0, 187.0, 373.0, 1015.0, 4843.0, 242356.0, 3936734.0, 6964.0, 1058.0, 333.0, 124.0, 50.0, 27.0, 14.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.786865234375, -21.18310546875, -20.579345703125, -19.9755859375, -19.371826171875, -18.76806640625, -18.164306640625, -17.560546875, -16.956787109375, -16.35302734375, -15.749267578125, -15.1455078125, -14.541748046875, -13.93798828125, -13.334228515625, -12.73046875, -12.126708984375, -11.52294921875, -10.919189453125, -10.3154296875, -9.711669921875, -9.10791015625, -8.504150390625, -7.900390625, -7.296630859375, -6.69287109375, -6.089111328125, -5.4853515625, -4.881591796875, -4.27783203125, -3.674072265625, -3.0703125, -2.466552734375, -1.86279296875, -1.259033203125, -0.6552734375, -0.051513671875, 0.55224609375, 1.156005859375, 1.759765625, 2.363525390625, 2.96728515625, 3.571044921875, 4.1748046875, 4.778564453125, 5.38232421875, 5.986083984375, 6.58984375, 7.193603515625, 7.79736328125, 8.401123046875, 9.0048828125, 9.608642578125, 10.21240234375, 10.816162109375, 11.419921875, 12.023681640625, 12.62744140625, 13.231201171875, 13.8349609375, 14.438720703125, 15.04248046875, 15.646240234375, 16.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 19.0, 30.0, 31.0, 70.0, 92.0, 117.0, 142.0, 130.0, 118.0, 87.0, 46.0, 39.0, 22.0, 12.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5353240966796875, -0.520355224609375, -0.5053863525390625, -0.49041748046875, -0.4754486083984375, -0.460479736328125, -0.4455108642578125, -0.4305419921875, -0.4155731201171875, -0.400604248046875, -0.3856353759765625, -0.37066650390625, -0.3556976318359375, -0.340728759765625, -0.3257598876953125, -0.310791015625, -0.2958221435546875, -0.280853271484375, -0.2658843994140625, -0.25091552734375, -0.2359466552734375, -0.220977783203125, -0.2060089111328125, -0.1910400390625, -0.1760711669921875, -0.161102294921875, -0.1461334228515625, -0.13116455078125, -0.1161956787109375, -0.101226806640625, -0.0862579345703125, -0.0712890625, -0.0563201904296875, -0.041351318359375, -0.0263824462890625, -0.01141357421875, 0.0035552978515625, 0.018524169921875, 0.0334930419921875, 0.0484619140625, 0.0634307861328125, 0.078399658203125, 0.0933685302734375, 0.10833740234375, 0.1233062744140625, 0.138275146484375, 0.1532440185546875, 0.168212890625, 0.1831817626953125, 0.198150634765625, 0.2131195068359375, 0.22808837890625, 0.2430572509765625, 0.258026123046875, 0.2729949951171875, 0.2879638671875, 0.3029327392578125, 0.317901611328125, 0.3328704833984375, 0.34783935546875, 0.3628082275390625, 0.377777099609375, 0.3927459716796875, 0.40771484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 12.0, 12.0, 35.0, 46.0, 56.0, 126.0, 232.0, 657.0, 2711.0, 23682.0, 3856970.0, 297438.0, 9935.0, 1478.0, 403.0, 176.0, 112.0, 56.0, 43.0, 31.0, 34.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.42578125, -5.17718505859375, -4.9285888671875, -4.67999267578125, -4.431396484375, -4.18280029296875, -3.9342041015625, -3.68560791015625, -3.43701171875, -3.18841552734375, -2.9398193359375, -2.69122314453125, -2.442626953125, -2.19403076171875, -1.9454345703125, -1.69683837890625, -1.4482421875, -1.19964599609375, -0.9510498046875, -0.70245361328125, -0.453857421875, -0.20526123046875, 0.0433349609375, 0.29193115234375, 0.54052734375, 0.78912353515625, 1.0377197265625, 1.28631591796875, 1.534912109375, 1.78350830078125, 2.0321044921875, 2.28070068359375, 2.529296875, 2.77789306640625, 3.0264892578125, 3.27508544921875, 3.523681640625, 3.77227783203125, 4.0208740234375, 4.26947021484375, 4.51806640625, 4.76666259765625, 5.0152587890625, 5.26385498046875, 5.512451171875, 5.76104736328125, 6.0096435546875, 6.25823974609375, 6.5068359375, 6.75543212890625, 7.0040283203125, 7.25262451171875, 7.501220703125, 7.74981689453125, 7.9984130859375, 8.24700927734375, 8.49560546875, 8.74420166015625, 8.9927978515625, 9.24139404296875, 9.489990234375, 9.73858642578125, 9.9871826171875, 10.23577880859375, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 9.0, 9.0, 19.0, 28.0, 36.0, 62.0, 68.0, 147.0, 348.0, 1751.0, 915.0, 263.0, 132.0, 76.0, 42.0, 41.0, 25.0, 21.0, 17.0, 10.0, 5.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6959381103515625, -0.674102783203125, -0.6522674560546875, -0.63043212890625, -0.6085968017578125, -0.586761474609375, -0.5649261474609375, -0.5430908203125, -0.5212554931640625, -0.499420166015625, -0.4775848388671875, -0.45574951171875, -0.4339141845703125, -0.412078857421875, -0.3902435302734375, -0.368408203125, -0.3465728759765625, -0.324737548828125, -0.3029022216796875, -0.28106689453125, -0.2592315673828125, -0.237396240234375, -0.2155609130859375, -0.1937255859375, -0.1718902587890625, -0.150054931640625, -0.1282196044921875, -0.10638427734375, -0.0845489501953125, -0.062713623046875, -0.0408782958984375, -0.01904296875, 0.0027923583984375, 0.024627685546875, 0.0464630126953125, 0.06829833984375, 0.0901336669921875, 0.111968994140625, 0.1338043212890625, 0.1556396484375, 0.1774749755859375, 0.199310302734375, 0.2211456298828125, 0.24298095703125, 0.2648162841796875, 0.286651611328125, 0.3084869384765625, 0.330322265625, 0.3521575927734375, 0.373992919921875, 0.3958282470703125, 0.41766357421875, 0.4394989013671875, 0.461334228515625, 0.4831695556640625, 0.5050048828125, 0.5268402099609375, 0.548675537109375, 0.5705108642578125, 0.59234619140625, 0.6141815185546875, 0.636016845703125, 0.6578521728515625, 0.6796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 16.0, 98.0, 535.0, 302.0, 44.0, 12.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.450634002685547, -20.897205352783203, -20.34377670288086, -19.790348052978516, -19.236919403076172, -18.683490753173828, -18.130062103271484, -17.57663345336914, -17.023204803466797, -16.469776153564453, -15.91634750366211, -15.362918853759766, -14.809490203857422, -14.256061553955078, -13.702632904052734, -13.14920425415039, -12.59577465057373, -12.042346000671387, -11.488917350769043, -10.9354887008667, -10.382060050964355, -9.828631401062012, -9.275201797485352, -8.721773147583008, -8.168344497680664, -7.61491584777832, -7.061487197875977, -6.508058547973633, -5.954629898071289, -5.401201248168945, -4.847772121429443, -4.2943434715271, -3.740915298461914, -3.1874866485595703, -2.6340579986572266, -2.0806291103363037, -1.52720046043396, -0.9737718105316162, -0.42034292221069336, 0.1330857276916504, 0.6865143775939941, 1.239943027496338, 1.7933717966079712, 2.3468005657196045, 2.9002292156219482, 3.453657865524292, 4.007086753845215, 4.560515403747559, 5.113944053649902, 5.667372703552246, 6.22080135345459, 6.774230003356934, 7.327658653259277, 7.881087303161621, 8.434516906738281, 8.987945556640625, 9.541374206542969, 10.094802856445312, 10.648231506347656, 11.20166015625, 11.755088806152344, 12.308517456054688, 12.861946105957031, 13.415374755859375, 13.968803405761719]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 11.0, 14.0, 18.0, 20.0, 28.0, 34.0, 47.0, 55.0, 54.0, 61.0, 71.0, 62.0, 60.0, 71.0, 66.0, 54.0, 50.0, 55.0, 39.0, 24.0, 26.0, 24.0, 20.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.167453289031982, -4.066217422485352, -3.9649815559387207, -3.86374568939209, -3.76250958442688, -3.661273717880249, -3.560037851333618, -3.4588019847869873, -3.3575661182403564, -3.2563302516937256, -3.1550943851470947, -3.0538582801818848, -2.952622413635254, -2.851386547088623, -2.750150680541992, -2.6489148139953613, -2.5476789474487305, -2.4464430809020996, -2.3452072143554688, -2.243971347808838, -2.142735242843628, -2.041499376296997, -1.9402635097503662, -1.8390276432037354, -1.7377915382385254, -1.6365556716918945, -1.5353196859359741, -1.4340838193893433, -1.3328479528427124, -1.231611967086792, -1.1303761005401611, -1.0291402339935303, -0.9279043674468994, -0.8266684412956238, -0.7254325747489929, -0.6241966485977173, -0.5229607820510864, -0.4217248558998108, -0.32048892974853516, -0.2192530632019043, -0.11801713705062866, -0.016781233251094818, 0.08445467054843903, 0.18569058179855347, 0.2869264781475067, 0.38816237449645996, 0.4893983006477356, 0.5906341671943665, 0.6918700933456421, 0.7931060194969177, 0.8943418860435486, 0.9955778121948242, 1.096813678741455, 1.198049545288086, 1.2992855310440063, 1.4005213975906372, 1.5017573833465576, 1.6029932498931885, 1.7042292356491089, 1.8054651021957397, 1.9067009687423706, 2.007936954498291, 2.109172821044922, 2.2104086875915527, 2.3116445541381836]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 10.0, 8.0, 8.0, 7.0, 12.0, 22.0, 37.0, 34.0, 45.0, 55.0, 73.0, 101.0, 153.0, 206.0, 309.0, 478.0, 747.0, 1253.0, 2759.0, 7521.0, 32104.0, 267888.0, 631366.0, 80394.0, 13965.0, 4194.0, 1904.0, 942.0, 606.0, 363.0, 259.0, 192.0, 135.0, 97.0, 81.0, 49.0, 34.0, 29.0, 31.0, 22.0, 16.0, 5.0, 12.0, 6.0, 1.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.769134521484375, -2.67108154296875, -2.573028564453125, -2.4749755859375, -2.376922607421875, -2.27886962890625, -2.180816650390625, -2.082763671875, -1.984710693359375, -1.88665771484375, -1.788604736328125, -1.6905517578125, -1.592498779296875, -1.49444580078125, -1.396392822265625, -1.29833984375, -1.200286865234375, -1.10223388671875, -1.004180908203125, -0.9061279296875, -0.808074951171875, -0.71002197265625, -0.611968994140625, -0.513916015625, -0.415863037109375, -0.31781005859375, -0.219757080078125, -0.1217041015625, -0.023651123046875, 0.07440185546875, 0.172454833984375, 0.2705078125, 0.368560791015625, 0.46661376953125, 0.564666748046875, 0.6627197265625, 0.760772705078125, 0.85882568359375, 0.956878662109375, 1.054931640625, 1.152984619140625, 1.25103759765625, 1.349090576171875, 1.4471435546875, 1.545196533203125, 1.64324951171875, 1.741302490234375, 1.83935546875, 1.937408447265625, 2.03546142578125, 2.133514404296875, 2.2315673828125, 2.329620361328125, 2.42767333984375, 2.525726318359375, 2.623779296875, 2.721832275390625, 2.81988525390625, 2.917938232421875, 3.0159912109375, 3.114044189453125, 3.21209716796875, 3.310150146484375, 3.408203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 15.0, 28.0, 72.0, 87.0, 117.0, 158.0, 172.0, 130.0, 95.0, 49.0, 37.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5757675170898438, -0.5577850341796875, -0.5398025512695312, -0.521820068359375, -0.5038375854492188, -0.4858551025390625, -0.46787261962890625, -0.44989013671875, -0.43190765380859375, -0.4139251708984375, -0.39594268798828125, -0.377960205078125, -0.35997772216796875, -0.3419952392578125, -0.32401275634765625, -0.3060302734375, -0.28804779052734375, -0.2700653076171875, -0.25208282470703125, -0.234100341796875, -0.21611785888671875, -0.1981353759765625, -0.18015289306640625, -0.16217041015625, -0.14418792724609375, -0.1262054443359375, -0.10822296142578125, -0.090240478515625, -0.07225799560546875, -0.0542755126953125, -0.03629302978515625, -0.018310546875, -0.00032806396484375, 0.0176544189453125, 0.03563690185546875, 0.053619384765625, 0.07160186767578125, 0.0895843505859375, 0.10756683349609375, 0.12554931640625, 0.14353179931640625, 0.1615142822265625, 0.17949676513671875, 0.197479248046875, 0.21546173095703125, 0.2334442138671875, 0.25142669677734375, 0.2694091796875, 0.28739166259765625, 0.3053741455078125, 0.32335662841796875, 0.341339111328125, 0.35932159423828125, 0.3773040771484375, 0.39528656005859375, 0.41326904296875, 0.43125152587890625, 0.4492340087890625, 0.46721649169921875, 0.485198974609375, 0.5031814575195312, 0.5211639404296875, 0.5391464233398438, 0.55712890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 10.0, 16.0, 27.0, 33.0, 44.0, 66.0, 108.0, 157.0, 265.0, 475.0, 851.0, 1645.0, 3416.0, 8335.0, 27350.0, 140322.0, 625875.0, 187232.0, 34374.0, 9788.0, 3887.0, 1889.0, 943.0, 552.0, 301.0, 215.0, 107.0, 72.0, 47.0, 30.0, 13.0, 14.0, 14.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -1.991455078125, -1.91650390625, -1.841552734375, -1.7666015625, -1.691650390625, -1.61669921875, -1.541748046875, -1.466796875, -1.391845703125, -1.31689453125, -1.241943359375, -1.1669921875, -1.092041015625, -1.01708984375, -0.942138671875, -0.8671875, -0.792236328125, -0.71728515625, -0.642333984375, -0.5673828125, -0.492431640625, -0.41748046875, -0.342529296875, -0.267578125, -0.192626953125, -0.11767578125, -0.042724609375, 0.0322265625, 0.107177734375, 0.18212890625, 0.257080078125, 0.33203125, 0.406982421875, 0.48193359375, 0.556884765625, 0.6318359375, 0.706787109375, 0.78173828125, 0.856689453125, 0.931640625, 1.006591796875, 1.08154296875, 1.156494140625, 1.2314453125, 1.306396484375, 1.38134765625, 1.456298828125, 1.53125, 1.606201171875, 1.68115234375, 1.756103515625, 1.8310546875, 1.906005859375, 1.98095703125, 2.055908203125, 2.130859375, 2.205810546875, 2.28076171875, 2.355712890625, 2.4306640625, 2.505615234375, 2.58056640625, 2.655517578125, 2.73046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 23.0, 22.0, 29.0, 37.0, 62.0, 58.0, 77.0, 63.0, 93.0, 76.0, 89.0, 77.0, 57.0, 51.0, 41.0, 22.0, 25.0, 19.0, 21.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7398681640625, -1.677001953125, -1.6141357421875, -1.55126953125, -1.4884033203125, -1.425537109375, -1.3626708984375, -1.2998046875, -1.2369384765625, -1.174072265625, -1.1112060546875, -1.04833984375, -0.9854736328125, -0.922607421875, -0.8597412109375, -0.796875, -0.7340087890625, -0.671142578125, -0.6082763671875, -0.54541015625, -0.4825439453125, -0.419677734375, -0.3568115234375, -0.2939453125, -0.2310791015625, -0.168212890625, -0.1053466796875, -0.04248046875, 0.0203857421875, 0.083251953125, 0.1461181640625, 0.208984375, 0.2718505859375, 0.334716796875, 0.3975830078125, 0.46044921875, 0.5233154296875, 0.586181640625, 0.6490478515625, 0.7119140625, 0.7747802734375, 0.837646484375, 0.9005126953125, 0.96337890625, 1.0262451171875, 1.089111328125, 1.1519775390625, 1.21484375, 1.2777099609375, 1.340576171875, 1.4034423828125, 1.46630859375, 1.5291748046875, 1.592041015625, 1.6549072265625, 1.7177734375, 1.7806396484375, 1.843505859375, 1.9063720703125, 1.96923828125, 2.0321044921875, 2.094970703125, 2.1578369140625, 2.220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 11.0, 8.0, 21.0, 39.0, 53.0, 104.0, 224.0, 580.0, 2558.0, 44667.0, 986779.0, 11330.0, 1345.0, 429.0, 201.0, 95.0, 37.0, 33.0, 9.0, 13.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3590087890625, -6.178955078125, -5.9989013671875, -5.81884765625, -5.6387939453125, -5.458740234375, -5.2786865234375, -5.0986328125, -4.9185791015625, -4.738525390625, -4.5584716796875, -4.37841796875, -4.1983642578125, -4.018310546875, -3.8382568359375, -3.658203125, -3.4781494140625, -3.298095703125, -3.1180419921875, -2.93798828125, -2.7579345703125, -2.577880859375, -2.3978271484375, -2.2177734375, -2.0377197265625, -1.857666015625, -1.6776123046875, -1.49755859375, -1.3175048828125, -1.137451171875, -0.9573974609375, -0.77734375, -0.5972900390625, -0.417236328125, -0.2371826171875, -0.05712890625, 0.1229248046875, 0.302978515625, 0.4830322265625, 0.6630859375, 0.8431396484375, 1.023193359375, 1.2032470703125, 1.38330078125, 1.5633544921875, 1.743408203125, 1.9234619140625, 2.103515625, 2.2835693359375, 2.463623046875, 2.6436767578125, 2.82373046875, 3.0037841796875, 3.183837890625, 3.3638916015625, 3.5439453125, 3.7239990234375, 3.904052734375, 4.0841064453125, 4.26416015625, 4.4442138671875, 4.624267578125, 4.8043212890625, 4.984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 11.0, 9.0, 14.0, 26.0, 41.0, 40.0, 87.0, 125.0, 192.0, 167.0, 104.0, 73.0, 45.0, 10.0, 10.0, 13.0, 10.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024008750915527344, -0.0002327561378479004, -0.00022542476654052734, -0.0002180933952331543, -0.00021076202392578125, -0.0002034306526184082, -0.00019609928131103516, -0.0001887679100036621, -0.00018143653869628906, -0.00017410516738891602, -0.00016677379608154297, -0.00015944242477416992, -0.00015211105346679688, -0.00014477968215942383, -0.00013744831085205078, -0.00013011693954467773, -0.0001227855682373047, -0.00011545419692993164, -0.0001081228256225586, -0.00010079145431518555, -9.34600830078125e-05, -8.612871170043945e-05, -7.87973403930664e-05, -7.146596908569336e-05, -6.413459777832031e-05, -5.6803226470947266e-05, -4.947185516357422e-05, -4.214048385620117e-05, -3.4809112548828125e-05, -2.7477741241455078e-05, -2.014636993408203e-05, -1.2814998626708984e-05, -5.4836273193359375e-06, 1.8477439880371094e-06, 9.179115295410156e-06, 1.6510486602783203e-05, 2.384185791015625e-05, 3.11732292175293e-05, 3.8504600524902344e-05, 4.583597183227539e-05, 5.316734313964844e-05, 6.0498714447021484e-05, 6.783008575439453e-05, 7.516145706176758e-05, 8.249282836914062e-05, 8.982419967651367e-05, 9.715557098388672e-05, 0.00010448694229125977, 0.00011181831359863281, 0.00011914968490600586, 0.0001264810562133789, 0.00013381242752075195, 0.000141143798828125, 0.00014847517013549805, 0.0001558065414428711, 0.00016313791275024414, 0.0001704692840576172, 0.00017780065536499023, 0.00018513202667236328, 0.00019246339797973633, 0.00019979476928710938, 0.00020712614059448242, 0.00021445751190185547, 0.00022178888320922852, 0.00022912025451660156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 12.0, 8.0, 6.0, 10.0, 22.0, 17.0, 39.0, 68.0, 126.0, 156.0, 322.0, 515.0, 1123.0, 2485.0, 6937.0, 27671.0, 400651.0, 559262.0, 35523.0, 8122.0, 2882.0, 1236.0, 565.0, 292.0, 173.0, 113.0, 63.0, 41.0, 34.0, 19.0, 10.0, 16.0, 7.0, 4.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8662109375, -1.811431884765625, -1.75665283203125, -1.701873779296875, -1.6470947265625, -1.592315673828125, -1.53753662109375, -1.482757568359375, -1.427978515625, -1.373199462890625, -1.31842041015625, -1.263641357421875, -1.2088623046875, -1.154083251953125, -1.09930419921875, -1.044525146484375, -0.98974609375, -0.934967041015625, -0.88018798828125, -0.825408935546875, -0.7706298828125, -0.715850830078125, -0.66107177734375, -0.606292724609375, -0.551513671875, -0.496734619140625, -0.44195556640625, -0.387176513671875, -0.3323974609375, -0.277618408203125, -0.22283935546875, -0.168060302734375, -0.11328125, -0.058502197265625, -0.00372314453125, 0.051055908203125, 0.1058349609375, 0.160614013671875, 0.21539306640625, 0.270172119140625, 0.324951171875, 0.379730224609375, 0.43450927734375, 0.489288330078125, 0.5440673828125, 0.598846435546875, 0.65362548828125, 0.708404541015625, 0.76318359375, 0.817962646484375, 0.87274169921875, 0.927520751953125, 0.9822998046875, 1.037078857421875, 1.09185791015625, 1.146636962890625, 1.201416015625, 1.256195068359375, 1.31097412109375, 1.365753173828125, 1.4205322265625, 1.475311279296875, 1.53009033203125, 1.584869384765625, 1.6396484375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 13.0, 17.0, 26.0, 68.0, 141.0, 223.0, 221.0, 126.0, 69.0, 41.0, 17.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3406219482421875, -1.297454833984375, -1.2542877197265625, -1.21112060546875, -1.1679534912109375, -1.124786376953125, -1.0816192626953125, -1.0384521484375, -0.9952850341796875, -0.952117919921875, -0.9089508056640625, -0.86578369140625, -0.8226165771484375, -0.779449462890625, -0.7362823486328125, -0.693115234375, -0.6499481201171875, -0.606781005859375, -0.5636138916015625, -0.52044677734375, -0.4772796630859375, -0.434112548828125, -0.3909454345703125, -0.3477783203125, -0.3046112060546875, -0.261444091796875, -0.2182769775390625, -0.17510986328125, -0.1319427490234375, -0.088775634765625, -0.0456085205078125, -0.00244140625, 0.0407257080078125, 0.083892822265625, 0.1270599365234375, 0.17022705078125, 0.2133941650390625, 0.256561279296875, 0.2997283935546875, 0.3428955078125, 0.3860626220703125, 0.429229736328125, 0.4723968505859375, 0.51556396484375, 0.5587310791015625, 0.601898193359375, 0.6450653076171875, 0.688232421875, 0.7313995361328125, 0.774566650390625, 0.8177337646484375, 0.86090087890625, 0.9040679931640625, 0.947235107421875, 0.9904022216796875, 1.0335693359375, 1.0767364501953125, 1.119903564453125, 1.1630706787109375, 1.20623779296875, 1.2494049072265625, 1.292572021484375, 1.3357391357421875, 1.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 17.0, 24.0, 37.0, 55.0, 140.0, 203.0, 212.0, 143.0, 73.0, 31.0, 23.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.99288558959961, -16.475082397460938, -15.95727825164795, -15.439474105834961, -14.921669960021973, -14.403865814208984, -13.886062622070312, -13.368258476257324, -12.850454330444336, -12.332650184631348, -11.814846992492676, -11.297042846679688, -10.7792387008667, -10.261434555053711, -9.743631362915039, -9.22582721710205, -8.708024024963379, -8.19021987915039, -7.6724162101745605, -7.1546125411987305, -6.636808395385742, -6.119004726409912, -5.601201057434082, -5.083396911621094, -4.565593242645264, -4.047789573669434, -3.5299854278564453, -3.0121817588806152, -2.494377851486206, -1.9765739440917969, -1.4587702751159668, -0.9409663677215576, -0.42316246032714844, 0.09464138746261597, 0.6124452352523804, 1.1302490234375, 1.6480529308319092, 2.1658568382263184, 2.6836605072021484, 3.2014644145965576, 3.719268321990967, 4.237071990966797, 4.754876136779785, 5.272679805755615, 5.790483474731445, 6.308287620544434, 6.826091289520264, 7.343894958496094, 7.861699104309082, 8.37950325012207, 8.897306442260742, 9.41511058807373, 9.932914733886719, 10.45071792602539, 10.968522071838379, 11.486326217651367, 12.004129409790039, 12.521933555603027, 13.0397367477417, 13.557540893554688, 14.075345039367676, 14.593149185180664, 15.110952377319336, 15.628756523132324, 16.146560668945312]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 9.0, 16.0, 23.0, 19.0, 32.0, 39.0, 42.0, 60.0, 52.0, 55.0, 76.0, 71.0, 86.0, 53.0, 51.0, 60.0, 37.0, 33.0, 37.0, 26.0, 25.0, 18.0, 12.0, 14.0, 11.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.542821884155273, -14.108731269836426, -13.674640655517578, -13.24055004119873, -12.806459426879883, -12.372369766235352, -11.938279151916504, -11.504188537597656, -11.070097923278809, -10.636007308959961, -10.201916694641113, -9.767826080322266, -9.333736419677734, -8.89964485168457, -8.465555191040039, -8.031464576721191, -7.597373962402344, -7.163283348083496, -6.729192733764648, -6.295102596282959, -5.861011981964111, -5.426921367645264, -4.992831230163574, -4.558740615844727, -4.124650001525879, -3.6905593872070312, -3.2564690113067627, -2.822378635406494, -2.3882880210876465, -1.9541974067687988, -1.5201070308685303, -1.0860166549682617, -0.6519260406494141, -0.21783554553985596, 0.21625494956970215, 0.6503454446792603, 1.0844359397888184, 1.518526554107666, 1.9526169300079346, 2.386707305908203, 2.820797920227051, 3.2548885345458984, 3.688978910446167, 4.1230692863464355, 4.557159900665283, 4.991250514984131, 5.42534065246582, 5.859431266784668, 6.293521881103516, 6.727612495422363, 7.161703109741211, 7.5957932472229, 8.029884338378906, 8.463973999023438, 8.898064613342285, 9.332155227661133, 9.76624584197998, 10.200336456298828, 10.634427070617676, 11.068517684936523, 11.502607345581055, 11.936698913574219, 12.37078857421875, 12.804879188537598, 13.238969802856445]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 5.0, 12.0, 5.0, 11.0, 7.0, 11.0, 18.0, 24.0, 24.0, 32.0, 42.0, 51.0, 71.0, 78.0, 104.0, 144.0, 195.0, 262.0, 361.0, 552.0, 838.0, 1502.0, 2551.0, 5224.0, 11179.0, 28399.0, 107046.0, 3193786.0, 723786.0, 75447.0, 22802.0, 9428.0, 4444.0, 2390.0, 1266.0, 739.0, 495.0, 299.0, 219.0, 135.0, 101.0, 56.0, 38.0, 35.0, 33.0, 8.0, 11.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.189453125, -3.107421875, -3.025390625, -2.943359375, -2.861328125, -2.779296875, -2.697265625, -2.615234375, -2.533203125, -2.451171875, -2.369140625, -2.287109375, -2.205078125, -2.123046875, -2.041015625, -1.958984375, -1.876953125, -1.794921875, -1.712890625, -1.630859375, -1.548828125, -1.466796875, -1.384765625, -1.302734375, -1.220703125, -1.138671875, -1.056640625, -0.974609375, -0.892578125, -0.810546875, -0.728515625, -0.646484375, -0.564453125, -0.482421875, -0.400390625, -0.318359375, -0.236328125, -0.154296875, -0.072265625, 0.009765625, 0.091796875, 0.173828125, 0.255859375, 0.337890625, 0.419921875, 0.501953125, 0.583984375, 0.666015625, 0.748046875, 0.830078125, 0.912109375, 0.994140625, 1.076171875, 1.158203125, 1.240234375, 1.322265625, 1.404296875, 1.486328125, 1.568359375, 1.650390625, 1.732421875, 1.814453125, 1.896484375, 1.978515625, 2.060546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 22.0, 33.0, 49.0, 60.0, 84.0, 69.0, 77.0, 100.0, 93.0, 61.0, 61.0, 66.0, 43.0, 42.0, 39.0, 15.0, 10.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.529296875, -0.5162696838378906, -0.5032424926757812, -0.4902153015136719, -0.4771881103515625, -0.4641609191894531, -0.45113372802734375, -0.4381065368652344, -0.425079345703125, -0.4120521545410156, -0.39902496337890625, -0.3859977722167969, -0.3729705810546875, -0.3599433898925781, -0.34691619873046875, -0.3338890075683594, -0.32086181640625, -0.3078346252441406, -0.29480743408203125, -0.2817802429199219, -0.2687530517578125, -0.2557258605957031, -0.24269866943359375, -0.22967147827148438, -0.216644287109375, -0.20361709594726562, -0.19058990478515625, -0.17756271362304688, -0.1645355224609375, -0.15150833129882812, -0.13848114013671875, -0.12545394897460938, -0.1124267578125, -0.09939956665039062, -0.08637237548828125, -0.07334518432617188, -0.0603179931640625, -0.047290802001953125, -0.03426361083984375, -0.021236419677734375, -0.008209228515625, 0.004817962646484375, 0.01784515380859375, 0.030872344970703125, 0.0438995361328125, 0.056926727294921875, 0.06995391845703125, 0.08298110961914062, 0.09600830078125, 0.10903549194335938, 0.12206268310546875, 0.13508987426757812, 0.1481170654296875, 0.16114425659179688, 0.17417144775390625, 0.18719863891601562, 0.200225830078125, 0.21325302124023438, 0.22628021240234375, 0.23930740356445312, 0.2523345947265625, 0.2653617858886719, 0.27838897705078125, 0.2914161682128906, 0.304443359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 10.0, 12.0, 14.0, 24.0, 46.0, 82.0, 128.0, 248.0, 518.0, 1246.0, 3289.0, 13288.0, 154921.0, 3921132.0, 83921.0, 10237.0, 2893.0, 1161.0, 490.0, 263.0, 131.0, 78.0, 58.0, 30.0, 15.0, 7.0, 2.0, 6.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.5, -4.36529541015625, -4.2305908203125, -4.09588623046875, -3.961181640625, -3.82647705078125, -3.6917724609375, -3.55706787109375, -3.42236328125, -3.28765869140625, -3.1529541015625, -3.01824951171875, -2.883544921875, -2.74884033203125, -2.6141357421875, -2.47943115234375, -2.3447265625, -2.21002197265625, -2.0753173828125, -1.94061279296875, -1.805908203125, -1.67120361328125, -1.5364990234375, -1.40179443359375, -1.26708984375, -1.13238525390625, -0.9976806640625, -0.86297607421875, -0.728271484375, -0.59356689453125, -0.4588623046875, -0.32415771484375, -0.189453125, -0.05474853515625, 0.0799560546875, 0.21466064453125, 0.349365234375, 0.48406982421875, 0.6187744140625, 0.75347900390625, 0.88818359375, 1.02288818359375, 1.1575927734375, 1.29229736328125, 1.427001953125, 1.56170654296875, 1.6964111328125, 1.83111572265625, 1.9658203125, 2.10052490234375, 2.2352294921875, 2.36993408203125, 2.504638671875, 2.63934326171875, 2.7740478515625, 2.90875244140625, 3.04345703125, 3.17816162109375, 3.3128662109375, 3.44757080078125, 3.582275390625, 3.71697998046875, 3.8516845703125, 3.98638916015625, 4.12109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 12.0, 16.0, 21.0, 39.0, 58.0, 100.0, 176.0, 469.0, 2117.0, 570.0, 194.0, 85.0, 67.0, 36.0, 39.0, 15.0, 7.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61572265625, -0.5925521850585938, -0.5693817138671875, -0.5462112426757812, -0.523040771484375, -0.49987030029296875, -0.4766998291015625, -0.45352935791015625, -0.43035888671875, -0.40718841552734375, -0.3840179443359375, -0.36084747314453125, -0.337677001953125, -0.31450653076171875, -0.2913360595703125, -0.26816558837890625, -0.2449951171875, -0.22182464599609375, -0.1986541748046875, -0.17548370361328125, -0.152313232421875, -0.12914276123046875, -0.1059722900390625, -0.08280181884765625, -0.05963134765625, -0.03646087646484375, -0.0132904052734375, 0.00988006591796875, 0.033050537109375, 0.05622100830078125, 0.0793914794921875, 0.10256195068359375, 0.125732421875, 0.14890289306640625, 0.1720733642578125, 0.19524383544921875, 0.218414306640625, 0.24158477783203125, 0.2647552490234375, 0.28792572021484375, 0.31109619140625, 0.33426666259765625, 0.3574371337890625, 0.38060760498046875, 0.403778076171875, 0.42694854736328125, 0.4501190185546875, 0.47328948974609375, 0.4964599609375, 0.5196304321289062, 0.5428009033203125, 0.5659713745117188, 0.589141845703125, 0.6123123168945312, 0.6354827880859375, 0.6586532592773438, 0.68182373046875, 0.7049942016601562, 0.7281646728515625, 0.7513351440429688, 0.774505615234375, 0.7976760864257812, 0.8208465576171875, 0.8440170288085938, 0.8671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 20.0, 33.0, 128.0, 256.0, 339.0, 139.0, 56.0, 17.0, 13.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.124211311340332, -9.889419555664062, -9.65462875366211, -9.41983699798584, -9.18504524230957, -8.950254440307617, -8.715462684631348, -8.480670928955078, -8.245880126953125, -8.011088371276855, -7.776297092437744, -7.541505813598633, -7.3067145347595215, -7.07192325592041, -6.837131500244141, -6.602340221405029, -6.36754846572876, -6.132757186889648, -5.897965431213379, -5.663174152374268, -5.428382873535156, -5.193591117858887, -4.958799839019775, -4.724008560180664, -4.4892168045043945, -4.254425525665283, -4.019633769989014, -3.7848424911499023, -3.550051212310791, -3.3152596950531006, -3.08046817779541, -2.845676898956299, -2.6108856201171875, -2.376094102859497, -2.1413028240203857, -1.9065113067626953, -1.6717199087142944, -1.4369285106658936, -1.2021369934082031, -0.9673455953598022, -0.7325541973114014, -0.4977627694606781, -0.26297134160995483, -0.02817988395690918, 0.2066115140914917, 0.4414029121398926, 0.676194429397583, 0.9109858274459839, 1.1457772254943848, 1.3805686235427856, 1.6153600215911865, 1.850151538848877, 2.0849428176879883, 2.3197343349456787, 2.554525852203369, 2.7893171310424805, 3.024108648300171, 3.2589001655578613, 3.4936914443969727, 3.728482961654663, 3.9632744789123535, 4.198065757751465, 4.432857513427734, 4.667648792266846, 4.902440071105957]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 16.0, 20.0, 18.0, 31.0, 45.0, 52.0, 54.0, 44.0, 60.0, 70.0, 65.0, 60.0, 63.0, 54.0, 56.0, 58.0, 43.0, 35.0, 27.0, 24.0, 20.0, 20.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1959757804870605, -2.1162328720092773, -2.036489963531494, -1.9567471742630005, -1.8770042657852173, -1.797261357307434, -1.7175185680389404, -1.6377756595611572, -1.558032751083374, -1.4782898426055908, -1.3985469341278076, -1.318804144859314, -1.2390612363815308, -1.1593183279037476, -1.079575538635254, -0.9998326301574707, -0.9200897216796875, -0.8403468132019043, -0.7606039643287659, -0.6808611154556274, -0.6011182069778442, -0.521375298500061, -0.4416324496269226, -0.3618896007537842, -0.282146692276001, -0.20240381360054016, -0.12266093492507935, -0.04291805624961853, 0.036824822425842285, 0.1165677011013031, 0.19631057977676392, 0.27605342864990234, 0.35579633712768555, 0.43553921580314636, 0.5152820944786072, 0.5950249433517456, 0.6747678518295288, 0.754510760307312, 0.8342536091804504, 0.9139964580535889, 0.9937393665313721, 1.0734822750091553, 1.1532251834869385, 1.2329679727554321, 1.3127108812332153, 1.3924537897109985, 1.4721965789794922, 1.5519394874572754, 1.6316823959350586, 1.7114253044128418, 1.791168212890625, 1.8709110021591187, 1.9506539106369019, 2.0303966999053955, 2.1101396083831787, 2.189882516860962, 2.269625425338745, 2.3493683338165283, 2.4291112422943115, 2.5088541507720947, 2.588596820831299, 2.668339729309082, 2.7480826377868652, 2.8278255462646484, 2.9075684547424316]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 10.0, 10.0, 17.0, 20.0, 27.0, 38.0, 55.0, 87.0, 115.0, 214.0, 306.0, 467.0, 879.0, 1536.0, 2904.0, 6466.0, 17007.0, 56175.0, 246303.0, 509209.0, 147731.0, 36676.0, 12047.0, 4826.0, 2328.0, 1165.0, 729.0, 424.0, 259.0, 157.0, 114.0, 64.0, 52.0, 41.0, 31.0, 23.0, 9.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.5, -2.434783935546875, -2.36956787109375, -2.304351806640625, -2.2391357421875, -2.173919677734375, -2.10870361328125, -2.043487548828125, -1.978271484375, -1.913055419921875, -1.84783935546875, -1.782623291015625, -1.7174072265625, -1.652191162109375, -1.58697509765625, -1.521759033203125, -1.45654296875, -1.391326904296875, -1.32611083984375, -1.260894775390625, -1.1956787109375, -1.130462646484375, -1.06524658203125, -1.000030517578125, -0.934814453125, -0.869598388671875, -0.80438232421875, -0.739166259765625, -0.6739501953125, -0.608734130859375, -0.54351806640625, -0.478302001953125, -0.4130859375, -0.347869873046875, -0.28265380859375, -0.217437744140625, -0.1522216796875, -0.087005615234375, -0.02178955078125, 0.043426513671875, 0.108642578125, 0.173858642578125, 0.23907470703125, 0.304290771484375, 0.3695068359375, 0.434722900390625, 0.49993896484375, 0.565155029296875, 0.63037109375, 0.695587158203125, 0.76080322265625, 0.826019287109375, 0.8912353515625, 0.956451416015625, 1.02166748046875, 1.086883544921875, 1.152099609375, 1.217315673828125, 1.28253173828125, 1.347747802734375, 1.4129638671875, 1.478179931640625, 1.54339599609375, 1.608612060546875, 1.673828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 14.0, 16.0, 20.0, 36.0, 61.0, 74.0, 88.0, 96.0, 94.0, 107.0, 77.0, 77.0, 65.0, 41.0, 37.0, 21.0, 23.0, 13.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5732498168945312, -0.5581207275390625, -0.5429916381835938, -0.527862548828125, -0.5127334594726562, -0.4976043701171875, -0.48247528076171875, -0.46734619140625, -0.45221710205078125, -0.4370880126953125, -0.42195892333984375, -0.406829833984375, -0.39170074462890625, -0.3765716552734375, -0.36144256591796875, -0.3463134765625, -0.33118438720703125, -0.3160552978515625, -0.30092620849609375, -0.285797119140625, -0.27066802978515625, -0.2555389404296875, -0.24040985107421875, -0.22528076171875, -0.21015167236328125, -0.1950225830078125, -0.17989349365234375, -0.164764404296875, -0.14963531494140625, -0.1345062255859375, -0.11937713623046875, -0.104248046875, -0.08911895751953125, -0.0739898681640625, -0.05886077880859375, -0.043731689453125, -0.02860260009765625, -0.0134735107421875, 0.00165557861328125, 0.01678466796875, 0.03191375732421875, 0.0470428466796875, 0.06217193603515625, 0.077301025390625, 0.09243011474609375, 0.1075592041015625, 0.12268829345703125, 0.1378173828125, 0.15294647216796875, 0.1680755615234375, 0.18320465087890625, 0.198333740234375, 0.21346282958984375, 0.2285919189453125, 0.24372100830078125, 0.25885009765625, 0.27397918701171875, 0.2891082763671875, 0.30423736572265625, 0.319366455078125, 0.33449554443359375, 0.3496246337890625, 0.36475372314453125, 0.3798828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 8.0, 19.0, 12.0, 33.0, 34.0, 40.0, 70.0, 94.0, 118.0, 207.0, 299.0, 620.0, 1082.0, 2035.0, 3976.0, 8658.0, 22841.0, 76346.0, 338952.0, 438871.0, 104457.0, 29264.0, 10598.0, 4633.0, 2320.0, 1199.0, 672.0, 405.0, 238.0, 137.0, 79.0, 67.0, 36.0, 30.0, 25.0, 27.0, 15.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5682373046875, -1.512451171875, -1.4566650390625, -1.40087890625, -1.3450927734375, -1.289306640625, -1.2335205078125, -1.177734375, -1.1219482421875, -1.066162109375, -1.0103759765625, -0.95458984375, -0.8988037109375, -0.843017578125, -0.7872314453125, -0.7314453125, -0.6756591796875, -0.619873046875, -0.5640869140625, -0.50830078125, -0.4525146484375, -0.396728515625, -0.3409423828125, -0.28515625, -0.2293701171875, -0.173583984375, -0.1177978515625, -0.06201171875, -0.0062255859375, 0.049560546875, 0.1053466796875, 0.1611328125, 0.2169189453125, 0.272705078125, 0.3284912109375, 0.38427734375, 0.4400634765625, 0.495849609375, 0.5516357421875, 0.607421875, 0.6632080078125, 0.718994140625, 0.7747802734375, 0.83056640625, 0.8863525390625, 0.942138671875, 0.9979248046875, 1.0537109375, 1.1094970703125, 1.165283203125, 1.2210693359375, 1.27685546875, 1.3326416015625, 1.388427734375, 1.4442138671875, 1.5, 1.5557861328125, 1.611572265625, 1.6673583984375, 1.72314453125, 1.7789306640625, 1.834716796875, 1.8905029296875, 1.9462890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 6.0, 7.0, 14.0, 13.0, 19.0, 27.0, 38.0, 38.0, 47.0, 56.0, 76.0, 74.0, 79.0, 72.0, 73.0, 65.0, 58.0, 45.0, 31.0, 27.0, 27.0, 22.0, 20.0, 7.0, 7.0, 5.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.716552734375, -1.65576171875, -1.594970703125, -1.5341796875, -1.473388671875, -1.41259765625, -1.351806640625, -1.291015625, -1.230224609375, -1.16943359375, -1.108642578125, -1.0478515625, -0.987060546875, -0.92626953125, -0.865478515625, -0.8046875, -0.743896484375, -0.68310546875, -0.622314453125, -0.5615234375, -0.500732421875, -0.43994140625, -0.379150390625, -0.318359375, -0.257568359375, -0.19677734375, -0.135986328125, -0.0751953125, -0.014404296875, 0.04638671875, 0.107177734375, 0.16796875, 0.228759765625, 0.28955078125, 0.350341796875, 0.4111328125, 0.471923828125, 0.53271484375, 0.593505859375, 0.654296875, 0.715087890625, 0.77587890625, 0.836669921875, 0.8974609375, 0.958251953125, 1.01904296875, 1.079833984375, 1.140625, 1.201416015625, 1.26220703125, 1.322998046875, 1.3837890625, 1.444580078125, 1.50537109375, 1.566162109375, 1.626953125, 1.687744140625, 1.74853515625, 1.809326171875, 1.8701171875, 1.930908203125, 1.99169921875, 2.052490234375, 2.11328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 13.0, 15.0, 21.0, 35.0, 68.0, 80.0, 172.0, 473.0, 1233.0, 4781.0, 30394.0, 711924.0, 279068.0, 15705.0, 2961.0, 887.0, 322.0, 145.0, 82.0, 44.0, 32.0, 18.0, 13.0, 15.0, 12.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2954559326171875, -1.252044677734375, -1.2086334228515625, -1.16522216796875, -1.1218109130859375, -1.078399658203125, -1.0349884033203125, -0.9915771484375, -0.9481658935546875, -0.904754638671875, -0.8613433837890625, -0.81793212890625, -0.7745208740234375, -0.731109619140625, -0.6876983642578125, -0.644287109375, -0.6008758544921875, -0.557464599609375, -0.5140533447265625, -0.47064208984375, -0.4272308349609375, -0.383819580078125, -0.3404083251953125, -0.2969970703125, -0.2535858154296875, -0.210174560546875, -0.1667633056640625, -0.12335205078125, -0.0799407958984375, -0.036529541015625, 0.0068817138671875, 0.05029296875, 0.0937042236328125, 0.137115478515625, 0.1805267333984375, 0.22393798828125, 0.2673492431640625, 0.310760498046875, 0.3541717529296875, 0.3975830078125, 0.4409942626953125, 0.484405517578125, 0.5278167724609375, 0.57122802734375, 0.6146392822265625, 0.658050537109375, 0.7014617919921875, 0.744873046875, 0.7882843017578125, 0.831695556640625, 0.8751068115234375, 0.91851806640625, 0.9619293212890625, 1.005340576171875, 1.0487518310546875, 1.0921630859375, 1.1355743408203125, 1.178985595703125, 1.2223968505859375, 1.26580810546875, 1.3092193603515625, 1.352630615234375, 1.3960418701171875, 1.439453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 16.0, 14.0, 12.0, 21.0, 23.0, 30.0, 44.0, 59.0, 59.0, 88.0, 99.0, 110.0, 63.0, 68.0, 66.0, 50.0, 33.0, 25.0, 23.0, 17.0, 6.0, 2.0, 10.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.77799466252327e-05, -8.484162390232086e-05, -8.190330117940903e-05, -7.896497845649719e-05, -7.602665573358536e-05, -7.308833301067352e-05, -7.015001028776169e-05, -6.721168756484985e-05, -6.427336484193802e-05, -6.133504211902618e-05, -5.839671939611435e-05, -5.5458396673202515e-05, -5.252007395029068e-05, -4.9581751227378845e-05, -4.664342850446701e-05, -4.3705105781555176e-05, -4.076678305864334e-05, -3.7828460335731506e-05, -3.489013761281967e-05, -3.195181488990784e-05, -2.9013492166996002e-05, -2.6075169444084167e-05, -2.3136846721172333e-05, -2.0198523998260498e-05, -1.7260201275348663e-05, -1.4321878552436829e-05, -1.1383555829524994e-05, -8.44523310661316e-06, -5.5069103837013245e-06, -2.5685876607894897e-06, 3.6973506212234497e-07, 3.3080577850341797e-06, 6.246380507946014e-06, 9.184703230857849e-06, 1.2123025953769684e-05, 1.5061348676681519e-05, 1.7999671399593353e-05, 2.0937994122505188e-05, 2.3876316845417023e-05, 2.6814639568328857e-05, 2.9752962291240692e-05, 3.269128501415253e-05, 3.562960773706436e-05, 3.8567930459976196e-05, 4.150625318288803e-05, 4.4444575905799866e-05, 4.73828986287117e-05, 5.0321221351623535e-05, 5.325954407453537e-05, 5.6197866797447205e-05, 5.913618952035904e-05, 6.207451224327087e-05, 6.501283496618271e-05, 6.795115768909454e-05, 7.088948041200638e-05, 7.382780313491821e-05, 7.676612585783005e-05, 7.970444858074188e-05, 8.264277130365372e-05, 8.558109402656555e-05, 8.851941674947739e-05, 9.145773947238922e-05, 9.439606219530106e-05, 9.733438491821289e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 10.0, 13.0, 21.0, 35.0, 58.0, 83.0, 83.0, 151.0, 258.0, 388.0, 696.0, 1455.0, 2926.0, 7007.0, 19449.0, 80842.0, 544797.0, 321897.0, 44996.0, 13219.0, 5166.0, 2303.0, 1093.0, 563.0, 345.0, 224.0, 139.0, 99.0, 58.0, 46.0, 34.0, 28.0, 24.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.8017578125, -0.7805633544921875, -0.759368896484375, -0.7381744384765625, -0.71697998046875, -0.6957855224609375, -0.674591064453125, -0.6533966064453125, -0.6322021484375, -0.6110076904296875, -0.589813232421875, -0.5686187744140625, -0.54742431640625, -0.5262298583984375, -0.505035400390625, -0.4838409423828125, -0.462646484375, -0.4414520263671875, -0.420257568359375, -0.3990631103515625, -0.37786865234375, -0.3566741943359375, -0.335479736328125, -0.3142852783203125, -0.2930908203125, -0.2718963623046875, -0.250701904296875, -0.2295074462890625, -0.20831298828125, -0.1871185302734375, -0.165924072265625, -0.1447296142578125, -0.12353515625, -0.1023406982421875, -0.081146240234375, -0.0599517822265625, -0.03875732421875, -0.0175628662109375, 0.003631591796875, 0.0248260498046875, 0.0460205078125, 0.0672149658203125, 0.088409423828125, 0.1096038818359375, 0.13079833984375, 0.1519927978515625, 0.173187255859375, 0.1943817138671875, 0.215576171875, 0.2367706298828125, 0.257965087890625, 0.2791595458984375, 0.30035400390625, 0.3215484619140625, 0.342742919921875, 0.3639373779296875, 0.3851318359375, 0.4063262939453125, 0.427520751953125, 0.4487152099609375, 0.46990966796875, 0.4911041259765625, 0.512298583984375, 0.5334930419921875, 0.5546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 16.0, 23.0, 50.0, 74.0, 117.0, 161.0, 145.0, 137.0, 82.0, 63.0, 42.0, 16.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.841064453125, -0.81787109375, -0.794677734375, -0.771484375, -0.748291015625, -0.72509765625, -0.701904296875, -0.6787109375, -0.655517578125, -0.63232421875, -0.609130859375, -0.5859375, -0.562744140625, -0.53955078125, -0.516357421875, -0.4931640625, -0.469970703125, -0.44677734375, -0.423583984375, -0.400390625, -0.377197265625, -0.35400390625, -0.330810546875, -0.3076171875, -0.284423828125, -0.26123046875, -0.238037109375, -0.21484375, -0.191650390625, -0.16845703125, -0.145263671875, -0.1220703125, -0.098876953125, -0.07568359375, -0.052490234375, -0.029296875, -0.006103515625, 0.01708984375, 0.040283203125, 0.0634765625, 0.086669921875, 0.10986328125, 0.133056640625, 0.15625, 0.179443359375, 0.20263671875, 0.225830078125, 0.2490234375, 0.272216796875, 0.29541015625, 0.318603515625, 0.341796875, 0.364990234375, 0.38818359375, 0.411376953125, 0.4345703125, 0.457763671875, 0.48095703125, 0.504150390625, 0.52734375, 0.550537109375, 0.57373046875, 0.596923828125, 0.6201171875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 18.0, 78.0, 240.0, 442.0, 147.0, 51.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.11605453491211, -11.13099193572998, -10.145928382873535, -9.160865783691406, -8.175802230834961, -7.190739631652832, -6.205677032470703, -5.220613956451416, -4.235550880432129, -3.250487804412842, -2.265424966812134, -1.2803621292114258, -0.29529905319213867, 0.6897640228271484, 1.6748266220092773, 2.6598896980285645, 3.6449527740478516, 4.630015850067139, 5.615078926086426, 6.600141525268555, 7.585204601287842, 8.570267677307129, 9.555330276489258, 10.540393829345703, 11.525456428527832, 12.510519027709961, 13.495582580566406, 14.480645179748535, 15.465707778930664, 16.45077133178711, 17.435832977294922, 18.420896530151367, 19.405960083007812, 20.391023635864258, 21.37608528137207, 22.361148834228516, 23.34621238708496, 24.331275939941406, 25.31633758544922, 26.301401138305664, 27.28646469116211, 28.271528244018555, 29.256589889526367, 30.241653442382812, 31.226716995239258, 32.2117805480957, 33.196842193603516, 34.18190383911133, 35.166969299316406, 36.15203094482422, 37.1370964050293, 38.12215805053711, 39.10721969604492, 40.09228515625, 41.07734680175781, 42.062408447265625, 43.04747009277344, 44.03253173828125, 45.01759719848633, 46.00265884399414, 46.98772048950195, 47.97278594970703, 48.957847595214844, 49.942909240722656, 50.927974700927734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 19.0, 21.0, 32.0, 50.0, 61.0, 60.0, 80.0, 81.0, 89.0, 92.0, 76.0, 69.0, 60.0, 49.0, 38.0, 41.0, 23.0, 17.0, 9.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.135910034179688, -11.665919303894043, -11.195928573608398, -10.725937843322754, -10.25594711303711, -9.785955429077148, -9.315964698791504, -8.84597396850586, -8.375983238220215, -7.90599250793457, -7.436001777648926, -6.966010570526123, -6.4960198402404785, -6.026029109954834, -5.556037902832031, -5.086047172546387, -4.616056442260742, -4.146065711975098, -3.676074743270874, -3.2060837745666504, -2.736093044281006, -2.2661023139953613, -1.7961113452911377, -1.326120376586914, -0.8561296463012695, -0.38613879680633545, 0.08385205268859863, 0.5538429021835327, 1.0238337516784668, 1.4938244819641113, 1.963815450668335, 2.4338064193725586, 2.903797149658203, 3.3737878799438477, 3.8437788486480713, 4.313769817352295, 4.7837605476379395, 5.253751277923584, 5.723742485046387, 6.193733215332031, 6.663723945617676, 7.13371467590332, 7.603705406188965, 8.07369613647461, 8.54368782043457, 9.013677597045898, 9.48366928100586, 9.953660011291504, 10.423650741577148, 10.893641471862793, 11.363632202148438, 11.833622932434082, 12.303613662719727, 12.773605346679688, 13.243596076965332, 13.713586807250977, 14.183577537536621, 14.653568267822266, 15.12355899810791, 15.593549728393555, 16.063541412353516, 16.533531188964844, 17.003522872924805, 17.473514556884766, 17.943504333496094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 9.0, 11.0, 15.0, 14.0, 29.0, 22.0, 31.0, 23.0, 56.0, 70.0, 81.0, 124.0, 197.0, 265.0, 403.0, 658.0, 1189.0, 2189.0, 4750.0, 11641.0, 38283.0, 265997.0, 3679933.0, 142909.0, 27409.0, 9295.0, 3829.0, 1894.0, 1046.0, 623.0, 372.0, 255.0, 159.0, 140.0, 92.0, 78.0, 51.0, 40.0, 25.0, 23.0, 11.0, 4.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.19140625, -2.13116455078125, -2.0709228515625, -2.01068115234375, -1.950439453125, -1.89019775390625, -1.8299560546875, -1.76971435546875, -1.70947265625, -1.64923095703125, -1.5889892578125, -1.52874755859375, -1.468505859375, -1.40826416015625, -1.3480224609375, -1.28778076171875, -1.2275390625, -1.16729736328125, -1.1070556640625, -1.04681396484375, -0.986572265625, -0.92633056640625, -0.8660888671875, -0.80584716796875, -0.74560546875, -0.68536376953125, -0.6251220703125, -0.56488037109375, -0.504638671875, -0.44439697265625, -0.3841552734375, -0.32391357421875, -0.263671875, -0.20343017578125, -0.1431884765625, -0.08294677734375, -0.022705078125, 0.03753662109375, 0.0977783203125, 0.15802001953125, 0.21826171875, 0.27850341796875, 0.3387451171875, 0.39898681640625, 0.459228515625, 0.51947021484375, 0.5797119140625, 0.63995361328125, 0.7001953125, 0.76043701171875, 0.8206787109375, 0.88092041015625, 0.941162109375, 1.00140380859375, 1.0616455078125, 1.12188720703125, 1.18212890625, 1.24237060546875, 1.3026123046875, 1.36285400390625, 1.423095703125, 1.48333740234375, 1.5435791015625, 1.60382080078125, 1.6640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 4.0, 15.0, 15.0, 18.0, 25.0, 45.0, 39.0, 56.0, 78.0, 74.0, 100.0, 81.0, 79.0, 68.0, 63.0, 57.0, 46.0, 33.0, 22.0, 19.0, 14.0, 9.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4619140625, -0.449188232421875, -0.43646240234375, -0.423736572265625, -0.4110107421875, -0.398284912109375, -0.38555908203125, -0.372833251953125, -0.360107421875, -0.347381591796875, -0.33465576171875, -0.321929931640625, -0.3092041015625, -0.296478271484375, -0.28375244140625, -0.271026611328125, -0.25830078125, -0.245574951171875, -0.23284912109375, -0.220123291015625, -0.2073974609375, -0.194671630859375, -0.18194580078125, -0.169219970703125, -0.156494140625, -0.143768310546875, -0.13104248046875, -0.118316650390625, -0.1055908203125, -0.092864990234375, -0.08013916015625, -0.067413330078125, -0.0546875, -0.041961669921875, -0.02923583984375, -0.016510009765625, -0.0037841796875, 0.008941650390625, 0.02166748046875, 0.034393310546875, 0.047119140625, 0.059844970703125, 0.07257080078125, 0.085296630859375, 0.0980224609375, 0.110748291015625, 0.12347412109375, 0.136199951171875, 0.14892578125, 0.161651611328125, 0.17437744140625, 0.187103271484375, 0.1998291015625, 0.212554931640625, 0.22528076171875, 0.238006591796875, 0.250732421875, 0.263458251953125, 0.27618408203125, 0.288909912109375, 0.3016357421875, 0.314361572265625, 0.32708740234375, 0.339813232421875, 0.3525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 6.0, 33.0, 46.0, 64.0, 94.0, 168.0, 303.0, 606.0, 1537.0, 5002.0, 27148.0, 816624.0, 3294427.0, 38437.0, 6125.0, 1997.0, 788.0, 385.0, 211.0, 95.0, 58.0, 39.0, 22.0, 15.0, 8.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.26531982421875, -2.1712646484375, -2.07720947265625, -1.983154296875, -1.88909912109375, -1.7950439453125, -1.70098876953125, -1.60693359375, -1.51287841796875, -1.4188232421875, -1.32476806640625, -1.230712890625, -1.13665771484375, -1.0426025390625, -0.94854736328125, -0.8544921875, -0.76043701171875, -0.6663818359375, -0.57232666015625, -0.478271484375, -0.38421630859375, -0.2901611328125, -0.19610595703125, -0.10205078125, -0.00799560546875, 0.0860595703125, 0.18011474609375, 0.274169921875, 0.36822509765625, 0.4622802734375, 0.55633544921875, 0.650390625, 0.74444580078125, 0.8385009765625, 0.93255615234375, 1.026611328125, 1.12066650390625, 1.2147216796875, 1.30877685546875, 1.40283203125, 1.49688720703125, 1.5909423828125, 1.68499755859375, 1.779052734375, 1.87310791015625, 1.9671630859375, 2.06121826171875, 2.1552734375, 2.24932861328125, 2.3433837890625, 2.43743896484375, 2.531494140625, 2.62554931640625, 2.7196044921875, 2.81365966796875, 2.90771484375, 3.00177001953125, 3.0958251953125, 3.18988037109375, 3.283935546875, 3.37799072265625, 3.4720458984375, 3.56610107421875, 3.66015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 15.0, 30.0, 34.0, 44.0, 82.0, 164.0, 429.0, 2022.0, 739.0, 238.0, 95.0, 63.0, 28.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.68994140625, -0.670623779296875, -0.65130615234375, -0.631988525390625, -0.6126708984375, -0.593353271484375, -0.57403564453125, -0.554718017578125, -0.535400390625, -0.516082763671875, -0.49676513671875, -0.477447509765625, -0.4581298828125, -0.438812255859375, -0.41949462890625, -0.400177001953125, -0.380859375, -0.361541748046875, -0.34222412109375, -0.322906494140625, -0.3035888671875, -0.284271240234375, -0.26495361328125, -0.245635986328125, -0.226318359375, -0.207000732421875, -0.18768310546875, -0.168365478515625, -0.1490478515625, -0.129730224609375, -0.11041259765625, -0.091094970703125, -0.07177734375, -0.052459716796875, -0.03314208984375, -0.013824462890625, 0.0054931640625, 0.024810791015625, 0.04412841796875, 0.063446044921875, 0.082763671875, 0.102081298828125, 0.12139892578125, 0.140716552734375, 0.1600341796875, 0.179351806640625, 0.19866943359375, 0.217987060546875, 0.2373046875, 0.256622314453125, 0.27593994140625, 0.295257568359375, 0.3145751953125, 0.333892822265625, 0.35321044921875, 0.372528076171875, 0.391845703125, 0.411163330078125, 0.43048095703125, 0.449798583984375, 0.4691162109375, 0.488433837890625, 0.50775146484375, 0.527069091796875, 0.54638671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 23.0, 35.0, 47.0, 86.0, 145.0, 187.0, 174.0, 119.0, 68.0, 49.0, 20.0, 23.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1480159759521484, -3.045922040939331, -2.9438281059265137, -2.8417341709136963, -2.739640235900879, -2.6375465393066406, -2.5354526042938232, -2.433358669281006, -2.3312647342681885, -2.229170799255371, -2.1270768642425537, -2.0249829292297363, -1.9228891134262085, -1.8207951784133911, -1.7187013626098633, -1.616607427597046, -1.5145134925842285, -1.4124195575714111, -1.3103256225585938, -1.208231806755066, -1.1061378717422485, -1.0040439367294312, -0.9019500613212585, -0.7998561859130859, -0.6977622509002686, -0.5956683158874512, -0.49357444047927856, -0.39148053526878357, -0.2893866300582886, -0.1872926950454712, -0.08519881963729858, 0.016895055770874023, 0.1189889907836914, 0.2210828959941864, 0.3231768012046814, 0.4252707064151764, 0.5273646116256714, 0.6294585466384888, 0.7315524220466614, 0.833646297454834, 0.9357402324676514, 1.0378341674804688, 1.1399281024932861, 1.242021918296814, 1.3441158533096313, 1.4462097883224487, 1.5483036041259766, 1.650397539138794, 1.7524914741516113, 1.8545854091644287, 1.956679344177246, 2.0587732791900635, 2.160867214202881, 2.262960910797119, 2.3650548458099365, 2.467148780822754, 2.5692427158355713, 2.6713366508483887, 2.773430585861206, 2.8755245208740234, 2.9776182174682617, 3.079712390899658, 3.1818060874938965, 3.283900022506714, 3.3859939575195312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 9.0, 17.0, 17.0, 30.0, 39.0, 28.0, 39.0, 36.0, 47.0, 41.0, 40.0, 46.0, 68.0, 56.0, 51.0, 46.0, 49.0, 44.0, 35.0, 34.0, 35.0, 30.0, 18.0, 24.0, 18.0, 13.0, 15.0, 10.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5459598302841187, -1.4918259382247925, -1.4376921653747559, -1.3835582733154297, -1.3294243812561035, -1.275290608406067, -1.2211567163467407, -1.167022943496704, -1.112889051437378, -1.0587551593780518, -1.0046213865280151, -0.950487494468689, -0.8963536620140076, -0.8422198295593262, -0.7880859375, -0.7339521050453186, -0.6798182725906372, -0.6256844401359558, -0.5715506076812744, -0.5174167156219482, -0.46328288316726685, -0.40914905071258545, -0.35501518845558167, -0.3008813261985779, -0.24674749374389648, -0.1926136463880539, -0.1384797990322113, -0.08434595167636871, -0.030212104320526123, 0.023921728134155273, 0.07805559039115906, 0.13218945264816284, 0.1863234043121338, 0.24045725166797638, 0.29459109902381897, 0.34872496128082275, 0.40285879373550415, 0.45699262619018555, 0.5111265182495117, 0.5652603507041931, 0.6193941831588745, 0.6735280156135559, 0.7276618480682373, 0.7817957401275635, 0.8359295725822449, 0.8900634050369263, 0.9441972970962524, 0.9983311295509338, 1.0524649620056152, 1.1065988540649414, 1.160732626914978, 1.2148665189743042, 1.2690002918243408, 1.323134183883667, 1.3772680759429932, 1.4314019680023193, 1.485535740852356, 1.5396696329116821, 1.5938034057617188, 1.647937297821045, 1.702071189880371, 1.7562049627304077, 1.8103388547897339, 1.8644726276397705, 1.9186065196990967]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 11.0, 22.0, 30.0, 42.0, 56.0, 64.0, 132.0, 184.0, 291.0, 473.0, 867.0, 1504.0, 2831.0, 6262.0, 17450.0, 69233.0, 334411.0, 463733.0, 110032.0, 25040.0, 8135.0, 3417.0, 1749.0, 976.0, 568.0, 375.0, 219.0, 160.0, 102.0, 57.0, 42.0, 19.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.8974609375, -1.8345184326171875, -1.771575927734375, -1.7086334228515625, -1.64569091796875, -1.5827484130859375, -1.519805908203125, -1.4568634033203125, -1.3939208984375, -1.3309783935546875, -1.268035888671875, -1.2050933837890625, -1.14215087890625, -1.0792083740234375, -1.016265869140625, -0.9533233642578125, -0.890380859375, -0.8274383544921875, -0.764495849609375, -0.7015533447265625, -0.63861083984375, -0.5756683349609375, -0.512725830078125, -0.4497833251953125, -0.3868408203125, -0.3238983154296875, -0.260955810546875, -0.1980133056640625, -0.13507080078125, -0.0721282958984375, -0.009185791015625, 0.0537567138671875, 0.11669921875, 0.1796417236328125, 0.242584228515625, 0.3055267333984375, 0.36846923828125, 0.4314117431640625, 0.494354248046875, 0.5572967529296875, 0.6202392578125, 0.6831817626953125, 0.746124267578125, 0.8090667724609375, 0.87200927734375, 0.9349517822265625, 0.997894287109375, 1.0608367919921875, 1.123779296875, 1.1867218017578125, 1.249664306640625, 1.3126068115234375, 1.37554931640625, 1.4384918212890625, 1.501434326171875, 1.5643768310546875, 1.6273193359375, 1.6902618408203125, 1.753204345703125, 1.8161468505859375, 1.87908935546875, 1.9420318603515625, 2.004974365234375, 2.0679168701171875, 2.130859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 13.0, 9.0, 29.0, 27.0, 50.0, 52.0, 71.0, 92.0, 80.0, 91.0, 88.0, 86.0, 65.0, 59.0, 45.0, 38.0, 32.0, 16.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.497314453125, -0.4833412170410156, -0.46936798095703125, -0.4553947448730469, -0.4414215087890625, -0.4274482727050781, -0.41347503662109375, -0.3995018005371094, -0.385528564453125, -0.3715553283691406, -0.35758209228515625, -0.3436088562011719, -0.3296356201171875, -0.3156623840332031, -0.30168914794921875, -0.2877159118652344, -0.27374267578125, -0.2597694396972656, -0.24579620361328125, -0.23182296752929688, -0.2178497314453125, -0.20387649536132812, -0.18990325927734375, -0.17593002319335938, -0.161956787109375, -0.14798355102539062, -0.13401031494140625, -0.12003707885742188, -0.1060638427734375, -0.09209060668945312, -0.07811737060546875, -0.06414413452148438, -0.0501708984375, -0.036197662353515625, -0.02222442626953125, -0.008251190185546875, 0.0057220458984375, 0.019695281982421875, 0.03366851806640625, 0.047641754150390625, 0.061614990234375, 0.07558822631835938, 0.08956146240234375, 0.10353469848632812, 0.1175079345703125, 0.13148117065429688, 0.14545440673828125, 0.15942764282226562, 0.17340087890625, 0.18737411499023438, 0.20134735107421875, 0.21532058715820312, 0.2292938232421875, 0.24326705932617188, 0.25724029541015625, 0.2712135314941406, 0.285186767578125, 0.2991600036621094, 0.31313323974609375, 0.3271064758300781, 0.3410797119140625, 0.3550529479980469, 0.36902618408203125, 0.3829994201660156, 0.39697265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 10.0, 25.0, 32.0, 50.0, 55.0, 89.0, 128.0, 179.0, 319.0, 598.0, 1185.0, 2516.0, 6352.0, 19212.0, 75328.0, 366338.0, 442402.0, 96914.0, 23372.0, 7519.0, 2929.0, 1292.0, 631.0, 386.0, 243.0, 157.0, 97.0, 55.0, 30.0, 21.0, 26.0, 20.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6945037841796875, -1.639984130859375, -1.5854644775390625, -1.53094482421875, -1.4764251708984375, -1.421905517578125, -1.3673858642578125, -1.3128662109375, -1.2583465576171875, -1.203826904296875, -1.1493072509765625, -1.09478759765625, -1.0402679443359375, -0.985748291015625, -0.9312286376953125, -0.876708984375, -0.8221893310546875, -0.767669677734375, -0.7131500244140625, -0.65863037109375, -0.6041107177734375, -0.549591064453125, -0.4950714111328125, -0.4405517578125, -0.3860321044921875, -0.331512451171875, -0.2769927978515625, -0.22247314453125, -0.1679534912109375, -0.113433837890625, -0.0589141845703125, -0.00439453125, 0.0501251220703125, 0.104644775390625, 0.1591644287109375, 0.21368408203125, 0.2682037353515625, 0.322723388671875, 0.3772430419921875, 0.4317626953125, 0.4862823486328125, 0.540802001953125, 0.5953216552734375, 0.64984130859375, 0.7043609619140625, 0.758880615234375, 0.8134002685546875, 0.867919921875, 0.9224395751953125, 0.976959228515625, 1.0314788818359375, 1.08599853515625, 1.1405181884765625, 1.195037841796875, 1.2495574951171875, 1.3040771484375, 1.3585968017578125, 1.413116455078125, 1.4676361083984375, 1.52215576171875, 1.5766754150390625, 1.631195068359375, 1.6857147216796875, 1.740234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 5.0, 3.0, 6.0, 10.0, 12.0, 13.0, 27.0, 29.0, 36.0, 35.0, 46.0, 53.0, 62.0, 63.0, 63.0, 50.0, 61.0, 72.0, 55.0, 62.0, 37.0, 30.0, 35.0, 30.0, 21.0, 14.0, 12.0, 14.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.94140625, -1.8896026611328125, -1.837799072265625, -1.7859954833984375, -1.73419189453125, -1.6823883056640625, -1.630584716796875, -1.5787811279296875, -1.5269775390625, -1.4751739501953125, -1.423370361328125, -1.3715667724609375, -1.31976318359375, -1.2679595947265625, -1.216156005859375, -1.1643524169921875, -1.112548828125, -1.0607452392578125, -1.008941650390625, -0.9571380615234375, -0.90533447265625, -0.8535308837890625, -0.801727294921875, -0.7499237060546875, -0.6981201171875, -0.6463165283203125, -0.594512939453125, -0.5427093505859375, -0.49090576171875, -0.4391021728515625, -0.387298583984375, -0.3354949951171875, -0.28369140625, -0.2318878173828125, -0.180084228515625, -0.1282806396484375, -0.07647705078125, -0.0246734619140625, 0.027130126953125, 0.0789337158203125, 0.1307373046875, 0.1825408935546875, 0.234344482421875, 0.2861480712890625, 0.33795166015625, 0.3897552490234375, 0.441558837890625, 0.4933624267578125, 0.545166015625, 0.5969696044921875, 0.648773193359375, 0.7005767822265625, 0.75238037109375, 0.8041839599609375, 0.855987548828125, 0.9077911376953125, 0.9595947265625, 1.0113983154296875, 1.063201904296875, 1.1150054931640625, 1.16680908203125, 1.2186126708984375, 1.270416259765625, 1.3222198486328125, 1.3740234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 14.0, 27.0, 55.0, 93.0, 167.0, 308.0, 704.0, 1895.0, 6973.0, 48827.0, 671121.0, 291244.0, 20693.0, 4006.0, 1302.0, 514.0, 255.0, 139.0, 72.0, 54.0, 18.0, 13.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.05859375, -1.0281829833984375, -0.997772216796875, -0.9673614501953125, -0.93695068359375, -0.9065399169921875, -0.876129150390625, -0.8457183837890625, -0.8153076171875, -0.7848968505859375, -0.754486083984375, -0.7240753173828125, -0.69366455078125, -0.6632537841796875, -0.632843017578125, -0.6024322509765625, -0.572021484375, -0.5416107177734375, -0.511199951171875, -0.4807891845703125, -0.45037841796875, -0.4199676513671875, -0.389556884765625, -0.3591461181640625, -0.3287353515625, -0.2983245849609375, -0.267913818359375, -0.2375030517578125, -0.20709228515625, -0.1766815185546875, -0.146270751953125, -0.1158599853515625, -0.08544921875, -0.0550384521484375, -0.024627685546875, 0.0057830810546875, 0.03619384765625, 0.0666046142578125, 0.097015380859375, 0.1274261474609375, 0.1578369140625, 0.1882476806640625, 0.218658447265625, 0.2490692138671875, 0.27947998046875, 0.3098907470703125, 0.340301513671875, 0.3707122802734375, 0.401123046875, 0.4315338134765625, 0.461944580078125, 0.4923553466796875, 0.52276611328125, 0.5531768798828125, 0.583587646484375, 0.6139984130859375, 0.6444091796875, 0.6748199462890625, 0.705230712890625, 0.7356414794921875, 0.76605224609375, 0.7964630126953125, 0.826873779296875, 0.8572845458984375, 0.8876953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 11.0, 25.0, 23.0, 25.0, 41.0, 60.0, 72.0, 88.0, 98.0, 104.0, 96.0, 81.0, 65.0, 52.0, 44.0, 28.0, 19.0, 14.0, 7.0, 4.0, 12.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011944770812988281, -0.00011563487350940704, -0.00011182203888893127, -0.0001080092042684555, -0.00010419636964797974, -0.00010038353502750397, -9.65707004070282e-05, -9.275786578655243e-05, -8.894503116607666e-05, -8.513219654560089e-05, -8.131936192512512e-05, -7.750652730464935e-05, -7.369369268417358e-05, -6.988085806369781e-05, -6.606802344322205e-05, -6.225518882274628e-05, -5.844235420227051e-05, -5.462951958179474e-05, -5.081668496131897e-05, -4.70038503408432e-05, -4.319101572036743e-05, -3.937818109989166e-05, -3.5565346479415894e-05, -3.1752511858940125e-05, -2.7939677238464355e-05, -2.4126842617988586e-05, -2.0314007997512817e-05, -1.650117337703705e-05, -1.268833875656128e-05, -8.87550413608551e-06, -5.062669515609741e-06, -1.2498348951339722e-06, 2.562999725341797e-06, 6.375834345817566e-06, 1.0188668966293335e-05, 1.4001503586769104e-05, 1.7814338207244873e-05, 2.1627172827720642e-05, 2.544000744819641e-05, 2.925284206867218e-05, 3.306567668914795e-05, 3.687851130962372e-05, 4.069134593009949e-05, 4.4504180550575256e-05, 4.8317015171051025e-05, 5.2129849791526794e-05, 5.5942684412002563e-05, 5.975551903247833e-05, 6.35683536529541e-05, 6.738118827342987e-05, 7.119402289390564e-05, 7.500685751438141e-05, 7.881969213485718e-05, 8.263252675533295e-05, 8.644536137580872e-05, 9.025819599628448e-05, 9.407103061676025e-05, 9.788386523723602e-05, 0.00010169669985771179, 0.00010550953447818756, 0.00010932236909866333, 0.0001131352037191391, 0.00011694803833961487, 0.00012076087296009064, 0.0001245737075805664]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 9.0, 23.0, 33.0, 70.0, 119.0, 268.0, 698.0, 2157.0, 10511.0, 143935.0, 810995.0, 70055.0, 7029.0, 1591.0, 575.0, 252.0, 95.0, 45.0, 28.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.4041595458984375, -1.371795654296875, -1.3394317626953125, -1.30706787109375, -1.2747039794921875, -1.242340087890625, -1.2099761962890625, -1.1776123046875, -1.1452484130859375, -1.112884521484375, -1.0805206298828125, -1.04815673828125, -1.0157928466796875, -0.983428955078125, -0.9510650634765625, -0.918701171875, -0.8863372802734375, -0.853973388671875, -0.8216094970703125, -0.78924560546875, -0.7568817138671875, -0.724517822265625, -0.6921539306640625, -0.6597900390625, -0.6274261474609375, -0.595062255859375, -0.5626983642578125, -0.53033447265625, -0.4979705810546875, -0.465606689453125, -0.4332427978515625, -0.40087890625, -0.3685150146484375, -0.336151123046875, -0.3037872314453125, -0.27142333984375, -0.2390594482421875, -0.206695556640625, -0.1743316650390625, -0.1419677734375, -0.1096038818359375, -0.077239990234375, -0.0448760986328125, -0.01251220703125, 0.0198516845703125, 0.052215576171875, 0.0845794677734375, 0.116943359375, 0.1493072509765625, 0.181671142578125, 0.2140350341796875, 0.24639892578125, 0.2787628173828125, 0.311126708984375, 0.3434906005859375, 0.3758544921875, 0.4082183837890625, 0.440582275390625, 0.4729461669921875, 0.50531005859375, 0.5376739501953125, 0.570037841796875, 0.6024017333984375, 0.634765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 10.0, 21.0, 19.0, 47.0, 31.0, 68.0, 92.0, 110.0, 122.0, 137.0, 97.0, 65.0, 56.0, 44.0, 23.0, 13.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7294921875, -0.7124176025390625, -0.695343017578125, -0.6782684326171875, -0.66119384765625, -0.6441192626953125, -0.627044677734375, -0.6099700927734375, -0.5928955078125, -0.5758209228515625, -0.558746337890625, -0.5416717529296875, -0.52459716796875, -0.5075225830078125, -0.490447998046875, -0.4733734130859375, -0.456298828125, -0.4392242431640625, -0.422149658203125, -0.4050750732421875, -0.38800048828125, -0.3709259033203125, -0.353851318359375, -0.3367767333984375, -0.3197021484375, -0.3026275634765625, -0.285552978515625, -0.2684783935546875, -0.25140380859375, -0.2343292236328125, -0.217254638671875, -0.2001800537109375, -0.18310546875, -0.1660308837890625, -0.148956298828125, -0.1318817138671875, -0.11480712890625, -0.0977325439453125, -0.080657958984375, -0.0635833740234375, -0.0465087890625, -0.0294342041015625, -0.012359619140625, 0.0047149658203125, 0.02178955078125, 0.0388641357421875, 0.055938720703125, 0.0730133056640625, 0.090087890625, 0.1071624755859375, 0.124237060546875, 0.1413116455078125, 0.15838623046875, 0.1754608154296875, 0.192535400390625, 0.2096099853515625, 0.2266845703125, 0.2437591552734375, 0.260833740234375, 0.2779083251953125, 0.29498291015625, 0.3120574951171875, 0.329132080078125, 0.3462066650390625, 0.36328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 11.0, 5.0, 7.0, 16.0, 20.0, 34.0, 47.0, 81.0, 120.0, 162.0, 158.0, 126.0, 69.0, 53.0, 39.0, 18.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.183361053466797, -11.862210273742676, -11.541058540344238, -11.219907760620117, -10.898756980895996, -10.577606201171875, -10.256454467773438, -9.935303688049316, -9.614152908325195, -9.293002128601074, -8.971850395202637, -8.650699615478516, -8.329548835754395, -8.008398056030273, -7.687246322631836, -7.366095542907715, -7.044943809509277, -6.723792552947998, -6.402641773223877, -6.081490516662598, -5.760339736938477, -5.439188480377197, -5.118037223815918, -4.796886444091797, -4.475735187530518, -4.154583930969238, -3.833433151245117, -3.512281894683838, -3.1911308765411377, -2.8699798583984375, -2.548828601837158, -2.227677583694458, -1.9065256118774414, -1.5853745937347412, -1.2642234563827515, -0.9430723786354065, -0.6219213008880615, -0.30077028274536133, 0.020380854606628418, 0.34153199195861816, 0.6626830101013184, 0.9838340878486633, 1.3049851655960083, 1.626136302947998, 1.9472873210906982, 2.2684383392333984, 2.5895895957946777, 2.910740613937378, 3.231891632080078, 3.5530426502227783, 3.8741936683654785, 4.195344924926758, 4.516495704650879, 4.837646961212158, 5.1587982177734375, 5.479948997497559, 5.801100254058838, 6.122251510620117, 6.443402290344238, 6.764553546905518, 7.085704803466797, 7.406855583190918, 7.728006839752197, 8.049158096313477, 8.370308876037598]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 12.0, 15.0, 21.0, 25.0, 25.0, 47.0, 43.0, 65.0, 51.0, 59.0, 85.0, 79.0, 75.0, 84.0, 67.0, 54.0, 30.0, 36.0, 26.0, 32.0, 13.0, 14.0, 15.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.267683029174805, -15.89025592803955, -15.51282787322998, -15.135400772094727, -14.757972717285156, -14.380545616149902, -14.003117561340332, -13.625690460205078, -13.248262405395508, -12.870835304260254, -12.493407249450684, -12.11598014831543, -11.73855209350586, -11.361124992370605, -10.983696937561035, -10.606269836425781, -10.228841781616211, -9.851414680480957, -9.473986625671387, -9.096559524536133, -8.719131469726562, -8.341704368591309, -7.964276313781738, -7.586849212646484, -7.2094221115112305, -6.831994533538818, -6.454566955566406, -6.077139377593994, -5.699711799621582, -5.32228422164917, -4.944856643676758, -4.567429542541504, -4.190001487731934, -3.8125739097595215, -3.4351463317871094, -3.0577187538146973, -2.680291175842285, -2.302863597869873, -1.92543625831604, -1.548008680343628, -1.1705811023712158, -0.7931535243988037, -0.4157260060310364, -0.03829848766326904, 0.33912909030914307, 0.7165566682815552, 1.0939841270446777, 1.4714117050170898, 1.848839282989502, 2.226266860961914, 2.603694438934326, 2.9811220169067383, 3.3585495948791504, 3.7359771728515625, 4.113404273986816, 4.490832328796387, 4.868259429931641, 5.245687007904053, 5.623114585876465, 6.000542163848877, 6.377969741821289, 6.755397319793701, 7.132824897766113, 7.510251998901367, 7.8876800537109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 10.0, 15.0, 17.0, 20.0, 28.0, 27.0, 44.0, 39.0, 55.0, 66.0, 106.0, 122.0, 196.0, 262.0, 365.0, 586.0, 1003.0, 1834.0, 3794.0, 8953.0, 27618.0, 151565.0, 3674503.0, 265498.0, 36975.0, 11083.0, 4393.0, 2130.0, 1082.0, 636.0, 430.0, 245.0, 160.0, 108.0, 74.0, 61.0, 37.0, 31.0, 22.0, 22.0, 22.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.4140625, -2.34222412109375, -2.2703857421875, -2.19854736328125, -2.126708984375, -2.05487060546875, -1.9830322265625, -1.91119384765625, -1.83935546875, -1.76751708984375, -1.6956787109375, -1.62384033203125, -1.552001953125, -1.48016357421875, -1.4083251953125, -1.33648681640625, -1.2646484375, -1.19281005859375, -1.1209716796875, -1.04913330078125, -0.977294921875, -0.90545654296875, -0.8336181640625, -0.76177978515625, -0.68994140625, -0.61810302734375, -0.5462646484375, -0.47442626953125, -0.402587890625, -0.33074951171875, -0.2589111328125, -0.18707275390625, -0.115234375, -0.04339599609375, 0.0284423828125, 0.10028076171875, 0.172119140625, 0.24395751953125, 0.3157958984375, 0.38763427734375, 0.45947265625, 0.53131103515625, 0.6031494140625, 0.67498779296875, 0.746826171875, 0.81866455078125, 0.8905029296875, 0.96234130859375, 1.0341796875, 1.10601806640625, 1.1778564453125, 1.24969482421875, 1.321533203125, 1.39337158203125, 1.4652099609375, 1.53704833984375, 1.60888671875, 1.68072509765625, 1.7525634765625, 1.82440185546875, 1.896240234375, 1.96807861328125, 2.0399169921875, 2.11175537109375, 2.18359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 18.0, 20.0, 31.0, 53.0, 56.0, 71.0, 88.0, 94.0, 91.0, 89.0, 69.0, 77.0, 51.0, 46.0, 39.0, 30.0, 17.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.47998046875, -0.466064453125, -0.4521484375, -0.438232421875, -0.42431640625, -0.410400390625, -0.396484375, -0.382568359375, -0.36865234375, -0.354736328125, -0.3408203125, -0.326904296875, -0.31298828125, -0.299072265625, -0.28515625, -0.271240234375, -0.25732421875, -0.243408203125, -0.2294921875, -0.215576171875, -0.20166015625, -0.187744140625, -0.173828125, -0.159912109375, -0.14599609375, -0.132080078125, -0.1181640625, -0.104248046875, -0.09033203125, -0.076416015625, -0.0625, -0.048583984375, -0.03466796875, -0.020751953125, -0.0068359375, 0.007080078125, 0.02099609375, 0.034912109375, 0.048828125, 0.062744140625, 0.07666015625, 0.090576171875, 0.1044921875, 0.118408203125, 0.13232421875, 0.146240234375, 0.16015625, 0.174072265625, 0.18798828125, 0.201904296875, 0.2158203125, 0.229736328125, 0.24365234375, 0.257568359375, 0.271484375, 0.285400390625, 0.29931640625, 0.313232421875, 0.3271484375, 0.341064453125, 0.35498046875, 0.368896484375, 0.3828125, 0.396728515625, 0.41064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 7.0, 18.0, 46.0, 78.0, 112.0, 234.0, 507.0, 1160.0, 2944.0, 8940.0, 48239.0, 3818852.0, 286479.0, 18504.0, 4893.0, 1762.0, 715.0, 337.0, 172.0, 99.0, 59.0, 30.0, 27.0, 11.0, 13.0, 8.0, 6.0, 8.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8984375, -2.7813720703125, -2.664306640625, -2.5472412109375, -2.43017578125, -2.3131103515625, -2.196044921875, -2.0789794921875, -1.9619140625, -1.8448486328125, -1.727783203125, -1.6107177734375, -1.49365234375, -1.3765869140625, -1.259521484375, -1.1424560546875, -1.025390625, -0.9083251953125, -0.791259765625, -0.6741943359375, -0.55712890625, -0.4400634765625, -0.322998046875, -0.2059326171875, -0.0888671875, 0.0281982421875, 0.145263671875, 0.2623291015625, 0.37939453125, 0.4964599609375, 0.613525390625, 0.7305908203125, 0.84765625, 0.9647216796875, 1.081787109375, 1.1988525390625, 1.31591796875, 1.4329833984375, 1.550048828125, 1.6671142578125, 1.7841796875, 1.9012451171875, 2.018310546875, 2.1353759765625, 2.25244140625, 2.3695068359375, 2.486572265625, 2.6036376953125, 2.720703125, 2.8377685546875, 2.954833984375, 3.0718994140625, 3.18896484375, 3.3060302734375, 3.423095703125, 3.5401611328125, 3.6572265625, 3.7742919921875, 3.891357421875, 4.0084228515625, 4.12548828125, 4.2425537109375, 4.359619140625, 4.4766845703125, 4.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 7.0, 17.0, 17.0, 29.0, 76.0, 127.0, 368.0, 2040.0, 932.0, 244.0, 85.0, 44.0, 27.0, 11.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.9521484375, -0.912109375, -0.8720703125, -0.83203125, -0.7919921875, -0.751953125, -0.7119140625, -0.671875, -0.6318359375, -0.591796875, -0.5517578125, -0.51171875, -0.4716796875, -0.431640625, -0.3916015625, -0.3515625, -0.3115234375, -0.271484375, -0.2314453125, -0.19140625, -0.1513671875, -0.111328125, -0.0712890625, -0.03125, 0.0087890625, 0.048828125, 0.0888671875, 0.12890625, 0.1689453125, 0.208984375, 0.2490234375, 0.2890625, 0.3291015625, 0.369140625, 0.4091796875, 0.44921875, 0.4892578125, 0.529296875, 0.5693359375, 0.609375, 0.6494140625, 0.689453125, 0.7294921875, 0.76953125, 0.8095703125, 0.849609375, 0.8896484375, 0.9296875, 0.9697265625, 1.009765625, 1.0498046875, 1.08984375, 1.1298828125, 1.169921875, 1.2099609375, 1.25, 1.2900390625, 1.330078125, 1.3701171875, 1.41015625, 1.4501953125, 1.490234375, 1.5302734375, 1.5703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 35.0, 143.0, 305.0, 305.0, 125.0, 42.0, 17.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.918496131896973, -13.593974113464355, -13.269453048706055, -12.944931030273438, -12.62040901184082, -12.29588794708252, -11.971365928649902, -11.646844863891602, -11.322322845458984, -10.997800827026367, -10.673279762268066, -10.34875774383545, -10.024236679077148, -9.699714660644531, -9.375192642211914, -9.050670623779297, -8.726149559020996, -8.401627540588379, -8.077106475830078, -7.752584457397461, -7.428062915802002, -7.103541374206543, -6.779019355773926, -6.454497814178467, -6.129976272583008, -5.805454730987549, -5.48093318939209, -5.156411170959473, -4.831889629364014, -4.507368087768555, -4.1828460693359375, -3.8583245277404785, -3.5338029861450195, -3.2092814445495605, -2.8847596645355225, -2.5602378845214844, -2.2357163429260254, -1.9111946821212769, -1.5866730213165283, -1.2621512413024902, -0.9376296997070312, -0.6131080389022827, -0.2885863780975342, 0.035935282707214355, 0.3604569435119629, 0.6849786043167114, 1.00950026512146, 1.334022045135498, 1.658543586730957, 1.9830652475357056, 2.307586908340454, 2.632108688354492, 2.956630229949951, 3.28115177154541, 3.6056735515594482, 3.9301953315734863, 4.254716873168945, 4.579238414764404, 4.903759956359863, 5.2282819747924805, 5.5528035163879395, 5.877325057983398, 6.201847076416016, 6.526368618011475, 6.850890159606934]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 11.0, 8.0, 8.0, 9.0, 25.0, 25.0, 34.0, 38.0, 57.0, 55.0, 67.0, 63.0, 94.0, 73.0, 80.0, 79.0, 62.0, 52.0, 38.0, 40.0, 28.0, 21.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.513881683349609, -4.385019302368164, -4.256156921386719, -4.127294063568115, -3.99843168258667, -3.8695693016052246, -3.7407069206237793, -3.611844539642334, -3.4829819202423096, -3.3541195392608643, -3.22525691986084, -3.0963945388793945, -2.967532157897949, -2.838669538497925, -2.7098071575164795, -2.580944538116455, -2.4520821571350098, -2.3232197761535645, -2.19435715675354, -2.0654947757720947, -1.9366322755813599, -1.807769775390625, -1.6789073944091797, -1.5500448942184448, -1.42118239402771, -1.292319893836975, -1.1634573936462402, -1.034595012664795, -0.9057325124740601, -0.7768700122833252, -0.6480075716972351, -0.519145131111145, -0.39028310775756836, -0.2614206373691559, -0.1325581669807434, -0.0036956965923309326, 0.12516677379608154, 0.2540292739868164, 0.3828917145729065, 0.5117541551589966, 0.6406166553497314, 0.7694791555404663, 0.8983415961265564, 1.0272040367126465, 1.1560665369033813, 1.2849290370941162, 1.4137914180755615, 1.5426539182662964, 1.6715164184570312, 1.8003789186477661, 1.929241418838501, 2.0581037998199463, 2.1869664192199707, 2.315828800201416, 2.4446911811828613, 2.5735535621643066, 2.702416181564331, 2.8312785625457764, 2.960141181945801, 3.089003562927246, 3.2178659439086914, 3.346728563308716, 3.475590944290161, 3.6044535636901855, 3.733315944671631]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 13.0, 15.0, 19.0, 25.0, 28.0, 49.0, 50.0, 78.0, 97.0, 145.0, 215.0, 268.0, 394.0, 572.0, 800.0, 1341.0, 2155.0, 4026.0, 9110.0, 29719.0, 147955.0, 547188.0, 236848.0, 43495.0, 11920.0, 4794.0, 2552.0, 1566.0, 945.0, 659.0, 425.0, 288.0, 201.0, 161.0, 99.0, 78.0, 57.0, 42.0, 34.0, 18.0, 23.0, 11.0, 18.0, 9.0, 5.0, 8.0, 7.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.9375, -1.8781280517578125, -1.818756103515625, -1.7593841552734375, -1.70001220703125, -1.6406402587890625, -1.581268310546875, -1.5218963623046875, -1.4625244140625, -1.4031524658203125, -1.343780517578125, -1.2844085693359375, -1.22503662109375, -1.1656646728515625, -1.106292724609375, -1.0469207763671875, -0.987548828125, -0.9281768798828125, -0.868804931640625, -0.8094329833984375, -0.75006103515625, -0.6906890869140625, -0.631317138671875, -0.5719451904296875, -0.5125732421875, -0.4532012939453125, -0.393829345703125, -0.3344573974609375, -0.27508544921875, -0.2157135009765625, -0.156341552734375, -0.0969696044921875, -0.03759765625, 0.0217742919921875, 0.081146240234375, 0.1405181884765625, 0.19989013671875, 0.2592620849609375, 0.318634033203125, 0.3780059814453125, 0.4373779296875, 0.4967498779296875, 0.556121826171875, 0.6154937744140625, 0.67486572265625, 0.7342376708984375, 0.793609619140625, 0.8529815673828125, 0.912353515625, 0.9717254638671875, 1.031097412109375, 1.0904693603515625, 1.14984130859375, 1.2092132568359375, 1.268585205078125, 1.3279571533203125, 1.3873291015625, 1.4467010498046875, 1.506072998046875, 1.5654449462890625, 1.62481689453125, 1.6841888427734375, 1.743560791015625, 1.8029327392578125, 1.8623046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 9.0, 14.0, 18.0, 35.0, 45.0, 70.0, 95.0, 104.0, 139.0, 100.0, 109.0, 88.0, 53.0, 38.0, 25.0, 14.0, 17.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6025390625, -0.5846481323242188, -0.5667572021484375, -0.5488662719726562, -0.530975341796875, -0.5130844116210938, -0.4951934814453125, -0.47730255126953125, -0.45941162109375, -0.44152069091796875, -0.4236297607421875, -0.40573883056640625, -0.387847900390625, -0.36995697021484375, -0.3520660400390625, -0.33417510986328125, -0.3162841796875, -0.29839324951171875, -0.2805023193359375, -0.26261138916015625, -0.244720458984375, -0.22682952880859375, -0.2089385986328125, -0.19104766845703125, -0.17315673828125, -0.15526580810546875, -0.1373748779296875, -0.11948394775390625, -0.101593017578125, -0.08370208740234375, -0.0658111572265625, -0.04792022705078125, -0.030029296875, -0.01213836669921875, 0.0057525634765625, 0.02364349365234375, 0.041534423828125, 0.05942535400390625, 0.0773162841796875, 0.09520721435546875, 0.11309814453125, 0.13098907470703125, 0.1488800048828125, 0.16677093505859375, 0.184661865234375, 0.20255279541015625, 0.2204437255859375, 0.23833465576171875, 0.2562255859375, 0.27411651611328125, 0.2920074462890625, 0.30989837646484375, 0.327789306640625, 0.34568023681640625, 0.3635711669921875, 0.38146209716796875, 0.39935302734375, 0.41724395751953125, 0.4351348876953125, 0.45302581787109375, 0.470916748046875, 0.48880767822265625, 0.5066986083984375, 0.5245895385742188, 0.54248046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 14.0, 15.0, 17.0, 29.0, 43.0, 57.0, 80.0, 91.0, 178.0, 289.0, 465.0, 853.0, 1622.0, 3329.0, 7738.0, 20960.0, 64275.0, 204074.0, 407638.0, 225997.0, 71943.0, 23205.0, 8342.0, 3452.0, 1580.0, 818.0, 460.0, 343.0, 197.0, 115.0, 75.0, 59.0, 56.0, 27.0, 30.0, 13.0, 14.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.0478515625, -1.015655517578125, -0.98345947265625, -0.951263427734375, -0.9190673828125, -0.886871337890625, -0.85467529296875, -0.822479248046875, -0.790283203125, -0.758087158203125, -0.72589111328125, -0.693695068359375, -0.6614990234375, -0.629302978515625, -0.59710693359375, -0.564910888671875, -0.53271484375, -0.500518798828125, -0.46832275390625, -0.436126708984375, -0.4039306640625, -0.371734619140625, -0.33953857421875, -0.307342529296875, -0.275146484375, -0.242950439453125, -0.21075439453125, -0.178558349609375, -0.1463623046875, -0.114166259765625, -0.08197021484375, -0.049774169921875, -0.017578125, 0.014617919921875, 0.04681396484375, 0.079010009765625, 0.1112060546875, 0.143402099609375, 0.17559814453125, 0.207794189453125, 0.239990234375, 0.272186279296875, 0.30438232421875, 0.336578369140625, 0.3687744140625, 0.400970458984375, 0.43316650390625, 0.465362548828125, 0.49755859375, 0.529754638671875, 0.56195068359375, 0.594146728515625, 0.6263427734375, 0.658538818359375, 0.69073486328125, 0.722930908203125, 0.755126953125, 0.787322998046875, 0.81951904296875, 0.851715087890625, 0.8839111328125, 0.916107177734375, 0.94830322265625, 0.980499267578125, 1.0126953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 11.0, 10.0, 20.0, 24.0, 33.0, 35.0, 35.0, 44.0, 44.0, 39.0, 45.0, 49.0, 49.0, 52.0, 50.0, 47.0, 47.0, 39.0, 26.0, 41.0, 42.0, 40.0, 25.0, 28.0, 20.0, 18.0, 20.0, 14.0, 8.0, 8.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.07421875, -1.0384674072265625, -1.002716064453125, -0.9669647216796875, -0.93121337890625, -0.8954620361328125, -0.859710693359375, -0.8239593505859375, -0.7882080078125, -0.7524566650390625, -0.716705322265625, -0.6809539794921875, -0.64520263671875, -0.6094512939453125, -0.573699951171875, -0.5379486083984375, -0.502197265625, -0.4664459228515625, -0.430694580078125, -0.3949432373046875, -0.35919189453125, -0.3234405517578125, -0.287689208984375, -0.2519378662109375, -0.2161865234375, -0.1804351806640625, -0.144683837890625, -0.1089324951171875, -0.07318115234375, -0.0374298095703125, -0.001678466796875, 0.0340728759765625, 0.06982421875, 0.1055755615234375, 0.141326904296875, 0.1770782470703125, 0.21282958984375, 0.2485809326171875, 0.284332275390625, 0.3200836181640625, 0.3558349609375, 0.3915863037109375, 0.427337646484375, 0.4630889892578125, 0.49884033203125, 0.5345916748046875, 0.570343017578125, 0.6060943603515625, 0.641845703125, 0.6775970458984375, 0.713348388671875, 0.7490997314453125, 0.78485107421875, 0.8206024169921875, 0.856353759765625, 0.8921051025390625, 0.9278564453125, 0.9636077880859375, 0.999359130859375, 1.0351104736328125, 1.07086181640625, 1.1066131591796875, 1.142364501953125, 1.1781158447265625, 1.2138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 9.0, 20.0, 25.0, 36.0, 79.0, 140.0, 286.0, 689.0, 2442.0, 14629.0, 336289.0, 660035.0, 28585.0, 3648.0, 928.0, 324.0, 143.0, 84.0, 48.0, 47.0, 23.0, 16.0, 10.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3769760131835938, -1.3408660888671875, -1.3047561645507812, -1.268646240234375, -1.2325363159179688, -1.1964263916015625, -1.1603164672851562, -1.12420654296875, -1.0880966186523438, -1.0519866943359375, -1.0158767700195312, -0.979766845703125, -0.9436569213867188, -0.9075469970703125, -0.8714370727539062, -0.8353271484375, -0.7992172241210938, -0.7631072998046875, -0.7269973754882812, -0.690887451171875, -0.6547775268554688, -0.6186676025390625, -0.5825576782226562, -0.54644775390625, -0.5103378295898438, -0.4742279052734375, -0.43811798095703125, -0.402008056640625, -0.36589813232421875, -0.3297882080078125, -0.29367828369140625, -0.257568359375, -0.22145843505859375, -0.1853485107421875, -0.14923858642578125, -0.113128662109375, -0.07701873779296875, -0.0409088134765625, -0.00479888916015625, 0.03131103515625, 0.06742095947265625, 0.1035308837890625, 0.13964080810546875, 0.175750732421875, 0.21186065673828125, 0.2479705810546875, 0.28408050537109375, 0.3201904296875, 0.35630035400390625, 0.3924102783203125, 0.42852020263671875, 0.464630126953125, 0.5007400512695312, 0.5368499755859375, 0.5729598999023438, 0.60906982421875, 0.6451797485351562, 0.6812896728515625, 0.7173995971679688, 0.753509521484375, 0.7896194458007812, 0.8257293701171875, 0.8618392944335938, 0.89794921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 19.0, 25.0, 22.0, 48.0, 72.0, 151.0, 186.0, 185.0, 124.0, 79.0, 45.0, 27.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00029659271240234375, -0.0002903798595070839, -0.00028416700661182404, -0.0002779541537165642, -0.0002717413008213043, -0.00026552844792604446, -0.0002593155950307846, -0.00025310274213552475, -0.0002468898892402649, -0.00024067703634500504, -0.00023446418344974518, -0.00022825133055448532, -0.00022203847765922546, -0.0002158256247639656, -0.00020961277186870575, -0.0002033999189734459, -0.00019718706607818604, -0.00019097421318292618, -0.00018476136028766632, -0.00017854850739240646, -0.0001723356544971466, -0.00016612280160188675, -0.0001599099487066269, -0.00015369709581136703, -0.00014748424291610718, -0.00014127139002084732, -0.00013505853712558746, -0.0001288456842303276, -0.00012263283133506775, -0.00011641997843980789, -0.00011020712554454803, -0.00010399427264928818, -9.778141975402832e-05, -9.156856685876846e-05, -8.53557139635086e-05, -7.914286106824875e-05, -7.293000817298889e-05, -6.671715527772903e-05, -6.050430238246918e-05, -5.429144948720932e-05, -4.807859659194946e-05, -4.1865743696689606e-05, -3.565289080142975e-05, -2.944003790616989e-05, -2.3227185010910034e-05, -1.7014332115650177e-05, -1.080147922039032e-05, -4.588626325130463e-06, 1.6242265701293945e-06, 7.837079465389252e-06, 1.4049932360649109e-05, 2.0262785255908966e-05, 2.6475638151168823e-05, 3.268849104642868e-05, 3.890134394168854e-05, 4.5114196836948395e-05, 5.132704973220825e-05, 5.753990262746811e-05, 6.375275552272797e-05, 6.996560841798782e-05, 7.617846131324768e-05, 8.239131420850754e-05, 8.86041671037674e-05, 9.481701999902725e-05, 0.00010102987289428711]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 10.0, 11.0, 18.0, 18.0, 34.0, 64.0, 122.0, 178.0, 432.0, 877.0, 2112.0, 6519.0, 27920.0, 183318.0, 594887.0, 192797.0, 28529.0, 6717.0, 2236.0, 844.0, 421.0, 223.0, 97.0, 59.0, 38.0, 25.0, 17.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5064926147460938, -0.4880828857421875, -0.46967315673828125, -0.451263427734375, -0.43285369873046875, -0.4144439697265625, -0.39603424072265625, -0.37762451171875, -0.35921478271484375, -0.3408050537109375, -0.32239532470703125, -0.303985595703125, -0.28557586669921875, -0.2671661376953125, -0.24875640869140625, -0.2303466796875, -0.21193695068359375, -0.1935272216796875, -0.17511749267578125, -0.156707763671875, -0.13829803466796875, -0.1198883056640625, -0.10147857666015625, -0.08306884765625, -0.06465911865234375, -0.0462493896484375, -0.02783966064453125, -0.009429931640625, 0.00897979736328125, 0.0273895263671875, 0.04579925537109375, 0.064208984375, 0.08261871337890625, 0.1010284423828125, 0.11943817138671875, 0.137847900390625, 0.15625762939453125, 0.1746673583984375, 0.19307708740234375, 0.21148681640625, 0.22989654541015625, 0.2483062744140625, 0.26671600341796875, 0.285125732421875, 0.30353546142578125, 0.3219451904296875, 0.34035491943359375, 0.3587646484375, 0.37717437744140625, 0.3955841064453125, 0.41399383544921875, 0.432403564453125, 0.45081329345703125, 0.4692230224609375, 0.48763275146484375, 0.50604248046875, 0.5244522094726562, 0.5428619384765625, 0.5612716674804688, 0.579681396484375, 0.5980911254882812, 0.6165008544921875, 0.6349105834960938, 0.6533203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 8.0, 19.0, 16.0, 22.0, 34.0, 40.0, 59.0, 64.0, 79.0, 105.0, 78.0, 87.0, 75.0, 64.0, 66.0, 33.0, 41.0, 25.0, 21.0, 16.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.34468841552734375, -0.3300018310546875, -0.31531524658203125, -0.300628662109375, -0.28594207763671875, -0.2712554931640625, -0.25656890869140625, -0.24188232421875, -0.22719573974609375, -0.2125091552734375, -0.19782257080078125, -0.183135986328125, -0.16844940185546875, -0.1537628173828125, -0.13907623291015625, -0.1243896484375, -0.10970306396484375, -0.0950164794921875, -0.08032989501953125, -0.065643310546875, -0.05095672607421875, -0.0362701416015625, -0.02158355712890625, -0.00689697265625, 0.00778961181640625, 0.0224761962890625, 0.03716278076171875, 0.051849365234375, 0.06653594970703125, 0.0812225341796875, 0.09590911865234375, 0.110595703125, 0.12528228759765625, 0.1399688720703125, 0.15465545654296875, 0.169342041015625, 0.18402862548828125, 0.1987152099609375, 0.21340179443359375, 0.22808837890625, 0.24277496337890625, 0.2574615478515625, 0.27214813232421875, 0.286834716796875, 0.30152130126953125, 0.3162078857421875, 0.33089447021484375, 0.3455810546875, 0.36026763916015625, 0.3749542236328125, 0.38964080810546875, 0.404327392578125, 0.41901397705078125, 0.4337005615234375, 0.44838714599609375, 0.46307373046875, 0.47776031494140625, 0.4924468994140625, 0.5071334838867188, 0.521820068359375, 0.5365066528320312, 0.5511932373046875, 0.5658798217773438, 0.58056640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 14.0, 26.0, 68.0, 129.0, 227.0, 242.0, 156.0, 58.0, 45.0, 21.0, 7.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.999469757080078, -18.576515197753906, -18.153560638427734, -17.730607986450195, -17.307653427124023, -16.88469886779785, -16.46174430847168, -16.03879165649414, -15.615837097167969, -15.192882537841797, -14.769928932189941, -14.34697437286377, -13.924020767211914, -13.501066207885742, -13.07811164855957, -12.655158042907715, -12.232203483581543, -11.809248924255371, -11.386295318603516, -10.963340759277344, -10.540387153625488, -10.117432594299316, -9.694478988647461, -9.271524429321289, -8.848569869995117, -8.425615310668945, -8.00266170501709, -7.579707145690918, -7.1567535400390625, -6.733798980712891, -6.310844898223877, -5.887890815734863, -5.464937210083008, -5.041983127593994, -4.6190290451049805, -4.196074485778809, -3.773120641708374, -3.3501665592193604, -2.9272122383117676, -2.504258155822754, -2.0813040733337402, -1.6583499908447266, -1.2353957891464233, -0.8124415874481201, -0.38948750495910645, 0.03346657752990723, 0.4564208984375, 0.8793749809265137, 1.3023290634155273, 1.725283145904541, 2.1482372283935547, 2.5711915493011475, 2.994145631790161, 3.417099714279175, 3.8400540351867676, 4.263008117675781, 4.685962200164795, 5.108916282653809, 5.531870365142822, 5.954824447631836, 6.377779006958008, 6.800732612609863, 7.223687171936035, 7.646641254425049, 8.069595336914062]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 8.0, 21.0, 15.0, 22.0, 20.0, 26.0, 31.0, 37.0, 31.0, 46.0, 51.0, 52.0, 69.0, 64.0, 67.0, 57.0, 46.0, 60.0, 47.0, 33.0, 43.0, 35.0, 30.0, 19.0, 20.0, 8.0, 14.0, 14.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.585875034332275, -7.340003490447998, -7.094131946563721, -6.848260402679443, -6.602388858795166, -6.356517314910889, -6.1106462478637695, -5.864774703979492, -5.618903160095215, -5.3730316162109375, -5.12716007232666, -4.881288528442383, -4.6354169845581055, -4.389545440673828, -4.143673896789551, -3.8978025913238525, -3.651930809020996, -3.4060592651367188, -3.1601877212524414, -2.914316177368164, -2.6684446334838867, -2.4225730895996094, -2.176701784133911, -1.9308302402496338, -1.6849586963653564, -1.439087152481079, -1.1932156085968018, -0.947344183921814, -0.7014726400375366, -0.4556010961532593, -0.20972967147827148, 0.03614187240600586, 0.282012939453125, 0.5278844833374023, 0.7737559676170349, 1.0196274518966675, 1.2654989957809448, 1.5113705396652222, 1.75724196434021, 2.0031135082244873, 2.2489850521087646, 2.494856595993042, 2.7407281398773193, 2.9865994453430176, 3.232470989227295, 3.4783425331115723, 3.7242140769958496, 3.970085620880127, 4.215957164764404, 4.461828708648682, 4.707700252532959, 4.953571796417236, 5.199443340301514, 5.445314884185791, 5.69118595123291, 5.9370574951171875, 6.182929039001465, 6.428800582885742, 6.6746721267700195, 6.920543670654297, 7.166415214538574, 7.412286758422852, 7.658158302307129, 7.904029846191406, 8.149901390075684]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 10.0, 21.0, 9.0, 24.0, 32.0, 43.0, 85.0, 136.0, 233.0, 407.0, 736.0, 1454.0, 4116.0, 21644.0, 1121111.0, 3012390.0, 24269.0, 4391.0, 1522.0, 737.0, 330.0, 221.0, 138.0, 83.0, 42.0, 20.0, 20.0, 14.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.50390625, -3.409271240234375, -3.31463623046875, -3.220001220703125, -3.1253662109375, -3.030731201171875, -2.93609619140625, -2.841461181640625, -2.746826171875, -2.652191162109375, -2.55755615234375, -2.462921142578125, -2.3682861328125, -2.273651123046875, -2.17901611328125, -2.084381103515625, -1.98974609375, -1.895111083984375, -1.80047607421875, -1.705841064453125, -1.6112060546875, -1.516571044921875, -1.42193603515625, -1.327301025390625, -1.232666015625, -1.138031005859375, -1.04339599609375, -0.948760986328125, -0.8541259765625, -0.759490966796875, -0.66485595703125, -0.570220947265625, -0.4755859375, -0.380950927734375, -0.28631591796875, -0.191680908203125, -0.0970458984375, -0.002410888671875, 0.09222412109375, 0.186859130859375, 0.281494140625, 0.376129150390625, 0.47076416015625, 0.565399169921875, 0.6600341796875, 0.754669189453125, 0.84930419921875, 0.943939208984375, 1.03857421875, 1.133209228515625, 1.22784423828125, 1.322479248046875, 1.4171142578125, 1.511749267578125, 1.60638427734375, 1.701019287109375, 1.795654296875, 1.890289306640625, 1.98492431640625, 2.079559326171875, 2.1741943359375, 2.268829345703125, 2.36346435546875, 2.458099365234375, 2.552734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 19.0, 35.0, 27.0, 77.0, 103.0, 110.0, 119.0, 122.0, 94.0, 89.0, 71.0, 34.0, 23.0, 24.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.63525390625, -0.6164703369140625, -0.597686767578125, -0.5789031982421875, -0.56011962890625, -0.5413360595703125, -0.522552490234375, -0.5037689208984375, -0.4849853515625, -0.4662017822265625, -0.447418212890625, -0.4286346435546875, -0.40985107421875, -0.3910675048828125, -0.372283935546875, -0.3535003662109375, -0.334716796875, -0.3159332275390625, -0.297149658203125, -0.2783660888671875, -0.25958251953125, -0.2407989501953125, -0.222015380859375, -0.2032318115234375, -0.1844482421875, -0.1656646728515625, -0.146881103515625, -0.1280975341796875, -0.10931396484375, -0.0905303955078125, -0.071746826171875, -0.0529632568359375, -0.0341796875, -0.0153961181640625, 0.003387451171875, 0.0221710205078125, 0.04095458984375, 0.0597381591796875, 0.078521728515625, 0.0973052978515625, 0.1160888671875, 0.1348724365234375, 0.153656005859375, 0.1724395751953125, 0.19122314453125, 0.2100067138671875, 0.228790283203125, 0.2475738525390625, 0.266357421875, 0.2851409912109375, 0.303924560546875, 0.3227081298828125, 0.34149169921875, 0.3602752685546875, 0.379058837890625, 0.3978424072265625, 0.4166259765625, 0.4354095458984375, 0.454193115234375, 0.4729766845703125, 0.49176025390625, 0.5105438232421875, 0.529327392578125, 0.5481109619140625, 0.56689453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 13.0, 10.0, 16.0, 28.0, 47.0, 65.0, 104.0, 169.0, 282.0, 528.0, 1124.0, 2770.0, 11407.0, 96060.0, 3834917.0, 222057.0, 18116.0, 3854.0, 1395.0, 625.0, 277.0, 152.0, 70.0, 52.0, 61.0, 22.0, 17.0, 15.0, 11.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.4822845458984375, -2.419647216796875, -2.3570098876953125, -2.29437255859375, -2.2317352294921875, -2.169097900390625, -2.1064605712890625, -2.0438232421875, -1.9811859130859375, -1.918548583984375, -1.8559112548828125, -1.79327392578125, -1.7306365966796875, -1.667999267578125, -1.6053619384765625, -1.542724609375, -1.4800872802734375, -1.417449951171875, -1.3548126220703125, -1.29217529296875, -1.2295379638671875, -1.166900634765625, -1.1042633056640625, -1.0416259765625, -0.9789886474609375, -0.916351318359375, -0.8537139892578125, -0.79107666015625, -0.7284393310546875, -0.665802001953125, -0.6031646728515625, -0.54052734375, -0.4778900146484375, -0.415252685546875, -0.3526153564453125, -0.28997802734375, -0.2273406982421875, -0.164703369140625, -0.1020660400390625, -0.0394287109375, 0.0232086181640625, 0.085845947265625, 0.1484832763671875, 0.21112060546875, 0.2737579345703125, 0.336395263671875, 0.3990325927734375, 0.461669921875, 0.5243072509765625, 0.586944580078125, 0.6495819091796875, 0.71221923828125, 0.7748565673828125, 0.837493896484375, 0.9001312255859375, 0.9627685546875, 1.0254058837890625, 1.088043212890625, 1.1506805419921875, 1.21331787109375, 1.2759552001953125, 1.338592529296875, 1.4012298583984375, 1.4638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 16.0, 29.0, 55.0, 140.0, 373.0, 2223.0, 848.0, 190.0, 74.0, 46.0, 33.0, 11.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0830612182617188, -1.0577239990234375, -1.0323867797851562, -1.007049560546875, -0.9817123413085938, -0.9563751220703125, -0.9310379028320312, -0.90570068359375, -0.8803634643554688, -0.8550262451171875, -0.8296890258789062, -0.804351806640625, -0.7790145874023438, -0.7536773681640625, -0.7283401489257812, -0.7030029296875, -0.6776657104492188, -0.6523284912109375, -0.6269912719726562, -0.601654052734375, -0.5763168334960938, -0.5509796142578125, -0.5256423950195312, -0.50030517578125, -0.47496795654296875, -0.4496307373046875, -0.42429351806640625, -0.398956298828125, -0.37361907958984375, -0.3482818603515625, -0.32294464111328125, -0.297607421875, -0.27227020263671875, -0.2469329833984375, -0.22159576416015625, -0.196258544921875, -0.17092132568359375, -0.1455841064453125, -0.12024688720703125, -0.09490966796875, -0.06957244873046875, -0.0442352294921875, -0.01889801025390625, 0.006439208984375, 0.03177642822265625, 0.0571136474609375, 0.08245086669921875, 0.1077880859375, 0.13312530517578125, 0.1584625244140625, 0.18379974365234375, 0.209136962890625, 0.23447418212890625, 0.2598114013671875, 0.28514862060546875, 0.31048583984375, 0.33582305908203125, 0.3611602783203125, 0.38649749755859375, 0.411834716796875, 0.43717193603515625, 0.4625091552734375, 0.48784637451171875, 0.51318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 22.0, 44.0, 113.0, 188.0, 246.0, 213.0, 94.0, 39.0, 22.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.731424808502197, -5.589971542358398, -5.4485182762146, -5.307065486907959, -5.16561222076416, -5.024158954620361, -4.8827056884765625, -4.741252422332764, -4.599799156188965, -4.458345890045166, -4.316892623901367, -4.175439834594727, -4.033986568450928, -3.892533302307129, -3.75108003616333, -3.6096267700195312, -3.4681739807128906, -3.326720714569092, -3.185267686843872, -3.0438144207000732, -2.9023613929748535, -2.7609081268310547, -2.619454860687256, -2.478001594543457, -2.3365485668182373, -2.1950953006744385, -2.0536422729492188, -1.91218900680542, -1.7707358598709106, -1.6292827129364014, -1.4878294467926025, -1.3463762998580933, -1.2049236297607422, -1.063470482826233, -0.9220172762870789, -0.7805640697479248, -0.6391109228134155, -0.49765777587890625, -0.3562045693397522, -0.21475136280059814, -0.07329821586608887, 0.0681549608707428, 0.20960813760757446, 0.35106131434440613, 0.4925144910812378, 0.6339676380157471, 0.7754208445549011, 0.9168740510940552, 1.0583271980285645, 1.1997803449630737, 1.341233491897583, 1.4826867580413818, 1.6241399049758911, 1.7655930519104004, 1.9070463180541992, 2.048499584197998, 2.1899526119232178, 2.3314058780670166, 2.4728589057922363, 2.614312171936035, 2.755765438079834, 2.8972184658050537, 3.0386717319488525, 3.1801247596740723, 3.321578025817871]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 11.0, 10.0, 12.0, 13.0, 31.0, 29.0, 32.0, 43.0, 36.0, 34.0, 55.0, 45.0, 50.0, 56.0, 54.0, 52.0, 63.0, 45.0, 36.0, 36.0, 46.0, 37.0, 29.0, 22.0, 23.0, 24.0, 10.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8159911632537842, -1.7610372304916382, -1.7060832977294922, -1.6511292457580566, -1.5961753129959106, -1.5412213802337646, -1.4862674474716187, -1.4313135147094727, -1.376359462738037, -1.3214055299758911, -1.2664515972137451, -1.2114975452423096, -1.1565436124801636, -1.1015896797180176, -1.0466357469558716, -0.9916818141937256, -0.9367278814315796, -0.8817739486694336, -0.8268199563026428, -0.7718660235404968, -0.716912031173706, -0.6619580984115601, -0.6070041656494141, -0.5520502328872681, -0.4970962405204773, -0.4421422779560089, -0.3871883153915405, -0.33223438262939453, -0.27728042006492615, -0.22232645750045776, -0.16737252473831177, -0.11241856217384338, -0.057464599609375, -0.002510644495487213, 0.052443310618400574, 0.10739725828170776, 0.16235122084617615, 0.21730518341064453, 0.2722591161727905, 0.3272130787372589, 0.3821670413017273, 0.4371210038661957, 0.49207496643066406, 0.5470288991928101, 0.601982831954956, 0.6569368243217468, 0.7118907570838928, 0.7668447494506836, 0.8217986822128296, 0.8767526149749756, 0.9317066073417664, 0.9866605401039124, 1.0416145324707031, 1.0965684652328491, 1.1515223979949951, 1.2064763307571411, 1.261430263519287, 1.316384196281433, 1.371338129043579, 1.4262921810150146, 1.4812461137771606, 1.5362000465393066, 1.5911539793014526, 1.6461079120635986, 1.7010619640350342]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 12.0, 8.0, 20.0, 12.0, 28.0, 26.0, 47.0, 62.0, 100.0, 111.0, 163.0, 237.0, 363.0, 485.0, 723.0, 1046.0, 1715.0, 2884.0, 6307.0, 19033.0, 90177.0, 452068.0, 375415.0, 68958.0, 15558.0, 5386.0, 2770.0, 1582.0, 1012.0, 704.0, 460.0, 323.0, 195.0, 151.0, 104.0, 82.0, 65.0, 54.0, 30.0, 22.0, 13.0, 19.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.61541748046875, -1.5531005859375, -1.49078369140625, -1.428466796875, -1.36614990234375, -1.3038330078125, -1.24151611328125, -1.17919921875, -1.11688232421875, -1.0545654296875, -0.99224853515625, -0.929931640625, -0.86761474609375, -0.8052978515625, -0.74298095703125, -0.6806640625, -0.61834716796875, -0.5560302734375, -0.49371337890625, -0.431396484375, -0.36907958984375, -0.3067626953125, -0.24444580078125, -0.18212890625, -0.11981201171875, -0.0574951171875, 0.00482177734375, 0.067138671875, 0.12945556640625, 0.1917724609375, 0.25408935546875, 0.31640625, 0.37872314453125, 0.4410400390625, 0.50335693359375, 0.565673828125, 0.62799072265625, 0.6903076171875, 0.75262451171875, 0.81494140625, 0.87725830078125, 0.9395751953125, 1.00189208984375, 1.064208984375, 1.12652587890625, 1.1888427734375, 1.25115966796875, 1.3134765625, 1.37579345703125, 1.4381103515625, 1.50042724609375, 1.562744140625, 1.62506103515625, 1.6873779296875, 1.74969482421875, 1.81201171875, 1.87432861328125, 1.9366455078125, 1.99896240234375, 2.061279296875, 2.12359619140625, 2.1859130859375, 2.24822998046875, 2.310546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 30.0, 28.0, 62.0, 70.0, 111.0, 112.0, 134.0, 110.0, 109.0, 78.0, 52.0, 33.0, 20.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.63232421875, -0.61279296875, -0.59326171875, -0.57373046875, -0.55419921875, -0.53466796875, -0.51513671875, -0.49560546875, -0.47607421875, -0.45654296875, -0.43701171875, -0.41748046875, -0.39794921875, -0.37841796875, -0.35888671875, -0.33935546875, -0.31982421875, -0.30029296875, -0.28076171875, -0.26123046875, -0.24169921875, -0.22216796875, -0.20263671875, -0.18310546875, -0.16357421875, -0.14404296875, -0.12451171875, -0.10498046875, -0.08544921875, -0.06591796875, -0.04638671875, -0.02685546875, -0.00732421875, 0.01220703125, 0.03173828125, 0.05126953125, 0.07080078125, 0.09033203125, 0.10986328125, 0.12939453125, 0.14892578125, 0.16845703125, 0.18798828125, 0.20751953125, 0.22705078125, 0.24658203125, 0.26611328125, 0.28564453125, 0.30517578125, 0.32470703125, 0.34423828125, 0.36376953125, 0.38330078125, 0.40283203125, 0.42236328125, 0.44189453125, 0.46142578125, 0.48095703125, 0.50048828125, 0.52001953125, 0.53955078125, 0.55908203125, 0.57861328125, 0.59814453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 14.0, 20.0, 21.0, 42.0, 45.0, 59.0, 120.0, 173.0, 272.0, 565.0, 1141.0, 2746.0, 7596.0, 23118.0, 82573.0, 295424.0, 427337.0, 147784.0, 39729.0, 12031.0, 4135.0, 1711.0, 797.0, 403.0, 269.0, 155.0, 87.0, 61.0, 42.0, 23.0, 19.0, 10.0, 9.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.10711669921875, -1.0716552734375, -1.03619384765625, -1.000732421875, -0.96527099609375, -0.9298095703125, -0.89434814453125, -0.85888671875, -0.82342529296875, -0.7879638671875, -0.75250244140625, -0.717041015625, -0.68157958984375, -0.6461181640625, -0.61065673828125, -0.5751953125, -0.53973388671875, -0.5042724609375, -0.46881103515625, -0.433349609375, -0.39788818359375, -0.3624267578125, -0.32696533203125, -0.29150390625, -0.25604248046875, -0.2205810546875, -0.18511962890625, -0.149658203125, -0.11419677734375, -0.0787353515625, -0.04327392578125, -0.0078125, 0.02764892578125, 0.0631103515625, 0.09857177734375, 0.134033203125, 0.16949462890625, 0.2049560546875, 0.24041748046875, 0.27587890625, 0.31134033203125, 0.3468017578125, 0.38226318359375, 0.417724609375, 0.45318603515625, 0.4886474609375, 0.52410888671875, 0.5595703125, 0.59503173828125, 0.6304931640625, 0.66595458984375, 0.701416015625, 0.73687744140625, 0.7723388671875, 0.80780029296875, 0.84326171875, 0.87872314453125, 0.9141845703125, 0.94964599609375, 0.985107421875, 1.02056884765625, 1.0560302734375, 1.09149169921875, 1.126953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 5.0, 7.0, 14.0, 10.0, 11.0, 22.0, 23.0, 38.0, 20.0, 35.0, 35.0, 56.0, 52.0, 62.0, 52.0, 50.0, 50.0, 56.0, 54.0, 52.0, 52.0, 44.0, 31.0, 31.0, 39.0, 21.0, 23.0, 16.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2007293701171875, -1.160247802734375, -1.1197662353515625, -1.07928466796875, -1.0388031005859375, -0.998321533203125, -0.9578399658203125, -0.9173583984375, -0.8768768310546875, -0.836395263671875, -0.7959136962890625, -0.75543212890625, -0.7149505615234375, -0.674468994140625, -0.6339874267578125, -0.593505859375, -0.5530242919921875, -0.512542724609375, -0.4720611572265625, -0.43157958984375, -0.3910980224609375, -0.350616455078125, -0.3101348876953125, -0.2696533203125, -0.2291717529296875, -0.188690185546875, -0.1482086181640625, -0.10772705078125, -0.0672454833984375, -0.026763916015625, 0.0137176513671875, 0.05419921875, 0.0946807861328125, 0.135162353515625, 0.1756439208984375, 0.21612548828125, 0.2566070556640625, 0.297088623046875, 0.3375701904296875, 0.3780517578125, 0.4185333251953125, 0.459014892578125, 0.4994964599609375, 0.53997802734375, 0.5804595947265625, 0.620941162109375, 0.6614227294921875, 0.701904296875, 0.7423858642578125, 0.782867431640625, 0.8233489990234375, 0.86383056640625, 0.9043121337890625, 0.944793701171875, 0.9852752685546875, 1.0257568359375, 1.0662384033203125, 1.106719970703125, 1.1472015380859375, 1.18768310546875, 1.2281646728515625, 1.268646240234375, 1.3091278076171875, 1.349609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 16.0, 27.0, 39.0, 63.0, 103.0, 161.0, 282.0, 617.0, 1377.0, 4309.0, 20513.0, 162677.0, 629782.0, 196792.0, 24055.0, 4790.0, 1583.0, 634.0, 299.0, 172.0, 100.0, 46.0, 32.0, 21.0, 14.0, 10.0, 8.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.669921875, -0.6505279541015625, -0.631134033203125, -0.6117401123046875, -0.59234619140625, -0.5729522705078125, -0.553558349609375, -0.5341644287109375, -0.5147705078125, -0.4953765869140625, -0.475982666015625, -0.4565887451171875, -0.43719482421875, -0.4178009033203125, -0.398406982421875, -0.3790130615234375, -0.359619140625, -0.3402252197265625, -0.320831298828125, -0.3014373779296875, -0.28204345703125, -0.2626495361328125, -0.243255615234375, -0.2238616943359375, -0.2044677734375, -0.1850738525390625, -0.165679931640625, -0.1462860107421875, -0.12689208984375, -0.1074981689453125, -0.088104248046875, -0.0687103271484375, -0.04931640625, -0.0299224853515625, -0.010528564453125, 0.0088653564453125, 0.02825927734375, 0.0476531982421875, 0.067047119140625, 0.0864410400390625, 0.1058349609375, 0.1252288818359375, 0.144622802734375, 0.1640167236328125, 0.18341064453125, 0.2028045654296875, 0.222198486328125, 0.2415924072265625, 0.260986328125, 0.2803802490234375, 0.299774169921875, 0.3191680908203125, 0.33856201171875, 0.3579559326171875, 0.377349853515625, 0.3967437744140625, 0.4161376953125, 0.4355316162109375, 0.454925537109375, 0.4743194580078125, 0.49371337890625, 0.5131072998046875, 0.532501220703125, 0.5518951416015625, 0.5712890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 9.0, 5.0, 7.0, 16.0, 20.0, 20.0, 28.0, 40.0, 39.0, 32.0, 66.0, 67.0, 90.0, 86.0, 91.0, 78.0, 63.0, 55.0, 45.0, 26.0, 20.0, 34.0, 12.0, 17.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.00010198354721069336, -9.93385910987854e-05, -9.669363498687744e-05, -9.404867887496948e-05, -9.140372276306152e-05, -8.875876665115356e-05, -8.61138105392456e-05, -8.346885442733765e-05, -8.082389831542969e-05, -7.817894220352173e-05, -7.553398609161377e-05, -7.288902997970581e-05, -7.024407386779785e-05, -6.759911775588989e-05, -6.495416164398193e-05, -6.230920553207397e-05, -5.9664249420166016e-05, -5.701929330825806e-05, -5.43743371963501e-05, -5.172938108444214e-05, -4.908442497253418e-05, -4.643946886062622e-05, -4.379451274871826e-05, -4.11495566368103e-05, -3.8504600524902344e-05, -3.5859644412994385e-05, -3.3214688301086426e-05, -3.056973218917847e-05, -2.7924776077270508e-05, -2.527981996536255e-05, -2.263486385345459e-05, -1.998990774154663e-05, -1.7344951629638672e-05, -1.4699995517730713e-05, -1.2055039405822754e-05, -9.410083293914795e-06, -6.765127182006836e-06, -4.120171070098877e-06, -1.475214958190918e-06, 1.169741153717041e-06, 3.814697265625e-06, 6.459653377532959e-06, 9.104609489440918e-06, 1.1749565601348877e-05, 1.4394521713256836e-05, 1.7039477825164795e-05, 1.9684433937072754e-05, 2.2329390048980713e-05, 2.4974346160888672e-05, 2.761930227279663e-05, 3.026425838470459e-05, 3.290921449661255e-05, 3.555417060852051e-05, 3.819912672042847e-05, 4.0844082832336426e-05, 4.3489038944244385e-05, 4.6133995056152344e-05, 4.87789511680603e-05, 5.142390727996826e-05, 5.406886339187622e-05, 5.671381950378418e-05, 5.935877561569214e-05, 6.20037317276001e-05, 6.464868783950806e-05, 6.729364395141602e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 3.0, 5.0, 5.0, 12.0, 23.0, 34.0, 47.0, 92.0, 142.0, 247.0, 478.0, 925.0, 2345.0, 6628.0, 25313.0, 126810.0, 484769.0, 317235.0, 62270.0, 13981.0, 4137.0, 1531.0, 682.0, 365.0, 197.0, 103.0, 62.0, 45.0, 24.0, 11.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.40769195556640625, -0.3930206298828125, -0.37834930419921875, -0.363677978515625, -0.34900665283203125, -0.3343353271484375, -0.31966400146484375, -0.30499267578125, -0.29032135009765625, -0.2756500244140625, -0.26097869873046875, -0.246307373046875, -0.23163604736328125, -0.2169647216796875, -0.20229339599609375, -0.1876220703125, -0.17295074462890625, -0.1582794189453125, -0.14360809326171875, -0.128936767578125, -0.11426544189453125, -0.0995941162109375, -0.08492279052734375, -0.07025146484375, -0.05558013916015625, -0.0409088134765625, -0.02623748779296875, -0.011566162109375, 0.00310516357421875, 0.0177764892578125, 0.03244781494140625, 0.047119140625, 0.06179046630859375, 0.0764617919921875, 0.09113311767578125, 0.105804443359375, 0.12047576904296875, 0.1351470947265625, 0.14981842041015625, 0.16448974609375, 0.17916107177734375, 0.1938323974609375, 0.20850372314453125, 0.223175048828125, 0.23784637451171875, 0.2525177001953125, 0.26718902587890625, 0.2818603515625, 0.29653167724609375, 0.3112030029296875, 0.32587432861328125, 0.340545654296875, 0.35521697998046875, 0.3698883056640625, 0.38455963134765625, 0.39923095703125, 0.41390228271484375, 0.4285736083984375, 0.44324493408203125, 0.457916259765625, 0.47258758544921875, 0.4872589111328125, 0.5019302368164062, 0.5166015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 10.0, 11.0, 24.0, 39.0, 27.0, 48.0, 81.0, 93.0, 94.0, 116.0, 88.0, 84.0, 69.0, 47.0, 44.0, 30.0, 22.0, 17.0, 16.0, 10.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3066825866699219, -0.29183197021484375, -0.2769813537597656, -0.2621307373046875, -0.24728012084960938, -0.23242950439453125, -0.21757888793945312, -0.202728271484375, -0.18787765502929688, -0.17302703857421875, -0.15817642211914062, -0.1433258056640625, -0.12847518920898438, -0.11362457275390625, -0.09877395629882812, -0.08392333984375, -0.06907272338867188, -0.05422210693359375, -0.039371490478515625, -0.0245208740234375, -0.009670257568359375, 0.00518035888671875, 0.020030975341796875, 0.034881591796875, 0.049732208251953125, 0.06458282470703125, 0.07943344116210938, 0.0942840576171875, 0.10913467407226562, 0.12398529052734375, 0.13883590698242188, 0.1536865234375, 0.16853713989257812, 0.18338775634765625, 0.19823837280273438, 0.2130889892578125, 0.22793960571289062, 0.24279022216796875, 0.2576408386230469, 0.272491455078125, 0.2873420715332031, 0.30219268798828125, 0.3170433044433594, 0.3318939208984375, 0.3467445373535156, 0.36159515380859375, 0.3764457702636719, 0.39129638671875, 0.4061470031738281, 0.42099761962890625, 0.4358482360839844, 0.4506988525390625, 0.4655494689941406, 0.48040008544921875, 0.4952507019042969, 0.510101318359375, 0.5249519348144531, 0.5398025512695312, 0.5546531677246094, 0.5695037841796875, 0.5843544006347656, 0.5992050170898438, 0.6140556335449219, 0.62890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 2.0, 7.0, 10.0, 18.0, 21.0, 44.0, 57.0, 94.0, 142.0, 130.0, 140.0, 107.0, 79.0, 52.0, 29.0, 19.0, 17.0, 5.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.574131965637207, -8.32158088684082, -8.069028854370117, -7.816477298736572, -7.563925743103027, -7.311374187469482, -7.0588226318359375, -6.806271076202393, -6.553719520568848, -6.301167964935303, -6.048616409301758, -5.796064853668213, -5.543513298034668, -5.290961742401123, -5.038410186767578, -4.785858631134033, -4.533307075500488, -4.280755519866943, -4.028203964233398, -3.7756524085998535, -3.5231008529663086, -3.2705492973327637, -3.0179977416992188, -2.765446186065674, -2.512894630432129, -2.260343074798584, -2.007791519165039, -1.7552399635314941, -1.5026884078979492, -1.2501368522644043, -0.9975852966308594, -0.7450337409973145, -0.49248218536376953, -0.2399306297302246, 0.012620925903320312, 0.26517248153686523, 0.5177240371704102, 0.7702755928039551, 1.0228271484375, 1.275378704071045, 1.5279302597045898, 1.7804818153381348, 2.0330333709716797, 2.2855849266052246, 2.5381364822387695, 2.7906880378723145, 3.0432395935058594, 3.2957911491394043, 3.548342704772949, 3.800894260406494, 4.053445816040039, 4.305997371673584, 4.558548927307129, 4.811100482940674, 5.063652038574219, 5.316203594207764, 5.568755149841309, 5.8213067054748535, 6.073858261108398, 6.326409816741943, 6.578961372375488, 6.831512928009033, 7.084064483642578, 7.336616039276123, 7.589167594909668]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 2.0, 8.0, 10.0, 17.0, 11.0, 16.0, 19.0, 25.0, 27.0, 25.0, 32.0, 30.0, 24.0, 34.0, 32.0, 38.0, 54.0, 42.0, 33.0, 50.0, 42.0, 32.0, 48.0, 38.0, 52.0, 36.0, 30.0, 29.0, 18.0, 18.0, 14.0, 16.0, 16.0, 11.0, 13.0, 15.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.057811737060547, -4.880091667175293, -4.702371120452881, -4.524651050567627, -4.346930980682373, -4.169210433959961, -3.991490364074707, -3.813770055770874, -3.636049747467041, -3.458329439163208, -3.280609369277954, -3.102889060974121, -2.925168752670288, -2.747448444366455, -2.569728374481201, -2.392008066177368, -2.2142879962921143, -2.0365676879882812, -1.8588474988937378, -1.6811273097991943, -1.5034070014953613, -1.3256868124008179, -1.1479666233062744, -0.9702463150024414, -0.792526125907898, -0.6148058772087097, -0.43708565831184387, -0.259365439414978, -0.0816451907157898, 0.09607505798339844, 0.2737952470779419, 0.4515155553817749, 0.6292357444763184, 0.8069559931755066, 0.9846762418746948, 1.1623964309692383, 1.3401167392730713, 1.5178369283676147, 1.6955571174621582, 1.8732774257659912, 2.050997734069824, 2.2287180423736572, 2.406438112258911, 2.584158420562744, 2.761878728866577, 2.93959903717041, 3.117319107055664, 3.295039415359497, 3.472759485244751, 3.650479793548584, 3.828199863433838, 4.00592041015625, 4.183640480041504, 4.361360549926758, 4.539080619812012, 4.716801166534424, 4.894521236419678, 5.072241306304932, 5.249961853027344, 5.427681922912598, 5.605401992797852, 5.783122539520264, 5.960842609405518, 6.13856315612793, 6.316283226013184]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 8.0, 19.0, 23.0, 33.0, 54.0, 78.0, 112.0, 211.0, 379.0, 635.0, 1261.0, 3009.0, 11725.0, 112893.0, 3965518.0, 83878.0, 9656.0, 2550.0, 1022.0, 486.0, 304.0, 138.0, 101.0, 52.0, 43.0, 17.0, 16.0, 15.0, 3.0, 4.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.1015625, -3.0059814453125, -2.910400390625, -2.8148193359375, -2.71923828125, -2.6236572265625, -2.528076171875, -2.4324951171875, -2.3369140625, -2.2413330078125, -2.145751953125, -2.0501708984375, -1.95458984375, -1.8590087890625, -1.763427734375, -1.6678466796875, -1.572265625, -1.4766845703125, -1.381103515625, -1.2855224609375, -1.18994140625, -1.0943603515625, -0.998779296875, -0.9031982421875, -0.8076171875, -0.7120361328125, -0.616455078125, -0.5208740234375, -0.42529296875, -0.3297119140625, -0.234130859375, -0.1385498046875, -0.04296875, 0.0526123046875, 0.148193359375, 0.2437744140625, 0.33935546875, 0.4349365234375, 0.530517578125, 0.6260986328125, 0.7216796875, 0.8172607421875, 0.912841796875, 1.0084228515625, 1.10400390625, 1.1995849609375, 1.295166015625, 1.3907470703125, 1.486328125, 1.5819091796875, 1.677490234375, 1.7730712890625, 1.86865234375, 1.9642333984375, 2.059814453125, 2.1553955078125, 2.2509765625, 2.3465576171875, 2.442138671875, 2.5377197265625, 2.63330078125, 2.7288818359375, 2.824462890625, 2.9200439453125, 3.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 11.0, 25.0, 28.0, 45.0, 72.0, 102.0, 112.0, 108.0, 120.0, 96.0, 84.0, 68.0, 40.0, 23.0, 18.0, 12.0, 9.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6087417602539062, -0.5895538330078125, -0.5703659057617188, -0.551177978515625, -0.5319900512695312, -0.5128021240234375, -0.49361419677734375, -0.47442626953125, -0.45523834228515625, -0.4360504150390625, -0.41686248779296875, -0.397674560546875, -0.37848663330078125, -0.3592987060546875, -0.34011077880859375, -0.3209228515625, -0.30173492431640625, -0.2825469970703125, -0.26335906982421875, -0.244171142578125, -0.22498321533203125, -0.2057952880859375, -0.18660736083984375, -0.16741943359375, -0.14823150634765625, -0.1290435791015625, -0.10985565185546875, -0.090667724609375, -0.07147979736328125, -0.0522918701171875, -0.03310394287109375, -0.013916015625, 0.00527191162109375, 0.0244598388671875, 0.04364776611328125, 0.062835693359375, 0.08202362060546875, 0.1012115478515625, 0.12039947509765625, 0.13958740234375, 0.15877532958984375, 0.1779632568359375, 0.19715118408203125, 0.216339111328125, 0.23552703857421875, 0.2547149658203125, 0.27390289306640625, 0.2930908203125, 0.31227874755859375, 0.3314666748046875, 0.35065460205078125, 0.369842529296875, 0.38903045654296875, 0.4082183837890625, 0.42740631103515625, 0.44659423828125, 0.46578216552734375, 0.4849700927734375, 0.5041580200195312, 0.523345947265625, 0.5425338745117188, 0.5617218017578125, 0.5809097290039062, 0.60009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 9.0, 10.0, 9.0, 16.0, 14.0, 22.0, 48.0, 43.0, 70.0, 103.0, 165.0, 274.0, 468.0, 1213.0, 3821.0, 21926.0, 632759.0, 3479291.0, 45092.0, 5833.0, 1652.0, 561.0, 305.0, 152.0, 110.0, 79.0, 53.0, 47.0, 25.0, 30.0, 27.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.041961669921875, -1.96673583984375, -1.891510009765625, -1.8162841796875, -1.741058349609375, -1.66583251953125, -1.590606689453125, -1.515380859375, -1.440155029296875, -1.36492919921875, -1.289703369140625, -1.2144775390625, -1.139251708984375, -1.06402587890625, -0.988800048828125, -0.91357421875, -0.838348388671875, -0.76312255859375, -0.687896728515625, -0.6126708984375, -0.537445068359375, -0.46221923828125, -0.386993408203125, -0.311767578125, -0.236541748046875, -0.16131591796875, -0.086090087890625, -0.0108642578125, 0.064361572265625, 0.13958740234375, 0.214813232421875, 0.2900390625, 0.365264892578125, 0.44049072265625, 0.515716552734375, 0.5909423828125, 0.666168212890625, 0.74139404296875, 0.816619873046875, 0.891845703125, 0.967071533203125, 1.04229736328125, 1.117523193359375, 1.1927490234375, 1.267974853515625, 1.34320068359375, 1.418426513671875, 1.49365234375, 1.568878173828125, 1.64410400390625, 1.719329833984375, 1.7945556640625, 1.869781494140625, 1.94500732421875, 2.020233154296875, 2.095458984375, 2.170684814453125, 2.24591064453125, 2.321136474609375, 2.3963623046875, 2.471588134765625, 2.54681396484375, 2.622039794921875, 2.697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 16.0, 37.0, 101.0, 441.0, 2614.0, 636.0, 134.0, 50.0, 20.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.065948486328125, -1.01666259765625, -0.967376708984375, -0.9180908203125, -0.868804931640625, -0.81951904296875, -0.770233154296875, -0.720947265625, -0.671661376953125, -0.62237548828125, -0.573089599609375, -0.5238037109375, -0.474517822265625, -0.42523193359375, -0.375946044921875, -0.32666015625, -0.277374267578125, -0.22808837890625, -0.178802490234375, -0.1295166015625, -0.080230712890625, -0.03094482421875, 0.018341064453125, 0.067626953125, 0.116912841796875, 0.16619873046875, 0.215484619140625, 0.2647705078125, 0.314056396484375, 0.36334228515625, 0.412628173828125, 0.4619140625, 0.511199951171875, 0.56048583984375, 0.609771728515625, 0.6590576171875, 0.708343505859375, 0.75762939453125, 0.806915283203125, 0.856201171875, 0.905487060546875, 0.95477294921875, 1.004058837890625, 1.0533447265625, 1.102630615234375, 1.15191650390625, 1.201202392578125, 1.25048828125, 1.299774169921875, 1.34906005859375, 1.398345947265625, 1.4476318359375, 1.496917724609375, 1.54620361328125, 1.595489501953125, 1.644775390625, 1.694061279296875, 1.74334716796875, 1.792633056640625, 1.8419189453125, 1.891204833984375, 1.94049072265625, 1.989776611328125, 2.0390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 33.0, 67.0, 154.0, 230.0, 236.0, 139.0, 68.0, 37.0, 14.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.674568176269531, -7.492204666137695, -7.309841156005859, -7.127477645874023, -6.9451141357421875, -6.762750148773193, -6.580386638641357, -6.3980231285095215, -6.2156596183776855, -6.03329610824585, -5.850932598114014, -5.668569087982178, -5.486205101013184, -5.303841590881348, -5.121478080749512, -4.939114570617676, -4.75675106048584, -4.574387550354004, -4.392024040222168, -4.209660530090332, -4.027297019958496, -3.844933271408081, -3.662569522857666, -3.48020601272583, -3.297842502593994, -3.115478992462158, -2.9331154823303223, -2.7507517337799072, -2.5683882236480713, -2.3860247135162354, -2.2036609649658203, -2.0212974548339844, -1.8389344215393066, -1.6565709114074707, -1.4742072820663452, -1.2918436527252197, -1.1094801425933838, -0.9271165728569031, -0.7447530031204224, -0.5623893737792969, -0.38002586364746094, -0.19766229391098022, -0.015298724174499512, 0.1670648455619812, 0.3494284152984619, 0.5317919850349426, 0.7141555547714233, 0.8965191841125488, 1.0788826942443848, 1.2612462043762207, 1.4436098337173462, 1.6259734630584717, 1.8083369731903076, 1.9907004833221436, 2.1730642318725586, 2.3554277420043945, 2.5377912521362305, 2.7201547622680664, 2.9025182723999023, 3.0848820209503174, 3.2672455310821533, 3.4496090412139893, 3.6319727897644043, 3.8143362998962402, 3.996699810028076]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 13.0, 11.0, 21.0, 28.0, 41.0, 42.0, 61.0, 51.0, 71.0, 81.0, 84.0, 84.0, 75.0, 57.0, 54.0, 58.0, 40.0, 33.0, 17.0, 24.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150228977203369, -3.053276538848877, -2.956324338912964, -2.859372138977051, -2.7624197006225586, -2.6654672622680664, -2.5685150623321533, -2.4715628623962402, -2.374610424041748, -2.277657985687256, -2.1807057857513428, -2.0837535858154297, -1.9868011474609375, -1.8898488283157349, -1.7928965091705322, -1.6959441900253296, -1.598991870880127, -1.5020395517349243, -1.4050872325897217, -1.308134913444519, -1.2111825942993164, -1.1142302751541138, -1.0172779560089111, -0.9203256368637085, -0.8233733177185059, -0.7264209985733032, -0.6294686794281006, -0.532516360282898, -0.4355640411376953, -0.3386117219924927, -0.24165940284729004, -0.1447070837020874, -0.047754764556884766, 0.04919755458831787, 0.1461498737335205, 0.24310219287872314, 0.3400545120239258, 0.4370068311691284, 0.533959150314331, 0.6309114694595337, 0.7278637886047363, 0.824816107749939, 0.9217684268951416, 1.0187207460403442, 1.1156730651855469, 1.2126253843307495, 1.3095777034759521, 1.4065300226211548, 1.5034823417663574, 1.60043466091156, 1.6973869800567627, 1.7943392992019653, 1.891291618347168, 1.9882439374923706, 2.0851962566375732, 2.1821484565734863, 2.2791008949279785, 2.3760533332824707, 2.473005533218384, 2.569957733154297, 2.666910171508789, 2.7638626098632812, 2.8608148097991943, 2.9577670097351074, 3.0547194480895996]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 10.0, 11.0, 21.0, 29.0, 39.0, 55.0, 88.0, 155.0, 268.0, 411.0, 830.0, 1600.0, 3588.0, 10924.0, 81771.0, 742213.0, 179336.0, 18080.0, 4742.0, 2061.0, 997.0, 509.0, 271.0, 185.0, 112.0, 81.0, 42.0, 31.0, 20.0, 11.0, 4.0, 9.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.52325439453125, -2.4351806640625, -2.34710693359375, -2.259033203125, -2.17095947265625, -2.0828857421875, -1.99481201171875, -1.90673828125, -1.81866455078125, -1.7305908203125, -1.64251708984375, -1.554443359375, -1.46636962890625, -1.3782958984375, -1.29022216796875, -1.2021484375, -1.11407470703125, -1.0260009765625, -0.93792724609375, -0.849853515625, -0.76177978515625, -0.6737060546875, -0.58563232421875, -0.49755859375, -0.40948486328125, -0.3214111328125, -0.23333740234375, -0.145263671875, -0.05718994140625, 0.0308837890625, 0.11895751953125, 0.20703125, 0.29510498046875, 0.3831787109375, 0.47125244140625, 0.559326171875, 0.64739990234375, 0.7354736328125, 0.82354736328125, 0.91162109375, 0.99969482421875, 1.0877685546875, 1.17584228515625, 1.263916015625, 1.35198974609375, 1.4400634765625, 1.52813720703125, 1.6162109375, 1.70428466796875, 1.7923583984375, 1.88043212890625, 1.968505859375, 2.05657958984375, 2.1446533203125, 2.23272705078125, 2.32080078125, 2.40887451171875, 2.4969482421875, 2.58502197265625, 2.673095703125, 2.76116943359375, 2.8492431640625, 2.93731689453125, 3.025390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 7.0, 11.0, 12.0, 25.0, 36.0, 53.0, 76.0, 104.0, 116.0, 114.0, 113.0, 108.0, 69.0, 59.0, 32.0, 23.0, 16.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66552734375, -0.6450347900390625, -0.624542236328125, -0.6040496826171875, -0.58355712890625, -0.5630645751953125, -0.542572021484375, -0.5220794677734375, -0.5015869140625, -0.4810943603515625, -0.460601806640625, -0.4401092529296875, -0.41961669921875, -0.3991241455078125, -0.378631591796875, -0.3581390380859375, -0.337646484375, -0.3171539306640625, -0.296661376953125, -0.2761688232421875, -0.25567626953125, -0.2351837158203125, -0.214691162109375, -0.1941986083984375, -0.1737060546875, -0.1532135009765625, -0.132720947265625, -0.1122283935546875, -0.09173583984375, -0.0712432861328125, -0.050750732421875, -0.0302581787109375, -0.009765625, 0.0107269287109375, 0.031219482421875, 0.0517120361328125, 0.07220458984375, 0.0926971435546875, 0.113189697265625, 0.1336822509765625, 0.1541748046875, 0.1746673583984375, 0.195159912109375, 0.2156524658203125, 0.23614501953125, 0.2566375732421875, 0.277130126953125, 0.2976226806640625, 0.318115234375, 0.3386077880859375, 0.359100341796875, 0.3795928955078125, 0.40008544921875, 0.4205780029296875, 0.441070556640625, 0.4615631103515625, 0.4820556640625, 0.5025482177734375, 0.523040771484375, 0.5435333251953125, 0.56402587890625, 0.5845184326171875, 0.605010986328125, 0.6255035400390625, 0.64599609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 14.0, 15.0, 24.0, 28.0, 41.0, 68.0, 93.0, 143.0, 212.0, 336.0, 679.0, 1482.0, 3619.0, 10272.0, 37078.0, 153646.0, 496753.0, 258198.0, 60478.0, 16191.0, 5098.0, 1969.0, 873.0, 420.0, 243.0, 175.0, 92.0, 68.0, 49.0, 41.0, 33.0, 21.0, 18.0, 10.0, 8.0, 7.0, 4.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.220703125, -1.1855010986328125, -1.150299072265625, -1.1150970458984375, -1.07989501953125, -1.0446929931640625, -1.009490966796875, -0.9742889404296875, -0.9390869140625, -0.9038848876953125, -0.868682861328125, -0.8334808349609375, -0.79827880859375, -0.7630767822265625, -0.727874755859375, -0.6926727294921875, -0.657470703125, -0.6222686767578125, -0.587066650390625, -0.5518646240234375, -0.51666259765625, -0.4814605712890625, -0.446258544921875, -0.4110565185546875, -0.3758544921875, -0.3406524658203125, -0.305450439453125, -0.2702484130859375, -0.23504638671875, -0.1998443603515625, -0.164642333984375, -0.1294403076171875, -0.09423828125, -0.0590362548828125, -0.023834228515625, 0.0113677978515625, 0.04656982421875, 0.0817718505859375, 0.116973876953125, 0.1521759033203125, 0.1873779296875, 0.2225799560546875, 0.257781982421875, 0.2929840087890625, 0.32818603515625, 0.3633880615234375, 0.398590087890625, 0.4337921142578125, 0.468994140625, 0.5041961669921875, 0.539398193359375, 0.5746002197265625, 0.60980224609375, 0.6450042724609375, 0.680206298828125, 0.7154083251953125, 0.7506103515625, 0.7858123779296875, 0.821014404296875, 0.8562164306640625, 0.89141845703125, 0.9266204833984375, 0.961822509765625, 0.9970245361328125, 1.0322265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 1.0, 9.0, 11.0, 10.0, 19.0, 19.0, 18.0, 29.0, 17.0, 18.0, 36.0, 29.0, 30.0, 37.0, 38.0, 40.0, 52.0, 45.0, 51.0, 36.0, 42.0, 42.0, 46.0, 33.0, 29.0, 32.0, 29.0, 33.0, 19.0, 22.0, 20.0, 17.0, 17.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0], "bins": [-1.1005859375, -1.0685272216796875, -1.036468505859375, -1.0044097900390625, -0.97235107421875, -0.9402923583984375, -0.908233642578125, -0.8761749267578125, -0.8441162109375, -0.8120574951171875, -0.779998779296875, -0.7479400634765625, -0.71588134765625, -0.6838226318359375, -0.651763916015625, -0.6197052001953125, -0.587646484375, -0.5555877685546875, -0.523529052734375, -0.4914703369140625, -0.45941162109375, -0.4273529052734375, -0.395294189453125, -0.3632354736328125, -0.3311767578125, -0.2991180419921875, -0.267059326171875, -0.2350006103515625, -0.20294189453125, -0.1708831787109375, -0.138824462890625, -0.1067657470703125, -0.07470703125, -0.0426483154296875, -0.010589599609375, 0.0214691162109375, 0.05352783203125, 0.0855865478515625, 0.117645263671875, 0.1497039794921875, 0.1817626953125, 0.2138214111328125, 0.245880126953125, 0.2779388427734375, 0.30999755859375, 0.3420562744140625, 0.374114990234375, 0.4061737060546875, 0.438232421875, 0.4702911376953125, 0.502349853515625, 0.5344085693359375, 0.56646728515625, 0.5985260009765625, 0.630584716796875, 0.6626434326171875, 0.6947021484375, 0.7267608642578125, 0.758819580078125, 0.7908782958984375, 0.82293701171875, 0.8549957275390625, 0.887054443359375, 0.9191131591796875, 0.951171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 11.0, 28.0, 23.0, 43.0, 109.0, 227.0, 655.0, 2589.0, 26418.0, 838266.0, 171438.0, 6882.0, 1141.0, 406.0, 125.0, 80.0, 47.0, 20.0, 19.0, 8.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.1595458984375, -1.121826171875, -1.0841064453125, -1.04638671875, -1.0086669921875, -0.970947265625, -0.9332275390625, -0.8955078125, -0.8577880859375, -0.820068359375, -0.7823486328125, -0.74462890625, -0.7069091796875, -0.669189453125, -0.6314697265625, -0.59375, -0.5560302734375, -0.518310546875, -0.4805908203125, -0.44287109375, -0.4051513671875, -0.367431640625, -0.3297119140625, -0.2919921875, -0.2542724609375, -0.216552734375, -0.1788330078125, -0.14111328125, -0.1033935546875, -0.065673828125, -0.0279541015625, 0.009765625, 0.0474853515625, 0.085205078125, 0.1229248046875, 0.16064453125, 0.1983642578125, 0.236083984375, 0.2738037109375, 0.3115234375, 0.3492431640625, 0.386962890625, 0.4246826171875, 0.46240234375, 0.5001220703125, 0.537841796875, 0.5755615234375, 0.61328125, 0.6510009765625, 0.688720703125, 0.7264404296875, 0.76416015625, 0.8018798828125, 0.839599609375, 0.8773193359375, 0.9150390625, 0.9527587890625, 0.990478515625, 1.0281982421875, 1.06591796875, 1.1036376953125, 1.141357421875, 1.1790771484375, 1.216796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 12.0, 11.0, 15.0, 18.0, 22.0, 39.0, 46.0, 67.0, 59.0, 83.0, 91.0, 102.0, 78.0, 66.0, 54.0, 43.0, 31.0, 26.0, 25.0, 14.0, 15.0, 8.0, 20.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.779764175415039e-05, -8.535757660865784e-05, -8.291751146316528e-05, -8.047744631767273e-05, -7.803738117218018e-05, -7.559731602668762e-05, -7.315725088119507e-05, -7.071718573570251e-05, -6.827712059020996e-05, -6.583705544471741e-05, -6.339699029922485e-05, -6.09569251537323e-05, -5.8516860008239746e-05, -5.607679486274719e-05, -5.363672971725464e-05, -5.1196664571762085e-05, -4.875659942626953e-05, -4.631653428077698e-05, -4.3876469135284424e-05, -4.143640398979187e-05, -3.8996338844299316e-05, -3.655627369880676e-05, -3.411620855331421e-05, -3.1676143407821655e-05, -2.92360782623291e-05, -2.6796013116836548e-05, -2.4355947971343994e-05, -2.191588282585144e-05, -1.9475817680358887e-05, -1.7035752534866333e-05, -1.459568738937378e-05, -1.2155622243881226e-05, -9.715557098388672e-06, -7.275491952896118e-06, -4.8354268074035645e-06, -2.3953616619110107e-06, 4.470348358154297e-08, 2.4847686290740967e-06, 4.92483377456665e-06, 7.364898920059204e-06, 9.804964065551758e-06, 1.2245029211044312e-05, 1.4685094356536865e-05, 1.712515950202942e-05, 1.9565224647521973e-05, 2.2005289793014526e-05, 2.444535493850708e-05, 2.6885420083999634e-05, 2.9325485229492188e-05, 3.176555037498474e-05, 3.4205615520477295e-05, 3.664568066596985e-05, 3.90857458114624e-05, 4.1525810956954956e-05, 4.396587610244751e-05, 4.6405941247940063e-05, 4.884600639343262e-05, 5.128607153892517e-05, 5.3726136684417725e-05, 5.616620182991028e-05, 5.860626697540283e-05, 6.104633212089539e-05, 6.348639726638794e-05, 6.592646241188049e-05, 6.836652755737305e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 15.0, 20.0, 34.0, 64.0, 82.0, 149.0, 443.0, 2122.0, 37973.0, 971714.0, 33079.0, 2016.0, 456.0, 159.0, 89.0, 53.0, 30.0, 16.0, 12.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.01171875, -1.9607696533203125, -1.909820556640625, -1.8588714599609375, -1.80792236328125, -1.7569732666015625, -1.706024169921875, -1.6550750732421875, -1.6041259765625, -1.5531768798828125, -1.502227783203125, -1.4512786865234375, -1.40032958984375, -1.3493804931640625, -1.298431396484375, -1.2474822998046875, -1.196533203125, -1.1455841064453125, -1.094635009765625, -1.0436859130859375, -0.99273681640625, -0.9417877197265625, -0.890838623046875, -0.8398895263671875, -0.7889404296875, -0.7379913330078125, -0.687042236328125, -0.6360931396484375, -0.58514404296875, -0.5341949462890625, -0.483245849609375, -0.4322967529296875, -0.38134765625, -0.3303985595703125, -0.279449462890625, -0.2285003662109375, -0.17755126953125, -0.1266021728515625, -0.075653076171875, -0.0247039794921875, 0.0262451171875, 0.0771942138671875, 0.128143310546875, 0.1790924072265625, 0.23004150390625, 0.2809906005859375, 0.331939697265625, 0.3828887939453125, 0.433837890625, 0.4847869873046875, 0.535736083984375, 0.5866851806640625, 0.63763427734375, 0.6885833740234375, 0.739532470703125, 0.7904815673828125, 0.8414306640625, 0.8923797607421875, 0.943328857421875, 0.9942779541015625, 1.04522705078125, 1.0961761474609375, 1.147125244140625, 1.1980743408203125, 1.2490234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 10.0, 15.0, 16.0, 21.0, 23.0, 34.0, 41.0, 49.0, 51.0, 95.0, 97.0, 99.0, 75.0, 82.0, 57.0, 53.0, 40.0, 28.0, 24.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.426513671875, -0.4127540588378906, -0.39899444580078125, -0.3852348327636719, -0.3714752197265625, -0.3577156066894531, -0.34395599365234375, -0.3301963806152344, -0.316436767578125, -0.3026771545410156, -0.28891754150390625, -0.2751579284667969, -0.2613983154296875, -0.24763870239257812, -0.23387908935546875, -0.22011947631835938, -0.20635986328125, -0.19260025024414062, -0.17884063720703125, -0.16508102416992188, -0.1513214111328125, -0.13756179809570312, -0.12380218505859375, -0.11004257202148438, -0.096282958984375, -0.08252334594726562, -0.06876373291015625, -0.055004119873046875, -0.0412445068359375, -0.027484893798828125, -0.01372528076171875, 3.4332275390625e-05, 0.0137939453125, 0.027553558349609375, 0.04131317138671875, 0.055072784423828125, 0.0688323974609375, 0.08259201049804688, 0.09635162353515625, 0.11011123657226562, 0.123870849609375, 0.13763046264648438, 0.15139007568359375, 0.16514968872070312, 0.1789093017578125, 0.19266891479492188, 0.20642852783203125, 0.22018814086914062, 0.23394775390625, 0.24770736694335938, 0.26146697998046875, 0.2752265930175781, 0.2889862060546875, 0.3027458190917969, 0.31650543212890625, 0.3302650451660156, 0.344024658203125, 0.3577842712402344, 0.37154388427734375, 0.3853034973144531, 0.3990631103515625, 0.4128227233886719, 0.42658233642578125, 0.4403419494628906, 0.4541015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 22.0, 34.0, 157.0, 353.0, 299.0, 110.0, 22.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.736228942871094, -27.10340690612793, -26.470584869384766, -25.83776092529297, -25.204938888549805, -24.57211685180664, -23.939294815063477, -23.306472778320312, -22.67365074157715, -22.040828704833984, -21.40800666809082, -20.775184631347656, -20.14236068725586, -19.509538650512695, -18.87671661376953, -18.243894577026367, -17.611072540283203, -16.97825050354004, -16.345428466796875, -15.712605476379395, -15.07978343963623, -14.44696044921875, -13.814138412475586, -13.181316375732422, -12.548492431640625, -11.915670394897461, -11.28284740447998, -10.650025367736816, -10.017203330993652, -9.384380340576172, -8.751558303833008, -8.118736267089844, -7.48591423034668, -6.853091716766357, -6.220269680023193, -5.587447166442871, -4.954625129699707, -4.321802616119385, -3.6889801025390625, -3.0561580657958984, -2.423335552215576, -1.790513277053833, -1.1576908826828003, -0.5248684883117676, 0.10795378684997559, 0.7407760620117188, 1.373598575592041, 2.006420612335205, 2.6392431259155273, 3.2720654010772705, 3.9048876762390137, 4.537710189819336, 5.1705322265625, 5.803354740142822, 6.4361772537231445, 7.068999290466309, 7.701821804046631, 8.334644317626953, 8.967466354370117, 9.600288391113281, 10.233111381530762, 10.865933418273926, 11.498756408691406, 12.13157844543457, 12.764400482177734]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 7.0, 9.0, 13.0, 10.0, 15.0, 15.0, 21.0, 20.0, 25.0, 23.0, 32.0, 40.0, 21.0, 39.0, 48.0, 56.0, 46.0, 55.0, 38.0, 45.0, 38.0, 47.0, 45.0, 37.0, 47.0, 26.0, 25.0, 23.0, 19.0, 23.0, 10.0, 11.0, 12.0, 8.0, 13.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.246608734130859, -5.0803542137146, -4.914100170135498, -4.747845649719238, -4.581591606140137, -4.415337085723877, -4.249083042144775, -4.082828521728516, -3.916574478149414, -3.7503201961517334, -3.5840659141540527, -3.417811632156372, -3.2515573501586914, -3.0853030681610107, -2.91904878616333, -2.7527942657470703, -2.5865399837493896, -2.420285701751709, -2.2540314197540283, -2.0877771377563477, -1.921522855758667, -1.7552685737609863, -1.5890141725540161, -1.4227598905563354, -1.2565056085586548, -1.0902513265609741, -0.9239970445632935, -0.757742702960968, -0.5914884209632874, -0.4252341389656067, -0.25897979736328125, -0.09272551536560059, 0.07352876663208008, 0.23978306353092194, 0.4060373604297638, 0.5722916722297668, 0.7385459542274475, 0.9048002362251282, 1.0710545778274536, 1.2373088598251343, 1.403563141822815, 1.5698174238204956, 1.7360717058181763, 1.9023261070251465, 2.068580389022827, 2.234834671020508, 2.4010889530181885, 2.567343235015869, 2.73359751701355, 2.8998517990112305, 3.066106081008911, 3.232360363006592, 3.3986146450042725, 3.564868927001953, 3.731123447418213, 3.8973774909973145, 4.063632011413574, 4.229886531829834, 4.3961405754089355, 4.562395095825195, 4.728649139404297, 4.894903659820557, 5.061157703399658, 5.227412223815918, 5.3936662673950195]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 20.0, 24.0, 32.0, 36.0, 54.0, 83.0, 118.0, 172.0, 266.0, 470.0, 803.0, 1684.0, 4405.0, 17388.0, 228431.0, 3874682.0, 51682.0, 8546.0, 2766.0, 1159.0, 554.0, 311.0, 162.0, 137.0, 78.0, 58.0, 37.0, 29.0, 13.0, 10.0, 17.0, 5.0, 10.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.876953125, -2.79974365234375, -2.7225341796875, -2.64532470703125, -2.568115234375, -2.49090576171875, -2.4136962890625, -2.33648681640625, -2.25927734375, -2.18206787109375, -2.1048583984375, -2.02764892578125, -1.950439453125, -1.87322998046875, -1.7960205078125, -1.71881103515625, -1.6416015625, -1.56439208984375, -1.4871826171875, -1.40997314453125, -1.332763671875, -1.25555419921875, -1.1783447265625, -1.10113525390625, -1.02392578125, -0.94671630859375, -0.8695068359375, -0.79229736328125, -0.715087890625, -0.63787841796875, -0.5606689453125, -0.48345947265625, -0.40625, -0.32904052734375, -0.2518310546875, -0.17462158203125, -0.097412109375, -0.02020263671875, 0.0570068359375, 0.13421630859375, 0.21142578125, 0.28863525390625, 0.3658447265625, 0.44305419921875, 0.520263671875, 0.59747314453125, 0.6746826171875, 0.75189208984375, 0.8291015625, 0.90631103515625, 0.9835205078125, 1.06072998046875, 1.137939453125, 1.21514892578125, 1.2923583984375, 1.36956787109375, 1.44677734375, 1.52398681640625, 1.6011962890625, 1.67840576171875, 1.755615234375, 1.83282470703125, 1.9100341796875, 1.98724365234375, 2.064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 20.0, 37.0, 52.0, 82.0, 100.0, 98.0, 144.0, 94.0, 94.0, 91.0, 55.0, 38.0, 27.0, 17.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6387786865234375, -0.617889404296875, -0.5970001220703125, -0.57611083984375, -0.5552215576171875, -0.534332275390625, -0.5134429931640625, -0.4925537109375, -0.4716644287109375, -0.450775146484375, -0.4298858642578125, -0.40899658203125, -0.3881072998046875, -0.367218017578125, -0.3463287353515625, -0.325439453125, -0.3045501708984375, -0.283660888671875, -0.2627716064453125, -0.24188232421875, -0.2209930419921875, -0.200103759765625, -0.1792144775390625, -0.1583251953125, -0.1374359130859375, -0.116546630859375, -0.0956573486328125, -0.07476806640625, -0.0538787841796875, -0.032989501953125, -0.0121002197265625, 0.0087890625, 0.0296783447265625, 0.050567626953125, 0.0714569091796875, 0.09234619140625, 0.1132354736328125, 0.134124755859375, 0.1550140380859375, 0.1759033203125, 0.1967926025390625, 0.217681884765625, 0.2385711669921875, 0.25946044921875, 0.2803497314453125, 0.301239013671875, 0.3221282958984375, 0.343017578125, 0.3639068603515625, 0.384796142578125, 0.4056854248046875, 0.42657470703125, 0.4474639892578125, 0.468353271484375, 0.4892425537109375, 0.5101318359375, 0.5310211181640625, 0.551910400390625, 0.5727996826171875, 0.59368896484375, 0.6145782470703125, 0.635467529296875, 0.6563568115234375, 0.67724609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 9.0, 8.0, 17.0, 11.0, 27.0, 33.0, 62.0, 90.0, 108.0, 146.0, 257.0, 566.0, 1191.0, 2939.0, 9417.0, 46859.0, 3058069.0, 1022895.0, 38110.0, 8431.0, 2663.0, 1062.0, 533.0, 290.0, 156.0, 97.0, 71.0, 44.0, 32.0, 23.0, 15.0, 3.0, 9.0, 10.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.34375, -2.2835693359375, -2.223388671875, -2.1632080078125, -2.10302734375, -2.0428466796875, -1.982666015625, -1.9224853515625, -1.8623046875, -1.8021240234375, -1.741943359375, -1.6817626953125, -1.62158203125, -1.5614013671875, -1.501220703125, -1.4410400390625, -1.380859375, -1.3206787109375, -1.260498046875, -1.2003173828125, -1.14013671875, -1.0799560546875, -1.019775390625, -0.9595947265625, -0.8994140625, -0.8392333984375, -0.779052734375, -0.7188720703125, -0.65869140625, -0.5985107421875, -0.538330078125, -0.4781494140625, -0.41796875, -0.3577880859375, -0.297607421875, -0.2374267578125, -0.17724609375, -0.1170654296875, -0.056884765625, 0.0032958984375, 0.0634765625, 0.1236572265625, 0.183837890625, 0.2440185546875, 0.30419921875, 0.3643798828125, 0.424560546875, 0.4847412109375, 0.544921875, 0.6051025390625, 0.665283203125, 0.7254638671875, 0.78564453125, 0.8458251953125, 0.906005859375, 0.9661865234375, 1.0263671875, 1.0865478515625, 1.146728515625, 1.2069091796875, 1.26708984375, 1.3272705078125, 1.387451171875, 1.4476318359375, 1.5078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 13.0, 7.0, 29.0, 51.0, 106.0, 353.0, 2512.0, 699.0, 141.0, 69.0, 32.0, 21.0, 16.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2874984741210938, -1.2566375732421875, -1.2257766723632812, -1.194915771484375, -1.1640548706054688, -1.1331939697265625, -1.1023330688476562, -1.07147216796875, -1.0406112670898438, -1.0097503662109375, -0.9788894653320312, -0.948028564453125, -0.9171676635742188, -0.8863067626953125, -0.8554458618164062, -0.8245849609375, -0.7937240600585938, -0.7628631591796875, -0.7320022583007812, -0.701141357421875, -0.6702804565429688, -0.6394195556640625, -0.6085586547851562, -0.57769775390625, -0.5468368530273438, -0.5159759521484375, -0.48511505126953125, -0.454254150390625, -0.42339324951171875, -0.3925323486328125, -0.36167144775390625, -0.330810546875, -0.29994964599609375, -0.2690887451171875, -0.23822784423828125, -0.207366943359375, -0.17650604248046875, -0.1456451416015625, -0.11478424072265625, -0.08392333984375, -0.05306243896484375, -0.0222015380859375, 0.00865936279296875, 0.039520263671875, 0.07038116455078125, 0.1012420654296875, 0.13210296630859375, 0.1629638671875, 0.19382476806640625, 0.2246856689453125, 0.25554656982421875, 0.286407470703125, 0.31726837158203125, 0.3481292724609375, 0.37899017333984375, 0.40985107421875, 0.44071197509765625, 0.4715728759765625, 0.5024337768554688, 0.533294677734375, 0.5641555786132812, 0.5950164794921875, 0.6258773803710938, 0.65673828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 3.0, 10.0, 21.0, 30.0, 70.0, 102.0, 160.0, 212.0, 165.0, 108.0, 55.0, 29.0, 15.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6022846698760986, -3.4805939197540283, -3.358903169631958, -3.2372124195098877, -3.1155216693878174, -2.993830919265747, -2.872140407562256, -2.7504496574401855, -2.6287589073181152, -2.507068157196045, -2.3853774070739746, -2.2636866569519043, -2.141995906829834, -2.0203051567077637, -1.898614525794983, -1.7769237756729126, -1.6552329063415527, -1.5335421562194824, -1.411851406097412, -1.2901606559753418, -1.1684699058532715, -1.0467791557312012, -0.9250885248184204, -0.8033977746963501, -0.6817070245742798, -0.5600162744522095, -0.43832555413246155, -0.3166348338127136, -0.1949440836906433, -0.073253333568573, 0.04843735694885254, 0.17012810707092285, 0.29181909561157227, 0.4135098457336426, 0.5352005958557129, 0.6568912863731384, 0.7785820364952087, 0.900272786617279, 1.0219634771347046, 1.143654227256775, 1.2653449773788452, 1.3870357275009155, 1.5087264776229858, 1.6304171085357666, 1.752107858657837, 1.8737986087799072, 1.9954893589019775, 2.117180109024048, 2.238870859146118, 2.3605616092681885, 2.482252359390259, 2.603943109512329, 2.7256338596343994, 2.8473246097564697, 2.969015121459961, 3.0907058715820312, 3.2123966217041016, 3.334087371826172, 3.455778121948242, 3.5774688720703125, 3.699159622192383, 3.820850372314453, 3.9425411224365234, 4.064231872558594, 4.185922622680664]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 13.0, 18.0, 14.0, 27.0, 42.0, 27.0, 52.0, 55.0, 53.0, 54.0, 68.0, 69.0, 73.0, 58.0, 76.0, 50.0, 49.0, 40.0, 37.0, 33.0, 15.0, 18.0, 13.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4217028617858887, -2.3500778675079346, -2.2784526348114014, -2.2068276405334473, -2.135202646255493, -2.063577651977539, -1.9919524192810059, -1.9203274250030518, -1.848702311515808, -1.7770771980285645, -1.7054522037506104, -1.6338270902633667, -1.562201976776123, -1.490576982498169, -1.4189518690109253, -1.3473267555236816, -1.2757017612457275, -1.2040766477584839, -1.1324516534805298, -1.0608265399932861, -0.9892014861106873, -0.9175764322280884, -0.8459513187408447, -0.7743262648582458, -0.702701210975647, -0.6310761570930481, -0.5594511032104492, -0.48782598972320557, -0.4162009358406067, -0.3445758819580078, -0.27295079827308655, -0.20132571458816528, -0.1297008991241455, -0.05807583034038544, 0.013549238443374634, 0.0851743072271347, 0.15679937601089478, 0.22842442989349365, 0.3000495135784149, 0.3716745972633362, 0.44329965114593506, 0.5149247050285339, 0.5865497589111328, 0.6581748723983765, 0.7297999262809753, 0.8014249801635742, 0.8730500936508179, 0.9446751475334167, 1.0163002014160156, 1.0879253149032593, 1.1595503091812134, 1.231175422668457, 1.3028004169464111, 1.3744255304336548, 1.4460506439208984, 1.5176756381988525, 1.5893007516860962, 1.6609258651733398, 1.732550859451294, 1.8041759729385376, 1.8758010864257812, 1.9474260807037354, 2.0190510749816895, 2.0906763076782227, 2.1623013019561768]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 15.0, 27.0, 64.0, 109.0, 203.0, 468.0, 961.0, 2392.0, 9452.0, 153239.0, 830390.0, 43063.0, 5102.0, 1638.0, 729.0, 337.0, 157.0, 102.0, 29.0, 31.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.390625, -4.26971435546875, -4.1488037109375, -4.02789306640625, -3.906982421875, -3.78607177734375, -3.6651611328125, -3.54425048828125, -3.42333984375, -3.30242919921875, -3.1815185546875, -3.06060791015625, -2.939697265625, -2.81878662109375, -2.6978759765625, -2.57696533203125, -2.4560546875, -2.33514404296875, -2.2142333984375, -2.09332275390625, -1.972412109375, -1.85150146484375, -1.7305908203125, -1.60968017578125, -1.48876953125, -1.36785888671875, -1.2469482421875, -1.12603759765625, -1.005126953125, -0.88421630859375, -0.7633056640625, -0.64239501953125, -0.521484375, -0.40057373046875, -0.2796630859375, -0.15875244140625, -0.037841796875, 0.08306884765625, 0.2039794921875, 0.32489013671875, 0.44580078125, 0.56671142578125, 0.6876220703125, 0.80853271484375, 0.929443359375, 1.05035400390625, 1.1712646484375, 1.29217529296875, 1.4130859375, 1.53399658203125, 1.6549072265625, 1.77581787109375, 1.896728515625, 2.01763916015625, 2.1385498046875, 2.25946044921875, 2.38037109375, 2.50128173828125, 2.6221923828125, 2.74310302734375, 2.864013671875, 2.98492431640625, 3.1058349609375, 3.22674560546875, 3.34765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 16.0, 21.0, 31.0, 70.0, 84.0, 109.0, 113.0, 135.0, 118.0, 86.0, 65.0, 52.0, 45.0, 16.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6797256469726562, -0.6573028564453125, -0.6348800659179688, -0.612457275390625, -0.5900344848632812, -0.5676116943359375, -0.5451889038085938, -0.52276611328125, -0.5003433227539062, -0.4779205322265625, -0.45549774169921875, -0.433074951171875, -0.41065216064453125, -0.3882293701171875, -0.36580657958984375, -0.3433837890625, -0.32096099853515625, -0.2985382080078125, -0.27611541748046875, -0.253692626953125, -0.23126983642578125, -0.2088470458984375, -0.18642425537109375, -0.16400146484375, -0.14157867431640625, -0.1191558837890625, -0.09673309326171875, -0.074310302734375, -0.05188751220703125, -0.0294647216796875, -0.00704193115234375, 0.015380859375, 0.03780364990234375, 0.0602264404296875, 0.08264923095703125, 0.105072021484375, 0.12749481201171875, 0.1499176025390625, 0.17234039306640625, 0.19476318359375, 0.21718597412109375, 0.2396087646484375, 0.26203155517578125, 0.284454345703125, 0.30687713623046875, 0.3292999267578125, 0.35172271728515625, 0.3741455078125, 0.39656829833984375, 0.4189910888671875, 0.44141387939453125, 0.463836669921875, 0.48625946044921875, 0.5086822509765625, 0.5311050415039062, 0.55352783203125, 0.5759506225585938, 0.5983734130859375, 0.6207962036132812, 0.643218994140625, 0.6656417846679688, 0.6880645751953125, 0.7104873657226562, 0.73291015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 7.0, 3.0, 11.0, 17.0, 19.0, 21.0, 16.0, 33.0, 36.0, 65.0, 90.0, 92.0, 141.0, 225.0, 404.0, 670.0, 1503.0, 3169.0, 7527.0, 21030.0, 60498.0, 174017.0, 392050.0, 248701.0, 88130.0, 30667.0, 11111.0, 4252.0, 1885.0, 812.0, 493.0, 254.0, 153.0, 114.0, 70.0, 60.0, 55.0, 31.0, 24.0, 24.0, 21.0, 16.0, 8.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.912109375, -0.8865432739257812, -0.8609771728515625, -0.8354110717773438, -0.809844970703125, -0.7842788696289062, -0.7587127685546875, -0.7331466674804688, -0.70758056640625, -0.6820144653320312, -0.6564483642578125, -0.6308822631835938, -0.605316162109375, -0.5797500610351562, -0.5541839599609375, -0.5286178588867188, -0.5030517578125, -0.47748565673828125, -0.4519195556640625, -0.42635345458984375, -0.400787353515625, -0.37522125244140625, -0.3496551513671875, -0.32408905029296875, -0.29852294921875, -0.27295684814453125, -0.2473907470703125, -0.22182464599609375, -0.196258544921875, -0.17069244384765625, -0.1451263427734375, -0.11956024169921875, -0.093994140625, -0.06842803955078125, -0.0428619384765625, -0.01729583740234375, 0.008270263671875, 0.03383636474609375, 0.0594024658203125, 0.08496856689453125, 0.11053466796875, 0.13610076904296875, 0.1616668701171875, 0.18723297119140625, 0.212799072265625, 0.23836517333984375, 0.2639312744140625, 0.28949737548828125, 0.3150634765625, 0.34062957763671875, 0.3661956787109375, 0.39176177978515625, 0.417327880859375, 0.44289398193359375, 0.4684600830078125, 0.49402618408203125, 0.51959228515625, 0.5451583862304688, 0.5707244873046875, 0.5962905883789062, 0.621856689453125, 0.6474227905273438, 0.6729888916015625, 0.6985549926757812, 0.72412109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 8.0, 12.0, 16.0, 14.0, 19.0, 18.0, 18.0, 36.0, 38.0, 35.0, 43.0, 30.0, 38.0, 36.0, 41.0, 50.0, 41.0, 35.0, 45.0, 43.0, 45.0, 34.0, 37.0, 21.0, 30.0, 26.0, 32.0, 21.0, 16.0, 19.0, 10.0, 18.0, 7.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.9775390625, -0.9475173950195312, -0.9174957275390625, -0.8874740600585938, -0.857452392578125, -0.8274307250976562, -0.7974090576171875, -0.7673873901367188, -0.73736572265625, -0.7073440551757812, -0.6773223876953125, -0.6473007202148438, -0.617279052734375, -0.5872573852539062, -0.5572357177734375, -0.5272140502929688, -0.4971923828125, -0.46717071533203125, -0.4371490478515625, -0.40712738037109375, -0.377105712890625, -0.34708404541015625, -0.3170623779296875, -0.28704071044921875, -0.25701904296875, -0.22699737548828125, -0.1969757080078125, -0.16695404052734375, -0.136932373046875, -0.10691070556640625, -0.0768890380859375, -0.04686737060546875, -0.016845703125, 0.01317596435546875, 0.0431976318359375, 0.07321929931640625, 0.103240966796875, 0.13326263427734375, 0.1632843017578125, 0.19330596923828125, 0.22332763671875, 0.25334930419921875, 0.2833709716796875, 0.31339263916015625, 0.343414306640625, 0.37343597412109375, 0.4034576416015625, 0.43347930908203125, 0.4635009765625, 0.49352264404296875, 0.5235443115234375, 0.5535659790039062, 0.583587646484375, 0.6136093139648438, 0.6436309814453125, 0.6736526489257812, 0.70367431640625, 0.7336959838867188, 0.7637176513671875, 0.7937393188476562, 0.823760986328125, 0.8537826538085938, 0.8838043212890625, 0.9138259887695312, 0.94384765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 17.0, 19.0, 31.0, 33.0, 64.0, 84.0, 126.0, 181.0, 267.0, 475.0, 839.0, 1862.0, 5082.0, 18995.0, 104653.0, 486940.0, 347572.0, 61980.0, 12310.0, 3619.0, 1535.0, 683.0, 415.0, 259.0, 142.0, 101.0, 64.0, 51.0, 38.0, 18.0, 23.0, 13.0, 10.0, 4.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390869140625, -0.3773231506347656, -0.36377716064453125, -0.3502311706542969, -0.3366851806640625, -0.3231391906738281, -0.30959320068359375, -0.2960472106933594, -0.282501220703125, -0.2689552307128906, -0.25540924072265625, -0.24186325073242188, -0.2283172607421875, -0.21477127075195312, -0.20122528076171875, -0.18767929077148438, -0.17413330078125, -0.16058731079101562, -0.14704132080078125, -0.13349533081054688, -0.1199493408203125, -0.10640335083007812, -0.09285736083984375, -0.07931137084960938, -0.065765380859375, -0.052219390869140625, -0.03867340087890625, -0.025127410888671875, -0.0115814208984375, 0.001964569091796875, 0.01551055908203125, 0.029056549072265625, 0.0426025390625, 0.056148529052734375, 0.06969451904296875, 0.08324050903320312, 0.0967864990234375, 0.11033248901367188, 0.12387847900390625, 0.13742446899414062, 0.150970458984375, 0.16451644897460938, 0.17806243896484375, 0.19160842895507812, 0.2051544189453125, 0.21870040893554688, 0.23224639892578125, 0.24579238891601562, 0.25933837890625, 0.2728843688964844, 0.28643035888671875, 0.2999763488769531, 0.3135223388671875, 0.3270683288574219, 0.34061431884765625, 0.3541603088378906, 0.367706298828125, 0.3812522888183594, 0.39479827880859375, 0.4083442687988281, 0.4218902587890625, 0.4354362487792969, 0.44898223876953125, 0.4625282287597656, 0.47607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 12.0, 15.0, 23.0, 19.0, 22.0, 53.0, 42.0, 56.0, 77.0, 97.0, 83.0, 93.0, 80.0, 69.0, 60.0, 49.0, 35.0, 26.0, 15.0, 16.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.367134094238281e-05, -7.12154433131218e-05, -6.875954568386078e-05, -6.630364805459976e-05, -6.384775042533875e-05, -6.139185279607773e-05, -5.893595516681671e-05, -5.6480057537555695e-05, -5.402415990829468e-05, -5.156826227903366e-05, -4.9112364649772644e-05, -4.665646702051163e-05, -4.420056939125061e-05, -4.1744671761989594e-05, -3.928877413272858e-05, -3.683287650346756e-05, -3.437697887420654e-05, -3.1921081244945526e-05, -2.946518361568451e-05, -2.7009285986423492e-05, -2.4553388357162476e-05, -2.209749072790146e-05, -1.9641593098640442e-05, -1.7185695469379425e-05, -1.4729797840118408e-05, -1.2273900210857391e-05, -9.818002581596375e-06, -7.362104952335358e-06, -4.906207323074341e-06, -2.450309693813324e-06, 5.587935447692871e-09, 2.4614855647087097e-06, 4.9173831939697266e-06, 7.373280823230743e-06, 9.82917845249176e-06, 1.2285076081752777e-05, 1.4740973711013794e-05, 1.719687134027481e-05, 1.9652768969535828e-05, 2.2108666598796844e-05, 2.456456422805786e-05, 2.7020461857318878e-05, 2.9476359486579895e-05, 3.193225711584091e-05, 3.438815474510193e-05, 3.6844052374362946e-05, 3.929995000362396e-05, 4.175584763288498e-05, 4.4211745262145996e-05, 4.666764289140701e-05, 4.912354052066803e-05, 5.157943814992905e-05, 5.4035335779190063e-05, 5.649123340845108e-05, 5.89471310377121e-05, 6.140302866697311e-05, 6.385892629623413e-05, 6.631482392549515e-05, 6.877072155475616e-05, 7.122661918401718e-05, 7.36825168132782e-05, 7.613841444253922e-05, 7.859431207180023e-05, 8.105020970106125e-05, 8.350610733032227e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 17.0, 26.0, 51.0, 74.0, 108.0, 206.0, 422.0, 885.0, 2104.0, 6383.0, 31648.0, 257637.0, 625006.0, 102358.0, 14954.0, 3862.0, 1447.0, 640.0, 296.0, 156.0, 96.0, 57.0, 30.0, 23.0, 10.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4482421875, -0.43181610107421875, -0.4153900146484375, -0.39896392822265625, -0.382537841796875, -0.36611175537109375, -0.3496856689453125, -0.33325958251953125, -0.31683349609375, -0.30040740966796875, -0.2839813232421875, -0.26755523681640625, -0.251129150390625, -0.23470306396484375, -0.2182769775390625, -0.20185089111328125, -0.1854248046875, -0.16899871826171875, -0.1525726318359375, -0.13614654541015625, -0.119720458984375, -0.10329437255859375, -0.0868682861328125, -0.07044219970703125, -0.05401611328125, -0.03759002685546875, -0.0211639404296875, -0.00473785400390625, 0.011688232421875, 0.02811431884765625, 0.0445404052734375, 0.06096649169921875, 0.077392578125, 0.09381866455078125, 0.1102447509765625, 0.12667083740234375, 0.143096923828125, 0.15952301025390625, 0.1759490966796875, 0.19237518310546875, 0.20880126953125, 0.22522735595703125, 0.2416534423828125, 0.25807952880859375, 0.274505615234375, 0.29093170166015625, 0.3073577880859375, 0.32378387451171875, 0.3402099609375, 0.35663604736328125, 0.3730621337890625, 0.38948822021484375, 0.405914306640625, 0.42234039306640625, 0.4387664794921875, 0.45519256591796875, 0.47161865234375, 0.48804473876953125, 0.5044708251953125, 0.5208969116210938, 0.537322998046875, 0.5537490844726562, 0.5701751708984375, 0.5866012573242188, 0.60302734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 17.0, 14.0, 22.0, 27.0, 29.0, 41.0, 45.0, 56.0, 81.0, 84.0, 75.0, 87.0, 80.0, 80.0, 52.0, 48.0, 34.0, 23.0, 23.0, 15.0, 17.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37548828125, -0.36331939697265625, -0.3511505126953125, -0.33898162841796875, -0.326812744140625, -0.31464385986328125, -0.3024749755859375, -0.29030609130859375, -0.27813720703125, -0.26596832275390625, -0.2537994384765625, -0.24163055419921875, -0.229461669921875, -0.21729278564453125, -0.2051239013671875, -0.19295501708984375, -0.1807861328125, -0.16861724853515625, -0.1564483642578125, -0.14427947998046875, -0.132110595703125, -0.11994171142578125, -0.1077728271484375, -0.09560394287109375, -0.08343505859375, -0.07126617431640625, -0.0590972900390625, -0.04692840576171875, -0.034759521484375, -0.02259063720703125, -0.0104217529296875, 0.00174713134765625, 0.013916015625, 0.02608489990234375, 0.0382537841796875, 0.05042266845703125, 0.062591552734375, 0.07476043701171875, 0.0869293212890625, 0.09909820556640625, 0.11126708984375, 0.12343597412109375, 0.1356048583984375, 0.14777374267578125, 0.159942626953125, 0.17211151123046875, 0.1842803955078125, 0.19644927978515625, 0.2086181640625, 0.22078704833984375, 0.2329559326171875, 0.24512481689453125, 0.257293701171875, 0.26946258544921875, 0.2816314697265625, 0.29380035400390625, 0.30596923828125, 0.31813812255859375, 0.3303070068359375, 0.34247589111328125, 0.354644775390625, 0.36681365966796875, 0.3789825439453125, 0.39115142822265625, 0.4033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 14.0, 13.0, 15.0, 31.0, 33.0, 51.0, 51.0, 92.0, 105.0, 117.0, 94.0, 97.0, 81.0, 67.0, 46.0, 35.0, 28.0, 11.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.698837280273438, -8.522096633911133, -8.345356941223145, -8.16861629486084, -7.991876602172852, -7.815136432647705, -7.638396263122559, -7.461655616760254, -7.284915924072266, -7.108175754547119, -6.931435585021973, -6.754695415496826, -6.57795524597168, -6.401215076446533, -6.224474906921387, -6.047734260559082, -5.8709940910339355, -5.694253921508789, -5.517513751983643, -5.340773582458496, -5.16403341293335, -4.987293243408203, -4.810552597045898, -4.63381290435791, -4.4570722579956055, -4.280332088470459, -4.1035919189453125, -3.926851749420166, -3.7501115798950195, -3.573371410369873, -3.3966310024261475, -3.219890832901001, -3.0431504249572754, -2.866410255432129, -2.6896700859069824, -2.512929916381836, -2.3361897468566895, -2.159449577331543, -1.9827091693878174, -1.805968999862671, -1.6292288303375244, -1.452488660812378, -1.2757484912872314, -1.0990082025527954, -0.9222680330276489, -0.7455278635025024, -0.5687875747680664, -0.3920474052429199, -0.21530723571777344, -0.038567036390304565, 0.1381731629371643, 0.31491339206695557, 0.49165356159210205, 0.6683937311172485, 0.8451340198516846, 1.021874189376831, 1.1986143589019775, 1.375354528427124, 1.5520946979522705, 1.7288349866867065, 1.905575156211853, 2.082315444946289, 2.2590556144714355, 2.435795783996582, 2.6125359535217285]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 16.0, 12.0, 13.0, 24.0, 26.0, 16.0, 23.0, 38.0, 24.0, 30.0, 42.0, 32.0, 48.0, 41.0, 45.0, 56.0, 49.0, 44.0, 34.0, 44.0, 37.0, 42.0, 36.0, 30.0, 21.0, 21.0, 25.0, 18.0, 15.0, 10.0, 15.0, 15.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.717818260192871, -5.5656938552856445, -5.413569450378418, -5.261444568634033, -5.109320163726807, -4.95719575881958, -4.805070877075195, -4.652946472167969, -4.500822067260742, -4.348697662353516, -4.196573257446289, -4.044448375701904, -3.8923239707946777, -3.740199565887451, -3.5880749225616455, -3.43595027923584, -3.2838258743286133, -3.1317014694213867, -2.979576826095581, -2.8274521827697754, -2.675327777862549, -2.5232033729553223, -2.3710787296295166, -2.218954086303711, -2.0668296813964844, -1.9147051572799683, -1.7625806331634521, -1.610456109046936, -1.45833158493042, -1.3062070608139038, -1.1540825366973877, -1.0019580125808716, -0.8498339653015137, -0.6977094411849976, -0.5455849170684814, -0.39346039295196533, -0.24133586883544922, -0.0892113447189331, 0.06291317939758301, 0.21503770351409912, 0.36716222763061523, 0.5192867517471313, 0.6714112758636475, 0.8235357999801636, 0.9756603240966797, 1.1277848482131958, 1.279909372329712, 1.432033896446228, 1.5841584205627441, 1.7362829446792603, 1.8884074687957764, 2.040532112121582, 2.1926565170288086, 2.344780921936035, 2.496905565261841, 2.6490302085876465, 2.801154613494873, 2.9532790184020996, 3.1054036617279053, 3.257528305053711, 3.4096527099609375, 3.561777114868164, 3.7139017581939697, 3.8660264015197754, 4.018150806427002]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 22.0, 19.0, 27.0, 42.0, 71.0, 122.0, 173.0, 309.0, 662.0, 1754.0, 6957.0, 82158.0, 4066714.0, 28721.0, 4225.0, 1191.0, 485.0, 238.0, 130.0, 85.0, 52.0, 29.0, 17.0, 14.0, 8.0, 12.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46875, -5.3046875, -5.140625, -4.9765625, -4.8125, -4.6484375, -4.484375, -4.3203125, -4.15625, -3.9921875, -3.828125, -3.6640625, -3.5, -3.3359375, -3.171875, -3.0078125, -2.84375, -2.6796875, -2.515625, -2.3515625, -2.1875, -2.0234375, -1.859375, -1.6953125, -1.53125, -1.3671875, -1.203125, -1.0390625, -0.875, -0.7109375, -0.546875, -0.3828125, -0.21875, -0.0546875, 0.109375, 0.2734375, 0.4375, 0.6015625, 0.765625, 0.9296875, 1.09375, 1.2578125, 1.421875, 1.5859375, 1.75, 1.9140625, 2.078125, 2.2421875, 2.40625, 2.5703125, 2.734375, 2.8984375, 3.0625, 3.2265625, 3.390625, 3.5546875, 3.71875, 3.8828125, 4.046875, 4.2109375, 4.375, 4.5390625, 4.703125, 4.8671875, 5.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 15.0, 24.0, 37.0, 60.0, 81.0, 117.0, 118.0, 120.0, 96.0, 89.0, 65.0, 66.0, 28.0, 30.0, 10.0, 13.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7012786865234375, -0.678924560546875, -0.6565704345703125, -0.63421630859375, -0.6118621826171875, -0.589508056640625, -0.5671539306640625, -0.5447998046875, -0.5224456787109375, -0.500091552734375, -0.4777374267578125, -0.45538330078125, -0.4330291748046875, -0.410675048828125, -0.3883209228515625, -0.365966796875, -0.3436126708984375, -0.321258544921875, -0.2989044189453125, -0.27655029296875, -0.2541961669921875, -0.231842041015625, -0.2094879150390625, -0.1871337890625, -0.1647796630859375, -0.142425537109375, -0.1200714111328125, -0.09771728515625, -0.0753631591796875, -0.053009033203125, -0.0306549072265625, -0.00830078125, 0.0140533447265625, 0.036407470703125, 0.0587615966796875, 0.08111572265625, 0.1034698486328125, 0.125823974609375, 0.1481781005859375, 0.1705322265625, 0.1928863525390625, 0.215240478515625, 0.2375946044921875, 0.25994873046875, 0.2823028564453125, 0.304656982421875, 0.3270111083984375, 0.349365234375, 0.3717193603515625, 0.394073486328125, 0.4164276123046875, 0.43878173828125, 0.4611358642578125, 0.483489990234375, 0.5058441162109375, 0.5281982421875, 0.5505523681640625, 0.572906494140625, 0.5952606201171875, 0.61761474609375, 0.6399688720703125, 0.662322998046875, 0.6846771240234375, 0.70703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 13.0, 16.0, 12.0, 22.0, 35.0, 31.0, 47.0, 70.0, 105.0, 113.0, 198.0, 239.0, 377.0, 571.0, 820.0, 1418.0, 2434.0, 5533.0, 16340.0, 83085.0, 3706939.0, 324832.0, 33326.0, 8895.0, 3742.0, 1781.0, 1091.0, 661.0, 436.0, 305.0, 198.0, 156.0, 122.0, 83.0, 65.0, 42.0, 32.0, 27.0, 20.0, 15.0, 8.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8282318115234375, -1.768768310546875, -1.7093048095703125, -1.64984130859375, -1.5903778076171875, -1.530914306640625, -1.4714508056640625, -1.4119873046875, -1.3525238037109375, -1.293060302734375, -1.2335968017578125, -1.17413330078125, -1.1146697998046875, -1.055206298828125, -0.9957427978515625, -0.936279296875, -0.8768157958984375, -0.817352294921875, -0.7578887939453125, -0.69842529296875, -0.6389617919921875, -0.579498291015625, -0.5200347900390625, -0.4605712890625, -0.4011077880859375, -0.341644287109375, -0.2821807861328125, -0.22271728515625, -0.1632537841796875, -0.103790283203125, -0.0443267822265625, 0.01513671875, 0.0746002197265625, 0.134063720703125, 0.1935272216796875, 0.25299072265625, 0.3124542236328125, 0.371917724609375, 0.4313812255859375, 0.4908447265625, 0.5503082275390625, 0.609771728515625, 0.6692352294921875, 0.72869873046875, 0.7881622314453125, 0.847625732421875, 0.9070892333984375, 0.966552734375, 1.0260162353515625, 1.085479736328125, 1.1449432373046875, 1.20440673828125, 1.2638702392578125, 1.323333740234375, 1.3827972412109375, 1.4422607421875, 1.5017242431640625, 1.561187744140625, 1.6206512451171875, 1.68011474609375, 1.7395782470703125, 1.799041748046875, 1.8585052490234375, 1.91796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 59.0, 175.0, 2627.0, 889.0, 152.0, 53.0, 25.0, 15.0, 8.0, 2.0, 2.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.458984375, -1.4171600341796875, -1.375335693359375, -1.3335113525390625, -1.29168701171875, -1.2498626708984375, -1.208038330078125, -1.1662139892578125, -1.1243896484375, -1.0825653076171875, -1.040740966796875, -0.9989166259765625, -0.95709228515625, -0.9152679443359375, -0.873443603515625, -0.8316192626953125, -0.789794921875, -0.7479705810546875, -0.706146240234375, -0.6643218994140625, -0.62249755859375, -0.5806732177734375, -0.538848876953125, -0.4970245361328125, -0.4552001953125, -0.4133758544921875, -0.371551513671875, -0.3297271728515625, -0.28790283203125, -0.2460784912109375, -0.204254150390625, -0.1624298095703125, -0.12060546875, -0.0787811279296875, -0.036956787109375, 0.0048675537109375, 0.04669189453125, 0.0885162353515625, 0.130340576171875, 0.1721649169921875, 0.2139892578125, 0.2558135986328125, 0.297637939453125, 0.3394622802734375, 0.38128662109375, 0.4231109619140625, 0.464935302734375, 0.5067596435546875, 0.548583984375, 0.5904083251953125, 0.632232666015625, 0.6740570068359375, 0.71588134765625, 0.7577056884765625, 0.799530029296875, 0.8413543701171875, 0.8831787109375, 0.9250030517578125, 0.966827392578125, 1.0086517333984375, 1.05047607421875, 1.0923004150390625, 1.134124755859375, 1.1759490966796875, 1.2177734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 8.0, 25.0, 48.0, 128.0, 226.0, 237.0, 155.0, 91.0, 25.0, 22.0, 13.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4178354740142822, -3.2553305625915527, -3.092825412750244, -2.9303205013275146, -2.767815589904785, -2.6053104400634766, -2.442805528640747, -2.2803006172180176, -2.117795467376709, -1.95529043674469, -1.7927855253219604, -1.6302804946899414, -1.467775583267212, -1.3052705526351929, -1.1427655220031738, -0.9802606105804443, -0.8177556991577148, -0.6552507281303406, -0.4927457273006439, -0.33024072647094727, -0.167735755443573, -0.0052307844161987305, 0.1572742462158203, 0.3197791576385498, 0.48228418827056885, 0.6447891592979431, 0.8072941303253174, 0.9697991609573364, 1.1323041915893555, 1.294809103012085, 1.457314133644104, 1.6198190450668335, 1.7823243141174316, 1.9448293447494507, 2.1073343753814697, 2.269839286804199, 2.4323441982269287, 2.594849109649658, 2.757354259490967, 2.9198591709136963, 3.082364082336426, 3.2448689937591553, 3.407374143600464, 3.5698790550231934, 3.732383966445923, 3.8948888778686523, 4.057394027709961, 4.2198991775512695, 4.382404327392578, 4.544909477233887, 4.707414150238037, 4.869919300079346, 5.032424449920654, 5.194929122924805, 5.357434272766113, 5.519939422607422, 5.682444095611572, 5.844949245452881, 6.007453918457031, 6.16995906829834, 6.332464218139648, 6.494968891143799, 6.657474040985107, 6.819978713989258, 6.982483863830566]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 7.0, 34.0, 40.0, 43.0, 60.0, 63.0, 80.0, 75.0, 91.0, 77.0, 91.0, 90.0, 54.0, 43.0, 38.0, 27.0, 16.0, 12.0, 9.0, 10.0, 5.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9185948371887207, -3.8101539611816406, -3.7017130851745605, -3.5932722091674805, -3.4848310947418213, -3.376390218734741, -3.267949342727661, -3.159508466720581, -3.051067352294922, -2.942626476287842, -2.8341856002807617, -2.7257447242736816, -2.6173036098480225, -2.5088627338409424, -2.4004218578338623, -2.2919809818267822, -2.183540105819702, -2.075099229812622, -1.9666582345962524, -1.8582173585891724, -1.7497763633728027, -1.6413354873657227, -1.5328946113586426, -1.4244537353515625, -1.3160127401351929, -1.2075718641281128, -1.0991308689117432, -0.9906899929046631, -0.8822490572929382, -0.7738081216812134, -0.6653672456741333, -0.5569263100624084, -0.4484851360321045, -0.34004420042037964, -0.23160329461097717, -0.12316238880157471, -0.014721453189849854, 0.093719482421875, 0.20216035842895508, 0.31060129404067993, 0.4190422296524048, 0.5274831652641296, 0.6359241008758545, 0.7443649768829346, 0.8528059124946594, 0.9612468481063843, 1.0696877241134644, 1.178128719329834, 1.286569595336914, 1.3950104713439941, 1.5034514665603638, 1.6118923425674438, 1.7203333377838135, 1.8287742137908936, 1.9372150897979736, 2.0456559658050537, 2.154097080230713, 2.262537956237793, 2.370978832244873, 2.479419708251953, 2.5878608226776123, 2.6963016986846924, 2.8047425746917725, 2.9131834506988525, 3.0216243267059326]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 28.0, 48.0, 86.0, 173.0, 252.0, 495.0, 1006.0, 2052.0, 5512.0, 30889.0, 399416.0, 552925.0, 43886.0, 6976.0, 2405.0, 1074.0, 601.0, 287.0, 161.0, 89.0, 73.0, 36.0, 13.0, 9.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.103515625, -3.000335693359375, -2.89715576171875, -2.793975830078125, -2.6907958984375, -2.587615966796875, -2.48443603515625, -2.381256103515625, -2.278076171875, -2.174896240234375, -2.07171630859375, -1.968536376953125, -1.8653564453125, -1.762176513671875, -1.65899658203125, -1.555816650390625, -1.45263671875, -1.349456787109375, -1.24627685546875, -1.143096923828125, -1.0399169921875, -0.936737060546875, -0.83355712890625, -0.730377197265625, -0.627197265625, -0.524017333984375, -0.42083740234375, -0.317657470703125, -0.2144775390625, -0.111297607421875, -0.00811767578125, 0.095062255859375, 0.1982421875, 0.301422119140625, 0.40460205078125, 0.507781982421875, 0.6109619140625, 0.714141845703125, 0.81732177734375, 0.920501708984375, 1.023681640625, 1.126861572265625, 1.23004150390625, 1.333221435546875, 1.4364013671875, 1.539581298828125, 1.64276123046875, 1.745941162109375, 1.84912109375, 1.952301025390625, 2.05548095703125, 2.158660888671875, 2.2618408203125, 2.365020751953125, 2.46820068359375, 2.571380615234375, 2.674560546875, 2.777740478515625, 2.88092041015625, 2.984100341796875, 3.0872802734375, 3.190460205078125, 3.29364013671875, 3.396820068359375, 3.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 18.0, 53.0, 62.0, 94.0, 129.0, 111.0, 123.0, 84.0, 74.0, 73.0, 45.0, 46.0, 17.0, 15.0, 3.0, 9.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77978515625, -0.7555084228515625, -0.731231689453125, -0.7069549560546875, -0.68267822265625, -0.6584014892578125, -0.634124755859375, -0.6098480224609375, -0.5855712890625, -0.5612945556640625, -0.537017822265625, -0.5127410888671875, -0.48846435546875, -0.4641876220703125, -0.439910888671875, -0.4156341552734375, -0.391357421875, -0.3670806884765625, -0.342803955078125, -0.3185272216796875, -0.29425048828125, -0.2699737548828125, -0.245697021484375, -0.2214202880859375, -0.1971435546875, -0.1728668212890625, -0.148590087890625, -0.1243133544921875, -0.10003662109375, -0.0757598876953125, -0.051483154296875, -0.0272064208984375, -0.0029296875, 0.0213470458984375, 0.045623779296875, 0.0699005126953125, 0.09417724609375, 0.1184539794921875, 0.142730712890625, 0.1670074462890625, 0.1912841796875, 0.2155609130859375, 0.239837646484375, 0.2641143798828125, 0.28839111328125, 0.3126678466796875, 0.336944580078125, 0.3612213134765625, 0.385498046875, 0.4097747802734375, 0.434051513671875, 0.4583282470703125, 0.48260498046875, 0.5068817138671875, 0.531158447265625, 0.5554351806640625, 0.5797119140625, 0.6039886474609375, 0.628265380859375, 0.6525421142578125, 0.67681884765625, 0.7010955810546875, 0.725372314453125, 0.7496490478515625, 0.77392578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 18.0, 23.0, 37.0, 51.0, 72.0, 94.0, 164.0, 249.0, 436.0, 820.0, 1561.0, 3123.0, 7368.0, 18734.0, 56279.0, 181777.0, 408451.0, 248042.0, 78771.0, 25104.0, 9307.0, 3910.0, 1856.0, 913.0, 490.0, 327.0, 196.0, 117.0, 65.0, 60.0, 34.0, 25.0, 20.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.9598846435546875, -0.928558349609375, -0.8972320556640625, -0.86590576171875, -0.8345794677734375, -0.803253173828125, -0.7719268798828125, -0.7406005859375, -0.7092742919921875, -0.677947998046875, -0.6466217041015625, -0.61529541015625, -0.5839691162109375, -0.552642822265625, -0.5213165283203125, -0.489990234375, -0.4586639404296875, -0.427337646484375, -0.3960113525390625, -0.36468505859375, -0.3333587646484375, -0.302032470703125, -0.2707061767578125, -0.2393798828125, -0.2080535888671875, -0.176727294921875, -0.1454010009765625, -0.11407470703125, -0.0827484130859375, -0.051422119140625, -0.0200958251953125, 0.01123046875, 0.0425567626953125, 0.073883056640625, 0.1052093505859375, 0.13653564453125, 0.1678619384765625, 0.199188232421875, 0.2305145263671875, 0.2618408203125, 0.2931671142578125, 0.324493408203125, 0.3558197021484375, 0.38714599609375, 0.4184722900390625, 0.449798583984375, 0.4811248779296875, 0.512451171875, 0.5437774658203125, 0.575103759765625, 0.6064300537109375, 0.63775634765625, 0.6690826416015625, 0.700408935546875, 0.7317352294921875, 0.7630615234375, 0.7943878173828125, 0.825714111328125, 0.8570404052734375, 0.88836669921875, 0.9196929931640625, 0.951019287109375, 0.9823455810546875, 1.013671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 9.0, 9.0, 11.0, 9.0, 7.0, 17.0, 17.0, 17.0, 30.0, 36.0, 27.0, 28.0, 49.0, 54.0, 51.0, 63.0, 46.0, 63.0, 58.0, 47.0, 45.0, 49.0, 34.0, 35.0, 32.0, 33.0, 28.0, 16.0, 9.0, 15.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.42730712890625, -1.3800048828125, -1.33270263671875, -1.285400390625, -1.23809814453125, -1.1907958984375, -1.14349365234375, -1.09619140625, -1.04888916015625, -1.0015869140625, -0.95428466796875, -0.906982421875, -0.85968017578125, -0.8123779296875, -0.76507568359375, -0.7177734375, -0.67047119140625, -0.6231689453125, -0.57586669921875, -0.528564453125, -0.48126220703125, -0.4339599609375, -0.38665771484375, -0.33935546875, -0.29205322265625, -0.2447509765625, -0.19744873046875, -0.150146484375, -0.10284423828125, -0.0555419921875, -0.00823974609375, 0.0390625, 0.08636474609375, 0.1336669921875, 0.18096923828125, 0.228271484375, 0.27557373046875, 0.3228759765625, 0.37017822265625, 0.41748046875, 0.46478271484375, 0.5120849609375, 0.55938720703125, 0.606689453125, 0.65399169921875, 0.7012939453125, 0.74859619140625, 0.7958984375, 0.84320068359375, 0.8905029296875, 0.93780517578125, 0.985107421875, 1.03240966796875, 1.0797119140625, 1.12701416015625, 1.17431640625, 1.22161865234375, 1.2689208984375, 1.31622314453125, 1.363525390625, 1.41082763671875, 1.4581298828125, 1.50543212890625, 1.552734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 18.0, 34.0, 61.0, 146.0, 379.0, 1474.0, 11004.0, 594144.0, 430626.0, 8683.0, 1307.0, 406.0, 147.0, 54.0, 34.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -2.0, -1.951171875, -1.90234375, -1.853515625, -1.8046875, -1.755859375, -1.70703125, -1.658203125, -1.609375, -1.560546875, -1.51171875, -1.462890625, -1.4140625, -1.365234375, -1.31640625, -1.267578125, -1.21875, -1.169921875, -1.12109375, -1.072265625, -1.0234375, -0.974609375, -0.92578125, -0.876953125, -0.828125, -0.779296875, -0.73046875, -0.681640625, -0.6328125, -0.583984375, -0.53515625, -0.486328125, -0.4375, -0.388671875, -0.33984375, -0.291015625, -0.2421875, -0.193359375, -0.14453125, -0.095703125, -0.046875, 0.001953125, 0.05078125, 0.099609375, 0.1484375, 0.197265625, 0.24609375, 0.294921875, 0.34375, 0.392578125, 0.44140625, 0.490234375, 0.5390625, 0.587890625, 0.63671875, 0.685546875, 0.734375, 0.783203125, 0.83203125, 0.880859375, 0.9296875, 0.978515625, 1.02734375, 1.076171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 15.0, 14.0, 31.0, 46.0, 75.0, 120.0, 139.0, 162.0, 129.0, 97.0, 58.0, 41.0, 21.0, 13.0, 8.0, 5.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.00021147727966308594, -0.0002070888876914978, -0.00020270049571990967, -0.00019831210374832153, -0.0001939237117767334, -0.00018953531980514526, -0.00018514692783355713, -0.000180758535861969, -0.00017637014389038086, -0.00017198175191879272, -0.0001675933599472046, -0.00016320496797561646, -0.00015881657600402832, -0.00015442818403244019, -0.00015003979206085205, -0.00014565140008926392, -0.00014126300811767578, -0.00013687461614608765, -0.0001324862241744995, -0.00012809783220291138, -0.00012370944023132324, -0.00011932104825973511, -0.00011493265628814697, -0.00011054426431655884, -0.0001061558723449707, -0.00010176748037338257, -9.737908840179443e-05, -9.29906964302063e-05, -8.860230445861816e-05, -8.421391248703003e-05, -7.98255205154419e-05, -7.543712854385376e-05, -7.104873657226562e-05, -6.666034460067749e-05, -6.227195262908936e-05, -5.788356065750122e-05, -5.3495168685913086e-05, -4.910677671432495e-05, -4.4718384742736816e-05, -4.032999277114868e-05, -3.594160079956055e-05, -3.155320882797241e-05, -2.7164816856384277e-05, -2.2776424884796143e-05, -1.8388032913208008e-05, -1.3999640941619873e-05, -9.611248970031738e-06, -5.2228569984436035e-06, -8.344650268554688e-07, 3.553926944732666e-06, 7.9423189163208e-06, 1.2330710887908936e-05, 1.671910285949707e-05, 2.1107494831085205e-05, 2.549588680267334e-05, 2.9884278774261475e-05, 3.427267074584961e-05, 3.8661062717437744e-05, 4.304945468902588e-05, 4.7437846660614014e-05, 5.182623863220215e-05, 5.621463060379028e-05, 6.060302257537842e-05, 6.499141454696655e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 9.0, 18.0, 37.0, 37.0, 77.0, 159.0, 360.0, 1071.0, 3927.0, 21570.0, 225159.0, 702962.0, 79484.0, 10226.0, 2212.0, 684.0, 249.0, 114.0, 69.0, 36.0, 23.0, 21.0, 13.0, 10.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7437515258789062, -0.7165069580078125, -0.6892623901367188, -0.662017822265625, -0.6347732543945312, -0.6075286865234375, -0.5802841186523438, -0.55303955078125, -0.5257949829101562, -0.4985504150390625, -0.47130584716796875, -0.444061279296875, -0.41681671142578125, -0.3895721435546875, -0.36232757568359375, -0.3350830078125, -0.30783843994140625, -0.2805938720703125, -0.25334930419921875, -0.226104736328125, -0.19886016845703125, -0.1716156005859375, -0.14437103271484375, -0.11712646484375, -0.08988189697265625, -0.0626373291015625, -0.03539276123046875, -0.008148193359375, 0.01909637451171875, 0.0463409423828125, 0.07358551025390625, 0.100830078125, 0.12807464599609375, 0.1553192138671875, 0.18256378173828125, 0.209808349609375, 0.23705291748046875, 0.2642974853515625, 0.29154205322265625, 0.31878662109375, 0.34603118896484375, 0.3732757568359375, 0.40052032470703125, 0.427764892578125, 0.45500946044921875, 0.4822540283203125, 0.5094985961914062, 0.5367431640625, 0.5639877319335938, 0.5912322998046875, 0.6184768676757812, 0.645721435546875, 0.6729660034179688, 0.7002105712890625, 0.7274551391601562, 0.75469970703125, 0.7819442749023438, 0.8091888427734375, 0.8364334106445312, 0.863677978515625, 0.8909225463867188, 0.9181671142578125, 0.9454116821289062, 0.97265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 23.0, 21.0, 31.0, 56.0, 74.0, 112.0, 156.0, 132.0, 112.0, 90.0, 54.0, 46.0, 16.0, 18.0, 13.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2978515625, -1.268402099609375, -1.23895263671875, -1.209503173828125, -1.1800537109375, -1.150604248046875, -1.12115478515625, -1.091705322265625, -1.062255859375, -1.032806396484375, -1.00335693359375, -0.973907470703125, -0.9444580078125, -0.915008544921875, -0.88555908203125, -0.856109619140625, -0.82666015625, -0.797210693359375, -0.76776123046875, -0.738311767578125, -0.7088623046875, -0.679412841796875, -0.64996337890625, -0.620513916015625, -0.591064453125, -0.561614990234375, -0.53216552734375, -0.502716064453125, -0.4732666015625, -0.443817138671875, -0.41436767578125, -0.384918212890625, -0.35546875, -0.326019287109375, -0.29656982421875, -0.267120361328125, -0.2376708984375, -0.208221435546875, -0.17877197265625, -0.149322509765625, -0.119873046875, -0.090423583984375, -0.06097412109375, -0.031524658203125, -0.0020751953125, 0.027374267578125, 0.05682373046875, 0.086273193359375, 0.11572265625, 0.145172119140625, 0.17462158203125, 0.204071044921875, 0.2335205078125, 0.262969970703125, 0.29241943359375, 0.321868896484375, 0.351318359375, 0.380767822265625, 0.41021728515625, 0.439666748046875, 0.4691162109375, 0.498565673828125, 0.52801513671875, 0.557464599609375, 0.5869140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 31.0, 98.0, 293.0, 369.0, 149.0, 45.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.15915298461914, -47.269290924072266, -46.379432678222656, -45.48957061767578, -44.59971237182617, -43.7098503112793, -42.81999206542969, -41.93013000488281, -41.04026794433594, -40.15040588378906, -39.26054763793945, -38.37068557739258, -37.48082733154297, -36.590965270996094, -35.701107025146484, -34.81124496459961, -33.92138671875, -33.031524658203125, -32.141666412353516, -31.251806259155273, -30.36194610595703, -29.472084045410156, -28.582223892211914, -27.692363739013672, -26.80250358581543, -25.912643432617188, -25.022783279418945, -24.132923126220703, -23.243061065673828, -22.35320281982422, -21.463340759277344, -20.5734806060791, -19.683622360229492, -18.79376220703125, -17.903902053833008, -17.014041900634766, -16.12417984008789, -15.234320640563965, -14.344459533691406, -13.454599380493164, -12.564739227294922, -11.67487907409668, -10.785018920898438, -9.895157814025879, -9.005297660827637, -8.115437507629395, -7.225576877593994, -6.335716247558594, -5.445856094360352, -4.555995941162109, -3.666135311126709, -2.7762749195098877, -1.8864145278930664, -0.9965543746948242, -0.10669374465942383, 0.7831668853759766, 1.6730270385742188, 2.56288743019104, 3.4527478218078613, 4.342608451843262, 5.232468605041504, 6.122328758239746, 7.0121893882751465, 7.902050018310547, 8.791910171508789]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 9.0, 15.0, 12.0, 18.0, 19.0, 17.0, 17.0, 25.0, 26.0, 21.0, 31.0, 35.0, 44.0, 41.0, 37.0, 32.0, 42.0, 42.0, 40.0, 45.0, 44.0, 37.0, 35.0, 39.0, 36.0, 30.0, 26.0, 22.0, 20.0, 16.0, 16.0, 12.0, 18.0, 11.0, 7.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.000665187835693, -6.785818099975586, -6.5709710121154785, -6.356123924255371, -6.141276836395264, -5.926429748535156, -5.711583137512207, -5.4967360496521, -5.281888961791992, -5.067041873931885, -4.852194786071777, -4.63734769821167, -4.4225006103515625, -4.207653999328613, -3.9928066730499268, -3.7779598236083984, -3.563112497329712, -3.3482654094696045, -3.133418321609497, -2.9185714721679688, -2.7037243843078613, -2.488877296447754, -2.2740302085876465, -2.059183120727539, -1.8443361520767212, -1.6294890642166138, -1.414642095565796, -1.1997950077056885, -0.9849479794502258, -0.7701009511947632, -0.5552538633346558, -0.3404068946838379, -0.12555980682373047, 0.08928723633289337, 0.3041342794895172, 0.5189813375473022, 0.7338283658027649, 0.9486753940582275, 1.163522481918335, 1.3783694505691528, 1.5932165384292603, 1.8080636262893677, 2.0229105949401855, 2.237757682800293, 2.4526047706604004, 2.667451858520508, 2.8822989463806152, 3.0971457958221436, 3.311992883682251, 3.5268399715423584, 3.741687059402466, 3.956533908843994, 4.171380996704102, 4.386228084564209, 4.601075172424316, 4.815922260284424, 5.030769348144531, 5.245616436004639, 5.460463523864746, 5.6753106117248535, 5.890157699584961, 6.10500431060791, 6.319851875305176, 6.534698486328125, 6.749545574188232]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 6.0, 12.0, 20.0, 19.0, 35.0, 31.0, 54.0, 48.0, 65.0, 115.0, 144.0, 207.0, 365.0, 538.0, 956.0, 1705.0, 3611.0, 9285.0, 32687.0, 319047.0, 3720014.0, 76978.0, 16842.0, 5734.0, 2516.0, 1225.0, 695.0, 417.0, 276.0, 183.0, 112.0, 77.0, 61.0, 38.0, 34.0, 26.0, 13.0, 15.0, 12.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.76953125, -2.68621826171875, -2.6029052734375, -2.51959228515625, -2.436279296875, -2.35296630859375, -2.2696533203125, -2.18634033203125, -2.10302734375, -2.01971435546875, -1.9364013671875, -1.85308837890625, -1.769775390625, -1.68646240234375, -1.6031494140625, -1.51983642578125, -1.4365234375, -1.35321044921875, -1.2698974609375, -1.18658447265625, -1.103271484375, -1.01995849609375, -0.9366455078125, -0.85333251953125, -0.77001953125, -0.68670654296875, -0.6033935546875, -0.52008056640625, -0.436767578125, -0.35345458984375, -0.2701416015625, -0.18682861328125, -0.103515625, -0.02020263671875, 0.0631103515625, 0.14642333984375, 0.229736328125, 0.31304931640625, 0.3963623046875, 0.47967529296875, 0.56298828125, 0.64630126953125, 0.7296142578125, 0.81292724609375, 0.896240234375, 0.97955322265625, 1.0628662109375, 1.14617919921875, 1.2294921875, 1.31280517578125, 1.3961181640625, 1.47943115234375, 1.562744140625, 1.64605712890625, 1.7293701171875, 1.81268310546875, 1.89599609375, 1.97930908203125, 2.0626220703125, 2.14593505859375, 2.229248046875, 2.31256103515625, 2.3958740234375, 2.47918701171875, 2.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 9.0, 13.0, 20.0, 29.0, 52.0, 68.0, 79.0, 100.0, 100.0, 102.0, 94.0, 84.0, 69.0, 40.0, 47.0, 22.0, 24.0, 14.0, 11.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7890625, -0.7645950317382812, -0.7401275634765625, -0.7156600952148438, -0.691192626953125, -0.6667251586914062, -0.6422576904296875, -0.6177902221679688, -0.59332275390625, -0.5688552856445312, -0.5443878173828125, -0.5199203491210938, -0.495452880859375, -0.47098541259765625, -0.4465179443359375, -0.42205047607421875, -0.3975830078125, -0.37311553955078125, -0.3486480712890625, -0.32418060302734375, -0.299713134765625, -0.27524566650390625, -0.2507781982421875, -0.22631072998046875, -0.20184326171875, -0.17737579345703125, -0.1529083251953125, -0.12844085693359375, -0.103973388671875, -0.07950592041015625, -0.0550384521484375, -0.03057098388671875, -0.006103515625, 0.01836395263671875, 0.0428314208984375, 0.06729888916015625, 0.091766357421875, 0.11623382568359375, 0.1407012939453125, 0.16516876220703125, 0.18963623046875, 0.21410369873046875, 0.2385711669921875, 0.26303863525390625, 0.287506103515625, 0.31197357177734375, 0.3364410400390625, 0.36090850830078125, 0.3853759765625, 0.40984344482421875, 0.4343109130859375, 0.45877838134765625, 0.483245849609375, 0.5077133178710938, 0.5321807861328125, 0.5566482543945312, 0.58111572265625, 0.6055831909179688, 0.6300506591796875, 0.6545181274414062, 0.678985595703125, 0.7034530639648438, 0.7279205322265625, 0.7523880004882812, 0.77685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 11.0, 14.0, 33.0, 29.0, 41.0, 69.0, 95.0, 115.0, 203.0, 253.0, 423.0, 620.0, 1083.0, 2448.0, 7586.0, 37593.0, 1162235.0, 2922803.0, 44487.0, 8354.0, 2622.0, 1163.0, 702.0, 421.0, 277.0, 181.0, 140.0, 88.0, 56.0, 35.0, 20.0, 27.0, 20.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.86358642578125, -2.7818603515625, -2.70013427734375, -2.618408203125, -2.53668212890625, -2.4549560546875, -2.37322998046875, -2.29150390625, -2.20977783203125, -2.1280517578125, -2.04632568359375, -1.964599609375, -1.88287353515625, -1.8011474609375, -1.71942138671875, -1.6376953125, -1.55596923828125, -1.4742431640625, -1.39251708984375, -1.310791015625, -1.22906494140625, -1.1473388671875, -1.06561279296875, -0.98388671875, -0.90216064453125, -0.8204345703125, -0.73870849609375, -0.656982421875, -0.57525634765625, -0.4935302734375, -0.41180419921875, -0.330078125, -0.24835205078125, -0.1666259765625, -0.08489990234375, -0.003173828125, 0.07855224609375, 0.1602783203125, 0.24200439453125, 0.32373046875, 0.40545654296875, 0.4871826171875, 0.56890869140625, 0.650634765625, 0.73236083984375, 0.8140869140625, 0.89581298828125, 0.9775390625, 1.05926513671875, 1.1409912109375, 1.22271728515625, 1.304443359375, 1.38616943359375, 1.4678955078125, 1.54962158203125, 1.63134765625, 1.71307373046875, 1.7947998046875, 1.87652587890625, 1.958251953125, 2.03997802734375, 2.1217041015625, 2.20343017578125, 2.28515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 26.0, 59.0, 172.0, 1556.0, 1921.0, 188.0, 59.0, 31.0, 18.0, 9.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.5897674560546875, -1.526214599609375, -1.4626617431640625, -1.39910888671875, -1.3355560302734375, -1.272003173828125, -1.2084503173828125, -1.1448974609375, -1.0813446044921875, -1.017791748046875, -0.9542388916015625, -0.89068603515625, -0.8271331787109375, -0.763580322265625, -0.7000274658203125, -0.636474609375, -0.5729217529296875, -0.509368896484375, -0.4458160400390625, -0.38226318359375, -0.3187103271484375, -0.255157470703125, -0.1916046142578125, -0.1280517578125, -0.0644989013671875, -0.000946044921875, 0.0626068115234375, 0.12615966796875, 0.1897125244140625, 0.253265380859375, 0.3168182373046875, 0.38037109375, 0.4439239501953125, 0.507476806640625, 0.5710296630859375, 0.63458251953125, 0.6981353759765625, 0.761688232421875, 0.8252410888671875, 0.8887939453125, 0.9523468017578125, 1.015899658203125, 1.0794525146484375, 1.14300537109375, 1.2065582275390625, 1.270111083984375, 1.3336639404296875, 1.397216796875, 1.4607696533203125, 1.524322509765625, 1.5878753662109375, 1.65142822265625, 1.7149810791015625, 1.778533935546875, 1.8420867919921875, 1.9056396484375, 1.9691925048828125, 2.032745361328125, 2.0962982177734375, 2.15985107421875, 2.2234039306640625, 2.286956787109375, 2.3505096435546875, 2.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 9.0, 15.0, 27.0, 47.0, 90.0, 128.0, 176.0, 181.0, 117.0, 104.0, 38.0, 27.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.853998184204102, -6.669008731842041, -6.484019756317139, -6.299030303955078, -6.114041328430176, -5.929051876068115, -5.744062423706055, -5.559073448181152, -5.374083995819092, -5.189094543457031, -5.004105567932129, -4.819116115570068, -4.634126663208008, -4.4491376876831055, -4.264148235321045, -4.079158782958984, -3.894169807434082, -3.7091805934906006, -3.524191379547119, -3.3392019271850586, -3.154212713241577, -2.9692234992980957, -2.784234046936035, -2.5992448329925537, -2.4142556190490723, -2.229266405105591, -2.0442771911621094, -1.8592877388000488, -1.6742985248565674, -1.489309310913086, -1.304319977760315, -1.119330644607544, -0.9343414306640625, -0.7493521571159363, -0.5643628835678101, -0.37937361001968384, -0.19438433647155762, -0.009395062923431396, 0.17559421062469482, 0.3605835437774658, 0.5455727577209473, 0.7305620312690735, 0.9155513048171997, 1.1005406379699707, 1.2855298519134521, 1.4705190658569336, 1.6555083990097046, 1.8404977321624756, 2.025486946105957, 2.2104761600494385, 2.39546537399292, 2.5804548263549805, 2.765444040298462, 2.9504332542419434, 3.135422706604004, 3.3204119205474854, 3.505401134490967, 3.6903903484344482, 3.8753795623779297, 4.06036901473999, 4.245358467102051, 4.430347442626953, 4.615336894989014, 4.800326347351074, 4.985315322875977]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 9.0, 9.0, 12.0, 16.0, 33.0, 42.0, 51.0, 53.0, 66.0, 81.0, 76.0, 77.0, 96.0, 64.0, 73.0, 50.0, 53.0, 41.0, 24.0, 18.0, 21.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.932065963745117, -3.772571563720703, -3.613077163696289, -3.453583002090454, -3.29408860206604, -3.134594202041626, -2.975100040435791, -2.815605640411377, -2.656111240386963, -2.496616840362549, -2.3371224403381348, -2.1776282787323, -2.0181338787078857, -1.8586394786834717, -1.6991451978683472, -1.5396509170532227, -1.3801565170288086, -1.2206621170043945, -1.06116783618927, -0.9016734957695007, -0.7421791553497314, -0.5826848149299622, -0.42319047451019287, -0.26369619369506836, -0.1042017936706543, 0.05529254674911499, 0.21478688716888428, 0.37428122758865356, 0.5337755680084229, 0.6932699084281921, 0.8527642488479614, 1.012258529663086, 1.1717529296875, 1.331247329711914, 1.4907416105270386, 1.650235891342163, 1.8097302913665771, 1.9692246913909912, 2.128718852996826, 2.2882132530212402, 2.4477076530456543, 2.6072020530700684, 2.7666964530944824, 2.9261906147003174, 3.0856850147247314, 3.2451794147491455, 3.4046735763549805, 3.5641679763793945, 3.7236623764038086, 3.8831567764282227, 4.042651176452637, 4.202145576477051, 4.361639976501465, 4.521133899688721, 4.680628299713135, 4.840122699737549, 4.999617099761963, 5.159111499786377, 5.318605899810791, 5.478100299835205, 5.637594223022461, 5.797088623046875, 5.956583023071289, 6.116077423095703, 6.275571823120117]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 14.0, 16.0, 27.0, 26.0, 49.0, 78.0, 93.0, 127.0, 160.0, 237.0, 398.0, 621.0, 1058.0, 1722.0, 3652.0, 8466.0, 24708.0, 91722.0, 357865.0, 400129.0, 110030.0, 28707.0, 9585.0, 3978.0, 1957.0, 1104.0, 664.0, 367.0, 312.0, 203.0, 130.0, 101.0, 62.0, 34.0, 36.0, 28.0, 14.0, 18.0, 13.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.005859375, -1.94329833984375, -1.8807373046875, -1.81817626953125, -1.755615234375, -1.69305419921875, -1.6304931640625, -1.56793212890625, -1.50537109375, -1.44281005859375, -1.3802490234375, -1.31768798828125, -1.255126953125, -1.19256591796875, -1.1300048828125, -1.06744384765625, -1.0048828125, -0.94232177734375, -0.8797607421875, -0.81719970703125, -0.754638671875, -0.69207763671875, -0.6295166015625, -0.56695556640625, -0.50439453125, -0.44183349609375, -0.3792724609375, -0.31671142578125, -0.254150390625, -0.19158935546875, -0.1290283203125, -0.06646728515625, -0.00390625, 0.05865478515625, 0.1212158203125, 0.18377685546875, 0.246337890625, 0.30889892578125, 0.3714599609375, 0.43402099609375, 0.49658203125, 0.55914306640625, 0.6217041015625, 0.68426513671875, 0.746826171875, 0.80938720703125, 0.8719482421875, 0.93450927734375, 0.9970703125, 1.05963134765625, 1.1221923828125, 1.18475341796875, 1.247314453125, 1.30987548828125, 1.3724365234375, 1.43499755859375, 1.49755859375, 1.56011962890625, 1.6226806640625, 1.68524169921875, 1.747802734375, 1.81036376953125, 1.8729248046875, 1.93548583984375, 1.998046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 16.0, 27.0, 32.0, 50.0, 65.0, 89.0, 106.0, 98.0, 106.0, 94.0, 81.0, 69.0, 39.0, 32.0, 27.0, 19.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81103515625, -0.783966064453125, -0.75689697265625, -0.729827880859375, -0.7027587890625, -0.675689697265625, -0.64862060546875, -0.621551513671875, -0.594482421875, -0.567413330078125, -0.54034423828125, -0.513275146484375, -0.4862060546875, -0.459136962890625, -0.43206787109375, -0.404998779296875, -0.3779296875, -0.350860595703125, -0.32379150390625, -0.296722412109375, -0.2696533203125, -0.242584228515625, -0.21551513671875, -0.188446044921875, -0.161376953125, -0.134307861328125, -0.10723876953125, -0.080169677734375, -0.0531005859375, -0.026031494140625, 0.00103759765625, 0.028106689453125, 0.05517578125, 0.082244873046875, 0.10931396484375, 0.136383056640625, 0.1634521484375, 0.190521240234375, 0.21759033203125, 0.244659423828125, 0.271728515625, 0.298797607421875, 0.32586669921875, 0.352935791015625, 0.3800048828125, 0.407073974609375, 0.43414306640625, 0.461212158203125, 0.48828125, 0.515350341796875, 0.54241943359375, 0.569488525390625, 0.5965576171875, 0.623626708984375, 0.65069580078125, 0.677764892578125, 0.704833984375, 0.731903076171875, 0.75897216796875, 0.786041259765625, 0.8131103515625, 0.840179443359375, 0.86724853515625, 0.894317626953125, 0.92138671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 12.0, 26.0, 22.0, 33.0, 50.0, 105.0, 155.0, 259.0, 433.0, 820.0, 1670.0, 3509.0, 8394.0, 21835.0, 67962.0, 247397.0, 454936.0, 165859.0, 47052.0, 16078.0, 6304.0, 2744.0, 1260.0, 647.0, 350.0, 222.0, 113.0, 95.0, 53.0, 49.0, 30.0, 24.0, 16.0, 11.0, 6.0, 0.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4266204833984375, -1.379608154296875, -1.3325958251953125, -1.28558349609375, -1.2385711669921875, -1.191558837890625, -1.1445465087890625, -1.0975341796875, -1.0505218505859375, -1.003509521484375, -0.9564971923828125, -0.90948486328125, -0.8624725341796875, -0.815460205078125, -0.7684478759765625, -0.721435546875, -0.6744232177734375, -0.627410888671875, -0.5803985595703125, -0.53338623046875, -0.4863739013671875, -0.439361572265625, -0.3923492431640625, -0.3453369140625, -0.2983245849609375, -0.251312255859375, -0.2042999267578125, -0.15728759765625, -0.1102752685546875, -0.063262939453125, -0.0162506103515625, 0.03076171875, 0.0777740478515625, 0.124786376953125, 0.1717987060546875, 0.21881103515625, 0.2658233642578125, 0.312835693359375, 0.3598480224609375, 0.4068603515625, 0.4538726806640625, 0.500885009765625, 0.5478973388671875, 0.59490966796875, 0.6419219970703125, 0.688934326171875, 0.7359466552734375, 0.782958984375, 0.8299713134765625, 0.876983642578125, 0.9239959716796875, 0.97100830078125, 1.0180206298828125, 1.065032958984375, 1.1120452880859375, 1.1590576171875, 1.2060699462890625, 1.253082275390625, 1.3000946044921875, 1.34710693359375, 1.3941192626953125, 1.441131591796875, 1.4881439208984375, 1.53515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 12.0, 16.0, 27.0, 34.0, 35.0, 28.0, 56.0, 56.0, 74.0, 70.0, 60.0, 67.0, 69.0, 70.0, 59.0, 50.0, 37.0, 25.0, 26.0, 30.0, 21.0, 15.0, 9.0, 6.0, 8.0, 3.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.294921875, -3.21002197265625, -3.1251220703125, -3.04022216796875, -2.955322265625, -2.87042236328125, -2.7855224609375, -2.70062255859375, -2.61572265625, -2.53082275390625, -2.4459228515625, -2.36102294921875, -2.276123046875, -2.19122314453125, -2.1063232421875, -2.02142333984375, -1.9365234375, -1.85162353515625, -1.7667236328125, -1.68182373046875, -1.596923828125, -1.51202392578125, -1.4271240234375, -1.34222412109375, -1.25732421875, -1.17242431640625, -1.0875244140625, -1.00262451171875, -0.917724609375, -0.83282470703125, -0.7479248046875, -0.66302490234375, -0.578125, -0.49322509765625, -0.4083251953125, -0.32342529296875, -0.238525390625, -0.15362548828125, -0.0687255859375, 0.01617431640625, 0.10107421875, 0.18597412109375, 0.2708740234375, 0.35577392578125, 0.440673828125, 0.52557373046875, 0.6104736328125, 0.69537353515625, 0.7802734375, 0.86517333984375, 0.9500732421875, 1.03497314453125, 1.119873046875, 1.20477294921875, 1.2896728515625, 1.37457275390625, 1.45947265625, 1.54437255859375, 1.6292724609375, 1.71417236328125, 1.799072265625, 1.88397216796875, 1.9688720703125, 2.05377197265625, 2.138671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 15.0, 19.0, 41.0, 58.0, 92.0, 187.0, 365.0, 718.0, 1976.0, 6228.0, 28617.0, 258445.0, 654641.0, 78747.0, 12883.0, 3266.0, 1097.0, 551.0, 239.0, 154.0, 83.0, 43.0, 33.0, 18.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1300048828125, -1.094970703125, -1.0599365234375, -1.02490234375, -0.9898681640625, -0.954833984375, -0.9197998046875, -0.884765625, -0.8497314453125, -0.814697265625, -0.7796630859375, -0.74462890625, -0.7095947265625, -0.674560546875, -0.6395263671875, -0.6044921875, -0.5694580078125, -0.534423828125, -0.4993896484375, -0.46435546875, -0.4293212890625, -0.394287109375, -0.3592529296875, -0.32421875, -0.2891845703125, -0.254150390625, -0.2191162109375, -0.18408203125, -0.1490478515625, -0.114013671875, -0.0789794921875, -0.0439453125, -0.0089111328125, 0.026123046875, 0.0611572265625, 0.09619140625, 0.1312255859375, 0.166259765625, 0.2012939453125, 0.236328125, 0.2713623046875, 0.306396484375, 0.3414306640625, 0.37646484375, 0.4114990234375, 0.446533203125, 0.4815673828125, 0.5166015625, 0.5516357421875, 0.586669921875, 0.6217041015625, 0.65673828125, 0.6917724609375, 0.726806640625, 0.7618408203125, 0.796875, 0.8319091796875, 0.866943359375, 0.9019775390625, 0.93701171875, 0.9720458984375, 1.007080078125, 1.0421142578125, 1.0771484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 27.0, 37.0, 65.0, 93.0, 143.0, 159.0, 175.0, 110.0, 62.0, 32.0, 27.0, 18.0, 17.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.605979382991791e-05, -7.925555109977722e-05, -7.245130836963654e-05, -6.564706563949585e-05, -5.8842822909355164e-05, -5.203858017921448e-05, -4.523433744907379e-05, -3.8430094718933105e-05, -3.162585198879242e-05, -2.4821609258651733e-05, -1.8017366528511047e-05, -1.1213123798370361e-05, -4.408881068229675e-06, 2.3953616619110107e-06, 9.199604392051697e-06, 1.6003847122192383e-05, 2.280808985233307e-05, 2.9612332582473755e-05, 3.641657531261444e-05, 4.322081804275513e-05, 5.002506077289581e-05, 5.68293035030365e-05, 6.363354623317719e-05, 7.043778896331787e-05, 7.724203169345856e-05, 8.404627442359924e-05, 9.085051715373993e-05, 9.765475988388062e-05, 0.0001044590026140213, 0.00011126324534416199, 0.00011806748807430267, 0.00012487173080444336, 0.00013167597353458405, 0.00013848021626472473, 0.00014528445899486542, 0.0001520887017250061, 0.0001588929444551468, 0.00016569718718528748, 0.00017250142991542816, 0.00017930567264556885, 0.00018610991537570953, 0.00019291415810585022, 0.0001997184008359909, 0.0002065226435661316, 0.00021332688629627228, 0.00022013112902641296, 0.00022693537175655365, 0.00023373961448669434, 0.00024054385721683502, 0.0002473480999469757, 0.0002541523426771164, 0.0002609565854072571, 0.00026776082813739777, 0.00027456507086753845, 0.00028136931359767914, 0.0002881735563278198, 0.0002949777990579605, 0.0003017820417881012, 0.0003085862845182419, 0.00031539052724838257, 0.00032219476997852325, 0.00032899901270866394, 0.0003358032554388046, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 17.0, 17.0, 42.0, 48.0, 86.0, 96.0, 223.0, 318.0, 632.0, 1130.0, 2466.0, 6266.0, 19539.0, 81246.0, 387271.0, 423959.0, 91758.0, 21123.0, 6722.0, 2758.0, 1289.0, 612.0, 379.0, 198.0, 136.0, 64.0, 59.0, 30.0, 23.0, 12.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.5995330810546875, -0.576507568359375, -0.5534820556640625, -0.53045654296875, -0.5074310302734375, -0.484405517578125, -0.4613800048828125, -0.4383544921875, -0.4153289794921875, -0.392303466796875, -0.3692779541015625, -0.34625244140625, -0.3232269287109375, -0.300201416015625, -0.2771759033203125, -0.254150390625, -0.2311248779296875, -0.208099365234375, -0.1850738525390625, -0.16204833984375, -0.1390228271484375, -0.115997314453125, -0.0929718017578125, -0.0699462890625, -0.0469207763671875, -0.023895263671875, -0.0008697509765625, 0.02215576171875, 0.0451812744140625, 0.068206787109375, 0.0912322998046875, 0.1142578125, 0.1372833251953125, 0.160308837890625, 0.1833343505859375, 0.20635986328125, 0.2293853759765625, 0.252410888671875, 0.2754364013671875, 0.2984619140625, 0.3214874267578125, 0.344512939453125, 0.3675384521484375, 0.39056396484375, 0.4135894775390625, 0.436614990234375, 0.4596405029296875, 0.482666015625, 0.5056915283203125, 0.528717041015625, 0.5517425537109375, 0.57476806640625, 0.5977935791015625, 0.620819091796875, 0.6438446044921875, 0.6668701171875, 0.6898956298828125, 0.712921142578125, 0.7359466552734375, 0.75897216796875, 0.7819976806640625, 0.805023193359375, 0.8280487060546875, 0.85107421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 11.0, 11.0, 17.0, 16.0, 30.0, 44.0, 57.0, 77.0, 105.0, 131.0, 122.0, 107.0, 80.0, 42.0, 32.0, 43.0, 22.0, 8.0, 10.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.090087890625, -1.05224609375, -1.014404296875, -0.9765625, -0.938720703125, -0.90087890625, -0.863037109375, -0.8251953125, -0.787353515625, -0.74951171875, -0.711669921875, -0.673828125, -0.635986328125, -0.59814453125, -0.560302734375, -0.5224609375, -0.484619140625, -0.44677734375, -0.408935546875, -0.37109375, -0.333251953125, -0.29541015625, -0.257568359375, -0.2197265625, -0.181884765625, -0.14404296875, -0.106201171875, -0.068359375, -0.030517578125, 0.00732421875, 0.045166015625, 0.0830078125, 0.120849609375, 0.15869140625, 0.196533203125, 0.234375, 0.272216796875, 0.31005859375, 0.347900390625, 0.3857421875, 0.423583984375, 0.46142578125, 0.499267578125, 0.537109375, 0.574951171875, 0.61279296875, 0.650634765625, 0.6884765625, 0.726318359375, 0.76416015625, 0.802001953125, 0.83984375, 0.877685546875, 0.91552734375, 0.953369140625, 0.9912109375, 1.029052734375, 1.06689453125, 1.104736328125, 1.142578125, 1.180419921875, 1.21826171875, 1.256103515625, 1.2939453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 17.0, 21.0, 55.0, 72.0, 110.0, 151.0, 157.0, 162.0, 97.0, 59.0, 42.0, 16.0, 17.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.332056999206543, -7.817634582519531, -7.3032121658325195, -6.788789749145508, -6.274367332458496, -5.759944915771484, -5.245522499084473, -4.731100082397461, -4.216677665710449, -3.7022552490234375, -3.187832832336426, -2.673410415649414, -2.1589879989624023, -1.6445655822753906, -1.130143165588379, -0.6157207489013672, -0.10129833221435547, 0.41312408447265625, 0.927546501159668, 1.4419689178466797, 1.9563913345336914, 2.470813751220703, 2.985236167907715, 3.4996585845947266, 4.014081001281738, 4.52850341796875, 5.042925834655762, 5.557348251342773, 6.071770668029785, 6.586193084716797, 7.100615501403809, 7.61503791809082, 8.129459381103516, 8.643881797790527, 9.158304214477539, 9.67272663116455, 10.187149047851562, 10.701571464538574, 11.215993881225586, 11.730416297912598, 12.24483871459961, 12.759261131286621, 13.273683547973633, 13.788105964660645, 14.302528381347656, 14.816950798034668, 15.33137321472168, 15.845795631408691, 16.360218048095703, 16.87464141845703, 17.389062881469727, 17.903484344482422, 18.41790771484375, 18.932331085205078, 19.446752548217773, 19.96117401123047, 20.475597381591797, 20.990020751953125, 21.50444221496582, 22.018863677978516, 22.533287048339844, 23.047710418701172, 23.562131881713867, 24.076553344726562, 24.59097671508789]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 7.0, 10.0, 17.0, 17.0, 24.0, 31.0, 33.0, 43.0, 38.0, 51.0, 39.0, 52.0, 42.0, 39.0, 66.0, 64.0, 55.0, 52.0, 52.0, 35.0, 42.0, 30.0, 23.0, 25.0, 22.0, 14.0, 21.0, 13.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.562973022460938, -11.183988571166992, -10.805004119873047, -10.426019668579102, -10.047036170959473, -9.668051719665527, -9.289067268371582, -8.910082817077637, -8.531098365783691, -8.152113914489746, -7.773129940032959, -7.394145488739014, -7.015161037445068, -6.636177062988281, -6.257192611694336, -5.878208160400391, -5.4992241859436035, -5.120239734649658, -4.741255760192871, -4.362271308898926, -3.9832868576049805, -3.6043026447296143, -3.225318431854248, -2.8463339805603027, -2.4673497676849365, -2.0883655548095703, -1.709381103515625, -1.3303968906402588, -0.951412558555603, -0.5724282264709473, -0.19344401359558105, 0.18554043769836426, 0.5645246505737305, 0.9435089826583862, 1.322493314743042, 1.7014775276184082, 2.0804619789123535, 2.4594461917877197, 2.838430404663086, 3.2174148559570312, 3.5963990688323975, 3.9753832817077637, 4.354367733001709, 4.733351707458496, 5.112336158752441, 5.491320610046387, 5.870305061340332, 6.249289512634277, 6.6282734870910645, 7.00725793838501, 7.386241912841797, 7.765226364135742, 8.144210815429688, 8.523195266723633, 8.902179718017578, 9.281164169311523, 9.660147666931152, 10.039132118225098, 10.418116569519043, 10.797100067138672, 11.176084518432617, 11.555068969726562, 11.934053421020508, 12.313037872314453, 12.692022323608398]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 8.0, 24.0, 29.0, 56.0, 74.0, 150.0, 296.0, 618.0, 1636.0, 6240.0, 51202.0, 4096515.0, 30251.0, 4669.0, 1367.0, 532.0, 236.0, 134.0, 69.0, 41.0, 23.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.5234375, -4.37939453125, -4.2353515625, -4.09130859375, -3.947265625, -3.80322265625, -3.6591796875, -3.51513671875, -3.37109375, -3.22705078125, -3.0830078125, -2.93896484375, -2.794921875, -2.65087890625, -2.5068359375, -2.36279296875, -2.21875, -2.07470703125, -1.9306640625, -1.78662109375, -1.642578125, -1.49853515625, -1.3544921875, -1.21044921875, -1.06640625, -0.92236328125, -0.7783203125, -0.63427734375, -0.490234375, -0.34619140625, -0.2021484375, -0.05810546875, 0.0859375, 0.22998046875, 0.3740234375, 0.51806640625, 0.662109375, 0.80615234375, 0.9501953125, 1.09423828125, 1.23828125, 1.38232421875, 1.5263671875, 1.67041015625, 1.814453125, 1.95849609375, 2.1025390625, 2.24658203125, 2.390625, 2.53466796875, 2.6787109375, 2.82275390625, 2.966796875, 3.11083984375, 3.2548828125, 3.39892578125, 3.54296875, 3.68701171875, 3.8310546875, 3.97509765625, 4.119140625, 4.26318359375, 4.4072265625, 4.55126953125, 4.6953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 20.0, 20.0, 18.0, 48.0, 60.0, 48.0, 84.0, 84.0, 100.0, 95.0, 91.0, 70.0, 68.0, 35.0, 51.0, 31.0, 17.0, 11.0, 12.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8783721923828125, -0.849029541015625, -0.8196868896484375, -0.79034423828125, -0.7610015869140625, -0.731658935546875, -0.7023162841796875, -0.6729736328125, -0.6436309814453125, -0.614288330078125, -0.5849456787109375, -0.55560302734375, -0.5262603759765625, -0.496917724609375, -0.4675750732421875, -0.438232421875, -0.4088897705078125, -0.379547119140625, -0.3502044677734375, -0.32086181640625, -0.2915191650390625, -0.262176513671875, -0.2328338623046875, -0.2034912109375, -0.1741485595703125, -0.144805908203125, -0.1154632568359375, -0.08612060546875, -0.0567779541015625, -0.027435302734375, 0.0019073486328125, 0.03125, 0.0605926513671875, 0.089935302734375, 0.1192779541015625, 0.14862060546875, 0.1779632568359375, 0.207305908203125, 0.2366485595703125, 0.2659912109375, 0.2953338623046875, 0.324676513671875, 0.3540191650390625, 0.38336181640625, 0.4127044677734375, 0.442047119140625, 0.4713897705078125, 0.500732421875, 0.5300750732421875, 0.559417724609375, 0.5887603759765625, 0.61810302734375, 0.6474456787109375, 0.676788330078125, 0.7061309814453125, 0.7354736328125, 0.7648162841796875, 0.794158935546875, 0.8235015869140625, 0.85284423828125, 0.8821868896484375, 0.911529541015625, 0.9408721923828125, 0.97021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 17.0, 12.0, 22.0, 25.0, 25.0, 38.0, 54.0, 78.0, 76.0, 108.0, 146.0, 256.0, 379.0, 762.0, 1671.0, 4634.0, 22595.0, 3870615.0, 271619.0, 14341.0, 3618.0, 1305.0, 626.0, 353.0, 248.0, 168.0, 122.0, 86.0, 53.0, 48.0, 30.0, 27.0, 29.0, 17.0, 12.0, 7.0, 10.0, 13.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.953125, -3.82513427734375, -3.6971435546875, -3.56915283203125, -3.441162109375, -3.31317138671875, -3.1851806640625, -3.05718994140625, -2.92919921875, -2.80120849609375, -2.6732177734375, -2.54522705078125, -2.417236328125, -2.28924560546875, -2.1612548828125, -2.03326416015625, -1.9052734375, -1.77728271484375, -1.6492919921875, -1.52130126953125, -1.393310546875, -1.26531982421875, -1.1373291015625, -1.00933837890625, -0.88134765625, -0.75335693359375, -0.6253662109375, -0.49737548828125, -0.369384765625, -0.24139404296875, -0.1134033203125, 0.01458740234375, 0.142578125, 0.27056884765625, 0.3985595703125, 0.52655029296875, 0.654541015625, 0.78253173828125, 0.9105224609375, 1.03851318359375, 1.16650390625, 1.29449462890625, 1.4224853515625, 1.55047607421875, 1.678466796875, 1.80645751953125, 1.9344482421875, 2.06243896484375, 2.1904296875, 2.31842041015625, 2.4464111328125, 2.57440185546875, 2.702392578125, 2.83038330078125, 2.9583740234375, 3.08636474609375, 3.21435546875, 3.34234619140625, 3.4703369140625, 3.59832763671875, 3.726318359375, 3.85430908203125, 3.9822998046875, 4.11029052734375, 4.23828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 6.0, 13.0, 26.0, 106.0, 3401.0, 426.0, 55.0, 19.0, 10.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9326171875, -0.891876220703125, -0.85113525390625, -0.810394287109375, -0.7696533203125, -0.728912353515625, -0.68817138671875, -0.647430419921875, -0.606689453125, -0.565948486328125, -0.52520751953125, -0.484466552734375, -0.4437255859375, -0.402984619140625, -0.36224365234375, -0.321502685546875, -0.28076171875, -0.240020751953125, -0.19927978515625, -0.158538818359375, -0.1177978515625, -0.077056884765625, -0.03631591796875, 0.004425048828125, 0.045166015625, 0.085906982421875, 0.12664794921875, 0.167388916015625, 0.2081298828125, 0.248870849609375, 0.28961181640625, 0.330352783203125, 0.37109375, 0.411834716796875, 0.45257568359375, 0.493316650390625, 0.5340576171875, 0.574798583984375, 0.61553955078125, 0.656280517578125, 0.697021484375, 0.737762451171875, 0.77850341796875, 0.819244384765625, 0.8599853515625, 0.900726318359375, 0.94146728515625, 0.982208251953125, 1.02294921875, 1.063690185546875, 1.10443115234375, 1.145172119140625, 1.1859130859375, 1.226654052734375, 1.26739501953125, 1.308135986328125, 1.348876953125, 1.389617919921875, 1.43035888671875, 1.471099853515625, 1.5118408203125, 1.552581787109375, 1.59332275390625, 1.634063720703125, 1.6748046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 42.0, 72.0, 217.0, 314.0, 182.0, 94.0, 44.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0910727977752686, -2.906198263168335, -2.7213237285614014, -2.5364491939544678, -2.351574659347534, -2.1667001247406006, -1.9818254709243774, -1.7969509363174438, -1.6120764017105103, -1.4272018671035767, -1.242327332496643, -1.05745267868042, -0.8725782036781311, -0.6877036690711975, -0.5028290748596191, -0.31795454025268555, -0.13308000564575195, 0.051794543862342834, 0.23666909337043762, 0.4215436577796936, 0.6064181923866272, 0.7912927269935608, 0.9761673212051392, 1.1610418558120728, 1.3459163904190063, 1.53079092502594, 1.7156654596328735, 1.9005401134490967, 2.0854146480560303, 2.270289182662964, 2.4551637172698975, 2.640038251876831, 2.8249125480651855, 3.009787082672119, 3.1946616172790527, 3.3795361518859863, 3.56441068649292, 3.7492852210998535, 3.934159755706787, 4.119034290313721, 4.303908824920654, 4.488783359527588, 4.6736578941345215, 4.858532428741455, 5.043406963348389, 5.228281497955322, 5.413156032562256, 5.5980305671691895, 5.782905578613281, 5.967780113220215, 6.152654647827148, 6.337529182434082, 6.522403717041016, 6.707278251647949, 6.892152786254883, 7.077027320861816, 7.26190185546875, 7.446776390075684, 7.631650924682617, 7.816525459289551, 8.001399993896484, 8.186274528503418, 8.371149063110352, 8.556023597717285, 8.740898132324219]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 5.0, 5.0, 21.0, 16.0, 17.0, 20.0, 27.0, 29.0, 28.0, 35.0, 31.0, 49.0, 44.0, 43.0, 56.0, 55.0, 55.0, 50.0, 43.0, 49.0, 46.0, 38.0, 36.0, 40.0, 25.0, 24.0, 16.0, 21.0, 22.0, 8.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1871438026428223, -2.120305061340332, -2.053466558456421, -1.9866278171539307, -1.91978919506073, -1.8529505729675293, -1.7861119508743286, -1.719273328781128, -1.6524345874786377, -1.585595965385437, -1.5187573432922363, -1.451918601989746, -1.3850799798965454, -1.3182413578033447, -1.251402735710144, -1.1845641136169434, -1.1177254915237427, -1.050886869430542, -0.9840481877326965, -0.9172095656394958, -0.8503708839416504, -0.7835322618484497, -0.716693639755249, -0.6498550176620483, -0.5830163359642029, -0.5161777138710022, -0.44933903217315674, -0.38250041007995605, -0.315661758184433, -0.2488231062889099, -0.18198448419570923, -0.11514583230018616, -0.048307180404663086, 0.01853146404027939, 0.08537010848522186, 0.15220874547958374, 0.2190473973751068, 0.2858860492706299, 0.35272467136383057, 0.41956332325935364, 0.4864019751548767, 0.5532405972480774, 0.6200792789459229, 0.6869179010391235, 0.7537565231323242, 0.8205952048301697, 0.8874338269233704, 0.9542725086212158, 1.0211111307144165, 1.0879497528076172, 1.1547883749008179, 1.2216269969940186, 1.2884657382965088, 1.3553043603897095, 1.4221429824829102, 1.4889816045761108, 1.5558202266693115, 1.6226588487625122, 1.689497470855713, 1.7563362121582031, 1.8231748342514038, 1.8900134563446045, 1.9568520784378052, 2.023690700531006, 2.090529441833496]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 30.0, 20.0, 48.0, 107.0, 164.0, 270.0, 511.0, 1015.0, 2281.0, 5734.0, 17249.0, 60332.0, 224394.0, 452267.0, 204294.0, 54223.0, 15931.0, 5364.0, 2218.0, 993.0, 439.0, 281.0, 149.0, 72.0, 64.0, 40.0, 20.0, 10.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.205078125, -2.1326904296875, -2.060302734375, -1.9879150390625, -1.91552734375, -1.8431396484375, -1.770751953125, -1.6983642578125, -1.6259765625, -1.5535888671875, -1.481201171875, -1.4088134765625, -1.33642578125, -1.2640380859375, -1.191650390625, -1.1192626953125, -1.046875, -0.9744873046875, -0.902099609375, -0.8297119140625, -0.75732421875, -0.6849365234375, -0.612548828125, -0.5401611328125, -0.4677734375, -0.3953857421875, -0.322998046875, -0.2506103515625, -0.17822265625, -0.1058349609375, -0.033447265625, 0.0389404296875, 0.111328125, 0.1837158203125, 0.256103515625, 0.3284912109375, 0.40087890625, 0.4732666015625, 0.545654296875, 0.6180419921875, 0.6904296875, 0.7628173828125, 0.835205078125, 0.9075927734375, 0.97998046875, 1.0523681640625, 1.124755859375, 1.1971435546875, 1.26953125, 1.3419189453125, 1.414306640625, 1.4866943359375, 1.55908203125, 1.6314697265625, 1.703857421875, 1.7762451171875, 1.8486328125, 1.9210205078125, 1.993408203125, 2.0657958984375, 2.13818359375, 2.2105712890625, 2.282958984375, 2.3553466796875, 2.427734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 14.0, 15.0, 11.0, 28.0, 27.0, 46.0, 34.0, 47.0, 53.0, 68.0, 66.0, 68.0, 72.0, 76.0, 59.0, 44.0, 52.0, 49.0, 38.0, 24.0, 24.0, 24.0, 17.0, 10.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.909515380859375, -0.88006591796875, -0.850616455078125, -0.8211669921875, -0.791717529296875, -0.76226806640625, -0.732818603515625, -0.703369140625, -0.673919677734375, -0.64447021484375, -0.615020751953125, -0.5855712890625, -0.556121826171875, -0.52667236328125, -0.497222900390625, -0.4677734375, -0.438323974609375, -0.40887451171875, -0.379425048828125, -0.3499755859375, -0.320526123046875, -0.29107666015625, -0.261627197265625, -0.232177734375, -0.202728271484375, -0.17327880859375, -0.143829345703125, -0.1143798828125, -0.084930419921875, -0.05548095703125, -0.026031494140625, 0.00341796875, 0.032867431640625, 0.06231689453125, 0.091766357421875, 0.1212158203125, 0.150665283203125, 0.18011474609375, 0.209564208984375, 0.239013671875, 0.268463134765625, 0.29791259765625, 0.327362060546875, 0.3568115234375, 0.386260986328125, 0.41571044921875, 0.445159912109375, 0.474609375, 0.504058837890625, 0.53350830078125, 0.562957763671875, 0.5924072265625, 0.621856689453125, 0.65130615234375, 0.680755615234375, 0.710205078125, 0.739654541015625, 0.76910400390625, 0.798553466796875, 0.8280029296875, 0.857452392578125, 0.88690185546875, 0.916351318359375, 0.94580078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 39.0, 52.0, 57.0, 103.0, 143.0, 265.0, 527.0, 1016.0, 2444.0, 6116.0, 17876.0, 70046.0, 373663.0, 457119.0, 85728.0, 21067.0, 6977.0, 2739.0, 1221.0, 537.0, 269.0, 148.0, 116.0, 65.0, 46.0, 28.0, 27.0, 25.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80047607421875, -2.7103271484375, -2.62017822265625, -2.530029296875, -2.43988037109375, -2.3497314453125, -2.25958251953125, -2.16943359375, -2.07928466796875, -1.9891357421875, -1.89898681640625, -1.808837890625, -1.71868896484375, -1.6285400390625, -1.53839111328125, -1.4482421875, -1.35809326171875, -1.2679443359375, -1.17779541015625, -1.087646484375, -0.99749755859375, -0.9073486328125, -0.81719970703125, -0.72705078125, -0.63690185546875, -0.5467529296875, -0.45660400390625, -0.366455078125, -0.27630615234375, -0.1861572265625, -0.09600830078125, -0.005859375, 0.08428955078125, 0.1744384765625, 0.26458740234375, 0.354736328125, 0.44488525390625, 0.5350341796875, 0.62518310546875, 0.71533203125, 0.80548095703125, 0.8956298828125, 0.98577880859375, 1.075927734375, 1.16607666015625, 1.2562255859375, 1.34637451171875, 1.4365234375, 1.52667236328125, 1.6168212890625, 1.70697021484375, 1.797119140625, 1.88726806640625, 1.9774169921875, 2.06756591796875, 2.15771484375, 2.24786376953125, 2.3380126953125, 2.42816162109375, 2.518310546875, 2.60845947265625, 2.6986083984375, 2.78875732421875, 2.87890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 5.0, 5.0, 13.0, 12.0, 13.0, 17.0, 18.0, 23.0, 27.0, 36.0, 29.0, 49.0, 33.0, 51.0, 54.0, 51.0, 48.0, 54.0, 51.0, 40.0, 53.0, 50.0, 33.0, 41.0, 36.0, 28.0, 23.0, 14.0, 13.0, 13.0, 11.0, 4.0, 5.0, 6.0, 8.0, 4.0, 1.0, 6.0, 3.0, 0.0, 3.0, 5.0], "bins": [-4.78515625, -4.6619873046875, -4.538818359375, -4.4156494140625, -4.29248046875, -4.1693115234375, -4.046142578125, -3.9229736328125, -3.7998046875, -3.6766357421875, -3.553466796875, -3.4302978515625, -3.30712890625, -3.1839599609375, -3.060791015625, -2.9376220703125, -2.814453125, -2.6912841796875, -2.568115234375, -2.4449462890625, -2.32177734375, -2.1986083984375, -2.075439453125, -1.9522705078125, -1.8291015625, -1.7059326171875, -1.582763671875, -1.4595947265625, -1.33642578125, -1.2132568359375, -1.090087890625, -0.9669189453125, -0.84375, -0.7205810546875, -0.597412109375, -0.4742431640625, -0.35107421875, -0.2279052734375, -0.104736328125, 0.0184326171875, 0.1416015625, 0.2647705078125, 0.387939453125, 0.5111083984375, 0.63427734375, 0.7574462890625, 0.880615234375, 1.0037841796875, 1.126953125, 1.2501220703125, 1.373291015625, 1.4964599609375, 1.61962890625, 1.7427978515625, 1.865966796875, 1.9891357421875, 2.1123046875, 2.2354736328125, 2.358642578125, 2.4818115234375, 2.60498046875, 2.7281494140625, 2.851318359375, 2.9744873046875, 3.09765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 12.0, 16.0, 19.0, 64.0, 124.0, 308.0, 1087.0, 7519.0, 1012012.0, 24793.0, 1871.0, 424.0, 161.0, 62.0, 31.0, 17.0, 15.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.6126708984375, -7.405029296875, -7.1973876953125, -6.98974609375, -6.7821044921875, -6.574462890625, -6.3668212890625, -6.1591796875, -5.9515380859375, -5.743896484375, -5.5362548828125, -5.32861328125, -5.1209716796875, -4.913330078125, -4.7056884765625, -4.498046875, -4.2904052734375, -4.082763671875, -3.8751220703125, -3.66748046875, -3.4598388671875, -3.252197265625, -3.0445556640625, -2.8369140625, -2.6292724609375, -2.421630859375, -2.2139892578125, -2.00634765625, -1.7987060546875, -1.591064453125, -1.3834228515625, -1.17578125, -0.9681396484375, -0.760498046875, -0.5528564453125, -0.34521484375, -0.1375732421875, 0.070068359375, 0.2777099609375, 0.4853515625, 0.6929931640625, 0.900634765625, 1.1082763671875, 1.31591796875, 1.5235595703125, 1.731201171875, 1.9388427734375, 2.146484375, 2.3541259765625, 2.561767578125, 2.7694091796875, 2.97705078125, 3.1846923828125, 3.392333984375, 3.5999755859375, 3.8076171875, 4.0152587890625, 4.222900390625, 4.4305419921875, 4.63818359375, 4.8458251953125, 5.053466796875, 5.2611083984375, 5.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 9.0, 4.0, 20.0, 27.0, 48.0, 88.0, 99.0, 151.0, 164.0, 136.0, 109.0, 53.0, 35.0, 16.0, 18.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028228759765625, -0.0002748984843492508, -0.0002675093710422516, -0.0002601202577352524, -0.0002527311444282532, -0.00024534203112125397, -0.00023795291781425476, -0.00023056380450725555, -0.00022317469120025635, -0.00021578557789325714, -0.00020839646458625793, -0.00020100735127925873, -0.00019361823797225952, -0.00018622912466526031, -0.0001788400113582611, -0.0001714508980512619, -0.0001640617847442627, -0.0001566726714372635, -0.00014928355813026428, -0.00014189444482326508, -0.00013450533151626587, -0.00012711621820926666, -0.00011972710490226746, -0.00011233799159526825, -0.00010494887828826904, -9.755976498126984e-05, -9.017065167427063e-05, -8.278153836727142e-05, -7.539242506027222e-05, -6.800331175327301e-05, -6.0614198446273804e-05, -5.32250851392746e-05, -4.583597183227539e-05, -3.8446858525276184e-05, -3.105774521827698e-05, -2.366863191127777e-05, -1.6279518604278564e-05, -8.890405297279358e-06, -1.5012919902801514e-06, 5.887821316719055e-06, 1.3276934623718262e-05, 2.0666047930717468e-05, 2.8055161237716675e-05, 3.544427454471588e-05, 4.283338785171509e-05, 5.0222501158714294e-05, 5.76116144657135e-05, 6.500072777271271e-05, 7.238984107971191e-05, 7.977895438671112e-05, 8.716806769371033e-05, 9.455718100070953e-05, 0.00010194629430770874, 0.00010933540761470795, 0.00011672452092170715, 0.00012411363422870636, 0.00013150274753570557, 0.00013889186084270477, 0.00014628097414970398, 0.00015367008745670319, 0.0001610592007637024, 0.0001684483140707016, 0.0001758374273777008, 0.0001832265406847, 0.00019061565399169922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 15.0, 33.0, 61.0, 92.0, 195.0, 476.0, 1209.0, 4130.0, 47458.0, 949587.0, 39361.0, 3872.0, 1177.0, 478.0, 195.0, 106.0, 43.0, 18.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.064453125, -2.9700927734375, -2.875732421875, -2.7813720703125, -2.68701171875, -2.5926513671875, -2.498291015625, -2.4039306640625, -2.3095703125, -2.2152099609375, -2.120849609375, -2.0264892578125, -1.93212890625, -1.8377685546875, -1.743408203125, -1.6490478515625, -1.5546875, -1.4603271484375, -1.365966796875, -1.2716064453125, -1.17724609375, -1.0828857421875, -0.988525390625, -0.8941650390625, -0.7998046875, -0.7054443359375, -0.611083984375, -0.5167236328125, -0.42236328125, -0.3280029296875, -0.233642578125, -0.1392822265625, -0.044921875, 0.0494384765625, 0.143798828125, 0.2381591796875, 0.33251953125, 0.4268798828125, 0.521240234375, 0.6156005859375, 0.7099609375, 0.8043212890625, 0.898681640625, 0.9930419921875, 1.08740234375, 1.1817626953125, 1.276123046875, 1.3704833984375, 1.46484375, 1.5592041015625, 1.653564453125, 1.7479248046875, 1.84228515625, 1.9366455078125, 2.031005859375, 2.1253662109375, 2.2197265625, 2.3140869140625, 2.408447265625, 2.5028076171875, 2.59716796875, 2.6915283203125, 2.785888671875, 2.8802490234375, 2.974609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 13.0, 11.0, 22.0, 62.0, 108.0, 220.0, 252.0, 143.0, 74.0, 35.0, 19.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.513671875, -2.413848876953125, -2.31402587890625, -2.214202880859375, -2.1143798828125, -2.014556884765625, -1.91473388671875, -1.814910888671875, -1.715087890625, -1.615264892578125, -1.51544189453125, -1.415618896484375, -1.3157958984375, -1.215972900390625, -1.11614990234375, -1.016326904296875, -0.91650390625, -0.816680908203125, -0.71685791015625, -0.617034912109375, -0.5172119140625, -0.417388916015625, -0.31756591796875, -0.217742919921875, -0.117919921875, -0.018096923828125, 0.08172607421875, 0.181549072265625, 0.2813720703125, 0.381195068359375, 0.48101806640625, 0.580841064453125, 0.6806640625, 0.780487060546875, 0.88031005859375, 0.980133056640625, 1.0799560546875, 1.179779052734375, 1.27960205078125, 1.379425048828125, 1.479248046875, 1.579071044921875, 1.67889404296875, 1.778717041015625, 1.8785400390625, 1.978363037109375, 2.07818603515625, 2.178009033203125, 2.27783203125, 2.377655029296875, 2.47747802734375, 2.577301025390625, 2.6771240234375, 2.776947021484375, 2.87677001953125, 2.976593017578125, 3.076416015625, 3.176239013671875, 3.27606201171875, 3.375885009765625, 3.4757080078125, 3.575531005859375, 3.67535400390625, 3.775177001953125, 3.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 17.0, 16.0, 32.0, 26.0, 44.0, 53.0, 51.0, 68.0, 95.0, 115.0, 91.0, 72.0, 54.0, 69.0, 51.0, 42.0, 16.0, 20.0, 22.0, 7.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.282142639160156, -16.755569458007812, -16.2289981842041, -15.702425003051758, -15.17585277557373, -14.649280548095703, -14.12270736694336, -13.596135139465332, -13.069562911987305, -12.542990684509277, -12.016417503356934, -11.489845275878906, -10.963273048400879, -10.436700820922852, -9.910127639770508, -9.38355541229248, -8.856982231140137, -8.33041000366211, -7.803837299346924, -7.277264595031738, -6.750692367553711, -6.224119663238525, -5.69754695892334, -5.1709747314453125, -4.644402027130127, -4.117829322814941, -3.591257095336914, -3.0646843910217285, -2.538111925125122, -2.0115394592285156, -1.48496675491333, -0.9583942890167236, -0.4318218231201172, 0.09475070238113403, 0.6213232278823853, 1.1478958129882812, 1.6744682788848877, 2.201040744781494, 2.7276134490966797, 3.254185914993286, 3.7807583808898926, 4.307331085205078, 4.8339033126831055, 5.360476016998291, 5.887048721313477, 6.413620948791504, 6.9401936531066895, 7.466766357421875, 7.993338584899902, 8.51991081237793, 9.046483993530273, 9.5730562210083, 10.099628448486328, 10.626201629638672, 11.1527738571167, 11.679346084594727, 12.20591926574707, 12.732491493225098, 13.259064674377441, 13.785636901855469, 14.312209129333496, 14.838781356811523, 15.365354537963867, 15.891926765441895, 16.418498992919922]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 10.0, 7.0, 10.0, 8.0, 12.0, 10.0, 20.0, 18.0, 31.0, 25.0, 36.0, 38.0, 44.0, 36.0, 49.0, 53.0, 44.0, 60.0, 35.0, 45.0, 37.0, 48.0, 33.0, 24.0, 33.0, 32.0, 30.0, 24.0, 21.0, 17.0, 21.0, 12.0, 12.0, 6.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.726259231567383, -17.16609001159668, -16.605920791625977, -16.045751571655273, -15.485581398010254, -14.92541217803955, -14.365242004394531, -13.805072784423828, -13.244903564453125, -12.684734344482422, -12.124565124511719, -11.5643949508667, -11.004225730895996, -10.444056510925293, -9.883886337280273, -9.32371711730957, -8.763547897338867, -8.203378677368164, -7.643208980560303, -7.083039283752441, -6.522870063781738, -5.962700843811035, -5.402531147003174, -4.8423614501953125, -4.282192230224609, -3.722022771835327, -3.161853313446045, -2.6016838550567627, -2.0415143966674805, -1.4813449382781982, -0.921175479888916, -0.3610060214996338, 0.19916534423828125, 0.7593348026275635, 1.3195042610168457, 1.879673719406128, 2.43984317779541, 3.0000126361846924, 3.5601820945739746, 4.120351791381836, 4.680521011352539, 5.240690231323242, 5.8008599281311035, 6.361029624938965, 6.921198844909668, 7.481368064880371, 8.04153823852539, 8.601707458496094, 9.161876678466797, 9.7220458984375, 10.282215118408203, 10.842385292053223, 11.402554512023926, 11.962723731994629, 12.522893905639648, 13.083063125610352, 13.643232345581055, 14.203401565551758, 14.763570785522461, 15.32374095916748, 15.883910179138184, 16.444080352783203, 17.004249572753906, 17.56441879272461, 18.124588012695312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 7.0, 8.0, 21.0, 24.0, 53.0, 55.0, 83.0, 160.0, 178.0, 300.0, 524.0, 966.0, 2013.0, 5072.0, 16349.0, 111334.0, 4005365.0, 36108.0, 8989.0, 3228.0, 1409.0, 726.0, 404.0, 306.0, 191.0, 132.0, 70.0, 53.0, 44.0, 19.0, 20.0, 14.0, 16.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.974517822265625, -2.87286376953125, -2.771209716796875, -2.6695556640625, -2.567901611328125, -2.46624755859375, -2.364593505859375, -2.262939453125, -2.161285400390625, -2.05963134765625, -1.957977294921875, -1.8563232421875, -1.754669189453125, -1.65301513671875, -1.551361083984375, -1.44970703125, -1.348052978515625, -1.24639892578125, -1.144744873046875, -1.0430908203125, -0.941436767578125, -0.83978271484375, -0.738128662109375, -0.636474609375, -0.534820556640625, -0.43316650390625, -0.331512451171875, -0.2298583984375, -0.128204345703125, -0.02655029296875, 0.075103759765625, 0.1767578125, 0.278411865234375, 0.38006591796875, 0.481719970703125, 0.5833740234375, 0.685028076171875, 0.78668212890625, 0.888336181640625, 0.989990234375, 1.091644287109375, 1.19329833984375, 1.294952392578125, 1.3966064453125, 1.498260498046875, 1.59991455078125, 1.701568603515625, 1.80322265625, 1.904876708984375, 2.00653076171875, 2.108184814453125, 2.2098388671875, 2.311492919921875, 2.41314697265625, 2.514801025390625, 2.616455078125, 2.718109130859375, 2.81976318359375, 2.921417236328125, 3.0230712890625, 3.124725341796875, 3.22637939453125, 3.328033447265625, 3.4296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 17.0, 18.0, 20.0, 32.0, 44.0, 51.0, 70.0, 62.0, 64.0, 64.0, 57.0, 78.0, 62.0, 51.0, 47.0, 52.0, 39.0, 35.0, 18.0, 18.0, 19.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.939422607421875, -0.90716552734375, -0.874908447265625, -0.8426513671875, -0.810394287109375, -0.77813720703125, -0.745880126953125, -0.713623046875, -0.681365966796875, -0.64910888671875, -0.616851806640625, -0.5845947265625, -0.552337646484375, -0.52008056640625, -0.487823486328125, -0.45556640625, -0.423309326171875, -0.39105224609375, -0.358795166015625, -0.3265380859375, -0.294281005859375, -0.26202392578125, -0.229766845703125, -0.197509765625, -0.165252685546875, -0.13299560546875, -0.100738525390625, -0.0684814453125, -0.036224365234375, -0.00396728515625, 0.028289794921875, 0.060546875, 0.092803955078125, 0.12506103515625, 0.157318115234375, 0.1895751953125, 0.221832275390625, 0.25408935546875, 0.286346435546875, 0.318603515625, 0.350860595703125, 0.38311767578125, 0.415374755859375, 0.4476318359375, 0.479888916015625, 0.51214599609375, 0.544403076171875, 0.57666015625, 0.608917236328125, 0.64117431640625, 0.673431396484375, 0.7056884765625, 0.737945556640625, 0.77020263671875, 0.802459716796875, 0.834716796875, 0.866973876953125, 0.89923095703125, 0.931488037109375, 0.9637451171875, 0.996002197265625, 1.02825927734375, 1.060516357421875, 1.0927734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 15.0, 10.0, 10.0, 19.0, 25.0, 33.0, 46.0, 75.0, 99.0, 139.0, 182.0, 253.0, 383.0, 682.0, 1146.0, 2166.0, 4221.0, 9329.0, 24707.0, 98071.0, 3856366.0, 144230.0, 30360.0, 10957.0, 4788.0, 2463.0, 1261.0, 769.0, 424.0, 319.0, 205.0, 149.0, 98.0, 79.0, 44.0, 31.0, 28.0, 20.0, 18.0, 17.0, 9.0, 2.0, 8.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0], "bins": [-2.833984375, -2.754364013671875, -2.67474365234375, -2.595123291015625, -2.5155029296875, -2.435882568359375, -2.35626220703125, -2.276641845703125, -2.197021484375, -2.117401123046875, -2.03778076171875, -1.958160400390625, -1.8785400390625, -1.798919677734375, -1.71929931640625, -1.639678955078125, -1.56005859375, -1.480438232421875, -1.40081787109375, -1.321197509765625, -1.2415771484375, -1.161956787109375, -1.08233642578125, -1.002716064453125, -0.923095703125, -0.843475341796875, -0.76385498046875, -0.684234619140625, -0.6046142578125, -0.524993896484375, -0.44537353515625, -0.365753173828125, -0.2861328125, -0.206512451171875, -0.12689208984375, -0.047271728515625, 0.0323486328125, 0.111968994140625, 0.19158935546875, 0.271209716796875, 0.350830078125, 0.430450439453125, 0.51007080078125, 0.589691162109375, 0.6693115234375, 0.748931884765625, 0.82855224609375, 0.908172607421875, 0.98779296875, 1.067413330078125, 1.14703369140625, 1.226654052734375, 1.3062744140625, 1.385894775390625, 1.46551513671875, 1.545135498046875, 1.624755859375, 1.704376220703125, 1.78399658203125, 1.863616943359375, 1.9432373046875, 2.022857666015625, 2.10247802734375, 2.182098388671875, 2.26171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 23.0, 45.0, 48.0, 156.0, 3257.0, 314.0, 84.0, 45.0, 28.0, 18.0, 7.0, 9.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1884002685546875, -1.156097412109375, -1.1237945556640625, -1.09149169921875, -1.0591888427734375, -1.026885986328125, -0.9945831298828125, -0.9622802734375, -0.9299774169921875, -0.897674560546875, -0.8653717041015625, -0.83306884765625, -0.8007659912109375, -0.768463134765625, -0.7361602783203125, -0.703857421875, -0.6715545654296875, -0.639251708984375, -0.6069488525390625, -0.57464599609375, -0.5423431396484375, -0.510040283203125, -0.4777374267578125, -0.4454345703125, -0.4131317138671875, -0.380828857421875, -0.3485260009765625, -0.31622314453125, -0.2839202880859375, -0.251617431640625, -0.2193145751953125, -0.18701171875, -0.1547088623046875, -0.122406005859375, -0.0901031494140625, -0.05780029296875, -0.0254974365234375, 0.006805419921875, 0.0391082763671875, 0.0714111328125, 0.1037139892578125, 0.136016845703125, 0.1683197021484375, 0.20062255859375, 0.2329254150390625, 0.265228271484375, 0.2975311279296875, 0.329833984375, 0.3621368408203125, 0.394439697265625, 0.4267425537109375, 0.45904541015625, 0.4913482666015625, 0.523651123046875, 0.5559539794921875, 0.5882568359375, 0.6205596923828125, 0.652862548828125, 0.6851654052734375, 0.71746826171875, 0.7497711181640625, 0.782073974609375, 0.8143768310546875, 0.8466796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 7.0, 13.0, 21.0, 37.0, 53.0, 54.0, 78.0, 92.0, 111.0, 98.0, 114.0, 97.0, 73.0, 60.0, 42.0, 12.0, 20.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5895838737487793, -3.4941811561584473, -3.398778200149536, -3.303375482559204, -3.207972526550293, -3.112569808959961, -3.017167091369629, -2.9217641353607178, -2.8263611793518066, -2.7309584617614746, -2.6355555057525635, -2.5401527881622314, -2.4447498321533203, -2.3493471145629883, -2.2539443969726562, -2.158541440963745, -2.063138723373413, -1.9677358865737915, -1.87233304977417, -1.776930332183838, -1.6815273761749268, -1.5861246585845947, -1.4907218217849731, -1.3953189849853516, -1.29991614818573, -1.2045133113861084, -1.1091104745864868, -1.0137076377868652, -0.9183048605918884, -0.8229020237922668, -0.72749924659729, -0.6320964097976685, -0.5366935729980469, -0.4412907361984253, -0.3458879292011261, -0.2504851222038269, -0.15508228540420532, -0.05967944860458374, 0.035723328590393066, 0.13112616539001465, 0.22652900218963623, 0.3219318389892578, 0.417334645986557, 0.5127374529838562, 0.6081402897834778, 0.7035431265830994, 0.7989459037780762, 0.8943487405776978, 0.9897515773773193, 1.085154414176941, 1.1805572509765625, 1.2759599685668945, 1.3713629245758057, 1.4667656421661377, 1.5621684789657593, 1.6575713157653809, 1.7529741525650024, 1.848376989364624, 1.9437798261642456, 2.039182662963867, 2.134585380554199, 2.2299883365631104, 2.3253910541534424, 2.4207940101623535, 2.5161967277526855]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 22.0, 14.0, 28.0, 26.0, 26.0, 23.0, 32.0, 40.0, 32.0, 32.0, 45.0, 43.0, 40.0, 50.0, 46.0, 56.0, 40.0, 34.0, 55.0, 51.0, 36.0, 35.0, 29.0, 18.0, 23.0, 17.0, 19.0, 9.0, 7.0, 10.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9960172176361084, -1.9374629259109497, -1.8789085149765015, -1.8203542232513428, -1.761799931526184, -1.7032456398010254, -1.6446912288665771, -1.5861369371414185, -1.5275826454162598, -1.469028353691101, -1.4104739427566528, -1.3519196510314941, -1.2933653593063354, -1.2348110675811768, -1.1762566566467285, -1.1177023649215698, -1.0591480731964111, -1.0005937814712524, -0.942039430141449, -0.8834850788116455, -0.8249307870864868, -0.7663764357566833, -0.7078220844268799, -0.6492677927017212, -0.590713381767273, -0.5321590304374695, -0.4736047387123108, -0.4150503873825073, -0.35649609565734863, -0.29794174432754517, -0.2393874228000641, -0.180833101272583, -0.12227880954742432, -0.06372448801994324, -0.005170159041881561, 0.053384169936180115, 0.1119384914636612, 0.17049282789230347, 0.22904714941978455, 0.2876014709472656, 0.3461557924747467, 0.4047101140022278, 0.46326443552970886, 0.5218187570571899, 0.5803731083869934, 0.6389274597167969, 0.6974817514419556, 0.7560360431671143, 0.8145903944969177, 0.8731447458267212, 0.9316990375518799, 0.9902533888816833, 1.0488077402114868, 1.1073620319366455, 1.1659163236618042, 1.224470615386963, 1.2830250263214111, 1.3415793180465698, 1.400133728981018, 1.4586880207061768, 1.5172423124313354, 1.5757966041564941, 1.6343510150909424, 1.692905306816101, 1.7514595985412598]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 17.0, 25.0, 42.0, 62.0, 69.0, 117.0, 172.0, 282.0, 449.0, 777.0, 1381.0, 2470.0, 4807.0, 10066.0, 22641.0, 56024.0, 140962.0, 288561.0, 283734.0, 138478.0, 54614.0, 22130.0, 9854.0, 4856.0, 2541.0, 1359.0, 757.0, 455.0, 291.0, 175.0, 122.0, 92.0, 45.0, 46.0, 17.0, 14.0, 13.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6358795166015625, -1.581329345703125, -1.5267791748046875, -1.47222900390625, -1.4176788330078125, -1.363128662109375, -1.3085784912109375, -1.2540283203125, -1.1994781494140625, -1.144927978515625, -1.0903778076171875, -1.03582763671875, -0.9812774658203125, -0.926727294921875, -0.8721771240234375, -0.817626953125, -0.7630767822265625, -0.708526611328125, -0.6539764404296875, -0.59942626953125, -0.5448760986328125, -0.490325927734375, -0.4357757568359375, -0.3812255859375, -0.3266754150390625, -0.272125244140625, -0.2175750732421875, -0.16302490234375, -0.1084747314453125, -0.053924560546875, 0.0006256103515625, 0.05517578125, 0.1097259521484375, 0.164276123046875, 0.2188262939453125, 0.27337646484375, 0.3279266357421875, 0.382476806640625, 0.4370269775390625, 0.4915771484375, 0.5461273193359375, 0.600677490234375, 0.6552276611328125, 0.70977783203125, 0.7643280029296875, 0.818878173828125, 0.8734283447265625, 0.927978515625, 0.9825286865234375, 1.037078857421875, 1.0916290283203125, 1.14617919921875, 1.2007293701171875, 1.255279541015625, 1.3098297119140625, 1.3643798828125, 1.4189300537109375, 1.473480224609375, 1.5280303955078125, 1.58258056640625, 1.6371307373046875, 1.691680908203125, 1.7462310791015625, 1.80078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 7.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 28.0, 34.0, 37.0, 42.0, 50.0, 55.0, 47.0, 65.0, 65.0, 67.0, 54.0, 53.0, 49.0, 46.0, 41.0, 42.0, 24.0, 32.0, 22.0, 16.0, 11.0, 9.0, 13.0, 3.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.013671875, -0.9827423095703125, -0.951812744140625, -0.9208831787109375, -0.88995361328125, -0.8590240478515625, -0.828094482421875, -0.7971649169921875, -0.7662353515625, -0.7353057861328125, -0.704376220703125, -0.6734466552734375, -0.64251708984375, -0.6115875244140625, -0.580657958984375, -0.5497283935546875, -0.518798828125, -0.4878692626953125, -0.456939697265625, -0.4260101318359375, -0.39508056640625, -0.3641510009765625, -0.333221435546875, -0.3022918701171875, -0.2713623046875, -0.2404327392578125, -0.209503173828125, -0.1785736083984375, -0.14764404296875, -0.1167144775390625, -0.085784912109375, -0.0548553466796875, -0.02392578125, 0.0070037841796875, 0.037933349609375, 0.0688629150390625, 0.09979248046875, 0.1307220458984375, 0.161651611328125, 0.1925811767578125, 0.2235107421875, 0.2544403076171875, 0.285369873046875, 0.3162994384765625, 0.34722900390625, 0.3781585693359375, 0.409088134765625, 0.4400177001953125, 0.470947265625, 0.5018768310546875, 0.532806396484375, 0.5637359619140625, 0.59466552734375, 0.6255950927734375, 0.656524658203125, 0.6874542236328125, 0.7183837890625, 0.7493133544921875, 0.780242919921875, 0.8111724853515625, 0.84210205078125, 0.8730316162109375, 0.903961181640625, 0.9348907470703125, 0.9658203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 8.0, 14.0, 12.0, 18.0, 30.0, 44.0, 83.0, 136.0, 235.0, 446.0, 849.0, 2099.0, 5715.0, 21016.0, 114378.0, 597073.0, 252189.0, 39528.0, 9219.0, 2959.0, 1261.0, 565.0, 261.0, 135.0, 96.0, 46.0, 35.0, 22.0, 21.0, 18.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.89453125, -3.791229248046875, -3.68792724609375, -3.584625244140625, -3.4813232421875, -3.378021240234375, -3.27471923828125, -3.171417236328125, -3.068115234375, -2.964813232421875, -2.86151123046875, -2.758209228515625, -2.6549072265625, -2.551605224609375, -2.44830322265625, -2.345001220703125, -2.24169921875, -2.138397216796875, -2.03509521484375, -1.931793212890625, -1.8284912109375, -1.725189208984375, -1.62188720703125, -1.518585205078125, -1.415283203125, -1.311981201171875, -1.20867919921875, -1.105377197265625, -1.0020751953125, -0.898773193359375, -0.79547119140625, -0.692169189453125, -0.5888671875, -0.485565185546875, -0.38226318359375, -0.278961181640625, -0.1756591796875, -0.072357177734375, 0.03094482421875, 0.134246826171875, 0.237548828125, 0.340850830078125, 0.44415283203125, 0.547454833984375, 0.6507568359375, 0.754058837890625, 0.85736083984375, 0.960662841796875, 1.06396484375, 1.167266845703125, 1.27056884765625, 1.373870849609375, 1.4771728515625, 1.580474853515625, 1.68377685546875, 1.787078857421875, 1.890380859375, 1.993682861328125, 2.09698486328125, 2.200286865234375, 2.3035888671875, 2.406890869140625, 2.51019287109375, 2.613494873046875, 2.716796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 19.0, 33.0, 29.0, 39.0, 44.0, 64.0, 60.0, 56.0, 77.0, 72.0, 65.0, 68.0, 58.0, 50.0, 39.0, 34.0, 33.0, 27.0, 12.0, 16.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.61956787109375, -5.4500732421875, -5.28057861328125, -5.111083984375, -4.94158935546875, -4.7720947265625, -4.60260009765625, -4.43310546875, -4.26361083984375, -4.0941162109375, -3.92462158203125, -3.755126953125, -3.58563232421875, -3.4161376953125, -3.24664306640625, -3.0771484375, -2.90765380859375, -2.7381591796875, -2.56866455078125, -2.399169921875, -2.22967529296875, -2.0601806640625, -1.89068603515625, -1.72119140625, -1.55169677734375, -1.3822021484375, -1.21270751953125, -1.043212890625, -0.87371826171875, -0.7042236328125, -0.53472900390625, -0.365234375, -0.19573974609375, -0.0262451171875, 0.14324951171875, 0.312744140625, 0.48223876953125, 0.6517333984375, 0.82122802734375, 0.99072265625, 1.16021728515625, 1.3297119140625, 1.49920654296875, 1.668701171875, 1.83819580078125, 2.0076904296875, 2.17718505859375, 2.3466796875, 2.51617431640625, 2.6856689453125, 2.85516357421875, 3.024658203125, 3.19415283203125, 3.3636474609375, 3.53314208984375, 3.70263671875, 3.87213134765625, 4.0416259765625, 4.21112060546875, 4.380615234375, 4.55010986328125, 4.7196044921875, 4.88909912109375, 5.05859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 16.0, 44.0, 49.0, 130.0, 250.0, 764.0, 2911.0, 26775.0, 885850.0, 123724.0, 6099.0, 1259.0, 376.0, 146.0, 70.0, 32.0, 24.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.4852294921875, -3.378662109375, -3.2720947265625, -3.16552734375, -3.0589599609375, -2.952392578125, -2.8458251953125, -2.7392578125, -2.6326904296875, -2.526123046875, -2.4195556640625, -2.31298828125, -2.2064208984375, -2.099853515625, -1.9932861328125, -1.88671875, -1.7801513671875, -1.673583984375, -1.5670166015625, -1.46044921875, -1.3538818359375, -1.247314453125, -1.1407470703125, -1.0341796875, -0.9276123046875, -0.821044921875, -0.7144775390625, -0.60791015625, -0.5013427734375, -0.394775390625, -0.2882080078125, -0.181640625, -0.0750732421875, 0.031494140625, 0.1380615234375, 0.24462890625, 0.3511962890625, 0.457763671875, 0.5643310546875, 0.6708984375, 0.7774658203125, 0.884033203125, 0.9906005859375, 1.09716796875, 1.2037353515625, 1.310302734375, 1.4168701171875, 1.5234375, 1.6300048828125, 1.736572265625, 1.8431396484375, 1.94970703125, 2.0562744140625, 2.162841796875, 2.2694091796875, 2.3759765625, 2.4825439453125, 2.589111328125, 2.6956787109375, 2.80224609375, 2.9088134765625, 3.015380859375, 3.1219482421875, 3.228515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 16.0, 20.0, 27.0, 34.0, 58.0, 77.0, 115.0, 125.0, 110.0, 112.0, 80.0, 59.0, 50.0, 34.0, 19.0, 11.0, 7.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002899169921875, -0.0002820640802383423, -0.00027421116828918457, -0.00026635825634002686, -0.00025850534439086914, -0.0002506524324417114, -0.0002427995204925537, -0.000234946608543396, -0.00022709369659423828, -0.00021924078464508057, -0.00021138787269592285, -0.00020353496074676514, -0.00019568204879760742, -0.0001878291368484497, -0.000179976224899292, -0.00017212331295013428, -0.00016427040100097656, -0.00015641748905181885, -0.00014856457710266113, -0.00014071166515350342, -0.0001328587532043457, -0.000125005841255188, -0.00011715292930603027, -0.00010930001735687256, -0.00010144710540771484, -9.359419345855713e-05, -8.574128150939941e-05, -7.78883695602417e-05, -7.003545761108398e-05, -6.218254566192627e-05, -5.4329633712768555e-05, -4.647672176361084e-05, -3.8623809814453125e-05, -3.077089786529541e-05, -2.2917985916137695e-05, -1.506507396697998e-05, -7.212162017822266e-06, 6.407499313354492e-07, 8.493661880493164e-06, 1.634657382965088e-05, 2.4199485778808594e-05, 3.205239772796631e-05, 3.9905309677124023e-05, 4.775822162628174e-05, 5.561113357543945e-05, 6.346404552459717e-05, 7.131695747375488e-05, 7.91698694229126e-05, 8.702278137207031e-05, 9.487569332122803e-05, 0.00010272860527038574, 0.00011058151721954346, 0.00011843442916870117, 0.0001262873411178589, 0.0001341402530670166, 0.00014199316501617432, 0.00014984607696533203, 0.00015769898891448975, 0.00016555190086364746, 0.00017340481281280518, 0.0001812577247619629, 0.0001891106367111206, 0.00019696354866027832, 0.00020481646060943604, 0.00021266937255859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 19.0, 39.0, 74.0, 129.0, 281.0, 670.0, 2086.0, 13223.0, 422643.0, 588630.0, 16800.0, 2527.0, 727.0, 293.0, 146.0, 84.0, 68.0, 23.0, 18.0, 18.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.388763427734375, -2.29705810546875, -2.205352783203125, -2.1136474609375, -2.021942138671875, -1.93023681640625, -1.838531494140625, -1.746826171875, -1.655120849609375, -1.56341552734375, -1.471710205078125, -1.3800048828125, -1.288299560546875, -1.19659423828125, -1.104888916015625, -1.01318359375, -0.921478271484375, -0.82977294921875, -0.738067626953125, -0.6463623046875, -0.554656982421875, -0.46295166015625, -0.371246337890625, -0.279541015625, -0.187835693359375, -0.09613037109375, -0.004425048828125, 0.0872802734375, 0.178985595703125, 0.27069091796875, 0.362396240234375, 0.4541015625, 0.545806884765625, 0.63751220703125, 0.729217529296875, 0.8209228515625, 0.912628173828125, 1.00433349609375, 1.096038818359375, 1.187744140625, 1.279449462890625, 1.37115478515625, 1.462860107421875, 1.5545654296875, 1.646270751953125, 1.73797607421875, 1.829681396484375, 1.92138671875, 2.013092041015625, 2.10479736328125, 2.196502685546875, 2.2882080078125, 2.379913330078125, 2.47161865234375, 2.563323974609375, 2.655029296875, 2.746734619140625, 2.83843994140625, 2.930145263671875, 3.0218505859375, 3.113555908203125, 3.20526123046875, 3.296966552734375, 3.388671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 11.0, 23.0, 66.0, 116.0, 190.0, 215.0, 177.0, 111.0, 39.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.3228759765625, -2.196533203125, -2.0701904296875, -1.94384765625, -1.8175048828125, -1.691162109375, -1.5648193359375, -1.4384765625, -1.3121337890625, -1.185791015625, -1.0594482421875, -0.93310546875, -0.8067626953125, -0.680419921875, -0.5540771484375, -0.427734375, -0.3013916015625, -0.175048828125, -0.0487060546875, 0.07763671875, 0.2039794921875, 0.330322265625, 0.4566650390625, 0.5830078125, 0.7093505859375, 0.835693359375, 0.9620361328125, 1.08837890625, 1.2147216796875, 1.341064453125, 1.4674072265625, 1.59375, 1.7200927734375, 1.846435546875, 1.9727783203125, 2.09912109375, 2.2254638671875, 2.351806640625, 2.4781494140625, 2.6044921875, 2.7308349609375, 2.857177734375, 2.9835205078125, 3.10986328125, 3.2362060546875, 3.362548828125, 3.4888916015625, 3.615234375, 3.7415771484375, 3.867919921875, 3.9942626953125, 4.12060546875, 4.2469482421875, 4.373291015625, 4.4996337890625, 4.6259765625, 4.7523193359375, 4.878662109375, 5.0050048828125, 5.13134765625, 5.2576904296875, 5.384033203125, 5.5103759765625, 5.63671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 22.0, 144.0, 469.0, 318.0, 48.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.7418975830078, -159.59458923339844, -156.447265625, -153.29995727539062, -150.1526336669922, -147.0053253173828, -143.85800170898438, -140.710693359375, -137.56338500976562, -134.41607666015625, -131.2687530517578, -128.12144470214844, -124.97412872314453, -121.82681274414062, -118.67949676513672, -115.53218078613281, -112.3848648071289, -109.237548828125, -106.0902328491211, -102.94291687011719, -99.79560852050781, -96.6482925415039, -93.5009765625, -90.3536605834961, -87.20634460449219, -84.05902862548828, -80.91171264648438, -77.764404296875, -74.6170883178711, -71.46977233886719, -68.32245635986328, -65.17514038085938, -62.02782440185547, -58.88050842285156, -55.73319625854492, -52.585880279541016, -49.438568115234375, -46.29125213623047, -43.14393615722656, -39.996620178222656, -36.849308013916016, -33.70199203491211, -30.55467987060547, -27.407363891601562, -24.26004981994629, -21.112735748291016, -17.96541976928711, -14.818105697631836, -11.670791625976562, -8.523477554321289, -5.376162528991699, -2.2288475036621094, 0.9184665679931641, 4.0657806396484375, 7.213096618652344, 10.360410690307617, 13.50772476196289, 16.655038833618164, 19.802352905273438, 22.949668884277344, 26.096982955932617, 29.24429702758789, 32.3916130065918, 35.53892517089844, 38.686241149902344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 6.0, 16.0, 16.0, 14.0, 22.0, 19.0, 11.0, 22.0, 30.0, 33.0, 40.0, 45.0, 48.0, 58.0, 50.0, 48.0, 51.0, 53.0, 47.0, 52.0, 41.0, 38.0, 45.0, 24.0, 31.0, 21.0, 19.0, 19.0, 17.0, 10.0, 10.0, 5.0, 4.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.56472396850586, -15.96933650970459, -15.373950004577637, -14.778562545776367, -14.183176040649414, -13.587788581848145, -12.992401123046875, -12.397014617919922, -11.801627159118652, -11.206239700317383, -10.61085319519043, -10.01546573638916, -9.42007827758789, -8.824691772460938, -8.229304313659668, -7.633917331695557, -7.038530349731445, -6.443143367767334, -5.847756385803223, -5.252368927001953, -4.656981945037842, -4.0615949630737305, -3.46620774269104, -2.8708205223083496, -2.2754335403442383, -1.6800464391708374, -1.0846593379974365, -0.48927223682403564, 0.10611486434936523, 0.7015018463134766, 1.296889066696167, 1.8922762870788574, 2.4876632690429688, 3.08305025100708, 3.6784374713897705, 4.273824691772461, 4.869211673736572, 5.464598655700684, 6.059986114501953, 6.6553730964660645, 7.250760078430176, 7.846147060394287, 8.441534042358398, 9.036921501159668, 9.632308959960938, 10.22769546508789, 10.82308292388916, 11.41847038269043, 12.013856887817383, 12.609244346618652, 13.204630851745605, 13.800018310546875, 14.395404815673828, 14.990792274475098, 15.586179733276367, 16.18156623840332, 16.776954650878906, 17.37234115600586, 17.967729568481445, 18.5631160736084, 19.15850257873535, 19.753890991210938, 20.34927749633789, 20.944664001464844, 21.540050506591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 23.0, 30.0, 40.0, 65.0, 73.0, 138.0, 194.0, 369.0, 730.0, 1420.0, 3324.0, 9262.0, 49579.0, 4093969.0, 23942.0, 6153.0, 2393.0, 1069.0, 602.0, 322.0, 194.0, 120.0, 71.0, 63.0, 31.0, 22.0, 9.0, 13.0, 9.0, 10.0, 2.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.61883544921875, -4.4759521484375, -4.33306884765625, -4.190185546875, -4.04730224609375, -3.9044189453125, -3.76153564453125, -3.61865234375, -3.47576904296875, -3.3328857421875, -3.19000244140625, -3.047119140625, -2.90423583984375, -2.7613525390625, -2.61846923828125, -2.4755859375, -2.33270263671875, -2.1898193359375, -2.04693603515625, -1.904052734375, -1.76116943359375, -1.6182861328125, -1.47540283203125, -1.33251953125, -1.18963623046875, -1.0467529296875, -0.90386962890625, -0.760986328125, -0.61810302734375, -0.4752197265625, -0.33233642578125, -0.189453125, -0.04656982421875, 0.0963134765625, 0.23919677734375, 0.382080078125, 0.52496337890625, 0.6678466796875, 0.81072998046875, 0.95361328125, 1.09649658203125, 1.2393798828125, 1.38226318359375, 1.525146484375, 1.66802978515625, 1.8109130859375, 1.95379638671875, 2.0966796875, 2.23956298828125, 2.3824462890625, 2.52532958984375, 2.668212890625, 2.81109619140625, 2.9539794921875, 3.09686279296875, 3.23974609375, 3.38262939453125, 3.5255126953125, 3.66839599609375, 3.811279296875, 3.95416259765625, 4.0970458984375, 4.23992919921875, 4.3828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 9.0, 20.0, 20.0, 27.0, 32.0, 39.0, 58.0, 53.0, 65.0, 61.0, 62.0, 83.0, 54.0, 68.0, 56.0, 40.0, 41.0, 39.0, 25.0, 35.0, 20.0, 18.0, 13.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9173049926757812, -0.8809967041015625, -0.8446884155273438, -0.808380126953125, -0.7720718383789062, -0.7357635498046875, -0.6994552612304688, -0.66314697265625, -0.6268386840820312, -0.5905303955078125, -0.5542221069335938, -0.517913818359375, -0.48160552978515625, -0.4452972412109375, -0.40898895263671875, -0.3726806640625, -0.33637237548828125, -0.3000640869140625, -0.26375579833984375, -0.227447509765625, -0.19113922119140625, -0.1548309326171875, -0.11852264404296875, -0.08221435546875, -0.04590606689453125, -0.0095977783203125, 0.02671051025390625, 0.063018798828125, 0.09932708740234375, 0.1356353759765625, 0.17194366455078125, 0.208251953125, 0.24456024169921875, 0.2808685302734375, 0.31717681884765625, 0.353485107421875, 0.38979339599609375, 0.4261016845703125, 0.46240997314453125, 0.49871826171875, 0.5350265502929688, 0.5713348388671875, 0.6076431274414062, 0.643951416015625, 0.6802597045898438, 0.7165679931640625, 0.7528762817382812, 0.7891845703125, 0.8254928588867188, 0.8618011474609375, 0.8981094360351562, 0.934417724609375, 0.9707260131835938, 1.0070343017578125, 1.0433425903320312, 1.07965087890625, 1.1159591674804688, 1.1522674560546875, 1.1885757446289062, 1.224884033203125, 1.2611923217773438, 1.2975006103515625, 1.3338088989257812, 1.3701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 11.0, 11.0, 14.0, 34.0, 46.0, 52.0, 87.0, 118.0, 159.0, 269.0, 364.0, 598.0, 925.0, 1679.0, 3008.0, 6455.0, 16747.0, 84031.0, 4020331.0, 37538.0, 10906.0, 4760.0, 2367.0, 1349.0, 793.0, 513.0, 323.0, 216.0, 155.0, 106.0, 80.0, 46.0, 43.0, 27.0, 23.0, 16.0, 10.0, 14.0, 8.0, 4.0, 7.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89111328125, -3.7626953125, -3.63427734375, -3.505859375, -3.37744140625, -3.2490234375, -3.12060546875, -2.9921875, -2.86376953125, -2.7353515625, -2.60693359375, -2.478515625, -2.35009765625, -2.2216796875, -2.09326171875, -1.96484375, -1.83642578125, -1.7080078125, -1.57958984375, -1.451171875, -1.32275390625, -1.1943359375, -1.06591796875, -0.9375, -0.80908203125, -0.6806640625, -0.55224609375, -0.423828125, -0.29541015625, -0.1669921875, -0.03857421875, 0.08984375, 0.21826171875, 0.3466796875, 0.47509765625, 0.603515625, 0.73193359375, 0.8603515625, 0.98876953125, 1.1171875, 1.24560546875, 1.3740234375, 1.50244140625, 1.630859375, 1.75927734375, 1.8876953125, 2.01611328125, 2.14453125, 2.27294921875, 2.4013671875, 2.52978515625, 2.658203125, 2.78662109375, 2.9150390625, 3.04345703125, 3.171875, 3.30029296875, 3.4287109375, 3.55712890625, 3.685546875, 3.81396484375, 3.9423828125, 4.07080078125, 4.19921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 5.0, 11.0, 18.0, 19.0, 29.0, 52.0, 341.0, 3439.0, 56.0, 32.0, 22.0, 8.0, 7.0, 4.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9632034301757812, -0.9288482666015625, -0.8944931030273438, -0.860137939453125, -0.8257827758789062, -0.7914276123046875, -0.7570724487304688, -0.72271728515625, -0.6883621215820312, -0.6540069580078125, -0.6196517944335938, -0.585296630859375, -0.5509414672851562, -0.5165863037109375, -0.48223114013671875, -0.4478759765625, -0.41352081298828125, -0.3791656494140625, -0.34481048583984375, -0.310455322265625, -0.27610015869140625, -0.2417449951171875, -0.20738983154296875, -0.17303466796875, -0.13867950439453125, -0.1043243408203125, -0.06996917724609375, -0.035614013671875, -0.00125885009765625, 0.0330963134765625, 0.06745147705078125, 0.101806640625, 0.13616180419921875, 0.1705169677734375, 0.20487213134765625, 0.239227294921875, 0.27358245849609375, 0.3079376220703125, 0.34229278564453125, 0.37664794921875, 0.41100311279296875, 0.4453582763671875, 0.47971343994140625, 0.514068603515625, 0.5484237670898438, 0.5827789306640625, 0.6171340942382812, 0.6514892578125, 0.6858444213867188, 0.7201995849609375, 0.7545547485351562, 0.788909912109375, 0.8232650756835938, 0.8576202392578125, 0.8919754028320312, 0.92633056640625, 0.9606857299804688, 0.9950408935546875, 1.0293960571289062, 1.063751220703125, 1.0981063842773438, 1.1324615478515625, 1.1668167114257812, 1.201171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 21.0, 39.0, 91.0, 206.0, 239.0, 196.0, 105.0, 66.0, 24.0, 14.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39384126663208, -6.150108337402344, -5.906374931335449, -5.662641525268555, -5.418908596038818, -5.175175666809082, -4.9314422607421875, -4.687708854675293, -4.443975925445557, -4.20024299621582, -3.956509590148926, -3.7127764225006104, -3.469043254852295, -3.2253100872039795, -2.981576919555664, -2.7378437519073486, -2.494110584259033, -2.2503774166107178, -2.0066442489624023, -1.762911081314087, -1.5191779136657715, -1.275444746017456, -1.0317115783691406, -0.7879784107208252, -0.5442452430725098, -0.30051207542419434, -0.056778907775878906, 0.18695425987243652, 0.43068742752075195, 0.6744205951690674, 0.9181537628173828, 1.1618869304656982, 1.4056196212768555, 1.649352788925171, 1.8930859565734863, 2.1368191242218018, 2.380552291870117, 2.6242854595184326, 2.868018627166748, 3.1117517948150635, 3.355484962463379, 3.5992181301116943, 3.8429512977600098, 4.086684226989746, 4.330417633056641, 4.574151039123535, 4.8178839683532715, 5.061616897583008, 5.305350303649902, 5.549083709716797, 5.792816638946533, 6.0365495681762695, 6.280282974243164, 6.524016380310059, 6.767749309539795, 7.011482238769531, 7.255215644836426, 7.49894905090332, 7.742681980133057, 7.986414909362793, 8.230148315429688, 8.473881721496582, 8.717615127563477, 8.961347579956055, 9.20508098602295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 6.0, 5.0, 10.0, 15.0, 18.0, 16.0, 14.0, 21.0, 28.0, 28.0, 30.0, 36.0, 35.0, 44.0, 30.0, 46.0, 39.0, 59.0, 41.0, 43.0, 35.0, 48.0, 35.0, 42.0, 33.0, 32.0, 39.0, 31.0, 27.0, 20.0, 13.0, 11.0, 17.0, 7.0, 11.0, 10.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.346281051635742, -2.2719013690948486, -2.197521686553955, -2.1231422424316406, -2.048762559890747, -1.9743828773498535, -1.9000033140182495, -1.8256237506866455, -1.751244068145752, -1.6768643856048584, -1.6024848222732544, -1.5281052589416504, -1.4537255764007568, -1.3793458938598633, -1.3049663305282593, -1.2305867671966553, -1.1562070846557617, -1.0818274021148682, -1.0074478387832642, -0.9330682158470154, -0.8586885929107666, -0.7843089699745178, -0.709929347038269, -0.6355497241020203, -0.5611701011657715, -0.4867904782295227, -0.4124108552932739, -0.33803123235702515, -0.26365160942077637, -0.1892719864845276, -0.11489236354827881, -0.04051274061203003, 0.03386688232421875, 0.10824650526046753, 0.1826261281967163, 0.2570057511329651, 0.33138537406921387, 0.40576499700546265, 0.4801446199417114, 0.5545242428779602, 0.628903865814209, 0.7032834887504578, 0.7776631116867065, 0.8520427346229553, 0.9264223575592041, 1.0008020401000977, 1.0751816034317017, 1.1495611667633057, 1.2239408493041992, 1.2983205318450928, 1.3727000951766968, 1.4470796585083008, 1.5214593410491943, 1.595839023590088, 1.670218586921692, 1.744598150253296, 1.8189778327941895, 1.893357515335083, 1.967737078666687, 2.042116641998291, 2.1164963245391846, 2.190876007080078, 2.2652554512023926, 2.339635133743286, 2.4140148162841797]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 12.0, 16.0, 22.0, 43.0, 64.0, 120.0, 191.0, 319.0, 535.0, 1020.0, 1889.0, 3768.0, 8104.0, 18634.0, 47976.0, 132487.0, 323040.0, 309211.0, 123371.0, 44908.0, 17735.0, 7438.0, 3576.0, 1767.0, 945.0, 581.0, 321.0, 175.0, 99.0, 61.0, 46.0, 26.0, 15.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9080047607421875, -1.844329833984375, -1.7806549072265625, -1.71697998046875, -1.6533050537109375, -1.589630126953125, -1.5259552001953125, -1.4622802734375, -1.3986053466796875, -1.334930419921875, -1.2712554931640625, -1.20758056640625, -1.1439056396484375, -1.080230712890625, -1.0165557861328125, -0.952880859375, -0.8892059326171875, -0.825531005859375, -0.7618560791015625, -0.69818115234375, -0.6345062255859375, -0.570831298828125, -0.5071563720703125, -0.4434814453125, -0.3798065185546875, -0.316131591796875, -0.2524566650390625, -0.18878173828125, -0.1251068115234375, -0.061431884765625, 0.0022430419921875, 0.06591796875, 0.1295928955078125, 0.193267822265625, 0.2569427490234375, 0.32061767578125, 0.3842926025390625, 0.447967529296875, 0.5116424560546875, 0.5753173828125, 0.6389923095703125, 0.702667236328125, 0.7663421630859375, 0.83001708984375, 0.8936920166015625, 0.957366943359375, 1.0210418701171875, 1.084716796875, 1.1483917236328125, 1.212066650390625, 1.2757415771484375, 1.33941650390625, 1.4030914306640625, 1.466766357421875, 1.5304412841796875, 1.5941162109375, 1.6577911376953125, 1.721466064453125, 1.7851409912109375, 1.84881591796875, 1.9124908447265625, 1.976165771484375, 2.0398406982421875, 2.103515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 9.0, 14.0, 16.0, 38.0, 29.0, 28.0, 44.0, 40.0, 45.0, 46.0, 61.0, 49.0, 57.0, 54.0, 62.0, 46.0, 44.0, 31.0, 40.0, 40.0, 34.0, 20.0, 31.0, 21.0, 9.0, 8.0, 15.0, 4.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9202651977539062, -0.8869171142578125, -0.8535690307617188, -0.820220947265625, -0.7868728637695312, -0.7535247802734375, -0.7201766967773438, -0.68682861328125, -0.6534805297851562, -0.6201324462890625, -0.5867843627929688, -0.553436279296875, -0.5200881958007812, -0.4867401123046875, -0.45339202880859375, -0.4200439453125, -0.38669586181640625, -0.3533477783203125, -0.31999969482421875, -0.286651611328125, -0.25330352783203125, -0.2199554443359375, -0.18660736083984375, -0.15325927734375, -0.11991119384765625, -0.0865631103515625, -0.05321502685546875, -0.019866943359375, 0.01348114013671875, 0.0468292236328125, 0.08017730712890625, 0.113525390625, 0.14687347412109375, 0.1802215576171875, 0.21356964111328125, 0.246917724609375, 0.28026580810546875, 0.3136138916015625, 0.34696197509765625, 0.38031005859375, 0.41365814208984375, 0.4470062255859375, 0.48035430908203125, 0.513702392578125, 0.5470504760742188, 0.5803985595703125, 0.6137466430664062, 0.6470947265625, 0.6804428100585938, 0.7137908935546875, 0.7471389770507812, 0.780487060546875, 0.8138351440429688, 0.8471832275390625, 0.8805313110351562, 0.91387939453125, 0.9472274780273438, 0.9805755615234375, 1.0139236450195312, 1.047271728515625, 1.0806198120117188, 1.1139678955078125, 1.1473159790039062, 1.1806640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 7.0, 6.0, 7.0, 15.0, 15.0, 22.0, 38.0, 68.0, 107.0, 187.0, 388.0, 927.0, 2962.0, 13700.0, 104296.0, 716800.0, 181686.0, 21092.0, 4028.0, 1187.0, 456.0, 192.0, 140.0, 71.0, 51.0, 24.0, 18.0, 11.0, 8.0, 10.0, 5.0, 5.0, 5.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89239501953125, -3.7652587890625, -3.63812255859375, -3.510986328125, -3.38385009765625, -3.2567138671875, -3.12957763671875, -3.00244140625, -2.87530517578125, -2.7481689453125, -2.62103271484375, -2.493896484375, -2.36676025390625, -2.2396240234375, -2.11248779296875, -1.9853515625, -1.85821533203125, -1.7310791015625, -1.60394287109375, -1.476806640625, -1.34967041015625, -1.2225341796875, -1.09539794921875, -0.96826171875, -0.84112548828125, -0.7139892578125, -0.58685302734375, -0.459716796875, -0.33258056640625, -0.2054443359375, -0.07830810546875, 0.048828125, 0.17596435546875, 0.3031005859375, 0.43023681640625, 0.557373046875, 0.68450927734375, 0.8116455078125, 0.93878173828125, 1.06591796875, 1.19305419921875, 1.3201904296875, 1.44732666015625, 1.574462890625, 1.70159912109375, 1.8287353515625, 1.95587158203125, 2.0830078125, 2.21014404296875, 2.3372802734375, 2.46441650390625, 2.591552734375, 2.71868896484375, 2.8458251953125, 2.97296142578125, 3.10009765625, 3.22723388671875, 3.3543701171875, 3.48150634765625, 3.608642578125, 3.73577880859375, 3.8629150390625, 3.99005126953125, 4.1171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 11.0, 4.0, 13.0, 13.0, 12.0, 13.0, 20.0, 11.0, 25.0, 27.0, 20.0, 31.0, 34.0, 40.0, 37.0, 37.0, 51.0, 44.0, 39.0, 43.0, 36.0, 36.0, 37.0, 45.0, 40.0, 36.0, 30.0, 27.0, 23.0, 24.0, 15.0, 23.0, 19.0, 14.0, 13.0, 10.0, 7.0, 12.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.046875, -3.93145751953125, -3.8160400390625, -3.70062255859375, -3.585205078125, -3.46978759765625, -3.3543701171875, -3.23895263671875, -3.12353515625, -3.00811767578125, -2.8927001953125, -2.77728271484375, -2.661865234375, -2.54644775390625, -2.4310302734375, -2.31561279296875, -2.2001953125, -2.08477783203125, -1.9693603515625, -1.85394287109375, -1.738525390625, -1.62310791015625, -1.5076904296875, -1.39227294921875, -1.27685546875, -1.16143798828125, -1.0460205078125, -0.93060302734375, -0.815185546875, -0.69976806640625, -0.5843505859375, -0.46893310546875, -0.353515625, -0.23809814453125, -0.1226806640625, -0.00726318359375, 0.108154296875, 0.22357177734375, 0.3389892578125, 0.45440673828125, 0.56982421875, 0.68524169921875, 0.8006591796875, 0.91607666015625, 1.031494140625, 1.14691162109375, 1.2623291015625, 1.37774658203125, 1.4931640625, 1.60858154296875, 1.7239990234375, 1.83941650390625, 1.954833984375, 2.07025146484375, 2.1856689453125, 2.30108642578125, 2.41650390625, 2.53192138671875, 2.6473388671875, 2.76275634765625, 2.878173828125, 2.99359130859375, 3.1090087890625, 3.22442626953125, 3.33984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 22.0, 51.0, 51.0, 62.0, 139.0, 328.0, 828.0, 2826.0, 15529.0, 343292.0, 656704.0, 23356.0, 3529.0, 970.0, 408.0, 169.0, 103.0, 50.0, 25.0, 23.0, 16.0, 10.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.3536376953125, -3.258056640625, -3.1624755859375, -3.06689453125, -2.9713134765625, -2.875732421875, -2.7801513671875, -2.6845703125, -2.5889892578125, -2.493408203125, -2.3978271484375, -2.30224609375, -2.2066650390625, -2.111083984375, -2.0155029296875, -1.919921875, -1.8243408203125, -1.728759765625, -1.6331787109375, -1.53759765625, -1.4420166015625, -1.346435546875, -1.2508544921875, -1.1552734375, -1.0596923828125, -0.964111328125, -0.8685302734375, -0.77294921875, -0.6773681640625, -0.581787109375, -0.4862060546875, -0.390625, -0.2950439453125, -0.199462890625, -0.1038818359375, -0.00830078125, 0.0872802734375, 0.182861328125, 0.2784423828125, 0.3740234375, 0.4696044921875, 0.565185546875, 0.6607666015625, 0.75634765625, 0.8519287109375, 0.947509765625, 1.0430908203125, 1.138671875, 1.2342529296875, 1.329833984375, 1.4254150390625, 1.52099609375, 1.6165771484375, 1.712158203125, 1.8077392578125, 1.9033203125, 1.9989013671875, 2.094482421875, 2.1900634765625, 2.28564453125, 2.3812255859375, 2.476806640625, 2.5723876953125, 2.66796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 11.0, 15.0, 27.0, 29.0, 54.0, 66.0, 86.0, 107.0, 119.0, 104.0, 92.0, 76.0, 41.0, 31.0, 37.0, 16.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00029087066650390625, -0.0002825148403644562, -0.0002741590142250061, -0.00026580318808555603, -0.00025744736194610596, -0.0002490915358066559, -0.0002407357096672058, -0.00023237988352775574, -0.00022402405738830566, -0.0002156682312488556, -0.00020731240510940552, -0.00019895657896995544, -0.00019060075283050537, -0.0001822449266910553, -0.00017388910055160522, -0.00016553327441215515, -0.00015717744827270508, -0.000148821622133255, -0.00014046579599380493, -0.00013210996985435486, -0.00012375414371490479, -0.00011539831757545471, -0.00010704249143600464, -9.868666529655457e-05, -9.033083915710449e-05, -8.197501301765442e-05, -7.361918687820435e-05, -6.526336073875427e-05, -5.69075345993042e-05, -4.8551708459854126e-05, -4.019588232040405e-05, -3.184005618095398e-05, -2.3484230041503906e-05, -1.5128403902053833e-05, -6.77257776260376e-06, 1.5832483768463135e-06, 9.939074516296387e-06, 1.829490065574646e-05, 2.6650726795196533e-05, 3.5006552934646606e-05, 4.336237907409668e-05, 5.171820521354675e-05, 6.0074031352996826e-05, 6.84298574924469e-05, 7.678568363189697e-05, 8.514150977134705e-05, 9.349733591079712e-05, 0.00010185316205024719, 0.00011020898818969727, 0.00011856481432914734, 0.0001269206404685974, 0.00013527646660804749, 0.00014363229274749756, 0.00015198811888694763, 0.0001603439450263977, 0.00016869977116584778, 0.00017705559730529785, 0.00018541142344474792, 0.000193767249584198, 0.00020212307572364807, 0.00021047890186309814, 0.00021883472800254822, 0.0002271905541419983, 0.00023554638028144836, 0.00024390220642089844]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 17.0, 22.0, 35.0, 58.0, 109.0, 215.0, 465.0, 1297.0, 5242.0, 48450.0, 876484.0, 105370.0, 7906.0, 1754.0, 585.0, 241.0, 122.0, 75.0, 38.0, 24.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.36859130859375, -4.2684326171875, -4.16827392578125, -4.068115234375, -3.96795654296875, -3.8677978515625, -3.76763916015625, -3.66748046875, -3.56732177734375, -3.4671630859375, -3.36700439453125, -3.266845703125, -3.16668701171875, -3.0665283203125, -2.96636962890625, -2.8662109375, -2.76605224609375, -2.6658935546875, -2.56573486328125, -2.465576171875, -2.36541748046875, -2.2652587890625, -2.16510009765625, -2.06494140625, -1.96478271484375, -1.8646240234375, -1.76446533203125, -1.664306640625, -1.56414794921875, -1.4639892578125, -1.36383056640625, -1.263671875, -1.16351318359375, -1.0633544921875, -0.96319580078125, -0.863037109375, -0.76287841796875, -0.6627197265625, -0.56256103515625, -0.46240234375, -0.36224365234375, -0.2620849609375, -0.16192626953125, -0.061767578125, 0.03839111328125, 0.1385498046875, 0.23870849609375, 0.3388671875, 0.43902587890625, 0.5391845703125, 0.63934326171875, 0.739501953125, 0.83966064453125, 0.9398193359375, 1.03997802734375, 1.14013671875, 1.24029541015625, 1.3404541015625, 1.44061279296875, 1.540771484375, 1.64093017578125, 1.7410888671875, 1.84124755859375, 1.94140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 9.0, 15.0, 23.0, 36.0, 83.0, 115.0, 163.0, 161.0, 128.0, 108.0, 67.0, 31.0, 28.0, 12.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.78515625, -3.686370849609375, -3.58758544921875, -3.488800048828125, -3.3900146484375, -3.291229248046875, -3.19244384765625, -3.093658447265625, -2.994873046875, -2.896087646484375, -2.79730224609375, -2.698516845703125, -2.5997314453125, -2.500946044921875, -2.40216064453125, -2.303375244140625, -2.20458984375, -2.105804443359375, -2.00701904296875, -1.908233642578125, -1.8094482421875, -1.710662841796875, -1.61187744140625, -1.513092041015625, -1.414306640625, -1.315521240234375, -1.21673583984375, -1.117950439453125, -1.0191650390625, -0.920379638671875, -0.82159423828125, -0.722808837890625, -0.6240234375, -0.525238037109375, -0.42645263671875, -0.327667236328125, -0.2288818359375, -0.130096435546875, -0.03131103515625, 0.067474365234375, 0.166259765625, 0.265045166015625, 0.36383056640625, 0.462615966796875, 0.5614013671875, 0.660186767578125, 0.75897216796875, 0.857757568359375, 0.95654296875, 1.055328369140625, 1.15411376953125, 1.252899169921875, 1.3516845703125, 1.450469970703125, 1.54925537109375, 1.648040771484375, 1.746826171875, 1.845611572265625, 1.94439697265625, 2.043182373046875, 2.1419677734375, 2.240753173828125, 2.33953857421875, 2.438323974609375, 2.537109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 24.0, 93.0, 269.0, 346.0, 185.0, 49.0, 16.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-113.35630798339844, -111.19064331054688, -109.02497100830078, -106.85930633544922, -104.69363403320312, -102.52796936035156, -100.36229705810547, -98.1966323852539, -96.03096008300781, -93.86529541015625, -91.69962310791016, -89.5339584350586, -87.3682861328125, -85.20262145996094, -83.03694915771484, -80.87128448486328, -78.70561981201172, -76.53995513916016, -74.37428283691406, -72.2086181640625, -70.0429458618164, -67.87728118896484, -65.71160888671875, -63.54594421386719, -61.38027572631836, -59.21460723876953, -57.0489387512207, -54.883270263671875, -52.71760559082031, -50.55193328857422, -48.386268615722656, -46.22060012817383, -44.054927825927734, -41.889259338378906, -39.72359085083008, -37.55792236328125, -35.39225769042969, -33.226585388183594, -31.06092071533203, -28.895252227783203, -26.729583740234375, -24.563915252685547, -22.39824676513672, -20.232580184936523, -18.066911697387695, -15.901243209838867, -13.735575675964355, -11.569908142089844, -9.404239654541016, -7.238571643829346, -5.072903633117676, -2.907235622406006, -0.7415676116943359, 1.4241008758544922, 3.589768409729004, 5.755435943603516, 7.921104431152344, 10.086772918701172, 12.252440452575684, 14.418107986450195, 16.583776473999023, 18.74944496154785, 20.915111541748047, 23.080780029296875, 25.246448516845703]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 11.0, 11.0, 19.0, 15.0, 22.0, 21.0, 29.0, 34.0, 42.0, 37.0, 37.0, 47.0, 39.0, 59.0, 63.0, 60.0, 53.0, 45.0, 55.0, 43.0, 29.0, 39.0, 31.0, 29.0, 18.0, 21.0, 9.0, 18.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-23.170543670654297, -22.52720069885254, -21.88385581970215, -21.24051284790039, -20.597169876098633, -19.953826904296875, -19.310482025146484, -18.667139053344727, -18.02379608154297, -17.38045310974121, -16.73710823059082, -16.093765258789062, -15.450422286987305, -14.80707836151123, -14.163734436035156, -13.520391464233398, -12.877047538757324, -12.23370361328125, -11.590360641479492, -10.947016716003418, -10.30367374420166, -9.660329818725586, -9.016986846923828, -8.373642921447754, -7.730299472808838, -7.086956024169922, -6.443612575531006, -5.80026912689209, -5.156925201416016, -4.513582229614258, -3.8702383041381836, -3.2268948554992676, -2.5835514068603516, -1.9402079582214355, -1.29686439037323, -0.6535208225250244, -0.010177373886108398, 0.6331660747528076, 1.2765097618103027, 1.9198532104492188, 2.5631966590881348, 3.206540107727051, 3.849883556365967, 4.493227005004883, 5.136570930480957, 5.779913902282715, 6.423257827758789, 7.066601276397705, 7.709944725036621, 8.353288650512695, 8.996631622314453, 9.639975547790527, 10.283318519592285, 10.92666244506836, 11.570005416870117, 12.213349342346191, 12.856693267822266, 13.50003719329834, 14.143380165100098, 14.786724090576172, 15.43006706237793, 16.073410034179688, 16.716754913330078, 17.360097885131836, 18.003440856933594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 24.0, 26.0, 32.0, 57.0, 77.0, 131.0, 229.0, 368.0, 616.0, 1228.0, 2837.0, 9861.0, 73895.0, 4056716.0, 37012.0, 6598.0, 2139.0, 985.0, 567.0, 281.0, 189.0, 123.0, 82.0, 63.0, 37.0, 25.0, 18.0, 19.0, 5.0, 8.0, 1.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.46124267578125, -3.3131103515625, -3.16497802734375, -3.016845703125, -2.86871337890625, -2.7205810546875, -2.57244873046875, -2.42431640625, -2.27618408203125, -2.1280517578125, -1.97991943359375, -1.831787109375, -1.68365478515625, -1.5355224609375, -1.38739013671875, -1.2392578125, -1.09112548828125, -0.9429931640625, -0.79486083984375, -0.646728515625, -0.49859619140625, -0.3504638671875, -0.20233154296875, -0.05419921875, 0.09393310546875, 0.2420654296875, 0.39019775390625, 0.538330078125, 0.68646240234375, 0.8345947265625, 0.98272705078125, 1.130859375, 1.27899169921875, 1.4271240234375, 1.57525634765625, 1.723388671875, 1.87152099609375, 2.0196533203125, 2.16778564453125, 2.31591796875, 2.46405029296875, 2.6121826171875, 2.76031494140625, 2.908447265625, 3.05657958984375, 3.2047119140625, 3.35284423828125, 3.5009765625, 3.64910888671875, 3.7972412109375, 3.94537353515625, 4.093505859375, 4.24163818359375, 4.3897705078125, 4.53790283203125, 4.68603515625, 4.83416748046875, 4.9822998046875, 5.13043212890625, 5.278564453125, 5.42669677734375, 5.5748291015625, 5.72296142578125, 5.87109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 9.0, 14.0, 16.0, 37.0, 44.0, 59.0, 76.0, 102.0, 99.0, 101.0, 89.0, 80.0, 76.0, 56.0, 39.0, 39.0, 16.0, 10.0, 10.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.791015625, -1.7340545654296875, -1.677093505859375, -1.6201324462890625, -1.56317138671875, -1.5062103271484375, -1.449249267578125, -1.3922882080078125, -1.3353271484375, -1.2783660888671875, -1.221405029296875, -1.1644439697265625, -1.10748291015625, -1.0505218505859375, -0.993560791015625, -0.9365997314453125, -0.879638671875, -0.8226776123046875, -0.765716552734375, -0.7087554931640625, -0.65179443359375, -0.5948333740234375, -0.537872314453125, -0.4809112548828125, -0.4239501953125, -0.3669891357421875, -0.310028076171875, -0.2530670166015625, -0.19610595703125, -0.1391448974609375, -0.082183837890625, -0.0252227783203125, 0.03173828125, 0.0886993408203125, 0.145660400390625, 0.2026214599609375, 0.25958251953125, 0.3165435791015625, 0.373504638671875, 0.4304656982421875, 0.4874267578125, 0.5443878173828125, 0.601348876953125, 0.6583099365234375, 0.71527099609375, 0.7722320556640625, 0.829193115234375, 0.8861541748046875, 0.943115234375, 1.0000762939453125, 1.057037353515625, 1.1139984130859375, 1.17095947265625, 1.2279205322265625, 1.284881591796875, 1.3418426513671875, 1.3988037109375, 1.4557647705078125, 1.512725830078125, 1.5696868896484375, 1.62664794921875, 1.6836090087890625, 1.740570068359375, 1.7975311279296875, 1.8544921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 16.0, 17.0, 26.0, 45.0, 47.0, 56.0, 109.0, 131.0, 201.0, 294.0, 381.0, 586.0, 992.0, 1854.0, 3736.0, 7788.0, 20004.0, 78790.0, 3807073.0, 214495.0, 34566.0, 11633.0, 5038.0, 2505.0, 1412.0, 792.0, 489.0, 337.0, 232.0, 161.0, 129.0, 92.0, 70.0, 45.0, 34.0, 29.0, 16.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.71875, -2.633056640625, -2.54736328125, -2.461669921875, -2.3759765625, -2.290283203125, -2.20458984375, -2.118896484375, -2.033203125, -1.947509765625, -1.86181640625, -1.776123046875, -1.6904296875, -1.604736328125, -1.51904296875, -1.433349609375, -1.34765625, -1.261962890625, -1.17626953125, -1.090576171875, -1.0048828125, -0.919189453125, -0.83349609375, -0.747802734375, -0.662109375, -0.576416015625, -0.49072265625, -0.405029296875, -0.3193359375, -0.233642578125, -0.14794921875, -0.062255859375, 0.0234375, 0.109130859375, 0.19482421875, 0.280517578125, 0.3662109375, 0.451904296875, 0.53759765625, 0.623291015625, 0.708984375, 0.794677734375, 0.88037109375, 0.966064453125, 1.0517578125, 1.137451171875, 1.22314453125, 1.308837890625, 1.39453125, 1.480224609375, 1.56591796875, 1.651611328125, 1.7373046875, 1.822998046875, 1.90869140625, 1.994384765625, 2.080078125, 2.165771484375, 2.25146484375, 2.337158203125, 2.4228515625, 2.508544921875, 2.59423828125, 2.679931640625, 2.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 11.0, 10.0, 8.0, 12.0, 19.0, 35.0, 56.0, 90.0, 213.0, 3031.0, 269.0, 101.0, 70.0, 41.0, 18.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97119140625, -0.9315872192382812, -0.8919830322265625, -0.8523788452148438, -0.812774658203125, -0.7731704711914062, -0.7335662841796875, -0.6939620971679688, -0.65435791015625, -0.6147537231445312, -0.5751495361328125, -0.5355453491210938, -0.495941162109375, -0.45633697509765625, -0.4167327880859375, -0.37712860107421875, -0.3375244140625, -0.29792022705078125, -0.2583160400390625, -0.21871185302734375, -0.179107666015625, -0.13950347900390625, -0.0998992919921875, -0.06029510498046875, -0.02069091796875, 0.01891326904296875, 0.0585174560546875, 0.09812164306640625, 0.137725830078125, 0.17733001708984375, 0.2169342041015625, 0.25653839111328125, 0.296142578125, 0.33574676513671875, 0.3753509521484375, 0.41495513916015625, 0.454559326171875, 0.49416351318359375, 0.5337677001953125, 0.5733718872070312, 0.61297607421875, 0.6525802612304688, 0.6921844482421875, 0.7317886352539062, 0.771392822265625, 0.8109970092773438, 0.8506011962890625, 0.8902053833007812, 0.9298095703125, 0.9694137573242188, 1.0090179443359375, 1.0486221313476562, 1.088226318359375, 1.1278305053710938, 1.1674346923828125, 1.2070388793945312, 1.24664306640625, 1.2862472534179688, 1.3258514404296875, 1.3654556274414062, 1.405059814453125, 1.4446640014648438, 1.4842681884765625, 1.5238723754882812, 1.5634765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 16.0, 31.0, 35.0, 66.0, 86.0, 102.0, 118.0, 105.0, 99.0, 83.0, 64.0, 42.0, 28.0, 25.0, 24.0, 16.0, 15.0, 13.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5456020832061768, -3.344350814819336, -3.143099784851074, -2.9418485164642334, -2.7405972480773926, -2.539346218109131, -2.33809494972229, -2.136843681335449, -1.9355926513671875, -1.7343415021896362, -1.533090353012085, -1.3318390846252441, -1.1305879354476929, -0.9293367862701416, -0.7280855178833008, -0.5268343687057495, -0.32558321952819824, -0.12433204054832458, 0.07691913843154907, 0.2781703472137451, 0.4794214963912964, 0.6806726455688477, 0.8819239139556885, 1.0831750631332397, 1.284426212310791, 1.4856773614883423, 1.6869285106658936, 1.8881797790527344, 2.089430809020996, 2.290682077407837, 2.4919333457946777, 2.6931843757629395, 2.8944358825683594, 3.0956871509552, 3.296938180923462, 3.4981894493103027, 3.6994404792785645, 3.9006917476654053, 4.101943016052246, 4.303194046020508, 4.5044450759887695, 4.705696105957031, 4.906947612762451, 5.108198642730713, 5.309449672698975, 5.5107011795043945, 5.711952209472656, 5.913203239440918, 6.114454746246338, 6.3157057762146, 6.5169572830200195, 6.718208312988281, 6.919459342956543, 7.120710372924805, 7.321961879730225, 7.523212909698486, 7.724464416503906, 7.925715446472168, 8.12696647644043, 8.328218460083008, 8.52946949005127, 8.730720520019531, 8.931971549987793, 9.133222579956055, 9.334473609924316]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 16.0, 5.0, 10.0, 14.0, 11.0, 13.0, 19.0, 14.0, 25.0, 21.0, 20.0, 34.0, 29.0, 22.0, 32.0, 27.0, 25.0, 32.0, 37.0, 34.0, 30.0, 34.0, 38.0, 44.0, 34.0, 30.0, 34.0, 23.0, 37.0, 32.0, 33.0, 22.0, 12.0, 28.0, 27.0, 16.0, 11.0, 13.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8851871490478516, -3.7598843574523926, -3.6345813274383545, -3.5092785358428955, -3.3839755058288574, -3.2586727142333984, -3.1333699226379395, -3.0080671310424805, -2.8827641010284424, -2.7574613094329834, -2.6321582794189453, -2.5068554878234863, -2.3815526962280273, -2.2562496662139893, -2.1309468746185303, -2.005643844604492, -1.8803410530090332, -1.7550381422042847, -1.6297352313995361, -1.5044324398040771, -1.3791295289993286, -1.25382661819458, -1.128523826599121, -1.0032209157943726, -0.877918004989624, -0.7526150941848755, -0.6273122429847717, -0.502009391784668, -0.37670648097991943, -0.2514035701751709, -0.12610071897506714, -0.0007978677749633789, 0.12450456619262695, 0.2498074471950531, 0.37511032819747925, 0.500413179397583, 0.6257160902023315, 0.7510190010070801, 0.8763218522071838, 1.0016247034072876, 1.1269276142120361, 1.2522305250167847, 1.3775334358215332, 1.5028362274169922, 1.6281391382217407, 1.7534420490264893, 1.8787448406219482, 2.0040478706359863, 2.1293506622314453, 2.2546534538269043, 2.3799564838409424, 2.5052592754364014, 2.6305623054504395, 2.7558650970458984, 2.8811678886413574, 3.0064706802368164, 3.1317737102508545, 3.2570765018463135, 3.3823795318603516, 3.5076823234558105, 3.6329851150512695, 3.7582881450653076, 3.8835909366607666, 4.008893966674805, 4.134196758270264]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 11.0, 9.0, 11.0, 21.0, 29.0, 44.0, 51.0, 100.0, 139.0, 256.0, 489.0, 953.0, 1776.0, 3909.0, 10122.0, 28554.0, 92678.0, 306794.0, 397029.0, 140079.0, 41239.0, 13941.0, 5521.0, 2235.0, 1109.0, 606.0, 324.0, 192.0, 116.0, 80.0, 35.0, 31.0, 18.0, 12.0, 15.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.1015625, -3.020294189453125, -2.93902587890625, -2.857757568359375, -2.7764892578125, -2.695220947265625, -2.61395263671875, -2.532684326171875, -2.451416015625, -2.370147705078125, -2.28887939453125, -2.207611083984375, -2.1263427734375, -2.045074462890625, -1.96380615234375, -1.882537841796875, -1.80126953125, -1.720001220703125, -1.63873291015625, -1.557464599609375, -1.4761962890625, -1.394927978515625, -1.31365966796875, -1.232391357421875, -1.151123046875, -1.069854736328125, -0.98858642578125, -0.907318115234375, -0.8260498046875, -0.744781494140625, -0.66351318359375, -0.582244873046875, -0.5009765625, -0.419708251953125, -0.33843994140625, -0.257171630859375, -0.1759033203125, -0.094635009765625, -0.01336669921875, 0.067901611328125, 0.149169921875, 0.230438232421875, 0.31170654296875, 0.392974853515625, 0.4742431640625, 0.555511474609375, 0.63677978515625, 0.718048095703125, 0.79931640625, 0.880584716796875, 0.96185302734375, 1.043121337890625, 1.1243896484375, 1.205657958984375, 1.28692626953125, 1.368194580078125, 1.449462890625, 1.530731201171875, 1.61199951171875, 1.693267822265625, 1.7745361328125, 1.855804443359375, 1.93707275390625, 2.018341064453125, 2.099609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 9.0, 5.0, 11.0, 13.0, 22.0, 35.0, 36.0, 42.0, 43.0, 73.0, 81.0, 74.0, 75.0, 83.0, 60.0, 57.0, 51.0, 47.0, 51.0, 30.0, 24.0, 14.0, 12.0, 14.0, 10.0, 9.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.5506591796875, -1.501708984375, -1.4527587890625, -1.40380859375, -1.3548583984375, -1.305908203125, -1.2569580078125, -1.2080078125, -1.1590576171875, -1.110107421875, -1.0611572265625, -1.01220703125, -0.9632568359375, -0.914306640625, -0.8653564453125, -0.81640625, -0.7674560546875, -0.718505859375, -0.6695556640625, -0.62060546875, -0.5716552734375, -0.522705078125, -0.4737548828125, -0.4248046875, -0.3758544921875, -0.326904296875, -0.2779541015625, -0.22900390625, -0.1800537109375, -0.131103515625, -0.0821533203125, -0.033203125, 0.0157470703125, 0.064697265625, 0.1136474609375, 0.16259765625, 0.2115478515625, 0.260498046875, 0.3094482421875, 0.3583984375, 0.4073486328125, 0.456298828125, 0.5052490234375, 0.55419921875, 0.6031494140625, 0.652099609375, 0.7010498046875, 0.75, 0.7989501953125, 0.847900390625, 0.8968505859375, 0.94580078125, 0.9947509765625, 1.043701171875, 1.0926513671875, 1.1416015625, 1.1905517578125, 1.239501953125, 1.2884521484375, 1.33740234375, 1.3863525390625, 1.435302734375, 1.4842529296875, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 6.0, 6.0, 7.0, 8.0, 8.0, 17.0, 35.0, 20.0, 43.0, 63.0, 90.0, 114.0, 225.0, 350.0, 576.0, 1168.0, 2511.0, 6446.0, 22367.0, 108384.0, 535327.0, 297693.0, 52321.0, 12619.0, 4208.0, 1756.0, 864.0, 506.0, 255.0, 167.0, 103.0, 82.0, 52.0, 33.0, 28.0, 34.0, 11.0, 12.0, 9.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.326171875, -3.22772216796875, -3.1292724609375, -3.03082275390625, -2.932373046875, -2.83392333984375, -2.7354736328125, -2.63702392578125, -2.53857421875, -2.44012451171875, -2.3416748046875, -2.24322509765625, -2.144775390625, -2.04632568359375, -1.9478759765625, -1.84942626953125, -1.7509765625, -1.65252685546875, -1.5540771484375, -1.45562744140625, -1.357177734375, -1.25872802734375, -1.1602783203125, -1.06182861328125, -0.96337890625, -0.86492919921875, -0.7664794921875, -0.66802978515625, -0.569580078125, -0.47113037109375, -0.3726806640625, -0.27423095703125, -0.17578125, -0.07733154296875, 0.0211181640625, 0.11956787109375, 0.218017578125, 0.31646728515625, 0.4149169921875, 0.51336669921875, 0.61181640625, 0.71026611328125, 0.8087158203125, 0.90716552734375, 1.005615234375, 1.10406494140625, 1.2025146484375, 1.30096435546875, 1.3994140625, 1.49786376953125, 1.5963134765625, 1.69476318359375, 1.793212890625, 1.89166259765625, 1.9901123046875, 2.08856201171875, 2.18701171875, 2.28546142578125, 2.3839111328125, 2.48236083984375, 2.580810546875, 2.67926025390625, 2.7777099609375, 2.87615966796875, 2.974609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 19.0, 23.0, 28.0, 39.0, 44.0, 51.0, 48.0, 56.0, 71.0, 77.0, 62.0, 48.0, 48.0, 66.0, 54.0, 47.0, 33.0, 28.0, 37.0, 27.0, 10.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29296875, -6.10784912109375, -5.9227294921875, -5.73760986328125, -5.552490234375, -5.36737060546875, -5.1822509765625, -4.99713134765625, -4.81201171875, -4.62689208984375, -4.4417724609375, -4.25665283203125, -4.071533203125, -3.88641357421875, -3.7012939453125, -3.51617431640625, -3.3310546875, -3.14593505859375, -2.9608154296875, -2.77569580078125, -2.590576171875, -2.40545654296875, -2.2203369140625, -2.03521728515625, -1.85009765625, -1.66497802734375, -1.4798583984375, -1.29473876953125, -1.109619140625, -0.92449951171875, -0.7393798828125, -0.55426025390625, -0.369140625, -0.18402099609375, 0.0010986328125, 0.18621826171875, 0.371337890625, 0.55645751953125, 0.7415771484375, 0.92669677734375, 1.11181640625, 1.29693603515625, 1.4820556640625, 1.66717529296875, 1.852294921875, 2.03741455078125, 2.2225341796875, 2.40765380859375, 2.5927734375, 2.77789306640625, 2.9630126953125, 3.14813232421875, 3.333251953125, 3.51837158203125, 3.7034912109375, 3.88861083984375, 4.07373046875, 4.25885009765625, 4.4439697265625, 4.62908935546875, 4.814208984375, 4.99932861328125, 5.1844482421875, 5.36956787109375, 5.5546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 10.0, 11.0, 17.0, 20.0, 58.0, 135.0, 316.0, 930.0, 4832.0, 97352.0, 902893.0, 37901.0, 2998.0, 642.0, 221.0, 100.0, 46.0, 27.0, 16.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.314453125, -3.238037109375, -3.16162109375, -3.085205078125, -3.0087890625, -2.932373046875, -2.85595703125, -2.779541015625, -2.703125, -2.626708984375, -2.55029296875, -2.473876953125, -2.3974609375, -2.321044921875, -2.24462890625, -2.168212890625, -2.091796875, -2.015380859375, -1.93896484375, -1.862548828125, -1.7861328125, -1.709716796875, -1.63330078125, -1.556884765625, -1.48046875, -1.404052734375, -1.32763671875, -1.251220703125, -1.1748046875, -1.098388671875, -1.02197265625, -0.945556640625, -0.869140625, -0.792724609375, -0.71630859375, -0.639892578125, -0.5634765625, -0.487060546875, -0.41064453125, -0.334228515625, -0.2578125, -0.181396484375, -0.10498046875, -0.028564453125, 0.0478515625, 0.124267578125, 0.20068359375, 0.277099609375, 0.353515625, 0.429931640625, 0.50634765625, 0.582763671875, 0.6591796875, 0.735595703125, 0.81201171875, 0.888427734375, 0.96484375, 1.041259765625, 1.11767578125, 1.194091796875, 1.2705078125, 1.346923828125, 1.42333984375, 1.499755859375, 1.576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 10.0, 15.0, 19.0, 21.0, 35.0, 47.0, 74.0, 85.0, 100.0, 109.0, 106.0, 75.0, 54.0, 73.0, 48.0, 29.0, 24.0, 19.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002689361572265625, -0.0002620033919811249, -0.00025507062673568726, -0.00024813786149024963, -0.000241205096244812, -0.0002342723309993744, -0.00022733956575393677, -0.00022040680050849915, -0.00021347403526306152, -0.0002065412700176239, -0.00019960850477218628, -0.00019267573952674866, -0.00018574297428131104, -0.0001788102090358734, -0.0001718774437904358, -0.00016494467854499817, -0.00015801191329956055, -0.00015107914805412292, -0.0001441463828086853, -0.00013721361756324768, -0.00013028085231781006, -0.00012334808707237244, -0.00011641532182693481, -0.00010948255658149719, -0.00010254979133605957, -9.561702609062195e-05, -8.868426084518433e-05, -8.17514955997467e-05, -7.481873035430908e-05, -6.788596510887146e-05, -6.095319986343384e-05, -5.4020434617996216e-05, -4.7087669372558594e-05, -4.015490412712097e-05, -3.322213888168335e-05, -2.6289373636245728e-05, -1.9356608390808105e-05, -1.2423843145370483e-05, -5.491077899932861e-06, 1.4416873455047607e-06, 8.374452590942383e-06, 1.5307217836380005e-05, 2.2239983081817627e-05, 2.917274832725525e-05, 3.610551357269287e-05, 4.303827881813049e-05, 4.9971044063568115e-05, 5.690380930900574e-05, 6.383657455444336e-05, 7.076933979988098e-05, 7.77021050453186e-05, 8.463487029075623e-05, 9.156763553619385e-05, 9.850040078163147e-05, 0.00010543316602706909, 0.00011236593127250671, 0.00011929869651794434, 0.00012623146176338196, 0.00013316422700881958, 0.0001400969922542572, 0.00014702975749969482, 0.00015396252274513245, 0.00016089528799057007, 0.0001678280532360077, 0.0001747608184814453]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 5.0, 11.0, 10.0, 10.0, 16.0, 24.0, 47.0, 51.0, 84.0, 172.0, 311.0, 540.0, 1126.0, 3000.0, 10576.0, 64159.0, 604797.0, 320168.0, 32473.0, 6865.0, 2186.0, 875.0, 426.0, 226.0, 125.0, 79.0, 42.0, 43.0, 21.0, 24.0, 16.0, 5.0, 8.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.2109375, -1.1689453125, -1.126953125, -1.0849609375, -1.04296875, -1.0009765625, -0.958984375, -0.9169921875, -0.875, -0.8330078125, -0.791015625, -0.7490234375, -0.70703125, -0.6650390625, -0.623046875, -0.5810546875, -0.5390625, -0.4970703125, -0.455078125, -0.4130859375, -0.37109375, -0.3291015625, -0.287109375, -0.2451171875, -0.203125, -0.1611328125, -0.119140625, -0.0771484375, -0.03515625, 0.0068359375, 0.048828125, 0.0908203125, 0.1328125, 0.1748046875, 0.216796875, 0.2587890625, 0.30078125, 0.3427734375, 0.384765625, 0.4267578125, 0.46875, 0.5107421875, 0.552734375, 0.5947265625, 0.63671875, 0.6787109375, 0.720703125, 0.7626953125, 0.8046875, 0.8466796875, 0.888671875, 0.9306640625, 0.97265625, 1.0146484375, 1.056640625, 1.0986328125, 1.140625, 1.1826171875, 1.224609375, 1.2666015625, 1.30859375, 1.3505859375, 1.392578125, 1.4345703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 11.0, 2.0, 10.0, 17.0, 18.0, 29.0, 35.0, 52.0, 61.0, 82.0, 90.0, 91.0, 84.0, 70.0, 75.0, 51.0, 46.0, 41.0, 29.0, 26.0, 16.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4423828125, -1.402130126953125, -1.36187744140625, -1.321624755859375, -1.2813720703125, -1.241119384765625, -1.20086669921875, -1.160614013671875, -1.120361328125, -1.080108642578125, -1.03985595703125, -0.999603271484375, -0.9593505859375, -0.919097900390625, -0.87884521484375, -0.838592529296875, -0.79833984375, -0.758087158203125, -0.71783447265625, -0.677581787109375, -0.6373291015625, -0.597076416015625, -0.55682373046875, -0.516571044921875, -0.476318359375, -0.436065673828125, -0.39581298828125, -0.355560302734375, -0.3153076171875, -0.275054931640625, -0.23480224609375, -0.194549560546875, -0.154296875, -0.114044189453125, -0.07379150390625, -0.033538818359375, 0.0067138671875, 0.046966552734375, 0.08721923828125, 0.127471923828125, 0.167724609375, 0.207977294921875, 0.24822998046875, 0.288482666015625, 0.3287353515625, 0.368988037109375, 0.40924072265625, 0.449493408203125, 0.48974609375, 0.529998779296875, 0.57025146484375, 0.610504150390625, 0.6507568359375, 0.691009521484375, 0.73126220703125, 0.771514892578125, 0.811767578125, 0.852020263671875, 0.89227294921875, 0.932525634765625, 0.9727783203125, 1.013031005859375, 1.05328369140625, 1.093536376953125, 1.1337890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 23.0, 44.0, 76.0, 154.0, 198.0, 169.0, 154.0, 83.0, 39.0, 29.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.013925552368164, -23.882144927978516, -22.750364303588867, -21.61858367919922, -20.48680305480957, -19.355022430419922, -18.223241806030273, -17.091461181640625, -15.959680557250977, -14.827899932861328, -13.69611930847168, -12.564338684082031, -11.432558059692383, -10.300777435302734, -9.168996810913086, -8.037216186523438, -6.905435562133789, -5.773654937744141, -4.641874313354492, -3.5100936889648438, -2.3783130645751953, -1.2465324401855469, -0.11475181579589844, 1.01702880859375, 2.1488094329833984, 3.280590057373047, 4.412370681762695, 5.544151306152344, 6.675931930541992, 7.807712554931641, 8.939493179321289, 10.071273803710938, 11.203056335449219, 12.334836959838867, 13.466617584228516, 14.598398208618164, 15.730178833007812, 16.86195945739746, 17.99374008178711, 19.125520706176758, 20.257301330566406, 21.389081954956055, 22.520862579345703, 23.65264320373535, 24.784423828125, 25.91620445251465, 27.047985076904297, 28.179765701293945, 29.311546325683594, 30.443326950073242, 31.57510757446289, 32.706886291503906, 33.83866882324219, 34.97045135498047, 36.102230072021484, 37.2340087890625, 38.36579132080078, 39.49757385253906, 40.62935256958008, 41.761131286621094, 42.892913818359375, 44.024696350097656, 45.15647506713867, 46.28825378417969, 47.42003631591797]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 9.0, 18.0, 15.0, 20.0, 21.0, 22.0, 35.0, 32.0, 44.0, 47.0, 47.0, 54.0, 68.0, 60.0, 55.0, 57.0, 60.0, 43.0, 47.0, 17.0, 46.0, 35.0, 23.0, 23.0, 24.0, 19.0, 11.0, 5.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.314420700073242, -25.57833480834961, -24.842247009277344, -24.10616111755371, -23.370073318481445, -22.633987426757812, -21.897899627685547, -21.161813735961914, -20.42572784423828, -19.68964195251465, -18.953554153442383, -18.21746826171875, -17.481380462646484, -16.74529457092285, -16.00920867919922, -15.273120880126953, -14.537034034729004, -13.800947189331055, -13.064860343933105, -12.328773498535156, -11.592687606811523, -10.856600761413574, -10.120513916015625, -9.384428024291992, -8.648340225219727, -7.912253379821777, -7.176167011260986, -6.440080165863037, -5.703993797302246, -4.967906951904297, -4.231820106506348, -3.4957337379455566, -2.7596473693847656, -2.0235607624053955, -1.2874740362167358, -0.5513873100280762, 0.18469929695129395, 0.9207859039306641, 1.6568727493286133, 2.3929591178894043, 3.1290459632873535, 3.8651325702667236, 4.601219177246094, 5.337306022644043, 6.073392868041992, 6.809479236602783, 7.545566082000732, 8.281652450561523, 9.017739295959473, 9.753826141357422, 10.489912986755371, 11.22599983215332, 11.962085723876953, 12.698172569274902, 13.434259414672852, 14.170345306396484, 14.90643310546875, 15.6425199508667, 16.37860679626465, 17.11469268798828, 17.850780487060547, 18.58686637878418, 19.322952270507812, 20.059040069580078, 20.79512596130371]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 18.0, 33.0, 51.0, 85.0, 145.0, 244.0, 465.0, 1029.0, 2223.0, 5363.0, 15076.0, 56912.0, 624502.0, 3312957.0, 133772.0, 26368.0, 8526.0, 3376.0, 1384.0, 758.0, 400.0, 202.0, 109.0, 92.0, 52.0, 36.0, 20.0, 15.0, 14.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.998077392578125, -1.92193603515625, -1.845794677734375, -1.7696533203125, -1.693511962890625, -1.61737060546875, -1.541229248046875, -1.465087890625, -1.388946533203125, -1.31280517578125, -1.236663818359375, -1.1605224609375, -1.084381103515625, -1.00823974609375, -0.932098388671875, -0.85595703125, -0.779815673828125, -0.70367431640625, -0.627532958984375, -0.5513916015625, -0.475250244140625, -0.39910888671875, -0.322967529296875, -0.246826171875, -0.170684814453125, -0.09454345703125, -0.018402099609375, 0.0577392578125, 0.133880615234375, 0.21002197265625, 0.286163330078125, 0.3623046875, 0.438446044921875, 0.51458740234375, 0.590728759765625, 0.6668701171875, 0.743011474609375, 0.81915283203125, 0.895294189453125, 0.971435546875, 1.047576904296875, 1.12371826171875, 1.199859619140625, 1.2760009765625, 1.352142333984375, 1.42828369140625, 1.504425048828125, 1.58056640625, 1.656707763671875, 1.73284912109375, 1.808990478515625, 1.8851318359375, 1.961273193359375, 2.03741455078125, 2.113555908203125, 2.189697265625, 2.265838623046875, 2.34197998046875, 2.418121337890625, 2.4942626953125, 2.570404052734375, 2.64654541015625, 2.722686767578125, 2.798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 8.0, 12.0, 25.0, 20.0, 31.0, 35.0, 32.0, 40.0, 46.0, 54.0, 53.0, 65.0, 62.0, 58.0, 56.0, 60.0, 42.0, 37.0, 39.0, 42.0, 38.0, 25.0, 23.0, 12.0, 16.0, 10.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9319381713867188, -0.8975677490234375, -0.8631973266601562, -0.828826904296875, -0.7944564819335938, -0.7600860595703125, -0.7257156372070312, -0.69134521484375, -0.6569747924804688, -0.6226043701171875, -0.5882339477539062, -0.553863525390625, -0.5194931030273438, -0.4851226806640625, -0.45075225830078125, -0.4163818359375, -0.38201141357421875, -0.3476409912109375, -0.31327056884765625, -0.278900146484375, -0.24452972412109375, -0.2101593017578125, -0.17578887939453125, -0.14141845703125, -0.10704803466796875, -0.0726776123046875, -0.03830718994140625, -0.003936767578125, 0.03043365478515625, 0.0648040771484375, 0.09917449951171875, 0.133544921875, 0.16791534423828125, 0.2022857666015625, 0.23665618896484375, 0.271026611328125, 0.30539703369140625, 0.3397674560546875, 0.37413787841796875, 0.40850830078125, 0.44287872314453125, 0.4772491455078125, 0.5116195678710938, 0.545989990234375, 0.5803604125976562, 0.6147308349609375, 0.6491012573242188, 0.6834716796875, 0.7178421020507812, 0.7522125244140625, 0.7865829467773438, 0.820953369140625, 0.8553237915039062, 0.8896942138671875, 0.9240646362304688, 0.95843505859375, 0.9928054809570312, 1.0271759033203125, 1.0615463256835938, 1.095916748046875, 1.1302871704101562, 1.1646575927734375, 1.1990280151367188, 1.2333984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 0.0, 6.0, 9.0, 5.0, 14.0, 25.0, 28.0, 81.0, 146.0, 350.0, 1000.0, 3940.0, 22370.0, 373989.0, 3718752.0, 62358.0, 8333.0, 1928.0, 534.0, 189.0, 88.0, 46.0, 24.0, 19.0, 12.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.35546875, -4.20648193359375, -4.0574951171875, -3.90850830078125, -3.759521484375, -3.61053466796875, -3.4615478515625, -3.31256103515625, -3.16357421875, -3.01458740234375, -2.8656005859375, -2.71661376953125, -2.567626953125, -2.41864013671875, -2.2696533203125, -2.12066650390625, -1.9716796875, -1.82269287109375, -1.6737060546875, -1.52471923828125, -1.375732421875, -1.22674560546875, -1.0777587890625, -0.92877197265625, -0.77978515625, -0.63079833984375, -0.4818115234375, -0.33282470703125, -0.183837890625, -0.03485107421875, 0.1141357421875, 0.26312255859375, 0.412109375, 0.56109619140625, 0.7100830078125, 0.85906982421875, 1.008056640625, 1.15704345703125, 1.3060302734375, 1.45501708984375, 1.60400390625, 1.75299072265625, 1.9019775390625, 2.05096435546875, 2.199951171875, 2.34893798828125, 2.4979248046875, 2.64691162109375, 2.7958984375, 2.94488525390625, 3.0938720703125, 3.24285888671875, 3.391845703125, 3.54083251953125, 3.6898193359375, 3.83880615234375, 3.98779296875, 4.13677978515625, 4.2857666015625, 4.43475341796875, 4.583740234375, 4.73272705078125, 4.8817138671875, 5.03070068359375, 5.1796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 8.0, 13.0, 19.0, 24.0, 36.0, 51.0, 102.0, 144.0, 304.0, 767.0, 1511.0, 583.0, 208.0, 95.0, 45.0, 41.0, 29.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2188720703125, -4.105712890625, -3.9925537109375, -3.87939453125, -3.7662353515625, -3.653076171875, -3.5399169921875, -3.4267578125, -3.3135986328125, -3.200439453125, -3.0872802734375, -2.97412109375, -2.8609619140625, -2.747802734375, -2.6346435546875, -2.521484375, -2.4083251953125, -2.295166015625, -2.1820068359375, -2.06884765625, -1.9556884765625, -1.842529296875, -1.7293701171875, -1.6162109375, -1.5030517578125, -1.389892578125, -1.2767333984375, -1.16357421875, -1.0504150390625, -0.937255859375, -0.8240966796875, -0.7109375, -0.5977783203125, -0.484619140625, -0.3714599609375, -0.25830078125, -0.1451416015625, -0.031982421875, 0.0811767578125, 0.1943359375, 0.3074951171875, 0.420654296875, 0.5338134765625, 0.64697265625, 0.7601318359375, 0.873291015625, 0.9864501953125, 1.099609375, 1.2127685546875, 1.325927734375, 1.4390869140625, 1.55224609375, 1.6654052734375, 1.778564453125, 1.8917236328125, 2.0048828125, 2.1180419921875, 2.231201171875, 2.3443603515625, 2.45751953125, 2.5706787109375, 2.683837890625, 2.7969970703125, 2.91015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 21.0, 33.0, 76.0, 133.0, 243.0, 219.0, 127.0, 78.0, 29.0, 12.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203954696655273, -27.14052963256836, -26.077106475830078, -25.013681411743164, -23.95025634765625, -22.88683319091797, -21.823408126831055, -20.75998306274414, -19.69655990600586, -18.633134841918945, -17.569711685180664, -16.50628662109375, -15.442862510681152, -14.379438400268555, -13.31601333618164, -12.252589225769043, -11.189165115356445, -10.125741004943848, -9.06231689453125, -7.998891830444336, -6.935467720031738, -5.872043609619141, -4.808619022369385, -3.745194435119629, -2.6817703247070312, -1.6183459758758545, -0.5549216270446777, 0.508502721786499, 1.5719270706176758, 2.6353511810302734, 3.6987757682800293, 4.762200355529785, 5.82562255859375, 6.889046669006348, 7.9524712562561035, 9.01589584350586, 10.079319953918457, 11.142744064331055, 12.206169128417969, 13.269593238830566, 14.333017349243164, 15.396441459655762, 16.45986557006836, 17.523290634155273, 18.586715698242188, 19.65013885498047, 20.713563919067383, 21.776988983154297, 22.840412139892578, 23.903837203979492, 24.967260360717773, 26.030685424804688, 27.09410858154297, 28.157533645629883, 29.220958709716797, 30.284381866455078, 31.347806930541992, 32.411231994628906, 33.47465515136719, 34.53807830810547, 35.601505279541016, 36.6649284362793, 37.72835159301758, 38.791778564453125, 39.855201721191406]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 17.0, 16.0, 23.0, 29.0, 31.0, 41.0, 27.0, 47.0, 54.0, 58.0, 65.0, 83.0, 64.0, 66.0, 62.0, 55.0, 44.0, 41.0, 33.0, 30.0, 23.0, 19.0, 16.0, 9.0, 3.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64159393310547, -16.08203887939453, -15.522483825683594, -14.962928771972656, -14.403374671936035, -13.843819618225098, -13.28426456451416, -12.724709510803223, -12.165155410766602, -11.605600357055664, -11.046045303344727, -10.486490249633789, -9.926936149597168, -9.36738109588623, -8.807826042175293, -8.248270988464355, -7.688715934753418, -7.1291608810424805, -6.569606304168701, -6.010051250457764, -5.450496673583984, -4.890941619873047, -4.331386566162109, -3.771831750869751, -3.2122769355773926, -2.652722120285034, -2.093167304992676, -1.5336122512817383, -0.9740574359893799, -0.4145026206970215, 0.14505243301391602, 0.7046072483062744, 1.2641620635986328, 1.8237168788909912, 2.3832716941833496, 2.942826747894287, 3.5023815631866455, 4.061936378479004, 4.621491432189941, 5.181046485900879, 5.740601062774658, 6.300156116485596, 6.859710693359375, 7.4192657470703125, 7.97882080078125, 8.538375854492188, 9.097930908203125, 9.657485008239746, 10.217040061950684, 10.776595115661621, 11.336150169372559, 11.89570426940918, 12.455259323120117, 13.014814376831055, 13.574369430541992, 14.13392448425293, 14.693479537963867, 15.253034591674805, 15.812589645385742, 16.37214469909668, 16.931699752807617, 17.491252899169922, 18.05080795288086, 18.610363006591797, 19.169918060302734]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 8.0, 7.0, 9.0, 21.0, 23.0, 35.0, 56.0, 91.0, 127.0, 186.0, 300.0, 517.0, 863.0, 1439.0, 2460.0, 4559.0, 8779.0, 17123.0, 36152.0, 76015.0, 157046.0, 264373.0, 235266.0, 125374.0, 59923.0, 28160.0, 13727.0, 7011.0, 3756.0, 2095.0, 1177.0, 692.0, 394.0, 264.0, 166.0, 123.0, 83.0, 54.0, 38.0, 30.0, 19.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3171844482421875, -1.273040771484375, -1.2288970947265625, -1.18475341796875, -1.1406097412109375, -1.096466064453125, -1.0523223876953125, -1.0081787109375, -0.9640350341796875, -0.919891357421875, -0.8757476806640625, -0.83160400390625, -0.7874603271484375, -0.743316650390625, -0.6991729736328125, -0.655029296875, -0.6108856201171875, -0.566741943359375, -0.5225982666015625, -0.47845458984375, -0.4343109130859375, -0.390167236328125, -0.3460235595703125, -0.3018798828125, -0.2577362060546875, -0.213592529296875, -0.1694488525390625, -0.12530517578125, -0.0811614990234375, -0.037017822265625, 0.0071258544921875, 0.05126953125, 0.0954132080078125, 0.139556884765625, 0.1837005615234375, 0.22784423828125, 0.2719879150390625, 0.316131591796875, 0.3602752685546875, 0.4044189453125, 0.4485626220703125, 0.492706298828125, 0.5368499755859375, 0.58099365234375, 0.6251373291015625, 0.669281005859375, 0.7134246826171875, 0.757568359375, 0.8017120361328125, 0.845855712890625, 0.8899993896484375, 0.93414306640625, 0.9782867431640625, 1.022430419921875, 1.0665740966796875, 1.1107177734375, 1.1548614501953125, 1.199005126953125, 1.2431488037109375, 1.28729248046875, 1.3314361572265625, 1.375579833984375, 1.4197235107421875, 1.4638671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 0.0, 4.0, 6.0, 13.0, 16.0, 19.0, 25.0, 29.0, 32.0, 33.0, 53.0, 33.0, 46.0, 63.0, 47.0, 44.0, 54.0, 49.0, 56.0, 48.0, 62.0, 36.0, 40.0, 32.0, 24.0, 20.0, 31.0, 18.0, 16.0, 10.0, 8.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0244140625, -0.9920806884765625, -0.959747314453125, -0.9274139404296875, -0.89508056640625, -0.8627471923828125, -0.830413818359375, -0.7980804443359375, -0.7657470703125, -0.7334136962890625, -0.701080322265625, -0.6687469482421875, -0.63641357421875, -0.6040802001953125, -0.571746826171875, -0.5394134521484375, -0.507080078125, -0.4747467041015625, -0.442413330078125, -0.4100799560546875, -0.37774658203125, -0.3454132080078125, -0.313079833984375, -0.2807464599609375, -0.2484130859375, -0.2160797119140625, -0.183746337890625, -0.1514129638671875, -0.11907958984375, -0.0867462158203125, -0.054412841796875, -0.0220794677734375, 0.01025390625, 0.0425872802734375, 0.074920654296875, 0.1072540283203125, 0.13958740234375, 0.1719207763671875, 0.204254150390625, 0.2365875244140625, 0.2689208984375, 0.3012542724609375, 0.333587646484375, 0.3659210205078125, 0.39825439453125, 0.4305877685546875, 0.462921142578125, 0.4952545166015625, 0.527587890625, 0.5599212646484375, 0.592254638671875, 0.6245880126953125, 0.65692138671875, 0.6892547607421875, 0.721588134765625, 0.7539215087890625, 0.7862548828125, 0.8185882568359375, 0.850921630859375, 0.8832550048828125, 0.91558837890625, 0.9479217529296875, 0.980255126953125, 1.0125885009765625, 1.044921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 9.0, 9.0, 20.0, 28.0, 40.0, 63.0, 110.0, 146.0, 213.0, 335.0, 553.0, 872.0, 1865.0, 4383.0, 14832.0, 77468.0, 561147.0, 323038.0, 46319.0, 10096.0, 3351.0, 1501.0, 829.0, 495.0, 262.0, 193.0, 117.0, 93.0, 42.0, 34.0, 24.0, 21.0, 12.0, 9.0, 10.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8101806640625, -2.716064453125, -2.6219482421875, -2.52783203125, -2.4337158203125, -2.339599609375, -2.2454833984375, -2.1513671875, -2.0572509765625, -1.963134765625, -1.8690185546875, -1.77490234375, -1.6807861328125, -1.586669921875, -1.4925537109375, -1.3984375, -1.3043212890625, -1.210205078125, -1.1160888671875, -1.02197265625, -0.9278564453125, -0.833740234375, -0.7396240234375, -0.6455078125, -0.5513916015625, -0.457275390625, -0.3631591796875, -0.26904296875, -0.1749267578125, -0.080810546875, 0.0133056640625, 0.107421875, 0.2015380859375, 0.295654296875, 0.3897705078125, 0.48388671875, 0.5780029296875, 0.672119140625, 0.7662353515625, 0.8603515625, 0.9544677734375, 1.048583984375, 1.1427001953125, 1.23681640625, 1.3309326171875, 1.425048828125, 1.5191650390625, 1.61328125, 1.7073974609375, 1.801513671875, 1.8956298828125, 1.98974609375, 2.0838623046875, 2.177978515625, 2.2720947265625, 2.3662109375, 2.4603271484375, 2.554443359375, 2.6485595703125, 2.74267578125, 2.8367919921875, 2.930908203125, 3.0250244140625, 3.119140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 7.0, 11.0, 9.0, 16.0, 14.0, 14.0, 18.0, 22.0, 28.0, 36.0, 37.0, 25.0, 46.0, 40.0, 36.0, 46.0, 53.0, 37.0, 45.0, 52.0, 37.0, 37.0, 44.0, 33.0, 42.0, 37.0, 27.0, 15.0, 25.0, 18.0, 16.0, 12.0, 3.0, 5.0, 8.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.626953125, -3.511871337890625, -3.39678955078125, -3.281707763671875, -3.1666259765625, -3.051544189453125, -2.93646240234375, -2.821380615234375, -2.706298828125, -2.591217041015625, -2.47613525390625, -2.361053466796875, -2.2459716796875, -2.130889892578125, -2.01580810546875, -1.900726318359375, -1.78564453125, -1.670562744140625, -1.55548095703125, -1.440399169921875, -1.3253173828125, -1.210235595703125, -1.09515380859375, -0.980072021484375, -0.864990234375, -0.749908447265625, -0.63482666015625, -0.519744873046875, -0.4046630859375, -0.289581298828125, -0.17449951171875, -0.059417724609375, 0.0556640625, 0.170745849609375, 0.28582763671875, 0.400909423828125, 0.5159912109375, 0.631072998046875, 0.74615478515625, 0.861236572265625, 0.976318359375, 1.091400146484375, 1.20648193359375, 1.321563720703125, 1.4366455078125, 1.551727294921875, 1.66680908203125, 1.781890869140625, 1.89697265625, 2.012054443359375, 2.12713623046875, 2.242218017578125, 2.3572998046875, 2.472381591796875, 2.58746337890625, 2.702545166015625, 2.817626953125, 2.932708740234375, 3.04779052734375, 3.162872314453125, 3.2779541015625, 3.393035888671875, 3.50811767578125, 3.623199462890625, 3.73828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 1.0, 8.0, 16.0, 25.0, 41.0, 67.0, 114.0, 229.0, 451.0, 1068.0, 3575.0, 22706.0, 591134.0, 405261.0, 18668.0, 3258.0, 1078.0, 425.0, 181.0, 97.0, 46.0, 33.0, 24.0, 12.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.42718505859375, -1.3699951171875, -1.31280517578125, -1.255615234375, -1.19842529296875, -1.1412353515625, -1.08404541015625, -1.02685546875, -0.96966552734375, -0.9124755859375, -0.85528564453125, -0.798095703125, -0.74090576171875, -0.6837158203125, -0.62652587890625, -0.5693359375, -0.51214599609375, -0.4549560546875, -0.39776611328125, -0.340576171875, -0.28338623046875, -0.2261962890625, -0.16900634765625, -0.11181640625, -0.05462646484375, 0.0025634765625, 0.05975341796875, 0.116943359375, 0.17413330078125, 0.2313232421875, 0.28851318359375, 0.345703125, 0.40289306640625, 0.4600830078125, 0.51727294921875, 0.574462890625, 0.63165283203125, 0.6888427734375, 0.74603271484375, 0.80322265625, 0.86041259765625, 0.9176025390625, 0.97479248046875, 1.031982421875, 1.08917236328125, 1.1463623046875, 1.20355224609375, 1.2607421875, 1.31793212890625, 1.3751220703125, 1.43231201171875, 1.489501953125, 1.54669189453125, 1.6038818359375, 1.66107177734375, 1.71826171875, 1.77545166015625, 1.8326416015625, 1.88983154296875, 1.947021484375, 2.00421142578125, 2.0614013671875, 2.11859130859375, 2.17578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 11.0, 18.0, 16.0, 30.0, 32.0, 30.0, 40.0, 63.0, 74.0, 94.0, 101.0, 93.0, 81.0, 73.0, 70.0, 31.0, 37.0, 22.0, 18.0, 13.0, 11.0, 1.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00025326013565063477, -0.00024688243865966797, -0.00024050474166870117, -0.00023412704467773438, -0.00022774934768676758, -0.00022137165069580078, -0.00021499395370483398, -0.0002086162567138672, -0.0002022385597229004, -0.0001958608627319336, -0.0001894831657409668, -0.00018310546875, -0.0001767277717590332, -0.0001703500747680664, -0.0001639723777770996, -0.0001575946807861328, -0.00015121698379516602, -0.00014483928680419922, -0.00013846158981323242, -0.00013208389282226562, -0.00012570619583129883, -0.00011932849884033203, -0.00011295080184936523, -0.00010657310485839844, -0.00010019540786743164, -9.381771087646484e-05, -8.744001388549805e-05, -8.106231689453125e-05, -7.468461990356445e-05, -6.830692291259766e-05, -6.192922592163086e-05, -5.555152893066406e-05, -4.9173831939697266e-05, -4.279613494873047e-05, -3.641843795776367e-05, -3.0040740966796875e-05, -2.3663043975830078e-05, -1.728534698486328e-05, -1.0907649993896484e-05, -4.5299530029296875e-06, 1.8477439880371094e-06, 8.225440979003906e-06, 1.4603137969970703e-05, 2.09808349609375e-05, 2.7358531951904297e-05, 3.3736228942871094e-05, 4.011392593383789e-05, 4.649162292480469e-05, 5.2869319915771484e-05, 5.924701690673828e-05, 6.562471389770508e-05, 7.200241088867188e-05, 7.838010787963867e-05, 8.475780487060547e-05, 9.113550186157227e-05, 9.751319885253906e-05, 0.00010389089584350586, 0.00011026859283447266, 0.00011664628982543945, 0.00012302398681640625, 0.00012940168380737305, 0.00013577938079833984, 0.00014215707778930664, 0.00014853477478027344]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 20.0, 22.0, 31.0, 43.0, 76.0, 148.0, 277.0, 554.0, 1278.0, 3431.0, 13945.0, 123505.0, 764892.0, 120715.0, 13728.0, 3409.0, 1228.0, 540.0, 271.0, 161.0, 97.0, 60.0, 37.0, 27.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8165740966796875, -1.772796630859375, -1.7290191650390625, -1.68524169921875, -1.6414642333984375, -1.597686767578125, -1.5539093017578125, -1.5101318359375, -1.4663543701171875, -1.422576904296875, -1.3787994384765625, -1.33502197265625, -1.2912445068359375, -1.247467041015625, -1.2036895751953125, -1.159912109375, -1.1161346435546875, -1.072357177734375, -1.0285797119140625, -0.98480224609375, -0.9410247802734375, -0.897247314453125, -0.8534698486328125, -0.8096923828125, -0.7659149169921875, -0.722137451171875, -0.6783599853515625, -0.63458251953125, -0.5908050537109375, -0.547027587890625, -0.5032501220703125, -0.45947265625, -0.4156951904296875, -0.371917724609375, -0.3281402587890625, -0.28436279296875, -0.2405853271484375, -0.196807861328125, -0.1530303955078125, -0.1092529296875, -0.0654754638671875, -0.021697998046875, 0.0220794677734375, 0.06585693359375, 0.1096343994140625, 0.153411865234375, 0.1971893310546875, 0.240966796875, 0.2847442626953125, 0.328521728515625, 0.3722991943359375, 0.41607666015625, 0.4598541259765625, 0.503631591796875, 0.5474090576171875, 0.5911865234375, 0.6349639892578125, 0.678741455078125, 0.7225189208984375, 0.76629638671875, 0.8100738525390625, 0.853851318359375, 0.8976287841796875, 0.94140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 21.0, 24.0, 36.0, 42.0, 74.0, 78.0, 62.0, 92.0, 116.0, 96.0, 90.0, 69.0, 44.0, 41.0, 29.0, 29.0, 14.0, 4.0, 11.0, 6.0, 0.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.103515625, -2.0527496337890625, -2.001983642578125, -1.9512176513671875, -1.90045166015625, -1.8496856689453125, -1.798919677734375, -1.7481536865234375, -1.6973876953125, -1.6466217041015625, -1.595855712890625, -1.5450897216796875, -1.49432373046875, -1.4435577392578125, -1.392791748046875, -1.3420257568359375, -1.291259765625, -1.2404937744140625, -1.189727783203125, -1.1389617919921875, -1.08819580078125, -1.0374298095703125, -0.986663818359375, -0.9358978271484375, -0.8851318359375, -0.8343658447265625, -0.783599853515625, -0.7328338623046875, -0.68206787109375, -0.6313018798828125, -0.580535888671875, -0.5297698974609375, -0.47900390625, -0.4282379150390625, -0.377471923828125, -0.3267059326171875, -0.27593994140625, -0.2251739501953125, -0.174407958984375, -0.1236419677734375, -0.0728759765625, -0.0221099853515625, 0.028656005859375, 0.0794219970703125, 0.13018798828125, 0.1809539794921875, 0.231719970703125, 0.2824859619140625, 0.333251953125, 0.3840179443359375, 0.434783935546875, 0.4855499267578125, 0.53631591796875, 0.5870819091796875, 0.637847900390625, 0.6886138916015625, 0.7393798828125, 0.7901458740234375, 0.840911865234375, 0.8916778564453125, 0.94244384765625, 0.9932098388671875, 1.043975830078125, 1.0947418212890625, 1.1455078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 21.0, 107.0, 242.0, 357.0, 193.0, 48.0, 11.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57146453857422, -38.9788818359375, -37.38629913330078, -35.79371643066406, -34.201133728027344, -32.608551025390625, -31.01597023010254, -29.42338752746582, -27.8308048248291, -26.238222122192383, -24.645639419555664, -23.053058624267578, -21.46047592163086, -19.86789321899414, -18.275310516357422, -16.682727813720703, -15.090145111083984, -13.497562408447266, -11.904979705810547, -10.312397956848145, -8.719815254211426, -7.127232551574707, -5.534650802612305, -3.942068099975586, -2.349485397338867, -0.7569029331207275, 0.8356795310974121, 2.4282617568969727, 4.020844459533691, 5.61342716217041, 7.2060089111328125, 8.798591613769531, 10.391170501708984, 11.983753204345703, 13.576335906982422, 15.168917655944824, 16.76150131225586, 18.354084014892578, 19.946664810180664, 21.539247512817383, 23.1318302154541, 24.72441291809082, 26.31699562072754, 27.909576416015625, 29.502159118652344, 31.094741821289062, 32.68732452392578, 34.2799072265625, 35.87248992919922, 37.46507263183594, 39.057655334472656, 40.650238037109375, 42.242820739746094, 43.83540344238281, 45.42798614501953, 47.02056884765625, 48.61315155029297, 50.20573425292969, 51.798316955566406, 53.390899658203125, 54.983482360839844, 56.57606506347656, 58.16864776611328, 59.76123046875, 61.35380935668945]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 16.0, 13.0, 23.0, 35.0, 30.0, 30.0, 49.0, 74.0, 73.0, 71.0, 81.0, 77.0, 58.0, 63.0, 51.0, 44.0, 50.0, 30.0, 23.0, 16.0, 10.0, 12.0, 19.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.497474670410156, -23.804574966430664, -23.11167335510254, -22.418773651123047, -21.725872039794922, -21.03297233581543, -20.340072631835938, -19.647171020507812, -18.95427131652832, -18.261371612548828, -17.568470001220703, -16.87557029724121, -16.18267059326172, -15.489768981933594, -14.796869277954102, -14.103968620300293, -13.411067962646484, -12.718167304992676, -12.025266647338867, -11.332366943359375, -10.639466285705566, -9.946565628051758, -9.253665924072266, -8.560765266418457, -7.867864608764648, -7.17496395111084, -6.4820637702941895, -5.789163589477539, -5.0962629318237305, -4.403362274169922, -3.7104620933532715, -3.017561912536621, -2.3246631622314453, -1.6317627429962158, -0.9388623237609863, -0.24596190452575684, 0.44693851470947266, 1.1398389339447021, 1.8327393531799316, 2.525639533996582, 3.2185401916503906, 3.91144061088562, 4.60434103012085, 5.2972412109375, 5.990141868591309, 6.683042526245117, 7.375942707061768, 8.068842887878418, 8.761743545532227, 9.454644203186035, 10.147544860839844, 10.840444564819336, 11.533345222473145, 12.226245880126953, 12.919145584106445, 13.612046241760254, 14.304946899414062, 14.997847557067871, 15.69074821472168, 16.383647918701172, 17.076549530029297, 17.76944923400879, 18.46234893798828, 19.155250549316406, 19.8481502532959]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 9.0, 13.0, 13.0, 12.0, 15.0, 30.0, 24.0, 45.0, 77.0, 116.0, 222.0, 619.0, 4986.0, 170221.0, 3997475.0, 18003.0, 1497.0, 383.0, 170.0, 99.0, 71.0, 46.0, 32.0, 24.0, 19.0, 12.0, 14.0, 7.0, 8.0, 4.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.86016845703125, -5.6890869140625, -5.51800537109375, -5.346923828125, -5.17584228515625, -5.0047607421875, -4.83367919921875, -4.66259765625, -4.49151611328125, -4.3204345703125, -4.14935302734375, -3.978271484375, -3.80718994140625, -3.6361083984375, -3.46502685546875, -3.2939453125, -3.12286376953125, -2.9517822265625, -2.78070068359375, -2.609619140625, -2.43853759765625, -2.2674560546875, -2.09637451171875, -1.92529296875, -1.75421142578125, -1.5831298828125, -1.41204833984375, -1.240966796875, -1.06988525390625, -0.8988037109375, -0.72772216796875, -0.556640625, -0.38555908203125, -0.2144775390625, -0.04339599609375, 0.127685546875, 0.29876708984375, 0.4698486328125, 0.64093017578125, 0.81201171875, 0.98309326171875, 1.1541748046875, 1.32525634765625, 1.496337890625, 1.66741943359375, 1.8385009765625, 2.00958251953125, 2.1806640625, 2.35174560546875, 2.5228271484375, 2.69390869140625, 2.864990234375, 3.03607177734375, 3.2071533203125, 3.37823486328125, 3.54931640625, 3.72039794921875, 3.8914794921875, 4.06256103515625, 4.233642578125, 4.40472412109375, 4.5758056640625, 4.74688720703125, 4.91796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 22.0, 42.0, 69.0, 99.0, 137.0, 125.0, 147.0, 116.0, 95.0, 55.0, 46.0, 20.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.280487060546875, -2.19573974609375, -2.110992431640625, -2.0262451171875, -1.941497802734375, -1.85675048828125, -1.772003173828125, -1.687255859375, -1.602508544921875, -1.51776123046875, -1.433013916015625, -1.3482666015625, -1.263519287109375, -1.17877197265625, -1.094024658203125, -1.00927734375, -0.924530029296875, -0.83978271484375, -0.755035400390625, -0.6702880859375, -0.585540771484375, -0.50079345703125, -0.416046142578125, -0.331298828125, -0.246551513671875, -0.16180419921875, -0.077056884765625, 0.0076904296875, 0.092437744140625, 0.17718505859375, 0.261932373046875, 0.3466796875, 0.431427001953125, 0.51617431640625, 0.600921630859375, 0.6856689453125, 0.770416259765625, 0.85516357421875, 0.939910888671875, 1.024658203125, 1.109405517578125, 1.19415283203125, 1.278900146484375, 1.3636474609375, 1.448394775390625, 1.53314208984375, 1.617889404296875, 1.70263671875, 1.787384033203125, 1.87213134765625, 1.956878662109375, 2.0416259765625, 2.126373291015625, 2.21112060546875, 2.295867919921875, 2.380615234375, 2.465362548828125, 2.55010986328125, 2.634857177734375, 2.7196044921875, 2.804351806640625, 2.88909912109375, 2.973846435546875, 3.05859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 2.0, 8.0, 3.0, 14.0, 10.0, 25.0, 36.0, 76.0, 155.0, 291.0, 691.0, 1528.0, 3573.0, 9308.0, 25867.0, 103746.0, 1586633.0, 2290769.0, 123967.0, 29106.0, 10393.0, 4275.0, 1946.0, 860.0, 427.0, 246.0, 122.0, 70.0, 35.0, 32.0, 22.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.468719482421875, -1.41009521484375, -1.351470947265625, -1.2928466796875, -1.234222412109375, -1.17559814453125, -1.116973876953125, -1.058349609375, -0.999725341796875, -0.94110107421875, -0.882476806640625, -0.8238525390625, -0.765228271484375, -0.70660400390625, -0.647979736328125, -0.58935546875, -0.530731201171875, -0.47210693359375, -0.413482666015625, -0.3548583984375, -0.296234130859375, -0.23760986328125, -0.178985595703125, -0.120361328125, -0.061737060546875, -0.00311279296875, 0.055511474609375, 0.1141357421875, 0.172760009765625, 0.23138427734375, 0.290008544921875, 0.3486328125, 0.407257080078125, 0.46588134765625, 0.524505615234375, 0.5831298828125, 0.641754150390625, 0.70037841796875, 0.759002685546875, 0.817626953125, 0.876251220703125, 0.93487548828125, 0.993499755859375, 1.0521240234375, 1.110748291015625, 1.16937255859375, 1.227996826171875, 1.28662109375, 1.345245361328125, 1.40386962890625, 1.462493896484375, 1.5211181640625, 1.579742431640625, 1.63836669921875, 1.696990966796875, 1.755615234375, 1.814239501953125, 1.87286376953125, 1.931488037109375, 1.9901123046875, 2.048736572265625, 2.10736083984375, 2.165985107421875, 2.224609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 7.0, 6.0, 17.0, 16.0, 32.0, 30.0, 56.0, 80.0, 121.0, 237.0, 401.0, 725.0, 868.0, 592.0, 308.0, 182.0, 104.0, 73.0, 43.0, 35.0, 21.0, 19.0, 9.0, 11.0, 5.0, 9.0, 4.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.318084716796875, -1.25921630859375, -1.200347900390625, -1.1414794921875, -1.082611083984375, -1.02374267578125, -0.964874267578125, -0.906005859375, -0.847137451171875, -0.78826904296875, -0.729400634765625, -0.6705322265625, -0.611663818359375, -0.55279541015625, -0.493927001953125, -0.43505859375, -0.376190185546875, -0.31732177734375, -0.258453369140625, -0.1995849609375, -0.140716552734375, -0.08184814453125, -0.022979736328125, 0.035888671875, 0.094757080078125, 0.15362548828125, 0.212493896484375, 0.2713623046875, 0.330230712890625, 0.38909912109375, 0.447967529296875, 0.5068359375, 0.565704345703125, 0.62457275390625, 0.683441162109375, 0.7423095703125, 0.801177978515625, 0.86004638671875, 0.918914794921875, 0.977783203125, 1.036651611328125, 1.09552001953125, 1.154388427734375, 1.2132568359375, 1.272125244140625, 1.33099365234375, 1.389862060546875, 1.44873046875, 1.507598876953125, 1.56646728515625, 1.625335693359375, 1.6842041015625, 1.743072509765625, 1.80194091796875, 1.860809326171875, 1.919677734375, 1.978546142578125, 2.03741455078125, 2.096282958984375, 2.1551513671875, 2.214019775390625, 2.27288818359375, 2.331756591796875, 2.390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 17.0, 55.0, 126.0, 255.0, 266.0, 154.0, 63.0, 29.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.99540328979492, -39.19813537597656, -38.40087127685547, -37.60360336303711, -36.80633544921875, -36.00906753540039, -35.2118034362793, -34.41453552246094, -33.61726760864258, -32.81999969482422, -32.022735595703125, -31.225467681884766, -30.428199768066406, -29.63093376159668, -28.833667755126953, -28.036399841308594, -27.239133834838867, -26.44186782836914, -25.64459991455078, -24.847333908081055, -24.050065994262695, -23.25279998779297, -22.45553207397461, -21.658266067504883, -20.861000061035156, -20.06373405456543, -19.26646614074707, -18.469200134277344, -17.671932220458984, -16.874666213989258, -16.07740020751953, -15.280132293701172, -14.482866287231445, -13.685599327087402, -12.88833236694336, -12.091066360473633, -11.293798446655273, -10.496532440185547, -9.699265480041504, -8.901998519897461, -8.104731559753418, -7.307464599609375, -6.510197639465332, -5.712931156158447, -4.915664196014404, -4.118397235870361, -3.3211307525634766, -2.5238637924194336, -1.7265968322753906, -0.9293299913406372, -0.1320631504058838, 0.6652035713195801, 1.462470531463623, 2.259737491607666, 3.057003974914551, 3.8542709350585938, 4.651537895202637, 5.44880485534668, 6.246071815490723, 7.043338298797607, 7.84060525894165, 8.637872695922852, 9.435138702392578, 10.232405662536621, 11.029672622680664]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 6.0, 19.0, 11.0, 22.0, 23.0, 24.0, 30.0, 34.0, 46.0, 47.0, 49.0, 55.0, 49.0, 59.0, 55.0, 58.0, 52.0, 37.0, 35.0, 39.0, 28.0, 43.0, 33.0, 23.0, 21.0, 21.0, 20.0, 7.0, 4.0, 8.0, 1.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.039276123046875, -10.732244491577148, -10.425213813781738, -10.118182182312012, -9.811151504516602, -9.504119873046875, -9.197089195251465, -8.890057563781738, -8.583026885986328, -8.275995254516602, -7.968964576721191, -7.661933422088623, -7.354902267456055, -7.047871112823486, -6.740839958190918, -6.433808326721191, -6.126777172088623, -5.819746017456055, -5.512714862823486, -5.205683708190918, -4.89865255355835, -4.591621398925781, -4.284589767456055, -3.9775588512420654, -3.670527696609497, -3.3634965419769287, -3.0564653873443604, -2.749433994293213, -2.4424028396606445, -2.135371685028076, -1.8283405303955078, -1.5213093757629395, -1.214278221130371, -0.9072470664978027, -0.6002158522605896, -0.29318463802337646, 0.013846516609191895, 0.32087767124176025, 0.6279089450836182, 0.9349400997161865, 1.2419712543487549, 1.5490024089813232, 1.8560335636138916, 2.163064956665039, 2.4700961112976074, 2.777127265930176, 3.084158420562744, 3.3911895751953125, 3.698220729827881, 4.005251884460449, 4.312283039093018, 4.619314193725586, 4.926345348358154, 5.233376502990723, 5.540408134460449, 5.847438812255859, 6.154470443725586, 6.461501598358154, 6.768532752990723, 7.075563907623291, 7.382595062255859, 7.689626216888428, 7.996657371520996, 8.303689002990723, 8.610719680786133]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 9.0, 10.0, 5.0, 9.0, 22.0, 28.0, 45.0, 83.0, 127.0, 222.0, 370.0, 760.0, 1398.0, 3137.0, 7238.0, 18420.0, 50847.0, 153870.0, 381970.0, 280231.0, 95131.0, 32760.0, 12184.0, 5114.0, 2258.0, 1047.0, 560.0, 270.0, 152.0, 112.0, 64.0, 35.0, 26.0, 12.0, 14.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.91900634765625, -1.8604736328125, -1.80194091796875, -1.743408203125, -1.68487548828125, -1.6263427734375, -1.56781005859375, -1.50927734375, -1.45074462890625, -1.3922119140625, -1.33367919921875, -1.275146484375, -1.21661376953125, -1.1580810546875, -1.09954833984375, -1.041015625, -0.98248291015625, -0.9239501953125, -0.86541748046875, -0.806884765625, -0.74835205078125, -0.6898193359375, -0.63128662109375, -0.57275390625, -0.51422119140625, -0.4556884765625, -0.39715576171875, -0.338623046875, -0.28009033203125, -0.2215576171875, -0.16302490234375, -0.1044921875, -0.04595947265625, 0.0125732421875, 0.07110595703125, 0.129638671875, 0.18817138671875, 0.2467041015625, 0.30523681640625, 0.36376953125, 0.42230224609375, 0.4808349609375, 0.53936767578125, 0.597900390625, 0.65643310546875, 0.7149658203125, 0.77349853515625, 0.83203125, 0.89056396484375, 0.9490966796875, 1.00762939453125, 1.066162109375, 1.12469482421875, 1.1832275390625, 1.24176025390625, 1.30029296875, 1.35882568359375, 1.4173583984375, 1.47589111328125, 1.534423828125, 1.59295654296875, 1.6514892578125, 1.71002197265625, 1.7685546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 8.0, 10.0, 17.0, 22.0, 33.0, 42.0, 48.0, 61.0, 67.0, 78.0, 113.0, 80.0, 86.0, 82.0, 67.0, 44.0, 50.0, 31.0, 19.0, 15.0, 7.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7284393310546875, -1.677581787109375, -1.6267242431640625, -1.57586669921875, -1.5250091552734375, -1.474151611328125, -1.4232940673828125, -1.3724365234375, -1.3215789794921875, -1.270721435546875, -1.2198638916015625, -1.16900634765625, -1.1181488037109375, -1.067291259765625, -1.0164337158203125, -0.965576171875, -0.9147186279296875, -0.863861083984375, -0.8130035400390625, -0.76214599609375, -0.7112884521484375, -0.660430908203125, -0.6095733642578125, -0.5587158203125, -0.5078582763671875, -0.457000732421875, -0.4061431884765625, -0.35528564453125, -0.3044281005859375, -0.253570556640625, -0.2027130126953125, -0.15185546875, -0.1009979248046875, -0.050140380859375, 0.0007171630859375, 0.05157470703125, 0.1024322509765625, 0.153289794921875, 0.2041473388671875, 0.2550048828125, 0.3058624267578125, 0.356719970703125, 0.4075775146484375, 0.45843505859375, 0.5092926025390625, 0.560150146484375, 0.6110076904296875, 0.661865234375, 0.7127227783203125, 0.763580322265625, 0.8144378662109375, 0.86529541015625, 0.9161529541015625, 0.967010498046875, 1.0178680419921875, 1.0687255859375, 1.1195831298828125, 1.170440673828125, 1.2212982177734375, 1.27215576171875, 1.3230133056640625, 1.373870849609375, 1.4247283935546875, 1.4755859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 11.0, 13.0, 18.0, 17.0, 30.0, 59.0, 61.0, 94.0, 143.0, 201.0, 399.0, 703.0, 1519.0, 4191.0, 15835.0, 88121.0, 595014.0, 285102.0, 42752.0, 9047.0, 2773.0, 1107.0, 547.0, 290.0, 179.0, 104.0, 63.0, 47.0, 29.0, 21.0, 8.0, 8.0, 6.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.93359375, -2.841339111328125, -2.74908447265625, -2.656829833984375, -2.5645751953125, -2.472320556640625, -2.38006591796875, -2.287811279296875, -2.195556640625, -2.103302001953125, -2.01104736328125, -1.918792724609375, -1.8265380859375, -1.734283447265625, -1.64202880859375, -1.549774169921875, -1.45751953125, -1.365264892578125, -1.27301025390625, -1.180755615234375, -1.0885009765625, -0.996246337890625, -0.90399169921875, -0.811737060546875, -0.719482421875, -0.627227783203125, -0.53497314453125, -0.442718505859375, -0.3504638671875, -0.258209228515625, -0.16595458984375, -0.073699951171875, 0.0185546875, 0.110809326171875, 0.20306396484375, 0.295318603515625, 0.3875732421875, 0.479827880859375, 0.57208251953125, 0.664337158203125, 0.756591796875, 0.848846435546875, 0.94110107421875, 1.033355712890625, 1.1256103515625, 1.217864990234375, 1.31011962890625, 1.402374267578125, 1.49462890625, 1.586883544921875, 1.67913818359375, 1.771392822265625, 1.8636474609375, 1.955902099609375, 2.04815673828125, 2.140411376953125, 2.232666015625, 2.324920654296875, 2.41717529296875, 2.509429931640625, 2.6016845703125, 2.693939208984375, 2.78619384765625, 2.878448486328125, 2.970703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 0.0, 8.0, 5.0, 14.0, 6.0, 13.0, 12.0, 14.0, 16.0, 20.0, 25.0, 27.0, 26.0, 39.0, 39.0, 33.0, 53.0, 61.0, 43.0, 54.0, 47.0, 60.0, 50.0, 41.0, 50.0, 32.0, 25.0, 31.0, 33.0, 17.0, 13.0, 13.0, 16.0, 14.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.3446044921875, -3.238037109375, -3.1314697265625, -3.02490234375, -2.9183349609375, -2.811767578125, -2.7052001953125, -2.5986328125, -2.4920654296875, -2.385498046875, -2.2789306640625, -2.17236328125, -2.0657958984375, -1.959228515625, -1.8526611328125, -1.74609375, -1.6395263671875, -1.532958984375, -1.4263916015625, -1.31982421875, -1.2132568359375, -1.106689453125, -1.0001220703125, -0.8935546875, -0.7869873046875, -0.680419921875, -0.5738525390625, -0.46728515625, -0.3607177734375, -0.254150390625, -0.1475830078125, -0.041015625, 0.0655517578125, 0.172119140625, 0.2786865234375, 0.38525390625, 0.4918212890625, 0.598388671875, 0.7049560546875, 0.8115234375, 0.9180908203125, 1.024658203125, 1.1312255859375, 1.23779296875, 1.3443603515625, 1.450927734375, 1.5574951171875, 1.6640625, 1.7706298828125, 1.877197265625, 1.9837646484375, 2.09033203125, 2.1968994140625, 2.303466796875, 2.4100341796875, 2.5166015625, 2.6231689453125, 2.729736328125, 2.8363037109375, 2.94287109375, 3.0494384765625, 3.156005859375, 3.2625732421875, 3.369140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 15.0, 25.0, 30.0, 93.0, 242.0, 1038.0, 11156.0, 936631.0, 96247.0, 2386.0, 430.0, 132.0, 47.0, 37.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.588165283203125, -1.49859619140625, -1.409027099609375, -1.3194580078125, -1.229888916015625, -1.14031982421875, -1.050750732421875, -0.961181640625, -0.871612548828125, -0.78204345703125, -0.692474365234375, -0.6029052734375, -0.513336181640625, -0.42376708984375, -0.334197998046875, -0.24462890625, -0.155059814453125, -0.06549072265625, 0.024078369140625, 0.1136474609375, 0.203216552734375, 0.29278564453125, 0.382354736328125, 0.471923828125, 0.561492919921875, 0.65106201171875, 0.740631103515625, 0.8302001953125, 0.919769287109375, 1.00933837890625, 1.098907470703125, 1.1884765625, 1.278045654296875, 1.36761474609375, 1.457183837890625, 1.5467529296875, 1.636322021484375, 1.72589111328125, 1.815460205078125, 1.905029296875, 1.994598388671875, 2.08416748046875, 2.173736572265625, 2.2633056640625, 2.352874755859375, 2.44244384765625, 2.532012939453125, 2.62158203125, 2.711151123046875, 2.80072021484375, 2.890289306640625, 2.9798583984375, 3.069427490234375, 3.15899658203125, 3.248565673828125, 3.338134765625, 3.427703857421875, 3.51727294921875, 3.606842041015625, 3.6964111328125, 3.785980224609375, 3.87554931640625, 3.965118408203125, 4.0546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 17.0, 35.0, 35.0, 46.0, 55.0, 48.0, 59.0, 56.0, 89.0, 60.0, 68.0, 57.0, 52.0, 40.0, 42.0, 24.0, 27.0, 21.0, 19.0, 12.0, 11.0, 11.0, 9.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001404285430908203, -0.00013588741421699524, -0.00013134628534317017, -0.0001268051564693451, -0.00012226402759552002, -0.00011772289872169495, -0.00011318176984786987, -0.0001086406409740448, -0.00010409951210021973, -9.955838322639465e-05, -9.501725435256958e-05, -9.047612547874451e-05, -8.593499660491943e-05, -8.139386773109436e-05, -7.685273885726929e-05, -7.231160998344421e-05, -6.777048110961914e-05, -6.322935223579407e-05, -5.8688223361968994e-05, -5.414709448814392e-05, -4.960596561431885e-05, -4.5064836740493774e-05, -4.05237078666687e-05, -3.598257899284363e-05, -3.1441450119018555e-05, -2.690032124519348e-05, -2.2359192371368408e-05, -1.7818063497543335e-05, -1.3276934623718262e-05, -8.735805749893188e-06, -4.194676876068115e-06, 3.46451997756958e-07, 4.887580871582031e-06, 9.428709745407104e-06, 1.3969838619232178e-05, 1.851096749305725e-05, 2.3052096366882324e-05, 2.7593225240707397e-05, 3.213435411453247e-05, 3.6675482988357544e-05, 4.121661186218262e-05, 4.575774073600769e-05, 5.0298869609832764e-05, 5.483999848365784e-05, 5.938112735748291e-05, 6.392225623130798e-05, 6.846338510513306e-05, 7.300451397895813e-05, 7.75456428527832e-05, 8.208677172660828e-05, 8.662790060043335e-05, 9.116902947425842e-05, 9.57101583480835e-05, 0.00010025128722190857, 0.00010479241609573364, 0.00010933354496955872, 0.00011387467384338379, 0.00011841580271720886, 0.00012295693159103394, 0.000127498060464859, 0.00013203918933868408, 0.00013658031821250916, 0.00014112144708633423, 0.0001456625759601593, 0.00015020370483398438]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 13.0, 21.0, 41.0, 51.0, 71.0, 157.0, 271.0, 621.0, 1441.0, 4864.0, 34892.0, 689701.0, 294675.0, 16544.0, 3118.0, 1022.0, 467.0, 227.0, 114.0, 80.0, 49.0, 40.0, 20.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.560546875, -1.5157623291015625, -1.470977783203125, -1.4261932373046875, -1.38140869140625, -1.3366241455078125, -1.291839599609375, -1.2470550537109375, -1.2022705078125, -1.1574859619140625, -1.112701416015625, -1.0679168701171875, -1.02313232421875, -0.9783477783203125, -0.933563232421875, -0.8887786865234375, -0.843994140625, -0.7992095947265625, -0.754425048828125, -0.7096405029296875, -0.66485595703125, -0.6200714111328125, -0.575286865234375, -0.5305023193359375, -0.4857177734375, -0.4409332275390625, -0.396148681640625, -0.3513641357421875, -0.30657958984375, -0.2617950439453125, -0.217010498046875, -0.1722259521484375, -0.12744140625, -0.0826568603515625, -0.037872314453125, 0.0069122314453125, 0.05169677734375, 0.0964813232421875, 0.141265869140625, 0.1860504150390625, 0.2308349609375, 0.2756195068359375, 0.320404052734375, 0.3651885986328125, 0.40997314453125, 0.4547576904296875, 0.499542236328125, 0.5443267822265625, 0.589111328125, 0.6338958740234375, 0.678680419921875, 0.7234649658203125, 0.76824951171875, 0.8130340576171875, 0.857818603515625, 0.9026031494140625, 0.9473876953125, 0.9921722412109375, 1.036956787109375, 1.0817413330078125, 1.12652587890625, 1.1713104248046875, 1.216094970703125, 1.2608795166015625, 1.3056640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 15.0, 33.0, 33.0, 60.0, 81.0, 81.0, 118.0, 126.0, 113.0, 104.0, 80.0, 57.0, 35.0, 21.0, 14.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.129730224609375, -1.08367919921875, -1.037628173828125, -0.9915771484375, -0.945526123046875, -0.89947509765625, -0.853424072265625, -0.807373046875, -0.761322021484375, -0.71527099609375, -0.669219970703125, -0.6231689453125, -0.577117919921875, -0.53106689453125, -0.485015869140625, -0.43896484375, -0.392913818359375, -0.34686279296875, -0.300811767578125, -0.2547607421875, -0.208709716796875, -0.16265869140625, -0.116607666015625, -0.070556640625, -0.024505615234375, 0.02154541015625, 0.067596435546875, 0.1136474609375, 0.159698486328125, 0.20574951171875, 0.251800537109375, 0.2978515625, 0.343902587890625, 0.38995361328125, 0.436004638671875, 0.4820556640625, 0.528106689453125, 0.57415771484375, 0.620208740234375, 0.666259765625, 0.712310791015625, 0.75836181640625, 0.804412841796875, 0.8504638671875, 0.896514892578125, 0.94256591796875, 0.988616943359375, 1.03466796875, 1.080718994140625, 1.12677001953125, 1.172821044921875, 1.2188720703125, 1.264923095703125, 1.31097412109375, 1.357025146484375, 1.403076171875, 1.449127197265625, 1.49517822265625, 1.541229248046875, 1.5872802734375, 1.633331298828125, 1.67938232421875, 1.725433349609375, 1.771484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 22.0, 65.0, 94.0, 209.0, 289.0, 167.0, 99.0, 26.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.257118225097656, -43.23796463012695, -42.218814849853516, -41.19966125488281, -40.180511474609375, -39.16135787963867, -38.14220428466797, -37.12305450439453, -36.10390090942383, -35.084747314453125, -34.06559753417969, -33.046443939208984, -32.02729034423828, -31.008140563964844, -29.98898696899414, -28.96983528137207, -27.95068359375, -26.93153190612793, -25.91238021850586, -24.893226623535156, -23.874074935913086, -22.854923248291016, -21.835769653320312, -20.816617965698242, -19.797466278076172, -18.7783145904541, -17.75916290283203, -16.740009307861328, -15.720857620239258, -14.701705932617188, -13.6825532913208, -12.663400650024414, -11.644245147705078, -10.625093460083008, -9.605940818786621, -8.586788177490234, -7.567636489868164, -6.5484843254089355, -5.529332160949707, -4.5101799964904785, -3.49102783203125, -2.4718756675720215, -1.452723503112793, -0.43357133865356445, 0.5855808258056641, 1.6047329902648926, 2.623885154724121, 3.6430373191833496, 4.662189483642578, 5.681341648101807, 6.700493812561035, 7.719645977020264, 8.738798141479492, 9.757949829101562, 10.77710247039795, 11.796255111694336, 12.815406799316406, 13.834558486938477, 14.853711128234863, 15.87286376953125, 16.89201545715332, 17.91116714477539, 18.930320739746094, 19.949472427368164, 20.968624114990234]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 16.0, 27.0, 27.0, 27.0, 39.0, 60.0, 61.0, 62.0, 69.0, 96.0, 99.0, 65.0, 61.0, 52.0, 52.0, 35.0, 45.0, 35.0, 13.0, 21.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.88585662841797, -20.139802932739258, -19.393747329711914, -18.647693634033203, -17.90163803100586, -17.15558433532715, -16.409530639648438, -15.66347599029541, -14.917421340942383, -14.171366691589355, -13.425312042236328, -12.679258346557617, -11.93320369720459, -11.187149047851562, -10.441095352172852, -9.695040702819824, -8.948986053466797, -8.20293140411377, -7.4568772315979, -6.710823059082031, -5.964768409729004, -5.218713760375977, -4.472659587860107, -3.7266054153442383, -2.980550765991211, -2.2344963550567627, -1.4884419441223145, -0.7423875331878662, 0.0036668777465820312, 0.7497212886810303, 1.4957756996154785, 2.2418298721313477, 2.987882614135742, 3.7339370250701904, 4.479991436004639, 5.226045608520508, 5.972100257873535, 6.7181549072265625, 7.464209079742432, 8.2102632522583, 8.956317901611328, 9.702372550964355, 10.448427200317383, 11.194480895996094, 11.940535545349121, 12.686590194702148, 13.43264389038086, 14.178698539733887, 14.924753189086914, 15.670807838439941, 16.41686248779297, 17.16291618347168, 17.90896987915039, 18.655025482177734, 19.401079177856445, 20.147132873535156, 20.8931884765625, 21.63924217224121, 22.385297775268555, 23.131351470947266, 23.87740707397461, 24.62346076965332, 25.36951446533203, 26.115570068359375, 26.861623764038086]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 19.0, 31.0, 48.0, 80.0, 130.0, 252.0, 559.0, 1200.0, 3149.0, 10871.0, 55866.0, 743970.0, 3059850.0, 278162.0, 29675.0, 6513.0, 2050.0, 863.0, 432.0, 210.0, 118.0, 81.0, 42.0, 30.0, 22.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.25506591796875, -1.2034912109375, -1.15191650390625, -1.100341796875, -1.04876708984375, -0.9971923828125, -0.94561767578125, -0.89404296875, -0.84246826171875, -0.7908935546875, -0.73931884765625, -0.687744140625, -0.63616943359375, -0.5845947265625, -0.53302001953125, -0.4814453125, -0.42987060546875, -0.3782958984375, -0.32672119140625, -0.275146484375, -0.22357177734375, -0.1719970703125, -0.12042236328125, -0.06884765625, -0.01727294921875, 0.0343017578125, 0.08587646484375, 0.137451171875, 0.18902587890625, 0.2406005859375, 0.29217529296875, 0.34375, 0.39532470703125, 0.4468994140625, 0.49847412109375, 0.550048828125, 0.60162353515625, 0.6531982421875, 0.70477294921875, 0.75634765625, 0.80792236328125, 0.8594970703125, 0.91107177734375, 0.962646484375, 1.01422119140625, 1.0657958984375, 1.11737060546875, 1.1689453125, 1.22052001953125, 1.2720947265625, 1.32366943359375, 1.375244140625, 1.42681884765625, 1.4783935546875, 1.52996826171875, 1.58154296875, 1.63311767578125, 1.6846923828125, 1.73626708984375, 1.787841796875, 1.83941650390625, 1.8909912109375, 1.94256591796875, 1.994140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 4.0, 9.0, 16.0, 20.0, 29.0, 37.0, 46.0, 52.0, 54.0, 59.0, 83.0, 80.0, 78.0, 73.0, 67.0, 67.0, 55.0, 48.0, 35.0, 19.0, 23.0, 11.0, 12.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9523696899414062, -0.9110870361328125, -0.8698043823242188, -0.828521728515625, -0.7872390747070312, -0.7459564208984375, -0.7046737670898438, -0.66339111328125, -0.6221084594726562, -0.5808258056640625, -0.5395431518554688, -0.498260498046875, -0.45697784423828125, -0.4156951904296875, -0.37441253662109375, -0.3331298828125, -0.29184722900390625, -0.2505645751953125, -0.20928192138671875, -0.167999267578125, -0.12671661376953125, -0.0854339599609375, -0.04415130615234375, -0.00286865234375, 0.03841400146484375, 0.0796966552734375, 0.12097930908203125, 0.162261962890625, 0.20354461669921875, 0.2448272705078125, 0.28610992431640625, 0.327392578125, 0.36867523193359375, 0.4099578857421875, 0.45124053955078125, 0.492523193359375, 0.5338058471679688, 0.5750885009765625, 0.6163711547851562, 0.65765380859375, 0.6989364624023438, 0.7402191162109375, 0.7815017700195312, 0.822784423828125, 0.8640670776367188, 0.9053497314453125, 0.9466323852539062, 0.9879150390625, 1.0291976928710938, 1.0704803466796875, 1.1117630004882812, 1.153045654296875, 1.1943283081054688, 1.2356109619140625, 1.2768936157226562, 1.31817626953125, 1.3594589233398438, 1.4007415771484375, 1.4420242309570312, 1.483306884765625, 1.5245895385742188, 1.5658721923828125, 1.6071548461914062, 1.6484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 15.0, 22.0, 25.0, 38.0, 42.0, 73.0, 124.0, 243.0, 464.0, 999.0, 2495.0, 7320.0, 30758.0, 253667.0, 3533940.0, 319314.0, 32899.0, 7294.0, 2398.0, 979.0, 512.0, 246.0, 150.0, 76.0, 64.0, 28.0, 14.0, 18.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.159332275390625, -2.08624267578125, -2.013153076171875, -1.9400634765625, -1.866973876953125, -1.79388427734375, -1.720794677734375, -1.647705078125, -1.574615478515625, -1.50152587890625, -1.428436279296875, -1.3553466796875, -1.282257080078125, -1.20916748046875, -1.136077880859375, -1.06298828125, -0.989898681640625, -0.91680908203125, -0.843719482421875, -0.7706298828125, -0.697540283203125, -0.62445068359375, -0.551361083984375, -0.478271484375, -0.405181884765625, -0.33209228515625, -0.259002685546875, -0.1859130859375, -0.112823486328125, -0.03973388671875, 0.033355712890625, 0.1064453125, 0.179534912109375, 0.25262451171875, 0.325714111328125, 0.3988037109375, 0.471893310546875, 0.54498291015625, 0.618072509765625, 0.691162109375, 0.764251708984375, 0.83734130859375, 0.910430908203125, 0.9835205078125, 1.056610107421875, 1.12969970703125, 1.202789306640625, 1.27587890625, 1.348968505859375, 1.42205810546875, 1.495147705078125, 1.5682373046875, 1.641326904296875, 1.71441650390625, 1.787506103515625, 1.860595703125, 1.933685302734375, 2.00677490234375, 2.079864501953125, 2.1529541015625, 2.226043701171875, 2.29913330078125, 2.372222900390625, 2.4453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 5.0, 13.0, 25.0, 23.0, 43.0, 59.0, 100.0, 164.0, 315.0, 711.0, 1014.0, 737.0, 376.0, 178.0, 110.0, 69.0, 40.0, 26.0, 12.0, 9.0, 3.0, 5.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09735107421875, -3.0052490234375, -2.91314697265625, -2.821044921875, -2.72894287109375, -2.6368408203125, -2.54473876953125, -2.45263671875, -2.36053466796875, -2.2684326171875, -2.17633056640625, -2.084228515625, -1.99212646484375, -1.9000244140625, -1.80792236328125, -1.7158203125, -1.62371826171875, -1.5316162109375, -1.43951416015625, -1.347412109375, -1.25531005859375, -1.1632080078125, -1.07110595703125, -0.97900390625, -0.88690185546875, -0.7947998046875, -0.70269775390625, -0.610595703125, -0.51849365234375, -0.4263916015625, -0.33428955078125, -0.2421875, -0.15008544921875, -0.0579833984375, 0.03411865234375, 0.126220703125, 0.21832275390625, 0.3104248046875, 0.40252685546875, 0.49462890625, 0.58673095703125, 0.6788330078125, 0.77093505859375, 0.863037109375, 0.95513916015625, 1.0472412109375, 1.13934326171875, 1.2314453125, 1.32354736328125, 1.4156494140625, 1.50775146484375, 1.599853515625, 1.69195556640625, 1.7840576171875, 1.87615966796875, 1.96826171875, 2.06036376953125, 2.1524658203125, 2.24456787109375, 2.336669921875, 2.42877197265625, 2.5208740234375, 2.61297607421875, 2.705078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 22.0, 33.0, 109.0, 202.0, 257.0, 173.0, 105.0, 37.0, 15.0, 5.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.569122314453125, -23.75977325439453, -22.950424194335938, -22.141075134277344, -21.33172607421875, -20.522377014160156, -19.71302604675293, -18.903676986694336, -18.094327926635742, -17.28497886657715, -16.475629806518555, -15.666279792785645, -14.85693073272705, -14.047581672668457, -13.238231658935547, -12.428882598876953, -11.61953353881836, -10.810184478759766, -10.000835418701172, -9.191485404968262, -8.382136344909668, -7.572787284851074, -6.763437747955322, -5.95408821105957, -5.144739151000977, -4.335390090942383, -3.526040554046631, -2.716691255569458, -1.9073419570922852, -1.0979928970336914, -0.28864336013793945, 0.5207061767578125, 1.330057144165039, 2.139406442642212, 2.9487557411193848, 3.7581050395965576, 4.5674543380737305, 5.376803398132324, 6.186152935028076, 6.995502471923828, 7.804851531982422, 8.614200592041016, 9.42354965209961, 10.23289966583252, 11.042248725891113, 11.851597785949707, 12.660947799682617, 13.470296859741211, 14.279645919799805, 15.088994979858398, 15.898344039916992, 16.707693099975586, 17.517044067382812, 18.326393127441406, 19.1357421875, 19.945091247558594, 20.754440307617188, 21.56378936767578, 22.373138427734375, 23.18248748779297, 23.991836547851562, 24.801185607910156, 25.610536575317383, 26.419885635375977, 27.22923469543457]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 14.0, 15.0, 28.0, 20.0, 32.0, 26.0, 28.0, 37.0, 38.0, 40.0, 48.0, 43.0, 38.0, 51.0, 49.0, 45.0, 48.0, 39.0, 36.0, 35.0, 29.0, 27.0, 36.0, 26.0, 19.0, 15.0, 15.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.81758975982666, -10.494715690612793, -10.17184066772461, -9.848966598510742, -9.526092529296875, -9.203218460083008, -8.880343437194824, -8.557469367980957, -8.23459529876709, -7.9117207527160645, -7.588846683502197, -7.265972137451172, -6.943098068237305, -6.620223522186279, -6.297348976135254, -5.974474906921387, -5.651600360870361, -5.328725814819336, -5.005851745605469, -4.682977199554443, -4.360103130340576, -4.037228584289551, -3.7143542766571045, -3.391479969024658, -3.068605661392212, -2.7457313537597656, -2.4228570461273193, -2.099982738494873, -1.7771083116531372, -1.454234004020691, -1.131359577178955, -0.8084852695465088, -0.4856109619140625, -0.16273662447929382, 0.16013771295547485, 0.4830120801925659, 0.8058863878250122, 1.1287606954574585, 1.4516351222991943, 1.7745094299316406, 2.097383737564087, 2.420258045196533, 2.7431323528289795, 3.066006660461426, 3.388881206512451, 3.7117552757263184, 4.034629821777344, 4.357503890991211, 4.680378437042236, 5.003252983093262, 5.326127052307129, 5.649001598358154, 5.9718756675720215, 6.294750213623047, 6.617624282836914, 6.9404988288879395, 7.263373374938965, 7.58624792098999, 7.909121990203857, 8.231996536254883, 8.55487060546875, 8.877744674682617, 9.2006196975708, 9.523493766784668, 9.846367835998535]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 11.0, 12.0, 19.0, 26.0, 65.0, 90.0, 165.0, 246.0, 422.0, 742.0, 1656.0, 3257.0, 7405.0, 17309.0, 42954.0, 106416.0, 234440.0, 311552.0, 185660.0, 80064.0, 31923.0, 13000.0, 5614.0, 2630.0, 1261.0, 695.0, 371.0, 208.0, 134.0, 64.0, 57.0, 34.0, 17.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.267181396484375, -1.22674560546875, -1.186309814453125, -1.1458740234375, -1.105438232421875, -1.06500244140625, -1.024566650390625, -0.984130859375, -0.943695068359375, -0.90325927734375, -0.862823486328125, -0.8223876953125, -0.781951904296875, -0.74151611328125, -0.701080322265625, -0.66064453125, -0.620208740234375, -0.57977294921875, -0.539337158203125, -0.4989013671875, -0.458465576171875, -0.41802978515625, -0.377593994140625, -0.337158203125, -0.296722412109375, -0.25628662109375, -0.215850830078125, -0.1754150390625, -0.134979248046875, -0.09454345703125, -0.054107666015625, -0.013671875, 0.026763916015625, 0.06719970703125, 0.107635498046875, 0.1480712890625, 0.188507080078125, 0.22894287109375, 0.269378662109375, 0.309814453125, 0.350250244140625, 0.39068603515625, 0.431121826171875, 0.4715576171875, 0.511993408203125, 0.55242919921875, 0.592864990234375, 0.63330078125, 0.673736572265625, 0.71417236328125, 0.754608154296875, 0.7950439453125, 0.835479736328125, 0.87591552734375, 0.916351318359375, 0.956787109375, 0.997222900390625, 1.03765869140625, 1.078094482421875, 1.1185302734375, 1.158966064453125, 1.19940185546875, 1.239837646484375, 1.2802734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 10.0, 14.0, 13.0, 19.0, 32.0, 21.0, 55.0, 39.0, 42.0, 54.0, 49.0, 58.0, 61.0, 67.0, 55.0, 51.0, 55.0, 45.0, 35.0, 35.0, 30.0, 32.0, 22.0, 19.0, 12.0, 16.0, 7.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0615234375, -1.0304412841796875, -0.999359130859375, -0.9682769775390625, -0.93719482421875, -0.9061126708984375, -0.875030517578125, -0.8439483642578125, -0.8128662109375, -0.7817840576171875, -0.750701904296875, -0.7196197509765625, -0.68853759765625, -0.6574554443359375, -0.626373291015625, -0.5952911376953125, -0.564208984375, -0.5331268310546875, -0.502044677734375, -0.4709625244140625, -0.43988037109375, -0.4087982177734375, -0.377716064453125, -0.3466339111328125, -0.3155517578125, -0.2844696044921875, -0.253387451171875, -0.2223052978515625, -0.19122314453125, -0.1601409912109375, -0.129058837890625, -0.0979766845703125, -0.06689453125, -0.0358123779296875, -0.004730224609375, 0.0263519287109375, 0.05743408203125, 0.0885162353515625, 0.119598388671875, 0.1506805419921875, 0.1817626953125, 0.2128448486328125, 0.243927001953125, 0.2750091552734375, 0.30609130859375, 0.3371734619140625, 0.368255615234375, 0.3993377685546875, 0.430419921875, 0.4615020751953125, 0.492584228515625, 0.5236663818359375, 0.55474853515625, 0.5858306884765625, 0.616912841796875, 0.6479949951171875, 0.6790771484375, 0.7101593017578125, 0.741241455078125, 0.7723236083984375, 0.80340576171875, 0.8344879150390625, 0.865570068359375, 0.8966522216796875, 0.927734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 14.0, 14.0, 24.0, 37.0, 40.0, 59.0, 106.0, 128.0, 183.0, 263.0, 377.0, 586.0, 1020.0, 2016.0, 5548.0, 26407.0, 253199.0, 672252.0, 69672.0, 10071.0, 2979.0, 1276.0, 720.0, 457.0, 305.0, 186.0, 149.0, 127.0, 77.0, 63.0, 54.0, 30.0, 23.0, 16.0, 11.0, 15.0, 12.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-3.125, -3.03094482421875, -2.9368896484375, -2.84283447265625, -2.748779296875, -2.65472412109375, -2.5606689453125, -2.46661376953125, -2.37255859375, -2.27850341796875, -2.1844482421875, -2.09039306640625, -1.996337890625, -1.90228271484375, -1.8082275390625, -1.71417236328125, -1.6201171875, -1.52606201171875, -1.4320068359375, -1.33795166015625, -1.243896484375, -1.14984130859375, -1.0557861328125, -0.96173095703125, -0.86767578125, -0.77362060546875, -0.6795654296875, -0.58551025390625, -0.491455078125, -0.39739990234375, -0.3033447265625, -0.20928955078125, -0.115234375, -0.02117919921875, 0.0728759765625, 0.16693115234375, 0.260986328125, 0.35504150390625, 0.4490966796875, 0.54315185546875, 0.63720703125, 0.73126220703125, 0.8253173828125, 0.91937255859375, 1.013427734375, 1.10748291015625, 1.2015380859375, 1.29559326171875, 1.3896484375, 1.48370361328125, 1.5777587890625, 1.67181396484375, 1.765869140625, 1.85992431640625, 1.9539794921875, 2.04803466796875, 2.14208984375, 2.23614501953125, 2.3302001953125, 2.42425537109375, 2.518310546875, 2.61236572265625, 2.7064208984375, 2.80047607421875, 2.89453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 10.0, 12.0, 14.0, 7.0, 11.0, 13.0, 31.0, 25.0, 41.0, 31.0, 37.0, 47.0, 37.0, 30.0, 47.0, 42.0, 53.0, 41.0, 41.0, 31.0, 39.0, 32.0, 37.0, 37.0, 26.0, 41.0, 22.0, 22.0, 18.0, 19.0, 15.0, 11.0, 5.0, 11.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.427734375, -3.32080078125, -3.2138671875, -3.10693359375, -3.0, -2.89306640625, -2.7861328125, -2.67919921875, -2.572265625, -2.46533203125, -2.3583984375, -2.25146484375, -2.14453125, -2.03759765625, -1.9306640625, -1.82373046875, -1.716796875, -1.60986328125, -1.5029296875, -1.39599609375, -1.2890625, -1.18212890625, -1.0751953125, -0.96826171875, -0.861328125, -0.75439453125, -0.6474609375, -0.54052734375, -0.43359375, -0.32666015625, -0.2197265625, -0.11279296875, -0.005859375, 0.10107421875, 0.2080078125, 0.31494140625, 0.421875, 0.52880859375, 0.6357421875, 0.74267578125, 0.849609375, 0.95654296875, 1.0634765625, 1.17041015625, 1.27734375, 1.38427734375, 1.4912109375, 1.59814453125, 1.705078125, 1.81201171875, 1.9189453125, 2.02587890625, 2.1328125, 2.23974609375, 2.3466796875, 2.45361328125, 2.560546875, 2.66748046875, 2.7744140625, 2.88134765625, 2.98828125, 3.09521484375, 3.2021484375, 3.30908203125, 3.416015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 27.0, 42.0, 75.0, 222.0, 536.0, 2536.0, 41220.0, 941287.0, 58537.0, 3031.0, 645.0, 206.0, 80.0, 35.0, 19.0, 11.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.58502197265625, -1.5313720703125, -1.47772216796875, -1.424072265625, -1.37042236328125, -1.3167724609375, -1.26312255859375, -1.20947265625, -1.15582275390625, -1.1021728515625, -1.04852294921875, -0.994873046875, -0.94122314453125, -0.8875732421875, -0.83392333984375, -0.7802734375, -0.72662353515625, -0.6729736328125, -0.61932373046875, -0.565673828125, -0.51202392578125, -0.4583740234375, -0.40472412109375, -0.35107421875, -0.29742431640625, -0.2437744140625, -0.19012451171875, -0.136474609375, -0.08282470703125, -0.0291748046875, 0.02447509765625, 0.078125, 0.13177490234375, 0.1854248046875, 0.23907470703125, 0.292724609375, 0.34637451171875, 0.4000244140625, 0.45367431640625, 0.50732421875, 0.56097412109375, 0.6146240234375, 0.66827392578125, 0.721923828125, 0.77557373046875, 0.8292236328125, 0.88287353515625, 0.9365234375, 0.99017333984375, 1.0438232421875, 1.09747314453125, 1.151123046875, 1.20477294921875, 1.2584228515625, 1.31207275390625, 1.36572265625, 1.41937255859375, 1.4730224609375, 1.52667236328125, 1.580322265625, 1.63397216796875, 1.6876220703125, 1.74127197265625, 1.794921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 25.0, 17.0, 27.0, 47.0, 47.0, 92.0, 130.0, 117.0, 134.0, 94.0, 68.0, 49.0, 37.0, 24.0, 23.0, 17.0, 12.0, 4.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003330707550048828, -0.00032491981983184814, -0.0003167688846588135, -0.0003086179494857788, -0.00030046701431274414, -0.00029231607913970947, -0.0002841651439666748, -0.00027601420879364014, -0.00026786327362060547, -0.0002597123384475708, -0.00025156140327453613, -0.00024341046810150146, -0.0002352595329284668, -0.00022710859775543213, -0.00021895766258239746, -0.0002108067274093628, -0.00020265579223632812, -0.00019450485706329346, -0.0001863539218902588, -0.00017820298671722412, -0.00017005205154418945, -0.00016190111637115479, -0.00015375018119812012, -0.00014559924602508545, -0.00013744831085205078, -0.0001292973756790161, -0.00012114644050598145, -0.00011299550533294678, -0.00010484457015991211, -9.669363498687744e-05, -8.854269981384277e-05, -8.03917646408081e-05, -7.224082946777344e-05, -6.408989429473877e-05, -5.59389591217041e-05, -4.7788023948669434e-05, -3.9637088775634766e-05, -3.14861536026001e-05, -2.333521842956543e-05, -1.5184283256530762e-05, -7.033348083496094e-06, 1.1175870895385742e-06, 9.268522262573242e-06, 1.741945743560791e-05, 2.5570392608642578e-05, 3.3721327781677246e-05, 4.1872262954711914e-05, 5.002319812774658e-05, 5.817413330078125e-05, 6.632506847381592e-05, 7.447600364685059e-05, 8.262693881988525e-05, 9.077787399291992e-05, 9.892880916595459e-05, 0.00010707974433898926, 0.00011523067951202393, 0.0001233816146850586, 0.00013153254985809326, 0.00013968348503112793, 0.0001478344202041626, 0.00015598535537719727, 0.00016413629055023193, 0.0001722872257232666, 0.00018043816089630127, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 9.0, 17.0, 17.0, 36.0, 53.0, 108.0, 217.0, 429.0, 977.0, 2664.0, 13423.0, 196161.0, 778581.0, 47242.0, 5775.0, 1572.0, 599.0, 297.0, 161.0, 85.0, 57.0, 20.0, 24.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2838287353515625, -1.250274658203125, -1.2167205810546875, -1.18316650390625, -1.1496124267578125, -1.116058349609375, -1.0825042724609375, -1.0489501953125, -1.0153961181640625, -0.981842041015625, -0.9482879638671875, -0.91473388671875, -0.8811798095703125, -0.847625732421875, -0.8140716552734375, -0.780517578125, -0.7469635009765625, -0.713409423828125, -0.6798553466796875, -0.64630126953125, -0.6127471923828125, -0.579193115234375, -0.5456390380859375, -0.5120849609375, -0.4785308837890625, -0.444976806640625, -0.4114227294921875, -0.37786865234375, -0.3443145751953125, -0.310760498046875, -0.2772064208984375, -0.24365234375, -0.2100982666015625, -0.176544189453125, -0.1429901123046875, -0.10943603515625, -0.0758819580078125, -0.042327880859375, -0.0087738037109375, 0.0247802734375, 0.0583343505859375, 0.091888427734375, 0.1254425048828125, 0.15899658203125, 0.1925506591796875, 0.226104736328125, 0.2596588134765625, 0.293212890625, 0.3267669677734375, 0.360321044921875, 0.3938751220703125, 0.42742919921875, 0.4609832763671875, 0.494537353515625, 0.5280914306640625, 0.5616455078125, 0.5951995849609375, 0.628753662109375, 0.6623077392578125, 0.69586181640625, 0.7294158935546875, 0.762969970703125, 0.7965240478515625, 0.830078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 4.0, 10.0, 9.0, 10.0, 17.0, 21.0, 31.0, 39.0, 34.0, 41.0, 55.0, 72.0, 66.0, 63.0, 75.0, 59.0, 59.0, 55.0, 46.0, 44.0, 35.0, 34.0, 18.0, 16.0, 15.0, 12.0, 8.0, 4.0, 10.0, 4.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6647186279296875, -0.643402099609375, -0.6220855712890625, -0.60076904296875, -0.5794525146484375, -0.558135986328125, -0.5368194580078125, -0.5155029296875, -0.4941864013671875, -0.472869873046875, -0.4515533447265625, -0.43023681640625, -0.4089202880859375, -0.387603759765625, -0.3662872314453125, -0.344970703125, -0.3236541748046875, -0.302337646484375, -0.2810211181640625, -0.25970458984375, -0.2383880615234375, -0.217071533203125, -0.1957550048828125, -0.1744384765625, -0.1531219482421875, -0.131805419921875, -0.1104888916015625, -0.08917236328125, -0.0678558349609375, -0.046539306640625, -0.0252227783203125, -0.00390625, 0.0174102783203125, 0.038726806640625, 0.0600433349609375, 0.08135986328125, 0.1026763916015625, 0.123992919921875, 0.1453094482421875, 0.1666259765625, 0.1879425048828125, 0.209259033203125, 0.2305755615234375, 0.25189208984375, 0.2732086181640625, 0.294525146484375, 0.3158416748046875, 0.337158203125, 0.3584747314453125, 0.379791259765625, 0.4011077880859375, 0.42242431640625, 0.4437408447265625, 0.465057373046875, 0.4863739013671875, 0.5076904296875, 0.5290069580078125, 0.550323486328125, 0.5716400146484375, 0.59295654296875, 0.6142730712890625, 0.635589599609375, 0.6569061279296875, 0.67822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 11.0, 29.0, 33.0, 90.0, 154.0, 215.0, 213.0, 117.0, 55.0, 39.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.04113006591797, -19.432435989379883, -18.823741912841797, -18.215045928955078, -17.606351852416992, -16.997657775878906, -16.38896369934082, -15.780268669128418, -15.171573638916016, -14.56287956237793, -13.954184532165527, -13.345490455627441, -12.736795425415039, -12.128101348876953, -11.519407272338867, -10.910712242126465, -10.302018165588379, -9.693324089050293, -9.08462905883789, -8.475934982299805, -7.867239952087402, -7.258545875549316, -6.649851322174072, -6.041156768798828, -5.432462215423584, -4.82376766204834, -4.215073108673096, -3.6063787937164307, -2.9976842403411865, -2.3889896869659424, -1.7802953720092773, -1.1716008186340332, -0.5629062652587891, 0.0457882285118103, 0.6544827222824097, 1.2631771564483643, 1.8718717098236084, 2.4805662631988525, 3.0892605781555176, 3.6979551315307617, 4.306649684906006, 4.91534423828125, 5.524038791656494, 6.132733345031738, 6.741427421569824, 7.350122451782227, 7.9588165283203125, 8.567510604858398, 9.1762056350708, 9.784899711608887, 10.393594741821289, 11.002288818359375, 11.610983848571777, 12.219677925109863, 12.828372955322266, 13.437067031860352, 14.045761108398438, 14.654455184936523, 15.263150215148926, 15.871844291687012, 16.480539321899414, 17.0892333984375, 17.697927474975586, 18.306621551513672, 18.91531753540039]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 0.0, 4.0, 6.0, 8.0, 18.0, 11.0, 24.0, 21.0, 32.0, 42.0, 37.0, 33.0, 71.0, 60.0, 89.0, 116.0, 74.0, 64.0, 43.0, 50.0, 56.0, 32.0, 32.0, 23.0, 14.0, 11.0, 11.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.731983184814453, -26.08621597290039, -25.440446853637695, -24.794679641723633, -24.14891242980957, -23.503145217895508, -22.857376098632812, -22.21160888671875, -21.565841674804688, -20.920074462890625, -20.27430534362793, -19.628538131713867, -18.982770919799805, -18.337003707885742, -17.691234588623047, -17.045467376708984, -16.399700164794922, -15.753931999206543, -15.10816478729248, -14.462396621704102, -13.816629409790039, -13.17086124420166, -12.525093078613281, -11.879325866699219, -11.233556747436523, -10.587788581848145, -9.942021369934082, -9.296253204345703, -8.65048599243164, -8.004717826843262, -7.358950138092041, -6.71318244934082, -6.067415237426758, -5.421647548675537, -4.775879859924316, -4.1301116943359375, -3.484344244003296, -2.838576555252075, -2.1928086280822754, -1.5470409393310547, -0.901273250579834, -0.2555055022239685, 0.390262246131897, 1.0360300540924072, 1.681797742843628, 2.3275654315948486, 2.9733333587646484, 3.619101047515869, 4.26486873626709, 4.9106364250183105, 5.556404113769531, 6.20217227935791, 6.847939491271973, 7.493707656860352, 8.139474868774414, 8.785243034362793, 9.431011199951172, 10.07677936553955, 10.722546577453613, 11.368314743041992, 12.014081954956055, 12.659850120544434, 13.305618286132812, 13.951385498046875, 14.597152709960938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 17.0, 13.0, 29.0, 57.0, 90.0, 141.0, 304.0, 548.0, 1106.0, 2600.0, 7023.0, 24979.0, 126243.0, 919856.0, 2500677.0, 503236.0, 77142.0, 18822.0, 6155.0, 2586.0, 1265.0, 633.0, 352.0, 174.0, 88.0, 42.0, 32.0, 8.0, 13.0, 9.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3505859375, -1.3171234130859375, -1.283660888671875, -1.2501983642578125, -1.21673583984375, -1.1832733154296875, -1.149810791015625, -1.1163482666015625, -1.0828857421875, -1.0494232177734375, -1.015960693359375, -0.9824981689453125, -0.94903564453125, -0.9155731201171875, -0.882110595703125, -0.8486480712890625, -0.815185546875, -0.7817230224609375, -0.748260498046875, -0.7147979736328125, -0.68133544921875, -0.6478729248046875, -0.614410400390625, -0.5809478759765625, -0.5474853515625, -0.5140228271484375, -0.480560302734375, -0.4470977783203125, -0.41363525390625, -0.3801727294921875, -0.346710205078125, -0.3132476806640625, -0.27978515625, -0.2463226318359375, -0.212860107421875, -0.1793975830078125, -0.14593505859375, -0.1124725341796875, -0.079010009765625, -0.0455474853515625, -0.0120849609375, 0.0213775634765625, 0.054840087890625, 0.0883026123046875, 0.12176513671875, 0.1552276611328125, 0.188690185546875, 0.2221527099609375, 0.255615234375, 0.2890777587890625, 0.322540283203125, 0.3560028076171875, 0.38946533203125, 0.4229278564453125, 0.456390380859375, 0.4898529052734375, 0.5233154296875, 0.5567779541015625, 0.590240478515625, 0.6237030029296875, 0.65716552734375, 0.6906280517578125, 0.724090576171875, 0.7575531005859375, 0.791015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 24.0, 43.0, 51.0, 71.0, 88.0, 88.0, 106.0, 105.0, 99.0, 85.0, 53.0, 45.0, 36.0, 25.0, 19.0, 11.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4375, -2.3855438232421875, -2.333587646484375, -2.2816314697265625, -2.22967529296875, -2.1777191162109375, -2.125762939453125, -2.0738067626953125, -2.0218505859375, -1.9698944091796875, -1.917938232421875, -1.8659820556640625, -1.81402587890625, -1.7620697021484375, -1.710113525390625, -1.6581573486328125, -1.606201171875, -1.5542449951171875, -1.502288818359375, -1.4503326416015625, -1.39837646484375, -1.3464202880859375, -1.294464111328125, -1.2425079345703125, -1.1905517578125, -1.1385955810546875, -1.086639404296875, -1.0346832275390625, -0.98272705078125, -0.9307708740234375, -0.878814697265625, -0.8268585205078125, -0.77490234375, -0.7229461669921875, -0.670989990234375, -0.6190338134765625, -0.56707763671875, -0.5151214599609375, -0.463165283203125, -0.4112091064453125, -0.3592529296875, -0.3072967529296875, -0.255340576171875, -0.2033843994140625, -0.15142822265625, -0.0994720458984375, -0.047515869140625, 0.0044403076171875, 0.056396484375, 0.1083526611328125, 0.160308837890625, 0.2122650146484375, 0.26422119140625, 0.3161773681640625, 0.368133544921875, 0.4200897216796875, 0.4720458984375, 0.5240020751953125, 0.575958251953125, 0.6279144287109375, 0.67987060546875, 0.7318267822265625, 0.783782958984375, 0.8357391357421875, 0.8876953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 10.0, 12.0, 20.0, 31.0, 50.0, 84.0, 156.0, 248.0, 449.0, 1015.0, 2702.0, 7728.0, 29591.0, 186522.0, 2978607.0, 879457.0, 80889.0, 17803.0, 5165.0, 1895.0, 808.0, 421.0, 218.0, 150.0, 73.0, 53.0, 36.0, 24.0, 19.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.71875, -1.6693115234375, -1.619873046875, -1.5704345703125, -1.52099609375, -1.4715576171875, -1.422119140625, -1.3726806640625, -1.3232421875, -1.2738037109375, -1.224365234375, -1.1749267578125, -1.12548828125, -1.0760498046875, -1.026611328125, -0.9771728515625, -0.927734375, -0.8782958984375, -0.828857421875, -0.7794189453125, -0.72998046875, -0.6805419921875, -0.631103515625, -0.5816650390625, -0.5322265625, -0.4827880859375, -0.433349609375, -0.3839111328125, -0.33447265625, -0.2850341796875, -0.235595703125, -0.1861572265625, -0.13671875, -0.0872802734375, -0.037841796875, 0.0115966796875, 0.06103515625, 0.1104736328125, 0.159912109375, 0.2093505859375, 0.2587890625, 0.3082275390625, 0.357666015625, 0.4071044921875, 0.45654296875, 0.5059814453125, 0.555419921875, 0.6048583984375, 0.654296875, 0.7037353515625, 0.753173828125, 0.8026123046875, 0.85205078125, 0.9014892578125, 0.950927734375, 1.0003662109375, 1.0498046875, 1.0992431640625, 1.148681640625, 1.1981201171875, 1.24755859375, 1.2969970703125, 1.346435546875, 1.3958740234375, 1.4453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 15.0, 14.0, 17.0, 26.0, 24.0, 63.0, 101.0, 121.0, 265.0, 442.0, 686.0, 775.0, 589.0, 305.0, 191.0, 139.0, 74.0, 34.0, 38.0, 43.0, 31.0, 18.0, 10.0, 10.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.8517913818359375, -1.790496826171875, -1.7292022705078125, -1.66790771484375, -1.6066131591796875, -1.545318603515625, -1.4840240478515625, -1.4227294921875, -1.3614349365234375, -1.300140380859375, -1.2388458251953125, -1.17755126953125, -1.1162567138671875, -1.054962158203125, -0.9936676025390625, -0.932373046875, -0.8710784912109375, -0.809783935546875, -0.7484893798828125, -0.68719482421875, -0.6259002685546875, -0.564605712890625, -0.5033111572265625, -0.4420166015625, -0.3807220458984375, -0.319427490234375, -0.2581329345703125, -0.19683837890625, -0.1355438232421875, -0.074249267578125, -0.0129547119140625, 0.04833984375, 0.1096343994140625, 0.170928955078125, 0.2322235107421875, 0.29351806640625, 0.3548126220703125, 0.416107177734375, 0.4774017333984375, 0.5386962890625, 0.5999908447265625, 0.661285400390625, 0.7225799560546875, 0.78387451171875, 0.8451690673828125, 0.906463623046875, 0.9677581787109375, 1.029052734375, 1.0903472900390625, 1.151641845703125, 1.2129364013671875, 1.27423095703125, 1.3355255126953125, 1.396820068359375, 1.4581146240234375, 1.5194091796875, 1.5807037353515625, 1.641998291015625, 1.7032928466796875, 1.76458740234375, 1.8258819580078125, 1.887176513671875, 1.9484710693359375, 2.009765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 31.0, 217.0, 438.0, 233.0, 53.0, 10.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.59027099609375, -34.2432746887207, -32.896278381347656, -31.549283981323242, -30.202289581298828, -28.85529327392578, -27.508296966552734, -26.16130256652832, -24.814308166503906, -23.46731185913086, -22.120317459106445, -20.7733211517334, -19.426326751708984, -18.079330444335938, -16.73233413696289, -15.385339736938477, -14.03834342956543, -12.6913480758667, -11.344352722167969, -9.997356414794922, -8.650362014770508, -7.303366184234619, -5.9563703536987305, -4.609375, -3.2623796463012695, -1.9153841733932495, -0.5683887004852295, 0.7786068916320801, 2.1256022453308105, 3.472597599029541, 4.81959342956543, 6.16658878326416, 7.513584136962891, 8.860579490661621, 10.207574844360352, 11.554571151733398, 12.901565551757812, 14.24856185913086, 15.59555721282959, 16.94255256652832, 18.289546966552734, 19.63654327392578, 20.983537673950195, 22.330533981323242, 23.677528381347656, 25.024524688720703, 26.37152099609375, 27.718515396118164, 29.06551170349121, 30.412508010864258, 31.759502410888672, 33.10649871826172, 34.453495025634766, 35.80048751831055, 37.147483825683594, 38.49448013305664, 39.84147644042969, 41.188472747802734, 42.53546905517578, 43.88246154785156, 45.22945785522461, 46.576454162597656, 47.9234504699707, 49.27044677734375, 50.61743927001953]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 11.0, 4.0, 6.0, 9.0, 13.0, 12.0, 24.0, 30.0, 37.0, 46.0, 53.0, 68.0, 45.0, 62.0, 78.0, 44.0, 65.0, 64.0, 53.0, 38.0, 49.0, 37.0, 36.0, 22.0, 25.0, 27.0, 10.0, 14.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546370506286621, -11.097363471984863, -10.648356437683105, -10.199349403381348, -9.750341415405273, -9.301334381103516, -8.852327346801758, -8.4033203125, -7.954313278198242, -7.505306243896484, -7.056299209594727, -6.6072916984558105, -6.158284664154053, -5.709277629852295, -5.260270118713379, -4.811263084411621, -4.362256050109863, -3.9132490158081055, -3.4642417430877686, -3.0152344703674316, -2.566227436065674, -2.117220401763916, -1.668213129043579, -1.2192058563232422, -0.7701988220214844, -0.321191668510437, 0.12781548500061035, 0.5768226385116577, 1.025829792022705, 1.474836826324463, 1.9238440990447998, 2.3728513717651367, 2.821859359741211, 3.2708663940429688, 3.7198736667633057, 4.168880939483643, 4.6178879737854, 5.066895008087158, 5.515902519226074, 5.964909553527832, 6.41391658782959, 6.862923622131348, 7.3119306564331055, 7.7609381675720215, 8.209945678710938, 8.658952713012695, 9.107959747314453, 9.556966781616211, 10.005973815917969, 10.454980850219727, 10.903987884521484, 11.352994918823242, 11.802001953125, 12.251008987426758, 12.700016975402832, 13.14902400970459, 13.598031044006348, 14.047038078308105, 14.496045112609863, 14.945052146911621, 15.394060134887695, 15.843067169189453, 16.29207420349121, 16.74108123779297, 17.190088272094727]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 21.0, 29.0, 35.0, 68.0, 127.0, 203.0, 416.0, 675.0, 1341.0, 2549.0, 5086.0, 10830.0, 24784.0, 56589.0, 131326.0, 269742.0, 285153.0, 145975.0, 63145.0, 26937.0, 12056.0, 5513.0, 2769.0, 1354.0, 811.0, 437.0, 221.0, 142.0, 74.0, 49.0, 40.0, 10.0, 7.0, 9.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0368804931640625, -0.998565673828125, -0.9602508544921875, -0.92193603515625, -0.8836212158203125, -0.845306396484375, -0.8069915771484375, -0.7686767578125, -0.7303619384765625, -0.692047119140625, -0.6537322998046875, -0.61541748046875, -0.5771026611328125, -0.538787841796875, -0.5004730224609375, -0.462158203125, -0.4238433837890625, -0.385528564453125, -0.3472137451171875, -0.30889892578125, -0.2705841064453125, -0.232269287109375, -0.1939544677734375, -0.1556396484375, -0.1173248291015625, -0.079010009765625, -0.0406951904296875, -0.00238037109375, 0.0359344482421875, 0.074249267578125, 0.1125640869140625, 0.15087890625, 0.1891937255859375, 0.227508544921875, 0.2658233642578125, 0.30413818359375, 0.3424530029296875, 0.380767822265625, 0.4190826416015625, 0.4573974609375, 0.4957122802734375, 0.534027099609375, 0.5723419189453125, 0.61065673828125, 0.6489715576171875, 0.687286376953125, 0.7256011962890625, 0.763916015625, 0.8022308349609375, 0.840545654296875, 0.8788604736328125, 0.91717529296875, 0.9554901123046875, 0.993804931640625, 1.0321197509765625, 1.0704345703125, 1.1087493896484375, 1.147064208984375, 1.1853790283203125, 1.22369384765625, 1.2620086669921875, 1.300323486328125, 1.3386383056640625, 1.376953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 10.0, 14.0, 14.0, 18.0, 22.0, 27.0, 36.0, 43.0, 53.0, 46.0, 60.0, 56.0, 70.0, 45.0, 56.0, 55.0, 50.0, 60.0, 38.0, 41.0, 22.0, 33.0, 29.0, 19.0, 18.0, 7.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0156402587890625, -0.985382080078125, -0.9551239013671875, -0.92486572265625, -0.8946075439453125, -0.864349365234375, -0.8340911865234375, -0.8038330078125, -0.7735748291015625, -0.743316650390625, -0.7130584716796875, -0.68280029296875, -0.6525421142578125, -0.622283935546875, -0.5920257568359375, -0.561767578125, -0.5315093994140625, -0.501251220703125, -0.4709930419921875, -0.44073486328125, -0.4104766845703125, -0.380218505859375, -0.3499603271484375, -0.3197021484375, -0.2894439697265625, -0.259185791015625, -0.2289276123046875, -0.19866943359375, -0.1684112548828125, -0.138153076171875, -0.1078948974609375, -0.07763671875, -0.0473785400390625, -0.017120361328125, 0.0131378173828125, 0.04339599609375, 0.0736541748046875, 0.103912353515625, 0.1341705322265625, 0.1644287109375, 0.1946868896484375, 0.224945068359375, 0.2552032470703125, 0.28546142578125, 0.3157196044921875, 0.345977783203125, 0.3762359619140625, 0.406494140625, 0.4367523193359375, 0.467010498046875, 0.4972686767578125, 0.52752685546875, 0.5577850341796875, 0.588043212890625, 0.6183013916015625, 0.6485595703125, 0.6788177490234375, 0.709075927734375, 0.7393341064453125, 0.76959228515625, 0.7998504638671875, 0.830108642578125, 0.8603668212890625, 0.890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 12.0, 16.0, 22.0, 35.0, 34.0, 60.0, 70.0, 105.0, 157.0, 208.0, 330.0, 503.0, 932.0, 1827.0, 4932.0, 21657.0, 181740.0, 717725.0, 97391.0, 13417.0, 3601.0, 1528.0, 786.0, 457.0, 301.0, 196.0, 137.0, 105.0, 65.0, 44.0, 35.0, 34.0, 29.0, 9.0, 12.0, 6.0, 10.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5, -2.40863037109375, -2.3172607421875, -2.22589111328125, -2.134521484375, -2.04315185546875, -1.9517822265625, -1.86041259765625, -1.76904296875, -1.67767333984375, -1.5863037109375, -1.49493408203125, -1.403564453125, -1.31219482421875, -1.2208251953125, -1.12945556640625, -1.0380859375, -0.94671630859375, -0.8553466796875, -0.76397705078125, -0.672607421875, -0.58123779296875, -0.4898681640625, -0.39849853515625, -0.30712890625, -0.21575927734375, -0.1243896484375, -0.03302001953125, 0.058349609375, 0.14971923828125, 0.2410888671875, 0.33245849609375, 0.423828125, 0.51519775390625, 0.6065673828125, 0.69793701171875, 0.789306640625, 0.88067626953125, 0.9720458984375, 1.06341552734375, 1.15478515625, 1.24615478515625, 1.3375244140625, 1.42889404296875, 1.520263671875, 1.61163330078125, 1.7030029296875, 1.79437255859375, 1.8857421875, 1.97711181640625, 2.0684814453125, 2.15985107421875, 2.251220703125, 2.34259033203125, 2.4339599609375, 2.52532958984375, 2.61669921875, 2.70806884765625, 2.7994384765625, 2.89080810546875, 2.982177734375, 3.07354736328125, 3.1649169921875, 3.25628662109375, 3.34765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 15.0, 18.0, 17.0, 24.0, 14.0, 21.0, 35.0, 24.0, 33.0, 37.0, 44.0, 38.0, 49.0, 55.0, 59.0, 41.0, 55.0, 54.0, 44.0, 43.0, 41.0, 35.0, 34.0, 31.0, 16.0, 19.0, 21.0, 16.0, 8.0, 8.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.828399658203125, -2.72711181640625, -2.625823974609375, -2.5245361328125, -2.423248291015625, -2.32196044921875, -2.220672607421875, -2.119384765625, -2.018096923828125, -1.91680908203125, -1.815521240234375, -1.7142333984375, -1.612945556640625, -1.51165771484375, -1.410369873046875, -1.30908203125, -1.207794189453125, -1.10650634765625, -1.005218505859375, -0.9039306640625, -0.802642822265625, -0.70135498046875, -0.600067138671875, -0.498779296875, -0.397491455078125, -0.29620361328125, -0.194915771484375, -0.0936279296875, 0.007659912109375, 0.10894775390625, 0.210235595703125, 0.3115234375, 0.412811279296875, 0.51409912109375, 0.615386962890625, 0.7166748046875, 0.817962646484375, 0.91925048828125, 1.020538330078125, 1.121826171875, 1.223114013671875, 1.32440185546875, 1.425689697265625, 1.5269775390625, 1.628265380859375, 1.72955322265625, 1.830841064453125, 1.93212890625, 2.033416748046875, 2.13470458984375, 2.235992431640625, 2.3372802734375, 2.438568115234375, 2.53985595703125, 2.641143798828125, 2.742431640625, 2.843719482421875, 2.94500732421875, 3.046295166015625, 3.1475830078125, 3.248870849609375, 3.35015869140625, 3.451446533203125, 3.552734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 6.0, 16.0, 17.0, 32.0, 36.0, 84.0, 135.0, 308.0, 809.0, 2632.0, 13474.0, 122817.0, 780671.0, 110924.0, 12663.0, 2516.0, 748.0, 330.0, 127.0, 84.0, 40.0, 19.0, 21.0, 18.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.989013671875, -0.95947265625, -0.929931640625, -0.900390625, -0.870849609375, -0.84130859375, -0.811767578125, -0.7822265625, -0.752685546875, -0.72314453125, -0.693603515625, -0.6640625, -0.634521484375, -0.60498046875, -0.575439453125, -0.5458984375, -0.516357421875, -0.48681640625, -0.457275390625, -0.427734375, -0.398193359375, -0.36865234375, -0.339111328125, -0.3095703125, -0.280029296875, -0.25048828125, -0.220947265625, -0.19140625, -0.161865234375, -0.13232421875, -0.102783203125, -0.0732421875, -0.043701171875, -0.01416015625, 0.015380859375, 0.044921875, 0.074462890625, 0.10400390625, 0.133544921875, 0.1630859375, 0.192626953125, 0.22216796875, 0.251708984375, 0.28125, 0.310791015625, 0.34033203125, 0.369873046875, 0.3994140625, 0.428955078125, 0.45849609375, 0.488037109375, 0.517578125, 0.547119140625, 0.57666015625, 0.606201171875, 0.6357421875, 0.665283203125, 0.69482421875, 0.724365234375, 0.75390625, 0.783447265625, 0.81298828125, 0.842529296875, 0.8720703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 10.0, 9.0, 11.0, 8.0, 19.0, 31.0, 32.0, 35.0, 69.0, 98.0, 117.0, 120.0, 114.0, 86.0, 87.0, 44.0, 29.0, 25.0, 13.0, 12.0, 9.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021505355834960938, -0.0002069510519504547, -0.00019884854555130005, -0.00019074603915214539, -0.00018264353275299072, -0.00017454102635383606, -0.0001664385199546814, -0.00015833601355552673, -0.00015023350715637207, -0.0001421310007572174, -0.00013402849435806274, -0.00012592598795890808, -0.00011782348155975342, -0.00010972097516059875, -0.00010161846876144409, -9.351596236228943e-05, -8.541345596313477e-05, -7.73109495639801e-05, -6.920844316482544e-05, -6.110593676567078e-05, -5.300343036651611e-05, -4.490092396736145e-05, -3.679841756820679e-05, -2.8695911169052124e-05, -2.059340476989746e-05, -1.2490898370742798e-05, -4.388391971588135e-06, 3.7141144275665283e-06, 1.1816620826721191e-05, 1.9919127225875854e-05, 2.8021633625030518e-05, 3.612414002418518e-05, 4.4226646423339844e-05, 5.232915282249451e-05, 6.043165922164917e-05, 6.853416562080383e-05, 7.66366720199585e-05, 8.473917841911316e-05, 9.284168481826782e-05, 0.00010094419121742249, 0.00010904669761657715, 0.00011714920401573181, 0.00012525171041488647, 0.00013335421681404114, 0.0001414567232131958, 0.00014955922961235046, 0.00015766173601150513, 0.0001657642424106598, 0.00017386674880981445, 0.00018196925520896912, 0.00019007176160812378, 0.00019817426800727844, 0.0002062767744064331, 0.00021437928080558777, 0.00022248178720474243, 0.0002305842936038971, 0.00023868680000305176, 0.0002467893064022064, 0.0002548918128013611, 0.00026299431920051575, 0.0002710968255996704, 0.0002791993319988251, 0.00028730183839797974, 0.0002954043447971344, 0.00030350685119628906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 8.0, 10.0, 14.0, 20.0, 23.0, 48.0, 81.0, 162.0, 325.0, 645.0, 1574.0, 5123.0, 28776.0, 324271.0, 632019.0, 45118.0, 6863.0, 1929.0, 775.0, 356.0, 193.0, 81.0, 62.0, 33.0, 15.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73046875, -0.7035140991210938, -0.6765594482421875, -0.6496047973632812, -0.622650146484375, -0.5956954956054688, -0.5687408447265625, -0.5417861938476562, -0.51483154296875, -0.48787689208984375, -0.4609222412109375, -0.43396759033203125, -0.407012939453125, -0.38005828857421875, -0.3531036376953125, -0.32614898681640625, -0.2991943359375, -0.27223968505859375, -0.2452850341796875, -0.21833038330078125, -0.191375732421875, -0.16442108154296875, -0.1374664306640625, -0.11051177978515625, -0.08355712890625, -0.05660247802734375, -0.0296478271484375, -0.00269317626953125, 0.024261474609375, 0.05121612548828125, 0.0781707763671875, 0.10512542724609375, 0.132080078125, 0.15903472900390625, 0.1859893798828125, 0.21294403076171875, 0.239898681640625, 0.26685333251953125, 0.2938079833984375, 0.32076263427734375, 0.34771728515625, 0.37467193603515625, 0.4016265869140625, 0.42858123779296875, 0.455535888671875, 0.48249053955078125, 0.5094451904296875, 0.5363998413085938, 0.5633544921875, 0.5903091430664062, 0.6172637939453125, 0.6442184448242188, 0.671173095703125, 0.6981277465820312, 0.7250823974609375, 0.7520370483398438, 0.77899169921875, 0.8059463500976562, 0.8329010009765625, 0.8598556518554688, 0.886810302734375, 0.9137649536132812, 0.9407196044921875, 0.9676742553710938, 0.99462890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 21.0, 30.0, 34.0, 37.0, 52.0, 56.0, 80.0, 91.0, 87.0, 91.0, 93.0, 77.0, 56.0, 57.0, 43.0, 18.0, 17.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.40940093994140625, -0.3847198486328125, -0.36003875732421875, -0.335357666015625, -0.31067657470703125, -0.2859954833984375, -0.26131439208984375, -0.23663330078125, -0.21195220947265625, -0.1872711181640625, -0.16259002685546875, -0.137908935546875, -0.11322784423828125, -0.0885467529296875, -0.06386566162109375, -0.0391845703125, -0.01450347900390625, 0.0101776123046875, 0.03485870361328125, 0.059539794921875, 0.08422088623046875, 0.1089019775390625, 0.13358306884765625, 0.15826416015625, 0.18294525146484375, 0.2076263427734375, 0.23230743408203125, 0.256988525390625, 0.28166961669921875, 0.3063507080078125, 0.33103179931640625, 0.355712890625, 0.38039398193359375, 0.4050750732421875, 0.42975616455078125, 0.454437255859375, 0.47911834716796875, 0.5037994384765625, 0.5284805297851562, 0.55316162109375, 0.5778427124023438, 0.6025238037109375, 0.6272048950195312, 0.651885986328125, 0.6765670776367188, 0.7012481689453125, 0.7259292602539062, 0.7506103515625, 0.7752914428710938, 0.7999725341796875, 0.8246536254882812, 0.849334716796875, 0.8740158081054688, 0.8986968994140625, 0.9233779907226562, 0.94805908203125, 0.9727401733398438, 0.9974212646484375, 1.0221023559570312, 1.046783447265625, 1.0714645385742188, 1.0961456298828125, 1.1208267211914062, 1.1455078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 13.0, 21.0, 43.0, 82.0, 117.0, 259.0, 204.0, 113.0, 63.0, 33.0, 13.0, 15.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.277312278747559, -12.66807746887207, -12.058841705322266, -11.449606895446777, -10.840372085571289, -10.231136322021484, -9.621901512145996, -9.012666702270508, -8.403430938720703, -7.794195652008057, -7.18496036529541, -6.575725555419922, -5.966490268707275, -5.357254981994629, -4.748020172119141, -4.138784885406494, -3.5295495986938477, -2.920314311981201, -2.311079263687134, -1.7018440961837769, -1.09260892868042, -0.48337364196777344, 0.12586140632629395, 0.7350964546203613, 1.3443317413330078, 1.9535669088363647, 2.5628020763397217, 3.172037124633789, 3.7812724113464355, 4.390507698059082, 4.99974250793457, 5.608977794647217, 6.21821403503418, 6.827449321746826, 7.436684608459473, 8.045919418334961, 8.655155181884766, 9.264389991760254, 9.873624801635742, 10.482860565185547, 11.092095375061035, 11.701330184936523, 12.310565948486328, 12.919800758361816, 13.529035568237305, 14.13827133178711, 14.747506141662598, 15.356740951538086, 15.96597671508789, 16.575212478637695, 17.184446334838867, 17.793682098388672, 18.402917861938477, 19.01215362548828, 19.621387481689453, 20.230623245239258, 20.839859008789062, 21.449094772338867, 22.05832862854004, 22.667564392089844, 23.27680015563965, 23.886035919189453, 24.495269775390625, 25.10450553894043, 25.7137393951416]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 9.0, 12.0, 18.0, 10.0, 10.0, 13.0, 22.0, 26.0, 29.0, 41.0, 34.0, 29.0, 34.0, 71.0, 79.0, 85.0, 70.0, 55.0, 44.0, 37.0, 36.0, 33.0, 28.0, 26.0, 13.0, 22.0, 17.0, 9.0, 11.0, 11.0, 5.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.883549690246582, -13.452656745910645, -13.02176284790039, -12.590869903564453, -12.159976959228516, -11.729084014892578, -11.29819107055664, -10.867297172546387, -10.43640422821045, -10.005511283874512, -9.574617385864258, -9.14372444152832, -8.712831497192383, -8.281938552856445, -7.85104513168335, -7.420151710510254, -6.989258766174316, -6.558365821838379, -6.127472400665283, -5.6965789794921875, -5.26568603515625, -4.8347930908203125, -4.403899669647217, -3.9730064868927, -3.5421133041381836, -3.111220121383667, -2.6803269386291504, -2.249433755874634, -1.8185405731201172, -1.3876473903656006, -0.956754207611084, -0.5258610248565674, -0.09496688842773438, 0.3359262943267822, 0.7668194770812988, 1.1977126598358154, 1.628605842590332, 2.0594990253448486, 2.4903922080993652, 2.921285390853882, 3.3521785736083984, 3.783071756362915, 4.213964939117432, 4.644858360290527, 5.075751304626465, 5.506644248962402, 5.937537670135498, 6.368431091308594, 6.799324035644531, 7.230216979980469, 7.6611104011535645, 8.09200382232666, 8.522896766662598, 8.953789710998535, 9.384683609008789, 9.815576553344727, 10.246469497680664, 10.677362442016602, 11.108255386352539, 11.539149284362793, 11.97004222869873, 12.400935173034668, 12.831829071044922, 13.26272201538086, 13.693614959716797]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 14.0, 13.0, 19.0, 43.0, 58.0, 95.0, 187.0, 385.0, 889.0, 2632.0, 9492.0, 55217.0, 630481.0, 2895416.0, 534025.0, 51102.0, 9878.0, 2646.0, 893.0, 378.0, 179.0, 81.0, 50.0, 39.0, 21.0, 18.0, 9.0, 6.0, 1.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.3904876708984375, -1.351287841796875, -1.3120880126953125, -1.27288818359375, -1.2336883544921875, -1.194488525390625, -1.1552886962890625, -1.1160888671875, -1.0768890380859375, -1.037689208984375, -0.9984893798828125, -0.95928955078125, -0.9200897216796875, -0.880889892578125, -0.8416900634765625, -0.802490234375, -0.7632904052734375, -0.724090576171875, -0.6848907470703125, -0.64569091796875, -0.6064910888671875, -0.567291259765625, -0.5280914306640625, -0.4888916015625, -0.4496917724609375, -0.410491943359375, -0.3712921142578125, -0.33209228515625, -0.2928924560546875, -0.253692626953125, -0.2144927978515625, -0.17529296875, -0.1360931396484375, -0.096893310546875, -0.0576934814453125, -0.01849365234375, 0.0207061767578125, 0.059906005859375, 0.0991058349609375, 0.1383056640625, 0.1775054931640625, 0.216705322265625, 0.2559051513671875, 0.29510498046875, 0.3343048095703125, 0.373504638671875, 0.4127044677734375, 0.451904296875, 0.4911041259765625, 0.530303955078125, 0.5695037841796875, 0.60870361328125, 0.6479034423828125, 0.687103271484375, 0.7263031005859375, 0.7655029296875, 0.8047027587890625, 0.843902587890625, 0.8831024169921875, 0.92230224609375, 0.9615020751953125, 1.000701904296875, 1.0399017333984375, 1.0791015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 20.0, 15.0, 30.0, 31.0, 36.0, 43.0, 44.0, 66.0, 51.0, 71.0, 58.0, 55.0, 52.0, 61.0, 46.0, 40.0, 38.0, 42.0, 41.0, 24.0, 33.0, 13.0, 14.0, 12.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.06640625, -1.0360107421875, -1.005615234375, -0.9752197265625, -0.94482421875, -0.9144287109375, -0.884033203125, -0.8536376953125, -0.8232421875, -0.7928466796875, -0.762451171875, -0.7320556640625, -0.70166015625, -0.6712646484375, -0.640869140625, -0.6104736328125, -0.580078125, -0.5496826171875, -0.519287109375, -0.4888916015625, -0.45849609375, -0.4281005859375, -0.397705078125, -0.3673095703125, -0.3369140625, -0.3065185546875, -0.276123046875, -0.2457275390625, -0.21533203125, -0.1849365234375, -0.154541015625, -0.1241455078125, -0.09375, -0.0633544921875, -0.032958984375, -0.0025634765625, 0.02783203125, 0.0582275390625, 0.088623046875, 0.1190185546875, 0.1494140625, 0.1798095703125, 0.210205078125, 0.2406005859375, 0.27099609375, 0.3013916015625, 0.331787109375, 0.3621826171875, 0.392578125, 0.4229736328125, 0.453369140625, 0.4837646484375, 0.51416015625, 0.5445556640625, 0.574951171875, 0.6053466796875, 0.6357421875, 0.6661376953125, 0.696533203125, 0.7269287109375, 0.75732421875, 0.7877197265625, 0.818115234375, 0.8485107421875, 0.87890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 3.0, 12.0, 15.0, 29.0, 37.0, 47.0, 102.0, 165.0, 246.0, 542.0, 1134.0, 2808.0, 9240.0, 43062.0, 521962.0, 3370967.0, 208960.0, 25516.0, 5862.0, 1859.0, 808.0, 377.0, 202.0, 112.0, 63.0, 41.0, 29.0, 16.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003265380859375, -1.549285888671875, -1.4982452392578125, -1.44720458984375, -1.3961639404296875, -1.345123291015625, -1.2940826416015625, -1.2430419921875, -1.1920013427734375, -1.140960693359375, -1.0899200439453125, -1.03887939453125, -0.9878387451171875, -0.936798095703125, -0.8857574462890625, -0.834716796875, -0.7836761474609375, -0.732635498046875, -0.6815948486328125, -0.63055419921875, -0.5795135498046875, -0.528472900390625, -0.4774322509765625, -0.4263916015625, -0.3753509521484375, -0.324310302734375, -0.2732696533203125, -0.22222900390625, -0.1711883544921875, -0.120147705078125, -0.0691070556640625, -0.01806640625, 0.0329742431640625, 0.084014892578125, 0.1350555419921875, 0.18609619140625, 0.2371368408203125, 0.288177490234375, 0.3392181396484375, 0.3902587890625, 0.4412994384765625, 0.492340087890625, 0.5433807373046875, 0.59442138671875, 0.6454620361328125, 0.696502685546875, 0.7475433349609375, 0.798583984375, 0.8496246337890625, 0.900665283203125, 0.9517059326171875, 1.00274658203125, 1.0537872314453125, 1.104827880859375, 1.1558685302734375, 1.2069091796875, 1.2579498291015625, 1.308990478515625, 1.3600311279296875, 1.41107177734375, 1.4621124267578125, 1.513153076171875, 1.5641937255859375, 1.615234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 10.0, 23.0, 24.0, 29.0, 46.0, 64.0, 117.0, 198.0, 271.0, 442.0, 570.0, 631.0, 502.0, 385.0, 247.0, 155.0, 90.0, 54.0, 44.0, 34.0, 17.0, 14.0, 14.0, 9.0, 6.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.2996063232421875, -1.253509521484375, -1.2074127197265625, -1.16131591796875, -1.1152191162109375, -1.069122314453125, -1.0230255126953125, -0.9769287109375, -0.9308319091796875, -0.884735107421875, -0.8386383056640625, -0.79254150390625, -0.7464447021484375, -0.700347900390625, -0.6542510986328125, -0.608154296875, -0.5620574951171875, -0.515960693359375, -0.4698638916015625, -0.42376708984375, -0.3776702880859375, -0.331573486328125, -0.2854766845703125, -0.2393798828125, -0.1932830810546875, -0.147186279296875, -0.1010894775390625, -0.05499267578125, -0.0088958740234375, 0.037200927734375, 0.0832977294921875, 0.12939453125, 0.1754913330078125, 0.221588134765625, 0.2676849365234375, 0.31378173828125, 0.3598785400390625, 0.405975341796875, 0.4520721435546875, 0.4981689453125, 0.5442657470703125, 0.590362548828125, 0.6364593505859375, 0.68255615234375, 0.7286529541015625, 0.774749755859375, 0.8208465576171875, 0.866943359375, 0.9130401611328125, 0.959136962890625, 1.0052337646484375, 1.05133056640625, 1.0974273681640625, 1.143524169921875, 1.1896209716796875, 1.2357177734375, 1.2818145751953125, 1.327911376953125, 1.3740081787109375, 1.42010498046875, 1.4662017822265625, 1.512298583984375, 1.5583953857421875, 1.6044921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 23.0, 61.0, 427.0, 396.0, 64.0, 16.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.95310592651367, -48.634666442871094, -47.31623077392578, -45.9977912902832, -44.679351806640625, -43.36091613769531, -42.042476654052734, -40.724037170410156, -39.405601501464844, -38.087162017822266, -36.76872634887695, -35.450286865234375, -34.13185119628906, -32.813411712646484, -31.494972229003906, -30.17653465270996, -28.858097076416016, -27.53965950012207, -26.221221923828125, -24.902782440185547, -23.5843448638916, -22.265907287597656, -20.947467803955078, -19.629030227661133, -18.310592651367188, -16.992155075073242, -15.67371654510498, -14.355278015136719, -13.036840438842773, -11.718402862548828, -10.399964332580566, -9.081525802612305, -7.763092041015625, -6.4446539878845215, -5.126215934753418, -3.8077778816223145, -2.489339828491211, -1.1709017753601074, 0.1475362777709961, 1.4659748077392578, 2.784412384033203, 4.102850437164307, 5.42128849029541, 6.739726543426514, 8.058164596557617, 9.376602172851562, 10.695040702819824, 12.013479232788086, 13.331916809082031, 14.650354385375977, 15.968792915344238, 17.2872314453125, 18.605669021606445, 19.92410659790039, 21.24254608154297, 22.560983657836914, 23.87942123413086, 25.197858810424805, 26.51629638671875, 27.834735870361328, 29.153173446655273, 30.47161102294922, 31.790050506591797, 33.108489990234375, 34.42692565917969]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 14.0, 13.0, 9.0, 16.0, 27.0, 17.0, 18.0, 36.0, 28.0, 44.0, 52.0, 58.0, 48.0, 59.0, 60.0, 60.0, 44.0, 57.0, 36.0, 53.0, 31.0, 35.0, 32.0, 32.0, 22.0, 23.0, 16.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.923690795898438, -10.651545524597168, -10.379400253295898, -10.107254981994629, -9.83510971069336, -9.56296443939209, -9.29081916809082, -9.018672943115234, -8.746528625488281, -8.474383354187012, -8.202238082885742, -7.930092811584473, -7.657947540283203, -7.385802268981934, -7.113656520843506, -6.841511249542236, -6.569365501403809, -6.297220230102539, -6.0250749588012695, -5.7529296875, -5.4807844161987305, -5.208639144897461, -4.936493396759033, -4.664348125457764, -4.392202854156494, -4.120057582855225, -3.847912311553955, -3.5757668018341064, -3.303621530532837, -3.0314762592315674, -2.7593307495117188, -2.487185478210449, -2.215041160583496, -1.9428958892822266, -1.6707504987716675, -1.3986051082611084, -1.1264598369598389, -0.8543145656585693, -0.5821691751480103, -0.31002378463745117, -0.03787851333618164, 0.23426681756973267, 0.506412148475647, 0.7785574793815613, 1.0507028102874756, 1.3228480815887451, 1.5949934720993042, 1.8671388626098633, 2.139284133911133, 2.4114294052124023, 2.683574676513672, 2.9557201862335205, 3.22786545753479, 3.5000107288360596, 3.772156238555908, 4.044301509857178, 4.316446781158447, 4.588592052459717, 4.860737323760986, 5.132882595062256, 5.405028343200684, 5.677173614501953, 5.949318885803223, 6.221464157104492, 6.493609428405762]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 26.0, 28.0, 49.0, 96.0, 124.0, 209.0, 370.0, 533.0, 935.0, 1696.0, 2816.0, 5194.0, 9801.0, 19132.0, 38872.0, 79475.0, 155023.0, 235557.0, 224028.0, 136496.0, 68695.0, 33501.0, 16688.0, 8562.0, 4529.0, 2497.0, 1395.0, 868.0, 512.0, 299.0, 184.0, 130.0, 82.0, 45.0, 27.0, 23.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8707427978515625, -0.842559814453125, -0.8143768310546875, -0.78619384765625, -0.7580108642578125, -0.729827880859375, -0.7016448974609375, -0.6734619140625, -0.6452789306640625, -0.617095947265625, -0.5889129638671875, -0.56072998046875, -0.5325469970703125, -0.504364013671875, -0.4761810302734375, -0.447998046875, -0.4198150634765625, -0.391632080078125, -0.3634490966796875, -0.33526611328125, -0.3070831298828125, -0.278900146484375, -0.2507171630859375, -0.2225341796875, -0.1943511962890625, -0.166168212890625, -0.1379852294921875, -0.10980224609375, -0.0816192626953125, -0.053436279296875, -0.0252532958984375, 0.0029296875, 0.0311126708984375, 0.059295654296875, 0.0874786376953125, 0.11566162109375, 0.1438446044921875, 0.172027587890625, 0.2002105712890625, 0.2283935546875, 0.2565765380859375, 0.284759521484375, 0.3129425048828125, 0.34112548828125, 0.3693084716796875, 0.397491455078125, 0.4256744384765625, 0.453857421875, 0.4820404052734375, 0.510223388671875, 0.5384063720703125, 0.56658935546875, 0.5947723388671875, 0.622955322265625, 0.6511383056640625, 0.6793212890625, 0.7075042724609375, 0.735687255859375, 0.7638702392578125, 0.79205322265625, 0.8202362060546875, 0.848419189453125, 0.8766021728515625, 0.90478515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 10.0, 11.0, 20.0, 23.0, 29.0, 25.0, 36.0, 35.0, 39.0, 63.0, 51.0, 50.0, 62.0, 59.0, 61.0, 55.0, 39.0, 39.0, 49.0, 37.0, 24.0, 28.0, 34.0, 13.0, 20.0, 21.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.013671875, -0.984344482421875, -0.95501708984375, -0.925689697265625, -0.8963623046875, -0.867034912109375, -0.83770751953125, -0.808380126953125, -0.779052734375, -0.749725341796875, -0.72039794921875, -0.691070556640625, -0.6617431640625, -0.632415771484375, -0.60308837890625, -0.573760986328125, -0.54443359375, -0.515106201171875, -0.48577880859375, -0.456451416015625, -0.4271240234375, -0.397796630859375, -0.36846923828125, -0.339141845703125, -0.309814453125, -0.280487060546875, -0.25115966796875, -0.221832275390625, -0.1925048828125, -0.163177490234375, -0.13385009765625, -0.104522705078125, -0.0751953125, -0.045867919921875, -0.01654052734375, 0.012786865234375, 0.0421142578125, 0.071441650390625, 0.10076904296875, 0.130096435546875, 0.159423828125, 0.188751220703125, 0.21807861328125, 0.247406005859375, 0.2767333984375, 0.306060791015625, 0.33538818359375, 0.364715576171875, 0.39404296875, 0.423370361328125, 0.45269775390625, 0.482025146484375, 0.5113525390625, 0.540679931640625, 0.57000732421875, 0.599334716796875, 0.628662109375, 0.657989501953125, 0.68731689453125, 0.716644287109375, 0.7459716796875, 0.775299072265625, 0.80462646484375, 0.833953857421875, 0.86328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 10.0, 9.0, 18.0, 16.0, 39.0, 38.0, 58.0, 75.0, 128.0, 217.0, 428.0, 1083.0, 3454.0, 15112.0, 89748.0, 626788.0, 259822.0, 40284.0, 7592.0, 2001.0, 743.0, 338.0, 184.0, 95.0, 86.0, 57.0, 35.0, 22.0, 15.0, 15.0, 14.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.257110595703125, -2.18609619140625, -2.115081787109375, -2.0440673828125, -1.973052978515625, -1.90203857421875, -1.831024169921875, -1.760009765625, -1.688995361328125, -1.61798095703125, -1.546966552734375, -1.4759521484375, -1.404937744140625, -1.33392333984375, -1.262908935546875, -1.19189453125, -1.120880126953125, -1.04986572265625, -0.978851318359375, -0.9078369140625, -0.836822509765625, -0.76580810546875, -0.694793701171875, -0.623779296875, -0.552764892578125, -0.48175048828125, -0.410736083984375, -0.3397216796875, -0.268707275390625, -0.19769287109375, -0.126678466796875, -0.0556640625, 0.015350341796875, 0.08636474609375, 0.157379150390625, 0.2283935546875, 0.299407958984375, 0.37042236328125, 0.441436767578125, 0.512451171875, 0.583465576171875, 0.65447998046875, 0.725494384765625, 0.7965087890625, 0.867523193359375, 0.93853759765625, 1.009552001953125, 1.08056640625, 1.151580810546875, 1.22259521484375, 1.293609619140625, 1.3646240234375, 1.435638427734375, 1.50665283203125, 1.577667236328125, 1.648681640625, 1.719696044921875, 1.79071044921875, 1.861724853515625, 1.9327392578125, 2.003753662109375, 2.07476806640625, 2.145782470703125, 2.216796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 12.0, 13.0, 18.0, 20.0, 15.0, 25.0, 25.0, 34.0, 41.0, 32.0, 41.0, 55.0, 45.0, 54.0, 52.0, 60.0, 51.0, 49.0, 36.0, 43.0, 35.0, 39.0, 32.0, 19.0, 25.0, 22.0, 21.0, 12.0, 12.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0390625, -2.94879150390625, -2.8585205078125, -2.76824951171875, -2.677978515625, -2.58770751953125, -2.4974365234375, -2.40716552734375, -2.31689453125, -2.22662353515625, -2.1363525390625, -2.04608154296875, -1.955810546875, -1.86553955078125, -1.7752685546875, -1.68499755859375, -1.5947265625, -1.50445556640625, -1.4141845703125, -1.32391357421875, -1.233642578125, -1.14337158203125, -1.0531005859375, -0.96282958984375, -0.87255859375, -0.78228759765625, -0.6920166015625, -0.60174560546875, -0.511474609375, -0.42120361328125, -0.3309326171875, -0.24066162109375, -0.150390625, -0.06011962890625, 0.0301513671875, 0.12042236328125, 0.210693359375, 0.30096435546875, 0.3912353515625, 0.48150634765625, 0.57177734375, 0.66204833984375, 0.7523193359375, 0.84259033203125, 0.932861328125, 1.02313232421875, 1.1134033203125, 1.20367431640625, 1.2939453125, 1.38421630859375, 1.4744873046875, 1.56475830078125, 1.655029296875, 1.74530029296875, 1.8355712890625, 1.92584228515625, 2.01611328125, 2.10638427734375, 2.1966552734375, 2.28692626953125, 2.377197265625, 2.46746826171875, 2.5577392578125, 2.64801025390625, 2.73828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 12.0, 23.0, 27.0, 33.0, 59.0, 115.0, 185.0, 365.0, 913.0, 2413.0, 7340.0, 27607.0, 130535.0, 620114.0, 201151.0, 42087.0, 10268.0, 3163.0, 1094.0, 495.0, 226.0, 120.0, 60.0, 44.0, 31.0, 15.0, 15.0, 4.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.557098388671875, -0.53948974609375, -0.521881103515625, -0.5042724609375, -0.486663818359375, -0.46905517578125, -0.451446533203125, -0.433837890625, -0.416229248046875, -0.39862060546875, -0.381011962890625, -0.3634033203125, -0.345794677734375, -0.32818603515625, -0.310577392578125, -0.29296875, -0.275360107421875, -0.25775146484375, -0.240142822265625, -0.2225341796875, -0.204925537109375, -0.18731689453125, -0.169708251953125, -0.152099609375, -0.134490966796875, -0.11688232421875, -0.099273681640625, -0.0816650390625, -0.064056396484375, -0.04644775390625, -0.028839111328125, -0.01123046875, 0.006378173828125, 0.02398681640625, 0.041595458984375, 0.0592041015625, 0.076812744140625, 0.09442138671875, 0.112030029296875, 0.129638671875, 0.147247314453125, 0.16485595703125, 0.182464599609375, 0.2000732421875, 0.217681884765625, 0.23529052734375, 0.252899169921875, 0.2705078125, 0.288116455078125, 0.30572509765625, 0.323333740234375, 0.3409423828125, 0.358551025390625, 0.37615966796875, 0.393768310546875, 0.411376953125, 0.428985595703125, 0.44659423828125, 0.464202880859375, 0.4818115234375, 0.499420166015625, 0.51702880859375, 0.534637451171875, 0.55224609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 10.0, 10.0, 10.0, 11.0, 23.0, 31.0, 35.0, 50.0, 65.0, 61.0, 82.0, 81.0, 95.0, 94.0, 78.0, 52.0, 42.0, 31.0, 24.0, 24.0, 20.0, 13.0, 10.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017845630645751953, -0.0001732315868139267, -0.00016800686717033386, -0.00016278214752674103, -0.0001575574278831482, -0.00015233270823955536, -0.00014710798859596252, -0.0001418832689523697, -0.00013665854930877686, -0.00013143382966518402, -0.0001262091100215912, -0.00012098439037799835, -0.00011575967073440552, -0.00011053495109081268, -0.00010531023144721985, -0.00010008551180362701, -9.486079216003418e-05, -8.963607251644135e-05, -8.441135287284851e-05, -7.918663322925568e-05, -7.396191358566284e-05, -6.873719394207001e-05, -6.351247429847717e-05, -5.828775465488434e-05, -5.3063035011291504e-05, -4.783831536769867e-05, -4.2613595724105835e-05, -3.7388876080513e-05, -3.2164156436920166e-05, -2.693943679332733e-05, -2.1714717149734497e-05, -1.6489997506141663e-05, -1.1265277862548828e-05, -6.040558218955994e-06, -8.158385753631592e-07, 4.408881068229675e-06, 9.63360071182251e-06, 1.4858320355415344e-05, 2.008303999900818e-05, 2.5307759642601013e-05, 3.053247928619385e-05, 3.575719892978668e-05, 4.0981918573379517e-05, 4.620663821697235e-05, 5.1431357860565186e-05, 5.665607750415802e-05, 6.188079714775085e-05, 6.710551679134369e-05, 7.233023643493652e-05, 7.755495607852936e-05, 8.277967572212219e-05, 8.800439536571503e-05, 9.322911500930786e-05, 9.84538346529007e-05, 0.00010367855429649353, 0.00010890327394008636, 0.0001141279935836792, 0.00011935271322727203, 0.00012457743287086487, 0.0001298021525144577, 0.00013502687215805054, 0.00014025159180164337, 0.0001454763114452362, 0.00015070103108882904, 0.00015592575073242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 17.0, 25.0, 15.0, 63.0, 104.0, 184.0, 418.0, 1155.0, 3856.0, 19141.0, 149111.0, 718847.0, 132845.0, 17342.0, 3495.0, 1074.0, 408.0, 201.0, 74.0, 62.0, 30.0, 23.0, 15.0, 10.0, 6.0, 10.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5849838256835938, -0.5610809326171875, -0.5371780395507812, -0.513275146484375, -0.48937225341796875, -0.4654693603515625, -0.44156646728515625, -0.41766357421875, -0.39376068115234375, -0.3698577880859375, -0.34595489501953125, -0.322052001953125, -0.29814910888671875, -0.2742462158203125, -0.25034332275390625, -0.2264404296875, -0.20253753662109375, -0.1786346435546875, -0.15473175048828125, -0.130828857421875, -0.10692596435546875, -0.0830230712890625, -0.05912017822265625, -0.03521728515625, -0.01131439208984375, 0.0125885009765625, 0.03649139404296875, 0.060394287109375, 0.08429718017578125, 0.1082000732421875, 0.13210296630859375, 0.156005859375, 0.17990875244140625, 0.2038116455078125, 0.22771453857421875, 0.251617431640625, 0.27552032470703125, 0.2994232177734375, 0.32332611083984375, 0.34722900390625, 0.37113189697265625, 0.3950347900390625, 0.41893768310546875, 0.442840576171875, 0.46674346923828125, 0.4906463623046875, 0.5145492553710938, 0.5384521484375, 0.5623550415039062, 0.5862579345703125, 0.6101608276367188, 0.634063720703125, 0.6579666137695312, 0.6818695068359375, 0.7057723999023438, 0.72967529296875, 0.7535781860351562, 0.7774810791015625, 0.8013839721679688, 0.825286865234375, 0.8491897583007812, 0.8730926513671875, 0.8969955444335938, 0.9208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 12.0, 11.0, 10.0, 12.0, 19.0, 24.0, 23.0, 29.0, 38.0, 57.0, 55.0, 59.0, 71.0, 71.0, 67.0, 82.0, 46.0, 50.0, 62.0, 47.0, 34.0, 17.0, 20.0, 19.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.46233367919921875, -0.4446868896484375, -0.42704010009765625, -0.409393310546875, -0.39174652099609375, -0.3740997314453125, -0.35645294189453125, -0.33880615234375, -0.32115936279296875, -0.3035125732421875, -0.28586578369140625, -0.268218994140625, -0.25057220458984375, -0.2329254150390625, -0.21527862548828125, -0.1976318359375, -0.17998504638671875, -0.1623382568359375, -0.14469146728515625, -0.127044677734375, -0.10939788818359375, -0.0917510986328125, -0.07410430908203125, -0.05645751953125, -0.03881072998046875, -0.0211639404296875, -0.00351715087890625, 0.014129638671875, 0.03177642822265625, 0.0494232177734375, 0.06707000732421875, 0.084716796875, 0.10236358642578125, 0.1200103759765625, 0.13765716552734375, 0.155303955078125, 0.17295074462890625, 0.1905975341796875, 0.20824432373046875, 0.22589111328125, 0.24353790283203125, 0.2611846923828125, 0.27883148193359375, 0.296478271484375, 0.31412506103515625, 0.3317718505859375, 0.34941864013671875, 0.3670654296875, 0.38471221923828125, 0.4023590087890625, 0.42000579833984375, 0.437652587890625, 0.45529937744140625, 0.4729461669921875, 0.49059295654296875, 0.50823974609375, 0.5258865356445312, 0.5435333251953125, 0.5611801147460938, 0.578826904296875, 0.5964736938476562, 0.6141204833984375, 0.6317672729492188, 0.6494140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 4.0, 6.0, 23.0, 29.0, 82.0, 152.0, 238.0, 221.0, 123.0, 57.0, 20.0, 11.0, 5.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.959287643432617, -25.39434242248535, -24.829397201538086, -24.26445198059082, -23.699506759643555, -23.13456153869629, -22.569616317749023, -22.004671096801758, -21.439725875854492, -20.874780654907227, -20.30983543395996, -19.744890213012695, -19.17994499206543, -18.614999771118164, -18.0500545501709, -17.485109329223633, -16.920166015625, -16.355220794677734, -15.790275573730469, -15.225330352783203, -14.660385131835938, -14.095439910888672, -13.530494689941406, -12.96554946899414, -12.400604248046875, -11.83565902709961, -11.270713806152344, -10.705768585205078, -10.140823364257812, -9.575878143310547, -9.010932922363281, -8.445987701416016, -7.881043434143066, -7.316098213195801, -6.751152992248535, -6.1862077713012695, -5.621262550354004, -5.056317329406738, -4.491372585296631, -3.9264273643493652, -3.3614821434020996, -2.796536922454834, -2.2315917015075684, -1.6666467189788818, -1.1017014980316162, -0.5367562770843506, 0.028188705444335938, 0.5931339263916016, 1.1580791473388672, 1.7230243682861328, 2.2879695892333984, 2.852914571762085, 3.4178597927093506, 3.982805013656616, 4.547749996185303, 5.112695217132568, 5.677640438079834, 6.2425856590271, 6.807530879974365, 7.372475624084473, 7.937420845031738, 8.502366065979004, 9.06731128692627, 9.632256507873535, 10.1972017288208]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 7.0, 4.0, 1.0, 5.0, 8.0, 9.0, 17.0, 11.0, 15.0, 19.0, 19.0, 13.0, 30.0, 23.0, 28.0, 35.0, 48.0, 50.0, 68.0, 65.0, 64.0, 65.0, 53.0, 31.0, 33.0, 34.0, 24.0, 31.0, 23.0, 21.0, 17.0, 23.0, 18.0, 16.0, 12.0, 14.0, 6.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.511778831481934, -9.186701774597168, -8.861624717712402, -8.536547660827637, -8.211470603942871, -7.8863935470581055, -7.561316013336182, -7.236238956451416, -6.91116189956665, -6.586084842681885, -6.261007785797119, -5.9359307289123535, -5.61085319519043, -5.285776138305664, -4.960699081420898, -4.635622024536133, -4.310544967651367, -3.9854679107666016, -3.660390853881836, -3.335313558578491, -3.0102365016937256, -2.68515944480896, -2.3600821495056152, -2.0350050926208496, -1.709928035736084, -1.3848509788513184, -1.0597738027572632, -0.7346966862678528, -0.4096195697784424, -0.08454251289367676, 0.24053466320037842, 0.5656118392944336, 0.8906879425048828, 1.2157649993896484, 1.5408421754837036, 1.8659193515777588, 2.1909964084625244, 2.51607346534729, 2.8411507606506348, 3.1662278175354004, 3.491304874420166, 3.8163819313049316, 4.141458988189697, 4.466536045074463, 4.791613578796387, 5.116690635681152, 5.441767692565918, 5.766844749450684, 6.091921806335449, 6.416998863220215, 6.7420759201049805, 7.067152976989746, 7.392230033874512, 7.717307090759277, 8.042384147644043, 8.367462158203125, 8.69253921508789, 9.017616271972656, 9.342693328857422, 9.667770385742188, 9.992847442626953, 10.317924499511719, 10.643001556396484, 10.96807861328125, 11.293155670166016]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 19.0, 24.0, 25.0, 53.0, 97.0, 135.0, 228.0, 447.0, 803.0, 1634.0, 3162.0, 7332.0, 19006.0, 53564.0, 170576.0, 543762.0, 1378455.0, 1297000.0, 485051.0, 152190.0, 48621.0, 17743.0, 7332.0, 3466.0, 1650.0, 801.0, 442.0, 272.0, 147.0, 77.0, 56.0, 31.0, 20.0, 19.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4883880615234375, -0.470916748046875, -0.4534454345703125, -0.43597412109375, -0.4185028076171875, -0.401031494140625, -0.3835601806640625, -0.3660888671875, -0.3486175537109375, -0.331146240234375, -0.3136749267578125, -0.29620361328125, -0.2787322998046875, -0.261260986328125, -0.2437896728515625, -0.226318359375, -0.2088470458984375, -0.191375732421875, -0.1739044189453125, -0.15643310546875, -0.1389617919921875, -0.121490478515625, -0.1040191650390625, -0.0865478515625, -0.0690765380859375, -0.051605224609375, -0.0341339111328125, -0.01666259765625, 0.0008087158203125, 0.018280029296875, 0.0357513427734375, 0.05322265625, 0.0706939697265625, 0.088165283203125, 0.1056365966796875, 0.12310791015625, 0.1405792236328125, 0.158050537109375, 0.1755218505859375, 0.1929931640625, 0.2104644775390625, 0.227935791015625, 0.2454071044921875, 0.26287841796875, 0.2803497314453125, 0.297821044921875, 0.3152923583984375, 0.332763671875, 0.3502349853515625, 0.367706298828125, 0.3851776123046875, 0.40264892578125, 0.4201202392578125, 0.437591552734375, 0.4550628662109375, 0.4725341796875, 0.4900054931640625, 0.507476806640625, 0.5249481201171875, 0.54241943359375, 0.5598907470703125, 0.577362060546875, 0.5948333740234375, 0.6123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 12.0, 9.0, 14.0, 17.0, 14.0, 20.0, 22.0, 28.0, 35.0, 37.0, 47.0, 46.0, 55.0, 45.0, 53.0, 52.0, 61.0, 52.0, 50.0, 40.0, 47.0, 34.0, 26.0, 33.0, 22.0, 27.0, 22.0, 14.0, 14.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.96484375, -0.9368820190429688, -0.9089202880859375, -0.8809585571289062, -0.852996826171875, -0.8250350952148438, -0.7970733642578125, -0.7691116333007812, -0.74114990234375, -0.7131881713867188, -0.6852264404296875, -0.6572647094726562, -0.629302978515625, -0.6013412475585938, -0.5733795166015625, -0.5454177856445312, -0.5174560546875, -0.48949432373046875, -0.4615325927734375, -0.43357086181640625, -0.405609130859375, -0.37764739990234375, -0.3496856689453125, -0.32172393798828125, -0.29376220703125, -0.26580047607421875, -0.2378387451171875, -0.20987701416015625, -0.181915283203125, -0.15395355224609375, -0.1259918212890625, -0.09803009033203125, -0.070068359375, -0.04210662841796875, -0.0141448974609375, 0.01381683349609375, 0.041778564453125, 0.06974029541015625, 0.0977020263671875, 0.12566375732421875, 0.15362548828125, 0.18158721923828125, 0.2095489501953125, 0.23751068115234375, 0.265472412109375, 0.29343414306640625, 0.3213958740234375, 0.34935760498046875, 0.3773193359375, 0.40528106689453125, 0.4332427978515625, 0.46120452880859375, 0.489166259765625, 0.5171279907226562, 0.5450897216796875, 0.5730514526367188, 0.60101318359375, 0.6289749145507812, 0.6569366455078125, 0.6848983764648438, 0.712860107421875, 0.7408218383789062, 0.7687835693359375, 0.7967453002929688, 0.82470703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 9.0, 19.0, 24.0, 23.0, 67.0, 121.0, 305.0, 893.0, 3611.0, 26262.0, 1118193.0, 2988474.0, 48750.0, 5562.0, 1213.0, 391.0, 142.0, 79.0, 44.0, 24.0, 16.0, 15.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.164459228515625, -2.09259033203125, -2.020721435546875, -1.9488525390625, -1.876983642578125, -1.80511474609375, -1.733245849609375, -1.661376953125, -1.589508056640625, -1.51763916015625, -1.445770263671875, -1.3739013671875, -1.302032470703125, -1.23016357421875, -1.158294677734375, -1.08642578125, -1.014556884765625, -0.94268798828125, -0.870819091796875, -0.7989501953125, -0.727081298828125, -0.65521240234375, -0.583343505859375, -0.511474609375, -0.439605712890625, -0.36773681640625, -0.295867919921875, -0.2239990234375, -0.152130126953125, -0.08026123046875, -0.008392333984375, 0.0634765625, 0.135345458984375, 0.20721435546875, 0.279083251953125, 0.3509521484375, 0.422821044921875, 0.49468994140625, 0.566558837890625, 0.638427734375, 0.710296630859375, 0.78216552734375, 0.854034423828125, 0.9259033203125, 0.997772216796875, 1.06964111328125, 1.141510009765625, 1.21337890625, 1.285247802734375, 1.35711669921875, 1.428985595703125, 1.5008544921875, 1.572723388671875, 1.64459228515625, 1.716461181640625, 1.788330078125, 1.860198974609375, 1.93206787109375, 2.003936767578125, 2.0758056640625, 2.147674560546875, 2.21954345703125, 2.291412353515625, 2.36328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 2.0, 6.0, 7.0, 17.0, 17.0, 29.0, 39.0, 64.0, 74.0, 116.0, 174.0, 272.0, 369.0, 480.0, 539.0, 497.0, 414.0, 277.0, 209.0, 134.0, 81.0, 62.0, 41.0, 30.0, 17.0, 18.0, 14.0, 6.0, 8.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.213226318359375, -1.17352294921875, -1.133819580078125, -1.0941162109375, -1.054412841796875, -1.01470947265625, -0.975006103515625, -0.935302734375, -0.895599365234375, -0.85589599609375, -0.816192626953125, -0.7764892578125, -0.736785888671875, -0.69708251953125, -0.657379150390625, -0.61767578125, -0.577972412109375, -0.53826904296875, -0.498565673828125, -0.4588623046875, -0.419158935546875, -0.37945556640625, -0.339752197265625, -0.300048828125, -0.260345458984375, -0.22064208984375, -0.180938720703125, -0.1412353515625, -0.101531982421875, -0.06182861328125, -0.022125244140625, 0.017578125, 0.057281494140625, 0.09698486328125, 0.136688232421875, 0.1763916015625, 0.216094970703125, 0.25579833984375, 0.295501708984375, 0.335205078125, 0.374908447265625, 0.41461181640625, 0.454315185546875, 0.4940185546875, 0.533721923828125, 0.57342529296875, 0.613128662109375, 0.65283203125, 0.692535400390625, 0.73223876953125, 0.771942138671875, 0.8116455078125, 0.851348876953125, 0.89105224609375, 0.930755615234375, 0.970458984375, 1.010162353515625, 1.04986572265625, 1.089569091796875, 1.1292724609375, 1.168975830078125, 1.20867919921875, 1.248382568359375, 1.2880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 13.0, 22.0, 33.0, 84.0, 125.0, 180.0, 187.0, 146.0, 86.0, 46.0, 22.0, 19.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.760187149047852, -10.333600997924805, -9.907015800476074, -9.480429649353027, -9.05384349822998, -8.62725830078125, -8.200672149658203, -7.774085998535156, -7.347500324249268, -6.920914649963379, -6.494328498840332, -6.067742824554443, -5.641157150268555, -5.214570999145508, -4.787985324859619, -4.3613996505737305, -3.9348134994506836, -3.508227586746216, -3.081641674041748, -2.6550559997558594, -2.2284700870513916, -1.8018841743469238, -1.3752985000610352, -0.9487125873565674, -0.5221266746520996, -0.09554082155227661, 0.3310450315475464, 0.7576308250427246, 1.1842167377471924, 1.6108026504516602, 2.037388324737549, 2.4639742374420166, 2.8905601501464844, 3.317146062850952, 3.74373197555542, 4.170317649841309, 4.5969038009643555, 5.023489475250244, 5.450075149536133, 5.87666130065918, 6.303246974945068, 6.729832649230957, 7.156418800354004, 7.583004474639893, 8.009590148925781, 8.436176300048828, 8.862762451171875, 9.289347648620605, 9.715933799743652, 10.1425199508667, 10.56910514831543, 10.995691299438477, 11.422277450561523, 11.84886360168457, 12.2754487991333, 12.702034950256348, 13.128620147705078, 13.555206298828125, 13.981791496276855, 14.408377647399902, 14.83496379852295, 15.26154899597168, 15.688135147094727, 16.114721298217773, 16.54130744934082]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 20.0, 11.0, 13.0, 15.0, 36.0, 21.0, 36.0, 39.0, 54.0, 47.0, 41.0, 45.0, 39.0, 54.0, 61.0, 36.0, 34.0, 50.0, 45.0, 42.0, 41.0, 26.0, 20.0, 33.0, 20.0, 15.0, 20.0, 12.0, 12.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.060419082641602, -5.824182987213135, -5.58794641494751, -5.351710319519043, -5.115473747253418, -4.879237651824951, -4.643001556396484, -4.406764984130859, -4.170528888702393, -3.9342925548553467, -3.698056221008301, -3.461820125579834, -3.225583791732788, -2.989347457885742, -2.7531113624572754, -2.5168750286102295, -2.2806386947631836, -2.0444023609161377, -1.8081661462783813, -1.571929931640625, -1.335693597793579, -1.0994572639465332, -0.8632210493087769, -0.6269848346710205, -0.3907485008239746, -0.1545122265815735, 0.08172404766082764, 0.31796032190322876, 0.5541965961456299, 0.7904329299926758, 1.0266691446304321, 1.2629053592681885, 1.4991416931152344, 1.7353780269622803, 1.9716142416000366, 2.207850456237793, 2.444086790084839, 2.6803231239318848, 2.9165592193603516, 3.1527955532073975, 3.3890318870544434, 3.6252682209014893, 3.861504554748535, 4.097740650177002, 4.333976745605469, 4.570213317871094, 4.8064494132995605, 5.042685508728027, 5.278922080993652, 5.515158176422119, 5.751394748687744, 5.987630844116211, 6.223867416381836, 6.460103511810303, 6.6963396072387695, 6.9325761795043945, 7.168812274932861, 7.405048370361328, 7.641284942626953, 7.87752103805542, 8.113757133483887, 8.349993705749512, 8.586230278015137, 8.822465896606445, 9.05870246887207]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 10.0, 10.0, 29.0, 46.0, 60.0, 73.0, 124.0, 169.0, 240.0, 433.0, 617.0, 1035.0, 1843.0, 3038.0, 5518.0, 10755.0, 20852.0, 41717.0, 83479.0, 159600.0, 244352.0, 217691.0, 125873.0, 63769.0, 31999.0, 16073.0, 8327.0, 4483.0, 2490.0, 1396.0, 890.0, 546.0, 327.0, 220.0, 135.0, 104.0, 56.0, 56.0, 31.0, 19.0, 13.0, 13.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76953125, -0.7445526123046875, -0.719573974609375, -0.6945953369140625, -0.66961669921875, -0.6446380615234375, -0.619659423828125, -0.5946807861328125, -0.5697021484375, -0.5447235107421875, -0.519744873046875, -0.4947662353515625, -0.46978759765625, -0.4448089599609375, -0.419830322265625, -0.3948516845703125, -0.369873046875, -0.3448944091796875, -0.319915771484375, -0.2949371337890625, -0.26995849609375, -0.2449798583984375, -0.220001220703125, -0.1950225830078125, -0.1700439453125, -0.1450653076171875, -0.120086669921875, -0.0951080322265625, -0.07012939453125, -0.0451507568359375, -0.020172119140625, 0.0048065185546875, 0.02978515625, 0.0547637939453125, 0.079742431640625, 0.1047210693359375, 0.12969970703125, 0.1546783447265625, 0.179656982421875, 0.2046356201171875, 0.2296142578125, 0.2545928955078125, 0.279571533203125, 0.3045501708984375, 0.32952880859375, 0.3545074462890625, 0.379486083984375, 0.4044647216796875, 0.429443359375, 0.4544219970703125, 0.479400634765625, 0.5043792724609375, 0.52935791015625, 0.5543365478515625, 0.579315185546875, 0.6042938232421875, 0.6292724609375, 0.6542510986328125, 0.679229736328125, 0.7042083740234375, 0.72918701171875, 0.7541656494140625, 0.779144287109375, 0.8041229248046875, 0.8291015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 18.0, 19.0, 25.0, 24.0, 31.0, 33.0, 33.0, 42.0, 45.0, 41.0, 59.0, 58.0, 50.0, 59.0, 52.0, 41.0, 43.0, 52.0, 38.0, 37.0, 27.0, 26.0, 21.0, 24.0, 13.0, 6.0, 11.0, 7.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0009765625, -0.9727554321289062, -0.9445343017578125, -0.9163131713867188, -0.888092041015625, -0.8598709106445312, -0.8316497802734375, -0.8034286499023438, -0.77520751953125, -0.7469863891601562, -0.7187652587890625, -0.6905441284179688, -0.662322998046875, -0.6341018676757812, -0.6058807373046875, -0.5776596069335938, -0.5494384765625, -0.5212173461914062, -0.4929962158203125, -0.46477508544921875, -0.436553955078125, -0.40833282470703125, -0.3801116943359375, -0.35189056396484375, -0.32366943359375, -0.29544830322265625, -0.2672271728515625, -0.23900604248046875, -0.210784912109375, -0.18256378173828125, -0.1543426513671875, -0.12612152099609375, -0.097900390625, -0.06967926025390625, -0.0414581298828125, -0.01323699951171875, 0.014984130859375, 0.04320526123046875, 0.0714263916015625, 0.09964752197265625, 0.12786865234375, 0.15608978271484375, 0.1843109130859375, 0.21253204345703125, 0.240753173828125, 0.26897430419921875, 0.2971954345703125, 0.32541656494140625, 0.3536376953125, 0.38185882568359375, 0.4100799560546875, 0.43830108642578125, 0.466522216796875, 0.49474334716796875, 0.5229644775390625, 0.5511856079101562, 0.57940673828125, 0.6076278686523438, 0.6358489990234375, 0.6640701293945312, 0.692291259765625, 0.7205123901367188, 0.7487335205078125, 0.7769546508789062, 0.80517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 14.0, 6.0, 25.0, 22.0, 32.0, 37.0, 52.0, 60.0, 77.0, 120.0, 182.0, 251.0, 357.0, 573.0, 1008.0, 1917.0, 5098.0, 16786.0, 71799.0, 439197.0, 412825.0, 71463.0, 16759.0, 4950.0, 1994.0, 943.0, 577.0, 384.0, 273.0, 160.0, 150.0, 105.0, 76.0, 55.0, 39.0, 43.0, 27.0, 32.0, 18.0, 19.0, 13.0, 4.0, 6.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.6162109375, -1.5640716552734375, -1.511932373046875, -1.4597930908203125, -1.40765380859375, -1.3555145263671875, -1.303375244140625, -1.2512359619140625, -1.1990966796875, -1.1469573974609375, -1.094818115234375, -1.0426788330078125, -0.99053955078125, -0.9384002685546875, -0.886260986328125, -0.8341217041015625, -0.781982421875, -0.7298431396484375, -0.677703857421875, -0.6255645751953125, -0.57342529296875, -0.5212860107421875, -0.469146728515625, -0.4170074462890625, -0.3648681640625, -0.3127288818359375, -0.260589599609375, -0.2084503173828125, -0.15631103515625, -0.1041717529296875, -0.052032470703125, 0.0001068115234375, 0.05224609375, 0.1043853759765625, 0.156524658203125, 0.2086639404296875, 0.26080322265625, 0.3129425048828125, 0.365081787109375, 0.4172210693359375, 0.4693603515625, 0.5214996337890625, 0.573638916015625, 0.6257781982421875, 0.67791748046875, 0.7300567626953125, 0.782196044921875, 0.8343353271484375, 0.886474609375, 0.9386138916015625, 0.990753173828125, 1.0428924560546875, 1.09503173828125, 1.1471710205078125, 1.199310302734375, 1.2514495849609375, 1.3035888671875, 1.3557281494140625, 1.407867431640625, 1.4600067138671875, 1.51214599609375, 1.5642852783203125, 1.616424560546875, 1.6685638427734375, 1.720703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 14.0, 16.0, 10.0, 14.0, 19.0, 26.0, 29.0, 48.0, 34.0, 46.0, 38.0, 46.0, 47.0, 58.0, 58.0, 35.0, 55.0, 45.0, 46.0, 34.0, 40.0, 34.0, 35.0, 21.0, 26.0, 19.0, 10.0, 11.0, 11.0, 12.0, 14.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.6295166015625, -2.540283203125, -2.4510498046875, -2.36181640625, -2.2725830078125, -2.183349609375, -2.0941162109375, -2.0048828125, -1.9156494140625, -1.826416015625, -1.7371826171875, -1.64794921875, -1.5587158203125, -1.469482421875, -1.3802490234375, -1.291015625, -1.2017822265625, -1.112548828125, -1.0233154296875, -0.93408203125, -0.8448486328125, -0.755615234375, -0.6663818359375, -0.5771484375, -0.4879150390625, -0.398681640625, -0.3094482421875, -0.22021484375, -0.1309814453125, -0.041748046875, 0.0474853515625, 0.13671875, 0.2259521484375, 0.315185546875, 0.4044189453125, 0.49365234375, 0.5828857421875, 0.672119140625, 0.7613525390625, 0.8505859375, 0.9398193359375, 1.029052734375, 1.1182861328125, 1.20751953125, 1.2967529296875, 1.385986328125, 1.4752197265625, 1.564453125, 1.6536865234375, 1.742919921875, 1.8321533203125, 1.92138671875, 2.0106201171875, 2.099853515625, 2.1890869140625, 2.2783203125, 2.3675537109375, 2.456787109375, 2.5460205078125, 2.63525390625, 2.7244873046875, 2.813720703125, 2.9029541015625, 2.9921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 11.0, 11.0, 16.0, 25.0, 38.0, 46.0, 51.0, 82.0, 167.0, 259.0, 444.0, 929.0, 1916.0, 4834.0, 13566.0, 44427.0, 174811.0, 628148.0, 126864.0, 33769.0, 10707.0, 3905.0, 1652.0, 757.0, 435.0, 242.0, 133.0, 76.0, 67.0, 48.0, 25.0, 18.0, 10.0, 13.0, 3.0, 9.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4221000671386719, -0.40865325927734375, -0.3952064514160156, -0.3817596435546875, -0.3683128356933594, -0.35486602783203125, -0.3414192199707031, -0.327972412109375, -0.3145256042480469, -0.30107879638671875, -0.2876319885253906, -0.2741851806640625, -0.2607383728027344, -0.24729156494140625, -0.23384475708007812, -0.22039794921875, -0.20695114135742188, -0.19350433349609375, -0.18005752563476562, -0.1666107177734375, -0.15316390991210938, -0.13971710205078125, -0.12627029418945312, -0.112823486328125, -0.09937667846679688, -0.08592987060546875, -0.07248306274414062, -0.0590362548828125, -0.045589447021484375, -0.03214263916015625, -0.018695831298828125, -0.0052490234375, 0.008197784423828125, 0.02164459228515625, 0.035091400146484375, 0.0485382080078125, 0.061985015869140625, 0.07543182373046875, 0.08887863159179688, 0.102325439453125, 0.11577224731445312, 0.12921905517578125, 0.14266586303710938, 0.1561126708984375, 0.16955947875976562, 0.18300628662109375, 0.19645309448242188, 0.20989990234375, 0.22334671020507812, 0.23679351806640625, 0.2502403259277344, 0.2636871337890625, 0.2771339416503906, 0.29058074951171875, 0.3040275573730469, 0.317474365234375, 0.3309211730957031, 0.34436798095703125, 0.3578147888183594, 0.3712615966796875, 0.3847084045410156, 0.39815521240234375, 0.4116020202636719, 0.425048828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 8.0, 9.0, 16.0, 16.0, 23.0, 48.0, 71.0, 89.0, 125.0, 135.0, 119.0, 100.0, 67.0, 44.0, 29.0, 26.0, 23.0, 15.0, 6.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023281574249267578, -0.00022627972066402435, -0.00021974369883537292, -0.0002132076770067215, -0.00020667165517807007, -0.00020013563334941864, -0.0001935996115207672, -0.00018706358969211578, -0.00018052756786346436, -0.00017399154603481293, -0.0001674555242061615, -0.00016091950237751007, -0.00015438348054885864, -0.00014784745872020721, -0.00014131143689155579, -0.00013477541506290436, -0.00012823939323425293, -0.0001217033714056015, -0.00011516734957695007, -0.00010863132774829865, -0.00010209530591964722, -9.555928409099579e-05, -8.902326226234436e-05, -8.248724043369293e-05, -7.59512186050415e-05, -6.941519677639008e-05, -6.287917494773865e-05, -5.634315311908722e-05, -4.980713129043579e-05, -4.327110946178436e-05, -3.6735087633132935e-05, -3.0199065804481506e-05, -2.3663043975830078e-05, -1.712702214717865e-05, -1.0591000318527222e-05, -4.0549784898757935e-06, 2.4810433387756348e-06, 9.017065167427063e-06, 1.555308699607849e-05, 2.208910882472992e-05, 2.8625130653381348e-05, 3.5161152482032776e-05, 4.1697174310684204e-05, 4.823319613933563e-05, 5.476921796798706e-05, 6.130523979663849e-05, 6.784126162528992e-05, 7.437728345394135e-05, 8.091330528259277e-05, 8.74493271112442e-05, 9.398534893989563e-05, 0.00010052137076854706, 0.00010705739259719849, 0.00011359341442584991, 0.00012012943625450134, 0.00012666545808315277, 0.0001332014799118042, 0.00013973750174045563, 0.00014627352356910706, 0.00015280954539775848, 0.0001593455672264099, 0.00016588158905506134, 0.00017241761088371277, 0.0001789536327123642, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 13.0, 17.0, 21.0, 30.0, 57.0, 113.0, 177.0, 316.0, 620.0, 1553.0, 4644.0, 19043.0, 118800.0, 740728.0, 133734.0, 20729.0, 4984.0, 1585.0, 672.0, 296.0, 175.0, 92.0, 56.0, 34.0, 12.0, 14.0, 8.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.72265625, -0.7038993835449219, -0.6851425170898438, -0.6663856506347656, -0.6476287841796875, -0.6288719177246094, -0.6101150512695312, -0.5913581848144531, -0.572601318359375, -0.5538444519042969, -0.5350875854492188, -0.5163307189941406, -0.4975738525390625, -0.4788169860839844, -0.46006011962890625, -0.4413032531738281, -0.42254638671875, -0.4037895202636719, -0.38503265380859375, -0.3662757873535156, -0.3475189208984375, -0.3287620544433594, -0.31000518798828125, -0.2912483215332031, -0.272491455078125, -0.2537345886230469, -0.23497772216796875, -0.21622085571289062, -0.1974639892578125, -0.17870712280273438, -0.15995025634765625, -0.14119338989257812, -0.1224365234375, -0.10367965698242188, -0.08492279052734375, -0.06616592407226562, -0.0474090576171875, -0.028652191162109375, -0.00989532470703125, 0.008861541748046875, 0.027618408203125, 0.046375274658203125, 0.06513214111328125, 0.08388900756835938, 0.1026458740234375, 0.12140274047851562, 0.14015960693359375, 0.15891647338867188, 0.17767333984375, 0.19643020629882812, 0.21518707275390625, 0.23394393920898438, 0.2527008056640625, 0.2714576721191406, 0.29021453857421875, 0.3089714050292969, 0.327728271484375, 0.3464851379394531, 0.36524200439453125, 0.3839988708496094, 0.4027557373046875, 0.4215126037597656, 0.44026947021484375, 0.4590263366699219, 0.477783203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 1.0, 5.0, 11.0, 13.0, 20.0, 29.0, 34.0, 49.0, 82.0, 100.0, 102.0, 102.0, 119.0, 83.0, 77.0, 44.0, 34.0, 23.0, 19.0, 16.0, 12.0, 5.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5746002197265625, -0.553009033203125, -0.5314178466796875, -0.50982666015625, -0.4882354736328125, -0.466644287109375, -0.4450531005859375, -0.4234619140625, -0.4018707275390625, -0.380279541015625, -0.3586883544921875, -0.33709716796875, -0.3155059814453125, -0.293914794921875, -0.2723236083984375, -0.250732421875, -0.2291412353515625, -0.207550048828125, -0.1859588623046875, -0.16436767578125, -0.1427764892578125, -0.121185302734375, -0.0995941162109375, -0.0780029296875, -0.0564117431640625, -0.034820556640625, -0.0132293701171875, 0.00836181640625, 0.0299530029296875, 0.051544189453125, 0.0731353759765625, 0.0947265625, 0.1163177490234375, 0.137908935546875, 0.1595001220703125, 0.18109130859375, 0.2026824951171875, 0.224273681640625, 0.2458648681640625, 0.2674560546875, 0.2890472412109375, 0.310638427734375, 0.3322296142578125, 0.35382080078125, 0.3754119873046875, 0.397003173828125, 0.4185943603515625, 0.440185546875, 0.4617767333984375, 0.483367919921875, 0.5049591064453125, 0.52655029296875, 0.5481414794921875, 0.569732666015625, 0.5913238525390625, 0.6129150390625, 0.6345062255859375, 0.656097412109375, 0.6776885986328125, 0.69927978515625, 0.7208709716796875, 0.742462158203125, 0.7640533447265625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 7.0, 16.0, 47.0, 63.0, 111.0, 190.0, 291.0, 123.0, 65.0, 36.0, 17.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890586853027344, -19.39608383178711, -18.901580810546875, -18.40707778930664, -17.912574768066406, -17.418071746826172, -16.923568725585938, -16.429065704345703, -15.934563636779785, -15.44006061553955, -14.945557594299316, -14.451054573059082, -13.956552505493164, -13.46204948425293, -12.967546463012695, -12.473043441772461, -11.978540420532227, -11.484037399291992, -10.989534378051758, -10.495031356811523, -10.000528335571289, -9.506025314331055, -9.011523246765137, -8.517020225524902, -8.022517204284668, -7.528014183044434, -7.033511161804199, -6.539008617401123, -6.044505596160889, -5.550002574920654, -5.055500030517578, -4.560997009277344, -4.066493988037109, -3.571990966796875, -3.0774881839752197, -2.5829854011535645, -2.08848237991333, -1.5939793586730957, -1.0994765758514404, -0.6049737930297852, -0.11047077178955078, 0.38403213024139404, 0.8785350322723389, 1.3730379343032837, 1.8675408363342285, 2.362043857574463, 2.856546640396118, 3.3510494232177734, 3.845552444458008, 4.340055465698242, 4.834558486938477, 5.329061031341553, 5.823564052581787, 6.3180670738220215, 6.812569618225098, 7.307072639465332, 7.801575660705566, 8.2960786819458, 8.790581703186035, 9.28508472442627, 9.779586791992188, 10.274089813232422, 10.768592834472656, 11.26309585571289, 11.757598876953125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 6.0, 2.0, 10.0, 6.0, 12.0, 20.0, 14.0, 16.0, 19.0, 23.0, 18.0, 25.0, 26.0, 21.0, 41.0, 46.0, 46.0, 95.0, 115.0, 70.0, 49.0, 34.0, 35.0, 29.0, 31.0, 26.0, 29.0, 21.0, 19.0, 13.0, 10.0, 11.0, 10.0, 6.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.874667167663574, -9.539567947387695, -9.204469680786133, -8.86937141418457, -8.534272193908691, -8.199172973632812, -7.86407470703125, -7.528975963592529, -7.193877220153809, -6.858778476715088, -6.523679733276367, -6.1885809898376465, -5.853482246398926, -5.518383502960205, -5.183284759521484, -4.848186016082764, -4.513087272644043, -4.177988529205322, -3.8428897857666016, -3.507791042327881, -3.17269229888916, -2.8375935554504395, -2.5024948120117188, -2.167396068572998, -1.8322973251342773, -1.4971985816955566, -1.162099838256836, -0.8270010948181152, -0.49190235137939453, -0.15680360794067383, 0.17829513549804688, 0.5133938789367676, 0.8484916687011719, 1.1835904121398926, 1.5186891555786133, 1.853787899017334, 2.1888866424560547, 2.5239853858947754, 2.859084129333496, 3.194182872772217, 3.5292816162109375, 3.864380359649658, 4.199479103088379, 4.5345778465271, 4.86967658996582, 5.204775333404541, 5.539874076843262, 5.874972820281982, 6.210071563720703, 6.545170307159424, 6.8802690505981445, 7.215367794036865, 7.550466537475586, 7.885565280914307, 8.220664024353027, 8.555763244628906, 8.890861511230469, 9.225959777832031, 9.56105899810791, 9.896158218383789, 10.231256484985352, 10.566354751586914, 10.901453971862793, 11.236553192138672, 11.571651458740234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 21.0, 18.0, 25.0, 42.0, 60.0, 88.0, 153.0, 223.0, 380.0, 596.0, 1143.0, 2323.0, 5442.0, 14369.0, 42554.0, 144867.0, 488748.0, 1296868.0, 1409177.0, 549073.0, 161110.0, 48314.0, 16360.0, 6426.0, 2770.0, 1377.0, 691.0, 373.0, 221.0, 133.0, 99.0, 63.0, 52.0, 22.0, 24.0, 17.0, 13.0, 5.0, 6.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.65185546875, -0.6327133178710938, -0.6135711669921875, -0.5944290161132812, -0.575286865234375, -0.5561447143554688, -0.5370025634765625, -0.5178604125976562, -0.49871826171875, -0.47957611083984375, -0.4604339599609375, -0.44129180908203125, -0.422149658203125, -0.40300750732421875, -0.3838653564453125, -0.36472320556640625, -0.3455810546875, -0.32643890380859375, -0.3072967529296875, -0.28815460205078125, -0.269012451171875, -0.24987030029296875, -0.2307281494140625, -0.21158599853515625, -0.19244384765625, -0.17330169677734375, -0.1541595458984375, -0.13501739501953125, -0.115875244140625, -0.09673309326171875, -0.0775909423828125, -0.05844879150390625, -0.039306640625, -0.02016448974609375, -0.0010223388671875, 0.01811981201171875, 0.037261962890625, 0.05640411376953125, 0.0755462646484375, 0.09468841552734375, 0.11383056640625, 0.13297271728515625, 0.1521148681640625, 0.17125701904296875, 0.190399169921875, 0.20954132080078125, 0.2286834716796875, 0.24782562255859375, 0.2669677734375, 0.28610992431640625, 0.3052520751953125, 0.32439422607421875, 0.343536376953125, 0.36267852783203125, 0.3818206787109375, 0.40096282958984375, 0.42010498046875, 0.43924713134765625, 0.4583892822265625, 0.47753143310546875, 0.496673583984375, 0.5158157348632812, 0.5349578857421875, 0.5541000366210938, 0.5732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 7.0, 6.0, 15.0, 10.0, 26.0, 17.0, 29.0, 28.0, 36.0, 36.0, 47.0, 37.0, 54.0, 45.0, 52.0, 57.0, 41.0, 48.0, 44.0, 52.0, 37.0, 30.0, 37.0, 35.0, 35.0, 26.0, 19.0, 15.0, 10.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.96484375, -0.9371109008789062, -0.9093780517578125, -0.8816452026367188, -0.853912353515625, -0.8261795043945312, -0.7984466552734375, -0.7707138061523438, -0.74298095703125, -0.7152481079101562, -0.6875152587890625, -0.6597824096679688, -0.632049560546875, -0.6043167114257812, -0.5765838623046875, -0.5488510131835938, -0.5211181640625, -0.49338531494140625, -0.4656524658203125, -0.43791961669921875, -0.410186767578125, -0.38245391845703125, -0.3547210693359375, -0.32698822021484375, -0.29925537109375, -0.27152252197265625, -0.2437896728515625, -0.21605682373046875, -0.188323974609375, -0.16059112548828125, -0.1328582763671875, -0.10512542724609375, -0.077392578125, -0.04965972900390625, -0.0219268798828125, 0.00580596923828125, 0.033538818359375, 0.06127166748046875, 0.0890045166015625, 0.11673736572265625, 0.14447021484375, 0.17220306396484375, 0.1999359130859375, 0.22766876220703125, 0.255401611328125, 0.28313446044921875, 0.3108673095703125, 0.33860015869140625, 0.3663330078125, 0.39406585693359375, 0.4217987060546875, 0.44953155517578125, 0.477264404296875, 0.5049972534179688, 0.5327301025390625, 0.5604629516601562, 0.58819580078125, 0.6159286499023438, 0.6436614990234375, 0.6713943481445312, 0.699127197265625, 0.7268600463867188, 0.7545928955078125, 0.7823257446289062, 0.81005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 10.0, 22.0, 21.0, 18.0, 38.0, 84.0, 159.0, 279.0, 655.0, 2138.0, 12122.0, 157344.0, 3646417.0, 349956.0, 19916.0, 3219.0, 982.0, 398.0, 201.0, 107.0, 62.0, 35.0, 30.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9404296875, -1.8770294189453125, -1.813629150390625, -1.7502288818359375, -1.68682861328125, -1.6234283447265625, -1.560028076171875, -1.4966278076171875, -1.4332275390625, -1.3698272705078125, -1.306427001953125, -1.2430267333984375, -1.17962646484375, -1.1162261962890625, -1.052825927734375, -0.9894256591796875, -0.926025390625, -0.8626251220703125, -0.799224853515625, -0.7358245849609375, -0.67242431640625, -0.6090240478515625, -0.545623779296875, -0.4822235107421875, -0.4188232421875, -0.3554229736328125, -0.292022705078125, -0.2286224365234375, -0.16522216796875, -0.1018218994140625, -0.038421630859375, 0.0249786376953125, 0.08837890625, 0.1517791748046875, 0.215179443359375, 0.2785797119140625, 0.34197998046875, 0.4053802490234375, 0.468780517578125, 0.5321807861328125, 0.5955810546875, 0.6589813232421875, 0.722381591796875, 0.7857818603515625, 0.84918212890625, 0.9125823974609375, 0.975982666015625, 1.0393829345703125, 1.102783203125, 1.1661834716796875, 1.229583740234375, 1.2929840087890625, 1.35638427734375, 1.4197845458984375, 1.483184814453125, 1.5465850830078125, 1.6099853515625, 1.6733856201171875, 1.736785888671875, 1.8001861572265625, 1.86358642578125, 1.9269866943359375, 1.990386962890625, 2.0537872314453125, 2.1171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 5.0, 5.0, 14.0, 5.0, 9.0, 14.0, 21.0, 26.0, 39.0, 76.0, 105.0, 146.0, 210.0, 312.0, 416.0, 503.0, 515.0, 498.0, 333.0, 230.0, 163.0, 115.0, 61.0, 60.0, 40.0, 41.0, 30.0, 24.0, 16.0, 5.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8788375854492188, -0.8372650146484375, -0.7956924438476562, -0.754119873046875, -0.7125473022460938, -0.6709747314453125, -0.6294021606445312, -0.58782958984375, -0.5462570190429688, -0.5046844482421875, -0.46311187744140625, -0.421539306640625, -0.37996673583984375, -0.3383941650390625, -0.29682159423828125, -0.2552490234375, -0.21367645263671875, -0.1721038818359375, -0.13053131103515625, -0.088958740234375, -0.04738616943359375, -0.0058135986328125, 0.03575897216796875, 0.07733154296875, 0.11890411376953125, 0.1604766845703125, 0.20204925537109375, 0.243621826171875, 0.28519439697265625, 0.3267669677734375, 0.36833953857421875, 0.409912109375, 0.45148468017578125, 0.4930572509765625, 0.5346298217773438, 0.576202392578125, 0.6177749633789062, 0.6593475341796875, 0.7009201049804688, 0.74249267578125, 0.7840652465820312, 0.8256378173828125, 0.8672103881835938, 0.908782958984375, 0.9503555297851562, 0.9919281005859375, 1.0335006713867188, 1.0750732421875, 1.1166458129882812, 1.1582183837890625, 1.1997909545898438, 1.241363525390625, 1.2829360961914062, 1.3245086669921875, 1.3660812377929688, 1.40765380859375, 1.4492263793945312, 1.4907989501953125, 1.5323715209960938, 1.573944091796875, 1.6155166625976562, 1.6570892333984375, 1.6986618041992188, 1.740234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 22.0, 31.0, 70.0, 106.0, 165.0, 183.0, 148.0, 113.0, 62.0, 31.0, 12.0, 15.0, 7.0, 9.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9807820320129395, -6.546756267547607, -6.112730503082275, -5.678705215454102, -5.2446794509887695, -4.8106536865234375, -4.3766279220581055, -3.9426021575927734, -3.5085763931274414, -3.0745506286621094, -2.6405248641967773, -2.2064993381500244, -1.7724735736846924, -1.3384478092193604, -0.9044222831726074, -0.4703965187072754, -0.03637075424194336, 0.3976549506187439, 0.8316806554794312, 1.2657063007354736, 1.6997320652008057, 2.1337578296661377, 2.5677833557128906, 3.0018091201782227, 3.4358348846435547, 3.8698606491088867, 4.303886413574219, 4.737912178039551, 5.171937942504883, 5.605963706970215, 6.039988994598389, 6.474014759063721, 6.908041000366211, 7.342066764831543, 7.776092529296875, 8.210118293762207, 8.644144058227539, 9.078169822692871, 9.512195587158203, 9.946220397949219, 10.380247116088867, 10.8142728805542, 11.248298645019531, 11.682324409484863, 12.116350173950195, 12.550375938415527, 12.98440170288086, 13.418426513671875, 13.852452278137207, 14.286478042602539, 14.720503807067871, 15.154529571533203, 15.588555335998535, 16.022581100463867, 16.456605911254883, 16.89063262939453, 17.324657440185547, 17.758682250976562, 18.19270896911621, 18.626733779907227, 19.060760498046875, 19.49478530883789, 19.92881202697754, 20.362836837768555, 20.796863555908203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 15.0, 16.0, 24.0, 33.0, 46.0, 39.0, 35.0, 35.0, 35.0, 33.0, 47.0, 44.0, 39.0, 47.0, 50.0, 55.0, 46.0, 33.0, 31.0, 29.0, 37.0, 31.0, 36.0, 32.0, 24.0, 13.0, 17.0, 7.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.798887252807617, -6.553752422332764, -6.308617115020752, -6.063482284545898, -5.818346977233887, -5.573212146759033, -5.32807731628418, -5.082942008972168, -4.8378071784973145, -4.592672348022461, -4.347537040710449, -4.102402210235596, -3.857267141342163, -3.6121320724487305, -3.366997241973877, -3.1218621730804443, -2.8767271041870117, -2.631592035293579, -2.3864569664001465, -2.141322135925293, -1.8961870670318604, -1.6510519981384277, -1.4059170484542847, -1.1607820987701416, -0.915647029876709, -0.6705120205879211, -0.4253770112991333, -0.18024200201034546, 0.06489300727844238, 0.310028076171875, 0.5551630258560181, 0.8002979755401611, 1.0454330444335938, 1.2905681133270264, 1.5357030630111694, 1.7808380126953125, 2.025973081588745, 2.2711081504821777, 2.5162429809570312, 2.761378049850464, 3.0065131187438965, 3.251648187637329, 3.4967832565307617, 3.7419180870056152, 3.987053155899048, 4.2321882247924805, 4.477323055267334, 4.7224578857421875, 4.967593193054199, 5.212728023529053, 5.4578633308410645, 5.702998161315918, 5.94813346862793, 6.193268299102783, 6.438403129577637, 6.683538436889648, 6.928673267364502, 7.1738080978393555, 7.418943405151367, 7.664078235626221, 7.909213066101074, 8.154348373413086, 8.399483680725098, 8.644618034362793, 8.889753341674805]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 9.0, 16.0, 27.0, 42.0, 77.0, 106.0, 182.0, 267.0, 471.0, 800.0, 1531.0, 2796.0, 5459.0, 10795.0, 23141.0, 52855.0, 131360.0, 304760.0, 294359.0, 125284.0, 50382.0, 21973.0, 10445.0, 5163.0, 2746.0, 1502.0, 803.0, 448.0, 280.0, 176.0, 97.0, 56.0, 53.0, 30.0, 15.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154296875, -1.1144561767578125, -1.074615478515625, -1.0347747802734375, -0.99493408203125, -0.9550933837890625, -0.915252685546875, -0.8754119873046875, -0.8355712890625, -0.7957305908203125, -0.755889892578125, -0.7160491943359375, -0.67620849609375, -0.6363677978515625, -0.596527099609375, -0.5566864013671875, -0.516845703125, -0.4770050048828125, -0.437164306640625, -0.3973236083984375, -0.35748291015625, -0.3176422119140625, -0.277801513671875, -0.2379608154296875, -0.1981201171875, -0.1582794189453125, -0.118438720703125, -0.0785980224609375, -0.03875732421875, 0.0010833740234375, 0.040924072265625, 0.0807647705078125, 0.12060546875, 0.1604461669921875, 0.200286865234375, 0.2401275634765625, 0.27996826171875, 0.3198089599609375, 0.359649658203125, 0.3994903564453125, 0.4393310546875, 0.4791717529296875, 0.519012451171875, 0.5588531494140625, 0.59869384765625, 0.6385345458984375, 0.678375244140625, 0.7182159423828125, 0.758056640625, 0.7978973388671875, 0.837738037109375, 0.8775787353515625, 0.91741943359375, 0.9572601318359375, 0.997100830078125, 1.0369415283203125, 1.0767822265625, 1.1166229248046875, 1.156463623046875, 1.1963043212890625, 1.23614501953125, 1.2759857177734375, 1.315826416015625, 1.3556671142578125, 1.3955078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 22.0, 29.0, 20.0, 35.0, 37.0, 59.0, 57.0, 40.0, 60.0, 56.0, 56.0, 67.0, 52.0, 50.0, 55.0, 42.0, 35.0, 42.0, 32.0, 27.0, 20.0, 16.0, 10.0, 9.0, 10.0, 9.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9017791748046875, -0.868011474609375, -0.8342437744140625, -0.80047607421875, -0.7667083740234375, -0.732940673828125, -0.6991729736328125, -0.6654052734375, -0.6316375732421875, -0.597869873046875, -0.5641021728515625, -0.53033447265625, -0.4965667724609375, -0.462799072265625, -0.4290313720703125, -0.395263671875, -0.3614959716796875, -0.327728271484375, -0.2939605712890625, -0.26019287109375, -0.2264251708984375, -0.192657470703125, -0.1588897705078125, -0.1251220703125, -0.0913543701171875, -0.057586669921875, -0.0238189697265625, 0.00994873046875, 0.0437164306640625, 0.077484130859375, 0.1112518310546875, 0.14501953125, 0.1787872314453125, 0.212554931640625, 0.2463226318359375, 0.28009033203125, 0.3138580322265625, 0.347625732421875, 0.3813934326171875, 0.4151611328125, 0.4489288330078125, 0.482696533203125, 0.5164642333984375, 0.55023193359375, 0.5839996337890625, 0.617767333984375, 0.6515350341796875, 0.685302734375, 0.7190704345703125, 0.752838134765625, 0.7866058349609375, 0.82037353515625, 0.8541412353515625, 0.887908935546875, 0.9216766357421875, 0.9554443359375, 0.9892120361328125, 1.022979736328125, 1.0567474365234375, 1.09051513671875, 1.1242828369140625, 1.158050537109375, 1.1918182373046875, 1.2255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 14.0, 15.0, 17.0, 27.0, 34.0, 51.0, 74.0, 78.0, 106.0, 132.0, 212.0, 298.0, 418.0, 629.0, 968.0, 1907.0, 4633.0, 18695.0, 123896.0, 756737.0, 113111.0, 17126.0, 4498.0, 1830.0, 957.0, 649.0, 377.0, 285.0, 199.0, 134.0, 99.0, 79.0, 66.0, 52.0, 32.0, 36.0, 17.0, 15.0, 7.0, 5.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.165283203125, -2.09423828125, -2.023193359375, -1.9521484375, -1.881103515625, -1.81005859375, -1.739013671875, -1.66796875, -1.596923828125, -1.52587890625, -1.454833984375, -1.3837890625, -1.312744140625, -1.24169921875, -1.170654296875, -1.099609375, -1.028564453125, -0.95751953125, -0.886474609375, -0.8154296875, -0.744384765625, -0.67333984375, -0.602294921875, -0.53125, -0.460205078125, -0.38916015625, -0.318115234375, -0.2470703125, -0.176025390625, -0.10498046875, -0.033935546875, 0.037109375, 0.108154296875, 0.17919921875, 0.250244140625, 0.3212890625, 0.392333984375, 0.46337890625, 0.534423828125, 0.60546875, 0.676513671875, 0.74755859375, 0.818603515625, 0.8896484375, 0.960693359375, 1.03173828125, 1.102783203125, 1.173828125, 1.244873046875, 1.31591796875, 1.386962890625, 1.4580078125, 1.529052734375, 1.60009765625, 1.671142578125, 1.7421875, 1.813232421875, 1.88427734375, 1.955322265625, 2.0263671875, 2.097412109375, 2.16845703125, 2.239501953125, 2.310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 10.0, 13.0, 12.0, 13.0, 14.0, 24.0, 26.0, 32.0, 32.0, 32.0, 46.0, 43.0, 44.0, 56.0, 45.0, 63.0, 62.0, 53.0, 51.0, 53.0, 41.0, 33.0, 21.0, 30.0, 27.0, 20.0, 17.0, 10.0, 11.0, 16.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1796875, -3.078155517578125, -2.97662353515625, -2.875091552734375, -2.7735595703125, -2.672027587890625, -2.57049560546875, -2.468963623046875, -2.367431640625, -2.265899658203125, -2.16436767578125, -2.062835693359375, -1.9613037109375, -1.859771728515625, -1.75823974609375, -1.656707763671875, -1.55517578125, -1.453643798828125, -1.35211181640625, -1.250579833984375, -1.1490478515625, -1.047515869140625, -0.94598388671875, -0.844451904296875, -0.742919921875, -0.641387939453125, -0.53985595703125, -0.438323974609375, -0.3367919921875, -0.235260009765625, -0.13372802734375, -0.032196044921875, 0.0693359375, 0.170867919921875, 0.27239990234375, 0.373931884765625, 0.4754638671875, 0.576995849609375, 0.67852783203125, 0.780059814453125, 0.881591796875, 0.983123779296875, 1.08465576171875, 1.186187744140625, 1.2877197265625, 1.389251708984375, 1.49078369140625, 1.592315673828125, 1.69384765625, 1.795379638671875, 1.89691162109375, 1.998443603515625, 2.0999755859375, 2.201507568359375, 2.30303955078125, 2.404571533203125, 2.506103515625, 2.607635498046875, 2.70916748046875, 2.810699462890625, 2.9122314453125, 3.013763427734375, 3.11529541015625, 3.216827392578125, 3.318359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 8.0, 21.0, 43.0, 30.0, 64.0, 109.0, 147.0, 286.0, 522.0, 1136.0, 2931.0, 9559.0, 45292.0, 308668.0, 610829.0, 52413.0, 10858.0, 3146.0, 1145.0, 560.0, 302.0, 163.0, 95.0, 61.0, 50.0, 28.0, 22.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4754753112792969, -0.45851898193359375, -0.4415626525878906, -0.4246063232421875, -0.4076499938964844, -0.39069366455078125, -0.3737373352050781, -0.356781005859375, -0.3398246765136719, -0.32286834716796875, -0.3059120178222656, -0.2889556884765625, -0.2719993591308594, -0.25504302978515625, -0.23808670043945312, -0.22113037109375, -0.20417404174804688, -0.18721771240234375, -0.17026138305664062, -0.1533050537109375, -0.13634872436523438, -0.11939239501953125, -0.10243606567382812, -0.085479736328125, -0.06852340698242188, -0.05156707763671875, -0.034610748291015625, -0.0176544189453125, -0.000698089599609375, 0.01625823974609375, 0.033214569091796875, 0.0501708984375, 0.06712722778320312, 0.08408355712890625, 0.10103988647460938, 0.1179962158203125, 0.13495254516601562, 0.15190887451171875, 0.16886520385742188, 0.185821533203125, 0.20277786254882812, 0.21973419189453125, 0.23669052124023438, 0.2536468505859375, 0.2706031799316406, 0.28755950927734375, 0.3045158386230469, 0.32147216796875, 0.3384284973144531, 0.35538482666015625, 0.3723411560058594, 0.3892974853515625, 0.4062538146972656, 0.42321014404296875, 0.4401664733886719, 0.457122802734375, 0.4740791320800781, 0.49103546142578125, 0.5079917907714844, 0.5249481201171875, 0.5419044494628906, 0.5588607788085938, 0.5758171081542969, 0.5927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 7.0, 9.0, 12.0, 11.0, 18.0, 22.0, 24.0, 27.0, 29.0, 44.0, 74.0, 69.0, 77.0, 82.0, 88.0, 82.0, 66.0, 46.0, 38.0, 20.0, 29.0, 18.0, 24.0, 16.0, 9.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001481771469116211, -0.00014331750571727753, -0.00013845786452293396, -0.0001335982233285904, -0.00012873858213424683, -0.00012387894093990326, -0.00011901929974555969, -0.00011415965855121613, -0.00010930001735687256, -0.00010444037616252899, -9.958073496818542e-05, -9.472109377384186e-05, -8.986145257949829e-05, -8.500181138515472e-05, -8.014217019081116e-05, -7.528252899646759e-05, -7.042288780212402e-05, -6.556324660778046e-05, -6.070360541343689e-05, -5.584396421909332e-05, -5.0984323024749756e-05, -4.612468183040619e-05, -4.126504063606262e-05, -3.6405399441719055e-05, -3.154575824737549e-05, -2.668611705303192e-05, -2.1826475858688354e-05, -1.6966834664344788e-05, -1.210719347000122e-05, -7.247552275657654e-06, -2.387911081314087e-06, 2.47173011302948e-06, 7.331371307373047e-06, 1.2191012501716614e-05, 1.705065369606018e-05, 2.1910294890403748e-05, 2.6769936084747314e-05, 3.162957727909088e-05, 3.648921847343445e-05, 4.1348859667778015e-05, 4.620850086212158e-05, 5.106814205646515e-05, 5.5927783250808716e-05, 6.078742444515228e-05, 6.564706563949585e-05, 7.050670683383942e-05, 7.536634802818298e-05, 8.022598922252655e-05, 8.508563041687012e-05, 8.994527161121368e-05, 9.480491280555725e-05, 9.966455399990082e-05, 0.00010452419519424438, 0.00010938383638858795, 0.00011424347758293152, 0.00011910311877727509, 0.00012396275997161865, 0.00012882240116596222, 0.00013368204236030579, 0.00013854168355464935, 0.00014340132474899292, 0.0001482609659433365, 0.00015312060713768005, 0.00015798024833202362, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 5.0, 16.0, 27.0, 26.0, 41.0, 49.0, 110.0, 146.0, 234.0, 382.0, 708.0, 1440.0, 3633.0, 12015.0, 55845.0, 604014.0, 305091.0, 48002.0, 10509.0, 3282.0, 1325.0, 629.0, 394.0, 206.0, 137.0, 83.0, 45.0, 46.0, 24.0, 18.0, 14.0, 12.0, 11.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5430030822753906, -0.5279006958007812, -0.5127983093261719, -0.4976959228515625, -0.4825935363769531, -0.46749114990234375, -0.4523887634277344, -0.437286376953125, -0.4221839904785156, -0.40708160400390625, -0.3919792175292969, -0.3768768310546875, -0.3617744445800781, -0.34667205810546875, -0.3315696716308594, -0.31646728515625, -0.3013648986816406, -0.28626251220703125, -0.2711601257324219, -0.2560577392578125, -0.24095535278320312, -0.22585296630859375, -0.21075057983398438, -0.195648193359375, -0.18054580688476562, -0.16544342041015625, -0.15034103393554688, -0.1352386474609375, -0.12013626098632812, -0.10503387451171875, -0.08993148803710938, -0.0748291015625, -0.059726715087890625, -0.04462432861328125, -0.029521942138671875, -0.0144195556640625, 0.000682830810546875, 0.01578521728515625, 0.030887603759765625, 0.045989990234375, 0.061092376708984375, 0.07619476318359375, 0.09129714965820312, 0.1063995361328125, 0.12150192260742188, 0.13660430908203125, 0.15170669555664062, 0.16680908203125, 0.18191146850585938, 0.19701385498046875, 0.21211624145507812, 0.2272186279296875, 0.24232101440429688, 0.25742340087890625, 0.2725257873535156, 0.287628173828125, 0.3027305603027344, 0.31783294677734375, 0.3329353332519531, 0.3480377197265625, 0.3631401062011719, 0.37824249267578125, 0.3933448791503906, 0.408447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 15.0, 18.0, 19.0, 22.0, 25.0, 31.0, 28.0, 53.0, 65.0, 62.0, 88.0, 75.0, 82.0, 62.0, 45.0, 54.0, 44.0, 41.0, 29.0, 17.0, 17.0, 14.0, 13.0, 9.0, 9.0, 11.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.462158203125, -0.44886016845703125, -0.4355621337890625, -0.42226409912109375, -0.408966064453125, -0.39566802978515625, -0.3823699951171875, -0.36907196044921875, -0.35577392578125, -0.34247589111328125, -0.3291778564453125, -0.31587982177734375, -0.302581787109375, -0.28928375244140625, -0.2759857177734375, -0.26268768310546875, -0.2493896484375, -0.23609161376953125, -0.2227935791015625, -0.20949554443359375, -0.196197509765625, -0.18289947509765625, -0.1696014404296875, -0.15630340576171875, -0.14300537109375, -0.12970733642578125, -0.1164093017578125, -0.10311126708984375, -0.089813232421875, -0.07651519775390625, -0.0632171630859375, -0.04991912841796875, -0.03662109375, -0.02332305908203125, -0.0100250244140625, 0.00327301025390625, 0.016571044921875, 0.02986907958984375, 0.0431671142578125, 0.05646514892578125, 0.06976318359375, 0.08306121826171875, 0.0963592529296875, 0.10965728759765625, 0.122955322265625, 0.13625335693359375, 0.1495513916015625, 0.16284942626953125, 0.1761474609375, 0.18944549560546875, 0.2027435302734375, 0.21604156494140625, 0.229339599609375, 0.24263763427734375, 0.2559356689453125, 0.26923370361328125, 0.28253173828125, 0.29582977294921875, 0.3091278076171875, 0.32242584228515625, 0.335723876953125, 0.34902191162109375, 0.3623199462890625, 0.37561798095703125, 0.388916015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 11.0, 17.0, 23.0, 29.0, 66.0, 96.0, 148.0, 333.0, 131.0, 61.0, 46.0, 16.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.230846405029297, -21.75246238708496, -21.274078369140625, -20.79569435119629, -20.317310333251953, -19.838924407958984, -19.36054039001465, -18.882156372070312, -18.403772354125977, -17.92538833618164, -17.447004318237305, -16.96862030029297, -16.490234375, -16.011850357055664, -15.533466339111328, -15.055082321166992, -14.576698303222656, -14.09831428527832, -13.619930267333984, -13.141545295715332, -12.663161277770996, -12.18477725982666, -11.706392288208008, -11.228008270263672, -10.749624252319336, -10.271240234375, -9.792856216430664, -9.314471244812012, -8.836087226867676, -8.35770320892334, -7.879318714141846, -7.400934219360352, -6.922549247741699, -6.444165229797363, -5.965780735015869, -5.487396240234375, -5.009012222290039, -4.530628204345703, -4.052243709564209, -3.573859453201294, -3.095475196838379, -2.617090940475464, -2.138706684112549, -1.6603224277496338, -1.1819381713867188, -0.7035539150238037, -0.22516965866088867, 0.25321459770202637, 0.7315988540649414, 1.2099831104278564, 1.6883673667907715, 2.1667516231536865, 2.6451358795166016, 3.1235201358795166, 3.6019043922424316, 4.080288887023926, 4.558672904968262, 5.037056922912598, 5.515441417694092, 5.993825912475586, 6.472209930419922, 6.950593948364258, 7.428978443145752, 7.907362937927246, 8.385746955871582]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 12.0, 11.0, 14.0, 15.0, 21.0, 18.0, 21.0, 31.0, 39.0, 38.0, 31.0, 52.0, 145.0, 142.0, 66.0, 45.0, 39.0, 22.0, 31.0, 27.0, 28.0, 21.0, 16.0, 8.0, 9.0, 11.0, 10.0, 13.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.262158393859863, -12.884936332702637, -12.50771427154541, -12.130491256713867, -11.75326919555664, -11.376047134399414, -10.998825073242188, -10.621603012084961, -10.244380950927734, -9.867158889770508, -9.489936828613281, -9.112714767456055, -8.735491752624512, -8.358269691467285, -7.981047630310059, -7.603825569152832, -7.226602554321289, -6.8493804931640625, -6.472157955169678, -6.094935894012451, -5.717713356018066, -5.34049129486084, -4.963269233703613, -4.586047172546387, -4.208824634552002, -3.8316023349761963, -3.4543800354003906, -3.077157974243164, -2.6999356746673584, -2.3227133750915527, -1.9454913139343262, -1.5682690143585205, -1.1910476684570312, -0.8138254284858704, -0.4366031885147095, -0.05938100814819336, 0.3178412914276123, 0.695063591003418, 1.0722856521606445, 1.4495079517364502, 1.8267302513122559, 2.2039525508880615, 2.581174850463867, 2.9583969116210938, 3.3356192111968994, 3.712841510772705, 4.090063571929932, 4.467286109924316, 4.844508171081543, 5.2217302322387695, 5.598952770233154, 5.976174831390381, 6.353397369384766, 6.730619430541992, 7.107841491699219, 7.485063552856445, 7.86228609085083, 8.239508628845215, 8.616730690002441, 8.993952751159668, 9.371174812316895, 9.748397827148438, 10.125619888305664, 10.50284194946289, 10.880064010620117]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 11.0, 12.0, 11.0, 25.0, 38.0, 77.0, 108.0, 182.0, 287.0, 615.0, 1106.0, 2196.0, 5468.0, 18216.0, 92787.0, 529604.0, 1851096.0, 1328823.0, 291840.0, 51548.0, 12515.0, 3966.0, 1652.0, 957.0, 455.0, 285.0, 170.0, 86.0, 54.0, 34.0, 27.0, 7.0, 10.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.83453369140625, -0.7979736328125, -0.76141357421875, -0.724853515625, -0.68829345703125, -0.6517333984375, -0.61517333984375, -0.57861328125, -0.54205322265625, -0.5054931640625, -0.46893310546875, -0.432373046875, -0.39581298828125, -0.3592529296875, -0.32269287109375, -0.2861328125, -0.24957275390625, -0.2130126953125, -0.17645263671875, -0.139892578125, -0.10333251953125, -0.0667724609375, -0.03021240234375, 0.00634765625, 0.04290771484375, 0.0794677734375, 0.11602783203125, 0.152587890625, 0.18914794921875, 0.2257080078125, 0.26226806640625, 0.298828125, 0.33538818359375, 0.3719482421875, 0.40850830078125, 0.445068359375, 0.48162841796875, 0.5181884765625, 0.55474853515625, 0.59130859375, 0.62786865234375, 0.6644287109375, 0.70098876953125, 0.737548828125, 0.77410888671875, 0.8106689453125, 0.84722900390625, 0.8837890625, 0.92034912109375, 0.9569091796875, 0.99346923828125, 1.030029296875, 1.06658935546875, 1.1031494140625, 1.13970947265625, 1.17626953125, 1.21282958984375, 1.2493896484375, 1.28594970703125, 1.322509765625, 1.35906982421875, 1.3956298828125, 1.43218994140625, 1.46875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 12.0, 27.0, 22.0, 26.0, 25.0, 26.0, 38.0, 36.0, 55.0, 39.0, 43.0, 40.0, 50.0, 75.0, 57.0, 48.0, 54.0, 41.0, 29.0, 44.0, 41.0, 29.0, 23.0, 19.0, 13.0, 9.0, 15.0, 7.0, 4.0, 10.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9443359375, -0.9166183471679688, -0.8889007568359375, -0.8611831665039062, -0.833465576171875, -0.8057479858398438, -0.7780303955078125, -0.7503128051757812, -0.72259521484375, -0.6948776245117188, -0.6671600341796875, -0.6394424438476562, -0.611724853515625, -0.5840072631835938, -0.5562896728515625, -0.5285720825195312, -0.5008544921875, -0.47313690185546875, -0.4454193115234375, -0.41770172119140625, -0.389984130859375, -0.36226654052734375, -0.3345489501953125, -0.30683135986328125, -0.27911376953125, -0.25139617919921875, -0.2236785888671875, -0.19596099853515625, -0.168243408203125, -0.14052581787109375, -0.1128082275390625, -0.08509063720703125, -0.057373046875, -0.02965545654296875, -0.0019378662109375, 0.02577972412109375, 0.053497314453125, 0.08121490478515625, 0.1089324951171875, 0.13665008544921875, 0.16436767578125, 0.19208526611328125, 0.2198028564453125, 0.24752044677734375, 0.275238037109375, 0.30295562744140625, 0.3306732177734375, 0.35839080810546875, 0.3861083984375, 0.41382598876953125, 0.4415435791015625, 0.46926116943359375, 0.496978759765625, 0.5246963500976562, 0.5524139404296875, 0.5801315307617188, 0.60784912109375, 0.6355667114257812, 0.6632843017578125, 0.6910018920898438, 0.718719482421875, 0.7464370727539062, 0.7741546630859375, 0.8018722534179688, 0.82958984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 9.0, 14.0, 18.0, 22.0, 38.0, 48.0, 76.0, 130.0, 200.0, 394.0, 743.0, 1641.0, 4814.0, 33327.0, 3487256.0, 643389.0, 15830.0, 3496.0, 1349.0, 605.0, 347.0, 187.0, 108.0, 73.0, 52.0, 24.0, 15.0, 24.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.87628173828125, -3.7545166015625, -3.63275146484375, -3.510986328125, -3.38922119140625, -3.2674560546875, -3.14569091796875, -3.02392578125, -2.90216064453125, -2.7803955078125, -2.65863037109375, -2.536865234375, -2.41510009765625, -2.2933349609375, -2.17156982421875, -2.0498046875, -1.92803955078125, -1.8062744140625, -1.68450927734375, -1.562744140625, -1.44097900390625, -1.3192138671875, -1.19744873046875, -1.07568359375, -0.95391845703125, -0.8321533203125, -0.71038818359375, -0.588623046875, -0.46685791015625, -0.3450927734375, -0.22332763671875, -0.1015625, 0.02020263671875, 0.1419677734375, 0.26373291015625, 0.385498046875, 0.50726318359375, 0.6290283203125, 0.75079345703125, 0.87255859375, 0.99432373046875, 1.1160888671875, 1.23785400390625, 1.359619140625, 1.48138427734375, 1.6031494140625, 1.72491455078125, 1.8466796875, 1.96844482421875, 2.0902099609375, 2.21197509765625, 2.333740234375, 2.45550537109375, 2.5772705078125, 2.69903564453125, 2.82080078125, 2.94256591796875, 3.0643310546875, 3.18609619140625, 3.307861328125, 3.42962646484375, 3.5513916015625, 3.67315673828125, 3.794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 5.0, 16.0, 14.0, 21.0, 36.0, 46.0, 73.0, 108.0, 146.0, 208.0, 328.0, 430.0, 545.0, 509.0, 400.0, 319.0, 225.0, 166.0, 124.0, 92.0, 55.0, 50.0, 29.0, 24.0, 25.0, 15.0, 14.0, 3.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.03125, -1.958160400390625, -1.88507080078125, -1.811981201171875, -1.7388916015625, -1.665802001953125, -1.59271240234375, -1.519622802734375, -1.446533203125, -1.373443603515625, -1.30035400390625, -1.227264404296875, -1.1541748046875, -1.081085205078125, -1.00799560546875, -0.934906005859375, -0.86181640625, -0.788726806640625, -0.71563720703125, -0.642547607421875, -0.5694580078125, -0.496368408203125, -0.42327880859375, -0.350189208984375, -0.277099609375, -0.204010009765625, -0.13092041015625, -0.057830810546875, 0.0152587890625, 0.088348388671875, 0.16143798828125, 0.234527587890625, 0.3076171875, 0.380706787109375, 0.45379638671875, 0.526885986328125, 0.5999755859375, 0.673065185546875, 0.74615478515625, 0.819244384765625, 0.892333984375, 0.965423583984375, 1.03851318359375, 1.111602783203125, 1.1846923828125, 1.257781982421875, 1.33087158203125, 1.403961181640625, 1.47705078125, 1.550140380859375, 1.62322998046875, 1.696319580078125, 1.7694091796875, 1.842498779296875, 1.91558837890625, 1.988677978515625, 2.061767578125, 2.134857177734375, 2.20794677734375, 2.281036376953125, 2.3541259765625, 2.427215576171875, 2.50030517578125, 2.573394775390625, 2.646484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 8.0, 7.0, 22.0, 36.0, 66.0, 119.0, 232.0, 222.0, 147.0, 55.0, 34.0, 19.0, 12.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.069202423095703, -25.97530174255371, -24.88140106201172, -23.787500381469727, -22.693599700927734, -21.59969711303711, -20.505796432495117, -19.411895751953125, -18.317995071411133, -17.22409439086914, -16.13019371032715, -15.03629207611084, -13.942391395568848, -12.848490715026855, -11.754589080810547, -10.660688400268555, -9.566787719726562, -8.47288703918457, -7.37898588180542, -6.2850847244262695, -5.191184043884277, -4.097283363342285, -3.0033822059631348, -1.9094810485839844, -0.8155803680419922, 0.2783205509185791, 1.3722214698791504, 2.4661223888397217, 3.560023307800293, 4.653923988342285, 5.7478251457214355, 6.841726303100586, 7.935626983642578, 9.02952766418457, 10.123428344726562, 11.217329978942871, 12.311230659484863, 13.405131340026855, 14.499032974243164, 15.592933654785156, 16.68683433532715, 17.78073501586914, 18.874635696411133, 19.968536376953125, 21.06243896484375, 22.15633773803711, 23.250240325927734, 24.344141006469727, 25.43804168701172, 26.53194236755371, 27.625843048095703, 28.719743728637695, 29.813644409179688, 30.907546997070312, 32.00144577026367, 33.0953483581543, 34.189247131347656, 35.28314971923828, 36.37704849243164, 37.470951080322266, 38.564849853515625, 39.65875244140625, 40.75265121459961, 41.846553802490234, 42.94045639038086]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 7.0, 17.0, 17.0, 8.0, 18.0, 25.0, 15.0, 24.0, 21.0, 36.0, 32.0, 40.0, 36.0, 45.0, 42.0, 54.0, 58.0, 61.0, 53.0, 49.0, 39.0, 35.0, 27.0, 23.0, 36.0, 24.0, 29.0, 15.0, 13.0, 18.0, 12.0, 17.0, 4.0, 7.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.017311096191406, -14.561007499694824, -14.104703903198242, -13.648401260375977, -13.192097663879395, -12.735794067382812, -12.27949047088623, -11.823186874389648, -11.366883277893066, -10.910579681396484, -10.454276084899902, -9.99797248840332, -9.541669845581055, -9.085366249084473, -8.62906265258789, -8.172759056091309, -7.716455936431885, -7.260152339935303, -6.803849220275879, -6.347545623779297, -5.891242027282715, -5.434938430786133, -4.978635311126709, -4.522331714630127, -4.066028594970703, -3.6097252368927, -3.153421640396118, -2.6971182823181152, -2.240814685821533, -1.7845113277435303, -1.3282079696655273, -0.8719043731689453, -0.4156007766723633, 0.04070267081260681, 0.4970061182975769, 0.9533095359802246, 1.409613013267517, 1.8659164905548096, 2.3222198486328125, 2.7785234451293945, 3.2348268032073975, 3.6911301612854004, 4.147433757781982, 4.603736877441406, 5.060040473937988, 5.51634407043457, 5.972647666931152, 6.428951263427734, 6.885254383087158, 7.34155797958374, 7.797861099243164, 8.254164695739746, 8.710468292236328, 9.16677188873291, 9.623075485229492, 10.079378128051758, 10.53568172454834, 10.991985321044922, 11.448288917541504, 11.904592514038086, 12.360895156860352, 12.817198753356934, 13.273502349853516, 13.729805946350098, 14.18610954284668]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 11.0, 16.0, 11.0, 36.0, 49.0, 68.0, 110.0, 177.0, 266.0, 442.0, 849.0, 1585.0, 3361.0, 7566.0, 20300.0, 65552.0, 288216.0, 511094.0, 100767.0, 28941.0, 10323.0, 4307.0, 1975.0, 1088.0, 530.0, 327.0, 195.0, 124.0, 78.0, 40.0, 35.0, 19.0, 22.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.47198486328125, -1.4215087890625, -1.37103271484375, -1.320556640625, -1.27008056640625, -1.2196044921875, -1.16912841796875, -1.11865234375, -1.06817626953125, -1.0177001953125, -0.96722412109375, -0.916748046875, -0.86627197265625, -0.8157958984375, -0.76531982421875, -0.71484375, -0.66436767578125, -0.6138916015625, -0.56341552734375, -0.512939453125, -0.46246337890625, -0.4119873046875, -0.36151123046875, -0.31103515625, -0.26055908203125, -0.2100830078125, -0.15960693359375, -0.109130859375, -0.05865478515625, -0.0081787109375, 0.04229736328125, 0.0927734375, 0.14324951171875, 0.1937255859375, 0.24420166015625, 0.294677734375, 0.34515380859375, 0.3956298828125, 0.44610595703125, 0.49658203125, 0.54705810546875, 0.5975341796875, 0.64801025390625, 0.698486328125, 0.74896240234375, 0.7994384765625, 0.84991455078125, 0.900390625, 0.95086669921875, 1.0013427734375, 1.05181884765625, 1.102294921875, 1.15277099609375, 1.2032470703125, 1.25372314453125, 1.30419921875, 1.35467529296875, 1.4051513671875, 1.45562744140625, 1.506103515625, 1.55657958984375, 1.6070556640625, 1.65753173828125, 1.7080078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 17.0, 11.0, 33.0, 32.0, 36.0, 41.0, 47.0, 52.0, 65.0, 56.0, 71.0, 74.0, 70.0, 64.0, 74.0, 49.0, 36.0, 37.0, 17.0, 27.0, 16.0, 9.0, 13.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2172393798828125, -1.173736572265625, -1.1302337646484375, -1.08673095703125, -1.0432281494140625, -0.999725341796875, -0.9562225341796875, -0.9127197265625, -0.8692169189453125, -0.825714111328125, -0.7822113037109375, -0.73870849609375, -0.6952056884765625, -0.651702880859375, -0.6082000732421875, -0.564697265625, -0.5211944580078125, -0.477691650390625, -0.4341888427734375, -0.39068603515625, -0.3471832275390625, -0.303680419921875, -0.2601776123046875, -0.2166748046875, -0.1731719970703125, -0.129669189453125, -0.0861663818359375, -0.04266357421875, 0.0008392333984375, 0.044342041015625, 0.0878448486328125, 0.13134765625, 0.1748504638671875, 0.218353271484375, 0.2618560791015625, 0.30535888671875, 0.3488616943359375, 0.392364501953125, 0.4358673095703125, 0.4793701171875, 0.5228729248046875, 0.566375732421875, 0.6098785400390625, 0.65338134765625, 0.6968841552734375, 0.740386962890625, 0.7838897705078125, 0.827392578125, 0.8708953857421875, 0.914398193359375, 0.9579010009765625, 1.00140380859375, 1.0449066162109375, 1.088409423828125, 1.1319122314453125, 1.1754150390625, 1.2189178466796875, 1.262420654296875, 1.3059234619140625, 1.34942626953125, 1.3929290771484375, 1.436431884765625, 1.4799346923828125, 1.5234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 16.0, 25.0, 22.0, 37.0, 48.0, 68.0, 118.0, 199.0, 320.0, 615.0, 1335.0, 4374.0, 30102.0, 887942.0, 110053.0, 9457.0, 2136.0, 745.0, 414.0, 231.0, 91.0, 73.0, 35.0, 28.0, 22.0, 16.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.383514404296875, -2.29437255859375, -2.205230712890625, -2.1160888671875, -2.026947021484375, -1.93780517578125, -1.848663330078125, -1.759521484375, -1.670379638671875, -1.58123779296875, -1.492095947265625, -1.4029541015625, -1.313812255859375, -1.22467041015625, -1.135528564453125, -1.04638671875, -0.957244873046875, -0.86810302734375, -0.778961181640625, -0.6898193359375, -0.600677490234375, -0.51153564453125, -0.422393798828125, -0.333251953125, -0.244110107421875, -0.15496826171875, -0.065826416015625, 0.0233154296875, 0.112457275390625, 0.20159912109375, 0.290740966796875, 0.3798828125, 0.469024658203125, 0.55816650390625, 0.647308349609375, 0.7364501953125, 0.825592041015625, 0.91473388671875, 1.003875732421875, 1.093017578125, 1.182159423828125, 1.27130126953125, 1.360443115234375, 1.4495849609375, 1.538726806640625, 1.62786865234375, 1.717010498046875, 1.80615234375, 1.895294189453125, 1.98443603515625, 2.073577880859375, 2.1627197265625, 2.251861572265625, 2.34100341796875, 2.430145263671875, 2.519287109375, 2.608428955078125, 2.69757080078125, 2.786712646484375, 2.8758544921875, 2.964996337890625, 3.05413818359375, 3.143280029296875, 3.232421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 10.0, 5.0, 13.0, 14.0, 21.0, 22.0, 16.0, 19.0, 27.0, 21.0, 34.0, 40.0, 44.0, 40.0, 65.0, 89.0, 69.0, 73.0, 73.0, 51.0, 49.0, 33.0, 25.0, 23.0, 22.0, 18.0, 22.0, 12.0, 9.0, 4.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.252410888671875, -4.12591552734375, -3.999420166015625, -3.8729248046875, -3.746429443359375, -3.61993408203125, -3.493438720703125, -3.366943359375, -3.240447998046875, -3.11395263671875, -2.987457275390625, -2.8609619140625, -2.734466552734375, -2.60797119140625, -2.481475830078125, -2.35498046875, -2.228485107421875, -2.10198974609375, -1.975494384765625, -1.8489990234375, -1.722503662109375, -1.59600830078125, -1.469512939453125, -1.343017578125, -1.216522216796875, -1.09002685546875, -0.963531494140625, -0.8370361328125, -0.710540771484375, -0.58404541015625, -0.457550048828125, -0.3310546875, -0.204559326171875, -0.07806396484375, 0.048431396484375, 0.1749267578125, 0.301422119140625, 0.42791748046875, 0.554412841796875, 0.680908203125, 0.807403564453125, 0.93389892578125, 1.060394287109375, 1.1868896484375, 1.313385009765625, 1.43988037109375, 1.566375732421875, 1.69287109375, 1.819366455078125, 1.94586181640625, 2.072357177734375, 2.1988525390625, 2.325347900390625, 2.45184326171875, 2.578338623046875, 2.704833984375, 2.831329345703125, 2.95782470703125, 3.084320068359375, 3.2108154296875, 3.337310791015625, 3.46380615234375, 3.590301513671875, 3.716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 19.0, 29.0, 38.0, 71.0, 140.0, 292.0, 562.0, 1562.0, 5998.0, 37034.0, 911672.0, 77768.0, 9427.0, 2391.0, 736.0, 328.0, 168.0, 91.0, 62.0, 39.0, 13.0, 10.0, 7.0, 13.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.67333984375, -0.6533279418945312, -0.6333160400390625, -0.6133041381835938, -0.593292236328125, -0.5732803344726562, -0.5532684326171875, -0.5332565307617188, -0.51324462890625, -0.49323272705078125, -0.4732208251953125, -0.45320892333984375, -0.433197021484375, -0.41318511962890625, -0.3931732177734375, -0.37316131591796875, -0.3531494140625, -0.33313751220703125, -0.3131256103515625, -0.29311370849609375, -0.273101806640625, -0.25308990478515625, -0.2330780029296875, -0.21306610107421875, -0.19305419921875, -0.17304229736328125, -0.1530303955078125, -0.13301849365234375, -0.113006591796875, -0.09299468994140625, -0.0729827880859375, -0.05297088623046875, -0.032958984375, -0.01294708251953125, 0.0070648193359375, 0.02707672119140625, 0.047088623046875, 0.06710052490234375, 0.0871124267578125, 0.10712432861328125, 0.12713623046875, 0.14714813232421875, 0.1671600341796875, 0.18717193603515625, 0.207183837890625, 0.22719573974609375, 0.2472076416015625, 0.26721954345703125, 0.2872314453125, 0.30724334716796875, 0.3272552490234375, 0.34726715087890625, 0.367279052734375, 0.38729095458984375, 0.4073028564453125, 0.42731475830078125, 0.44732666015625, 0.46733856201171875, 0.4873504638671875, 0.5073623657226562, 0.527374267578125, 0.5473861694335938, 0.5673980712890625, 0.5874099731445312, 0.607421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 5.0, 11.0, 13.0, 7.0, 14.0, 12.0, 20.0, 31.0, 28.0, 53.0, 87.0, 88.0, 100.0, 101.0, 103.0, 70.0, 39.0, 37.0, 23.0, 22.0, 20.0, 19.0, 8.0, 11.0, 8.0, 7.0, 6.0, 4.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011773966252803802, -0.00011364743113517761, -0.0001095551997423172, -0.00010546296834945679, -0.00010137073695659637, -9.727850556373596e-05, -9.318627417087555e-05, -8.909404277801514e-05, -8.500181138515472e-05, -8.090957999229431e-05, -7.68173485994339e-05, -7.272511720657349e-05, -6.863288581371307e-05, -6.454065442085266e-05, -6.044842302799225e-05, -5.6356191635131836e-05, -5.226396024227142e-05, -4.817172884941101e-05, -4.40794974565506e-05, -3.9987266063690186e-05, -3.589503467082977e-05, -3.180280327796936e-05, -2.7710571885108948e-05, -2.3618340492248535e-05, -1.9526109099388123e-05, -1.543387770652771e-05, -1.1341646313667297e-05, -7.249414920806885e-06, -3.157183527946472e-06, 9.350478649139404e-07, 5.027279257774353e-06, 9.119510650634766e-06, 1.3211742043495178e-05, 1.730397343635559e-05, 2.1396204829216003e-05, 2.5488436222076416e-05, 2.958066761493683e-05, 3.367289900779724e-05, 3.7765130400657654e-05, 4.1857361793518066e-05, 4.594959318637848e-05, 5.004182457923889e-05, 5.4134055972099304e-05, 5.822628736495972e-05, 6.231851875782013e-05, 6.641075015068054e-05, 7.050298154354095e-05, 7.459521293640137e-05, 7.868744432926178e-05, 8.277967572212219e-05, 8.68719071149826e-05, 9.096413850784302e-05, 9.505636990070343e-05, 9.914860129356384e-05, 0.00010324083268642426, 0.00010733306407928467, 0.00011142529547214508, 0.00011551752686500549, 0.0001196097582578659, 0.00012370198965072632, 0.00012779422104358673, 0.00013188645243644714, 0.00013597868382930756, 0.00014007091522216797]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 16.0, 14.0, 33.0, 46.0, 80.0, 150.0, 264.0, 533.0, 1228.0, 3337.0, 12206.0, 72257.0, 874306.0, 66706.0, 11647.0, 3323.0, 1288.0, 488.0, 245.0, 146.0, 99.0, 48.0, 23.0, 9.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397216796875, -0.384185791015625, -0.37115478515625, -0.358123779296875, -0.3450927734375, -0.332061767578125, -0.31903076171875, -0.305999755859375, -0.29296875, -0.279937744140625, -0.26690673828125, -0.253875732421875, -0.2408447265625, -0.227813720703125, -0.21478271484375, -0.201751708984375, -0.188720703125, -0.175689697265625, -0.16265869140625, -0.149627685546875, -0.1365966796875, -0.123565673828125, -0.11053466796875, -0.097503662109375, -0.08447265625, -0.071441650390625, -0.05841064453125, -0.045379638671875, -0.0323486328125, -0.019317626953125, -0.00628662109375, 0.006744384765625, 0.019775390625, 0.032806396484375, 0.04583740234375, 0.058868408203125, 0.0718994140625, 0.084930419921875, 0.09796142578125, 0.110992431640625, 0.1240234375, 0.137054443359375, 0.15008544921875, 0.163116455078125, 0.1761474609375, 0.189178466796875, 0.20220947265625, 0.215240478515625, 0.228271484375, 0.241302490234375, 0.25433349609375, 0.267364501953125, 0.2803955078125, 0.293426513671875, 0.30645751953125, 0.319488525390625, 0.33251953125, 0.345550537109375, 0.35858154296875, 0.371612548828125, 0.3846435546875, 0.397674560546875, 0.41070556640625, 0.423736572265625, 0.436767578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 15.0, 20.0, 20.0, 37.0, 38.0, 59.0, 62.0, 74.0, 114.0, 107.0, 85.0, 72.0, 62.0, 38.0, 34.0, 23.0, 19.0, 15.0, 13.0, 12.0, 5.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.36083984375, -0.3484230041503906, -0.33600616455078125, -0.3235893249511719, -0.3111724853515625, -0.2987556457519531, -0.28633880615234375, -0.2739219665527344, -0.261505126953125, -0.24908828735351562, -0.23667144775390625, -0.22425460815429688, -0.2118377685546875, -0.19942092895507812, -0.18700408935546875, -0.17458724975585938, -0.16217041015625, -0.14975357055664062, -0.13733673095703125, -0.12491989135742188, -0.1125030517578125, -0.10008621215820312, -0.08766937255859375, -0.07525253295898438, -0.062835693359375, -0.050418853759765625, -0.03800201416015625, -0.025585174560546875, -0.0131683349609375, -0.000751495361328125, 0.01166534423828125, 0.024082183837890625, 0.0364990234375, 0.048915863037109375, 0.06133270263671875, 0.07374954223632812, 0.0861663818359375, 0.09858322143554688, 0.11100006103515625, 0.12341690063476562, 0.135833740234375, 0.14825057983398438, 0.16066741943359375, 0.17308425903320312, 0.1855010986328125, 0.19791793823242188, 0.21033477783203125, 0.22275161743164062, 0.23516845703125, 0.24758529663085938, 0.26000213623046875, 0.2724189758300781, 0.2848358154296875, 0.2972526550292969, 0.30966949462890625, 0.3220863342285156, 0.334503173828125, 0.3469200134277344, 0.35933685302734375, 0.3717536926269531, 0.3841705322265625, 0.3965873718261719, 0.40900421142578125, 0.4214210510253906, 0.433837890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 5.0, 37.0, 78.0, 378.0, 415.0, 71.0, 14.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.805763244628906, -48.72344970703125, -47.64113235473633, -46.55881881713867, -45.47650146484375, -44.394187927246094, -43.31187057495117, -42.229557037353516, -41.147239685058594, -40.06492614746094, -38.982608795166016, -37.90029525756836, -36.81797790527344, -35.73566436767578, -34.65334701538086, -33.5710334777832, -32.48871612548828, -31.406400680541992, -30.324085235595703, -29.241769790649414, -28.159454345703125, -27.077138900756836, -25.994823455810547, -24.91250991821289, -23.830196380615234, -22.747880935668945, -21.665565490722656, -20.583250045776367, -19.500934600830078, -18.41861915588379, -17.3363037109375, -16.253990173339844, -15.171670913696289, -14.08935546875, -13.007040023803711, -11.924724578857422, -10.842409133911133, -9.760093688964844, -8.677779197692871, -7.595463752746582, -6.513148307800293, -5.430832862854004, -4.348517417907715, -3.266202449798584, -2.183887004852295, -1.1015715599060059, -0.019256591796875, 1.063058853149414, 2.145374298095703, 3.227689743041992, 4.310005187988281, 5.392320156097412, 6.474635601043701, 7.55695104598999, 8.639266014099121, 9.72158145904541, 10.8038969039917, 11.886212348937988, 12.968527793884277, 14.05084228515625, 15.133157730102539, 16.215473175048828, 17.297788619995117, 18.380104064941406, 19.462419509887695]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 7.0, 7.0, 8.0, 6.0, 3.0, 15.0, 18.0, 20.0, 12.0, 15.0, 12.0, 17.0, 18.0, 19.0, 17.0, 25.0, 33.0, 126.0, 207.0, 133.0, 37.0, 23.0, 31.0, 24.0, 14.0, 20.0, 10.0, 16.0, 15.0, 13.0, 5.0, 9.0, 6.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.094806671142578, -8.814618110656738, -8.534429550170898, -8.254241943359375, -7.974053382873535, -7.693864822387695, -7.4136762619018555, -7.133487701416016, -6.853299617767334, -6.573111057281494, -6.2929229736328125, -6.012734413146973, -5.732545852661133, -5.452357769012451, -5.172169208526611, -4.89198112487793, -4.61179256439209, -4.33160400390625, -4.051415920257568, -3.7712273597717285, -3.4910390377044678, -3.210850715637207, -2.930662155151367, -2.6504738330841064, -2.3702855110168457, -2.090097188949585, -1.8099087476730347, -1.5297203063964844, -1.2495319843292236, -0.9693436622619629, -0.6891552209854126, -0.4089667797088623, -0.12877845764160156, 0.15140992403030396, 0.4315983057022095, 0.711786687374115, 0.9919750690460205, 1.2721633911132812, 1.5523518323898315, 1.8325402736663818, 2.1127285957336426, 2.3929169178009033, 2.673105239868164, 2.953293800354004, 3.2334821224212646, 3.5136704444885254, 3.7938590049743652, 4.074047088623047, 4.354235649108887, 4.634424209594727, 4.914612293243408, 5.194800853729248, 5.47498893737793, 5.7551774978637695, 6.035366058349609, 6.315554618835449, 6.595742702484131, 6.875931262969971, 7.156119346618652, 7.436307907104492, 7.716496467590332, 7.996684551239014, 8.276872634887695, 8.557061195373535, 8.837249755859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 13.0, 13.0, 22.0, 18.0, 17.0, 18.0, 29.0, 26.0, 27.0, 33.0, 41.0, 93.0, 237.0, 140.0, 52.0, 35.0, 36.0, 23.0, 21.0, 16.0, 16.0, 12.0, 9.0, 2.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.87091064453125, -0.8394775390625, -0.80804443359375, -0.776611328125, -0.74517822265625, -0.7137451171875, -0.68231201171875, -0.65087890625, -0.61944580078125, -0.5880126953125, -0.55657958984375, -0.525146484375, -0.49371337890625, -0.4622802734375, -0.43084716796875, -0.3994140625, -0.36798095703125, -0.3365478515625, -0.30511474609375, -0.273681640625, -0.24224853515625, -0.2108154296875, -0.17938232421875, -0.14794921875, -0.11651611328125, -0.0850830078125, -0.05364990234375, -0.022216796875, 0.00921630859375, 0.0406494140625, 0.07208251953125, 0.103515625, 0.13494873046875, 0.1663818359375, 0.19781494140625, 0.229248046875, 0.26068115234375, 0.2921142578125, 0.32354736328125, 0.35498046875, 0.38641357421875, 0.4178466796875, 0.44927978515625, 0.480712890625, 0.51214599609375, 0.5435791015625, 0.57501220703125, 0.6064453125, 0.63787841796875, 0.6693115234375, 0.70074462890625, 0.732177734375, 0.76361083984375, 0.7950439453125, 0.82647705078125, 0.85791015625, 0.88934326171875, 0.9207763671875, 0.95220947265625, 0.983642578125, 1.01507568359375, 1.0465087890625, 1.07794189453125, 1.109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 7.0, 4.0, 7.0, 6.0, 15.0, 19.0, 25.0, 40.0, 97.0, 215.0, 858.0, 7478.0, 8368660.0, 9792.0, 930.0, 224.0, 91.0, 34.0, 24.0, 12.0, 24.0, 8.0, 7.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.864316940307617, -17.375450134277344, -16.88658332824707, -16.397714614868164, -15.90884780883789, -15.419981002807617, -14.931114196777344, -14.44224739074707, -13.95337963104248, -13.464512825012207, -12.975645065307617, -12.486778259277344, -11.99791145324707, -11.50904369354248, -11.020176887512207, -10.531309127807617, -10.042442321777344, -9.55357551574707, -9.06470775604248, -8.575840950012207, -8.086973190307617, -7.598106384277344, -7.10923957824707, -6.620372295379639, -6.131505012512207, -5.642637729644775, -5.153770446777344, -4.66490364074707, -4.176036357879639, -3.687169075012207, -3.1983020305633545, -2.709434986114502, -2.2205677032470703, -1.7317005395889282, -1.2428333759307861, -0.753966212272644, -0.26509904861450195, 0.2237682342529297, 0.7126352787017822, 1.2015023231506348, 1.6903696060180664, 2.179236888885498, 2.6681039333343506, 3.156970977783203, 3.6458382606506348, 4.134705543518066, 4.62357234954834, 5.1124396324157715, 5.601306915283203, 6.090174198150635, 6.579041481018066, 7.06790828704834, 7.5567755699157715, 8.045642852783203, 8.534509658813477, 9.02337646484375, 9.51224422454834, 10.001111030578613, 10.489978790283203, 10.978845596313477, 11.46771240234375, 11.95658016204834, 12.445446968078613, 12.934314727783203, 13.423181533813477]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 8.0, 0.0, 6.0, 7.0, 1.0, 6.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9409661293029785, -5.722023963928223, -5.503082275390625, -5.284140110015869, -5.065197944641113, -4.846256256103516, -4.62731409072876, -4.408371925354004, -4.189430236816406, -3.9704883098602295, -3.7515463829040527, -3.532604217529297, -3.31366229057312, -3.0947203636169434, -2.8757781982421875, -2.6568362712860107, -2.437894344329834, -2.2189524173736572, -2.0000104904174805, -1.7810683250427246, -1.5621263980865479, -1.343184471130371, -1.1242424249649048, -0.9053003787994385, -0.6863584518432617, -0.4674164652824402, -0.24847447872161865, -0.02953249216079712, 0.18940949440002441, 0.40835142135620117, 0.6272934675216675, 0.8462355136871338, 1.0651779174804688, 1.2841198444366455, 1.5030618906021118, 1.7220039367675781, 1.9409458637237549, 2.1598877906799316, 2.3788299560546875, 2.5977718830108643, 2.816713809967041, 3.0356557369232178, 3.2545976638793945, 3.4735398292541504, 3.692481756210327, 3.911423683166504, 4.13036584854126, 4.349308013916016, 4.568249702453613, 4.787191867828369, 5.006133556365967, 5.225075721740723, 5.44401741027832, 5.662959575653076, 5.881901741027832, 6.10084342956543, 6.3197855949401855, 6.538727760314941, 6.757669448852539, 6.976611614227295, 7.195553779602051, 7.414495468139648, 7.633437633514404, 7.85237979888916, 8.071321487426758]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 26.0, 27.0, 44.0, 44.0, 106.0, 131.0, 238.0, 472.0, 1226.0, 4297.0, 17810.0, 85839.0, 269715.0, 111618.0, 23823.0, 5862.0, 1620.0, 602.0, 288.0, 142.0, 90.0, 63.0, 42.0, 50.0, 22.0, 11.0, 12.0, 8.0, 11.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5318603515625, -8.243408203125, -7.9549560546875, -7.66650390625, -7.3780517578125, -7.089599609375, -6.8011474609375, -6.5126953125, -6.2242431640625, -5.935791015625, -5.6473388671875, -5.35888671875, -5.0704345703125, -4.781982421875, -4.4935302734375, -4.205078125, -3.9166259765625, -3.628173828125, -3.3397216796875, -3.05126953125, -2.7628173828125, -2.474365234375, -2.1859130859375, -1.8974609375, -1.6090087890625, -1.320556640625, -1.0321044921875, -0.74365234375, -0.4552001953125, -0.166748046875, 0.1217041015625, 0.41015625, 0.6986083984375, 0.987060546875, 1.2755126953125, 1.56396484375, 1.8524169921875, 2.140869140625, 2.4293212890625, 2.7177734375, 3.0062255859375, 3.294677734375, 3.5831298828125, 3.87158203125, 4.1600341796875, 4.448486328125, 4.7369384765625, 5.025390625, 5.3138427734375, 5.602294921875, 5.8907470703125, 6.17919921875, 6.4676513671875, 6.756103515625, 7.0445556640625, 7.3330078125, 7.6214599609375, 7.909912109375, 8.1983642578125, 8.48681640625, 8.7752685546875, 9.063720703125, 9.3521728515625, 9.640625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 11.0, 19.0, 17.0, 27.0, 25.0, 41.0, 56.0, 62.0, 73.0, 90.0, 89.0, 83.0, 80.0, 75.0, 65.0, 44.0, 35.0, 21.0, 28.0, 17.0, 6.0, 5.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.407073974609375, -1.35906982421875, -1.311065673828125, -1.2630615234375, -1.215057373046875, -1.16705322265625, -1.119049072265625, -1.071044921875, -1.023040771484375, -0.97503662109375, -0.927032470703125, -0.8790283203125, -0.831024169921875, -0.78302001953125, -0.735015869140625, -0.68701171875, -0.639007568359375, -0.59100341796875, -0.542999267578125, -0.4949951171875, -0.446990966796875, -0.39898681640625, -0.350982666015625, -0.302978515625, -0.254974365234375, -0.20697021484375, -0.158966064453125, -0.1109619140625, -0.062957763671875, -0.01495361328125, 0.033050537109375, 0.0810546875, 0.129058837890625, 0.17706298828125, 0.225067138671875, 0.2730712890625, 0.321075439453125, 0.36907958984375, 0.417083740234375, 0.465087890625, 0.513092041015625, 0.56109619140625, 0.609100341796875, 0.6571044921875, 0.705108642578125, 0.75311279296875, 0.801116943359375, 0.84912109375, 0.897125244140625, 0.94512939453125, 0.993133544921875, 1.0411376953125, 1.089141845703125, 1.13714599609375, 1.185150146484375, 1.233154296875, 1.281158447265625, 1.32916259765625, 1.377166748046875, 1.4251708984375, 1.473175048828125, 1.52117919921875, 1.569183349609375, 1.6171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 9.0, 17.0, 99.0, 217.0, 88.0, 22.0, 11.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.651233673095703, -11.055516242980957, -10.459798812866211, -9.864081382751465, -9.268363952636719, -8.672646522521973, -8.076929092407227, -7.481212139129639, -6.885494709014893, -6.2897772789001465, -5.6940598487854, -5.0983428955078125, -4.502625465393066, -3.906907796859741, -3.311190605163574, -2.715473175048828, -2.119755744934082, -1.524038314819336, -0.9283210039138794, -0.33260369300842285, 0.26311373710632324, 0.8588311672210693, 1.4545483589172363, 2.0502657890319824, 2.6459832191467285, 3.2417006492614746, 3.8374180793762207, 4.433135032653809, 5.028852462768555, 5.624569892883301, 6.220287322998047, 6.816004753112793, 7.411722183227539, 8.007439613342285, 8.603157043457031, 9.198874473571777, 9.794591903686523, 10.39030933380127, 10.986026763916016, 11.581743240356445, 12.177461624145508, 12.773179054260254, 13.368896484375, 13.964613914489746, 14.560331344604492, 15.156048774719238, 15.751766204833984, 16.347482681274414, 16.943199157714844, 17.538915634155273, 18.134634017944336, 18.730350494384766, 19.326068878173828, 19.921785354614258, 20.51750373840332, 21.11322021484375, 21.708938598632812, 22.304655075073242, 22.900373458862305, 23.496089935302734, 24.091808319091797, 24.687524795532227, 25.28324317932129, 25.87895965576172, 26.47467803955078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 5.0, 6.0, 9.0, 16.0, 29.0, 86.0, 130.0, 89.0, 36.0, 13.0, 12.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.590359687805176, -8.335735321044922, -8.081110954284668, -7.826486587524414, -7.57186222076416, -7.317237854003906, -7.062613487243652, -6.807989120483398, -6.5533647537231445, -6.298740386962891, -6.044116020202637, -5.789491653442383, -5.534867286682129, -5.280242919921875, -5.025618553161621, -4.770994186401367, -4.516369819641113, -4.261745452880859, -4.0071210861206055, -3.7524967193603516, -3.4978723526000977, -3.2432479858398438, -2.98862361907959, -2.733999252319336, -2.479374885559082, -2.224750518798828, -1.9701261520385742, -1.7155017852783203, -1.4608774185180664, -1.2062530517578125, -0.9516286849975586, -0.6970043182373047, -0.4423809051513672, -0.18775653839111328, 0.06686782836914062, 0.32149219512939453, 0.5761165618896484, 0.8307409286499023, 1.0853652954101562, 1.3399896621704102, 1.594614028930664, 1.849238395690918, 2.103862762451172, 2.358487129211426, 2.6131114959716797, 2.8677358627319336, 3.1223602294921875, 3.3769845962524414, 3.6316089630126953, 3.886233329772949, 4.140857696533203, 4.395482063293457, 4.650106430053711, 4.904730796813965, 5.159355163574219, 5.413979530334473, 5.668603897094727, 5.9232282638549805, 6.177852630615234, 6.432476997375488, 6.687101364135742, 6.941725730895996, 7.19635009765625, 7.450974464416504, 7.705598831176758]}, "eval/loss": 4.2075958251953125, "eval/wer": 1.9032526775089251, "eval/runtime": 947.3446, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349, "train/train_runtime": 8514.9113, "train/train_samples_per_second": 3.352, "train/train_steps_per_second": 0.21, "train/total_flos": 0.0, "train/train_loss": 4.24715919291492} \ No newline at end of file