diff --git "a/wandb/run-20220317_164055-2lyj41rg/files/wandb-summary.json" "b/wandb/run-20220317_164055-2lyj41rg/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220317_164055-2lyj41rg/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 3.5335, "train/learning_rate": 9.11104513064133e-05, "train/epoch": 2.8, "train/global_step": 2500, "_runtime": 16192, "_timestamp": 1647551447, "_step": 2500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 36.0, 96.0, 211.0, 288.0, 223.0, 96.0, 46.0, 11.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.11555480957031, -36.23134231567383, -33.347129821777344, -30.462919235229492, -27.57870864868164, -24.694496154785156, -21.810283660888672, -18.92607307434082, -16.041860580444336, -13.157649040222168, -10.2734375, -7.389225006103516, -4.505013465881348, -1.6208019256591797, 1.2634105682373047, 4.147621154785156, 7.031833648681641, 9.916045188903809, 12.800256729125977, 15.684469223022461, 18.568679809570312, 21.452892303466797, 24.33710479736328, 27.221315383911133, 30.105527877807617, 32.98973846435547, 35.87395095825195, 38.75816345214844, 41.64237594604492, 44.526588439941406, 47.410797119140625, 50.29500961303711, 53.179222106933594, 56.06343460083008, 58.94764709472656, 61.83185577392578, 64.71607208251953, 67.60028076171875, 70.4844970703125, 73.36870574951172, 76.25291442871094, 79.13712310791016, 82.0213394165039, 84.90554809570312, 87.78976440429688, 90.6739730834961, 93.55818176269531, 96.44239807128906, 99.32661437988281, 102.21082305908203, 105.09503936767578, 107.979248046875, 110.86346435546875, 113.74767303466797, 116.63188171386719, 119.51609802246094, 122.40030670166016, 125.28451538085938, 128.16873168945312, 131.05294799804688, 133.93714904785156, 136.8213653564453, 139.70558166503906, 142.58978271484375, 145.4739990234375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 9.0, 13.0, 9.0, 16.0, 14.0, 23.0, 30.0, 30.0, 37.0, 49.0, 56.0, 59.0, 61.0, 48.0, 58.0, 53.0, 70.0, 60.0, 50.0, 46.0, 41.0, 27.0, 27.0, 21.0, 21.0, 11.0, 17.0, 9.0, 9.0, 9.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.068206787109375, -58.92543411254883, -56.782657623291016, -54.63988494873047, -52.497108459472656, -50.35433578491211, -48.21156311035156, -46.06878662109375, -43.92601013183594, -41.78323745727539, -39.64046096801758, -37.49768829345703, -35.35491180419922, -33.21213912963867, -31.069364547729492, -28.926589965820312, -26.783817291259766, -24.641042709350586, -22.498268127441406, -20.35549545288086, -18.212718963623047, -16.0699462890625, -13.92717170715332, -11.78439712524414, -9.641622543334961, -7.498847961425781, -5.35607385635376, -3.2132997512817383, -1.0705251693725586, 1.072249412536621, 3.2150230407714844, 5.357797622680664, 7.500572204589844, 9.643346786499023, 11.786121368408203, 13.928894996643066, 16.071670532226562, 18.21444320678711, 20.35721778869629, 22.49999237060547, 24.64276695251465, 26.785541534423828, 28.928316116333008, 31.071090698242188, 33.213863372802734, 35.35663986206055, 37.499412536621094, 39.642189025878906, 41.78496170043945, 43.927734375, 46.07051086425781, 48.21328353881836, 50.35606002807617, 52.49883270263672, 54.64160919189453, 56.78438186645508, 58.927154541015625, 61.06992721557617, 63.212703704833984, 65.35547637939453, 67.49825286865234, 69.64102935791016, 71.78379821777344, 73.92657470703125, 76.06935119628906]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 16.0, 13.0, 21.0, 21.0, 25.0, 27.0, 36.0, 52.0, 57.0, 54.0, 44.0, 56.0, 47.0, 64.0, 59.0, 58.0, 54.0, 52.0, 40.0, 33.0, 34.0, 20.0, 20.0, 18.0, 13.0, 11.0, 10.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.470703125, -2.37811279296875, -2.2855224609375, -2.19293212890625, -2.100341796875, -2.00775146484375, -1.9151611328125, -1.82257080078125, -1.72998046875, -1.63739013671875, -1.5447998046875, -1.45220947265625, -1.359619140625, -1.26702880859375, -1.1744384765625, -1.08184814453125, -0.9892578125, -0.89666748046875, -0.8040771484375, -0.71148681640625, -0.618896484375, -0.52630615234375, -0.4337158203125, -0.34112548828125, -0.24853515625, -0.15594482421875, -0.0633544921875, 0.02923583984375, 0.121826171875, 0.21441650390625, 0.3070068359375, 0.39959716796875, 0.4921875, 0.58477783203125, 0.6773681640625, 0.76995849609375, 0.862548828125, 0.95513916015625, 1.0477294921875, 1.14031982421875, 1.23291015625, 1.32550048828125, 1.4180908203125, 1.51068115234375, 1.603271484375, 1.69586181640625, 1.7884521484375, 1.88104248046875, 1.9736328125, 2.06622314453125, 2.1588134765625, 2.25140380859375, 2.343994140625, 2.43658447265625, 2.5291748046875, 2.62176513671875, 2.71435546875, 2.80694580078125, 2.8995361328125, 2.99212646484375, 3.084716796875, 3.17730712890625, 3.2698974609375, 3.36248779296875, 3.455078125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 7.0, 12.0, 9.0, 28.0, 33.0, 48.0, 68.0, 113.0, 177.0, 320.0, 591.0, 1197.0, 2642.0, 8050.0, 44264.0, 730384.0, 3160905.0, 216940.0, 20565.0, 4583.0, 1598.0, 704.0, 432.0, 237.0, 118.0, 76.0, 62.0, 40.0, 26.0, 13.0, 15.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.2286376953125, -9.824462890625, -9.4202880859375, -9.01611328125, -8.6119384765625, -8.207763671875, -7.8035888671875, -7.3994140625, -6.9952392578125, -6.591064453125, -6.1868896484375, -5.78271484375, -5.3785400390625, -4.974365234375, -4.5701904296875, -4.166015625, -3.7618408203125, -3.357666015625, -2.9534912109375, -2.54931640625, -2.1451416015625, -1.740966796875, -1.3367919921875, -0.9326171875, -0.5284423828125, -0.124267578125, 0.2799072265625, 0.68408203125, 1.0882568359375, 1.492431640625, 1.8966064453125, 2.30078125, 2.7049560546875, 3.109130859375, 3.5133056640625, 3.91748046875, 4.3216552734375, 4.725830078125, 5.1300048828125, 5.5341796875, 5.9383544921875, 6.342529296875, 6.7467041015625, 7.15087890625, 7.5550537109375, 7.959228515625, 8.3634033203125, 8.767578125, 9.1717529296875, 9.575927734375, 9.9801025390625, 10.38427734375, 10.7884521484375, 11.192626953125, 11.5968017578125, 12.0009765625, 12.4051513671875, 12.809326171875, 13.2135009765625, 13.61767578125, 14.0218505859375, 14.426025390625, 14.8302001953125, 15.234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 17.0, 30.0, 42.0, 52.0, 90.0, 106.0, 159.0, 291.0, 391.0, 534.0, 581.0, 508.0, 373.0, 310.0, 183.0, 126.0, 98.0, 51.0, 35.0, 24.0, 15.0, 12.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1796875, -9.8216552734375, -9.463623046875, -9.1055908203125, -8.74755859375, -8.3895263671875, -8.031494140625, -7.6734619140625, -7.3154296875, -6.9573974609375, -6.599365234375, -6.2413330078125, -5.88330078125, -5.5252685546875, -5.167236328125, -4.8092041015625, -4.451171875, -4.0931396484375, -3.735107421875, -3.3770751953125, -3.01904296875, -2.6610107421875, -2.302978515625, -1.9449462890625, -1.5869140625, -1.2288818359375, -0.870849609375, -0.5128173828125, -0.15478515625, 0.2032470703125, 0.561279296875, 0.9193115234375, 1.27734375, 1.6353759765625, 1.993408203125, 2.3514404296875, 2.70947265625, 3.0675048828125, 3.425537109375, 3.7835693359375, 4.1416015625, 4.4996337890625, 4.857666015625, 5.2156982421875, 5.57373046875, 5.9317626953125, 6.289794921875, 6.6478271484375, 7.005859375, 7.3638916015625, 7.721923828125, 8.0799560546875, 8.43798828125, 8.7960205078125, 9.154052734375, 9.5120849609375, 9.8701171875, 10.2281494140625, 10.586181640625, 10.9442138671875, 11.30224609375, 11.6602783203125, 12.018310546875, 12.3763427734375, 12.734375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 10.0, 20.0, 36.0, 56.0, 103.0, 157.0, 269.0, 450.0, 792.0, 1711.0, 4981.0, 54911.0, 3484976.0, 627524.0, 12715.0, 2829.0, 1191.0, 648.0, 372.0, 178.0, 115.0, 71.0, 37.0, 31.0, 22.0, 8.0, 9.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.328125, -29.273681640625, -28.21923828125, -27.164794921875, -26.1103515625, -25.055908203125, -24.00146484375, -22.947021484375, -21.892578125, -20.838134765625, -19.78369140625, -18.729248046875, -17.6748046875, -16.620361328125, -15.56591796875, -14.511474609375, -13.45703125, -12.402587890625, -11.34814453125, -10.293701171875, -9.2392578125, -8.184814453125, -7.13037109375, -6.075927734375, -5.021484375, -3.967041015625, -2.91259765625, -1.858154296875, -0.8037109375, 0.250732421875, 1.30517578125, 2.359619140625, 3.4140625, 4.468505859375, 5.52294921875, 6.577392578125, 7.6318359375, 8.686279296875, 9.74072265625, 10.795166015625, 11.849609375, 12.904052734375, 13.95849609375, 15.012939453125, 16.0673828125, 17.121826171875, 18.17626953125, 19.230712890625, 20.28515625, 21.339599609375, 22.39404296875, 23.448486328125, 24.5029296875, 25.557373046875, 26.61181640625, 27.666259765625, 28.720703125, 29.775146484375, 30.82958984375, 31.884033203125, 32.9384765625, 33.992919921875, 35.04736328125, 36.101806640625, 37.15625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 18.0, 28.0, 49.0, 63.0, 115.0, 130.0, 153.0, 151.0, 110.0, 83.0, 48.0, 33.0, 13.0, 6.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.08479309082031, -38.850040435791016, -37.61528778076172, -36.38053894042969, -35.14578628540039, -33.911033630371094, -32.6762809753418, -31.4415283203125, -30.206777572631836, -28.97202491760254, -27.737274169921875, -26.502521514892578, -25.26776885986328, -24.033018112182617, -22.79826545715332, -21.563514709472656, -20.32876205444336, -19.094009399414062, -17.8592586517334, -16.6245059967041, -15.389754295349121, -14.15500259399414, -12.920249938964844, -11.685498237609863, -10.450746536254883, -9.215994834899902, -7.981242656707764, -6.746490478515625, -5.5117387771606445, -4.276987075805664, -3.0422348976135254, -1.8074827194213867, -0.5727272033691406, 0.662024736404419, 1.8967766761779785, 3.131528615951538, 4.366280555725098, 5.601032257080078, 6.835784435272217, 8.070536613464355, 9.305288314819336, 10.540040016174316, 11.774791717529297, 13.009544372558594, 14.244296073913574, 15.479047775268555, 16.71380043029785, 17.948551177978516, 19.183303833007812, 20.41805648803711, 21.652807235717773, 22.88755989074707, 24.122310638427734, 25.35706329345703, 26.591815948486328, 27.826568603515625, 29.06131935119629, 30.296072006225586, 31.53082275390625, 32.76557540893555, 34.000328063964844, 35.235076904296875, 36.46982955932617, 37.70458221435547, 38.939334869384766]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 13.0, 7.0, 6.0, 8.0, 14.0, 16.0, 17.0, 25.0, 19.0, 22.0, 32.0, 28.0, 27.0, 36.0, 33.0, 28.0, 45.0, 49.0, 42.0, 45.0, 39.0, 41.0, 40.0, 41.0, 35.0, 35.0, 36.0, 28.0, 24.0, 21.0, 28.0, 23.0, 12.0, 10.0, 18.0, 9.0, 6.0, 14.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.25507354736328, -33.261024475097656, -32.26697540283203, -31.272924423217773, -30.278873443603516, -29.28482437133789, -28.290775299072266, -27.296724319458008, -26.302675247192383, -25.308626174926758, -24.3145751953125, -23.320526123046875, -22.326475143432617, -21.332426071166992, -20.338375091552734, -19.34432601928711, -18.350276947021484, -17.35622787475586, -16.3621768951416, -15.368127822875977, -14.374077796936035, -13.380027770996094, -12.385977745056152, -11.391927719116211, -10.397876739501953, -9.403826713562012, -8.40977668762207, -7.415727138519287, -6.421677589416504, -5.4276275634765625, -4.433577537536621, -3.439527988433838, -2.4454784393310547, -1.4514286518096924, -0.4573787450790405, 0.5366711616516113, 1.5307209491729736, 2.524770736694336, 3.5188207626342773, 4.5128703117370605, 5.506920337677002, 6.500970363616943, 7.495019912719727, 8.489069938659668, 9.48311996459961, 10.477169036865234, 11.471220016479492, 12.465269088745117, 13.459319114685059, 14.453369140625, 15.447419166564941, 16.441469192504883, 17.435518264770508, 18.429569244384766, 19.42361831665039, 20.417667388916016, 21.411718368530273, 22.4057674407959, 23.399818420410156, 24.39386749267578, 25.38791847229004, 26.381967544555664, 27.376018524169922, 28.370067596435547, 29.364116668701172]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 12.0, 13.0, 11.0, 18.0, 26.0, 24.0, 25.0, 26.0, 37.0, 42.0, 30.0, 30.0, 42.0, 39.0, 32.0, 45.0, 40.0, 36.0, 53.0, 42.0, 39.0, 42.0, 33.0, 34.0, 23.0, 23.0, 14.0, 22.0, 28.0, 17.0, 8.0, 11.0, 12.0, 11.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-2.28125, -2.211761474609375, -2.14227294921875, -2.072784423828125, -2.0032958984375, -1.933807373046875, -1.86431884765625, -1.794830322265625, -1.725341796875, -1.655853271484375, -1.58636474609375, -1.516876220703125, -1.4473876953125, -1.377899169921875, -1.30841064453125, -1.238922119140625, -1.16943359375, -1.099945068359375, -1.03045654296875, -0.960968017578125, -0.8914794921875, -0.821990966796875, -0.75250244140625, -0.683013916015625, -0.613525390625, -0.544036865234375, -0.47454833984375, -0.405059814453125, -0.3355712890625, -0.266082763671875, -0.19659423828125, -0.127105712890625, -0.0576171875, 0.011871337890625, 0.08135986328125, 0.150848388671875, 0.2203369140625, 0.289825439453125, 0.35931396484375, 0.428802490234375, 0.498291015625, 0.567779541015625, 0.63726806640625, 0.706756591796875, 0.7762451171875, 0.845733642578125, 0.91522216796875, 0.984710693359375, 1.05419921875, 1.123687744140625, 1.19317626953125, 1.262664794921875, 1.3321533203125, 1.401641845703125, 1.47113037109375, 1.540618896484375, 1.610107421875, 1.679595947265625, 1.74908447265625, 1.818572998046875, 1.8880615234375, 1.957550048828125, 2.02703857421875, 2.096527099609375, 2.166015625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 16.0, 6.0, 18.0, 35.0, 47.0, 73.0, 128.0, 202.0, 326.0, 513.0, 924.0, 1448.0, 2476.0, 4131.0, 7087.0, 11576.0, 19880.0, 32541.0, 52855.0, 82710.0, 120564.0, 155424.0, 165842.0, 133554.0, 95728.0, 62484.0, 38829.0, 23510.0, 14496.0, 8494.0, 5037.0, 2985.0, 1829.0, 1093.0, 617.0, 415.0, 244.0, 142.0, 97.0, 62.0, 39.0, 34.0, 13.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6675567626953125, -0.646148681640625, -0.6247406005859375, -0.60333251953125, -0.5819244384765625, -0.560516357421875, -0.5391082763671875, -0.5177001953125, -0.4962921142578125, -0.474884033203125, -0.4534759521484375, -0.43206787109375, -0.4106597900390625, -0.389251708984375, -0.3678436279296875, -0.346435546875, -0.3250274658203125, -0.303619384765625, -0.2822113037109375, -0.26080322265625, -0.2393951416015625, -0.217987060546875, -0.1965789794921875, -0.1751708984375, -0.1537628173828125, -0.132354736328125, -0.1109466552734375, -0.08953857421875, -0.0681304931640625, -0.046722412109375, -0.0253143310546875, -0.00390625, 0.0175018310546875, 0.038909912109375, 0.0603179931640625, 0.08172607421875, 0.1031341552734375, 0.124542236328125, 0.1459503173828125, 0.1673583984375, 0.1887664794921875, 0.210174560546875, 0.2315826416015625, 0.25299072265625, 0.2743988037109375, 0.295806884765625, 0.3172149658203125, 0.338623046875, 0.3600311279296875, 0.381439208984375, 0.4028472900390625, 0.42425537109375, 0.4456634521484375, 0.467071533203125, 0.4884796142578125, 0.5098876953125, 0.5312957763671875, 0.552703857421875, 0.5741119384765625, 0.59552001953125, 0.6169281005859375, 0.638336181640625, 0.6597442626953125, 0.68115234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [6.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 10.0, 7.0, 9.0, 18.0, 8.0, 24.0, 21.0, 16.0, 21.0, 27.0, 22.0, 29.0, 40.0, 30.0, 32.0, 30.0, 33.0, 41.0, 42.0, 36.0, 1061.0, 28.0, 26.0, 33.0, 32.0, 28.0, 28.0, 25.0, 21.0, 27.0, 18.0, 24.0, 21.0, 16.0, 16.0, 16.0, 16.0, 11.0, 8.0, 6.0, 7.0, 10.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.2993621826171875, -1.253021240234375, -1.2066802978515625, -1.16033935546875, -1.1139984130859375, -1.067657470703125, -1.0213165283203125, -0.9749755859375, -0.9286346435546875, -0.882293701171875, -0.8359527587890625, -0.78961181640625, -0.7432708740234375, -0.696929931640625, -0.6505889892578125, -0.604248046875, -0.5579071044921875, -0.511566162109375, -0.4652252197265625, -0.41888427734375, -0.3725433349609375, -0.326202392578125, -0.2798614501953125, -0.2335205078125, -0.1871795654296875, -0.140838623046875, -0.0944976806640625, -0.04815673828125, -0.0018157958984375, 0.044525146484375, 0.0908660888671875, 0.13720703125, 0.1835479736328125, 0.229888916015625, 0.2762298583984375, 0.32257080078125, 0.3689117431640625, 0.415252685546875, 0.4615936279296875, 0.5079345703125, 0.5542755126953125, 0.600616455078125, 0.6469573974609375, 0.69329833984375, 0.7396392822265625, 0.785980224609375, 0.8323211669921875, 0.878662109375, 0.9250030517578125, 0.971343994140625, 1.0176849365234375, 1.06402587890625, 1.1103668212890625, 1.156707763671875, 1.2030487060546875, 1.2493896484375, 1.2957305908203125, 1.342071533203125, 1.3884124755859375, 1.43475341796875, 1.4810943603515625, 1.527435302734375, 1.5737762451171875, 1.6201171875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 14.0, 11.0, 23.0, 59.0, 61.0, 122.0, 125.0, 238.0, 363.0, 594.0, 912.0, 1456.0, 2331.0, 3981.0, 6404.0, 10669.0, 17615.0, 28961.0, 45920.0, 71746.0, 109746.0, 206616.0, 904621.0, 330691.0, 129340.0, 82784.0, 54321.0, 33937.0, 20691.0, 12764.0, 7592.0, 4723.0, 2926.0, 1789.0, 1105.0, 715.0, 390.0, 285.0, 187.0, 99.0, 59.0, 43.0, 33.0, 18.0, 8.0, 13.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2464599609375, -0.23891639709472656, -0.23137283325195312, -0.2238292694091797, -0.21628570556640625, -0.2087421417236328, -0.20119857788085938, -0.19365501403808594, -0.1861114501953125, -0.17856788635253906, -0.17102432250976562, -0.1634807586669922, -0.15593719482421875, -0.1483936309814453, -0.14085006713867188, -0.13330650329589844, -0.125762939453125, -0.11821937561035156, -0.11067581176757812, -0.10313224792480469, -0.09558868408203125, -0.08804512023925781, -0.08050155639648438, -0.07295799255371094, -0.0654144287109375, -0.05787086486816406, -0.050327301025390625, -0.04278373718261719, -0.03524017333984375, -0.027696609497070312, -0.020153045654296875, -0.012609481811523438, -0.00506591796875, 0.0024776458740234375, 0.010021209716796875, 0.017564773559570312, 0.02510833740234375, 0.03265190124511719, 0.040195465087890625, 0.04773902893066406, 0.0552825927734375, 0.06282615661621094, 0.07036972045898438, 0.07791328430175781, 0.08545684814453125, 0.09300041198730469, 0.10054397583007812, 0.10808753967285156, 0.115631103515625, 0.12317466735839844, 0.13071823120117188, 0.1382617950439453, 0.14580535888671875, 0.1533489227294922, 0.16089248657226562, 0.16843605041503906, 0.1759796142578125, 0.18352317810058594, 0.19106674194335938, 0.1986103057861328, 0.20615386962890625, 0.2136974334716797, 0.22124099731445312, 0.22878456115722656, 0.236328125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 1.0, 1.0, 4.0, 1.0, 7.0, 0.0, 7.0, 6.0, 13.0, 14.0, 6.0, 28.0, 13.0, 24.0, 21.0, 31.0, 52.0, 46.0, 64.0, 61.0, 56.0, 76.0, 83.0, 58.0, 63.0, 49.0, 32.0, 30.0, 27.0, 26.0, 15.0, 16.0, 13.0, 8.0, 9.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1512451171875, -0.14711666107177734, -0.1429882049560547, -0.13885974884033203, -0.13473129272460938, -0.13060283660888672, -0.12647438049316406, -0.1223459243774414, -0.11821746826171875, -0.1140890121459961, -0.10996055603027344, -0.10583209991455078, -0.10170364379882812, -0.09757518768310547, -0.09344673156738281, -0.08931827545166016, -0.0851898193359375, -0.08106136322021484, -0.07693290710449219, -0.07280445098876953, -0.06867599487304688, -0.06454753875732422, -0.06041908264160156, -0.056290626525878906, -0.05216217041015625, -0.048033714294433594, -0.04390525817871094, -0.03977680206298828, -0.035648345947265625, -0.03151988983154297, -0.027391433715820312, -0.023262977600097656, -0.019134521484375, -0.015006065368652344, -0.010877609252929688, -0.006749153137207031, -0.002620697021484375, 0.0015077590942382812, 0.0056362152099609375, 0.009764671325683594, 0.01389312744140625, 0.018021583557128906, 0.022150039672851562, 0.02627849578857422, 0.030406951904296875, 0.03453540802001953, 0.03866386413574219, 0.042792320251464844, 0.0469207763671875, 0.051049232482910156, 0.05517768859863281, 0.05930614471435547, 0.06343460083007812, 0.06756305694580078, 0.07169151306152344, 0.0758199691772461, 0.07994842529296875, 0.0840768814086914, 0.08820533752441406, 0.09233379364013672, 0.09646224975585938, 0.10059070587158203, 0.10471916198730469, 0.10884761810302734, 0.11297607421875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 7.0, 8.0, 5.0, 6.0, 7.0, 16.0, 17.0, 16.0, 16.0, 24.0, 38.0, 49.0, 65.0, 95.0, 116.0, 164.0, 269.0, 322.0, 531.0, 8613.0, 1025851.0, 10565.0, 555.0, 321.0, 218.0, 170.0, 120.0, 90.0, 48.0, 50.0, 34.0, 28.0, 20.0, 24.0, 12.0, 12.0, 7.0, 9.0, 5.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.119140625, -3.033721923828125, -2.94830322265625, -2.862884521484375, -2.7774658203125, -2.692047119140625, -2.60662841796875, -2.521209716796875, -2.435791015625, -2.350372314453125, -2.26495361328125, -2.179534912109375, -2.0941162109375, -2.008697509765625, -1.92327880859375, -1.837860107421875, -1.75244140625, -1.667022705078125, -1.58160400390625, -1.496185302734375, -1.4107666015625, -1.325347900390625, -1.23992919921875, -1.154510498046875, -1.069091796875, -0.983673095703125, -0.89825439453125, -0.812835693359375, -0.7274169921875, -0.641998291015625, -0.55657958984375, -0.471160888671875, -0.3857421875, -0.300323486328125, -0.21490478515625, -0.129486083984375, -0.0440673828125, 0.041351318359375, 0.12677001953125, 0.212188720703125, 0.297607421875, 0.383026123046875, 0.46844482421875, 0.553863525390625, 0.6392822265625, 0.724700927734375, 0.81011962890625, 0.895538330078125, 0.98095703125, 1.066375732421875, 1.15179443359375, 1.237213134765625, 1.3226318359375, 1.408050537109375, 1.49346923828125, 1.578887939453125, 1.664306640625, 1.749725341796875, 1.83514404296875, 1.920562744140625, 2.0059814453125, 2.091400146484375, 2.17681884765625, 2.262237548828125, 2.34765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 17.0, 33.0, 61.0, 144.0, 399.0, 195.0, 74.0, 41.0, 25.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2582298517227173, -1.2306880950927734, -1.2031463384628296, -1.1756045818328857, -1.148062825202942, -1.120521068572998, -1.0929794311523438, -1.0654375553131104, -1.037895917892456, -1.0103541612625122, -0.9828124046325684, -0.9552706480026245, -0.9277289509773254, -0.9001871943473816, -0.8726454377174377, -0.8451036810874939, -0.8175618648529053, -0.7900201082229614, -0.7624783515930176, -0.7349365949630737, -0.7073948979377747, -0.6798531413078308, -0.652311384677887, -0.6247696280479431, -0.597227931022644, -0.5696861743927002, -0.5421444177627563, -0.5146026611328125, -0.48706093430519104, -0.4595192074775696, -0.43197745084762573, -0.4044356942176819, -0.37689393758773804, -0.3493521809577942, -0.32181045413017273, -0.2942686975002289, -0.26672694087028503, -0.23918519914150238, -0.21164345741271973, -0.18410170078277588, -0.15655995905399323, -0.12901821732521057, -0.10147646069526672, -0.07393471896648407, -0.04639296978712082, -0.01885122060775757, 0.008690521121025085, 0.03623227775096893, 0.06377401947975159, 0.09131576865911484, 0.11885751783847809, 0.14639925956726074, 0.1739410161972046, 0.20148275792598724, 0.2290244996547699, 0.25656625628471375, 0.2841079831123352, 0.31164973974227905, 0.3391914665699005, 0.36673322319984436, 0.3942749798297882, 0.42181670665740967, 0.4493584632873535, 0.47690021991729736, 0.5044419765472412]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 10.0, 14.0, 21.0, 34.0, 31.0, 54.0, 60.0, 52.0, 71.0, 83.0, 90.0, 89.0, 77.0, 56.0, 74.0, 51.0, 49.0, 26.0, 17.0, 19.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4276440143585205, -0.4146178364753723, -0.4015916585922241, -0.3885654807090759, -0.37553930282592773, -0.36251312494277954, -0.34948694705963135, -0.33646076917648315, -0.32343459129333496, -0.31040841341018677, -0.2973822355270386, -0.2843560576438904, -0.2713298797607422, -0.258303701877594, -0.2452775090932846, -0.2322513312101364, -0.21922513842582703, -0.20619896054267883, -0.19317278265953064, -0.18014660477638245, -0.16712042689323425, -0.15409424901008606, -0.14106805622577667, -0.12804187834262848, -0.11501570045948029, -0.10198952257633209, -0.0889633446931839, -0.07593715935945511, -0.06291098147630692, -0.04988480359315872, -0.03685861825942993, -0.02383244037628174, -0.010806262493133545, 0.0022199172526597977, 0.01524609699845314, 0.028272278606891632, 0.041298456490039825, 0.05432463437318802, 0.06735081970691681, 0.080376997590065, 0.0934031754732132, 0.10642935335636139, 0.11945553123950958, 0.13248172402381897, 0.14550790190696716, 0.15853407979011536, 0.17156025767326355, 0.18458643555641174, 0.19761261343955994, 0.21063879132270813, 0.22366496920585632, 0.23669114708900452, 0.2497173249721527, 0.2627435028553009, 0.2757697105407715, 0.2887958884239197, 0.30182206630706787, 0.31484824419021606, 0.32787442207336426, 0.34090059995651245, 0.35392677783966064, 0.36695295572280884, 0.37997913360595703, 0.3930053114891052, 0.4060314893722534]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 9.0, 4.0, 19.0, 16.0, 11.0, 21.0, 25.0, 34.0, 39.0, 46.0, 49.0, 44.0, 43.0, 51.0, 65.0, 60.0, 59.0, 57.0, 37.0, 40.0, 41.0, 37.0, 35.0, 32.0, 23.0, 18.0, 19.0, 12.0, 8.0, 9.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.6873779296875, -2.597412109375, -2.5074462890625, -2.41748046875, -2.3275146484375, -2.237548828125, -2.1475830078125, -2.0576171875, -1.9676513671875, -1.877685546875, -1.7877197265625, -1.69775390625, -1.6077880859375, -1.517822265625, -1.4278564453125, -1.337890625, -1.2479248046875, -1.157958984375, -1.0679931640625, -0.97802734375, -0.8880615234375, -0.798095703125, -0.7081298828125, -0.6181640625, -0.5281982421875, -0.438232421875, -0.3482666015625, -0.25830078125, -0.1683349609375, -0.078369140625, 0.0115966796875, 0.1015625, 0.1915283203125, 0.281494140625, 0.3714599609375, 0.46142578125, 0.5513916015625, 0.641357421875, 0.7313232421875, 0.8212890625, 0.9112548828125, 1.001220703125, 1.0911865234375, 1.18115234375, 1.2711181640625, 1.361083984375, 1.4510498046875, 1.541015625, 1.6309814453125, 1.720947265625, 1.8109130859375, 1.90087890625, 1.9908447265625, 2.080810546875, 2.1707763671875, 2.2607421875, 2.3507080078125, 2.440673828125, 2.5306396484375, 2.62060546875, 2.7105712890625, 2.800537109375, 2.8905029296875, 2.98046875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 15.0, 16.0, 18.0, 28.0, 27.0, 43.0, 62.0, 92.0, 129.0, 206.0, 269.0, 431.0, 694.0, 1095.0, 1806.0, 3387.0, 6457.0, 13946.0, 33422.0, 88291.0, 223079.0, 339349.0, 201793.0, 78018.0, 29705.0, 12496.0, 5821.0, 3031.0, 1799.0, 1017.0, 632.0, 416.0, 281.0, 205.0, 133.0, 91.0, 63.0, 52.0, 35.0, 31.0, 16.0, 9.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.34375, -6.1419677734375, -5.940185546875, -5.7384033203125, -5.53662109375, -5.3348388671875, -5.133056640625, -4.9312744140625, -4.7294921875, -4.5277099609375, -4.325927734375, -4.1241455078125, -3.92236328125, -3.7205810546875, -3.518798828125, -3.3170166015625, -3.115234375, -2.9134521484375, -2.711669921875, -2.5098876953125, -2.30810546875, -2.1063232421875, -1.904541015625, -1.7027587890625, -1.5009765625, -1.2991943359375, -1.097412109375, -0.8956298828125, -0.69384765625, -0.4920654296875, -0.290283203125, -0.0885009765625, 0.11328125, 0.3150634765625, 0.516845703125, 0.7186279296875, 0.92041015625, 1.1221923828125, 1.323974609375, 1.5257568359375, 1.7275390625, 1.9293212890625, 2.131103515625, 2.3328857421875, 2.53466796875, 2.7364501953125, 2.938232421875, 3.1400146484375, 3.341796875, 3.5435791015625, 3.745361328125, 3.9471435546875, 4.14892578125, 4.3507080078125, 4.552490234375, 4.7542724609375, 4.9560546875, 5.1578369140625, 5.359619140625, 5.5614013671875, 5.76318359375, 5.9649658203125, 6.166748046875, 6.3685302734375, 6.5703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 4.0, 3.0, 7.0, 9.0, 5.0, 18.0, 12.0, 18.0, 29.0, 20.0, 28.0, 28.0, 34.0, 48.0, 45.0, 67.0, 86.0, 133.0, 180.0, 1282.0, 250.0, 173.0, 101.0, 85.0, 54.0, 46.0, 49.0, 34.0, 29.0, 24.0, 23.0, 24.0, 20.0, 16.0, 13.0, 8.0, 6.0, 6.0, 6.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.390625, -9.1285400390625, -8.866455078125, -8.6043701171875, -8.34228515625, -8.0802001953125, -7.818115234375, -7.5560302734375, -7.2939453125, -7.0318603515625, -6.769775390625, -6.5076904296875, -6.24560546875, -5.9835205078125, -5.721435546875, -5.4593505859375, -5.197265625, -4.9351806640625, -4.673095703125, -4.4110107421875, -4.14892578125, -3.8868408203125, -3.624755859375, -3.3626708984375, -3.1005859375, -2.8385009765625, -2.576416015625, -2.3143310546875, -2.05224609375, -1.7901611328125, -1.528076171875, -1.2659912109375, -1.00390625, -0.7418212890625, -0.479736328125, -0.2176513671875, 0.04443359375, 0.3065185546875, 0.568603515625, 0.8306884765625, 1.0927734375, 1.3548583984375, 1.616943359375, 1.8790283203125, 2.14111328125, 2.4031982421875, 2.665283203125, 2.9273681640625, 3.189453125, 3.4515380859375, 3.713623046875, 3.9757080078125, 4.23779296875, 4.4998779296875, 4.761962890625, 5.0240478515625, 5.2861328125, 5.5482177734375, 5.810302734375, 6.0723876953125, 6.33447265625, 6.5965576171875, 6.858642578125, 7.1207275390625, 7.3828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 6.0, 5.0, 14.0, 17.0, 16.0, 21.0, 30.0, 28.0, 43.0, 49.0, 69.0, 123.0, 366.0, 1420.0, 51330.0, 3045716.0, 44304.0, 1354.0, 339.0, 131.0, 66.0, 56.0, 33.0, 33.0, 31.0, 18.0, 16.0, 13.0, 12.0, 8.0, 5.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.109375, -30.017333984375, -28.92529296875, -27.833251953125, -26.7412109375, -25.649169921875, -24.55712890625, -23.465087890625, -22.373046875, -21.281005859375, -20.18896484375, -19.096923828125, -18.0048828125, -16.912841796875, -15.82080078125, -14.728759765625, -13.63671875, -12.544677734375, -11.45263671875, -10.360595703125, -9.2685546875, -8.176513671875, -7.08447265625, -5.992431640625, -4.900390625, -3.808349609375, -2.71630859375, -1.624267578125, -0.5322265625, 0.559814453125, 1.65185546875, 2.743896484375, 3.8359375, 4.927978515625, 6.02001953125, 7.112060546875, 8.2041015625, 9.296142578125, 10.38818359375, 11.480224609375, 12.572265625, 13.664306640625, 14.75634765625, 15.848388671875, 16.9404296875, 18.032470703125, 19.12451171875, 20.216552734375, 21.30859375, 22.400634765625, 23.49267578125, 24.584716796875, 25.6767578125, 26.768798828125, 27.86083984375, 28.952880859375, 30.044921875, 31.136962890625, 32.22900390625, 33.321044921875, 34.4130859375, 35.505126953125, 36.59716796875, 37.689208984375, 38.78125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 22.0, 810.0, 187.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.255130767822266, -35.930702209472656, -30.606273651123047, -25.281843185424805, -19.957414627075195, -14.632986068725586, -9.308555603027344, -3.9841270446777344, 1.340301513671875, 6.664730548858643, 11.98915958404541, 17.313589096069336, 22.638017654418945, 27.962446212768555, 33.2868766784668, 38.611305236816406, 43.935733795166016, 49.260162353515625, 54.584590911865234, 59.909019470214844, 65.23345184326172, 70.55787658691406, 75.88230895996094, 81.20674133300781, 86.53116607666016, 91.85559844970703, 97.18002319335938, 102.50445556640625, 107.8288803100586, 113.15331268310547, 118.47773742675781, 123.80216979980469, 129.12660217285156, 134.45103454589844, 139.7754669189453, 145.09988403320312, 150.42431640625, 155.74874877929688, 161.07318115234375, 166.39761352539062, 171.72203063964844, 177.0464630126953, 182.3708953857422, 187.6953125, 193.01974487304688, 198.34417724609375, 203.66860961914062, 208.9930419921875, 214.31747436523438, 219.64190673828125, 224.96633911132812, 230.29075622558594, 235.6151885986328, 240.9396209716797, 246.26405334472656, 251.58847045898438, 256.91290283203125, 262.2373352050781, 267.561767578125, 272.8861999511719, 278.21063232421875, 283.5350341796875, 288.8594665527344, 294.18389892578125, 299.5083312988281]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 1.0, 3.0, 5.0, 10.0, 8.0, 11.0, 13.0, 13.0, 10.0, 13.0, 22.0, 25.0, 21.0, 21.0, 29.0, 26.0, 35.0, 22.0, 25.0, 39.0, 27.0, 48.0, 40.0, 44.0, 33.0, 36.0, 37.0, 25.0, 38.0, 40.0, 38.0, 22.0, 17.0, 22.0, 24.0, 19.0, 18.0, 18.0, 16.0, 8.0, 13.0, 10.0, 10.0, 15.0, 4.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-23.151748657226562, -22.406593322753906, -21.66143798828125, -20.916282653808594, -20.171127319335938, -19.425973892211914, -18.680818557739258, -17.9356632232666, -17.190507888793945, -16.44535255432129, -15.700197219848633, -14.955042839050293, -14.209887504577637, -13.46473217010498, -12.71957778930664, -11.974422454833984, -11.229267120361328, -10.484111785888672, -9.738956451416016, -8.993802070617676, -8.24864673614502, -7.503491401672363, -6.758336544036865, -6.013181686401367, -5.268026351928711, -4.522871017456055, -3.7777161598205566, -3.0325610637664795, -2.2874059677124023, -1.5422508716583252, -0.797095775604248, -0.05194091796875, 0.6932163238525391, 1.4383714199066162, 2.1835265159606934, 2.9286816120147705, 3.6738367080688477, 4.418992042541504, 5.164146900177002, 5.9093017578125, 6.654457092285156, 7.3996124267578125, 8.144767761230469, 8.889922142028809, 9.635077476501465, 10.380232810974121, 11.125387191772461, 11.870542526245117, 12.615697860717773, 13.36085319519043, 14.106008529663086, 14.851162910461426, 15.596318244934082, 16.341472625732422, 17.086627960205078, 17.831783294677734, 18.57693862915039, 19.322093963623047, 20.067249298095703, 20.81240463256836, 21.557559967041016, 22.30271339416504, 23.047868728637695, 23.79302406311035, 24.538179397583008]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 10.0, 4.0, 10.0, 8.0, 7.0, 17.0, 11.0, 14.0, 25.0, 34.0, 45.0, 50.0, 46.0, 47.0, 61.0, 67.0, 63.0, 46.0, 72.0, 50.0, 55.0, 54.0, 32.0, 41.0, 33.0, 21.0, 20.0, 20.0, 10.0, 5.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.12335205078125, -3.0142822265625, -2.90521240234375, -2.796142578125, -2.68707275390625, -2.5780029296875, -2.46893310546875, -2.35986328125, -2.25079345703125, -2.1417236328125, -2.03265380859375, -1.923583984375, -1.81451416015625, -1.7054443359375, -1.59637451171875, -1.4873046875, -1.37823486328125, -1.2691650390625, -1.16009521484375, -1.051025390625, -0.94195556640625, -0.8328857421875, -0.72381591796875, -0.61474609375, -0.50567626953125, -0.3966064453125, -0.28753662109375, -0.178466796875, -0.06939697265625, 0.0396728515625, 0.14874267578125, 0.2578125, 0.36688232421875, 0.4759521484375, 0.58502197265625, 0.694091796875, 0.80316162109375, 0.9122314453125, 1.02130126953125, 1.13037109375, 1.23944091796875, 1.3485107421875, 1.45758056640625, 1.566650390625, 1.67572021484375, 1.7847900390625, 1.89385986328125, 2.0029296875, 2.11199951171875, 2.2210693359375, 2.33013916015625, 2.439208984375, 2.54827880859375, 2.6573486328125, 2.76641845703125, 2.87548828125, 2.98455810546875, 3.0936279296875, 3.20269775390625, 3.311767578125, 3.42083740234375, 3.5299072265625, 3.63897705078125, 3.748046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 10.0, 10.0, 14.0, 13.0, 34.0, 42.0, 66.0, 94.0, 154.0, 223.0, 353.0, 648.0, 1221.0, 2634.0, 7928.0, 48054.0, 965812.0, 3001216.0, 145397.0, 14277.0, 3281.0, 1225.0, 645.0, 327.0, 203.0, 138.0, 96.0, 50.0, 35.0, 27.0, 14.0, 10.0, 12.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.27685546875, -13.7880859375, -13.29931640625, -12.810546875, -12.32177734375, -11.8330078125, -11.34423828125, -10.85546875, -10.36669921875, -9.8779296875, -9.38916015625, -8.900390625, -8.41162109375, -7.9228515625, -7.43408203125, -6.9453125, -6.45654296875, -5.9677734375, -5.47900390625, -4.990234375, -4.50146484375, -4.0126953125, -3.52392578125, -3.03515625, -2.54638671875, -2.0576171875, -1.56884765625, -1.080078125, -0.59130859375, -0.1025390625, 0.38623046875, 0.875, 1.36376953125, 1.8525390625, 2.34130859375, 2.830078125, 3.31884765625, 3.8076171875, 4.29638671875, 4.78515625, 5.27392578125, 5.7626953125, 6.25146484375, 6.740234375, 7.22900390625, 7.7177734375, 8.20654296875, 8.6953125, 9.18408203125, 9.6728515625, 10.16162109375, 10.650390625, 11.13916015625, 11.6279296875, 12.11669921875, 12.60546875, 13.09423828125, 13.5830078125, 14.07177734375, 14.560546875, 15.04931640625, 15.5380859375, 16.02685546875, 16.515625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 11.0, 21.0, 35.0, 65.0, 116.0, 232.0, 372.0, 656.0, 803.0, 682.0, 470.0, 264.0, 142.0, 79.0, 50.0, 28.0, 25.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.552001953125, -11.04150390625, -10.531005859375, -10.0205078125, -9.510009765625, -8.99951171875, -8.489013671875, -7.978515625, -7.468017578125, -6.95751953125, -6.447021484375, -5.9365234375, -5.426025390625, -4.91552734375, -4.405029296875, -3.89453125, -3.384033203125, -2.87353515625, -2.363037109375, -1.8525390625, -1.342041015625, -0.83154296875, -0.321044921875, 0.189453125, 0.699951171875, 1.21044921875, 1.720947265625, 2.2314453125, 2.741943359375, 3.25244140625, 3.762939453125, 4.2734375, 4.783935546875, 5.29443359375, 5.804931640625, 6.3154296875, 6.825927734375, 7.33642578125, 7.846923828125, 8.357421875, 8.867919921875, 9.37841796875, 9.888916015625, 10.3994140625, 10.909912109375, 11.42041015625, 11.930908203125, 12.44140625, 12.951904296875, 13.46240234375, 13.972900390625, 14.4833984375, 14.993896484375, 15.50439453125, 16.014892578125, 16.525390625, 17.035888671875, 17.54638671875, 18.056884765625, 18.5673828125, 19.077880859375, 19.58837890625, 20.098876953125, 20.609375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 13.0, 21.0, 23.0, 58.0, 89.0, 138.0, 319.0, 672.0, 2373.0, 15528.0, 368887.0, 3566847.0, 224635.0, 11450.0, 1985.0, 591.0, 293.0, 134.0, 98.0, 55.0, 31.0, 13.0, 11.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.359375, -26.397216796875, -25.43505859375, -24.472900390625, -23.5107421875, -22.548583984375, -21.58642578125, -20.624267578125, -19.662109375, -18.699951171875, -17.73779296875, -16.775634765625, -15.8134765625, -14.851318359375, -13.88916015625, -12.927001953125, -11.96484375, -11.002685546875, -10.04052734375, -9.078369140625, -8.1162109375, -7.154052734375, -6.19189453125, -5.229736328125, -4.267578125, -3.305419921875, -2.34326171875, -1.381103515625, -0.4189453125, 0.543212890625, 1.50537109375, 2.467529296875, 3.4296875, 4.391845703125, 5.35400390625, 6.316162109375, 7.2783203125, 8.240478515625, 9.20263671875, 10.164794921875, 11.126953125, 12.089111328125, 13.05126953125, 14.013427734375, 14.9755859375, 15.937744140625, 16.89990234375, 17.862060546875, 18.82421875, 19.786376953125, 20.74853515625, 21.710693359375, 22.6728515625, 23.635009765625, 24.59716796875, 25.559326171875, 26.521484375, 27.483642578125, 28.44580078125, 29.407958984375, 30.3701171875, 31.332275390625, 32.29443359375, 33.256591796875, 34.21875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 12.0, 32.0, 32.0, 58.0, 85.0, 73.0, 107.0, 124.0, 129.0, 108.0, 66.0, 61.0, 42.0, 20.0, 25.0, 13.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.87056350708008, -56.6265754699707, -55.38258361816406, -54.13859558105469, -52.89460372924805, -51.65061569213867, -50.40662384033203, -49.162635803222656, -47.91864776611328, -46.674659729003906, -45.430667877197266, -44.18667984008789, -42.94268798828125, -41.698699951171875, -40.454708099365234, -39.21072006225586, -37.96672821044922, -36.722740173339844, -35.4787483215332, -34.23476028442383, -32.99076843261719, -31.746780395507812, -30.502790451049805, -29.258800506591797, -28.01481056213379, -26.77082061767578, -25.526830673217773, -24.282840728759766, -23.03885269165039, -21.79486083984375, -20.550872802734375, -19.306882858276367, -18.062889099121094, -16.818899154663086, -15.574909210205078, -14.330920219421387, -13.086930274963379, -11.842940330505371, -10.59895133972168, -9.354961395263672, -8.110971450805664, -6.866981506347656, -5.622992038726807, -4.379002571105957, -3.135012626647949, -1.8910226821899414, -0.6470332145690918, 0.5969562530517578, 1.8409461975097656, 3.0849359035491943, 4.328925609588623, 5.572915077209473, 6.8169050216674805, 8.060894966125488, 9.30488395690918, 10.548873901367188, 11.792863845825195, 13.036853790283203, 14.280843734741211, 15.524832725524902, 16.768821716308594, 18.012813568115234, 19.25680160522461, 20.500791549682617, 21.744781494140625]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 14.0, 11.0, 12.0, 13.0, 16.0, 19.0, 20.0, 31.0, 39.0, 25.0, 31.0, 38.0, 35.0, 53.0, 43.0, 43.0, 38.0, 38.0, 40.0, 52.0, 45.0, 44.0, 36.0, 39.0, 26.0, 33.0, 25.0, 23.0, 16.0, 14.0, 20.0, 14.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.421844482421875, -33.365421295166016, -32.30899429321289, -31.25257110595703, -30.196147918701172, -29.13972282409668, -28.083297729492188, -27.026874542236328, -25.970449447631836, -24.914024353027344, -23.857601165771484, -22.801176071166992, -21.7447509765625, -20.68832778930664, -19.63190269470215, -18.575477600097656, -17.519054412841797, -16.462629318237305, -15.406206130981445, -14.349781036376953, -13.293356895446777, -12.236932754516602, -11.18050765991211, -10.124083518981934, -9.067659378051758, -8.011235237121582, -6.954810619354248, -5.898386001586914, -4.841961860656738, -3.7855377197265625, -2.7291131019592285, -1.6726884841918945, -0.6162643432617188, 0.44016003608703613, 1.496584415435791, 2.553008794784546, 3.609433174133301, 4.665857315063477, 5.7222819328308105, 6.7787065505981445, 7.83513069152832, 8.891554832458496, 9.947978973388672, 11.004404067993164, 12.06082820892334, 13.117252349853516, 14.173677444458008, 15.230101585388184, 16.28652572631836, 17.34295082092285, 18.39937400817871, 19.455799102783203, 20.512222290039062, 21.568647384643555, 22.625072479248047, 23.681495666503906, 24.7379207611084, 25.79434585571289, 26.85076904296875, 27.907194137573242, 28.963619232177734, 30.020042419433594, 31.076467514038086, 32.13289260864258, 33.18931579589844]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 6.0, 16.0, 13.0, 12.0, 24.0, 22.0, 36.0, 40.0, 39.0, 55.0, 47.0, 57.0, 61.0, 58.0, 40.0, 51.0, 61.0, 53.0, 55.0, 40.0, 40.0, 27.0, 24.0, 32.0, 18.0, 15.0, 8.0, 11.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.468719482421875, -3.36322021484375, -3.257720947265625, -3.1522216796875, -3.046722412109375, -2.94122314453125, -2.835723876953125, -2.730224609375, -2.624725341796875, -2.51922607421875, -2.413726806640625, -2.3082275390625, -2.202728271484375, -2.09722900390625, -1.991729736328125, -1.88623046875, -1.780731201171875, -1.67523193359375, -1.569732666015625, -1.4642333984375, -1.358734130859375, -1.25323486328125, -1.147735595703125, -1.042236328125, -0.936737060546875, -0.83123779296875, -0.725738525390625, -0.6202392578125, -0.514739990234375, -0.40924072265625, -0.303741455078125, -0.1982421875, -0.092742919921875, 0.01275634765625, 0.118255615234375, 0.2237548828125, 0.329254150390625, 0.43475341796875, 0.540252685546875, 0.645751953125, 0.751251220703125, 0.85675048828125, 0.962249755859375, 1.0677490234375, 1.173248291015625, 1.27874755859375, 1.384246826171875, 1.48974609375, 1.595245361328125, 1.70074462890625, 1.806243896484375, 1.9117431640625, 2.017242431640625, 2.12274169921875, 2.228240966796875, 2.333740234375, 2.439239501953125, 2.54473876953125, 2.650238037109375, 2.7557373046875, 2.861236572265625, 2.96673583984375, 3.072235107421875, 3.177734375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 11.0, 20.0, 28.0, 47.0, 78.0, 113.0, 158.0, 201.0, 260.0, 425.0, 654.0, 931.0, 1410.0, 2242.0, 3634.0, 5947.0, 9814.0, 15965.0, 26525.0, 43157.0, 68589.0, 103697.0, 141085.0, 164708.0, 147817.0, 111367.0, 75790.0, 47907.0, 29632.0, 17659.0, 10765.0, 6483.0, 4101.0, 2584.0, 1559.0, 1028.0, 681.0, 433.0, 302.0, 215.0, 163.0, 106.0, 76.0, 58.0, 31.0, 35.0, 16.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.74609375, -0.7224884033203125, -0.698883056640625, -0.6752777099609375, -0.65167236328125, -0.6280670166015625, -0.604461669921875, -0.5808563232421875, -0.5572509765625, -0.5336456298828125, -0.510040283203125, -0.4864349365234375, -0.46282958984375, -0.4392242431640625, -0.415618896484375, -0.3920135498046875, -0.368408203125, -0.3448028564453125, -0.321197509765625, -0.2975921630859375, -0.27398681640625, -0.2503814697265625, -0.226776123046875, -0.2031707763671875, -0.1795654296875, -0.1559600830078125, -0.132354736328125, -0.1087493896484375, -0.08514404296875, -0.0615386962890625, -0.037933349609375, -0.0143280029296875, 0.00927734375, 0.0328826904296875, 0.056488037109375, 0.0800933837890625, 0.10369873046875, 0.1273040771484375, 0.150909423828125, 0.1745147705078125, 0.1981201171875, 0.2217254638671875, 0.245330810546875, 0.2689361572265625, 0.29254150390625, 0.3161468505859375, 0.339752197265625, 0.3633575439453125, 0.386962890625, 0.4105682373046875, 0.434173583984375, 0.4577789306640625, 0.48138427734375, 0.5049896240234375, 0.528594970703125, 0.5522003173828125, 0.5758056640625, 0.5994110107421875, 0.623016357421875, 0.6466217041015625, 0.67022705078125, 0.6938323974609375, 0.717437744140625, 0.7410430908203125, 0.7646484375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 15.0, 8.0, 22.0, 17.0, 24.0, 28.0, 39.0, 33.0, 40.0, 40.0, 60.0, 45.0, 41.0, 51.0, 1081.0, 37.0, 40.0, 50.0, 53.0, 46.0, 37.0, 41.0, 26.0, 31.0, 27.0, 14.0, 13.0, 7.0, 16.0, 7.0, 9.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09375, -2.024200439453125, -1.95465087890625, -1.885101318359375, -1.8155517578125, -1.746002197265625, -1.67645263671875, -1.606903076171875, -1.537353515625, -1.467803955078125, -1.39825439453125, -1.328704833984375, -1.2591552734375, -1.189605712890625, -1.12005615234375, -1.050506591796875, -0.98095703125, -0.911407470703125, -0.84185791015625, -0.772308349609375, -0.7027587890625, -0.633209228515625, -0.56365966796875, -0.494110107421875, -0.424560546875, -0.355010986328125, -0.28546142578125, -0.215911865234375, -0.1463623046875, -0.076812744140625, -0.00726318359375, 0.062286376953125, 0.1318359375, 0.201385498046875, 0.27093505859375, 0.340484619140625, 0.4100341796875, 0.479583740234375, 0.54913330078125, 0.618682861328125, 0.688232421875, 0.757781982421875, 0.82733154296875, 0.896881103515625, 0.9664306640625, 1.035980224609375, 1.10552978515625, 1.175079345703125, 1.24462890625, 1.314178466796875, 1.38372802734375, 1.453277587890625, 1.5228271484375, 1.592376708984375, 1.66192626953125, 1.731475830078125, 1.801025390625, 1.870574951171875, 1.94012451171875, 2.009674072265625, 2.0792236328125, 2.148773193359375, 2.21832275390625, 2.287872314453125, 2.357421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 11.0, 13.0, 14.0, 22.0, 28.0, 55.0, 85.0, 130.0, 207.0, 329.0, 483.0, 808.0, 1425.0, 2595.0, 5016.0, 10579.0, 22814.0, 51987.0, 115830.0, 258307.0, 1136056.0, 269915.0, 120774.0, 53852.0, 23743.0, 10881.0, 5167.0, 2616.0, 1378.0, 741.0, 475.0, 292.0, 159.0, 114.0, 72.0, 44.0, 38.0, 20.0, 19.0, 16.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0], "bins": [-0.599609375, -0.58404541015625, -0.5684814453125, -0.55291748046875, -0.537353515625, -0.52178955078125, -0.5062255859375, -0.49066162109375, -0.47509765625, -0.45953369140625, -0.4439697265625, -0.42840576171875, -0.412841796875, -0.39727783203125, -0.3817138671875, -0.36614990234375, -0.3505859375, -0.33502197265625, -0.3194580078125, -0.30389404296875, -0.288330078125, -0.27276611328125, -0.2572021484375, -0.24163818359375, -0.22607421875, -0.21051025390625, -0.1949462890625, -0.17938232421875, -0.163818359375, -0.14825439453125, -0.1326904296875, -0.11712646484375, -0.1015625, -0.08599853515625, -0.0704345703125, -0.05487060546875, -0.039306640625, -0.02374267578125, -0.0081787109375, 0.00738525390625, 0.02294921875, 0.03851318359375, 0.0540771484375, 0.06964111328125, 0.085205078125, 0.10076904296875, 0.1163330078125, 0.13189697265625, 0.1474609375, 0.16302490234375, 0.1785888671875, 0.19415283203125, 0.209716796875, 0.22528076171875, 0.2408447265625, 0.25640869140625, 0.27197265625, 0.28753662109375, 0.3031005859375, 0.31866455078125, 0.334228515625, 0.34979248046875, 0.3653564453125, 0.38092041015625, 0.396484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 6.0, 1.0, 7.0, 4.0, 10.0, 8.0, 8.0, 8.0, 3.0, 11.0, 11.0, 19.0, 23.0, 30.0, 28.0, 43.0, 57.0, 72.0, 73.0, 80.0, 87.0, 73.0, 51.0, 49.0, 45.0, 38.0, 19.0, 23.0, 16.0, 6.0, 8.0, 7.0, 9.0, 6.0, 4.0, 10.0, 5.0, 0.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.16565895080566406, -0.16029739379882812, -0.1549358367919922, -0.14957427978515625, -0.1442127227783203, -0.13885116577148438, -0.13348960876464844, -0.1281280517578125, -0.12276649475097656, -0.11740493774414062, -0.11204338073730469, -0.10668182373046875, -0.10132026672363281, -0.09595870971679688, -0.09059715270996094, -0.085235595703125, -0.07987403869628906, -0.07451248168945312, -0.06915092468261719, -0.06378936767578125, -0.05842781066894531, -0.053066253662109375, -0.04770469665527344, -0.0423431396484375, -0.03698158264160156, -0.031620025634765625, -0.026258468627929688, -0.02089691162109375, -0.015535354614257812, -0.010173797607421875, -0.0048122406005859375, 0.00054931640625, 0.0059108734130859375, 0.011272430419921875, 0.016633987426757812, 0.02199554443359375, 0.027357101440429688, 0.032718658447265625, 0.03808021545410156, 0.0434417724609375, 0.04880332946777344, 0.054164886474609375, 0.05952644348144531, 0.06488800048828125, 0.07024955749511719, 0.07561111450195312, 0.08097267150878906, 0.086334228515625, 0.09169578552246094, 0.09705734252929688, 0.10241889953613281, 0.10778045654296875, 0.11314201354980469, 0.11850357055664062, 0.12386512756347656, 0.1292266845703125, 0.13458824157714844, 0.13994979858398438, 0.1453113555908203, 0.15067291259765625, 0.1560344696044922, 0.16139602661132812, 0.16675758361816406, 0.172119140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 6.0, 3.0, 5.0, 9.0, 13.0, 10.0, 11.0, 11.0, 16.0, 18.0, 24.0, 19.0, 26.0, 28.0, 15.0, 24.0, 23.0, 39.0, 55.0, 95.0, 103.0, 141.0, 247.0, 401.0, 1931.0, 27363.0, 987550.0, 27071.0, 1958.0, 410.0, 228.0, 167.0, 107.0, 74.0, 59.0, 39.0, 19.0, 29.0, 27.0, 18.0, 25.0, 18.0, 17.0, 10.0, 12.0, 15.0, 19.0, 12.0, 9.0, 8.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.935546875, -2.84521484375, -2.7548828125, -2.66455078125, -2.57421875, -2.48388671875, -2.3935546875, -2.30322265625, -2.212890625, -2.12255859375, -2.0322265625, -1.94189453125, -1.8515625, -1.76123046875, -1.6708984375, -1.58056640625, -1.490234375, -1.39990234375, -1.3095703125, -1.21923828125, -1.12890625, -1.03857421875, -0.9482421875, -0.85791015625, -0.767578125, -0.67724609375, -0.5869140625, -0.49658203125, -0.40625, -0.31591796875, -0.2255859375, -0.13525390625, -0.044921875, 0.04541015625, 0.1357421875, 0.22607421875, 0.31640625, 0.40673828125, 0.4970703125, 0.58740234375, 0.677734375, 0.76806640625, 0.8583984375, 0.94873046875, 1.0390625, 1.12939453125, 1.2197265625, 1.31005859375, 1.400390625, 1.49072265625, 1.5810546875, 1.67138671875, 1.76171875, 1.85205078125, 1.9423828125, 2.03271484375, 2.123046875, 2.21337890625, 2.3037109375, 2.39404296875, 2.484375, 2.57470703125, 2.6650390625, 2.75537109375, 2.845703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 703.0, 309.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609328269958496, -2.3463540077209473, -2.0833797454833984, -1.8204054832458496, -1.5574312210083008, -1.294456958770752, -1.0314826965332031, -0.7685084342956543, -0.5055341720581055, -0.24255990982055664, 0.020414352416992188, 0.283388614654541, 0.5463628768920898, 0.8093371391296387, 1.0723114013671875, 1.3352856636047363, 1.5982599258422852, 1.861234188079834, 2.124208450317383, 2.3871827125549316, 2.6501569747924805, 2.9131312370300293, 3.176105499267578, 3.439079761505127, 3.702054023742676, 3.9650282859802246, 4.228002548217773, 4.490976810455322, 4.753951072692871, 5.01692533493042, 5.279899597167969, 5.542873859405518, 5.805848121643066, 6.068822383880615, 6.331796646118164, 6.594770908355713, 6.857745170593262, 7.1207194328308105, 7.383693695068359, 7.646667957305908, 7.909642219543457, 8.172616958618164, 8.435590744018555, 8.698564529418945, 8.961539268493652, 9.22451400756836, 9.48748779296875, 9.75046157836914, 10.013436317443848, 10.276411056518555, 10.539384841918945, 10.802358627319336, 11.065333366394043, 11.32830810546875, 11.59128189086914, 11.854255676269531, 12.117230415344238, 12.380205154418945, 12.643178939819336, 12.906152725219727, 13.169127464294434, 13.43210220336914, 13.695075988769531, 13.958049774169922, 14.221024513244629]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 15.0, 15.0, 19.0, 29.0, 24.0, 37.0, 58.0, 54.0, 70.0, 57.0, 56.0, 64.0, 68.0, 62.0, 59.0, 66.0, 49.0, 45.0, 35.0, 25.0, 18.0, 24.0, 13.0, 14.0, 8.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.1274861097335815, -1.1010931730270386, -1.0747003555297852, -1.0483074188232422, -1.0219144821166992, -0.995521605014801, -0.9691287279129028, -0.9427357912063599, -0.9163429141044617, -0.8899500370025635, -0.8635571002960205, -0.8371642231941223, -0.8107712864875793, -0.7843784093856812, -0.7579854726791382, -0.73159259557724, -0.7051997184753418, -0.6788068413734436, -0.6524139046669006, -0.6260210275650024, -0.5996280908584595, -0.5732352137565613, -0.5468423366546631, -0.5204493999481201, -0.49405646324157715, -0.46766355633735657, -0.441270649433136, -0.4148777723312378, -0.3884848654270172, -0.36209195852279663, -0.33569905161857605, -0.30930614471435547, -0.2829132676124573, -0.2565203607082367, -0.2301274687051773, -0.20373456180095673, -0.17734166979789734, -0.15094876289367676, -0.12455585598945618, -0.09816296398639679, -0.07177005708217621, -0.045377157628536224, -0.018984254449605942, 0.007408648729324341, 0.033801548182964325, 0.06019444763660431, 0.08658735454082489, 0.11298024654388428, 0.13937315344810486, 0.16576606035232544, 0.19215895235538483, 0.2185518592596054, 0.2449447512626648, 0.2713376581668854, 0.29773056507110596, 0.32412344217300415, 0.3505163788795471, 0.3769092857837677, 0.4033021926879883, 0.4296950697898865, 0.45608797669410706, 0.48248088359832764, 0.5088738203048706, 0.5352666974067688, 0.561659574508667]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 3.0, 7.0, 12.0, 11.0, 27.0, 17.0, 33.0, 28.0, 42.0, 45.0, 42.0, 49.0, 66.0, 68.0, 54.0, 64.0, 65.0, 48.0, 52.0, 48.0, 48.0, 29.0, 37.0, 23.0, 16.0, 12.0, 14.0, 11.0, 3.0, 8.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -3.14361572265625, -3.0333251953125, -2.92303466796875, -2.812744140625, -2.70245361328125, -2.5921630859375, -2.48187255859375, -2.37158203125, -2.26129150390625, -2.1510009765625, -2.04071044921875, -1.930419921875, -1.82012939453125, -1.7098388671875, -1.59954833984375, -1.4892578125, -1.37896728515625, -1.2686767578125, -1.15838623046875, -1.048095703125, -0.93780517578125, -0.8275146484375, -0.71722412109375, -0.60693359375, -0.49664306640625, -0.3863525390625, -0.27606201171875, -0.165771484375, -0.05548095703125, 0.0548095703125, 0.16510009765625, 0.275390625, 0.38568115234375, 0.4959716796875, 0.60626220703125, 0.716552734375, 0.82684326171875, 0.9371337890625, 1.04742431640625, 1.15771484375, 1.26800537109375, 1.3782958984375, 1.48858642578125, 1.598876953125, 1.70916748046875, 1.8194580078125, 1.92974853515625, 2.0400390625, 2.15032958984375, 2.2606201171875, 2.37091064453125, 2.481201171875, 2.59149169921875, 2.7017822265625, 2.81207275390625, 2.92236328125, 3.03265380859375, 3.1429443359375, 3.25323486328125, 3.363525390625, 3.47381591796875, 3.5841064453125, 3.69439697265625, 3.8046875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 7.0, 9.0, 17.0, 29.0, 53.0, 59.0, 137.0, 163.0, 357.0, 564.0, 1031.0, 2104.0, 4860.0, 11797.0, 30726.0, 79561.0, 182933.0, 290322.0, 240992.0, 121706.0, 49196.0, 18319.0, 7133.0, 3115.0, 1595.0, 743.0, 388.0, 251.0, 150.0, 84.0, 53.0, 40.0, 26.0, 7.0, 7.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.94140625, -3.82794189453125, -3.7144775390625, -3.60101318359375, -3.487548828125, -3.37408447265625, -3.2606201171875, -3.14715576171875, -3.03369140625, -2.92022705078125, -2.8067626953125, -2.69329833984375, -2.579833984375, -2.46636962890625, -2.3529052734375, -2.23944091796875, -2.1259765625, -2.01251220703125, -1.8990478515625, -1.78558349609375, -1.672119140625, -1.55865478515625, -1.4451904296875, -1.33172607421875, -1.21826171875, -1.10479736328125, -0.9913330078125, -0.87786865234375, -0.764404296875, -0.65093994140625, -0.5374755859375, -0.42401123046875, -0.310546875, -0.19708251953125, -0.0836181640625, 0.02984619140625, 0.143310546875, 0.25677490234375, 0.3702392578125, 0.48370361328125, 0.59716796875, 0.71063232421875, 0.8240966796875, 0.93756103515625, 1.051025390625, 1.16448974609375, 1.2779541015625, 1.39141845703125, 1.5048828125, 1.61834716796875, 1.7318115234375, 1.84527587890625, 1.958740234375, 2.07220458984375, 2.1856689453125, 2.29913330078125, 2.41259765625, 2.52606201171875, 2.6395263671875, 2.75299072265625, 2.866455078125, 2.97991943359375, 3.0933837890625, 3.20684814453125, 3.3203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 5.0, 9.0, 8.0, 10.0, 15.0, 19.0, 22.0, 26.0, 20.0, 36.0, 33.0, 32.0, 33.0, 39.0, 47.0, 65.0, 102.0, 168.0, 266.0, 1309.0, 209.0, 116.0, 78.0, 54.0, 51.0, 36.0, 38.0, 22.0, 26.0, 25.0, 26.0, 15.0, 16.0, 19.0, 11.0, 6.0, 6.0, 7.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.98828125, -9.6875, -9.38671875, -9.0859375, -8.78515625, -8.484375, -8.18359375, -7.8828125, -7.58203125, -7.28125, -6.98046875, -6.6796875, -6.37890625, -6.078125, -5.77734375, -5.4765625, -5.17578125, -4.875, -4.57421875, -4.2734375, -3.97265625, -3.671875, -3.37109375, -3.0703125, -2.76953125, -2.46875, -2.16796875, -1.8671875, -1.56640625, -1.265625, -0.96484375, -0.6640625, -0.36328125, -0.0625, 0.23828125, 0.5390625, 0.83984375, 1.140625, 1.44140625, 1.7421875, 2.04296875, 2.34375, 2.64453125, 2.9453125, 3.24609375, 3.546875, 3.84765625, 4.1484375, 4.44921875, 4.75, 5.05078125, 5.3515625, 5.65234375, 5.953125, 6.25390625, 6.5546875, 6.85546875, 7.15625, 7.45703125, 7.7578125, 8.05859375, 8.359375, 8.66015625, 8.9609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 6.0, 4.0, 11.0, 13.0, 17.0, 14.0, 22.0, 22.0, 20.0, 33.0, 45.0, 47.0, 68.0, 134.0, 280.0, 782.0, 2696.0, 15710.0, 413455.0, 2590685.0, 110983.0, 7745.0, 1702.0, 520.0, 223.0, 115.0, 76.0, 47.0, 42.0, 27.0, 22.0, 28.0, 27.0, 17.0, 12.0, 10.0, 12.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0234375, -13.5103759765625, -12.997314453125, -12.4842529296875, -11.97119140625, -11.4581298828125, -10.945068359375, -10.4320068359375, -9.9189453125, -9.4058837890625, -8.892822265625, -8.3797607421875, -7.86669921875, -7.3536376953125, -6.840576171875, -6.3275146484375, -5.814453125, -5.3013916015625, -4.788330078125, -4.2752685546875, -3.76220703125, -3.2491455078125, -2.736083984375, -2.2230224609375, -1.7099609375, -1.1968994140625, -0.683837890625, -0.1707763671875, 0.34228515625, 0.8553466796875, 1.368408203125, 1.8814697265625, 2.39453125, 2.9075927734375, 3.420654296875, 3.9337158203125, 4.44677734375, 4.9598388671875, 5.472900390625, 5.9859619140625, 6.4990234375, 7.0120849609375, 7.525146484375, 8.0382080078125, 8.55126953125, 9.0643310546875, 9.577392578125, 10.0904541015625, 10.603515625, 11.1165771484375, 11.629638671875, 12.1427001953125, 12.65576171875, 13.1688232421875, 13.681884765625, 14.1949462890625, 14.7080078125, 15.2210693359375, 15.734130859375, 16.2471923828125, 16.76025390625, 17.2733154296875, 17.786376953125, 18.2994384765625, 18.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 8.0, 143.0, 527.0, 307.0, 30.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.663956642150879, -9.992233276367188, -7.320510387420654, -4.648787498474121, -1.9770641326904297, 0.6946592330932617, 3.3663816452026367, 6.0381059646606445, 8.70982837677002, 11.381551742553711, 14.053274154663086, 16.724998474121094, 19.39672088623047, 22.068443298339844, 24.74016571044922, 27.41189193725586, 30.083614349365234, 32.75533676147461, 35.427059173583984, 38.098785400390625, 40.7705078125, 43.442230224609375, 46.11395263671875, 48.785675048828125, 51.4573974609375, 54.129119873046875, 56.80084228515625, 59.472564697265625, 62.144290924072266, 64.81600952148438, 67.48773193359375, 70.15946197509766, 72.83118438720703, 75.5029067993164, 78.17462921142578, 80.84635162353516, 83.51807403564453, 86.18980407714844, 88.86152648925781, 91.53324890136719, 94.20497131347656, 96.87669372558594, 99.54841613769531, 102.22013854980469, 104.89186096191406, 107.56358337402344, 110.23530578613281, 112.90703582763672, 115.57875061035156, 118.25047302246094, 120.92219543457031, 123.59391784667969, 126.26564025878906, 128.93736267089844, 131.6090850830078, 134.2808074951172, 136.95254516601562, 139.624267578125, 142.29598999023438, 144.96771240234375, 147.63943481445312, 150.3111572265625, 152.98287963867188, 155.65460205078125, 158.32632446289062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 9.0, 20.0, 26.0, 17.0, 22.0, 23.0, 28.0, 31.0, 27.0, 31.0, 27.0, 30.0, 45.0, 42.0, 47.0, 56.0, 51.0, 39.0, 40.0, 49.0, 36.0, 33.0, 24.0, 43.0, 29.0, 24.0, 27.0, 22.0, 15.0, 10.0, 13.0, 13.0, 10.0, 6.0, 3.0, 0.0, 6.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.078866958618164, -30.057695388793945, -29.036523818969727, -28.01535415649414, -26.994182586669922, -25.973011016845703, -24.951839447021484, -23.930667877197266, -22.909496307373047, -21.888324737548828, -20.86715316772461, -19.84598159790039, -18.824811935424805, -17.803640365600586, -16.782468795776367, -15.761297225952148, -14.740127563476562, -13.718955993652344, -12.697785377502441, -11.676613807678223, -10.65544319152832, -9.634271621704102, -8.613100051879883, -7.591928958892822, -6.570757865905762, -5.549586772918701, -4.528415679931641, -3.507244110107422, -2.4860730171203613, -1.4649019241333008, -0.44373035430908203, 0.5774407386779785, 1.5986099243164062, 2.619781017303467, 3.6409523487091064, 4.662123680114746, 5.683294773101807, 6.704465866088867, 7.725637435913086, 8.746809005737305, 9.767979621887207, 10.789151191711426, 11.810321807861328, 12.831493377685547, 13.852664947509766, 14.873835563659668, 15.895007133483887, 16.91617774963379, 17.937349319458008, 18.958520889282227, 19.979692459106445, 21.00086212158203, 22.02203369140625, 23.04320526123047, 24.064376831054688, 25.085548400878906, 26.106719970703125, 27.127891540527344, 28.149063110351562, 29.17023468017578, 30.191404342651367, 31.212575912475586, 32.23374938964844, 33.25491714477539, 34.27608871459961]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 5.0, 6.0, 11.0, 14.0, 24.0, 21.0, 26.0, 31.0, 46.0, 29.0, 42.0, 45.0, 62.0, 59.0, 52.0, 59.0, 52.0, 44.0, 49.0, 45.0, 41.0, 35.0, 32.0, 25.0, 24.0, 16.0, 20.0, 20.0, 12.0, 11.0, 7.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8203125, -2.716949462890625, -2.61358642578125, -2.510223388671875, -2.4068603515625, -2.303497314453125, -2.20013427734375, -2.096771240234375, -1.993408203125, -1.890045166015625, -1.78668212890625, -1.683319091796875, -1.5799560546875, -1.476593017578125, -1.37322998046875, -1.269866943359375, -1.16650390625, -1.063140869140625, -0.95977783203125, -0.856414794921875, -0.7530517578125, -0.649688720703125, -0.54632568359375, -0.442962646484375, -0.339599609375, -0.236236572265625, -0.13287353515625, -0.029510498046875, 0.0738525390625, 0.177215576171875, 0.28057861328125, 0.383941650390625, 0.4873046875, 0.590667724609375, 0.69403076171875, 0.797393798828125, 0.9007568359375, 1.004119873046875, 1.10748291015625, 1.210845947265625, 1.314208984375, 1.417572021484375, 1.52093505859375, 1.624298095703125, 1.7276611328125, 1.831024169921875, 1.93438720703125, 2.037750244140625, 2.14111328125, 2.244476318359375, 2.34783935546875, 2.451202392578125, 2.5545654296875, 2.657928466796875, 2.76129150390625, 2.864654541015625, 2.968017578125, 3.071380615234375, 3.17474365234375, 3.278106689453125, 3.3814697265625, 3.484832763671875, 3.58819580078125, 3.691558837890625, 3.794921875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 9.0, 11.0, 8.0, 11.0, 32.0, 34.0, 48.0, 82.0, 133.0, 159.0, 248.0, 359.0, 585.0, 1119.0, 1970.0, 4566.0, 15205.0, 79924.0, 797698.0, 2853606.0, 376348.0, 46604.0, 9772.0, 2910.0, 1231.0, 571.0, 333.0, 198.0, 138.0, 94.0, 72.0, 57.0, 35.0, 20.0, 25.0, 19.0, 15.0, 6.0, 3.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.767822265625, -9.41064453125, -9.053466796875, -8.6962890625, -8.339111328125, -7.98193359375, -7.624755859375, -7.267578125, -6.910400390625, -6.55322265625, -6.196044921875, -5.8388671875, -5.481689453125, -5.12451171875, -4.767333984375, -4.41015625, -4.052978515625, -3.69580078125, -3.338623046875, -2.9814453125, -2.624267578125, -2.26708984375, -1.909912109375, -1.552734375, -1.195556640625, -0.83837890625, -0.481201171875, -0.1240234375, 0.233154296875, 0.59033203125, 0.947509765625, 1.3046875, 1.661865234375, 2.01904296875, 2.376220703125, 2.7333984375, 3.090576171875, 3.44775390625, 3.804931640625, 4.162109375, 4.519287109375, 4.87646484375, 5.233642578125, 5.5908203125, 5.947998046875, 6.30517578125, 6.662353515625, 7.01953125, 7.376708984375, 7.73388671875, 8.091064453125, 8.4482421875, 8.805419921875, 9.16259765625, 9.519775390625, 9.876953125, 10.234130859375, 10.59130859375, 10.948486328125, 11.3056640625, 11.662841796875, 12.02001953125, 12.377197265625, 12.734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 23.0, 32.0, 44.0, 48.0, 80.0, 126.0, 155.0, 229.0, 306.0, 408.0, 494.0, 486.0, 423.0, 298.0, 263.0, 180.0, 130.0, 100.0, 64.0, 53.0, 37.0, 16.0, 14.0, 12.0, 7.0, 4.0, 9.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-13.2578125, -12.9508056640625, -12.643798828125, -12.3367919921875, -12.02978515625, -11.7227783203125, -11.415771484375, -11.1087646484375, -10.8017578125, -10.4947509765625, -10.187744140625, -9.8807373046875, -9.57373046875, -9.2667236328125, -8.959716796875, -8.6527099609375, -8.345703125, -8.0386962890625, -7.731689453125, -7.4246826171875, -7.11767578125, -6.8106689453125, -6.503662109375, -6.1966552734375, -5.8896484375, -5.5826416015625, -5.275634765625, -4.9686279296875, -4.66162109375, -4.3546142578125, -4.047607421875, -3.7406005859375, -3.43359375, -3.1265869140625, -2.819580078125, -2.5125732421875, -2.20556640625, -1.8985595703125, -1.591552734375, -1.2845458984375, -0.9775390625, -0.6705322265625, -0.363525390625, -0.0565185546875, 0.25048828125, 0.5574951171875, 0.864501953125, 1.1715087890625, 1.478515625, 1.7855224609375, 2.092529296875, 2.3995361328125, 2.70654296875, 3.0135498046875, 3.320556640625, 3.6275634765625, 3.9345703125, 4.2415771484375, 4.548583984375, 4.8555908203125, 5.16259765625, 5.4696044921875, 5.776611328125, 6.0836181640625, 6.390625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 8.0, 11.0, 12.0, 17.0, 27.0, 55.0, 65.0, 104.0, 166.0, 260.0, 561.0, 1457.0, 3682.0, 12432.0, 59301.0, 394102.0, 2274236.0, 1234103.0, 172648.0, 29565.0, 7103.0, 2354.0, 935.0, 415.0, 233.0, 132.0, 87.0, 55.0, 36.0, 21.0, 17.0, 18.0, 7.0, 12.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.0625, -15.5726318359375, -15.082763671875, -14.5928955078125, -14.10302734375, -13.6131591796875, -13.123291015625, -12.6334228515625, -12.1435546875, -11.6536865234375, -11.163818359375, -10.6739501953125, -10.18408203125, -9.6942138671875, -9.204345703125, -8.7144775390625, -8.224609375, -7.7347412109375, -7.244873046875, -6.7550048828125, -6.26513671875, -5.7752685546875, -5.285400390625, -4.7955322265625, -4.3056640625, -3.8157958984375, -3.325927734375, -2.8360595703125, -2.34619140625, -1.8563232421875, -1.366455078125, -0.8765869140625, -0.38671875, 0.1031494140625, 0.593017578125, 1.0828857421875, 1.57275390625, 2.0626220703125, 2.552490234375, 3.0423583984375, 3.5322265625, 4.0220947265625, 4.511962890625, 5.0018310546875, 5.49169921875, 5.9815673828125, 6.471435546875, 6.9613037109375, 7.451171875, 7.9410400390625, 8.430908203125, 8.9207763671875, 9.41064453125, 9.9005126953125, 10.390380859375, 10.8802490234375, 11.3701171875, 11.8599853515625, 12.349853515625, 12.8397216796875, 13.32958984375, 13.8194580078125, 14.309326171875, 14.7991943359375, 15.2890625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 14.0, 15.0, 51.0, 74.0, 102.0, 130.0, 144.0, 162.0, 115.0, 84.0, 58.0, 26.0, 16.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.29423141479492, -58.50652313232422, -56.718814849853516, -54.93110656738281, -53.14339828491211, -51.355690002441406, -49.56798553466797, -47.7802734375, -45.99256896972656, -44.20486068725586, -42.417152404785156, -40.62944412231445, -38.84173583984375, -37.05402755737305, -35.266319274902344, -33.478614807128906, -31.690902709960938, -29.903194427490234, -28.11548614501953, -26.327777862548828, -24.540069580078125, -22.752361297607422, -20.96465492248535, -19.17694664001465, -17.389238357543945, -15.601530075073242, -13.813821792602539, -12.026114463806152, -10.23840618133545, -8.450697898864746, -6.662990570068359, -4.875282287597656, -3.087574005126953, -1.299865961074829, 0.4878420829772949, 2.27554988861084, 4.063258171081543, 5.850966453552246, 7.638673782348633, 9.426382064819336, 11.214090347290039, 13.001798629760742, 14.789506912231445, 16.577213287353516, 18.36492156982422, 20.152629852294922, 21.940338134765625, 23.728046417236328, 25.51575469970703, 27.303462982177734, 29.091171264648438, 30.87887954711914, 32.666587829589844, 34.45429611206055, 36.24200439453125, 38.02970886230469, 39.817420959472656, 41.60512924194336, 43.39283752441406, 45.180545806884766, 46.96825408935547, 48.75596237182617, 50.543670654296875, 52.33137512207031, 54.119083404541016]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 1.0, 6.0, 6.0, 13.0, 16.0, 8.0, 8.0, 19.0, 20.0, 20.0, 18.0, 27.0, 25.0, 26.0, 39.0, 35.0, 44.0, 46.0, 40.0, 35.0, 44.0, 48.0, 47.0, 27.0, 60.0, 39.0, 41.0, 32.0, 27.0, 32.0, 31.0, 20.0, 20.0, 19.0, 16.0, 8.0, 14.0, 5.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.554357528686523, -24.661001205444336, -23.767642974853516, -22.874286651611328, -21.98093032836914, -21.087574005126953, -20.194215774536133, -19.300859451293945, -18.407503128051758, -17.51414680480957, -16.62078857421875, -15.727432250976562, -14.834075927734375, -13.940718650817871, -13.047361373901367, -12.15400505065918, -11.260647773742676, -10.367290496826172, -9.473934173583984, -8.58057689666748, -7.687220573425293, -6.793863296508789, -5.900506496429443, -5.007149696350098, -4.113792896270752, -3.2204360961914062, -2.3270792961120605, -1.4337222576141357, -0.54036545753479, 0.35299158096313477, 1.2463483810424805, 2.139705181121826, 3.033061981201172, 3.9264187812805176, 4.819775581359863, 5.713132858276367, 6.606489181518555, 7.499846458435059, 8.393203735351562, 9.28656005859375, 10.179916381835938, 11.073273658752441, 11.966629981994629, 12.859987258911133, 13.75334358215332, 14.646700859069824, 15.540058135986328, 16.433414459228516, 17.326770782470703, 18.22012710571289, 19.11348533630371, 20.0068416595459, 20.900197982788086, 21.793556213378906, 22.686912536621094, 23.58026885986328, 24.4736270904541, 25.36698341369629, 26.26034164428711, 27.153697967529297, 28.047054290771484, 28.940410614013672, 29.833768844604492, 30.72712516784668, 31.620481491088867]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 16.0, 10.0, 14.0, 14.0, 26.0, 27.0, 22.0, 38.0, 34.0, 37.0, 33.0, 64.0, 54.0, 51.0, 53.0, 59.0, 38.0, 56.0, 43.0, 41.0, 34.0, 33.0, 31.0, 26.0, 25.0, 20.0, 20.0, 16.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.96868896484375, -2.8651123046875, -2.76153564453125, -2.657958984375, -2.55438232421875, -2.4508056640625, -2.34722900390625, -2.24365234375, -2.14007568359375, -2.0364990234375, -1.93292236328125, -1.829345703125, -1.72576904296875, -1.6221923828125, -1.51861572265625, -1.4150390625, -1.31146240234375, -1.2078857421875, -1.10430908203125, -1.000732421875, -0.89715576171875, -0.7935791015625, -0.69000244140625, -0.58642578125, -0.48284912109375, -0.3792724609375, -0.27569580078125, -0.172119140625, -0.06854248046875, 0.0350341796875, 0.13861083984375, 0.2421875, 0.34576416015625, 0.4493408203125, 0.55291748046875, 0.656494140625, 0.76007080078125, 0.8636474609375, 0.96722412109375, 1.07080078125, 1.17437744140625, 1.2779541015625, 1.38153076171875, 1.485107421875, 1.58868408203125, 1.6922607421875, 1.79583740234375, 1.8994140625, 2.00299072265625, 2.1065673828125, 2.21014404296875, 2.313720703125, 2.41729736328125, 2.5208740234375, 2.62445068359375, 2.72802734375, 2.83160400390625, 2.9351806640625, 3.03875732421875, 3.142333984375, 3.24591064453125, 3.3494873046875, 3.45306396484375, 3.556640625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 12.0, 20.0, 16.0, 35.0, 45.0, 60.0, 119.0, 174.0, 243.0, 367.0, 580.0, 881.0, 1352.0, 2219.0, 3543.0, 5435.0, 8422.0, 13557.0, 21306.0, 33157.0, 50526.0, 74026.0, 102475.0, 130164.0, 144288.0, 131036.0, 104306.0, 75579.0, 51391.0, 33628.0, 21826.0, 13768.0, 8678.0, 5566.0, 3546.0, 2192.0, 1377.0, 972.0, 584.0, 349.0, 249.0, 132.0, 124.0, 80.0, 59.0, 27.0, 25.0, 18.0, 8.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6552734375, -0.6351242065429688, -0.6149749755859375, -0.5948257446289062, -0.574676513671875, -0.5545272827148438, -0.5343780517578125, -0.5142288208007812, -0.49407958984375, -0.47393035888671875, -0.4537811279296875, -0.43363189697265625, -0.413482666015625, -0.39333343505859375, -0.3731842041015625, -0.35303497314453125, -0.3328857421875, -0.31273651123046875, -0.2925872802734375, -0.27243804931640625, -0.252288818359375, -0.23213958740234375, -0.2119903564453125, -0.19184112548828125, -0.17169189453125, -0.15154266357421875, -0.1313934326171875, -0.11124420166015625, -0.091094970703125, -0.07094573974609375, -0.0507965087890625, -0.03064727783203125, -0.010498046875, 0.00965118408203125, 0.0298004150390625, 0.04994964599609375, 0.070098876953125, 0.09024810791015625, 0.1103973388671875, 0.13054656982421875, 0.15069580078125, 0.17084503173828125, 0.1909942626953125, 0.21114349365234375, 0.231292724609375, 0.25144195556640625, 0.2715911865234375, 0.29174041748046875, 0.3118896484375, 0.33203887939453125, 0.3521881103515625, 0.37233734130859375, 0.392486572265625, 0.41263580322265625, 0.4327850341796875, 0.45293426513671875, 0.47308349609375, 0.49323272705078125, 0.5133819580078125, 0.5335311889648438, 0.553680419921875, 0.5738296508789062, 0.5939788818359375, 0.6141281127929688, 0.63427734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 8.0, 12.0, 11.0, 8.0, 15.0, 14.0, 17.0, 15.0, 24.0, 21.0, 24.0, 25.0, 23.0, 34.0, 35.0, 28.0, 33.0, 34.0, 42.0, 37.0, 29.0, 1063.0, 48.0, 32.0, 27.0, 36.0, 49.0, 28.0, 30.0, 25.0, 36.0, 24.0, 16.0, 24.0, 19.0, 7.0, 13.0, 8.0, 15.0, 7.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.724609375, -1.6658935546875, -1.607177734375, -1.5484619140625, -1.48974609375, -1.4310302734375, -1.372314453125, -1.3135986328125, -1.2548828125, -1.1961669921875, -1.137451171875, -1.0787353515625, -1.02001953125, -0.9613037109375, -0.902587890625, -0.8438720703125, -0.78515625, -0.7264404296875, -0.667724609375, -0.6090087890625, -0.55029296875, -0.4915771484375, -0.432861328125, -0.3741455078125, -0.3154296875, -0.2567138671875, -0.197998046875, -0.1392822265625, -0.08056640625, -0.0218505859375, 0.036865234375, 0.0955810546875, 0.154296875, 0.2130126953125, 0.271728515625, 0.3304443359375, 0.38916015625, 0.4478759765625, 0.506591796875, 0.5653076171875, 0.6240234375, 0.6827392578125, 0.741455078125, 0.8001708984375, 0.85888671875, 0.9176025390625, 0.976318359375, 1.0350341796875, 1.09375, 1.1524658203125, 1.211181640625, 1.2698974609375, 1.32861328125, 1.3873291015625, 1.446044921875, 1.5047607421875, 1.5634765625, 1.6221923828125, 1.680908203125, 1.7396240234375, 1.79833984375, 1.8570556640625, 1.915771484375, 1.9744873046875, 2.033203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 4.0, 12.0, 17.0, 25.0, 45.0, 55.0, 128.0, 163.0, 320.0, 538.0, 940.0, 1771.0, 2897.0, 5475.0, 10238.0, 20589.0, 39662.0, 75966.0, 142606.0, 347457.0, 1034213.0, 197228.0, 103273.0, 54261.0, 28278.0, 14244.0, 7632.0, 3955.0, 2175.0, 1170.0, 747.0, 407.0, 253.0, 123.0, 90.0, 72.0, 35.0, 21.0, 19.0, 9.0, 5.0, 0.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.408935546875, -0.3966331481933594, -0.38433074951171875, -0.3720283508300781, -0.3597259521484375, -0.3474235534667969, -0.33512115478515625, -0.3228187561035156, -0.310516357421875, -0.2982139587402344, -0.28591156005859375, -0.2736091613769531, -0.2613067626953125, -0.24900436401367188, -0.23670196533203125, -0.22439956665039062, -0.21209716796875, -0.19979476928710938, -0.18749237060546875, -0.17518997192382812, -0.1628875732421875, -0.15058517456054688, -0.13828277587890625, -0.12598037719726562, -0.113677978515625, -0.10137557983398438, -0.08907318115234375, -0.07677078247070312, -0.0644683837890625, -0.052165985107421875, -0.03986358642578125, -0.027561187744140625, -0.0152587890625, -0.002956390380859375, 0.00934600830078125, 0.021648406982421875, 0.0339508056640625, 0.046253204345703125, 0.05855560302734375, 0.07085800170898438, 0.083160400390625, 0.09546279907226562, 0.10776519775390625, 0.12006759643554688, 0.1323699951171875, 0.14467239379882812, 0.15697479248046875, 0.16927719116210938, 0.18157958984375, 0.19388198852539062, 0.20618438720703125, 0.21848678588867188, 0.2307891845703125, 0.24309158325195312, 0.25539398193359375, 0.2676963806152344, 0.279998779296875, 0.2923011779785156, 0.30460357666015625, 0.3169059753417969, 0.3292083740234375, 0.3415107727050781, 0.35381317138671875, 0.3661155700683594, 0.37841796875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 5.0, 6.0, 8.0, 8.0, 12.0, 17.0, 8.0, 20.0, 14.0, 15.0, 18.0, 14.0, 14.0, 23.0, 21.0, 27.0, 39.0, 67.0, 109.0, 112.0, 87.0, 60.0, 41.0, 28.0, 26.0, 19.0, 17.0, 18.0, 20.0, 14.0, 13.0, 12.0, 10.0, 12.0, 9.0, 10.0, 6.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10943603515625, -0.10606002807617188, -0.10268402099609375, -0.09930801391601562, -0.0959320068359375, -0.09255599975585938, -0.08917999267578125, -0.08580398559570312, -0.082427978515625, -0.07905197143554688, -0.07567596435546875, -0.07229995727539062, -0.0689239501953125, -0.06554794311523438, -0.06217193603515625, -0.058795928955078125, -0.055419921875, -0.052043914794921875, -0.04866790771484375, -0.045291900634765625, -0.0419158935546875, -0.038539886474609375, -0.03516387939453125, -0.031787872314453125, -0.028411865234375, -0.025035858154296875, -0.02165985107421875, -0.018283843994140625, -0.0149078369140625, -0.011531829833984375, -0.00815582275390625, -0.004779815673828125, -0.00140380859375, 0.001972198486328125, 0.00534820556640625, 0.008724212646484375, 0.0121002197265625, 0.015476226806640625, 0.01885223388671875, 0.022228240966796875, 0.025604248046875, 0.028980255126953125, 0.03235626220703125, 0.035732269287109375, 0.0391082763671875, 0.042484283447265625, 0.04586029052734375, 0.049236297607421875, 0.0526123046875, 0.055988311767578125, 0.05936431884765625, 0.06274032592773438, 0.0661163330078125, 0.06949234008789062, 0.07286834716796875, 0.07624435424804688, 0.079620361328125, 0.08299636840820312, 0.08637237548828125, 0.08974838256835938, 0.0931243896484375, 0.09650039672851562, 0.09987640380859375, 0.10325241088867188, 0.10662841796875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 7.0, 3.0, 6.0, 4.0, 5.0, 6.0, 16.0, 13.0, 17.0, 23.0, 28.0, 25.0, 31.0, 32.0, 35.0, 39.0, 51.0, 55.0, 69.0, 73.0, 61.0, 111.0, 117.0, 180.0, 418.0, 1660.0, 23937.0, 904224.0, 109861.0, 5580.0, 696.0, 278.0, 148.0, 122.0, 94.0, 64.0, 74.0, 52.0, 51.0, 50.0, 31.0, 33.0, 38.0, 25.0, 19.0, 17.0, 17.0, 15.0, 9.0, 10.0, 14.0, 6.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5380859375, -1.4880523681640625, -1.438018798828125, -1.3879852294921875, -1.33795166015625, -1.2879180908203125, -1.237884521484375, -1.1878509521484375, -1.1378173828125, -1.0877838134765625, -1.037750244140625, -0.9877166748046875, -0.93768310546875, -0.8876495361328125, -0.837615966796875, -0.7875823974609375, -0.737548828125, -0.6875152587890625, -0.637481689453125, -0.5874481201171875, -0.53741455078125, -0.4873809814453125, -0.437347412109375, -0.3873138427734375, -0.3372802734375, -0.2872467041015625, -0.237213134765625, -0.1871795654296875, -0.13714599609375, -0.0871124267578125, -0.037078857421875, 0.0129547119140625, 0.06298828125, 0.1130218505859375, 0.163055419921875, 0.2130889892578125, 0.26312255859375, 0.3131561279296875, 0.363189697265625, 0.4132232666015625, 0.4632568359375, 0.5132904052734375, 0.563323974609375, 0.6133575439453125, 0.66339111328125, 0.7134246826171875, 0.763458251953125, 0.8134918212890625, 0.863525390625, 0.9135589599609375, 0.963592529296875, 1.0136260986328125, 1.06365966796875, 1.1136932373046875, 1.163726806640625, 1.2137603759765625, 1.2637939453125, 1.3138275146484375, 1.363861083984375, 1.4138946533203125, 1.46392822265625, 1.5139617919921875, 1.563995361328125, 1.6140289306640625, 1.6640625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 45.0, 895.0, 70.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5577573776245117, -2.4265780448913574, -2.295398473739624, -2.1642191410064697, -2.0330395698547363, -1.901860237121582, -1.7706807851791382, -1.6395013332366943, -1.5083218812942505, -1.3771424293518066, -1.2459629774093628, -1.114783525466919, -0.9836041331291199, -0.852424681186676, -0.721245288848877, -0.5900658369064331, -0.45888638496398926, -0.3277069330215454, -0.19652751088142395, -0.06534808874130249, 0.06583136320114136, 0.1970108151435852, 0.3281902074813843, 0.4593696594238281, 0.590549111366272, 0.7217285633087158, 0.8529080152511597, 0.9840874075889587, 1.1152667999267578, 1.2464463710784912, 1.3776257038116455, 1.5088051557540894, 1.6399846076965332, 1.771164059638977, 1.902343511581421, 2.033522844314575, 2.1647024154663086, 2.295881748199463, 2.427061080932617, 2.5582406520843506, 2.689420223236084, 2.8205995559692383, 2.9517791271209717, 3.082958459854126, 3.2141380310058594, 3.3453173637390137, 3.476496696472168, 3.6076762676239014, 3.7388556003570557, 3.87003493309021, 4.001214504241943, 4.132393836975098, 4.263573169708252, 4.3947529792785645, 4.525932312011719, 4.657111644744873, 4.788290977478027, 4.919470310211182, 5.050649642944336, 5.181829452514648, 5.313008785247803, 5.444188117980957, 5.575367450714111, 5.706546783447266, 5.837726593017578]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 8.0, 13.0, 25.0, 29.0, 34.0, 35.0, 45.0, 48.0, 64.0, 63.0, 61.0, 71.0, 57.0, 65.0, 61.0, 42.0, 46.0, 44.0, 32.0, 33.0, 29.0, 22.0, 14.0, 19.0, 8.0, 8.0, 0.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6788115501403809, -0.6622877717018127, -0.6457640528678894, -0.6292402744293213, -0.612716555595398, -0.5961927771568298, -0.5796689987182617, -0.5631452798843384, -0.5466215014457703, -0.5300977230072021, -0.5135740041732788, -0.4970502257347107, -0.48052647709846497, -0.46400272846221924, -0.4474789500236511, -0.4309552013874054, -0.41443145275115967, -0.39790770411491394, -0.3813839554786682, -0.3648601770401001, -0.34833642840385437, -0.33181267976760864, -0.3152889013290405, -0.2987651526927948, -0.2822414040565491, -0.26571765542030334, -0.24919389188289642, -0.2326701283454895, -0.21614637970924377, -0.19962263107299805, -0.18309886753559113, -0.1665751039981842, -0.15005141496658325, -0.13352766633033752, -0.1170039027929306, -0.10048014670610428, -0.08395639061927795, -0.06743263453245163, -0.050908878445625305, -0.03438512235879898, -0.017861366271972656, -0.0013376101851463318, 0.015186145901679993, 0.03170990198850632, 0.04823365807533264, 0.06475741416215897, 0.08128117024898529, 0.09780492633581161, 0.11432868242263794, 0.13085243105888367, 0.1473761945962906, 0.1638999581336975, 0.18042370676994324, 0.19694745540618896, 0.2134712189435959, 0.2299949824810028, 0.24651873111724854, 0.26304247975349426, 0.27956622838974, 0.2960900068283081, 0.31261375546455383, 0.32913750410079956, 0.3456612825393677, 0.3621850311756134, 0.37870877981185913]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 10.0, 9.0, 18.0, 18.0, 22.0, 28.0, 33.0, 38.0, 36.0, 60.0, 49.0, 54.0, 69.0, 64.0, 63.0, 69.0, 49.0, 51.0, 33.0, 40.0, 44.0, 29.0, 24.0, 27.0, 17.0, 11.0, 9.0, 4.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.72503662109375, -3.6043701171875, -3.48370361328125, -3.363037109375, -3.24237060546875, -3.1217041015625, -3.00103759765625, -2.88037109375, -2.75970458984375, -2.6390380859375, -2.51837158203125, -2.397705078125, -2.27703857421875, -2.1563720703125, -2.03570556640625, -1.9150390625, -1.79437255859375, -1.6737060546875, -1.55303955078125, -1.432373046875, -1.31170654296875, -1.1910400390625, -1.07037353515625, -0.94970703125, -0.82904052734375, -0.7083740234375, -0.58770751953125, -0.467041015625, -0.34637451171875, -0.2257080078125, -0.10504150390625, 0.015625, 0.13629150390625, 0.2569580078125, 0.37762451171875, 0.498291015625, 0.61895751953125, 0.7396240234375, 0.86029052734375, 0.98095703125, 1.10162353515625, 1.2222900390625, 1.34295654296875, 1.463623046875, 1.58428955078125, 1.7049560546875, 1.82562255859375, 1.9462890625, 2.06695556640625, 2.1876220703125, 2.30828857421875, 2.428955078125, 2.54962158203125, 2.6702880859375, 2.79095458984375, 2.91162109375, 3.03228759765625, 3.1529541015625, 3.27362060546875, 3.394287109375, 3.51495361328125, 3.6356201171875, 3.75628662109375, 3.876953125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 10.0, 16.0, 17.0, 30.0, 34.0, 53.0, 55.0, 114.0, 153.0, 248.0, 425.0, 729.0, 1367.0, 2657.0, 5519.0, 12674.0, 33149.0, 107634.0, 401027.0, 343951.0, 88900.0, 28502.0, 10885.0, 4870.0, 2423.0, 1213.0, 659.0, 399.0, 247.0, 172.0, 112.0, 77.0, 63.0, 40.0, 23.0, 20.0, 15.0, 23.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.07080078125, -4.8955078125, -4.72021484375, -4.544921875, -4.36962890625, -4.1943359375, -4.01904296875, -3.84375, -3.66845703125, -3.4931640625, -3.31787109375, -3.142578125, -2.96728515625, -2.7919921875, -2.61669921875, -2.44140625, -2.26611328125, -2.0908203125, -1.91552734375, -1.740234375, -1.56494140625, -1.3896484375, -1.21435546875, -1.0390625, -0.86376953125, -0.6884765625, -0.51318359375, -0.337890625, -0.16259765625, 0.0126953125, 0.18798828125, 0.36328125, 0.53857421875, 0.7138671875, 0.88916015625, 1.064453125, 1.23974609375, 1.4150390625, 1.59033203125, 1.765625, 1.94091796875, 2.1162109375, 2.29150390625, 2.466796875, 2.64208984375, 2.8173828125, 2.99267578125, 3.16796875, 3.34326171875, 3.5185546875, 3.69384765625, 3.869140625, 4.04443359375, 4.2197265625, 4.39501953125, 4.5703125, 4.74560546875, 4.9208984375, 5.09619140625, 5.271484375, 5.44677734375, 5.6220703125, 5.79736328125, 5.97265625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 10.0, 9.0, 12.0, 10.0, 11.0, 11.0, 15.0, 14.0, 37.0, 32.0, 33.0, 28.0, 36.0, 38.0, 51.0, 58.0, 100.0, 167.0, 283.0, 1353.0, 188.0, 97.0, 66.0, 57.0, 35.0, 37.0, 32.0, 29.0, 30.0, 29.0, 26.0, 17.0, 15.0, 14.0, 15.0, 7.0, 7.0, 6.0, 6.0, 4.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.4075927734375, -10.072998046875, -9.7384033203125, -9.40380859375, -9.0692138671875, -8.734619140625, -8.4000244140625, -8.0654296875, -7.7308349609375, -7.396240234375, -7.0616455078125, -6.72705078125, -6.3924560546875, -6.057861328125, -5.7232666015625, -5.388671875, -5.0540771484375, -4.719482421875, -4.3848876953125, -4.05029296875, -3.7156982421875, -3.381103515625, -3.0465087890625, -2.7119140625, -2.3773193359375, -2.042724609375, -1.7081298828125, -1.37353515625, -1.0389404296875, -0.704345703125, -0.3697509765625, -0.03515625, 0.2994384765625, 0.634033203125, 0.9686279296875, 1.30322265625, 1.6378173828125, 1.972412109375, 2.3070068359375, 2.6416015625, 2.9761962890625, 3.310791015625, 3.6453857421875, 3.97998046875, 4.3145751953125, 4.649169921875, 4.9837646484375, 5.318359375, 5.6529541015625, 5.987548828125, 6.3221435546875, 6.65673828125, 6.9913330078125, 7.325927734375, 7.6605224609375, 7.9951171875, 8.3297119140625, 8.664306640625, 8.9989013671875, 9.33349609375, 9.6680908203125, 10.002685546875, 10.3372802734375, 10.671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 9.0, 17.0, 18.0, 14.0, 23.0, 32.0, 35.0, 54.0, 61.0, 80.0, 133.0, 191.0, 388.0, 901.0, 2944.0, 13522.0, 121426.0, 2537564.0, 432525.0, 27985.0, 4943.0, 1441.0, 515.0, 285.0, 172.0, 93.0, 81.0, 54.0, 45.0, 31.0, 19.0, 26.0, 9.0, 7.0, 11.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.1400146484375, -13.647216796875, -13.1544189453125, -12.66162109375, -12.1688232421875, -11.676025390625, -11.1832275390625, -10.6904296875, -10.1976318359375, -9.704833984375, -9.2120361328125, -8.71923828125, -8.2264404296875, -7.733642578125, -7.2408447265625, -6.748046875, -6.2552490234375, -5.762451171875, -5.2696533203125, -4.77685546875, -4.2840576171875, -3.791259765625, -3.2984619140625, -2.8056640625, -2.3128662109375, -1.820068359375, -1.3272705078125, -0.83447265625, -0.3416748046875, 0.151123046875, 0.6439208984375, 1.13671875, 1.6295166015625, 2.122314453125, 2.6151123046875, 3.10791015625, 3.6007080078125, 4.093505859375, 4.5863037109375, 5.0791015625, 5.5718994140625, 6.064697265625, 6.5574951171875, 7.05029296875, 7.5430908203125, 8.035888671875, 8.5286865234375, 9.021484375, 9.5142822265625, 10.007080078125, 10.4998779296875, 10.99267578125, 11.4854736328125, 11.978271484375, 12.4710693359375, 12.9638671875, 13.4566650390625, 13.949462890625, 14.4422607421875, 14.93505859375, 15.4278564453125, 15.920654296875, 16.4134521484375, 16.90625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [19.0, 403.0, 562.0, 33.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.081791877746582, -5.270118713378906, -0.45844554901123047, 4.353227615356445, 9.164900779724121, 13.97657299041748, 18.788246154785156, 23.59992218017578, 28.41159439086914, 33.2232666015625, 38.034942626953125, 42.846614837646484, 47.658287048339844, 52.4699592590332, 57.28163146972656, 62.09330749511719, 66.90497589111328, 71.7166519165039, 76.5283203125, 81.33999633789062, 86.15167236328125, 90.96334075927734, 95.77501678466797, 100.58668518066406, 105.39836120605469, 110.21003723144531, 115.0217056274414, 119.83338165283203, 124.64505004882812, 129.45672607421875, 134.26840209960938, 139.080078125, 143.89175415039062, 148.70343017578125, 153.51510620117188, 158.32676696777344, 163.13844299316406, 167.9501190185547, 172.7617950439453, 177.57347106933594, 182.3851318359375, 187.19680786132812, 192.00848388671875, 196.8201446533203, 201.63182067871094, 206.44349670410156, 211.2551727294922, 216.0668487548828, 220.87852478027344, 225.69020080566406, 230.5018768310547, 235.31353759765625, 240.12521362304688, 244.9368896484375, 249.74856567382812, 254.56024169921875, 259.3719177246094, 264.18359375, 268.9952697753906, 273.80694580078125, 278.6186218261719, 283.4302978515625, 288.241943359375, 293.0536193847656, 297.86529541015625]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 7.0, 9.0, 12.0, 14.0, 15.0, 14.0, 24.0, 13.0, 22.0, 20.0, 29.0, 26.0, 33.0, 29.0, 20.0, 37.0, 30.0, 42.0, 54.0, 51.0, 39.0, 34.0, 27.0, 43.0, 35.0, 24.0, 25.0, 37.0, 29.0, 19.0, 23.0, 28.0, 21.0, 14.0, 10.0, 22.0, 13.0, 6.0, 6.0, 8.0, 2.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.561973571777344, -34.51008224487305, -33.458187103271484, -32.40629577636719, -31.354402542114258, -30.302509307861328, -29.25061798095703, -28.1987247467041, -27.146831512451172, -26.094938278198242, -25.043046951293945, -23.991153717041016, -22.939260482788086, -21.887367248535156, -20.83547592163086, -19.78358268737793, -18.731691360473633, -17.679798126220703, -16.627906799316406, -15.576013565063477, -14.524120330810547, -13.472228050231934, -12.42033576965332, -11.36844253540039, -10.316550254821777, -9.264657974243164, -8.212764739990234, -7.160872459411621, -6.10897970199585, -5.057086944580078, -4.005194664001465, -2.9533019065856934, -1.9014110565185547, -0.8495184183120728, 0.20237421989440918, 1.2542667388916016, 2.306159496307373, 3.3580522537231445, 4.409944534301758, 5.461837291717529, 6.513730049133301, 7.565622806549072, 8.617515563964844, 9.669407844543457, 10.72130012512207, 11.773193359375, 12.825085639953613, 13.876977920532227, 14.928871154785156, 15.98076343536377, 17.032655715942383, 18.084548950195312, 19.136442184448242, 20.188335418701172, 21.24022674560547, 22.2921199798584, 23.344013214111328, 24.395906448364258, 25.447797775268555, 26.499691009521484, 27.551584243774414, 28.603477478027344, 29.65536880493164, 30.70726203918457, 31.759153366088867]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 4.0, 9.0, 7.0, 13.0, 12.0, 16.0, 27.0, 24.0, 36.0, 38.0, 45.0, 46.0, 43.0, 55.0, 48.0, 45.0, 57.0, 45.0, 51.0, 46.0, 42.0, 33.0, 29.0, 33.0, 35.0, 28.0, 23.0, 21.0, 18.0, 10.0, 10.0, 5.0, 11.0, 3.0, 7.0, 3.0, 6.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.326171875, -3.2174072265625, -3.108642578125, -2.9998779296875, -2.89111328125, -2.7823486328125, -2.673583984375, -2.5648193359375, -2.4560546875, -2.3472900390625, -2.238525390625, -2.1297607421875, -2.02099609375, -1.9122314453125, -1.803466796875, -1.6947021484375, -1.5859375, -1.4771728515625, -1.368408203125, -1.2596435546875, -1.15087890625, -1.0421142578125, -0.933349609375, -0.8245849609375, -0.7158203125, -0.6070556640625, -0.498291015625, -0.3895263671875, -0.28076171875, -0.1719970703125, -0.063232421875, 0.0455322265625, 0.154296875, 0.2630615234375, 0.371826171875, 0.4805908203125, 0.58935546875, 0.6981201171875, 0.806884765625, 0.9156494140625, 1.0244140625, 1.1331787109375, 1.241943359375, 1.3507080078125, 1.45947265625, 1.5682373046875, 1.677001953125, 1.7857666015625, 1.89453125, 2.0032958984375, 2.112060546875, 2.2208251953125, 2.32958984375, 2.4383544921875, 2.547119140625, 2.6558837890625, 2.7646484375, 2.8734130859375, 2.982177734375, 3.0909423828125, 3.19970703125, 3.3084716796875, 3.417236328125, 3.5260009765625, 3.634765625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 12.0, 8.0, 16.0, 28.0, 39.0, 43.0, 68.0, 100.0, 119.0, 225.0, 303.0, 537.0, 984.0, 2031.0, 5353.0, 19524.0, 116673.0, 1238203.0, 2496971.0, 267687.0, 33678.0, 7291.0, 2235.0, 908.0, 416.0, 239.0, 162.0, 101.0, 76.0, 60.0, 48.0, 27.0, 24.0, 18.0, 14.0, 13.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.921875, -11.5626220703125, -11.203369140625, -10.8441162109375, -10.48486328125, -10.1256103515625, -9.766357421875, -9.4071044921875, -9.0478515625, -8.6885986328125, -8.329345703125, -7.9700927734375, -7.61083984375, -7.2515869140625, -6.892333984375, -6.5330810546875, -6.173828125, -5.8145751953125, -5.455322265625, -5.0960693359375, -4.73681640625, -4.3775634765625, -4.018310546875, -3.6590576171875, -3.2998046875, -2.9405517578125, -2.581298828125, -2.2220458984375, -1.86279296875, -1.5035400390625, -1.144287109375, -0.7850341796875, -0.42578125, -0.0665283203125, 0.292724609375, 0.6519775390625, 1.01123046875, 1.3704833984375, 1.729736328125, 2.0889892578125, 2.4482421875, 2.8074951171875, 3.166748046875, 3.5260009765625, 3.88525390625, 4.2445068359375, 4.603759765625, 4.9630126953125, 5.322265625, 5.6815185546875, 6.040771484375, 6.4000244140625, 6.75927734375, 7.1185302734375, 7.477783203125, 7.8370361328125, 8.1962890625, 8.5555419921875, 8.914794921875, 9.2740478515625, 9.63330078125, 9.9925537109375, 10.351806640625, 10.7110595703125, 11.0703125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 10.0, 8.0, 12.0, 17.0, 20.0, 26.0, 38.0, 58.0, 75.0, 105.0, 137.0, 211.0, 316.0, 385.0, 471.0, 552.0, 441.0, 324.0, 247.0, 188.0, 125.0, 100.0, 43.0, 52.0, 26.0, 24.0, 16.0, 18.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.278076171875, -8.97021484375, -8.662353515625, -8.3544921875, -8.046630859375, -7.73876953125, -7.430908203125, -7.123046875, -6.815185546875, -6.50732421875, -6.199462890625, -5.8916015625, -5.583740234375, -5.27587890625, -4.968017578125, -4.66015625, -4.352294921875, -4.04443359375, -3.736572265625, -3.4287109375, -3.120849609375, -2.81298828125, -2.505126953125, -2.197265625, -1.889404296875, -1.58154296875, -1.273681640625, -0.9658203125, -0.657958984375, -0.35009765625, -0.042236328125, 0.265625, 0.573486328125, 0.88134765625, 1.189208984375, 1.4970703125, 1.804931640625, 2.11279296875, 2.420654296875, 2.728515625, 3.036376953125, 3.34423828125, 3.652099609375, 3.9599609375, 4.267822265625, 4.57568359375, 4.883544921875, 5.19140625, 5.499267578125, 5.80712890625, 6.114990234375, 6.4228515625, 6.730712890625, 7.03857421875, 7.346435546875, 7.654296875, 7.962158203125, 8.27001953125, 8.577880859375, 8.8857421875, 9.193603515625, 9.50146484375, 9.809326171875, 10.1171875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 5.0, 7.0, 6.0, 10.0, 11.0, 19.0, 31.0, 46.0, 52.0, 80.0, 121.0, 232.0, 441.0, 871.0, 2210.0, 7188.0, 32523.0, 222824.0, 1727538.0, 1899752.0, 251984.0, 36183.0, 7708.0, 2374.0, 956.0, 442.0, 220.0, 149.0, 92.0, 49.0, 44.0, 37.0, 22.0, 13.0, 10.0, 10.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.90625, -16.37841796875, -15.8505859375, -15.32275390625, -14.794921875, -14.26708984375, -13.7392578125, -13.21142578125, -12.68359375, -12.15576171875, -11.6279296875, -11.10009765625, -10.572265625, -10.04443359375, -9.5166015625, -8.98876953125, -8.4609375, -7.93310546875, -7.4052734375, -6.87744140625, -6.349609375, -5.82177734375, -5.2939453125, -4.76611328125, -4.23828125, -3.71044921875, -3.1826171875, -2.65478515625, -2.126953125, -1.59912109375, -1.0712890625, -0.54345703125, -0.015625, 0.51220703125, 1.0400390625, 1.56787109375, 2.095703125, 2.62353515625, 3.1513671875, 3.67919921875, 4.20703125, 4.73486328125, 5.2626953125, 5.79052734375, 6.318359375, 6.84619140625, 7.3740234375, 7.90185546875, 8.4296875, 8.95751953125, 9.4853515625, 10.01318359375, 10.541015625, 11.06884765625, 11.5966796875, 12.12451171875, 12.65234375, 13.18017578125, 13.7080078125, 14.23583984375, 14.763671875, 15.29150390625, 15.8193359375, 16.34716796875, 16.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 11.0, 27.0, 29.0, 52.0, 92.0, 102.0, 136.0, 147.0, 134.0, 96.0, 75.0, 61.0, 21.0, 19.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.36311721801758, -54.36628723144531, -52.36945343017578, -50.37261962890625, -48.375789642333984, -46.37895965576172, -44.38212585449219, -42.385292053222656, -40.38846206665039, -38.391632080078125, -36.394798278808594, -34.39796447753906, -32.4011344909668, -30.4043025970459, -28.407470703125, -26.4106388092041, -24.413806915283203, -22.416975021362305, -20.420143127441406, -18.423311233520508, -16.42647933959961, -14.429647445678711, -12.432815551757812, -10.435983657836914, -8.439151763916016, -6.442319869995117, -4.445487976074219, -2.4486560821533203, -0.4518241882324219, 1.5450077056884766, 3.541839599609375, 5.538671493530273, 7.535499572753906, 9.532331466674805, 11.529163360595703, 13.525995254516602, 15.5228271484375, 17.5196590423584, 19.516490936279297, 21.513322830200195, 23.510154724121094, 25.506986618041992, 27.50381851196289, 29.50065040588379, 31.497482299804688, 33.49431610107422, 35.491146087646484, 37.48797607421875, 39.48480987548828, 41.48164367675781, 43.47847366333008, 45.475303649902344, 47.472137451171875, 49.468971252441406, 51.46580123901367, 53.46263122558594, 55.45946502685547, 57.456298828125, 59.453128814697266, 61.44995880126953, 63.44679260253906, 65.4436264038086, 67.44046020507812, 69.43728637695312, 71.43412017822266]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 6.0, 8.0, 10.0, 9.0, 14.0, 16.0, 14.0, 18.0, 30.0, 21.0, 29.0, 27.0, 34.0, 39.0, 34.0, 39.0, 40.0, 43.0, 54.0, 35.0, 46.0, 36.0, 35.0, 54.0, 34.0, 27.0, 26.0, 40.0, 33.0, 23.0, 18.0, 16.0, 12.0, 16.0, 11.0, 9.0, 4.0, 7.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.791810989379883, -27.859891891479492, -26.9279727935791, -25.996055603027344, -25.064136505126953, -24.132217407226562, -23.200298309326172, -22.26837921142578, -21.33646011352539, -20.404541015625, -19.47262191772461, -18.54070281982422, -17.60878562927246, -16.67686653137207, -15.74494743347168, -14.813028335571289, -13.881111145019531, -12.94919204711914, -12.017273902893066, -11.085354804992676, -10.153436660766602, -9.221517562866211, -8.28959846496582, -7.357679843902588, -6.4257612228393555, -5.493842601776123, -4.561923980712891, -3.6300048828125, -2.6980862617492676, -1.7661676406860352, -0.8342485427856445, 0.09767007827758789, 1.0295906066894531, 1.961509346961975, 2.893428087234497, 3.8253469467163086, 4.757265567779541, 5.689184188842773, 6.621103286743164, 7.5530219078063965, 8.484940528869629, 9.41685962677002, 10.348777770996094, 11.280696868896484, 12.212615966796875, 13.14453411102295, 14.07645320892334, 15.008371353149414, 15.940290451049805, 16.872209548950195, 17.804128646850586, 18.736045837402344, 19.667964935302734, 20.599884033203125, 21.531803131103516, 22.463722229003906, 23.395641326904297, 24.327560424804688, 25.259479522705078, 26.19139862060547, 27.123315811157227, 28.055234909057617, 28.987154006958008, 29.9190731048584, 30.850990295410156]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 4.0, 8.0, 8.0, 14.0, 17.0, 16.0, 20.0, 25.0, 34.0, 34.0, 33.0, 41.0, 52.0, 49.0, 59.0, 48.0, 58.0, 47.0, 45.0, 40.0, 38.0, 41.0, 40.0, 31.0, 28.0, 28.0, 25.0, 18.0, 21.0, 10.0, 8.0, 9.0, 9.0, 11.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.615234375, -3.504791259765625, -3.39434814453125, -3.283905029296875, -3.1734619140625, -3.063018798828125, -2.95257568359375, -2.842132568359375, -2.731689453125, -2.621246337890625, -2.51080322265625, -2.400360107421875, -2.2899169921875, -2.179473876953125, -2.06903076171875, -1.958587646484375, -1.84814453125, -1.737701416015625, -1.62725830078125, -1.516815185546875, -1.4063720703125, -1.295928955078125, -1.18548583984375, -1.075042724609375, -0.964599609375, -0.854156494140625, -0.74371337890625, -0.633270263671875, -0.5228271484375, -0.412384033203125, -0.30194091796875, -0.191497802734375, -0.0810546875, 0.029388427734375, 0.13983154296875, 0.250274658203125, 0.3607177734375, 0.471160888671875, 0.58160400390625, 0.692047119140625, 0.802490234375, 0.912933349609375, 1.02337646484375, 1.133819580078125, 1.2442626953125, 1.354705810546875, 1.46514892578125, 1.575592041015625, 1.68603515625, 1.796478271484375, 1.90692138671875, 2.017364501953125, 2.1278076171875, 2.238250732421875, 2.34869384765625, 2.459136962890625, 2.569580078125, 2.680023193359375, 2.79046630859375, 2.900909423828125, 3.0113525390625, 3.121795654296875, 3.23223876953125, 3.342681884765625, 3.453125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 21.0, 18.0, 31.0, 41.0, 52.0, 68.0, 116.0, 152.0, 231.0, 290.0, 446.0, 648.0, 1042.0, 1588.0, 2590.0, 4072.0, 6624.0, 11053.0, 18183.0, 31264.0, 53190.0, 87992.0, 133222.0, 173957.0, 172536.0, 132344.0, 86487.0, 52509.0, 30852.0, 18310.0, 10638.0, 6534.0, 3959.0, 2571.0, 1650.0, 1119.0, 670.0, 479.0, 310.0, 219.0, 156.0, 104.0, 76.0, 41.0, 23.0, 31.0, 15.0, 10.0, 9.0, 1.0, 4.0, 2.0, 5.0], "bins": [-0.96337890625, -0.9358444213867188, -0.9083099365234375, -0.8807754516601562, -0.853240966796875, -0.8257064819335938, -0.7981719970703125, -0.7706375122070312, -0.74310302734375, -0.7155685424804688, -0.6880340576171875, -0.6604995727539062, -0.632965087890625, -0.6054306030273438, -0.5778961181640625, -0.5503616333007812, -0.5228271484375, -0.49529266357421875, -0.4677581787109375, -0.44022369384765625, -0.412689208984375, -0.38515472412109375, -0.3576202392578125, -0.33008575439453125, -0.30255126953125, -0.27501678466796875, -0.2474822998046875, -0.21994781494140625, -0.192413330078125, -0.16487884521484375, -0.1373443603515625, -0.10980987548828125, -0.082275390625, -0.05474090576171875, -0.0272064208984375, 0.00032806396484375, 0.027862548828125, 0.05539703369140625, 0.0829315185546875, 0.11046600341796875, 0.13800048828125, 0.16553497314453125, 0.1930694580078125, 0.22060394287109375, 0.248138427734375, 0.27567291259765625, 0.3032073974609375, 0.33074188232421875, 0.3582763671875, 0.38581085205078125, 0.4133453369140625, 0.44087982177734375, 0.468414306640625, 0.49594879150390625, 0.5234832763671875, 0.5510177612304688, 0.57855224609375, 0.6060867309570312, 0.6336212158203125, 0.6611557006835938, 0.688690185546875, 0.7162246704101562, 0.7437591552734375, 0.7712936401367188, 0.798828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 6.0, 8.0, 18.0, 14.0, 16.0, 17.0, 24.0, 25.0, 30.0, 26.0, 35.0, 42.0, 37.0, 33.0, 48.0, 56.0, 40.0, 1074.0, 40.0, 44.0, 43.0, 47.0, 29.0, 30.0, 29.0, 25.0, 31.0, 23.0, 24.0, 16.0, 15.0, 9.0, 7.0, 14.0, 10.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.412109375, -2.332427978515625, -2.25274658203125, -2.173065185546875, -2.0933837890625, -2.013702392578125, -1.93402099609375, -1.854339599609375, -1.774658203125, -1.694976806640625, -1.61529541015625, -1.535614013671875, -1.4559326171875, -1.376251220703125, -1.29656982421875, -1.216888427734375, -1.13720703125, -1.057525634765625, -0.97784423828125, -0.898162841796875, -0.8184814453125, -0.738800048828125, -0.65911865234375, -0.579437255859375, -0.499755859375, -0.420074462890625, -0.34039306640625, -0.260711669921875, -0.1810302734375, -0.101348876953125, -0.02166748046875, 0.058013916015625, 0.1376953125, 0.217376708984375, 0.29705810546875, 0.376739501953125, 0.4564208984375, 0.536102294921875, 0.61578369140625, 0.695465087890625, 0.775146484375, 0.854827880859375, 0.93450927734375, 1.014190673828125, 1.0938720703125, 1.173553466796875, 1.25323486328125, 1.332916259765625, 1.41259765625, 1.492279052734375, 1.57196044921875, 1.651641845703125, 1.7313232421875, 1.811004638671875, 1.89068603515625, 1.970367431640625, 2.050048828125, 2.129730224609375, 2.20941162109375, 2.289093017578125, 2.3687744140625, 2.448455810546875, 2.52813720703125, 2.607818603515625, 2.6875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 7.0, 19.0, 32.0, 25.0, 32.0, 65.0, 71.0, 145.0, 179.0, 258.0, 418.0, 645.0, 1035.0, 1691.0, 2887.0, 4801.0, 8942.0, 16042.0, 30432.0, 57412.0, 103957.0, 182651.0, 1136405.0, 261803.0, 129107.0, 72355.0, 39028.0, 20559.0, 10950.0, 6132.0, 3444.0, 2076.0, 1238.0, 777.0, 496.0, 303.0, 212.0, 161.0, 114.0, 77.0, 40.0, 31.0, 17.0, 12.0, 12.0, 5.0, 7.0, 10.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.416259765625, -0.4026985168457031, -0.38913726806640625, -0.3755760192871094, -0.3620147705078125, -0.3484535217285156, -0.33489227294921875, -0.3213310241699219, -0.307769775390625, -0.2942085266113281, -0.28064727783203125, -0.2670860290527344, -0.2535247802734375, -0.23996353149414062, -0.22640228271484375, -0.21284103393554688, -0.19927978515625, -0.18571853637695312, -0.17215728759765625, -0.15859603881835938, -0.1450347900390625, -0.13147354125976562, -0.11791229248046875, -0.10435104370117188, -0.090789794921875, -0.07722854614257812, -0.06366729736328125, -0.050106048583984375, -0.0365447998046875, -0.022983551025390625, -0.00942230224609375, 0.004138946533203125, 0.0177001953125, 0.031261444091796875, 0.04482269287109375, 0.058383941650390625, 0.0719451904296875, 0.08550643920898438, 0.09906768798828125, 0.11262893676757812, 0.126190185546875, 0.13975143432617188, 0.15331268310546875, 0.16687393188476562, 0.1804351806640625, 0.19399642944335938, 0.20755767822265625, 0.22111892700195312, 0.23468017578125, 0.24824142456054688, 0.26180267333984375, 0.2753639221191406, 0.2889251708984375, 0.3024864196777344, 0.31604766845703125, 0.3296089172363281, 0.343170166015625, 0.3567314147949219, 0.37029266357421875, 0.3838539123535156, 0.3974151611328125, 0.4109764099121094, 0.42453765869140625, 0.4380989074707031, 0.45166015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 2.0, 3.0, 8.0, 10.0, 5.0, 14.0, 11.0, 12.0, 21.0, 20.0, 21.0, 48.0, 91.0, 158.0, 173.0, 124.0, 68.0, 36.0, 23.0, 18.0, 20.0, 15.0, 10.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.149169921875, -0.1447010040283203, -0.14023208618164062, -0.13576316833496094, -0.13129425048828125, -0.12682533264160156, -0.12235641479492188, -0.11788749694824219, -0.1134185791015625, -0.10894966125488281, -0.10448074340820312, -0.10001182556152344, -0.09554290771484375, -0.09107398986816406, -0.08660507202148438, -0.08213615417480469, -0.077667236328125, -0.07319831848144531, -0.06872940063476562, -0.06426048278808594, -0.05979156494140625, -0.05532264709472656, -0.050853729248046875, -0.04638481140136719, -0.0419158935546875, -0.03744697570800781, -0.032978057861328125, -0.028509140014648438, -0.02404022216796875, -0.019571304321289062, -0.015102386474609375, -0.010633468627929688, -0.00616455078125, -0.0016956329345703125, 0.002773284912109375, 0.0072422027587890625, 0.01171112060546875, 0.016180038452148438, 0.020648956298828125, 0.025117874145507812, 0.0295867919921875, 0.03405570983886719, 0.038524627685546875, 0.04299354553222656, 0.04746246337890625, 0.05193138122558594, 0.056400299072265625, 0.06086921691894531, 0.065338134765625, 0.06980705261230469, 0.07427597045898438, 0.07874488830566406, 0.08321380615234375, 0.08768272399902344, 0.09215164184570312, 0.09662055969238281, 0.1010894775390625, 0.10555839538574219, 0.11002731323242188, 0.11449623107910156, 0.11896514892578125, 0.12343406677246094, 0.12790298461914062, 0.1323719024658203, 0.1368408203125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 7.0, 11.0, 9.0, 9.0, 13.0, 13.0, 7.0, 17.0, 28.0, 37.0, 27.0, 34.0, 58.0, 64.0, 83.0, 153.0, 370.0, 1093.0, 4006.0, 27338.0, 977035.0, 31713.0, 4267.0, 1182.0, 366.0, 149.0, 100.0, 63.0, 52.0, 41.0, 36.0, 21.0, 18.0, 18.0, 16.0, 8.0, 13.0, 14.0, 11.0, 8.0, 6.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9375, -1.8740234375, -1.810546875, -1.7470703125, -1.68359375, -1.6201171875, -1.556640625, -1.4931640625, -1.4296875, -1.3662109375, -1.302734375, -1.2392578125, -1.17578125, -1.1123046875, -1.048828125, -0.9853515625, -0.921875, -0.8583984375, -0.794921875, -0.7314453125, -0.66796875, -0.6044921875, -0.541015625, -0.4775390625, -0.4140625, -0.3505859375, -0.287109375, -0.2236328125, -0.16015625, -0.0966796875, -0.033203125, 0.0302734375, 0.09375, 0.1572265625, 0.220703125, 0.2841796875, 0.34765625, 0.4111328125, 0.474609375, 0.5380859375, 0.6015625, 0.6650390625, 0.728515625, 0.7919921875, 0.85546875, 0.9189453125, 0.982421875, 1.0458984375, 1.109375, 1.1728515625, 1.236328125, 1.2998046875, 1.36328125, 1.4267578125, 1.490234375, 1.5537109375, 1.6171875, 1.6806640625, 1.744140625, 1.8076171875, 1.87109375, 1.9345703125, 1.998046875, 2.0615234375, 2.125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 86.0, 723.0, 181.0, 15.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.234398603439331, -1.1601821184158325, -1.085965633392334, -1.0117491483688354, -0.9375326633453369, -0.8633161783218384, -0.7890996336936951, -0.7148831486701965, -0.640666663646698, -0.5664501786231995, -0.4922336935997009, -0.41801717877388, -0.34380069375038147, -0.26958420872688293, -0.195367693901062, -0.12115120887756348, -0.04693472385406494, 0.02728176862001419, 0.10149826109409332, 0.17571476101875305, 0.2499312460422516, 0.3241477310657501, 0.39836424589157104, 0.4725807309150696, 0.5467972159385681, 0.6210137009620667, 0.6952301859855652, 0.7694467306137085, 0.843663215637207, 0.9178797006607056, 0.9920961856842041, 1.0663126707077026, 1.1405291557312012, 1.2147456407546997, 1.2889621257781982, 1.3631786108016968, 1.4373950958251953, 1.5116115808486938, 1.5858280658721924, 1.6600446701049805, 1.7342610359191895, 1.808477520942688, 1.8826940059661865, 1.956910490989685, 2.0311269760131836, 2.1053435802459717, 2.1795599460601807, 2.2537765502929688, 2.3279929161071777, 2.402209520339966, 2.476425886154175, 2.550642490386963, 2.624858856201172, 2.69907546043396, 2.773291826248169, 2.847508430480957, 2.921725034713745, 2.995941638946533, 3.070158004760742, 3.1443746089935303, 3.2185909748077393, 3.2928075790405273, 3.3670239448547363, 3.4412405490875244, 3.5154569149017334]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 9.0, 7.0, 16.0, 15.0, 22.0, 34.0, 32.0, 39.0, 42.0, 58.0, 62.0, 72.0, 48.0, 65.0, 56.0, 64.0, 48.0, 40.0, 49.0, 46.0, 30.0, 25.0, 41.0, 11.0, 21.0, 16.0, 5.0, 11.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4546080231666565, -0.44348543882369995, -0.4323628842830658, -0.42124029994010925, -0.4101177155971527, -0.39899513125419617, -0.387872576713562, -0.37674999237060547, -0.3656274080276489, -0.3545048236846924, -0.3433822691440582, -0.3322596848011017, -0.32113710045814514, -0.3100145161151886, -0.29889196157455444, -0.2877693772315979, -0.27664679288864136, -0.2655242085456848, -0.25440165400505066, -0.24327906966209412, -0.23215648531913757, -0.22103391587734222, -0.20991134643554688, -0.19878876209259033, -0.18766620755195618, -0.17654363811016083, -0.16542105376720428, -0.15429848432540894, -0.1431758999824524, -0.13205333054065704, -0.1209307536482811, -0.10980817675590515, -0.09868559241294861, -0.08756301552057266, -0.07644043862819672, -0.06531786918640137, -0.05419528856873512, -0.04307271167635918, -0.03195013850927353, -0.020827561616897583, -0.009704984724521637, 0.0014175912365317345, 0.012540167197585106, 0.023662742227315903, 0.03478531911969185, 0.045907896012067795, 0.05703046917915344, 0.06815304607152939, 0.07927562296390533, 0.09039819985628128, 0.10152077674865723, 0.11264334619045258, 0.12376593053340912, 0.13488849997520447, 0.146011084318161, 0.15713365375995636, 0.1682562232017517, 0.17937879264354706, 0.1905013769865036, 0.20162394642829895, 0.2127465307712555, 0.22386910021305084, 0.2349916696548462, 0.24611425399780273, 0.2572368383407593]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 6.0, 7.0, 9.0, 13.0, 21.0, 17.0, 29.0, 19.0, 32.0, 51.0, 38.0, 52.0, 44.0, 60.0, 59.0, 54.0, 63.0, 62.0, 47.0, 35.0, 44.0, 37.0, 35.0, 30.0, 26.0, 21.0, 21.0, 14.0, 12.0, 9.0, 4.0, 10.0, 8.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.849822998046875, -3.72503662109375, -3.600250244140625, -3.4754638671875, -3.350677490234375, -3.22589111328125, -3.101104736328125, -2.976318359375, -2.851531982421875, -2.72674560546875, -2.601959228515625, -2.4771728515625, -2.352386474609375, -2.22760009765625, -2.102813720703125, -1.97802734375, -1.853240966796875, -1.72845458984375, -1.603668212890625, -1.4788818359375, -1.354095458984375, -1.22930908203125, -1.104522705078125, -0.979736328125, -0.854949951171875, -0.73016357421875, -0.605377197265625, -0.4805908203125, -0.355804443359375, -0.23101806640625, -0.106231689453125, 0.0185546875, 0.143341064453125, 0.26812744140625, 0.392913818359375, 0.5177001953125, 0.642486572265625, 0.76727294921875, 0.892059326171875, 1.016845703125, 1.141632080078125, 1.26641845703125, 1.391204833984375, 1.5159912109375, 1.640777587890625, 1.76556396484375, 1.890350341796875, 2.01513671875, 2.139923095703125, 2.26470947265625, 2.389495849609375, 2.5142822265625, 2.639068603515625, 2.76385498046875, 2.888641357421875, 3.013427734375, 3.138214111328125, 3.26300048828125, 3.387786865234375, 3.5125732421875, 3.637359619140625, 3.76214599609375, 3.886932373046875, 4.01171875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 19.0, 19.0, 32.0, 59.0, 79.0, 99.0, 131.0, 209.0, 350.0, 529.0, 821.0, 1256.0, 1866.0, 3114.0, 4943.0, 8207.0, 13913.0, 24701.0, 45666.0, 87469.0, 161530.0, 235496.0, 201569.0, 117404.0, 60802.0, 32938.0, 18357.0, 10302.0, 6165.0, 3831.0, 2354.0, 1499.0, 970.0, 618.0, 438.0, 257.0, 165.0, 118.0, 74.0, 53.0, 38.0, 25.0, 18.0, 11.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.283203125, -2.21343994140625, -2.1436767578125, -2.07391357421875, -2.004150390625, -1.93438720703125, -1.8646240234375, -1.79486083984375, -1.72509765625, -1.65533447265625, -1.5855712890625, -1.51580810546875, -1.446044921875, -1.37628173828125, -1.3065185546875, -1.23675537109375, -1.1669921875, -1.09722900390625, -1.0274658203125, -0.95770263671875, -0.887939453125, -0.81817626953125, -0.7484130859375, -0.67864990234375, -0.60888671875, -0.53912353515625, -0.4693603515625, -0.39959716796875, -0.329833984375, -0.26007080078125, -0.1903076171875, -0.12054443359375, -0.05078125, 0.01898193359375, 0.0887451171875, 0.15850830078125, 0.228271484375, 0.29803466796875, 0.3677978515625, 0.43756103515625, 0.50732421875, 0.57708740234375, 0.6468505859375, 0.71661376953125, 0.786376953125, 0.85614013671875, 0.9259033203125, 0.99566650390625, 1.0654296875, 1.13519287109375, 1.2049560546875, 1.27471923828125, 1.344482421875, 1.41424560546875, 1.4840087890625, 1.55377197265625, 1.62353515625, 1.69329833984375, 1.7630615234375, 1.83282470703125, 1.902587890625, 1.97235107421875, 2.0421142578125, 2.11187744140625, 2.181640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 15.0, 10.0, 11.0, 17.0, 12.0, 14.0, 26.0, 30.0, 33.0, 22.0, 30.0, 52.0, 57.0, 76.0, 79.0, 225.0, 1529.0, 288.0, 102.0, 45.0, 49.0, 53.0, 51.0, 47.0, 35.0, 20.0, 22.0, 26.0, 16.0, 8.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.6865234375, -11.263671875, -10.8408203125, -10.41796875, -9.9951171875, -9.572265625, -9.1494140625, -8.7265625, -8.3037109375, -7.880859375, -7.4580078125, -7.03515625, -6.6123046875, -6.189453125, -5.7666015625, -5.34375, -4.9208984375, -4.498046875, -4.0751953125, -3.65234375, -3.2294921875, -2.806640625, -2.3837890625, -1.9609375, -1.5380859375, -1.115234375, -0.6923828125, -0.26953125, 0.1533203125, 0.576171875, 0.9990234375, 1.421875, 1.8447265625, 2.267578125, 2.6904296875, 3.11328125, 3.5361328125, 3.958984375, 4.3818359375, 4.8046875, 5.2275390625, 5.650390625, 6.0732421875, 6.49609375, 6.9189453125, 7.341796875, 7.7646484375, 8.1875, 8.6103515625, 9.033203125, 9.4560546875, 9.87890625, 10.3017578125, 10.724609375, 11.1474609375, 11.5703125, 11.9931640625, 12.416015625, 12.8388671875, 13.26171875, 13.6845703125, 14.107421875, 14.5302734375, 14.953125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 15.0, 18.0, 29.0, 14.0, 36.0, 52.0, 74.0, 106.0, 185.0, 348.0, 775.0, 3564.0, 44183.0, 2414791.0, 659493.0, 18637.0, 2009.0, 551.0, 266.0, 152.0, 105.0, 68.0, 54.0, 27.0, 22.0, 20.0, 14.0, 15.0, 11.0, 10.0, 11.0, 6.0, 3.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.78125, -18.20947265625, -17.6376953125, -17.06591796875, -16.494140625, -15.92236328125, -15.3505859375, -14.77880859375, -14.20703125, -13.63525390625, -13.0634765625, -12.49169921875, -11.919921875, -11.34814453125, -10.7763671875, -10.20458984375, -9.6328125, -9.06103515625, -8.4892578125, -7.91748046875, -7.345703125, -6.77392578125, -6.2021484375, -5.63037109375, -5.05859375, -4.48681640625, -3.9150390625, -3.34326171875, -2.771484375, -2.19970703125, -1.6279296875, -1.05615234375, -0.484375, 0.08740234375, 0.6591796875, 1.23095703125, 1.802734375, 2.37451171875, 2.9462890625, 3.51806640625, 4.08984375, 4.66162109375, 5.2333984375, 5.80517578125, 6.376953125, 6.94873046875, 7.5205078125, 8.09228515625, 8.6640625, 9.23583984375, 9.8076171875, 10.37939453125, 10.951171875, 11.52294921875, 12.0947265625, 12.66650390625, 13.23828125, 13.81005859375, 14.3818359375, 14.95361328125, 15.525390625, 16.09716796875, 16.6689453125, 17.24072265625, 17.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 33.0, 204.0, 412.0, 289.0, 66.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.607519149780273, -28.170665740966797, -25.733814239501953, -23.296960830688477, -20.860107421875, -18.423255920410156, -15.98640251159668, -13.549551010131836, -11.11269760131836, -8.6758451461792, -6.238992214202881, -3.8021392822265625, -1.3652868270874023, 1.0715656280517578, 3.5084190368652344, 5.945270538330078, 8.382123947143555, 10.818976402282715, 13.255828857421875, 15.692682266235352, 18.129535675048828, 20.566387176513672, 23.00324058532715, 25.440092086791992, 27.87694549560547, 30.313798904418945, 32.75065231323242, 35.187503814697266, 37.62435531616211, 40.06121063232422, 42.49806213378906, 44.934913635253906, 47.37176513671875, 49.808616638183594, 52.2454719543457, 54.68232345581055, 57.11917495727539, 59.5560302734375, 61.992881774902344, 64.42973327636719, 66.86658477783203, 69.30343627929688, 71.74028778076172, 74.17713928222656, 76.61399841308594, 79.05084991455078, 81.48770141601562, 83.92455291748047, 86.36140441894531, 88.79825592041016, 91.235107421875, 93.67196655273438, 96.10881805419922, 98.54566955566406, 100.9825210571289, 103.41937255859375, 105.85623168945312, 108.29308319091797, 110.72993469238281, 113.16679382324219, 115.60364532470703, 118.04049682617188, 120.47734832763672, 122.91419982910156, 125.3510513305664]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 10.0, 14.0, 10.0, 22.0, 13.0, 21.0, 25.0, 28.0, 17.0, 39.0, 40.0, 29.0, 38.0, 38.0, 39.0, 51.0, 43.0, 29.0, 42.0, 47.0, 41.0, 42.0, 31.0, 27.0, 34.0, 29.0, 17.0, 28.0, 16.0, 18.0, 17.0, 11.0, 13.0, 14.0, 5.0, 7.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.49536895751953, -37.327301025390625, -36.159236907958984, -34.99116897583008, -33.82310104370117, -32.65503692626953, -31.486968994140625, -30.31890106201172, -29.150835037231445, -27.982769012451172, -26.814701080322266, -25.646635055541992, -24.47856903076172, -23.310501098632812, -22.14243507385254, -20.974369049072266, -19.80630111694336, -18.638235092163086, -17.47016716003418, -16.302101135253906, -15.134034156799316, -13.965967178344727, -12.797901153564453, -11.629834175109863, -10.461767196655273, -9.293700218200684, -8.125633239746094, -6.95756721496582, -5.7895002365112305, -4.621433258056641, -3.453366756439209, -2.2853002548217773, -1.1172370910644531, 0.05082964897155762, 1.2188963890075684, 2.386963129043579, 3.55502986907959, 4.72309684753418, 5.891163349151611, 7.059229850769043, 8.227296829223633, 9.395363807678223, 10.563430786132812, 11.731496810913086, 12.899563789367676, 14.067630767822266, 15.235696792602539, 16.403762817382812, 17.57183074951172, 18.739896774291992, 19.9079647064209, 21.076030731201172, 22.244098663330078, 23.41216468811035, 24.580230712890625, 25.74829864501953, 26.916364669799805, 28.084430694580078, 29.252498626708984, 30.420564651489258, 31.58863067626953, 32.75669860839844, 33.924766540527344, 35.092830657958984, 36.26089859008789]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 4.0, 14.0, 12.0, 12.0, 29.0, 19.0, 26.0, 25.0, 30.0, 39.0, 49.0, 59.0, 58.0, 48.0, 75.0, 52.0, 53.0, 49.0, 42.0, 37.0, 43.0, 40.0, 33.0, 25.0, 22.0, 24.0, 15.0, 17.0, 11.0, 15.0, 4.0, 5.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.67578125, -4.546905517578125, -4.41802978515625, -4.289154052734375, -4.1602783203125, -4.031402587890625, -3.90252685546875, -3.773651123046875, -3.644775390625, -3.515899658203125, -3.38702392578125, -3.258148193359375, -3.1292724609375, -3.000396728515625, -2.87152099609375, -2.742645263671875, -2.61376953125, -2.484893798828125, -2.35601806640625, -2.227142333984375, -2.0982666015625, -1.969390869140625, -1.84051513671875, -1.711639404296875, -1.582763671875, -1.453887939453125, -1.32501220703125, -1.196136474609375, -1.0672607421875, -0.938385009765625, -0.80950927734375, -0.680633544921875, -0.5517578125, -0.422882080078125, -0.29400634765625, -0.165130615234375, -0.0362548828125, 0.092620849609375, 0.22149658203125, 0.350372314453125, 0.479248046875, 0.608123779296875, 0.73699951171875, 0.865875244140625, 0.9947509765625, 1.123626708984375, 1.25250244140625, 1.381378173828125, 1.51025390625, 1.639129638671875, 1.76800537109375, 1.896881103515625, 2.0257568359375, 2.154632568359375, 2.28350830078125, 2.412384033203125, 2.541259765625, 2.670135498046875, 2.79901123046875, 2.927886962890625, 3.0567626953125, 3.185638427734375, 3.31451416015625, 3.443389892578125, 3.572265625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 11.0, 9.0, 17.0, 32.0, 41.0, 64.0, 92.0, 132.0, 192.0, 338.0, 476.0, 830.0, 1539.0, 2879.0, 7409.0, 22486.0, 97322.0, 571336.0, 2364459.0, 925442.0, 150787.0, 32263.0, 9167.0, 3332.0, 1532.0, 784.0, 455.0, 300.0, 162.0, 128.0, 80.0, 51.0, 41.0, 17.0, 18.0, 17.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0], "bins": [-10.609375, -10.334716796875, -10.06005859375, -9.785400390625, -9.5107421875, -9.236083984375, -8.96142578125, -8.686767578125, -8.412109375, -8.137451171875, -7.86279296875, -7.588134765625, -7.3134765625, -7.038818359375, -6.76416015625, -6.489501953125, -6.21484375, -5.940185546875, -5.66552734375, -5.390869140625, -5.1162109375, -4.841552734375, -4.56689453125, -4.292236328125, -4.017578125, -3.742919921875, -3.46826171875, -3.193603515625, -2.9189453125, -2.644287109375, -2.36962890625, -2.094970703125, -1.8203125, -1.545654296875, -1.27099609375, -0.996337890625, -0.7216796875, -0.447021484375, -0.17236328125, 0.102294921875, 0.376953125, 0.651611328125, 0.92626953125, 1.200927734375, 1.4755859375, 1.750244140625, 2.02490234375, 2.299560546875, 2.57421875, 2.848876953125, 3.12353515625, 3.398193359375, 3.6728515625, 3.947509765625, 4.22216796875, 4.496826171875, 4.771484375, 5.046142578125, 5.32080078125, 5.595458984375, 5.8701171875, 6.144775390625, 6.41943359375, 6.694091796875, 6.96875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 7.0, 20.0, 23.0, 30.0, 33.0, 50.0, 87.0, 104.0, 138.0, 203.0, 270.0, 374.0, 436.0, 522.0, 456.0, 381.0, 265.0, 188.0, 150.0, 95.0, 78.0, 50.0, 28.0, 23.0, 21.0, 10.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.8515625, -12.525390625, -12.19921875, -11.873046875, -11.546875, -11.220703125, -10.89453125, -10.568359375, -10.2421875, -9.916015625, -9.58984375, -9.263671875, -8.9375, -8.611328125, -8.28515625, -7.958984375, -7.6328125, -7.306640625, -6.98046875, -6.654296875, -6.328125, -6.001953125, -5.67578125, -5.349609375, -5.0234375, -4.697265625, -4.37109375, -4.044921875, -3.71875, -3.392578125, -3.06640625, -2.740234375, -2.4140625, -2.087890625, -1.76171875, -1.435546875, -1.109375, -0.783203125, -0.45703125, -0.130859375, 0.1953125, 0.521484375, 0.84765625, 1.173828125, 1.5, 1.826171875, 2.15234375, 2.478515625, 2.8046875, 3.130859375, 3.45703125, 3.783203125, 4.109375, 4.435546875, 4.76171875, 5.087890625, 5.4140625, 5.740234375, 6.06640625, 6.392578125, 6.71875, 7.044921875, 7.37109375, 7.697265625, 8.0234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 11.0, 15.0, 20.0, 30.0, 35.0, 52.0, 91.0, 187.0, 281.0, 514.0, 1145.0, 2996.0, 9854.0, 40471.0, 216743.0, 1257545.0, 2107325.0, 453083.0, 78854.0, 16979.0, 4745.0, 1698.0, 760.0, 334.0, 183.0, 118.0, 81.0, 36.0, 31.0, 17.0, 15.0, 11.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.21875, -16.76806640625, -16.3173828125, -15.86669921875, -15.416015625, -14.96533203125, -14.5146484375, -14.06396484375, -13.61328125, -13.16259765625, -12.7119140625, -12.26123046875, -11.810546875, -11.35986328125, -10.9091796875, -10.45849609375, -10.0078125, -9.55712890625, -9.1064453125, -8.65576171875, -8.205078125, -7.75439453125, -7.3037109375, -6.85302734375, -6.40234375, -5.95166015625, -5.5009765625, -5.05029296875, -4.599609375, -4.14892578125, -3.6982421875, -3.24755859375, -2.796875, -2.34619140625, -1.8955078125, -1.44482421875, -0.994140625, -0.54345703125, -0.0927734375, 0.35791015625, 0.80859375, 1.25927734375, 1.7099609375, 2.16064453125, 2.611328125, 3.06201171875, 3.5126953125, 3.96337890625, 4.4140625, 4.86474609375, 5.3154296875, 5.76611328125, 6.216796875, 6.66748046875, 7.1181640625, 7.56884765625, 8.01953125, 8.47021484375, 8.9208984375, 9.37158203125, 9.822265625, 10.27294921875, 10.7236328125, 11.17431640625, 11.625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 12.0, 30.0, 15.0, 33.0, 42.0, 73.0, 106.0, 116.0, 119.0, 111.0, 88.0, 69.0, 70.0, 46.0, 25.0, 24.0, 12.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.44630432128906, -38.81291580200195, -37.179527282714844, -35.546138763427734, -33.912750244140625, -32.279361724853516, -30.645973205566406, -29.012584686279297, -27.379196166992188, -25.745807647705078, -24.11241912841797, -22.47903060913086, -20.84564208984375, -19.21225357055664, -17.57886505126953, -15.945475578308105, -14.31208610534668, -12.67869758605957, -11.045309066772461, -9.411920547485352, -7.778531551361084, -6.145142555236816, -4.511754035949707, -2.8783655166625977, -1.2449769973754883, 0.38841164112091064, 2.0218002796173096, 3.655189037322998, 5.288577556610107, 6.921966552734375, 8.555355072021484, 10.188743591308594, 11.822132110595703, 13.455520629882812, 15.088909149169922, 16.72229766845703, 18.35568618774414, 19.98907470703125, 21.62246322631836, 23.25585174560547, 24.889240264892578, 26.522628784179688, 28.156017303466797, 29.789405822753906, 31.422794342041016, 33.056182861328125, 34.689571380615234, 36.322959899902344, 37.95635223388672, 39.58974075317383, 41.22312927246094, 42.85651779174805, 44.489906311035156, 46.123294830322266, 47.756683349609375, 49.390071868896484, 51.023460388183594, 52.6568489074707, 54.29023742675781, 55.92362594604492, 57.55701446533203, 59.19040298461914, 60.82379150390625, 62.45718002319336, 64.09056854248047]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 9.0, 15.0, 16.0, 23.0, 13.0, 22.0, 29.0, 30.0, 28.0, 28.0, 37.0, 42.0, 38.0, 32.0, 54.0, 49.0, 50.0, 48.0, 54.0, 36.0, 34.0, 33.0, 33.0, 36.0, 18.0, 31.0, 13.0, 17.0, 17.0, 14.0, 18.0, 15.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.206327438354492, -28.193220138549805, -27.180112838745117, -26.16700553894043, -25.153898239135742, -24.140790939331055, -23.127685546875, -22.114578247070312, -21.101470947265625, -20.088363647460938, -19.07525634765625, -18.062149047851562, -17.049041748046875, -16.035934448242188, -15.022828102111816, -14.009720802307129, -12.996612548828125, -11.983505249023438, -10.97039794921875, -9.957290649414062, -8.944183349609375, -7.931076526641846, -6.917969703674316, -5.904862403869629, -4.891755104064941, -3.878647804260254, -2.8655407428741455, -1.852433681488037, -0.8393263816833496, 0.1737809181213379, 1.1868877410888672, 2.1999950408935547, 3.213104248046875, 4.2262115478515625, 5.23931884765625, 6.252425670623779, 7.265532970428467, 8.278640747070312, 9.291747093200684, 10.304854393005371, 11.317961692810059, 12.331068992614746, 13.344176292419434, 14.357282638549805, 15.370389938354492, 16.38349723815918, 17.396604537963867, 18.409711837768555, 19.422819137573242, 20.43592643737793, 21.449033737182617, 22.462141036987305, 23.475248336791992, 24.48835563659668, 25.501461029052734, 26.514568328857422, 27.52767562866211, 28.540782928466797, 29.553890228271484, 30.566997528076172, 31.58010482788086, 32.59321212768555, 33.606319427490234, 34.61942672729492, 35.63253402709961]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 7.0, 13.0, 8.0, 14.0, 18.0, 18.0, 19.0, 28.0, 31.0, 34.0, 41.0, 42.0, 48.0, 58.0, 57.0, 54.0, 65.0, 32.0, 51.0, 45.0, 38.0, 41.0, 32.0, 27.0, 34.0, 34.0, 19.0, 24.0, 13.0, 8.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.602783203125, -4.47509765625, -4.347412109375, -4.2197265625, -4.092041015625, -3.96435546875, -3.836669921875, -3.708984375, -3.581298828125, -3.45361328125, -3.325927734375, -3.1982421875, -3.070556640625, -2.94287109375, -2.815185546875, -2.6875, -2.559814453125, -2.43212890625, -2.304443359375, -2.1767578125, -2.049072265625, -1.92138671875, -1.793701171875, -1.666015625, -1.538330078125, -1.41064453125, -1.282958984375, -1.1552734375, -1.027587890625, -0.89990234375, -0.772216796875, -0.64453125, -0.516845703125, -0.38916015625, -0.261474609375, -0.1337890625, -0.006103515625, 0.12158203125, 0.249267578125, 0.376953125, 0.504638671875, 0.63232421875, 0.760009765625, 0.8876953125, 1.015380859375, 1.14306640625, 1.270751953125, 1.3984375, 1.526123046875, 1.65380859375, 1.781494140625, 1.9091796875, 2.036865234375, 2.16455078125, 2.292236328125, 2.419921875, 2.547607421875, 2.67529296875, 2.802978515625, 2.9306640625, 3.058349609375, 3.18603515625, 3.313720703125, 3.44140625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 4.0, 19.0, 18.0, 18.0, 32.0, 54.0, 75.0, 95.0, 142.0, 236.0, 377.0, 552.0, 816.0, 1172.0, 1881.0, 2825.0, 4149.0, 6452.0, 9637.0, 14520.0, 22146.0, 33549.0, 50262.0, 72422.0, 99508.0, 125362.0, 140422.0, 128694.0, 102676.0, 74979.0, 51882.0, 35322.0, 23274.0, 15230.0, 10148.0, 6631.0, 4355.0, 2839.0, 1918.0, 1264.0, 849.0, 582.0, 414.0, 260.0, 174.0, 102.0, 94.0, 50.0, 26.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6243820190429688, -0.6032562255859375, -0.5821304321289062, -0.561004638671875, -0.5398788452148438, -0.5187530517578125, -0.49762725830078125, -0.47650146484375, -0.45537567138671875, -0.4342498779296875, -0.41312408447265625, -0.391998291015625, -0.37087249755859375, -0.3497467041015625, -0.32862091064453125, -0.3074951171875, -0.28636932373046875, -0.2652435302734375, -0.24411773681640625, -0.222991943359375, -0.20186614990234375, -0.1807403564453125, -0.15961456298828125, -0.13848876953125, -0.11736297607421875, -0.0962371826171875, -0.07511138916015625, -0.053985595703125, -0.03285980224609375, -0.0117340087890625, 0.00939178466796875, 0.030517578125, 0.05164337158203125, 0.0727691650390625, 0.09389495849609375, 0.115020751953125, 0.13614654541015625, 0.1572723388671875, 0.17839813232421875, 0.19952392578125, 0.22064971923828125, 0.2417755126953125, 0.26290130615234375, 0.284027099609375, 0.30515289306640625, 0.3262786865234375, 0.34740447998046875, 0.3685302734375, 0.38965606689453125, 0.4107818603515625, 0.43190765380859375, 0.453033447265625, 0.47415924072265625, 0.4952850341796875, 0.5164108276367188, 0.53753662109375, 0.5586624145507812, 0.5797882080078125, 0.6009140014648438, 0.622039794921875, 0.6431655883789062, 0.6642913818359375, 0.6854171752929688, 0.70654296875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 4.0, 7.0, 7.0, 15.0, 8.0, 13.0, 13.0, 15.0, 26.0, 30.0, 26.0, 34.0, 37.0, 31.0, 33.0, 35.0, 23.0, 39.0, 41.0, 1084.0, 43.0, 49.0, 35.0, 36.0, 39.0, 36.0, 37.0, 30.0, 19.0, 27.0, 27.0, 22.0, 19.0, 11.0, 17.0, 6.0, 12.0, 5.0, 11.0, 8.0, 1.0, 0.0, 1.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.724609375, -2.63629150390625, -2.5479736328125, -2.45965576171875, -2.371337890625, -2.28302001953125, -2.1947021484375, -2.10638427734375, -2.01806640625, -1.92974853515625, -1.8414306640625, -1.75311279296875, -1.664794921875, -1.57647705078125, -1.4881591796875, -1.39984130859375, -1.3115234375, -1.22320556640625, -1.1348876953125, -1.04656982421875, -0.958251953125, -0.86993408203125, -0.7816162109375, -0.69329833984375, -0.60498046875, -0.51666259765625, -0.4283447265625, -0.34002685546875, -0.251708984375, -0.16339111328125, -0.0750732421875, 0.01324462890625, 0.1015625, 0.18988037109375, 0.2781982421875, 0.36651611328125, 0.454833984375, 0.54315185546875, 0.6314697265625, 0.71978759765625, 0.80810546875, 0.89642333984375, 0.9847412109375, 1.07305908203125, 1.161376953125, 1.24969482421875, 1.3380126953125, 1.42633056640625, 1.5146484375, 1.60296630859375, 1.6912841796875, 1.77960205078125, 1.867919921875, 1.95623779296875, 2.0445556640625, 2.13287353515625, 2.22119140625, 2.30950927734375, 2.3978271484375, 2.48614501953125, 2.574462890625, 2.66278076171875, 2.7510986328125, 2.83941650390625, 2.927734375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 6.0, 8.0, 14.0, 19.0, 24.0, 52.0, 60.0, 93.0, 164.0, 233.0, 371.0, 529.0, 955.0, 1530.0, 2663.0, 4502.0, 8119.0, 14408.0, 26313.0, 46937.0, 81743.0, 136928.0, 400267.0, 989834.0, 160032.0, 95319.0, 55197.0, 31136.0, 17063.0, 9573.0, 5352.0, 2971.0, 1822.0, 1094.0, 650.0, 396.0, 259.0, 164.0, 97.0, 79.0, 35.0, 23.0, 26.0, 23.0, 14.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.405029296875, -0.3924293518066406, -0.37982940673828125, -0.3672294616699219, -0.3546295166015625, -0.3420295715332031, -0.32942962646484375, -0.3168296813964844, -0.304229736328125, -0.2916297912597656, -0.27902984619140625, -0.2664299011230469, -0.2538299560546875, -0.24123001098632812, -0.22863006591796875, -0.21603012084960938, -0.20343017578125, -0.19083023071289062, -0.17823028564453125, -0.16563034057617188, -0.1530303955078125, -0.14043045043945312, -0.12783050537109375, -0.11523056030273438, -0.102630615234375, -0.09003067016601562, -0.07743072509765625, -0.06483078002929688, -0.0522308349609375, -0.039630889892578125, -0.02703094482421875, -0.014430999755859375, -0.0018310546875, 0.010768890380859375, 0.02336883544921875, 0.035968780517578125, 0.0485687255859375, 0.061168670654296875, 0.07376861572265625, 0.08636856079101562, 0.098968505859375, 0.11156845092773438, 0.12416839599609375, 0.13676834106445312, 0.1493682861328125, 0.16196823120117188, 0.17456817626953125, 0.18716812133789062, 0.19976806640625, 0.21236801147460938, 0.22496795654296875, 0.23756790161132812, 0.2501678466796875, 0.2627677917480469, 0.27536773681640625, 0.2879676818847656, 0.300567626953125, 0.3131675720214844, 0.32576751708984375, 0.3383674621582031, 0.3509674072265625, 0.3635673522949219, 0.37616729736328125, 0.3887672424316406, 0.4013671875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 9.0, 9.0, 12.0, 22.0, 25.0, 32.0, 39.0, 59.0, 81.0, 136.0, 123.0, 100.0, 82.0, 64.0, 47.0, 33.0, 16.0, 14.0, 17.0, 8.0, 9.0, 6.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0960693359375, -0.09318733215332031, -0.09030532836914062, -0.08742332458496094, -0.08454132080078125, -0.08165931701660156, -0.07877731323242188, -0.07589530944824219, -0.0730133056640625, -0.07013130187988281, -0.06724929809570312, -0.06436729431152344, -0.06148529052734375, -0.05860328674316406, -0.055721282958984375, -0.05283927917480469, -0.049957275390625, -0.04707527160644531, -0.044193267822265625, -0.04131126403808594, -0.03842926025390625, -0.03554725646972656, -0.032665252685546875, -0.029783248901367188, -0.0269012451171875, -0.024019241333007812, -0.021137237548828125, -0.018255233764648438, -0.01537322998046875, -0.012491226196289062, -0.009609222412109375, -0.0067272186279296875, -0.00384521484375, -0.0009632110595703125, 0.001918792724609375, 0.0048007965087890625, 0.00768280029296875, 0.010564804077148438, 0.013446807861328125, 0.016328811645507812, 0.0192108154296875, 0.022092819213867188, 0.024974822998046875, 0.027856826782226562, 0.03073883056640625, 0.03362083435058594, 0.036502838134765625, 0.03938484191894531, 0.042266845703125, 0.04514884948730469, 0.048030853271484375, 0.05091285705566406, 0.05379486083984375, 0.05667686462402344, 0.059558868408203125, 0.06244087219238281, 0.0653228759765625, 0.06820487976074219, 0.07108688354492188, 0.07396888732910156, 0.07685089111328125, 0.07973289489746094, 0.08261489868164062, 0.08549690246582031, 0.08837890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 8.0, 7.0, 5.0, 13.0, 20.0, 11.0, 11.0, 22.0, 34.0, 40.0, 49.0, 66.0, 143.0, 225.0, 529.0, 1882.0, 9474.0, 234344.0, 785239.0, 12568.0, 2435.0, 627.0, 243.0, 145.0, 96.0, 67.0, 44.0, 27.0, 24.0, 20.0, 18.0, 15.0, 13.0, 7.0, 13.0, 8.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0], "bins": [-1.34765625, -1.3056488037109375, -1.263641357421875, -1.2216339111328125, -1.17962646484375, -1.1376190185546875, -1.095611572265625, -1.0536041259765625, -1.0115966796875, -0.9695892333984375, -0.927581787109375, -0.8855743408203125, -0.84356689453125, -0.8015594482421875, -0.759552001953125, -0.7175445556640625, -0.675537109375, -0.6335296630859375, -0.591522216796875, -0.5495147705078125, -0.50750732421875, -0.4654998779296875, -0.423492431640625, -0.3814849853515625, -0.3394775390625, -0.2974700927734375, -0.255462646484375, -0.2134552001953125, -0.17144775390625, -0.1294403076171875, -0.087432861328125, -0.0454254150390625, -0.00341796875, 0.0385894775390625, 0.080596923828125, 0.1226043701171875, 0.16461181640625, 0.2066192626953125, 0.248626708984375, 0.2906341552734375, 0.3326416015625, 0.3746490478515625, 0.416656494140625, 0.4586639404296875, 0.50067138671875, 0.5426788330078125, 0.584686279296875, 0.6266937255859375, 0.668701171875, 0.7107086181640625, 0.752716064453125, 0.7947235107421875, 0.83673095703125, 0.8787384033203125, 0.920745849609375, 0.9627532958984375, 1.0047607421875, 1.0467681884765625, 1.088775634765625, 1.1307830810546875, 1.17279052734375, 1.2147979736328125, 1.256805419921875, 1.2988128662109375, 1.3408203125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 14.0, 29.0, 62.0, 104.0, 227.0, 246.0, 133.0, 77.0, 39.0, 24.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5494539141654968, -0.5369977951049805, -0.5245416164398193, -0.512085497379303, -0.4996293783187866, -0.4871732294559479, -0.47471708059310913, -0.4622609615325928, -0.4498048424720764, -0.43734869360923767, -0.4248925745487213, -0.41243642568588257, -0.3999803066253662, -0.38752415776252747, -0.3750680088996887, -0.36261188983917236, -0.3501557409763336, -0.3376995921134949, -0.3252434730529785, -0.31278732419013977, -0.3003312051296234, -0.28787505626678467, -0.2754189372062683, -0.26296278834342957, -0.2505066394805908, -0.23805050551891327, -0.22559437155723572, -0.21313822269439697, -0.20068210363388062, -0.18822595477104187, -0.17576982080936432, -0.16331368684768677, -0.15085753798484802, -0.13840140402317047, -0.12594527006149292, -0.11348912864923477, -0.10103299468755722, -0.08857686072587967, -0.07612071931362152, -0.06366458535194397, -0.05120845139026642, -0.03875231742858887, -0.026296179741621017, -0.013840042054653168, -0.0013839080929756165, 0.011072225868701935, 0.023528367280960083, 0.035984501242637634, 0.048440635204315186, 0.06089676916599274, 0.07335290312767029, 0.08580904453992844, 0.09826517850160599, 0.11072131246328354, 0.12317745387554169, 0.13563358783721924, 0.1480897217988968, 0.16054585576057434, 0.1730019897222519, 0.18545812368392944, 0.1979142725467682, 0.21037039160728455, 0.2228265404701233, 0.23528267443180084, 0.2477388083934784]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 5.0, 15.0, 23.0, 16.0, 18.0, 21.0, 31.0, 29.0, 28.0, 29.0, 35.0, 49.0, 43.0, 44.0, 44.0, 53.0, 53.0, 54.0, 40.0, 45.0, 36.0, 28.0, 33.0, 30.0, 39.0, 18.0, 21.0, 13.0, 19.0, 14.0, 6.0, 14.0, 7.0, 8.0, 8.0, 5.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14991158246994019, -0.14557991921901703, -0.14124827086925507, -0.1369166076183319, -0.13258495926856995, -0.1282532960176468, -0.12392164021730423, -0.11958998441696167, -0.11525832861661911, -0.11092667281627655, -0.10659501701593399, -0.10226336121559143, -0.09793169796466827, -0.09360004961490631, -0.08926838636398315, -0.0849367305636406, -0.08060507476329803, -0.07627341896295547, -0.07194176316261292, -0.06761010736227036, -0.0632784515619278, -0.05894679203629494, -0.05461513251066208, -0.05028347671031952, -0.04595182090997696, -0.0416201651096344, -0.03728850930929184, -0.03295684978365898, -0.02862519398331642, -0.02429353818297386, -0.019961880519986153, -0.015630222856998444, -0.011298567056655884, -0.006966910324990749, -0.002635253593325615, 0.0016964031383395195, 0.006028059870004654, 0.010359715670347214, 0.014691373333334923, 0.019023030996322632, 0.02335468679666519, 0.02768634259700775, 0.03201799839735031, 0.03634965792298317, 0.04068131372332573, 0.04501296952366829, 0.04934462904930115, 0.05367628484964371, 0.05800794064998627, 0.06233959645032883, 0.06667125225067139, 0.07100290805101395, 0.0753345638513565, 0.07966622710227966, 0.08399788290262222, 0.08832953870296478, 0.09266119450330734, 0.0969928503036499, 0.10132450610399246, 0.10565616190433502, 0.10998782515525818, 0.11431947350502014, 0.1186511367559433, 0.12298279255628586, 0.12731444835662842]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 11.0, 5.0, 18.0, 18.0, 21.0, 16.0, 20.0, 21.0, 39.0, 32.0, 43.0, 44.0, 41.0, 44.0, 60.0, 62.0, 48.0, 49.0, 35.0, 50.0, 37.0, 39.0, 32.0, 37.0, 28.0, 22.0, 24.0, 25.0, 22.0, 10.0, 7.0, 9.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-4.55859375, -4.435638427734375, -4.31268310546875, -4.189727783203125, -4.0667724609375, -3.943817138671875, -3.82086181640625, -3.697906494140625, -3.574951171875, -3.451995849609375, -3.32904052734375, -3.206085205078125, -3.0831298828125, -2.960174560546875, -2.83721923828125, -2.714263916015625, -2.59130859375, -2.468353271484375, -2.34539794921875, -2.222442626953125, -2.0994873046875, -1.976531982421875, -1.85357666015625, -1.730621337890625, -1.607666015625, -1.484710693359375, -1.36175537109375, -1.238800048828125, -1.1158447265625, -0.992889404296875, -0.86993408203125, -0.746978759765625, -0.6240234375, -0.501068115234375, -0.37811279296875, -0.255157470703125, -0.1322021484375, -0.009246826171875, 0.11370849609375, 0.236663818359375, 0.359619140625, 0.482574462890625, 0.60552978515625, 0.728485107421875, 0.8514404296875, 0.974395751953125, 1.09735107421875, 1.220306396484375, 1.34326171875, 1.466217041015625, 1.58917236328125, 1.712127685546875, 1.8350830078125, 1.958038330078125, 2.08099365234375, 2.203948974609375, 2.326904296875, 2.449859619140625, 2.57281494140625, 2.695770263671875, 2.8187255859375, 2.941680908203125, 3.06463623046875, 3.187591552734375, 3.310546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 10.0, 14.0, 28.0, 38.0, 58.0, 82.0, 117.0, 213.0, 311.0, 483.0, 752.0, 1179.0, 1831.0, 2872.0, 4550.0, 7107.0, 11467.0, 18639.0, 31778.0, 58509.0, 118913.0, 229287.0, 255171.0, 142562.0, 69191.0, 37168.0, 21025.0, 12981.0, 8127.0, 5094.0, 3249.0, 2044.0, 1225.0, 870.0, 607.0, 372.0, 218.0, 150.0, 90.0, 57.0, 37.0, 24.0, 21.0, 13.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8551025390625, -2.757080078125, -2.6590576171875, -2.56103515625, -2.4630126953125, -2.364990234375, -2.2669677734375, -2.1689453125, -2.0709228515625, -1.972900390625, -1.8748779296875, -1.77685546875, -1.6788330078125, -1.580810546875, -1.4827880859375, -1.384765625, -1.2867431640625, -1.188720703125, -1.0906982421875, -0.99267578125, -0.8946533203125, -0.796630859375, -0.6986083984375, -0.6005859375, -0.5025634765625, -0.404541015625, -0.3065185546875, -0.20849609375, -0.1104736328125, -0.012451171875, 0.0855712890625, 0.18359375, 0.2816162109375, 0.379638671875, 0.4776611328125, 0.57568359375, 0.6737060546875, 0.771728515625, 0.8697509765625, 0.9677734375, 1.0657958984375, 1.163818359375, 1.2618408203125, 1.35986328125, 1.4578857421875, 1.555908203125, 1.6539306640625, 1.751953125, 1.8499755859375, 1.947998046875, 2.0460205078125, 2.14404296875, 2.2420654296875, 2.340087890625, 2.4381103515625, 2.5361328125, 2.6341552734375, 2.732177734375, 2.8302001953125, 2.92822265625, 3.0262451171875, 3.124267578125, 3.2222900390625, 3.3203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 6.0, 10.0, 15.0, 16.0, 14.0, 25.0, 22.0, 27.0, 28.0, 37.0, 47.0, 60.0, 63.0, 96.0, 143.0, 329.0, 1401.0, 181.0, 82.0, 72.0, 64.0, 38.0, 40.0, 37.0, 28.0, 27.0, 24.0, 22.0, 11.0, 21.0, 12.0, 6.0, 7.0, 9.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.2265625, -13.784423828125, -13.34228515625, -12.900146484375, -12.4580078125, -12.015869140625, -11.57373046875, -11.131591796875, -10.689453125, -10.247314453125, -9.80517578125, -9.363037109375, -8.9208984375, -8.478759765625, -8.03662109375, -7.594482421875, -7.15234375, -6.710205078125, -6.26806640625, -5.825927734375, -5.3837890625, -4.941650390625, -4.49951171875, -4.057373046875, -3.615234375, -3.173095703125, -2.73095703125, -2.288818359375, -1.8466796875, -1.404541015625, -0.96240234375, -0.520263671875, -0.078125, 0.364013671875, 0.80615234375, 1.248291015625, 1.6904296875, 2.132568359375, 2.57470703125, 3.016845703125, 3.458984375, 3.901123046875, 4.34326171875, 4.785400390625, 5.2275390625, 5.669677734375, 6.11181640625, 6.553955078125, 6.99609375, 7.438232421875, 7.88037109375, 8.322509765625, 8.7646484375, 9.206787109375, 9.64892578125, 10.091064453125, 10.533203125, 10.975341796875, 11.41748046875, 11.859619140625, 12.3017578125, 12.743896484375, 13.18603515625, 13.628173828125, 14.0703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 17.0, 11.0, 18.0, 24.0, 30.0, 27.0, 43.0, 61.0, 111.0, 126.0, 257.0, 471.0, 1370.0, 6995.0, 69202.0, 2254894.0, 774380.0, 31660.0, 3987.0, 964.0, 390.0, 206.0, 131.0, 80.0, 56.0, 27.0, 28.0, 27.0, 20.0, 20.0, 13.0, 8.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.08447265625, -18.4658203125, -17.84716796875, -17.228515625, -16.60986328125, -15.9912109375, -15.37255859375, -14.75390625, -14.13525390625, -13.5166015625, -12.89794921875, -12.279296875, -11.66064453125, -11.0419921875, -10.42333984375, -9.8046875, -9.18603515625, -8.5673828125, -7.94873046875, -7.330078125, -6.71142578125, -6.0927734375, -5.47412109375, -4.85546875, -4.23681640625, -3.6181640625, -2.99951171875, -2.380859375, -1.76220703125, -1.1435546875, -0.52490234375, 0.09375, 0.71240234375, 1.3310546875, 1.94970703125, 2.568359375, 3.18701171875, 3.8056640625, 4.42431640625, 5.04296875, 5.66162109375, 6.2802734375, 6.89892578125, 7.517578125, 8.13623046875, 8.7548828125, 9.37353515625, 9.9921875, 10.61083984375, 11.2294921875, 11.84814453125, 12.466796875, 13.08544921875, 13.7041015625, 14.32275390625, 14.94140625, 15.56005859375, 16.1787109375, 16.79736328125, 17.416015625, 18.03466796875, 18.6533203125, 19.27197265625, 19.890625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 14.0, 155.0, 528.0, 285.0, 34.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.866453170776367, -26.30122184753418, -21.735990524291992, -17.170759201049805, -12.605527877807617, -8.04029655456543, -3.475065231323242, 1.0901660919189453, 5.655397415161133, 10.22062873840332, 14.785860061645508, 19.351091384887695, 23.916322708129883, 28.48155403137207, 33.046783447265625, 37.61201477050781, 42.17724609375, 46.74247741699219, 51.307708740234375, 55.87294006347656, 60.43817138671875, 65.00340270996094, 69.56863403320312, 74.13386535644531, 78.6990966796875, 83.26432800292969, 87.82955932617188, 92.39479064941406, 96.96002197265625, 101.52525329589844, 106.09048461914062, 110.65571594238281, 115.220947265625, 119.78617858886719, 124.35140991210938, 128.91664123535156, 133.48187255859375, 138.04710388183594, 142.61233520507812, 147.1775665283203, 151.7427978515625, 156.3080291748047, 160.87326049804688, 165.43849182128906, 170.00372314453125, 174.56895446777344, 179.13418579101562, 183.6994171142578, 188.2646484375, 192.8298797607422, 197.39511108398438, 201.96034240722656, 206.52557373046875, 211.09080505371094, 215.65603637695312, 220.2212677001953, 224.7864990234375, 229.3517303466797, 233.91696166992188, 238.48219299316406, 243.04742431640625, 247.61265563964844, 252.17788696289062, 256.74310302734375, 261.308349609375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 8.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 3.0, 6.0, 14.0, 10.0, 13.0, 23.0, 16.0, 25.0, 25.0, 35.0, 22.0, 28.0, 24.0, 27.0, 26.0, 36.0, 39.0, 43.0, 33.0, 38.0, 45.0, 33.0, 38.0, 46.0, 28.0, 41.0, 36.0, 40.0, 24.0, 26.0, 22.0, 21.0, 15.0, 14.0, 7.0, 9.0, 8.0, 9.0, 9.0, 7.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.54780578613281, -35.39500045776367, -34.242191314697266, -33.089385986328125, -31.936580657958984, -30.78377342224121, -29.630966186523438, -28.478160858154297, -27.325353622436523, -26.17254638671875, -25.01974105834961, -23.866933822631836, -22.714126586914062, -21.561321258544922, -20.40851402282715, -19.255706787109375, -18.102901458740234, -16.95009422302246, -15.79728889465332, -14.644481658935547, -13.49167537689209, -12.338869094848633, -11.18606185913086, -10.033255577087402, -8.880449295043945, -7.727643013000488, -6.574836254119873, -5.422029495239258, -4.269223213195801, -3.1164169311523438, -1.9636101722717285, -0.8108034133911133, 0.34200286865234375, 1.4948093891143799, 2.647615909576416, 3.800422430038452, 4.953228950500488, 6.106035232543945, 7.2588419914245605, 8.411648750305176, 9.564455032348633, 10.71726131439209, 11.870067596435547, 13.02287483215332, 14.175681114196777, 15.328487396240234, 16.481294631958008, 17.63410186767578, 18.786907196044922, 19.939714431762695, 21.092519760131836, 22.24532699584961, 23.39813232421875, 24.550939559936523, 25.703746795654297, 26.856552124023438, 28.00935935974121, 29.162166595458984, 30.314971923828125, 31.4677791595459, 32.62058639526367, 33.77339172363281, 34.92619705200195, 36.07900619506836, 37.2318115234375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 17.0, 16.0, 18.0, 25.0, 25.0, 29.0, 28.0, 49.0, 37.0, 49.0, 54.0, 56.0, 43.0, 57.0, 53.0, 43.0, 42.0, 43.0, 32.0, 41.0, 36.0, 30.0, 19.0, 27.0, 17.0, 21.0, 22.0, 12.0, 2.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.50390625, -4.37322998046875, -4.2425537109375, -4.11187744140625, -3.981201171875, -3.85052490234375, -3.7198486328125, -3.58917236328125, -3.45849609375, -3.32781982421875, -3.1971435546875, -3.06646728515625, -2.935791015625, -2.80511474609375, -2.6744384765625, -2.54376220703125, -2.4130859375, -2.28240966796875, -2.1517333984375, -2.02105712890625, -1.890380859375, -1.75970458984375, -1.6290283203125, -1.49835205078125, -1.36767578125, -1.23699951171875, -1.1063232421875, -0.97564697265625, -0.844970703125, -0.71429443359375, -0.5836181640625, -0.45294189453125, -0.322265625, -0.19158935546875, -0.0609130859375, 0.06976318359375, 0.200439453125, 0.33111572265625, 0.4617919921875, 0.59246826171875, 0.72314453125, 0.85382080078125, 0.9844970703125, 1.11517333984375, 1.245849609375, 1.37652587890625, 1.5072021484375, 1.63787841796875, 1.7685546875, 1.89923095703125, 2.0299072265625, 2.16058349609375, 2.291259765625, 2.42193603515625, 2.5526123046875, 2.68328857421875, 2.81396484375, 2.94464111328125, 3.0753173828125, 3.20599365234375, 3.336669921875, 3.46734619140625, 3.5980224609375, 3.72869873046875, 3.859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 13.0, 11.0, 31.0, 45.0, 40.0, 78.0, 127.0, 208.0, 387.0, 598.0, 1059.0, 2014.0, 4876.0, 14159.0, 49296.0, 211348.0, 1058585.0, 2078570.0, 603320.0, 123336.0, 30529.0, 9106.0, 3428.0, 1434.0, 715.0, 369.0, 224.0, 127.0, 79.0, 50.0, 44.0, 22.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.41162109375, -8.1591796875, -7.90673828125, -7.654296875, -7.40185546875, -7.1494140625, -6.89697265625, -6.64453125, -6.39208984375, -6.1396484375, -5.88720703125, -5.634765625, -5.38232421875, -5.1298828125, -4.87744140625, -4.625, -4.37255859375, -4.1201171875, -3.86767578125, -3.615234375, -3.36279296875, -3.1103515625, -2.85791015625, -2.60546875, -2.35302734375, -2.1005859375, -1.84814453125, -1.595703125, -1.34326171875, -1.0908203125, -0.83837890625, -0.5859375, -0.33349609375, -0.0810546875, 0.17138671875, 0.423828125, 0.67626953125, 0.9287109375, 1.18115234375, 1.43359375, 1.68603515625, 1.9384765625, 2.19091796875, 2.443359375, 2.69580078125, 2.9482421875, 3.20068359375, 3.453125, 3.70556640625, 3.9580078125, 4.21044921875, 4.462890625, 4.71533203125, 4.9677734375, 5.22021484375, 5.47265625, 5.72509765625, 5.9775390625, 6.22998046875, 6.482421875, 6.73486328125, 6.9873046875, 7.23974609375, 7.4921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 11.0, 9.0, 26.0, 24.0, 32.0, 45.0, 73.0, 99.0, 116.0, 152.0, 198.0, 270.0, 337.0, 373.0, 387.0, 402.0, 329.0, 291.0, 228.0, 170.0, 104.0, 92.0, 74.0, 59.0, 48.0, 32.0, 21.0, 15.0, 15.0, 15.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -9.0198974609375, -8.735107421875, -8.4503173828125, -8.16552734375, -7.8807373046875, -7.595947265625, -7.3111572265625, -7.0263671875, -6.7415771484375, -6.456787109375, -6.1719970703125, -5.88720703125, -5.6024169921875, -5.317626953125, -5.0328369140625, -4.748046875, -4.4632568359375, -4.178466796875, -3.8936767578125, -3.60888671875, -3.3240966796875, -3.039306640625, -2.7545166015625, -2.4697265625, -2.1849365234375, -1.900146484375, -1.6153564453125, -1.33056640625, -1.0457763671875, -0.760986328125, -0.4761962890625, -0.19140625, 0.0933837890625, 0.378173828125, 0.6629638671875, 0.94775390625, 1.2325439453125, 1.517333984375, 1.8021240234375, 2.0869140625, 2.3717041015625, 2.656494140625, 2.9412841796875, 3.22607421875, 3.5108642578125, 3.795654296875, 4.0804443359375, 4.365234375, 4.6500244140625, 4.934814453125, 5.2196044921875, 5.50439453125, 5.7891845703125, 6.073974609375, 6.3587646484375, 6.6435546875, 6.9283447265625, 7.213134765625, 7.4979248046875, 7.78271484375, 8.0675048828125, 8.352294921875, 8.6370849609375, 8.921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 8.0, 8.0, 16.0, 19.0, 36.0, 50.0, 77.0, 130.0, 193.0, 367.0, 710.0, 1414.0, 3442.0, 10462.0, 37186.0, 157823.0, 707016.0, 2012005.0, 971949.0, 219444.0, 50239.0, 13623.0, 4393.0, 1748.0, 822.0, 442.0, 235.0, 146.0, 108.0, 62.0, 31.0, 26.0, 11.0, 12.0, 8.0, 5.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.139404296875, -11.75537109375, -11.371337890625, -10.9873046875, -10.603271484375, -10.21923828125, -9.835205078125, -9.451171875, -9.067138671875, -8.68310546875, -8.299072265625, -7.9150390625, -7.531005859375, -7.14697265625, -6.762939453125, -6.37890625, -5.994873046875, -5.61083984375, -5.226806640625, -4.8427734375, -4.458740234375, -4.07470703125, -3.690673828125, -3.306640625, -2.922607421875, -2.53857421875, -2.154541015625, -1.7705078125, -1.386474609375, -1.00244140625, -0.618408203125, -0.234375, 0.149658203125, 0.53369140625, 0.917724609375, 1.3017578125, 1.685791015625, 2.06982421875, 2.453857421875, 2.837890625, 3.221923828125, 3.60595703125, 3.989990234375, 4.3740234375, 4.758056640625, 5.14208984375, 5.526123046875, 5.91015625, 6.294189453125, 6.67822265625, 7.062255859375, 7.4462890625, 7.830322265625, 8.21435546875, 8.598388671875, 8.982421875, 9.366455078125, 9.75048828125, 10.134521484375, 10.5185546875, 10.902587890625, 11.28662109375, 11.670654296875, 12.0546875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 27.0, 48.0, 104.0, 145.0, 173.0, 193.0, 133.0, 100.0, 43.0, 25.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-135.9585418701172, -133.1690216064453, -130.37948608398438, -127.5899658203125, -124.8004379272461, -122.01091003417969, -119.22138214111328, -116.43185424804688, -113.642333984375, -110.8528060913086, -108.06327819824219, -105.27375793457031, -102.4842300415039, -99.6947021484375, -96.9051742553711, -94.11564636230469, -91.32611846923828, -88.53659057617188, -85.74706268310547, -82.95753479003906, -80.16801452636719, -77.37848663330078, -74.58895874023438, -71.79943084716797, -69.00990295410156, -66.22037506103516, -63.430850982666016, -60.64132308959961, -57.85179901123047, -55.06227111816406, -52.272743225097656, -49.48321533203125, -46.69369888305664, -43.904170989990234, -41.114646911621094, -38.32511901855469, -35.53559112548828, -32.74606704711914, -29.956539154052734, -27.16701316833496, -24.377487182617188, -21.587961196899414, -18.79843521118164, -16.008907318115234, -13.219381332397461, -10.429855346679688, -7.640327453613281, -4.850801467895508, -2.0612754821777344, 0.7282509803771973, 3.517777442932129, 6.307304382324219, 9.096830368041992, 11.886356353759766, 14.675884246826172, 17.465410232543945, 20.25493621826172, 23.044462203979492, 25.833988189697266, 28.623516082763672, 31.413042068481445, 34.20256805419922, 36.992095947265625, 39.78162384033203, 42.57114791870117]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 10.0, 9.0, 16.0, 13.0, 17.0, 13.0, 22.0, 24.0, 36.0, 33.0, 30.0, 35.0, 42.0, 29.0, 33.0, 41.0, 39.0, 53.0, 50.0, 44.0, 45.0, 41.0, 37.0, 46.0, 33.0, 24.0, 30.0, 22.0, 26.0, 15.0, 14.0, 13.0, 17.0, 11.0, 9.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.73675537109375, -34.65925598144531, -33.581756591796875, -32.50425720214844, -31.426759719848633, -30.349260330200195, -29.271760940551758, -28.19426155090332, -27.116764068603516, -26.039264678955078, -24.96176528930664, -23.884265899658203, -22.8067684173584, -21.72926902770996, -20.651769638061523, -19.574270248413086, -18.49677085876465, -17.41927146911621, -16.341772079467773, -15.264273643493652, -14.186775207519531, -13.109275817871094, -12.031776428222656, -10.954277038574219, -9.876778602600098, -8.79927921295166, -7.721780776977539, -6.644281387329102, -5.566782474517822, -4.489283561706543, -3.4117841720581055, -2.334285259246826, -1.2567863464355469, -0.17928731441497803, 0.8982117176055908, 1.9757108688354492, 3.0532097816467285, 4.130708694458008, 5.208208084106445, 6.285706996917725, 7.363205909729004, 8.440705299377441, 9.518203735351562, 10.595703125, 11.673202514648438, 12.750700950622559, 13.828200340270996, 14.905698776245117, 15.983198165893555, 17.060697555541992, 18.13819694519043, 19.215694427490234, 20.293193817138672, 21.37069320678711, 22.448192596435547, 23.525691986083984, 24.603191375732422, 25.68069076538086, 26.758190155029297, 27.835689544677734, 28.91318702697754, 29.990686416625977, 31.068185806274414, 32.14568328857422, 33.223182678222656]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 8.0, 2.0, 6.0, 11.0, 12.0, 12.0, 10.0, 12.0, 13.0, 21.0, 27.0, 23.0, 29.0, 32.0, 33.0, 37.0, 47.0, 33.0, 43.0, 44.0, 47.0, 39.0, 49.0, 45.0, 35.0, 32.0, 50.0, 41.0, 29.0, 27.0, 38.0, 21.0, 12.0, 19.0, 11.0, 7.0, 6.0, 13.0, 12.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.03515625, -3.915863037109375, -3.79656982421875, -3.677276611328125, -3.5579833984375, -3.438690185546875, -3.31939697265625, -3.200103759765625, -3.080810546875, -2.961517333984375, -2.84222412109375, -2.722930908203125, -2.6036376953125, -2.484344482421875, -2.36505126953125, -2.245758056640625, -2.12646484375, -2.007171630859375, -1.88787841796875, -1.768585205078125, -1.6492919921875, -1.529998779296875, -1.41070556640625, -1.291412353515625, -1.172119140625, -1.052825927734375, -0.93353271484375, -0.814239501953125, -0.6949462890625, -0.575653076171875, -0.45635986328125, -0.337066650390625, -0.2177734375, -0.098480224609375, 0.02081298828125, 0.140106201171875, 0.2593994140625, 0.378692626953125, 0.49798583984375, 0.617279052734375, 0.736572265625, 0.855865478515625, 0.97515869140625, 1.094451904296875, 1.2137451171875, 1.333038330078125, 1.45233154296875, 1.571624755859375, 1.69091796875, 1.810211181640625, 1.92950439453125, 2.048797607421875, 2.1680908203125, 2.287384033203125, 2.40667724609375, 2.525970458984375, 2.645263671875, 2.764556884765625, 2.88385009765625, 3.003143310546875, 3.1224365234375, 3.241729736328125, 3.36102294921875, 3.480316162109375, 3.599609375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 8.0, 6.0, 18.0, 14.0, 19.0, 36.0, 35.0, 59.0, 72.0, 145.0, 190.0, 301.0, 419.0, 606.0, 1032.0, 1644.0, 2569.0, 4327.0, 7179.0, 11836.0, 19683.0, 32804.0, 53201.0, 83771.0, 122315.0, 157520.0, 164029.0, 133209.0, 93992.0, 61717.0, 37577.0, 22822.0, 13980.0, 8207.0, 4924.0, 2944.0, 1898.0, 1220.0, 765.0, 477.0, 322.0, 196.0, 132.0, 98.0, 90.0, 46.0, 44.0, 20.0, 8.0, 9.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7890625, -0.7628860473632812, -0.7367095947265625, -0.7105331420898438, -0.684356689453125, -0.6581802368164062, -0.6320037841796875, -0.6058273315429688, -0.57965087890625, -0.5534744262695312, -0.5272979736328125, -0.5011215209960938, -0.474945068359375, -0.44876861572265625, -0.4225921630859375, -0.39641571044921875, -0.3702392578125, -0.34406280517578125, -0.3178863525390625, -0.29170989990234375, -0.265533447265625, -0.23935699462890625, -0.2131805419921875, -0.18700408935546875, -0.16082763671875, -0.13465118408203125, -0.1084747314453125, -0.08229827880859375, -0.056121826171875, -0.02994537353515625, -0.0037689208984375, 0.02240753173828125, 0.048583984375, 0.07476043701171875, 0.1009368896484375, 0.12711334228515625, 0.153289794921875, 0.17946624755859375, 0.2056427001953125, 0.23181915283203125, 0.25799560546875, 0.28417205810546875, 0.3103485107421875, 0.33652496337890625, 0.362701416015625, 0.38887786865234375, 0.4150543212890625, 0.44123077392578125, 0.4674072265625, 0.49358367919921875, 0.5197601318359375, 0.5459365844726562, 0.572113037109375, 0.5982894897460938, 0.6244659423828125, 0.6506423950195312, 0.67681884765625, 0.7029953002929688, 0.7291717529296875, 0.7553482055664062, 0.781524658203125, 0.8077011108398438, 0.8338775634765625, 0.8600540161132812, 0.88623046875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 5.0, 6.0, 4.0, 4.0, 5.0, 17.0, 6.0, 7.0, 14.0, 18.0, 24.0, 14.0, 24.0, 16.0, 31.0, 29.0, 25.0, 36.0, 38.0, 38.0, 29.0, 36.0, 42.0, 1073.0, 46.0, 34.0, 44.0, 39.0, 33.0, 31.0, 37.0, 33.0, 39.0, 19.0, 30.0, 19.0, 14.0, 16.0, 8.0, 8.0, 13.0, 7.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.644500732421875, -2.55657958984375, -2.468658447265625, -2.3807373046875, -2.292816162109375, -2.20489501953125, -2.116973876953125, -2.029052734375, -1.941131591796875, -1.85321044921875, -1.765289306640625, -1.6773681640625, -1.589447021484375, -1.50152587890625, -1.413604736328125, -1.32568359375, -1.237762451171875, -1.14984130859375, -1.061920166015625, -0.9739990234375, -0.886077880859375, -0.79815673828125, -0.710235595703125, -0.622314453125, -0.534393310546875, -0.44647216796875, -0.358551025390625, -0.2706298828125, -0.182708740234375, -0.09478759765625, -0.006866455078125, 0.0810546875, 0.168975830078125, 0.25689697265625, 0.344818115234375, 0.4327392578125, 0.520660400390625, 0.60858154296875, 0.696502685546875, 0.784423828125, 0.872344970703125, 0.96026611328125, 1.048187255859375, 1.1361083984375, 1.224029541015625, 1.31195068359375, 1.399871826171875, 1.48779296875, 1.575714111328125, 1.66363525390625, 1.751556396484375, 1.8394775390625, 1.927398681640625, 2.01531982421875, 2.103240966796875, 2.191162109375, 2.279083251953125, 2.36700439453125, 2.454925537109375, 2.5428466796875, 2.630767822265625, 2.71868896484375, 2.806610107421875, 2.89453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 10.0, 6.0, 6.0, 24.0, 30.0, 33.0, 47.0, 101.0, 143.0, 190.0, 364.0, 575.0, 957.0, 1569.0, 2813.0, 4987.0, 9421.0, 17669.0, 32853.0, 62404.0, 112759.0, 227439.0, 1133636.0, 236703.0, 115245.0, 63717.0, 33854.0, 17942.0, 9585.0, 5270.0, 2732.0, 1547.0, 924.0, 585.0, 363.0, 212.0, 133.0, 103.0, 52.0, 38.0, 25.0, 24.0, 18.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.41064453125, -0.3967323303222656, -0.38282012939453125, -0.3689079284667969, -0.3549957275390625, -0.3410835266113281, -0.32717132568359375, -0.3132591247558594, -0.299346923828125, -0.2854347229003906, -0.27152252197265625, -0.2576103210449219, -0.2436981201171875, -0.22978591918945312, -0.21587371826171875, -0.20196151733398438, -0.18804931640625, -0.17413711547851562, -0.16022491455078125, -0.14631271362304688, -0.1324005126953125, -0.11848831176757812, -0.10457611083984375, -0.09066390991210938, -0.076751708984375, -0.06283950805664062, -0.04892730712890625, -0.035015106201171875, -0.0211029052734375, -0.007190704345703125, 0.00672149658203125, 0.020633697509765625, 0.0345458984375, 0.048458099365234375, 0.06237030029296875, 0.07628250122070312, 0.0901947021484375, 0.10410690307617188, 0.11801910400390625, 0.13193130493164062, 0.145843505859375, 0.15975570678710938, 0.17366790771484375, 0.18758010864257812, 0.2014923095703125, 0.21540451049804688, 0.22931671142578125, 0.24322891235351562, 0.25714111328125, 0.2710533142089844, 0.28496551513671875, 0.2988777160644531, 0.3127899169921875, 0.3267021179199219, 0.34061431884765625, 0.3545265197753906, 0.368438720703125, 0.3823509216308594, 0.39626312255859375, 0.4101753234863281, 0.4240875244140625, 0.4379997253417969, 0.45191192626953125, 0.4658241271972656, 0.479736328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 5.0, 8.0, 9.0, 10.0, 8.0, 8.0, 8.0, 17.0, 15.0, 10.0, 19.0, 24.0, 28.0, 39.0, 48.0, 30.0, 40.0, 55.0, 43.0, 45.0, 65.0, 55.0, 48.0, 32.0, 33.0, 38.0, 32.0, 30.0, 21.0, 20.0, 20.0, 22.0, 11.0, 14.0, 14.0, 7.0, 6.0, 9.0, 7.0, 5.0, 3.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.0693359375, -0.06735610961914062, -0.06537628173828125, -0.06339645385742188, -0.0614166259765625, -0.059436798095703125, -0.05745697021484375, -0.055477142333984375, -0.053497314453125, -0.051517486572265625, -0.04953765869140625, -0.047557830810546875, -0.0455780029296875, -0.043598175048828125, -0.04161834716796875, -0.039638519287109375, -0.03765869140625, -0.035678863525390625, -0.03369903564453125, -0.031719207763671875, -0.0297393798828125, -0.027759552001953125, -0.02577972412109375, -0.023799896240234375, -0.021820068359375, -0.019840240478515625, -0.01786041259765625, -0.015880584716796875, -0.0139007568359375, -0.011920928955078125, -0.00994110107421875, -0.007961273193359375, -0.0059814453125, -0.004001617431640625, -0.00202178955078125, -4.1961669921875e-05, 0.0019378662109375, 0.003917694091796875, 0.00589752197265625, 0.007877349853515625, 0.009857177734375, 0.011837005615234375, 0.01381683349609375, 0.015796661376953125, 0.0177764892578125, 0.019756317138671875, 0.02173614501953125, 0.023715972900390625, 0.02569580078125, 0.027675628662109375, 0.02965545654296875, 0.031635284423828125, 0.0336151123046875, 0.035594940185546875, 0.03757476806640625, 0.039554595947265625, 0.041534423828125, 0.043514251708984375, 0.04549407958984375, 0.047473907470703125, 0.0494537353515625, 0.051433563232421875, 0.05341339111328125, 0.055393218994140625, 0.057373046875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 6.0, 12.0, 14.0, 21.0, 27.0, 51.0, 77.0, 109.0, 206.0, 363.0, 1061.0, 25257.0, 1005305.0, 14284.0, 846.0, 356.0, 184.0, 124.0, 80.0, 42.0, 23.0, 14.0, 16.0, 6.0, 5.0, 5.0, 6.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7631988525390625, -1.701202392578125, -1.6392059326171875, -1.57720947265625, -1.5152130126953125, -1.453216552734375, -1.3912200927734375, -1.3292236328125, -1.2672271728515625, -1.205230712890625, -1.1432342529296875, -1.08123779296875, -1.0192413330078125, -0.957244873046875, -0.8952484130859375, -0.833251953125, -0.7712554931640625, -0.709259033203125, -0.6472625732421875, -0.58526611328125, -0.5232696533203125, -0.461273193359375, -0.3992767333984375, -0.3372802734375, -0.2752838134765625, -0.213287353515625, -0.1512908935546875, -0.08929443359375, -0.0272979736328125, 0.034698486328125, 0.0966949462890625, 0.15869140625, 0.2206878662109375, 0.282684326171875, 0.3446807861328125, 0.40667724609375, 0.4686737060546875, 0.530670166015625, 0.5926666259765625, 0.6546630859375, 0.7166595458984375, 0.778656005859375, 0.8406524658203125, 0.90264892578125, 0.9646453857421875, 1.026641845703125, 1.0886383056640625, 1.150634765625, 1.2126312255859375, 1.274627685546875, 1.3366241455078125, 1.39862060546875, 1.4606170654296875, 1.522613525390625, 1.5846099853515625, 1.6466064453125, 1.7086029052734375, 1.770599365234375, 1.8325958251953125, 1.89459228515625, 1.9565887451171875, 2.018585205078125, 2.0805816650390625, 2.142578125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 16.0, 120.0, 582.0, 237.0, 47.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.409714460372925, -2.3664448261260986, -2.3231751918792725, -2.2799055576324463, -2.23663592338562, -2.193366289138794, -2.1500966548919678, -2.1068270206451416, -2.0635573863983154, -2.0202877521514893, -1.977018117904663, -1.933748483657837, -1.8904788494110107, -1.8472092151641846, -1.8039395809173584, -1.7606699466705322, -1.717400312423706, -1.6741306781768799, -1.6308610439300537, -1.5875914096832275, -1.5443217754364014, -1.5010521411895752, -1.457782506942749, -1.4145128726959229, -1.3712432384490967, -1.3279736042022705, -1.2847039699554443, -1.2414343357086182, -1.198164701461792, -1.1548950672149658, -1.1116254329681396, -1.0683557987213135, -1.0250862836837769, -0.9818166494369507, -0.9385470151901245, -0.8952773809432983, -0.8520077466964722, -0.808738112449646, -0.7654684782028198, -0.7221988439559937, -0.6789292097091675, -0.6356595754623413, -0.5923899412155151, -0.549120306968689, -0.5058506727218628, -0.4625810384750366, -0.41931140422821045, -0.3760417699813843, -0.3327721059322357, -0.28950247168540955, -0.24623283743858337, -0.2029632031917572, -0.15969356894493103, -0.11642393469810486, -0.07315430045127869, -0.029884666204452515, 0.013384968042373657, 0.05665460228919983, 0.099924236536026, 0.14319387078285217, 0.18646350502967834, 0.22973313927650452, 0.2730027735233307, 0.31627240777015686, 0.35954204201698303]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 9.0, 23.0, 21.0, 13.0, 11.0, 31.0, 23.0, 28.0, 32.0, 36.0, 28.0, 32.0, 34.0, 24.0, 44.0, 45.0, 46.0, 38.0, 34.0, 25.0, 34.0, 33.0, 35.0, 31.0, 33.0, 33.0, 25.0, 21.0, 18.0, 16.0, 19.0, 26.0, 15.0, 11.0, 14.0, 10.0, 3.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.12440747022628784, -0.12088853865861893, -0.11736960709095001, -0.1138506829738617, -0.11033175140619278, -0.10681281983852386, -0.10329389572143555, -0.09977496415376663, -0.09625603258609772, -0.0927371010184288, -0.08921816945075989, -0.08569924533367157, -0.08218031376600266, -0.07866138219833374, -0.07514245808124542, -0.07162352651357651, -0.06810459494590759, -0.06458566337823868, -0.06106673553586006, -0.057547807693481445, -0.05402887612581253, -0.050509944558143616, -0.046991016715765, -0.04347208887338638, -0.03995315730571747, -0.03643422573804855, -0.03291529789566994, -0.02939636819064617, -0.025877438485622406, -0.02235850878059864, -0.018839579075574875, -0.01532064937055111, -0.011801719665527344, -0.008282789960503578, -0.004763860255479813, -0.001244930550456047, 0.0022739991545677185, 0.005792928859591484, 0.00931185856461525, 0.012830788269639015, 0.01634971797466278, 0.019868647679686546, 0.023387577384710312, 0.026906507089734077, 0.030425436794757843, 0.03394436836242676, 0.037463296204805374, 0.04098222404718399, 0.044501155614852905, 0.04802008718252182, 0.051539015024900436, 0.05505794286727905, 0.05857687443494797, 0.06209580600261688, 0.0656147301197052, 0.06913366168737411, 0.07265259325504303, 0.07617152482271194, 0.07969045639038086, 0.08320938050746918, 0.08672831207513809, 0.090247243642807, 0.09376616775989532, 0.09728509932756424, 0.10080403089523315]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 10.0, 17.0, 13.0, 12.0, 12.0, 13.0, 27.0, 23.0, 23.0, 38.0, 29.0, 40.0, 30.0, 36.0, 34.0, 33.0, 39.0, 50.0, 39.0, 44.0, 37.0, 27.0, 46.0, 32.0, 38.0, 36.0, 26.0, 25.0, 25.0, 28.0, 14.0, 14.0, 21.0, 4.0, 8.0, 6.0, 6.0, 8.0, 6.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.564453125, -3.452423095703125, -3.34039306640625, -3.228363037109375, -3.1163330078125, -3.004302978515625, -2.89227294921875, -2.780242919921875, -2.668212890625, -2.556182861328125, -2.44415283203125, -2.332122802734375, -2.2200927734375, -2.108062744140625, -1.99603271484375, -1.884002685546875, -1.77197265625, -1.659942626953125, -1.54791259765625, -1.435882568359375, -1.3238525390625, -1.211822509765625, -1.09979248046875, -0.987762451171875, -0.875732421875, -0.763702392578125, -0.65167236328125, -0.539642333984375, -0.4276123046875, -0.315582275390625, -0.20355224609375, -0.091522216796875, 0.0205078125, 0.132537841796875, 0.24456787109375, 0.356597900390625, 0.4686279296875, 0.580657958984375, 0.69268798828125, 0.804718017578125, 0.916748046875, 1.028778076171875, 1.14080810546875, 1.252838134765625, 1.3648681640625, 1.476898193359375, 1.58892822265625, 1.700958251953125, 1.81298828125, 1.925018310546875, 2.03704833984375, 2.149078369140625, 2.2611083984375, 2.373138427734375, 2.48516845703125, 2.597198486328125, 2.709228515625, 2.821258544921875, 2.93328857421875, 3.045318603515625, 3.1573486328125, 3.269378662109375, 3.38140869140625, 3.493438720703125, 3.60546875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 9.0, 15.0, 17.0, 32.0, 28.0, 53.0, 86.0, 133.0, 201.0, 369.0, 668.0, 1315.0, 2510.0, 5280.0, 12006.0, 33847.0, 131052.0, 551645.0, 227876.0, 51210.0, 16343.0, 6866.0, 3234.0, 1746.0, 879.0, 441.0, 257.0, 158.0, 101.0, 40.0, 36.0, 30.0, 17.0, 9.0, 13.0, 9.0, 4.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375, -7.134521484375, -6.89404296875, -6.653564453125, -6.4130859375, -6.172607421875, -5.93212890625, -5.691650390625, -5.451171875, -5.210693359375, -4.97021484375, -4.729736328125, -4.4892578125, -4.248779296875, -4.00830078125, -3.767822265625, -3.52734375, -3.286865234375, -3.04638671875, -2.805908203125, -2.5654296875, -2.324951171875, -2.08447265625, -1.843994140625, -1.603515625, -1.363037109375, -1.12255859375, -0.882080078125, -0.6416015625, -0.401123046875, -0.16064453125, 0.079833984375, 0.3203125, 0.560791015625, 0.80126953125, 1.041748046875, 1.2822265625, 1.522705078125, 1.76318359375, 2.003662109375, 2.244140625, 2.484619140625, 2.72509765625, 2.965576171875, 3.2060546875, 3.446533203125, 3.68701171875, 3.927490234375, 4.16796875, 4.408447265625, 4.64892578125, 4.889404296875, 5.1298828125, 5.370361328125, 5.61083984375, 5.851318359375, 6.091796875, 6.332275390625, 6.57275390625, 6.813232421875, 7.0537109375, 7.294189453125, 7.53466796875, 7.775146484375, 8.015625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 8.0, 8.0, 11.0, 12.0, 11.0, 13.0, 17.0, 14.0, 25.0, 28.0, 27.0, 31.0, 27.0, 50.0, 50.0, 59.0, 90.0, 179.0, 271.0, 1399.0, 183.0, 106.0, 68.0, 56.0, 45.0, 28.0, 30.0, 24.0, 30.0, 22.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2265625, -11.8226318359375, -11.418701171875, -11.0147705078125, -10.61083984375, -10.2069091796875, -9.802978515625, -9.3990478515625, -8.9951171875, -8.5911865234375, -8.187255859375, -7.7833251953125, -7.37939453125, -6.9754638671875, -6.571533203125, -6.1676025390625, -5.763671875, -5.3597412109375, -4.955810546875, -4.5518798828125, -4.14794921875, -3.7440185546875, -3.340087890625, -2.9361572265625, -2.5322265625, -2.1282958984375, -1.724365234375, -1.3204345703125, -0.91650390625, -0.5125732421875, -0.108642578125, 0.2952880859375, 0.69921875, 1.1031494140625, 1.507080078125, 1.9110107421875, 2.31494140625, 2.7188720703125, 3.122802734375, 3.5267333984375, 3.9306640625, 4.3345947265625, 4.738525390625, 5.1424560546875, 5.54638671875, 5.9503173828125, 6.354248046875, 6.7581787109375, 7.162109375, 7.5660400390625, 7.969970703125, 8.3739013671875, 8.77783203125, 9.1817626953125, 9.585693359375, 9.9896240234375, 10.3935546875, 10.7974853515625, 11.201416015625, 11.6053466796875, 12.00927734375, 12.4132080078125, 12.817138671875, 13.2210693359375, 13.625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 14.0, 14.0, 21.0, 30.0, 40.0, 59.0, 81.0, 117.0, 191.0, 333.0, 1036.0, 4929.0, 52351.0, 2763173.0, 308172.0, 12056.0, 1831.0, 484.0, 209.0, 129.0, 113.0, 76.0, 58.0, 37.0, 30.0, 21.0, 20.0, 11.0, 8.0, 12.0, 6.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-29.328125, -28.529296875, -27.73046875, -26.931640625, -26.1328125, -25.333984375, -24.53515625, -23.736328125, -22.9375, -22.138671875, -21.33984375, -20.541015625, -19.7421875, -18.943359375, -18.14453125, -17.345703125, -16.546875, -15.748046875, -14.94921875, -14.150390625, -13.3515625, -12.552734375, -11.75390625, -10.955078125, -10.15625, -9.357421875, -8.55859375, -7.759765625, -6.9609375, -6.162109375, -5.36328125, -4.564453125, -3.765625, -2.966796875, -2.16796875, -1.369140625, -0.5703125, 0.228515625, 1.02734375, 1.826171875, 2.625, 3.423828125, 4.22265625, 5.021484375, 5.8203125, 6.619140625, 7.41796875, 8.216796875, 9.015625, 9.814453125, 10.61328125, 11.412109375, 12.2109375, 13.009765625, 13.80859375, 14.607421875, 15.40625, 16.205078125, 17.00390625, 17.802734375, 18.6015625, 19.400390625, 20.19921875, 20.998046875, 21.796875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 33.0, 869.0, 116.0, 0.0, 1.0], "bins": [-523.8014526367188, -515.15185546875, -506.5022888183594, -497.8526916503906, -489.203125, -480.55352783203125, -471.9039611816406, -463.2543640136719, -454.60479736328125, -445.9552001953125, -437.3056335449219, -428.6560363769531, -420.0064697265625, -411.35687255859375, -402.7073059082031, -394.0577087402344, -385.40814208984375, -376.758544921875, -368.1089782714844, -359.4593811035156, -350.809814453125, -342.16021728515625, -333.5106506347656, -324.8610534667969, -316.2114562988281, -307.5618591308594, -298.91229248046875, -290.2626953125, -281.6131286621094, -272.9635314941406, -264.31396484375, -255.66436767578125, -247.01480102539062, -238.36521911621094, -229.71563720703125, -221.06605529785156, -212.41647338867188, -203.7668914794922, -195.1173095703125, -186.46771240234375, -177.81814575195312, -169.16856384277344, -160.51898193359375, -151.86940002441406, -143.21981811523438, -134.5702362060547, -125.92064666748047, -117.27106475830078, -108.62147521972656, -99.97189331054688, -91.32231140136719, -82.6727294921875, -74.02314758300781, -65.37356567382812, -56.723976135253906, -48.07439422607422, -39.4248161315918, -30.77523422241211, -22.12565040588379, -13.476066589355469, -4.826484680175781, 3.8230972290039062, 12.47268295288086, 21.122264862060547, 29.771846771240234]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 4.0, 11.0, 15.0, 13.0, 16.0, 12.0, 25.0, 24.0, 35.0, 20.0, 31.0, 30.0, 25.0, 31.0, 42.0, 33.0, 54.0, 44.0, 40.0, 35.0, 45.0, 46.0, 30.0, 33.0, 34.0, 27.0, 28.0, 25.0, 22.0, 29.0, 27.0, 21.0, 16.0, 15.0, 5.0, 7.0, 5.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.258506774902344, -37.966331481933594, -36.674156188964844, -35.38197708129883, -34.08980178833008, -32.79762649536133, -31.505449295043945, -30.213272094726562, -28.921096801757812, -27.628921508789062, -26.33674430847168, -25.044567108154297, -23.752391815185547, -22.460216522216797, -21.168039321899414, -19.87586212158203, -18.58368682861328, -17.29151153564453, -15.999334335327148, -14.707158088684082, -13.414981842041016, -12.12280559539795, -10.830629348754883, -9.538453102111816, -8.24627685546875, -6.954100608825684, -5.661924362182617, -4.369748115539551, -3.0775718688964844, -1.785395622253418, -0.49321937561035156, 0.7989568710327148, 2.091136932373047, 3.3833131790161133, 4.67548942565918, 5.967665672302246, 7.2598419189453125, 8.552018165588379, 9.844194412231445, 11.136370658874512, 12.428546905517578, 13.720723152160645, 15.012899398803711, 16.305076599121094, 17.597251892089844, 18.889427185058594, 20.181604385375977, 21.47378158569336, 22.76595687866211, 24.05813217163086, 25.350309371948242, 26.642486572265625, 27.934661865234375, 29.226837158203125, 30.519014358520508, 31.81119155883789, 33.10336685180664, 34.39554214477539, 35.687721252441406, 36.979896545410156, 38.272071838378906, 39.564247131347656, 40.856422424316406, 42.14860153198242, 43.44077682495117]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 8.0, 3.0, 13.0, 14.0, 15.0, 13.0, 26.0, 24.0, 32.0, 26.0, 26.0, 39.0, 35.0, 45.0, 34.0, 42.0, 39.0, 39.0, 40.0, 42.0, 41.0, 40.0, 39.0, 41.0, 32.0, 35.0, 32.0, 25.0, 24.0, 23.0, 15.0, 18.0, 14.0, 15.0, 7.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.19921875, -4.07623291015625, -3.9532470703125, -3.83026123046875, -3.707275390625, -3.58428955078125, -3.4613037109375, -3.33831787109375, -3.21533203125, -3.09234619140625, -2.9693603515625, -2.84637451171875, -2.723388671875, -2.60040283203125, -2.4774169921875, -2.35443115234375, -2.2314453125, -2.10845947265625, -1.9854736328125, -1.86248779296875, -1.739501953125, -1.61651611328125, -1.4935302734375, -1.37054443359375, -1.24755859375, -1.12457275390625, -1.0015869140625, -0.87860107421875, -0.755615234375, -0.63262939453125, -0.5096435546875, -0.38665771484375, -0.263671875, -0.14068603515625, -0.0177001953125, 0.10528564453125, 0.228271484375, 0.35125732421875, 0.4742431640625, 0.59722900390625, 0.72021484375, 0.84320068359375, 0.9661865234375, 1.08917236328125, 1.212158203125, 1.33514404296875, 1.4581298828125, 1.58111572265625, 1.7041015625, 1.82708740234375, 1.9500732421875, 2.07305908203125, 2.196044921875, 2.31903076171875, 2.4420166015625, 2.56500244140625, 2.68798828125, 2.81097412109375, 2.9339599609375, 3.05694580078125, 3.179931640625, 3.30291748046875, 3.4259033203125, 3.54888916015625, 3.671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 10.0, 15.0, 20.0, 30.0, 30.0, 54.0, 66.0, 133.0, 186.0, 293.0, 504.0, 786.0, 1464.0, 3045.0, 7169.0, 19915.0, 65713.0, 246231.0, 962668.0, 1838904.0, 769011.0, 196362.0, 53730.0, 16512.0, 5967.0, 2581.0, 1240.0, 639.0, 372.0, 217.0, 144.0, 94.0, 60.0, 31.0, 20.0, 20.0, 11.0, 11.0, 7.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.45635986328125, -6.2291259765625, -6.00189208984375, -5.774658203125, -5.54742431640625, -5.3201904296875, -5.09295654296875, -4.86572265625, -4.63848876953125, -4.4112548828125, -4.18402099609375, -3.956787109375, -3.72955322265625, -3.5023193359375, -3.27508544921875, -3.0478515625, -2.82061767578125, -2.5933837890625, -2.36614990234375, -2.138916015625, -1.91168212890625, -1.6844482421875, -1.45721435546875, -1.22998046875, -1.00274658203125, -0.7755126953125, -0.54827880859375, -0.321044921875, -0.09381103515625, 0.1334228515625, 0.36065673828125, 0.587890625, 0.81512451171875, 1.0423583984375, 1.26959228515625, 1.496826171875, 1.72406005859375, 1.9512939453125, 2.17852783203125, 2.40576171875, 2.63299560546875, 2.8602294921875, 3.08746337890625, 3.314697265625, 3.54193115234375, 3.7691650390625, 3.99639892578125, 4.2236328125, 4.45086669921875, 4.6781005859375, 4.90533447265625, 5.132568359375, 5.35980224609375, 5.5870361328125, 5.81427001953125, 6.04150390625, 6.26873779296875, 6.4959716796875, 6.72320556640625, 6.950439453125, 7.17767333984375, 7.4049072265625, 7.63214111328125, 7.859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 10.0, 14.0, 3.0, 11.0, 18.0, 27.0, 37.0, 32.0, 32.0, 67.0, 73.0, 102.0, 116.0, 140.0, 183.0, 213.0, 259.0, 340.0, 337.0, 343.0, 291.0, 299.0, 226.0, 177.0, 153.0, 123.0, 118.0, 69.0, 50.0, 48.0, 31.0, 23.0, 27.0, 25.0, 8.0, 11.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.546875, -8.30328369140625, -8.0596923828125, -7.81610107421875, -7.572509765625, -7.32891845703125, -7.0853271484375, -6.84173583984375, -6.59814453125, -6.35455322265625, -6.1109619140625, -5.86737060546875, -5.623779296875, -5.38018798828125, -5.1365966796875, -4.89300537109375, -4.6494140625, -4.40582275390625, -4.1622314453125, -3.91864013671875, -3.675048828125, -3.43145751953125, -3.1878662109375, -2.94427490234375, -2.70068359375, -2.45709228515625, -2.2135009765625, -1.96990966796875, -1.726318359375, -1.48272705078125, -1.2391357421875, -0.99554443359375, -0.751953125, -0.50836181640625, -0.2647705078125, -0.02117919921875, 0.222412109375, 0.46600341796875, 0.7095947265625, 0.95318603515625, 1.19677734375, 1.44036865234375, 1.6839599609375, 1.92755126953125, 2.171142578125, 2.41473388671875, 2.6583251953125, 2.90191650390625, 3.1455078125, 3.38909912109375, 3.6326904296875, 3.87628173828125, 4.119873046875, 4.36346435546875, 4.6070556640625, 4.85064697265625, 5.09423828125, 5.33782958984375, 5.5814208984375, 5.82501220703125, 6.068603515625, 6.31219482421875, 6.5557861328125, 6.79937744140625, 7.04296875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 15.0, 14.0, 24.0, 25.0, 36.0, 45.0, 71.0, 132.0, 170.0, 262.0, 406.0, 779.0, 1482.0, 2816.0, 6035.0, 14485.0, 36675.0, 99017.0, 277813.0, 750306.0, 1443728.0, 970899.0, 373979.0, 132749.0, 48317.0, 18567.0, 7644.0, 3616.0, 1816.0, 902.0, 520.0, 296.0, 202.0, 145.0, 78.0, 58.0, 43.0, 31.0, 23.0, 24.0, 6.0, 7.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.125, -7.85986328125, -7.5947265625, -7.32958984375, -7.064453125, -6.79931640625, -6.5341796875, -6.26904296875, -6.00390625, -5.73876953125, -5.4736328125, -5.20849609375, -4.943359375, -4.67822265625, -4.4130859375, -4.14794921875, -3.8828125, -3.61767578125, -3.3525390625, -3.08740234375, -2.822265625, -2.55712890625, -2.2919921875, -2.02685546875, -1.76171875, -1.49658203125, -1.2314453125, -0.96630859375, -0.701171875, -0.43603515625, -0.1708984375, 0.09423828125, 0.359375, 0.62451171875, 0.8896484375, 1.15478515625, 1.419921875, 1.68505859375, 1.9501953125, 2.21533203125, 2.48046875, 2.74560546875, 3.0107421875, 3.27587890625, 3.541015625, 3.80615234375, 4.0712890625, 4.33642578125, 4.6015625, 4.86669921875, 5.1318359375, 5.39697265625, 5.662109375, 5.92724609375, 6.1923828125, 6.45751953125, 6.72265625, 6.98779296875, 7.2529296875, 7.51806640625, 7.783203125, 8.04833984375, 8.3134765625, 8.57861328125, 8.84375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 16.0, 13.0, 34.0, 26.0, 28.0, 38.0, 45.0, 73.0, 59.0, 65.0, 86.0, 78.0, 77.0, 61.0, 58.0, 61.0, 50.0, 34.0, 20.0, 28.0, 21.0, 9.0, 6.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.32598876953125, -37.020225524902344, -35.7144660949707, -34.4087028503418, -33.10293960571289, -31.797178268432617, -30.491416931152344, -29.185653686523438, -27.879892349243164, -26.57413101196289, -25.268367767333984, -23.96260643005371, -22.656845092773438, -21.35108184814453, -20.045320510864258, -18.739559173583984, -17.433795928955078, -16.128034591674805, -14.822271347045898, -13.516510009765625, -12.210747718811035, -10.904985427856445, -9.599224090576172, -8.293461799621582, -6.987699508666992, -5.681937217712402, -4.376175403594971, -3.07041335105896, -1.7646512985229492, -0.4588890075683594, 0.8468728065490723, 2.152634620666504, 3.458393096923828, 4.764155387878418, 6.06991720199585, 7.375679016113281, 8.681441307067871, 9.987203598022461, 11.292964935302734, 12.598727226257324, 13.904489517211914, 15.210251808166504, 16.516014099121094, 17.821775436401367, 19.12753677368164, 20.433300018310547, 21.73906135559082, 23.044822692871094, 24.3505859375, 25.656347274780273, 26.96211051940918, 28.267871856689453, 29.57363510131836, 30.879396438598633, 32.185157775878906, 33.49092102050781, 34.79668426513672, 36.102447509765625, 37.408206939697266, 38.71397018432617, 40.01973342895508, 41.32549285888672, 42.631256103515625, 43.93701934814453, 45.24277877807617]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 13.0, 15.0, 13.0, 17.0, 19.0, 26.0, 29.0, 34.0, 38.0, 37.0, 42.0, 42.0, 42.0, 51.0, 56.0, 33.0, 47.0, 37.0, 33.0, 42.0, 38.0, 31.0, 46.0, 24.0, 22.0, 15.0, 24.0, 25.0, 14.0, 20.0, 8.0, 16.0, 5.0, 4.0, 3.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-37.106422424316406, -36.03651428222656, -34.966609954833984, -33.89670181274414, -32.82679748535156, -31.75688934326172, -30.686983108520508, -29.617076873779297, -28.547170639038086, -27.477264404296875, -26.407358169555664, -25.337451934814453, -24.26754379272461, -23.19763946533203, -22.127731323242188, -21.057825088500977, -19.987918853759766, -18.918012619018555, -17.848106384277344, -16.778200149536133, -15.708292961120605, -14.638386726379395, -13.568479537963867, -12.498573303222656, -11.428667068481445, -10.358760833740234, -9.288854598999023, -8.218947410583496, -7.149041175842285, -6.079134941101074, -5.009228229522705, -3.939321517944336, -2.8694114685058594, -1.7995049953460693, -0.7295985221862793, 0.34030795097351074, 1.4102144241333008, 2.4801206588745117, 3.550027370452881, 4.61993408203125, 5.689840316772461, 6.759746551513672, 7.829653263092041, 8.89955997467041, 9.969466209411621, 11.039372444152832, 12.10927963256836, 13.17918586730957, 14.249092102050781, 15.318998336791992, 16.388904571533203, 17.458810806274414, 18.528717041015625, 19.59862518310547, 20.66853141784668, 21.73843765258789, 22.8083438873291, 23.878250122070312, 24.948156356811523, 26.018062591552734, 27.087970733642578, 28.157875061035156, 29.227783203125, 30.29768943786621, 31.367595672607422]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 2.0, 6.0, 10.0, 10.0, 12.0, 11.0, 15.0, 11.0, 25.0, 27.0, 37.0, 37.0, 40.0, 38.0, 43.0, 34.0, 42.0, 44.0, 49.0, 52.0, 57.0, 45.0, 44.0, 48.0, 34.0, 39.0, 30.0, 28.0, 29.0, 29.0, 16.0, 13.0, 10.0, 9.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.14801025390625, -3.9991455078125, -3.85028076171875, -3.701416015625, -3.55255126953125, -3.4036865234375, -3.25482177734375, -3.10595703125, -2.95709228515625, -2.8082275390625, -2.65936279296875, -2.510498046875, -2.36163330078125, -2.2127685546875, -2.06390380859375, -1.9150390625, -1.76617431640625, -1.6173095703125, -1.46844482421875, -1.319580078125, -1.17071533203125, -1.0218505859375, -0.87298583984375, -0.72412109375, -0.57525634765625, -0.4263916015625, -0.27752685546875, -0.128662109375, 0.02020263671875, 0.1690673828125, 0.31793212890625, 0.466796875, 0.61566162109375, 0.7645263671875, 0.91339111328125, 1.062255859375, 1.21112060546875, 1.3599853515625, 1.50885009765625, 1.65771484375, 1.80657958984375, 1.9554443359375, 2.10430908203125, 2.253173828125, 2.40203857421875, 2.5509033203125, 2.69976806640625, 2.8486328125, 2.99749755859375, 3.1463623046875, 3.29522705078125, 3.444091796875, 3.59295654296875, 3.7418212890625, 3.89068603515625, 4.03955078125, 4.18841552734375, 4.3372802734375, 4.48614501953125, 4.635009765625, 4.78387451171875, 4.9327392578125, 5.08160400390625, 5.23046875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 11.0, 9.0, 9.0, 27.0, 24.0, 50.0, 46.0, 78.0, 108.0, 169.0, 251.0, 353.0, 550.0, 791.0, 1398.0, 2329.0, 4566.0, 9117.0, 20233.0, 45599.0, 99662.0, 191692.0, 261130.0, 205421.0, 109863.0, 50525.0, 22720.0, 10187.0, 5022.0, 2554.0, 1470.0, 830.0, 577.0, 350.0, 252.0, 150.0, 121.0, 84.0, 68.0, 46.0, 36.0, 27.0, 16.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.572265625, -1.52398681640625, -1.4757080078125, -1.42742919921875, -1.379150390625, -1.33087158203125, -1.2825927734375, -1.23431396484375, -1.18603515625, -1.13775634765625, -1.0894775390625, -1.04119873046875, -0.992919921875, -0.94464111328125, -0.8963623046875, -0.84808349609375, -0.7998046875, -0.75152587890625, -0.7032470703125, -0.65496826171875, -0.606689453125, -0.55841064453125, -0.5101318359375, -0.46185302734375, -0.41357421875, -0.36529541015625, -0.3170166015625, -0.26873779296875, -0.220458984375, -0.17218017578125, -0.1239013671875, -0.07562255859375, -0.02734375, 0.02093505859375, 0.0692138671875, 0.11749267578125, 0.165771484375, 0.21405029296875, 0.2623291015625, 0.31060791015625, 0.35888671875, 0.40716552734375, 0.4554443359375, 0.50372314453125, 0.552001953125, 0.60028076171875, 0.6485595703125, 0.69683837890625, 0.7451171875, 0.79339599609375, 0.8416748046875, 0.88995361328125, 0.938232421875, 0.98651123046875, 1.0347900390625, 1.08306884765625, 1.13134765625, 1.17962646484375, 1.2279052734375, 1.27618408203125, 1.324462890625, 1.37274169921875, 1.4210205078125, 1.46929931640625, 1.517578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 10.0, 9.0, 12.0, 9.0, 15.0, 16.0, 14.0, 25.0, 19.0, 23.0, 32.0, 35.0, 37.0, 36.0, 37.0, 34.0, 25.0, 32.0, 1064.0, 27.0, 41.0, 38.0, 53.0, 26.0, 28.0, 25.0, 28.0, 30.0, 31.0, 37.0, 22.0, 15.0, 23.0, 16.0, 17.0, 17.0, 18.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.5546875, -3.449066162109375, -3.34344482421875, -3.237823486328125, -3.1322021484375, -3.026580810546875, -2.92095947265625, -2.815338134765625, -2.709716796875, -2.604095458984375, -2.49847412109375, -2.392852783203125, -2.2872314453125, -2.181610107421875, -2.07598876953125, -1.970367431640625, -1.86474609375, -1.759124755859375, -1.65350341796875, -1.547882080078125, -1.4422607421875, -1.336639404296875, -1.23101806640625, -1.125396728515625, -1.019775390625, -0.914154052734375, -0.80853271484375, -0.702911376953125, -0.5972900390625, -0.491668701171875, -0.38604736328125, -0.280426025390625, -0.1748046875, -0.069183349609375, 0.03643798828125, 0.142059326171875, 0.2476806640625, 0.353302001953125, 0.45892333984375, 0.564544677734375, 0.670166015625, 0.775787353515625, 0.88140869140625, 0.987030029296875, 1.0926513671875, 1.198272705078125, 1.30389404296875, 1.409515380859375, 1.51513671875, 1.620758056640625, 1.72637939453125, 1.832000732421875, 1.9376220703125, 2.043243408203125, 2.14886474609375, 2.254486083984375, 2.360107421875, 2.465728759765625, 2.57135009765625, 2.676971435546875, 2.7825927734375, 2.888214111328125, 2.99383544921875, 3.099456787109375, 3.205078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 11.0, 12.0, 15.0, 29.0, 23.0, 39.0, 60.0, 114.0, 142.0, 227.0, 315.0, 558.0, 968.0, 1849.0, 3918.0, 8910.0, 22490.0, 59410.0, 159348.0, 989698.0, 616565.0, 142815.0, 53558.0, 20192.0, 8097.0, 3676.0, 1758.0, 878.0, 529.0, 340.0, 187.0, 122.0, 83.0, 65.0, 37.0, 29.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.84423828125, -0.81781005859375, -0.7913818359375, -0.76495361328125, -0.738525390625, -0.71209716796875, -0.6856689453125, -0.65924072265625, -0.6328125, -0.60638427734375, -0.5799560546875, -0.55352783203125, -0.527099609375, -0.50067138671875, -0.4742431640625, -0.44781494140625, -0.42138671875, -0.39495849609375, -0.3685302734375, -0.34210205078125, -0.315673828125, -0.28924560546875, -0.2628173828125, -0.23638916015625, -0.2099609375, -0.18353271484375, -0.1571044921875, -0.13067626953125, -0.104248046875, -0.07781982421875, -0.0513916015625, -0.02496337890625, 0.00146484375, 0.02789306640625, 0.0543212890625, 0.08074951171875, 0.107177734375, 0.13360595703125, 0.1600341796875, 0.18646240234375, 0.212890625, 0.23931884765625, 0.2657470703125, 0.29217529296875, 0.318603515625, 0.34503173828125, 0.3714599609375, 0.39788818359375, 0.42431640625, 0.45074462890625, 0.4771728515625, 0.50360107421875, 0.530029296875, 0.55645751953125, 0.5828857421875, 0.60931396484375, 0.6357421875, 0.66217041015625, 0.6885986328125, 0.71502685546875, 0.741455078125, 0.76788330078125, 0.7943115234375, 0.82073974609375, 0.84716796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 15.0, 10.0, 22.0, 20.0, 34.0, 38.0, 88.0, 179.0, 250.0, 118.0, 66.0, 48.0, 26.0, 20.0, 15.0, 14.0, 11.0, 6.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268798828125, -0.25930023193359375, -0.2498016357421875, -0.24030303955078125, -0.230804443359375, -0.22130584716796875, -0.2118072509765625, -0.20230865478515625, -0.19281005859375, -0.18331146240234375, -0.1738128662109375, -0.16431427001953125, -0.154815673828125, -0.14531707763671875, -0.1358184814453125, -0.12631988525390625, -0.1168212890625, -0.10732269287109375, -0.0978240966796875, -0.08832550048828125, -0.078826904296875, -0.06932830810546875, -0.0598297119140625, -0.05033111572265625, -0.04083251953125, -0.03133392333984375, -0.0218353271484375, -0.01233673095703125, -0.002838134765625, 0.00666046142578125, 0.0161590576171875, 0.02565765380859375, 0.03515625, 0.04465484619140625, 0.0541534423828125, 0.06365203857421875, 0.073150634765625, 0.08264923095703125, 0.0921478271484375, 0.10164642333984375, 0.11114501953125, 0.12064361572265625, 0.1301422119140625, 0.13964080810546875, 0.149139404296875, 0.15863800048828125, 0.1681365966796875, 0.17763519287109375, 0.1871337890625, 0.19663238525390625, 0.2061309814453125, 0.21562957763671875, 0.225128173828125, 0.23462677001953125, 0.2441253662109375, 0.25362396240234375, 0.26312255859375, 0.27262115478515625, 0.2821197509765625, 0.29161834716796875, 0.301116943359375, 0.31061553955078125, 0.3201141357421875, 0.32961273193359375, 0.339111328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 3.0, 12.0, 7.0, 8.0, 15.0, 22.0, 37.0, 49.0, 81.0, 125.0, 216.0, 496.0, 8878.0, 1029330.0, 8184.0, 510.0, 202.0, 133.0, 70.0, 60.0, 36.0, 22.0, 15.0, 9.0, 10.0, 8.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.93359375, -4.794586181640625, -4.65557861328125, -4.516571044921875, -4.3775634765625, -4.238555908203125, -4.09954833984375, -3.960540771484375, -3.821533203125, -3.682525634765625, -3.54351806640625, -3.404510498046875, -3.2655029296875, -3.126495361328125, -2.98748779296875, -2.848480224609375, -2.70947265625, -2.570465087890625, -2.43145751953125, -2.292449951171875, -2.1534423828125, -2.014434814453125, -1.87542724609375, -1.736419677734375, -1.597412109375, -1.458404541015625, -1.31939697265625, -1.180389404296875, -1.0413818359375, -0.902374267578125, -0.76336669921875, -0.624359130859375, -0.4853515625, -0.346343994140625, -0.20733642578125, -0.068328857421875, 0.0706787109375, 0.209686279296875, 0.34869384765625, 0.487701416015625, 0.626708984375, 0.765716552734375, 0.90472412109375, 1.043731689453125, 1.1827392578125, 1.321746826171875, 1.46075439453125, 1.599761962890625, 1.73876953125, 1.877777099609375, 2.01678466796875, 2.155792236328125, 2.2947998046875, 2.433807373046875, 2.57281494140625, 2.711822509765625, 2.850830078125, 2.989837646484375, 3.12884521484375, 3.267852783203125, 3.4068603515625, 3.545867919921875, 3.68487548828125, 3.823883056640625, 3.962890625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 14.0, 23.0, 69.0, 211.0, 424.0, 172.0, 45.0, 24.0, 12.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4938514530658722, -0.45701518654823303, -0.42017892003059387, -0.3833426833152771, -0.34650641679763794, -0.3096701502799988, -0.2728338837623596, -0.23599761724472046, -0.1991613507270813, -0.16232508420944214, -0.12548881769180298, -0.08865256607532501, -0.05181629955768585, -0.014980033040046692, 0.021856218576431274, 0.058692485094070435, 0.0955287516117096, 0.13236501812934875, 0.16920128464698792, 0.20603753626346588, 0.24287380278110504, 0.279710054397583, 0.31654632091522217, 0.35338258743286133, 0.3902188539505005, 0.42705512046813965, 0.4638913869857788, 0.500727653503418, 0.5375639200210571, 0.5744001865386963, 0.6112364530563354, 0.6480727195739746, 0.6849088668823242, 0.7217451333999634, 0.7585813999176025, 0.7954176664352417, 0.8322539329528809, 0.86909019947052, 0.9059264659881592, 0.9427627325057983, 0.9795989990234375, 1.0164352655410767, 1.0532715320587158, 1.090107798576355, 1.1269440650939941, 1.1637803316116333, 1.2006165981292725, 1.2374528646469116, 1.2742891311645508, 1.31112539768219, 1.347961664199829, 1.3847979307174683, 1.4216341972351074, 1.4584704637527466, 1.4953067302703857, 1.532142996788025, 1.5689791440963745, 1.6058154106140137, 1.6426516771316528, 1.679487943649292, 1.7163242101669312, 1.7531604766845703, 1.7899967432022095, 1.8268330097198486, 1.8636692762374878]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 7.0, 4.0, 6.0, 3.0, 20.0, 9.0, 21.0, 22.0, 20.0, 18.0, 30.0, 18.0, 35.0, 25.0, 38.0, 33.0, 41.0, 33.0, 44.0, 31.0, 42.0, 36.0, 44.0, 43.0, 43.0, 33.0, 32.0, 39.0, 21.0, 23.0, 22.0, 22.0, 19.0, 23.0, 13.0, 18.0, 15.0, 6.0, 20.0, 3.0, 9.0, 2.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3218487501144409, -0.31107431650161743, -0.30029988288879395, -0.28952547907829285, -0.27875104546546936, -0.2679766118526459, -0.2572022080421448, -0.2464277744293213, -0.2356533408164978, -0.22487890720367432, -0.21410448849201202, -0.20333006978034973, -0.19255563616752625, -0.18178120255470276, -0.17100678384304047, -0.16023236513137817, -0.1494579315185547, -0.1386834979057312, -0.1279090791940689, -0.11713465303182602, -0.10636022686958313, -0.09558580070734024, -0.08481137454509735, -0.07403694838285446, -0.06326252222061157, -0.05248809605836868, -0.04171366989612579, -0.030939243733882904, -0.020164817571640015, -0.009390391409397125, 0.0013840347528457642, 0.012158460915088654, 0.022932887077331543, 0.03370731323957443, 0.04448173940181732, 0.05525616556406021, 0.0660305917263031, 0.07680501788854599, 0.08757944405078888, 0.09835387021303177, 0.10912829637527466, 0.11990272253751755, 0.13067714869976044, 0.14145156741142273, 0.15222600102424622, 0.1630004346370697, 0.173774853348732, 0.1845492720603943, 0.19532370567321777, 0.20609813928604126, 0.21687255799770355, 0.22764697670936584, 0.23842141032218933, 0.24919584393501282, 0.2599702477455139, 0.2707446813583374, 0.2815191149711609, 0.2922935485839844, 0.30306798219680786, 0.31384238600730896, 0.32461681962013245, 0.33539125323295593, 0.34616565704345703, 0.3569400906562805, 0.367714524269104]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 10.0, 8.0, 7.0, 8.0, 14.0, 15.0, 19.0, 17.0, 23.0, 38.0, 33.0, 27.0, 43.0, 53.0, 44.0, 44.0, 33.0, 47.0, 45.0, 47.0, 41.0, 43.0, 37.0, 39.0, 35.0, 39.0, 35.0, 20.0, 28.0, 17.0, 19.0, 21.0, 7.0, 6.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.421875, -4.2803955078125, -4.138916015625, -3.9974365234375, -3.85595703125, -3.7144775390625, -3.572998046875, -3.4315185546875, -3.2900390625, -3.1485595703125, -3.007080078125, -2.8656005859375, -2.72412109375, -2.5826416015625, -2.441162109375, -2.2996826171875, -2.158203125, -2.0167236328125, -1.875244140625, -1.7337646484375, -1.59228515625, -1.4508056640625, -1.309326171875, -1.1678466796875, -1.0263671875, -0.8848876953125, -0.743408203125, -0.6019287109375, -0.46044921875, -0.3189697265625, -0.177490234375, -0.0360107421875, 0.10546875, 0.2469482421875, 0.388427734375, 0.5299072265625, 0.67138671875, 0.8128662109375, 0.954345703125, 1.0958251953125, 1.2373046875, 1.3787841796875, 1.520263671875, 1.6617431640625, 1.80322265625, 1.9447021484375, 2.086181640625, 2.2276611328125, 2.369140625, 2.5106201171875, 2.652099609375, 2.7935791015625, 2.93505859375, 3.0765380859375, 3.218017578125, 3.3594970703125, 3.5009765625, 3.6424560546875, 3.783935546875, 3.9254150390625, 4.06689453125, 4.2083740234375, 4.349853515625, 4.4913330078125, 4.6328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 10.0, 11.0, 11.0, 23.0, 22.0, 42.0, 74.0, 110.0, 157.0, 259.0, 365.0, 588.0, 1017.0, 1599.0, 2374.0, 3943.0, 6432.0, 10514.0, 18262.0, 35354.0, 81852.0, 207724.0, 330352.0, 194179.0, 75978.0, 33373.0, 17549.0, 10189.0, 5960.0, 3819.0, 2310.0, 1473.0, 971.0, 606.0, 342.0, 237.0, 156.0, 99.0, 76.0, 54.0, 30.0, 24.0, 10.0, 14.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.166748046875, -4.00927734375, -3.851806640625, -3.6943359375, -3.536865234375, -3.37939453125, -3.221923828125, -3.064453125, -2.906982421875, -2.74951171875, -2.592041015625, -2.4345703125, -2.277099609375, -2.11962890625, -1.962158203125, -1.8046875, -1.647216796875, -1.48974609375, -1.332275390625, -1.1748046875, -1.017333984375, -0.85986328125, -0.702392578125, -0.544921875, -0.387451171875, -0.22998046875, -0.072509765625, 0.0849609375, 0.242431640625, 0.39990234375, 0.557373046875, 0.71484375, 0.872314453125, 1.02978515625, 1.187255859375, 1.3447265625, 1.502197265625, 1.65966796875, 1.817138671875, 1.974609375, 2.132080078125, 2.28955078125, 2.447021484375, 2.6044921875, 2.761962890625, 2.91943359375, 3.076904296875, 3.234375, 3.391845703125, 3.54931640625, 3.706787109375, 3.8642578125, 4.021728515625, 4.17919921875, 4.336669921875, 4.494140625, 4.651611328125, 4.80908203125, 4.966552734375, 5.1240234375, 5.281494140625, 5.43896484375, 5.596435546875, 5.75390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 4.0, 9.0, 12.0, 12.0, 18.0, 18.0, 13.0, 15.0, 21.0, 29.0, 36.0, 32.0, 37.0, 49.0, 52.0, 73.0, 97.0, 163.0, 286.0, 1315.0, 206.0, 98.0, 77.0, 46.0, 39.0, 54.0, 35.0, 32.0, 20.0, 15.0, 16.0, 17.0, 15.0, 15.0, 12.0, 16.0, 11.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.6171875, -15.146240234375, -14.67529296875, -14.204345703125, -13.7333984375, -13.262451171875, -12.79150390625, -12.320556640625, -11.849609375, -11.378662109375, -10.90771484375, -10.436767578125, -9.9658203125, -9.494873046875, -9.02392578125, -8.552978515625, -8.08203125, -7.611083984375, -7.14013671875, -6.669189453125, -6.1982421875, -5.727294921875, -5.25634765625, -4.785400390625, -4.314453125, -3.843505859375, -3.37255859375, -2.901611328125, -2.4306640625, -1.959716796875, -1.48876953125, -1.017822265625, -0.546875, -0.075927734375, 0.39501953125, 0.865966796875, 1.3369140625, 1.807861328125, 2.27880859375, 2.749755859375, 3.220703125, 3.691650390625, 4.16259765625, 4.633544921875, 5.1044921875, 5.575439453125, 6.04638671875, 6.517333984375, 6.98828125, 7.459228515625, 7.93017578125, 8.401123046875, 8.8720703125, 9.343017578125, 9.81396484375, 10.284912109375, 10.755859375, 11.226806640625, 11.69775390625, 12.168701171875, 12.6396484375, 13.110595703125, 13.58154296875, 14.052490234375, 14.5234375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 16.0, 21.0, 30.0, 35.0, 42.0, 59.0, 95.0, 176.0, 314.0, 720.0, 3301.0, 86758.0, 2996006.0, 54024.0, 2683.0, 612.0, 296.0, 162.0, 109.0, 50.0, 40.0, 36.0, 28.0, 23.0, 16.0, 8.0, 9.0, 7.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.28125, -45.98388671875, -44.6865234375, -43.38916015625, -42.091796875, -40.79443359375, -39.4970703125, -38.19970703125, -36.90234375, -35.60498046875, -34.3076171875, -33.01025390625, -31.712890625, -30.41552734375, -29.1181640625, -27.82080078125, -26.5234375, -25.22607421875, -23.9287109375, -22.63134765625, -21.333984375, -20.03662109375, -18.7392578125, -17.44189453125, -16.14453125, -14.84716796875, -13.5498046875, -12.25244140625, -10.955078125, -9.65771484375, -8.3603515625, -7.06298828125, -5.765625, -4.46826171875, -3.1708984375, -1.87353515625, -0.576171875, 0.72119140625, 2.0185546875, 3.31591796875, 4.61328125, 5.91064453125, 7.2080078125, 8.50537109375, 9.802734375, 11.10009765625, 12.3974609375, 13.69482421875, 14.9921875, 16.28955078125, 17.5869140625, 18.88427734375, 20.181640625, 21.47900390625, 22.7763671875, 24.07373046875, 25.37109375, 26.66845703125, 27.9658203125, 29.26318359375, 30.560546875, 31.85791015625, 33.1552734375, 34.45263671875, 35.75]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 402.0, 602.0, 11.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.25464630126953, -48.726661682128906, -39.198673248291016, -29.670686721801758, -20.1427001953125, -10.614715576171875, -1.0867271423339844, 8.441261291503906, 17.96924591064453, 27.49723243713379, 37.02521896362305, 46.55320739746094, 56.08119201660156, 65.60917663574219, 75.13716125488281, 84.66515350341797, 94.1931381225586, 103.72112274169922, 113.24911499023438, 122.777099609375, 132.30508422851562, 141.83306884765625, 151.36105346679688, 160.8890380859375, 170.41702270507812, 179.94500732421875, 189.47299194335938, 199.0009765625, 208.52896118164062, 218.05694580078125, 227.58494567871094, 237.11293029785156, 246.64093017578125, 256.1689147949219, 265.6968994140625, 275.2248840332031, 284.75286865234375, 294.2808532714844, 303.808837890625, 313.33685302734375, 322.86480712890625, 332.3927917480469, 341.9207763671875, 351.4487609863281, 360.97674560546875, 370.5047302246094, 380.03271484375, 389.56072998046875, 399.0887145996094, 408.61669921875, 418.1446838378906, 427.67266845703125, 437.2006530761719, 446.7286376953125, 456.2566223144531, 465.78460693359375, 475.3126220703125, 484.8406066894531, 494.36859130859375, 503.8965759277344, 513.424560546875, 522.9525756835938, 532.4805297851562, 542.008544921875, 551.5364990234375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 5.0, 8.0, 7.0, 12.0, 16.0, 21.0, 14.0, 19.0, 24.0, 18.0, 26.0, 27.0, 30.0, 33.0, 37.0, 41.0, 27.0, 31.0, 41.0, 40.0, 45.0, 38.0, 36.0, 43.0, 37.0, 38.0, 50.0, 35.0, 24.0, 26.0, 22.0, 18.0, 25.0, 18.0, 15.0, 11.0, 6.0, 7.0, 9.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-44.93398666381836, -43.652259826660156, -42.37052917480469, -41.088802337646484, -39.80707550048828, -38.52534866333008, -37.24361801147461, -35.961891174316406, -34.6801643371582, -33.3984375, -32.11670684814453, -30.834980010986328, -29.553253173828125, -28.27152442932129, -26.989795684814453, -25.70806884765625, -24.426340103149414, -23.144611358642578, -21.862884521484375, -20.58115577697754, -19.299428939819336, -18.0177001953125, -16.735973358154297, -15.454244613647461, -14.172516822814941, -12.890789031982422, -11.609061241149902, -10.327333450317383, -9.045604705810547, -7.7638773918151855, -6.482149124145508, -5.200421333312988, -3.9186935424804688, -2.636965751647949, -1.3552377223968506, -0.07350969314575195, 1.2082180976867676, 2.489945888519287, 3.771674156188965, 5.053401947021484, 6.335129737854004, 7.616857528686523, 8.898585319519043, 10.180313110351562, 11.462041854858398, 12.743768692016602, 14.025497436523438, 15.307225227355957, 16.588953018188477, 17.870681762695312, 19.152408599853516, 20.43413734436035, 21.715864181518555, 22.99759292602539, 24.279319763183594, 25.56104850769043, 26.842777252197266, 28.1245059967041, 29.406232833862305, 30.68796157836914, 31.969688415527344, 33.25141525268555, 34.533145904541016, 35.81487274169922, 37.09659957885742]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 8.0, 12.0, 3.0, 11.0, 14.0, 8.0, 13.0, 27.0, 21.0, 17.0, 36.0, 33.0, 24.0, 44.0, 39.0, 31.0, 35.0, 49.0, 35.0, 37.0, 42.0, 38.0, 59.0, 41.0, 34.0, 33.0, 36.0, 33.0, 29.0, 37.0, 23.0, 15.0, 22.0, 6.0, 14.0, 12.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.86328125, -4.71881103515625, -4.5743408203125, -4.42987060546875, -4.285400390625, -4.14093017578125, -3.9964599609375, -3.85198974609375, -3.70751953125, -3.56304931640625, -3.4185791015625, -3.27410888671875, -3.129638671875, -2.98516845703125, -2.8406982421875, -2.69622802734375, -2.5517578125, -2.40728759765625, -2.2628173828125, -2.11834716796875, -1.973876953125, -1.82940673828125, -1.6849365234375, -1.54046630859375, -1.39599609375, -1.25152587890625, -1.1070556640625, -0.96258544921875, -0.818115234375, -0.67364501953125, -0.5291748046875, -0.38470458984375, -0.240234375, -0.09576416015625, 0.0487060546875, 0.19317626953125, 0.337646484375, 0.48211669921875, 0.6265869140625, 0.77105712890625, 0.91552734375, 1.05999755859375, 1.2044677734375, 1.34893798828125, 1.493408203125, 1.63787841796875, 1.7823486328125, 1.92681884765625, 2.0712890625, 2.21575927734375, 2.3602294921875, 2.50469970703125, 2.649169921875, 2.79364013671875, 2.9381103515625, 3.08258056640625, 3.22705078125, 3.37152099609375, 3.5159912109375, 3.66046142578125, 3.804931640625, 3.94940185546875, 4.0938720703125, 4.23834228515625, 4.3828125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 23.0, 26.0, 33.0, 26.0, 34.0, 70.0, 73.0, 114.0, 138.0, 289.0, 580.0, 1466.0, 4350.0, 19373.0, 130809.0, 1206985.0, 2391409.0, 380658.0, 45524.0, 8109.0, 2246.0, 830.0, 381.0, 202.0, 121.0, 105.0, 55.0, 47.0, 35.0, 31.0, 16.0, 19.0, 19.0, 8.0, 11.0, 4.0, 4.0, 5.0, 9.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-13.75, -13.348388671875, -12.94677734375, -12.545166015625, -12.1435546875, -11.741943359375, -11.34033203125, -10.938720703125, -10.537109375, -10.135498046875, -9.73388671875, -9.332275390625, -8.9306640625, -8.529052734375, -8.12744140625, -7.725830078125, -7.32421875, -6.922607421875, -6.52099609375, -6.119384765625, -5.7177734375, -5.316162109375, -4.91455078125, -4.512939453125, -4.111328125, -3.709716796875, -3.30810546875, -2.906494140625, -2.5048828125, -2.103271484375, -1.70166015625, -1.300048828125, -0.8984375, -0.496826171875, -0.09521484375, 0.306396484375, 0.7080078125, 1.109619140625, 1.51123046875, 1.912841796875, 2.314453125, 2.716064453125, 3.11767578125, 3.519287109375, 3.9208984375, 4.322509765625, 4.72412109375, 5.125732421875, 5.52734375, 5.928955078125, 6.33056640625, 6.732177734375, 7.1337890625, 7.535400390625, 7.93701171875, 8.338623046875, 8.740234375, 9.141845703125, 9.54345703125, 9.945068359375, 10.3466796875, 10.748291015625, 11.14990234375, 11.551513671875, 11.953125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 16.0, 12.0, 29.0, 42.0, 70.0, 114.0, 202.0, 319.0, 505.0, 703.0, 684.0, 509.0, 343.0, 225.0, 128.0, 84.0, 38.0, 13.0, 11.0, 11.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.382080078125, -18.79541015625, -18.208740234375, -17.6220703125, -17.035400390625, -16.44873046875, -15.862060546875, -15.275390625, -14.688720703125, -14.10205078125, -13.515380859375, -12.9287109375, -12.342041015625, -11.75537109375, -11.168701171875, -10.58203125, -9.995361328125, -9.40869140625, -8.822021484375, -8.2353515625, -7.648681640625, -7.06201171875, -6.475341796875, -5.888671875, -5.302001953125, -4.71533203125, -4.128662109375, -3.5419921875, -2.955322265625, -2.36865234375, -1.781982421875, -1.1953125, -0.608642578125, -0.02197265625, 0.564697265625, 1.1513671875, 1.738037109375, 2.32470703125, 2.911376953125, 3.498046875, 4.084716796875, 4.67138671875, 5.258056640625, 5.8447265625, 6.431396484375, 7.01806640625, 7.604736328125, 8.19140625, 8.778076171875, 9.36474609375, 9.951416015625, 10.5380859375, 11.124755859375, 11.71142578125, 12.298095703125, 12.884765625, 13.471435546875, 14.05810546875, 14.644775390625, 15.2314453125, 15.818115234375, 16.40478515625, 16.991455078125, 17.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 11.0, 15.0, 12.0, 46.0, 89.0, 211.0, 460.0, 1354.0, 20400.0, 2733113.0, 1426109.0, 10752.0, 989.0, 364.0, 156.0, 87.0, 46.0, 22.0, 13.0, 14.0, 11.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.4375, -42.9521484375, -41.466796875, -39.9814453125, -38.49609375, -37.0107421875, -35.525390625, -34.0400390625, -32.5546875, -31.0693359375, -29.583984375, -28.0986328125, -26.61328125, -25.1279296875, -23.642578125, -22.1572265625, -20.671875, -19.1865234375, -17.701171875, -16.2158203125, -14.73046875, -13.2451171875, -11.759765625, -10.2744140625, -8.7890625, -7.3037109375, -5.818359375, -4.3330078125, -2.84765625, -1.3623046875, 0.123046875, 1.6083984375, 3.09375, 4.5791015625, 6.064453125, 7.5498046875, 9.03515625, 10.5205078125, 12.005859375, 13.4912109375, 14.9765625, 16.4619140625, 17.947265625, 19.4326171875, 20.91796875, 22.4033203125, 23.888671875, 25.3740234375, 26.859375, 28.3447265625, 29.830078125, 31.3154296875, 32.80078125, 34.2861328125, 35.771484375, 37.2568359375, 38.7421875, 40.2275390625, 41.712890625, 43.1982421875, 44.68359375, 46.1689453125, 47.654296875, 49.1396484375, 50.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 21.0, 31.0, 50.0, 86.0, 123.0, 169.0, 158.0, 144.0, 96.0, 57.0, 39.0, 14.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-80.74664306640625, -78.06417846679688, -75.3817138671875, -72.69924926757812, -70.01678466796875, -67.33431243896484, -64.65184783935547, -61.969383239746094, -59.28691864013672, -56.604454040527344, -53.92198944091797, -51.23952102661133, -48.55705642700195, -45.87459182739258, -43.19212341308594, -40.50965881347656, -37.82719421386719, -35.14472961425781, -32.46226501464844, -29.779796600341797, -27.097332000732422, -24.414867401123047, -21.73240089416504, -19.04993438720703, -16.367469787597656, -13.685004234313965, -11.002538681030273, -8.320073127746582, -5.637607574462891, -2.955142021179199, -0.2726764678955078, 2.4097900390625, 5.092254638671875, 7.774720191955566, 10.457185745239258, 13.13965129852295, 15.82211685180664, 18.504581451416016, 21.187047958374023, 23.86951446533203, 26.551979064941406, 29.23444366455078, 31.91691017150879, 34.5993766784668, 37.28184127807617, 39.96430587768555, 42.64677429199219, 45.32923889160156, 48.01170349121094, 50.69416809082031, 53.37663269042969, 56.05910110473633, 58.7415657043457, 61.42403030395508, 64.10649871826172, 66.7889633178711, 69.47142791748047, 72.15389251708984, 74.83635711669922, 77.5188217163086, 80.2012939453125, 82.88375854492188, 85.56622314453125, 88.24868774414062, 90.93115234375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 4.0, 5.0, 8.0, 4.0, 13.0, 12.0, 15.0, 11.0, 23.0, 19.0, 33.0, 25.0, 30.0, 31.0, 30.0, 36.0, 33.0, 45.0, 39.0, 46.0, 47.0, 37.0, 39.0, 44.0, 42.0, 29.0, 35.0, 25.0, 28.0, 25.0, 25.0, 11.0, 24.0, 19.0, 12.0, 22.0, 13.0, 13.0, 13.0, 8.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.131439208984375, -32.96098327636719, -31.790529251098633, -30.620073318481445, -29.44961929321289, -28.279163360595703, -27.108707427978516, -25.938251495361328, -24.767797470092773, -23.597341537475586, -22.42688751220703, -21.256431579589844, -20.085975646972656, -18.9155216217041, -17.745065689086914, -16.57461166381836, -15.404155731201172, -14.2337007522583, -13.06324577331543, -11.892789840698242, -10.722334861755371, -9.5518798828125, -8.381423950195312, -7.210968971252441, -6.04051399230957, -4.870059013366699, -3.69960355758667, -2.5291483402252197, -1.3586931228637695, -0.18823814392089844, 0.9822173118591309, 2.15267276763916, 3.3231239318847656, 4.493578910827637, 5.664034366607666, 6.834489822387695, 8.004944801330566, 9.175399780273438, 10.345855712890625, 11.516310691833496, 12.686765670776367, 13.857220649719238, 15.02767562866211, 16.198131561279297, 17.368587493896484, 18.53904151916504, 19.709497451782227, 20.87995147705078, 22.05040740966797, 23.220863342285156, 24.39131736755371, 25.5617733001709, 26.732227325439453, 27.90268325805664, 29.073139190673828, 30.243595123291016, 31.41404914855957, 32.584503173828125, 33.75495910644531, 34.9254150390625, 36.09587097167969, 37.266326904296875, 38.4367790222168, 39.607234954833984, 40.77769088745117]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 0.0, 2.0, 6.0, 4.0, 11.0, 6.0, 10.0, 8.0, 13.0, 20.0, 11.0, 29.0, 30.0, 27.0, 23.0, 26.0, 41.0, 40.0, 40.0, 36.0, 34.0, 39.0, 45.0, 40.0, 44.0, 53.0, 33.0, 40.0, 32.0, 34.0, 34.0, 30.0, 22.0, 26.0, 34.0, 12.0, 9.0, 13.0, 9.0, 10.0, 9.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.29296875, -4.14837646484375, -4.0037841796875, -3.85919189453125, -3.714599609375, -3.57000732421875, -3.4254150390625, -3.28082275390625, -3.13623046875, -2.99163818359375, -2.8470458984375, -2.70245361328125, -2.557861328125, -2.41326904296875, -2.2686767578125, -2.12408447265625, -1.9794921875, -1.83489990234375, -1.6903076171875, -1.54571533203125, -1.401123046875, -1.25653076171875, -1.1119384765625, -0.96734619140625, -0.82275390625, -0.67816162109375, -0.5335693359375, -0.38897705078125, -0.244384765625, -0.09979248046875, 0.0447998046875, 0.18939208984375, 0.333984375, 0.47857666015625, 0.6231689453125, 0.76776123046875, 0.912353515625, 1.05694580078125, 1.2015380859375, 1.34613037109375, 1.49072265625, 1.63531494140625, 1.7799072265625, 1.92449951171875, 2.069091796875, 2.21368408203125, 2.3582763671875, 2.50286865234375, 2.6474609375, 2.79205322265625, 2.9366455078125, 3.08123779296875, 3.225830078125, 3.37042236328125, 3.5150146484375, 3.65960693359375, 3.80419921875, 3.94879150390625, 4.0933837890625, 4.23797607421875, 4.382568359375, 4.52716064453125, 4.6717529296875, 4.81634521484375, 4.9609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [8.0, 1.0, 4.0, 10.0, 17.0, 22.0, 24.0, 35.0, 62.0, 95.0, 155.0, 179.0, 323.0, 461.0, 638.0, 994.0, 1521.0, 2240.0, 3452.0, 5228.0, 7827.0, 11802.0, 18237.0, 27811.0, 41175.0, 59752.0, 82464.0, 107606.0, 126910.0, 130472.0, 115606.0, 92711.0, 68319.0, 47441.0, 32324.0, 21342.0, 14095.0, 9296.0, 6035.0, 3909.0, 2720.0, 1686.0, 1151.0, 786.0, 513.0, 382.0, 250.0, 164.0, 117.0, 68.0, 46.0, 36.0, 19.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8502120971679688, -0.8200531005859375, -0.7898941040039062, -0.759735107421875, -0.7295761108398438, -0.6994171142578125, -0.6692581176757812, -0.63909912109375, -0.6089401245117188, -0.5787811279296875, -0.5486221313476562, -0.518463134765625, -0.48830413818359375, -0.4581451416015625, -0.42798614501953125, -0.3978271484375, -0.36766815185546875, -0.3375091552734375, -0.30735015869140625, -0.277191162109375, -0.24703216552734375, -0.2168731689453125, -0.18671417236328125, -0.15655517578125, -0.12639617919921875, -0.0962371826171875, -0.06607818603515625, -0.035919189453125, -0.00576019287109375, 0.0243988037109375, 0.05455780029296875, 0.084716796875, 0.11487579345703125, 0.1450347900390625, 0.17519378662109375, 0.205352783203125, 0.23551177978515625, 0.2656707763671875, 0.29582977294921875, 0.32598876953125, 0.35614776611328125, 0.3863067626953125, 0.41646575927734375, 0.446624755859375, 0.47678375244140625, 0.5069427490234375, 0.5371017456054688, 0.5672607421875, 0.5974197387695312, 0.6275787353515625, 0.6577377319335938, 0.687896728515625, 0.7180557250976562, 0.7482147216796875, 0.7783737182617188, 0.80853271484375, 0.8386917114257812, 0.8688507080078125, 0.8990097045898438, 0.929168701171875, 0.9593276977539062, 0.9894866943359375, 1.0196456909179688, 1.0498046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 8.0, 6.0, 8.0, 10.0, 10.0, 20.0, 22.0, 19.0, 20.0, 13.0, 24.0, 28.0, 21.0, 21.0, 37.0, 30.0, 35.0, 31.0, 33.0, 38.0, 36.0, 1053.0, 47.0, 31.0, 39.0, 44.0, 29.0, 36.0, 31.0, 28.0, 25.0, 22.0, 23.0, 17.0, 15.0, 14.0, 13.0, 26.0, 7.0, 6.0, 5.0, 8.0, 5.0, 11.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-3.765625, -3.64886474609375, -3.5321044921875, -3.41534423828125, -3.298583984375, -3.18182373046875, -3.0650634765625, -2.94830322265625, -2.83154296875, -2.71478271484375, -2.5980224609375, -2.48126220703125, -2.364501953125, -2.24774169921875, -2.1309814453125, -2.01422119140625, -1.8974609375, -1.78070068359375, -1.6639404296875, -1.54718017578125, -1.430419921875, -1.31365966796875, -1.1968994140625, -1.08013916015625, -0.96337890625, -0.84661865234375, -0.7298583984375, -0.61309814453125, -0.496337890625, -0.37957763671875, -0.2628173828125, -0.14605712890625, -0.029296875, 0.08746337890625, 0.2042236328125, 0.32098388671875, 0.437744140625, 0.55450439453125, 0.6712646484375, 0.78802490234375, 0.90478515625, 1.02154541015625, 1.1383056640625, 1.25506591796875, 1.371826171875, 1.48858642578125, 1.6053466796875, 1.72210693359375, 1.8388671875, 1.95562744140625, 2.0723876953125, 2.18914794921875, 2.305908203125, 2.42266845703125, 2.5394287109375, 2.65618896484375, 2.77294921875, 2.88970947265625, 3.0064697265625, 3.12322998046875, 3.239990234375, 3.35675048828125, 3.4735107421875, 3.59027099609375, 3.70703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 3.0, 12.0, 27.0, 27.0, 39.0, 65.0, 89.0, 127.0, 192.0, 267.0, 408.0, 539.0, 818.0, 1256.0, 1786.0, 2798.0, 4186.0, 6516.0, 10052.0, 15838.0, 25254.0, 39168.0, 60779.0, 91142.0, 138005.0, 797855.0, 524362.0, 128422.0, 86751.0, 57371.0, 36954.0, 23464.0, 15117.0, 9513.0, 6085.0, 3936.0, 2662.0, 1766.0, 1119.0, 771.0, 488.0, 361.0, 227.0, 152.0, 92.0, 83.0, 57.0, 33.0, 36.0, 23.0, 10.0, 7.0, 11.0, 3.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.47021484375, -0.4554862976074219, -0.44075775146484375, -0.4260292053222656, -0.4113006591796875, -0.3965721130371094, -0.38184356689453125, -0.3671150207519531, -0.352386474609375, -0.3376579284667969, -0.32292938232421875, -0.3082008361816406, -0.2934722900390625, -0.2787437438964844, -0.26401519775390625, -0.24928665161132812, -0.23455810546875, -0.21982955932617188, -0.20510101318359375, -0.19037246704101562, -0.1756439208984375, -0.16091537475585938, -0.14618682861328125, -0.13145828247070312, -0.116729736328125, -0.10200119018554688, -0.08727264404296875, -0.07254409790039062, -0.0578155517578125, -0.043087005615234375, -0.02835845947265625, -0.013629913330078125, 0.0010986328125, 0.015827178955078125, 0.03055572509765625, 0.045284271240234375, 0.0600128173828125, 0.07474136352539062, 0.08946990966796875, 0.10419845581054688, 0.118927001953125, 0.13365554809570312, 0.14838409423828125, 0.16311264038085938, 0.1778411865234375, 0.19256973266601562, 0.20729827880859375, 0.22202682495117188, 0.23675537109375, 0.2514839172363281, 0.26621246337890625, 0.2809410095214844, 0.2956695556640625, 0.3103981018066406, 0.32512664794921875, 0.3398551940917969, 0.354583740234375, 0.3693122863769531, 0.38404083251953125, 0.3987693786621094, 0.4134979248046875, 0.4282264709472656, 0.44295501708984375, 0.4576835632324219, 0.472412109375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 4.0, 8.0, 5.0, 7.0, 13.0, 8.0, 9.0, 21.0, 22.0, 25.0, 28.0, 36.0, 57.0, 60.0, 66.0, 84.0, 102.0, 84.0, 55.0, 58.0, 46.0, 36.0, 28.0, 19.0, 11.0, 17.0, 14.0, 13.0, 8.0, 12.0, 4.0, 5.0, 5.0, 5.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1370849609375, -0.13328933715820312, -0.12949371337890625, -0.12569808959960938, -0.1219024658203125, -0.11810684204101562, -0.11431121826171875, -0.11051559448242188, -0.106719970703125, -0.10292434692382812, -0.09912872314453125, -0.09533309936523438, -0.0915374755859375, -0.08774185180664062, -0.08394622802734375, -0.08015060424804688, -0.07635498046875, -0.07255935668945312, -0.06876373291015625, -0.06496810913085938, -0.0611724853515625, -0.057376861572265625, -0.05358123779296875, -0.049785614013671875, -0.045989990234375, -0.042194366455078125, -0.03839874267578125, -0.034603118896484375, -0.0308074951171875, -0.027011871337890625, -0.02321624755859375, -0.019420623779296875, -0.015625, -0.011829376220703125, -0.00803375244140625, -0.004238128662109375, -0.0004425048828125, 0.003353118896484375, 0.00714874267578125, 0.010944366455078125, 0.014739990234375, 0.018535614013671875, 0.02233123779296875, 0.026126861572265625, 0.0299224853515625, 0.033718109130859375, 0.03751373291015625, 0.041309356689453125, 0.04510498046875, 0.048900604248046875, 0.05269622802734375, 0.056491851806640625, 0.0602874755859375, 0.06408309936523438, 0.06787872314453125, 0.07167434692382812, 0.075469970703125, 0.07926559448242188, 0.08306121826171875, 0.08685684204101562, 0.0906524658203125, 0.09444808959960938, 0.09824371337890625, 0.10203933715820312, 0.1058349609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 9.0, 11.0, 13.0, 15.0, 22.0, 33.0, 34.0, 41.0, 65.0, 77.0, 132.0, 206.0, 415.0, 1364.0, 7201.0, 452863.0, 575812.0, 7739.0, 1390.0, 418.0, 209.0, 148.0, 87.0, 66.0, 43.0, 29.0, 17.0, 16.0, 22.0, 8.0, 5.0, 9.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9013671875, -1.8335113525390625, -1.765655517578125, -1.6977996826171875, -1.62994384765625, -1.5620880126953125, -1.494232177734375, -1.4263763427734375, -1.3585205078125, -1.2906646728515625, -1.222808837890625, -1.1549530029296875, -1.08709716796875, -1.0192413330078125, -0.951385498046875, -0.8835296630859375, -0.815673828125, -0.7478179931640625, -0.679962158203125, -0.6121063232421875, -0.54425048828125, -0.4763946533203125, -0.408538818359375, -0.3406829833984375, -0.2728271484375, -0.2049713134765625, -0.137115478515625, -0.0692596435546875, -0.00140380859375, 0.0664520263671875, 0.134307861328125, 0.2021636962890625, 0.27001953125, 0.3378753662109375, 0.405731201171875, 0.4735870361328125, 0.54144287109375, 0.6092987060546875, 0.677154541015625, 0.7450103759765625, 0.8128662109375, 0.8807220458984375, 0.948577880859375, 1.0164337158203125, 1.08428955078125, 1.1521453857421875, 1.220001220703125, 1.2878570556640625, 1.355712890625, 1.4235687255859375, 1.491424560546875, 1.5592803955078125, 1.62713623046875, 1.6949920654296875, 1.762847900390625, 1.8307037353515625, 1.8985595703125, 1.9664154052734375, 2.034271240234375, 2.1021270751953125, 2.16998291015625, 2.2378387451171875, 2.305694580078125, 2.3735504150390625, 2.44140625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 16.0, 66.0, 260.0, 493.0, 126.0, 37.0, 5.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3489272594451904, -1.2908926010131836, -1.2328580617904663, -1.1748234033584595, -1.1167887449264526, -1.0587542057037354, -1.0007195472717285, -0.9426849484443665, -0.8846503496170044, -0.8266157507896423, -0.7685810923576355, -0.7105464935302734, -0.6525118947029114, -0.5944772958755493, -0.5364426374435425, -0.4784080386161804, -0.4203733801841736, -0.36233875155448914, -0.3043041527271271, -0.24626952409744263, -0.18823491036891937, -0.13020029664039612, -0.07216566801071167, -0.01413106918334961, 0.04390355944633484, 0.1019381731748581, 0.15997278690338135, 0.2180074155330658, 0.27604204416275024, 0.3340766429901123, 0.39211127161979675, 0.4501458704471588, 0.5081804990768433, 0.5662150979042053, 0.6242497563362122, 0.6822843551635742, 0.7403189539909363, 0.7983535528182983, 0.8563882112503052, 0.9144228100776672, 0.9724574089050293, 1.0304920673370361, 1.0885266065597534, 1.1465612649917603, 1.204595923423767, 1.2626304626464844, 1.3206651210784912, 1.378699779510498, 1.4367344379425049, 1.4947690963745117, 1.552803635597229, 1.6108382940292358, 1.6688729524612427, 1.72690749168396, 1.7849421501159668, 1.8429768085479736, 1.901011347770691, 1.9590460062026978, 2.017080545425415, 2.075115203857422, 2.1331498622894287, 2.1911845207214355, 2.2492189407348633, 2.30725359916687, 2.365288257598877]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 5.0, 4.0, 10.0, 10.0, 9.0, 17.0, 18.0, 24.0, 15.0, 20.0, 23.0, 32.0, 38.0, 33.0, 43.0, 42.0, 43.0, 42.0, 28.0, 47.0, 40.0, 49.0, 39.0, 39.0, 45.0, 25.0, 38.0, 33.0, 24.0, 22.0, 20.0, 22.0, 14.0, 14.0, 6.0, 11.0, 9.0, 5.0, 6.0, 9.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3284599184989929, -0.3179497718811035, -0.3074395954608917, -0.2969294488430023, -0.2864192724227905, -0.2759091258049011, -0.2653989791870117, -0.2548888027667999, -0.24437865614891052, -0.23386849462985992, -0.22335833311080933, -0.21284818649291992, -0.20233802497386932, -0.19182786345481873, -0.18131770193576813, -0.17080754041671753, -0.16029737889766693, -0.14978721737861633, -0.13927705585956573, -0.12876689434051514, -0.11825674772262573, -0.10774658620357513, -0.09723642468452454, -0.08672627061605453, -0.07621610909700394, -0.06570594757795334, -0.05519579350948334, -0.04468563199043274, -0.03417547419667244, -0.02366531640291214, -0.013155154883861542, -0.0026450008153915405, 0.007865160703659058, 0.018375318497419357, 0.028885478153824806, 0.039395637810230255, 0.049905795603990555, 0.060415953397750854, 0.07092611491680145, 0.08143626898527145, 0.09194643050432205, 0.10245659202337265, 0.11296674609184265, 0.12347690761089325, 0.13398706912994385, 0.14449721574783325, 0.15500739216804504, 0.16551753878593445, 0.17602770030498505, 0.18653786182403564, 0.19704802334308624, 0.20755818486213684, 0.21806833148002625, 0.22857849299907684, 0.23908865451812744, 0.24959880113601685, 0.26010897755622864, 0.27061912417411804, 0.28112930059432983, 0.29163944721221924, 0.30214962363243103, 0.31265977025032043, 0.3231699466705322, 0.33368009328842163, 0.34419023990631104]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 9.0, 6.0, 19.0, 13.0, 23.0, 17.0, 22.0, 34.0, 26.0, 32.0, 34.0, 22.0, 35.0, 45.0, 45.0, 40.0, 43.0, 40.0, 36.0, 50.0, 42.0, 33.0, 42.0, 38.0, 40.0, 25.0, 23.0, 20.0, 19.0, 20.0, 16.0, 15.0, 14.0, 7.0, 12.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.7421875, -4.59967041015625, -4.4571533203125, -4.31463623046875, -4.172119140625, -4.02960205078125, -3.8870849609375, -3.74456787109375, -3.60205078125, -3.45953369140625, -3.3170166015625, -3.17449951171875, -3.031982421875, -2.88946533203125, -2.7469482421875, -2.60443115234375, -2.4619140625, -2.31939697265625, -2.1768798828125, -2.03436279296875, -1.891845703125, -1.74932861328125, -1.6068115234375, -1.46429443359375, -1.32177734375, -1.17926025390625, -1.0367431640625, -0.89422607421875, -0.751708984375, -0.60919189453125, -0.4666748046875, -0.32415771484375, -0.181640625, -0.03912353515625, 0.1033935546875, 0.24591064453125, 0.388427734375, 0.53094482421875, 0.6734619140625, 0.81597900390625, 0.95849609375, 1.10101318359375, 1.2435302734375, 1.38604736328125, 1.528564453125, 1.67108154296875, 1.8135986328125, 1.95611572265625, 2.0986328125, 2.24114990234375, 2.3836669921875, 2.52618408203125, 2.668701171875, 2.81121826171875, 2.9537353515625, 3.09625244140625, 3.23876953125, 3.38128662109375, 3.5238037109375, 3.66632080078125, 3.808837890625, 3.95135498046875, 4.0938720703125, 4.23638916015625, 4.37890625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 16.0, 25.0, 33.0, 52.0, 99.0, 153.0, 267.0, 470.0, 879.0, 1565.0, 2864.0, 5132.0, 9315.0, 16885.0, 30769.0, 61516.0, 159216.0, 369121.0, 227122.0, 79718.0, 37670.0, 20445.0, 11272.0, 6288.0, 3453.0, 1862.0, 1014.0, 539.0, 314.0, 180.0, 109.0, 70.0, 47.0, 27.0, 15.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.08416748046875, -4.9183349609375, -4.75250244140625, -4.586669921875, -4.42083740234375, -4.2550048828125, -4.08917236328125, -3.92333984375, -3.75750732421875, -3.5916748046875, -3.42584228515625, -3.260009765625, -3.09417724609375, -2.9283447265625, -2.76251220703125, -2.5966796875, -2.43084716796875, -2.2650146484375, -2.09918212890625, -1.933349609375, -1.76751708984375, -1.6016845703125, -1.43585205078125, -1.27001953125, -1.10418701171875, -0.9383544921875, -0.77252197265625, -0.606689453125, -0.44085693359375, -0.2750244140625, -0.10919189453125, 0.056640625, 0.22247314453125, 0.3883056640625, 0.55413818359375, 0.719970703125, 0.88580322265625, 1.0516357421875, 1.21746826171875, 1.38330078125, 1.54913330078125, 1.7149658203125, 1.88079833984375, 2.046630859375, 2.21246337890625, 2.3782958984375, 2.54412841796875, 2.7099609375, 2.87579345703125, 3.0416259765625, 3.20745849609375, 3.373291015625, 3.53912353515625, 3.7049560546875, 3.87078857421875, 4.03662109375, 4.20245361328125, 4.3682861328125, 4.53411865234375, 4.699951171875, 4.86578369140625, 5.0316162109375, 5.19744873046875, 5.36328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 7.0, 7.0, 7.0, 7.0, 12.0, 19.0, 26.0, 19.0, 15.0, 33.0, 32.0, 39.0, 36.0, 42.0, 67.0, 87.0, 115.0, 292.0, 1447.0, 233.0, 115.0, 66.0, 56.0, 43.0, 36.0, 29.0, 31.0, 31.0, 20.0, 13.0, 15.0, 15.0, 12.0, 13.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.1669921875, -18.537109375, -17.9072265625, -17.27734375, -16.6474609375, -16.017578125, -15.3876953125, -14.7578125, -14.1279296875, -13.498046875, -12.8681640625, -12.23828125, -11.6083984375, -10.978515625, -10.3486328125, -9.71875, -9.0888671875, -8.458984375, -7.8291015625, -7.19921875, -6.5693359375, -5.939453125, -5.3095703125, -4.6796875, -4.0498046875, -3.419921875, -2.7900390625, -2.16015625, -1.5302734375, -0.900390625, -0.2705078125, 0.359375, 0.9892578125, 1.619140625, 2.2490234375, 2.87890625, 3.5087890625, 4.138671875, 4.7685546875, 5.3984375, 6.0283203125, 6.658203125, 7.2880859375, 7.91796875, 8.5478515625, 9.177734375, 9.8076171875, 10.4375, 11.0673828125, 11.697265625, 12.3271484375, 12.95703125, 13.5869140625, 14.216796875, 14.8466796875, 15.4765625, 16.1064453125, 16.736328125, 17.3662109375, 17.99609375, 18.6259765625, 19.255859375, 19.8857421875, 20.515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 10.0, 10.0, 13.0, 12.0, 34.0, 37.0, 50.0, 56.0, 90.0, 128.0, 199.0, 394.0, 900.0, 5861.0, 481242.0, 2639342.0, 14676.0, 1398.0, 440.0, 255.0, 150.0, 99.0, 68.0, 57.0, 51.0, 26.0, 20.0, 11.0, 14.0, 18.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-50.875, -49.46728515625, -48.0595703125, -46.65185546875, -45.244140625, -43.83642578125, -42.4287109375, -41.02099609375, -39.61328125, -38.20556640625, -36.7978515625, -35.39013671875, -33.982421875, -32.57470703125, -31.1669921875, -29.75927734375, -28.3515625, -26.94384765625, -25.5361328125, -24.12841796875, -22.720703125, -21.31298828125, -19.9052734375, -18.49755859375, -17.08984375, -15.68212890625, -14.2744140625, -12.86669921875, -11.458984375, -10.05126953125, -8.6435546875, -7.23583984375, -5.828125, -4.42041015625, -3.0126953125, -1.60498046875, -0.197265625, 1.21044921875, 2.6181640625, 4.02587890625, 5.43359375, 6.84130859375, 8.2490234375, 9.65673828125, 11.064453125, 12.47216796875, 13.8798828125, 15.28759765625, 16.6953125, 18.10302734375, 19.5107421875, 20.91845703125, 22.326171875, 23.73388671875, 25.1416015625, 26.54931640625, 27.95703125, 29.36474609375, 30.7724609375, 32.18017578125, 33.587890625, 34.99560546875, 36.4033203125, 37.81103515625, 39.21875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 14.0, 473.0, 501.0, 27.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.107120513916016, -32.2010612487793, -24.29500389099121, -16.388946533203125, -8.482887268066406, -0.5768280029296875, 7.329227447509766, 15.235286712646484, 23.141345977783203, 31.047405242919922, 38.953460693359375, 46.859519958496094, 54.76557922363281, 62.67163848876953, 70.57769775390625, 78.48374938964844, 86.38981628417969, 94.2958755493164, 102.20193481445312, 110.10798645019531, 118.01405334472656, 125.92010498046875, 133.826171875, 141.7322235107422, 149.63827514648438, 157.54432678222656, 165.4503936767578, 173.3564453125, 181.26251220703125, 189.16856384277344, 197.07461547851562, 204.98068237304688, 212.88674926757812, 220.7928009033203, 228.69886779785156, 236.60491943359375, 244.510986328125, 252.4170379638672, 260.3230895996094, 268.2291564941406, 276.1352233886719, 284.0412902832031, 291.94732666015625, 299.8533935546875, 307.75946044921875, 315.66552734375, 323.5715637207031, 331.4776306152344, 339.3836669921875, 347.28973388671875, 355.1957702636719, 363.1018371582031, 371.0079040527344, 378.9139709472656, 386.82000732421875, 394.72607421875, 402.63214111328125, 410.5382080078125, 418.4442443847656, 426.3503112792969, 434.2563781738281, 442.1624450683594, 450.0684814453125, 457.97454833984375, 465.880615234375]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 4.0, 4.0, 5.0, 12.0, 13.0, 10.0, 13.0, 16.0, 14.0, 16.0, 19.0, 27.0, 29.0, 24.0, 35.0, 29.0, 39.0, 31.0, 30.0, 38.0, 36.0, 43.0, 38.0, 50.0, 34.0, 44.0, 40.0, 28.0, 39.0, 29.0, 28.0, 23.0, 19.0, 18.0, 24.0, 14.0, 15.0, 13.0, 6.0, 13.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.1356201171875, -46.62645721435547, -45.11729431152344, -43.608131408691406, -42.098968505859375, -40.589805603027344, -39.08064270019531, -37.57147979736328, -36.06231689453125, -34.55315399169922, -33.04399108886719, -31.534828186035156, -30.025665283203125, -28.516502380371094, -27.007339477539062, -25.49817657470703, -23.989015579223633, -22.4798526763916, -20.97068977355957, -19.46152687072754, -17.952363967895508, -16.443201065063477, -14.934039115905762, -13.42487621307373, -11.9157133102417, -10.406550407409668, -8.897387504577637, -7.388225078582764, -5.879062175750732, -4.369899272918701, -2.860736846923828, -1.3515739440917969, 0.15758895874023438, 1.666751742362976, 3.1759145259857178, 4.68507719039917, 6.194240093231201, 7.703402996063232, 9.212565422058105, 10.721728324890137, 12.230891227722168, 13.7400541305542, 15.24921703338623, 16.758378982543945, 18.267541885375977, 19.776704788208008, 21.28586769104004, 22.79503059387207, 24.3041934967041, 25.813356399536133, 27.322519302368164, 28.831682205200195, 30.340845108032227, 31.850008010864258, 33.359169006347656, 34.86833190917969, 36.37749481201172, 37.88665771484375, 39.39582061767578, 40.90498352050781, 42.414146423339844, 43.923309326171875, 45.432472229003906, 46.94163513183594, 48.45079803466797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 15.0, 6.0, 10.0, 16.0, 24.0, 17.0, 18.0, 31.0, 33.0, 33.0, 37.0, 41.0, 35.0, 40.0, 42.0, 46.0, 50.0, 50.0, 32.0, 45.0, 40.0, 49.0, 42.0, 33.0, 30.0, 23.0, 29.0, 19.0, 22.0, 16.0, 15.0, 9.0, 11.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80078125, -4.62811279296875, -4.4554443359375, -4.28277587890625, -4.110107421875, -3.93743896484375, -3.7647705078125, -3.59210205078125, -3.41943359375, -3.24676513671875, -3.0740966796875, -2.90142822265625, -2.728759765625, -2.55609130859375, -2.3834228515625, -2.21075439453125, -2.0380859375, -1.86541748046875, -1.6927490234375, -1.52008056640625, -1.347412109375, -1.17474365234375, -1.0020751953125, -0.82940673828125, -0.65673828125, -0.48406982421875, -0.3114013671875, -0.13873291015625, 0.033935546875, 0.20660400390625, 0.3792724609375, 0.55194091796875, 0.724609375, 0.89727783203125, 1.0699462890625, 1.24261474609375, 1.415283203125, 1.58795166015625, 1.7606201171875, 1.93328857421875, 2.10595703125, 2.27862548828125, 2.4512939453125, 2.62396240234375, 2.796630859375, 2.96929931640625, 3.1419677734375, 3.31463623046875, 3.4873046875, 3.65997314453125, 3.8326416015625, 4.00531005859375, 4.177978515625, 4.35064697265625, 4.5233154296875, 4.69598388671875, 4.86865234375, 5.04132080078125, 5.2139892578125, 5.38665771484375, 5.559326171875, 5.73199462890625, 5.9046630859375, 6.07733154296875, 6.25]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 12.0, 12.0, 17.0, 28.0, 24.0, 37.0, 44.0, 83.0, 136.0, 213.0, 359.0, 666.0, 1296.0, 2653.0, 6282.0, 17610.0, 57391.0, 214261.0, 795820.0, 1709934.0, 998855.0, 279962.0, 73119.0, 21694.0, 7502.0, 3035.0, 1393.0, 787.0, 404.0, 223.0, 133.0, 93.0, 63.0, 29.0, 22.0, 24.0, 19.0, 16.0, 11.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5859375, -7.3380126953125, -7.090087890625, -6.8421630859375, -6.59423828125, -6.3463134765625, -6.098388671875, -5.8504638671875, -5.6025390625, -5.3546142578125, -5.106689453125, -4.8587646484375, -4.61083984375, -4.3629150390625, -4.114990234375, -3.8670654296875, -3.619140625, -3.3712158203125, -3.123291015625, -2.8753662109375, -2.62744140625, -2.3795166015625, -2.131591796875, -1.8836669921875, -1.6357421875, -1.3878173828125, -1.139892578125, -0.8919677734375, -0.64404296875, -0.3961181640625, -0.148193359375, 0.0997314453125, 0.34765625, 0.5955810546875, 0.843505859375, 1.0914306640625, 1.33935546875, 1.5872802734375, 1.835205078125, 2.0831298828125, 2.3310546875, 2.5789794921875, 2.826904296875, 3.0748291015625, 3.32275390625, 3.5706787109375, 3.818603515625, 4.0665283203125, 4.314453125, 4.5623779296875, 4.810302734375, 5.0582275390625, 5.30615234375, 5.5540771484375, 5.802001953125, 6.0499267578125, 6.2978515625, 6.5457763671875, 6.793701171875, 7.0416259765625, 7.28955078125, 7.5374755859375, 7.785400390625, 8.0333251953125, 8.28125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 9.0, 22.0, 28.0, 47.0, 88.0, 133.0, 209.0, 361.0, 509.0, 627.0, 723.0, 508.0, 303.0, 186.0, 122.0, 65.0, 43.0, 40.0, 17.0, 14.0, 11.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3515625, -13.7537841796875, -13.156005859375, -12.5582275390625, -11.96044921875, -11.3626708984375, -10.764892578125, -10.1671142578125, -9.5693359375, -8.9715576171875, -8.373779296875, -7.7760009765625, -7.17822265625, -6.5804443359375, -5.982666015625, -5.3848876953125, -4.787109375, -4.1893310546875, -3.591552734375, -2.9937744140625, -2.39599609375, -1.7982177734375, -1.200439453125, -0.6026611328125, -0.0048828125, 0.5928955078125, 1.190673828125, 1.7884521484375, 2.38623046875, 2.9840087890625, 3.581787109375, 4.1795654296875, 4.77734375, 5.3751220703125, 5.972900390625, 6.5706787109375, 7.16845703125, 7.7662353515625, 8.364013671875, 8.9617919921875, 9.5595703125, 10.1573486328125, 10.755126953125, 11.3529052734375, 11.95068359375, 12.5484619140625, 13.146240234375, 13.7440185546875, 14.341796875, 14.9395751953125, 15.537353515625, 16.1351318359375, 16.73291015625, 17.3306884765625, 17.928466796875, 18.5262451171875, 19.1240234375, 19.7218017578125, 20.319580078125, 20.9173583984375, 21.51513671875, 22.1129150390625, 22.710693359375, 23.3084716796875, 23.90625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 18.0, 12.0, 27.0, 46.0, 92.0, 135.0, 300.0, 742.0, 4541.0, 108494.0, 3076572.0, 977041.0, 23417.0, 1822.0, 524.0, 221.0, 133.0, 61.0, 40.0, 20.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -42.037109375, -40.98046875, -39.923828125, -38.8671875, -37.810546875, -36.75390625, -35.697265625, -34.640625, -33.583984375, -32.52734375, -31.470703125, -30.4140625, -29.357421875, -28.30078125, -27.244140625, -26.1875, -25.130859375, -24.07421875, -23.017578125, -21.9609375, -20.904296875, -19.84765625, -18.791015625, -17.734375, -16.677734375, -15.62109375, -14.564453125, -13.5078125, -12.451171875, -11.39453125, -10.337890625, -9.28125, -8.224609375, -7.16796875, -6.111328125, -5.0546875, -3.998046875, -2.94140625, -1.884765625, -0.828125, 0.228515625, 1.28515625, 2.341796875, 3.3984375, 4.455078125, 5.51171875, 6.568359375, 7.625, 8.681640625, 9.73828125, 10.794921875, 11.8515625, 12.908203125, 13.96484375, 15.021484375, 16.078125, 17.134765625, 18.19140625, 19.248046875, 20.3046875, 21.361328125, 22.41796875, 23.474609375, 24.53125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 41.0, 119.0, 252.0, 286.0, 197.0, 86.0, 24.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.16169738769531, -107.87973022460938, -102.59776306152344, -97.3157958984375, -92.03382873535156, -86.75186157226562, -81.46989440917969, -76.18792724609375, -70.90596008300781, -65.62399291992188, -60.34202575683594, -55.06005859375, -49.77809143066406, -44.496124267578125, -39.21415710449219, -33.93218994140625, -28.650222778320312, -23.368255615234375, -18.086288452148438, -12.8043212890625, -7.5223541259765625, -2.240386962890625, 3.0415802001953125, 8.32354736328125, 13.605514526367188, 18.887481689453125, 24.169448852539062, 29.451416015625, 34.73338317871094, 40.015350341796875, 45.29731750488281, 50.57928466796875, 55.861236572265625, 61.14320373535156, 66.4251708984375, 71.70713806152344, 76.98910522460938, 82.27107238769531, 87.55303955078125, 92.83500671386719, 98.11697387695312, 103.39894104003906, 108.680908203125, 113.96287536621094, 119.24484252929688, 124.52680969238281, 129.80877685546875, 135.0907440185547, 140.37271118164062, 145.65467834472656, 150.9366455078125, 156.21861267089844, 161.50057983398438, 166.7825469970703, 172.06451416015625, 177.3464813232422, 182.62844848632812, 187.91041564941406, 193.1923828125, 198.47434997558594, 203.75631713867188, 209.0382843017578, 214.32025146484375, 219.6022186279297, 224.88418579101562]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 2.0, 11.0, 17.0, 19.0, 15.0, 19.0, 31.0, 33.0, 34.0, 26.0, 39.0, 53.0, 45.0, 48.0, 44.0, 47.0, 46.0, 43.0, 44.0, 40.0, 48.0, 45.0, 37.0, 28.0, 32.0, 27.0, 15.0, 29.0, 13.0, 15.0, 11.0, 11.0, 7.0, 8.0, 2.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-52.55269241333008, -51.11041259765625, -49.668128967285156, -48.22584915161133, -46.7835693359375, -45.341285705566406, -43.89900588989258, -42.45672607421875, -41.014442443847656, -39.57216262817383, -38.129878997802734, -36.687599182128906, -35.24531936645508, -33.803035736083984, -32.360755920410156, -30.918474197387695, -29.476194381713867, -28.033912658691406, -26.591632843017578, -25.149351119995117, -23.707069396972656, -22.264789581298828, -20.822507858276367, -19.380226135253906, -17.937946319580078, -16.495664596557617, -15.053383827209473, -13.611103057861328, -12.168821334838867, -10.726540565490723, -9.284259796142578, -7.841978073120117, -6.399696350097656, -4.9574151039123535, -3.51513409614563, -2.0728530883789062, -0.6305718421936035, 0.8117094039916992, 2.2539901733398438, 3.6962718963623047, 5.138552665710449, 6.580833911895752, 8.023115158081055, 9.4653959274292, 10.907676696777344, 12.349958419799805, 13.79223918914795, 15.23452091217041, 16.676801681518555, 18.119083404541016, 19.561363220214844, 21.003644943237305, 22.445926666259766, 23.888206481933594, 25.330488204956055, 26.772769927978516, 28.215049743652344, 29.657331466674805, 31.099611282348633, 32.541893005371094, 33.98417282104492, 35.426456451416016, 36.868736267089844, 38.31101989746094, 39.753299713134766]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 5.0, 6.0, 18.0, 17.0, 19.0, 21.0, 33.0, 27.0, 44.0, 40.0, 42.0, 55.0, 54.0, 67.0, 56.0, 48.0, 49.0, 49.0, 42.0, 41.0, 39.0, 37.0, 37.0, 23.0, 23.0, 26.0, 16.0, 12.0, 9.0, 5.0, 3.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.68914794921875, -5.4915771484375, -5.29400634765625, -5.096435546875, -4.89886474609375, -4.7012939453125, -4.50372314453125, -4.30615234375, -4.10858154296875, -3.9110107421875, -3.71343994140625, -3.515869140625, -3.31829833984375, -3.1207275390625, -2.92315673828125, -2.7255859375, -2.52801513671875, -2.3304443359375, -2.13287353515625, -1.935302734375, -1.73773193359375, -1.5401611328125, -1.34259033203125, -1.14501953125, -0.94744873046875, -0.7498779296875, -0.55230712890625, -0.354736328125, -0.15716552734375, 0.0404052734375, 0.23797607421875, 0.435546875, 0.63311767578125, 0.8306884765625, 1.02825927734375, 1.225830078125, 1.42340087890625, 1.6209716796875, 1.81854248046875, 2.01611328125, 2.21368408203125, 2.4112548828125, 2.60882568359375, 2.806396484375, 3.00396728515625, 3.2015380859375, 3.39910888671875, 3.5966796875, 3.79425048828125, 3.9918212890625, 4.18939208984375, 4.386962890625, 4.58453369140625, 4.7821044921875, 4.97967529296875, 5.17724609375, 5.37481689453125, 5.5723876953125, 5.76995849609375, 5.967529296875, 6.16510009765625, 6.3626708984375, 6.56024169921875, 6.7578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 7.0, 12.0, 15.0, 14.0, 31.0, 52.0, 81.0, 107.0, 143.0, 275.0, 390.0, 643.0, 990.0, 1561.0, 2475.0, 3970.0, 6168.0, 9700.0, 15412.0, 23735.0, 36799.0, 54817.0, 78645.0, 105730.0, 127632.0, 136178.0, 123570.0, 100274.0, 73791.0, 51070.0, 33751.0, 22092.0, 14057.0, 8898.0, 5649.0, 3496.0, 2257.0, 1487.0, 901.0, 580.0, 357.0, 273.0, 162.0, 95.0, 79.0, 45.0, 28.0, 27.0, 11.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1337890625, -1.0988006591796875, -1.063812255859375, -1.0288238525390625, -0.99383544921875, -0.9588470458984375, -0.923858642578125, -0.8888702392578125, -0.8538818359375, -0.8188934326171875, -0.783905029296875, -0.7489166259765625, -0.71392822265625, -0.6789398193359375, -0.643951416015625, -0.6089630126953125, -0.573974609375, -0.5389862060546875, -0.503997802734375, -0.4690093994140625, -0.43402099609375, -0.3990325927734375, -0.364044189453125, -0.3290557861328125, -0.2940673828125, -0.2590789794921875, -0.224090576171875, -0.1891021728515625, -0.15411376953125, -0.1191253662109375, -0.084136962890625, -0.0491485595703125, -0.01416015625, 0.0208282470703125, 0.055816650390625, 0.0908050537109375, 0.12579345703125, 0.1607818603515625, 0.195770263671875, 0.2307586669921875, 0.2657470703125, 0.3007354736328125, 0.335723876953125, 0.3707122802734375, 0.40570068359375, 0.4406890869140625, 0.475677490234375, 0.5106658935546875, 0.545654296875, 0.5806427001953125, 0.615631103515625, 0.6506195068359375, 0.68560791015625, 0.7205963134765625, 0.755584716796875, 0.7905731201171875, 0.8255615234375, 0.8605499267578125, 0.895538330078125, 0.9305267333984375, 0.96551513671875, 1.0005035400390625, 1.035491943359375, 1.0704803466796875, 1.10546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 6.0, 3.0, 7.0, 15.0, 11.0, 9.0, 10.0, 11.0, 18.0, 21.0, 25.0, 23.0, 30.0, 39.0, 42.0, 47.0, 39.0, 46.0, 36.0, 35.0, 1058.0, 44.0, 47.0, 48.0, 43.0, 33.0, 32.0, 25.0, 22.0, 42.0, 33.0, 23.0, 13.0, 19.0, 16.0, 15.0, 8.0, 11.0, 4.0, 7.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.2520751953125, -4.093994140625, -3.9359130859375, -3.77783203125, -3.6197509765625, -3.461669921875, -3.3035888671875, -3.1455078125, -2.9874267578125, -2.829345703125, -2.6712646484375, -2.51318359375, -2.3551025390625, -2.197021484375, -2.0389404296875, -1.880859375, -1.7227783203125, -1.564697265625, -1.4066162109375, -1.24853515625, -1.0904541015625, -0.932373046875, -0.7742919921875, -0.6162109375, -0.4581298828125, -0.300048828125, -0.1419677734375, 0.01611328125, 0.1741943359375, 0.332275390625, 0.4903564453125, 0.6484375, 0.8065185546875, 0.964599609375, 1.1226806640625, 1.28076171875, 1.4388427734375, 1.596923828125, 1.7550048828125, 1.9130859375, 2.0711669921875, 2.229248046875, 2.3873291015625, 2.54541015625, 2.7034912109375, 2.861572265625, 3.0196533203125, 3.177734375, 3.3358154296875, 3.493896484375, 3.6519775390625, 3.81005859375, 3.9681396484375, 4.126220703125, 4.2843017578125, 4.4423828125, 4.6004638671875, 4.758544921875, 4.9166259765625, 5.07470703125, 5.2327880859375, 5.390869140625, 5.5489501953125, 5.70703125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 10.0, 20.0, 23.0, 54.0, 63.0, 81.0, 170.0, 214.0, 340.0, 498.0, 722.0, 1077.0, 1804.0, 2756.0, 4282.0, 7013.0, 11144.0, 17679.0, 29361.0, 46898.0, 73686.0, 110265.0, 189948.0, 1130683.0, 172124.0, 106358.0, 70434.0, 44836.0, 27984.0, 17475.0, 10541.0, 6838.0, 4169.0, 2633.0, 1611.0, 1131.0, 733.0, 475.0, 332.0, 222.0, 126.0, 95.0, 74.0, 45.0, 30.0, 24.0, 14.0, 10.0, 3.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-0.5517578125, -0.5342178344726562, -0.5166778564453125, -0.49913787841796875, -0.481597900390625, -0.46405792236328125, -0.4465179443359375, -0.42897796630859375, -0.41143798828125, -0.39389801025390625, -0.3763580322265625, -0.35881805419921875, -0.341278076171875, -0.32373809814453125, -0.3061981201171875, -0.28865814208984375, -0.2711181640625, -0.25357818603515625, -0.2360382080078125, -0.21849822998046875, -0.200958251953125, -0.18341827392578125, -0.1658782958984375, -0.14833831787109375, -0.13079833984375, -0.11325836181640625, -0.0957183837890625, -0.07817840576171875, -0.060638427734375, -0.04309844970703125, -0.0255584716796875, -0.00801849365234375, 0.009521484375, 0.02706146240234375, 0.0446014404296875, 0.06214141845703125, 0.079681396484375, 0.09722137451171875, 0.1147613525390625, 0.13230133056640625, 0.14984130859375, 0.16738128662109375, 0.1849212646484375, 0.20246124267578125, 0.220001220703125, 0.23754119873046875, 0.2550811767578125, 0.27262115478515625, 0.2901611328125, 0.30770111083984375, 0.3252410888671875, 0.34278106689453125, 0.360321044921875, 0.37786102294921875, 0.3954010009765625, 0.41294097900390625, 0.43048095703125, 0.44802093505859375, 0.4655609130859375, 0.48310089111328125, 0.500640869140625, 0.5181808471679688, 0.5357208251953125, 0.5532608032226562, 0.57080078125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 7.0, 12.0, 14.0, 21.0, 27.0, 27.0, 27.0, 42.0, 58.0, 44.0, 80.0, 75.0, 84.0, 72.0, 61.0, 60.0, 58.0, 55.0, 31.0, 29.0, 27.0, 16.0, 20.0, 11.0, 5.0, 6.0, 1.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.1579151153564453, -0.15262222290039062, -0.14732933044433594, -0.14203643798828125, -0.13674354553222656, -0.13145065307617188, -0.1261577606201172, -0.1208648681640625, -0.11557197570800781, -0.11027908325195312, -0.10498619079589844, -0.09969329833984375, -0.09440040588378906, -0.08910751342773438, -0.08381462097167969, -0.078521728515625, -0.07322883605957031, -0.06793594360351562, -0.06264305114746094, -0.05735015869140625, -0.05205726623535156, -0.046764373779296875, -0.04147148132324219, -0.0361785888671875, -0.030885696411132812, -0.025592803955078125, -0.020299911499023438, -0.01500701904296875, -0.009714126586914062, -0.004421234130859375, 0.0008716583251953125, 0.00616455078125, 0.011457443237304688, 0.016750335693359375, 0.022043228149414062, 0.02733612060546875, 0.03262901306152344, 0.037921905517578125, 0.04321479797363281, 0.0485076904296875, 0.05380058288574219, 0.059093475341796875, 0.06438636779785156, 0.06967926025390625, 0.07497215270996094, 0.08026504516601562, 0.08555793762207031, 0.090850830078125, 0.09614372253417969, 0.10143661499023438, 0.10672950744628906, 0.11202239990234375, 0.11731529235839844, 0.12260818481445312, 0.1279010772705078, 0.1331939697265625, 0.1384868621826172, 0.14377975463867188, 0.14907264709472656, 0.15436553955078125, 0.15965843200683594, 0.16495132446289062, 0.1702442169189453, 0.175537109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 14.0, 29.0, 32.0, 34.0, 42.0, 68.0, 94.0, 186.0, 377.0, 1235.0, 125921.0, 916864.0, 2478.0, 494.0, 222.0, 132.0, 75.0, 37.0, 37.0, 29.0, 30.0, 26.0, 17.0, 10.0, 10.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.392578125, -3.290252685546875, -3.18792724609375, -3.085601806640625, -2.9832763671875, -2.880950927734375, -2.77862548828125, -2.676300048828125, -2.573974609375, -2.471649169921875, -2.36932373046875, -2.266998291015625, -2.1646728515625, -2.062347412109375, -1.96002197265625, -1.857696533203125, -1.75537109375, -1.653045654296875, -1.55072021484375, -1.448394775390625, -1.3460693359375, -1.243743896484375, -1.14141845703125, -1.039093017578125, -0.936767578125, -0.834442138671875, -0.73211669921875, -0.629791259765625, -0.5274658203125, -0.425140380859375, -0.32281494140625, -0.220489501953125, -0.1181640625, -0.015838623046875, 0.08648681640625, 0.188812255859375, 0.2911376953125, 0.393463134765625, 0.49578857421875, 0.598114013671875, 0.700439453125, 0.802764892578125, 0.90509033203125, 1.007415771484375, 1.1097412109375, 1.212066650390625, 1.31439208984375, 1.416717529296875, 1.51904296875, 1.621368408203125, 1.72369384765625, 1.826019287109375, 1.9283447265625, 2.030670166015625, 2.13299560546875, 2.235321044921875, 2.337646484375, 2.439971923828125, 2.54229736328125, 2.644622802734375, 2.7469482421875, 2.849273681640625, 2.95159912109375, 3.053924560546875, 3.15625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 8.0, 16.0, 52.0, 151.0, 353.0, 298.0, 75.0, 24.0, 14.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.444756269454956, -1.415202021598816, -1.3856477737426758, -1.3560936450958252, -1.326539397239685, -1.296985149383545, -1.2674309015274048, -1.2378766536712646, -1.2083224058151245, -1.1787681579589844, -1.1492139101028442, -1.119659662246704, -1.0901055335998535, -1.0605512857437134, -1.0309970378875732, -1.001442790031433, -0.9718886017799377, -0.9423343539237976, -0.9127801656723022, -0.8832259178161621, -0.853671669960022, -0.8241174221038818, -0.7945632338523865, -0.7650089859962463, -0.735454797744751, -0.7059005498886108, -0.6763463616371155, -0.6467921137809753, -0.6172378659248352, -0.5876836776733398, -0.5581294298171997, -0.5285751819610596, -0.4990209639072418, -0.4694667458534241, -0.43991249799728394, -0.4103582799434662, -0.38080406188964844, -0.3512498140335083, -0.32169559597969055, -0.2921413779258728, -0.26258713006973267, -0.23303289711475372, -0.20347866415977478, -0.17392444610595703, -0.1443702131509781, -0.11481598019599915, -0.0852617621421814, -0.055707529187202454, -0.02615329623222351, 0.0034009329974651337, 0.03295516222715378, 0.06250938773155212, 0.09206362068653107, 0.12161785364151001, 0.15117207169532776, 0.1807263046503067, 0.21028053760528564, 0.2398347705602646, 0.26938900351524353, 0.2989432215690613, 0.3284974694252014, 0.35805168747901917, 0.3876059055328369, 0.41716015338897705, 0.4467143714427948]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 14.0, 1.0, 10.0, 8.0, 14.0, 20.0, 18.0, 17.0, 25.0, 16.0, 28.0, 24.0, 31.0, 36.0, 30.0, 40.0, 45.0, 32.0, 32.0, 33.0, 33.0, 35.0, 44.0, 33.0, 34.0, 25.0, 26.0, 36.0, 32.0, 29.0, 16.0, 16.0, 19.0, 20.0, 18.0, 19.0, 10.0, 21.0, 11.0, 8.0, 3.0, 6.0, 6.0, 4.0, 1.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.12011396884918213, -0.11632144451141357, -0.11252892017364502, -0.10873639583587646, -0.10494387149810791, -0.10115134716033936, -0.0973588302731514, -0.09356630593538284, -0.08977378159761429, -0.08598125725984573, -0.08218873292207718, -0.07839620858430862, -0.07460369169712067, -0.07081116735935211, -0.06701864302158356, -0.063226118683815, -0.05943359434604645, -0.05564107000827789, -0.05184854567050934, -0.04805602505803108, -0.04426350072026253, -0.04047097638249397, -0.03667845577001572, -0.03288593143224716, -0.029093407094478607, -0.025300882756710052, -0.021508360281586647, -0.01771583780646324, -0.013923313468694687, -0.010130789130926132, -0.006338266655802727, -0.0025457441806793213, 0.0012467801570892334, 0.0050393035635352135, 0.008831826969981194, 0.012624350376427174, 0.016416873782873154, 0.02020939812064171, 0.024001920595765114, 0.02779444307088852, 0.031586967408657074, 0.03537949174642563, 0.03917201608419418, 0.04296453669667244, 0.046757061034440994, 0.05054958537220955, 0.054342105984687805, 0.05813463032245636, 0.061927154660224915, 0.06571967899799347, 0.06951220333576202, 0.07330472767353058, 0.07709725201129913, 0.08088977634906769, 0.08468229323625565, 0.0884748175740242, 0.09226734191179276, 0.09605986624956131, 0.09985239058732986, 0.10364491492509842, 0.10743743181228638, 0.11122995615005493, 0.11502248048782349, 0.11881500482559204, 0.1226075291633606]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 7.0, 6.0, 15.0, 7.0, 12.0, 10.0, 26.0, 19.0, 25.0, 27.0, 38.0, 31.0, 42.0, 56.0, 57.0, 59.0, 46.0, 45.0, 62.0, 52.0, 48.0, 31.0, 52.0, 38.0, 32.0, 32.0, 28.0, 18.0, 17.0, 16.0, 22.0, 10.0, 2.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.2008056640625, -6.003173828125, -5.8055419921875, -5.60791015625, -5.4102783203125, -5.212646484375, -5.0150146484375, -4.8173828125, -4.6197509765625, -4.422119140625, -4.2244873046875, -4.02685546875, -3.8292236328125, -3.631591796875, -3.4339599609375, -3.236328125, -3.0386962890625, -2.841064453125, -2.6434326171875, -2.44580078125, -2.2481689453125, -2.050537109375, -1.8529052734375, -1.6552734375, -1.4576416015625, -1.260009765625, -1.0623779296875, -0.86474609375, -0.6671142578125, -0.469482421875, -0.2718505859375, -0.07421875, 0.1234130859375, 0.321044921875, 0.5186767578125, 0.71630859375, 0.9139404296875, 1.111572265625, 1.3092041015625, 1.5068359375, 1.7044677734375, 1.902099609375, 2.0997314453125, 2.29736328125, 2.4949951171875, 2.692626953125, 2.8902587890625, 3.087890625, 3.2855224609375, 3.483154296875, 3.6807861328125, 3.87841796875, 4.0760498046875, 4.273681640625, 4.4713134765625, 4.6689453125, 4.8665771484375, 5.064208984375, 5.2618408203125, 5.45947265625, 5.6571044921875, 5.854736328125, 6.0523681640625, 6.25]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 9.0, 6.0, 29.0, 34.0, 56.0, 73.0, 125.0, 242.0, 384.0, 762.0, 1469.0, 2670.0, 5519.0, 10612.0, 20952.0, 39814.0, 77867.0, 151010.0, 259440.0, 226021.0, 122649.0, 62364.0, 32194.0, 16520.0, 8578.0, 4373.0, 2194.0, 1182.0, 615.0, 315.0, 182.0, 114.0, 60.0, 35.0, 22.0, 18.0, 12.0, 13.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.6051025390625, -5.417236328125, -5.2293701171875, -5.04150390625, -4.8536376953125, -4.665771484375, -4.4779052734375, -4.2900390625, -4.1021728515625, -3.914306640625, -3.7264404296875, -3.53857421875, -3.3507080078125, -3.162841796875, -2.9749755859375, -2.787109375, -2.5992431640625, -2.411376953125, -2.2235107421875, -2.03564453125, -1.8477783203125, -1.659912109375, -1.4720458984375, -1.2841796875, -1.0963134765625, -0.908447265625, -0.7205810546875, -0.53271484375, -0.3448486328125, -0.156982421875, 0.0308837890625, 0.21875, 0.4066162109375, 0.594482421875, 0.7823486328125, 0.97021484375, 1.1580810546875, 1.345947265625, 1.5338134765625, 1.7216796875, 1.9095458984375, 2.097412109375, 2.2852783203125, 2.47314453125, 2.6610107421875, 2.848876953125, 3.0367431640625, 3.224609375, 3.4124755859375, 3.600341796875, 3.7882080078125, 3.97607421875, 4.1639404296875, 4.351806640625, 4.5396728515625, 4.7275390625, 4.9154052734375, 5.103271484375, 5.2911376953125, 5.47900390625, 5.6668701171875, 5.854736328125, 6.0426025390625, 6.23046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 8.0, 11.0, 22.0, 23.0, 30.0, 29.0, 27.0, 35.0, 46.0, 74.0, 99.0, 169.0, 297.0, 1415.0, 214.0, 135.0, 89.0, 54.0, 40.0, 39.0, 36.0, 34.0, 20.0, 10.0, 13.0, 13.0, 10.0, 6.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.78125, -28.9599609375, -28.138671875, -27.3173828125, -26.49609375, -25.6748046875, -24.853515625, -24.0322265625, -23.2109375, -22.3896484375, -21.568359375, -20.7470703125, -19.92578125, -19.1044921875, -18.283203125, -17.4619140625, -16.640625, -15.8193359375, -14.998046875, -14.1767578125, -13.35546875, -12.5341796875, -11.712890625, -10.8916015625, -10.0703125, -9.2490234375, -8.427734375, -7.6064453125, -6.78515625, -5.9638671875, -5.142578125, -4.3212890625, -3.5, -2.6787109375, -1.857421875, -1.0361328125, -0.21484375, 0.6064453125, 1.427734375, 2.2490234375, 3.0703125, 3.8916015625, 4.712890625, 5.5341796875, 6.35546875, 7.1767578125, 7.998046875, 8.8193359375, 9.640625, 10.4619140625, 11.283203125, 12.1044921875, 12.92578125, 13.7470703125, 14.568359375, 15.3896484375, 16.2109375, 17.0322265625, 17.853515625, 18.6748046875, 19.49609375, 20.3173828125, 21.138671875, 21.9599609375, 22.78125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 19.0, 15.0, 24.0, 26.0, 22.0, 63.0, 79.0, 115.0, 165.0, 246.0, 448.0, 1179.0, 10388.0, 1643722.0, 1477198.0, 9583.0, 1127.0, 455.0, 229.0, 166.0, 107.0, 74.0, 55.0, 46.0, 40.0, 23.0, 16.0, 11.0, 4.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.01171875, -39.4921875, -37.97265625, -36.453125, -34.93359375, -33.4140625, -31.89453125, -30.375, -28.85546875, -27.3359375, -25.81640625, -24.296875, -22.77734375, -21.2578125, -19.73828125, -18.21875, -16.69921875, -15.1796875, -13.66015625, -12.140625, -10.62109375, -9.1015625, -7.58203125, -6.0625, -4.54296875, -3.0234375, -1.50390625, 0.015625, 1.53515625, 3.0546875, 4.57421875, 6.09375, 7.61328125, 9.1328125, 10.65234375, 12.171875, 13.69140625, 15.2109375, 16.73046875, 18.25, 19.76953125, 21.2890625, 22.80859375, 24.328125, 25.84765625, 27.3671875, 28.88671875, 30.40625, 31.92578125, 33.4453125, 34.96484375, 36.484375, 38.00390625, 39.5234375, 41.04296875, 42.5625, 44.08203125, 45.6015625, 47.12109375, 48.640625, 50.16015625, 51.6796875, 53.19921875, 54.71875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 12.0, 33.0, 117.0, 211.0, 262.0, 224.0, 95.0, 47.0, 11.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.17825698852539, -26.134414672851562, -23.0905704498291, -20.04672622680664, -17.002883911132812, -13.959040641784668, -10.915197372436523, -7.8713531494140625, -4.827510833740234, -1.7836675643920898, 1.2601757049560547, 4.304018974304199, 7.347862243652344, 10.391705513000488, 13.435548782348633, 16.479393005371094, 19.523235321044922, 22.56707763671875, 25.61092185974121, 28.654766082763672, 31.6986083984375, 34.74245071411133, 37.786293029785156, 40.83013916015625, 43.87398147583008, 46.917823791503906, 49.961669921875, 53.00551223754883, 56.049354553222656, 59.093196868896484, 62.13703918457031, 65.1808853149414, 68.2247314453125, 71.2685775756836, 74.31241607666016, 77.35626220703125, 80.40010070800781, 83.4439468383789, 86.48779296875, 89.53163146972656, 92.57547760009766, 95.61932373046875, 98.66316223144531, 101.7070083618164, 104.7508544921875, 107.79469299316406, 110.83853912353516, 113.88238525390625, 116.92622375488281, 119.9700698852539, 123.01390838623047, 126.05775451660156, 129.10159301757812, 132.14544677734375, 135.1892852783203, 138.23312377929688, 141.2769775390625, 144.32081604003906, 147.3646697998047, 150.40850830078125, 153.4523468017578, 156.49620056152344, 159.5400390625, 162.58387756347656, 165.62771606445312]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 14.0, 9.0, 8.0, 11.0, 16.0, 12.0, 23.0, 17.0, 24.0, 22.0, 34.0, 34.0, 33.0, 38.0, 38.0, 34.0, 44.0, 42.0, 37.0, 49.0, 38.0, 36.0, 33.0, 37.0, 42.0, 41.0, 22.0, 26.0, 27.0, 21.0, 23.0, 12.0, 13.0, 20.0, 8.0, 13.0, 7.0, 9.0, 5.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.859703063964844, -49.288818359375, -47.717933654785156, -46.14704895019531, -44.57616424560547, -43.00528335571289, -41.43439865112305, -39.8635139465332, -38.29262924194336, -36.721744537353516, -35.15085983276367, -33.57997512817383, -32.00909423828125, -30.438207626342773, -28.867324829101562, -27.29644012451172, -25.725555419921875, -24.15467071533203, -22.583786010742188, -21.012903213500977, -19.442018508911133, -17.87113380432129, -16.300251007080078, -14.729366302490234, -13.15848159790039, -11.587596893310547, -10.01671314239502, -8.445829391479492, -6.874944686889648, -5.304060459136963, -3.7331762313842773, -2.16229248046875, -0.5914039611816406, 0.9794802665710449, 2.5503644943237305, 4.121248722076416, 5.692132949829102, 7.263017177581787, 8.833901405334473, 10.40478515625, 11.975669860839844, 13.546554565429688, 15.117438316345215, 16.688322067260742, 18.259206771850586, 19.83009147644043, 21.40097427368164, 22.971858978271484, 24.542743682861328, 26.113628387451172, 27.684513092041016, 29.255395889282227, 30.82628059387207, 32.39716339111328, 33.968048095703125, 35.53893280029297, 37.10981750488281, 38.680702209472656, 40.2515869140625, 41.822471618652344, 43.39335632324219, 44.964237213134766, 46.53512191772461, 48.10600662231445, 49.6768913269043]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 12.0, 6.0, 15.0, 13.0, 22.0, 24.0, 23.0, 22.0, 32.0, 47.0, 47.0, 52.0, 54.0, 51.0, 66.0, 57.0, 48.0, 50.0, 45.0, 65.0, 51.0, 41.0, 24.0, 22.0, 21.0, 22.0, 19.0, 16.0, 6.0, 9.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.68353271484375, -7.4530029296875, -7.22247314453125, -6.991943359375, -6.76141357421875, -6.5308837890625, -6.30035400390625, -6.06982421875, -5.83929443359375, -5.6087646484375, -5.37823486328125, -5.147705078125, -4.91717529296875, -4.6866455078125, -4.45611572265625, -4.2255859375, -3.99505615234375, -3.7645263671875, -3.53399658203125, -3.303466796875, -3.07293701171875, -2.8424072265625, -2.61187744140625, -2.38134765625, -2.15081787109375, -1.9202880859375, -1.68975830078125, -1.459228515625, -1.22869873046875, -0.9981689453125, -0.76763916015625, -0.537109375, -0.30657958984375, -0.0760498046875, 0.15447998046875, 0.385009765625, 0.61553955078125, 0.8460693359375, 1.07659912109375, 1.30712890625, 1.53765869140625, 1.7681884765625, 1.99871826171875, 2.229248046875, 2.45977783203125, 2.6903076171875, 2.92083740234375, 3.1513671875, 3.38189697265625, 3.6124267578125, 3.84295654296875, 4.073486328125, 4.30401611328125, 4.5345458984375, 4.76507568359375, 4.99560546875, 5.22613525390625, 5.4566650390625, 5.68719482421875, 5.917724609375, 6.14825439453125, 6.3787841796875, 6.60931396484375, 6.83984375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 31.0, 27.0, 39.0, 40.0, 60.0, 85.0, 135.0, 259.0, 568.0, 1489.0, 5530.0, 34371.0, 358697.0, 2382029.0, 1267369.0, 124011.0, 14709.0, 3009.0, 851.0, 365.0, 191.0, 97.0, 63.0, 63.0, 37.0, 27.0, 22.0, 23.0, 12.0, 7.0, 6.0, 6.0, 5.0, 7.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.046875, -16.5704345703125, -16.093994140625, -15.6175537109375, -15.14111328125, -14.6646728515625, -14.188232421875, -13.7117919921875, -13.2353515625, -12.7589111328125, -12.282470703125, -11.8060302734375, -11.32958984375, -10.8531494140625, -10.376708984375, -9.9002685546875, -9.423828125, -8.9473876953125, -8.470947265625, -7.9945068359375, -7.51806640625, -7.0416259765625, -6.565185546875, -6.0887451171875, -5.6123046875, -5.1358642578125, -4.659423828125, -4.1829833984375, -3.70654296875, -3.2301025390625, -2.753662109375, -2.2772216796875, -1.80078125, -1.3243408203125, -0.847900390625, -0.3714599609375, 0.10498046875, 0.5814208984375, 1.057861328125, 1.5343017578125, 2.0107421875, 2.4871826171875, 2.963623046875, 3.4400634765625, 3.91650390625, 4.3929443359375, 4.869384765625, 5.3458251953125, 5.822265625, 6.2987060546875, 6.775146484375, 7.2515869140625, 7.72802734375, 8.2044677734375, 8.680908203125, 9.1573486328125, 9.6337890625, 10.1102294921875, 10.586669921875, 11.0631103515625, 11.53955078125, 12.0159912109375, 12.492431640625, 12.9688720703125, 13.4453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 12.0, 12.0, 15.0, 22.0, 36.0, 43.0, 69.0, 98.0, 103.0, 138.0, 198.0, 293.0, 377.0, 467.0, 478.0, 426.0, 341.0, 246.0, 194.0, 153.0, 104.0, 78.0, 45.0, 23.0, 28.0, 23.0, 11.0, 8.0, 7.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.9617919921875, -13.540771484375, -13.1197509765625, -12.69873046875, -12.2777099609375, -11.856689453125, -11.4356689453125, -11.0146484375, -10.5936279296875, -10.172607421875, -9.7515869140625, -9.33056640625, -8.9095458984375, -8.488525390625, -8.0675048828125, -7.646484375, -7.2254638671875, -6.804443359375, -6.3834228515625, -5.96240234375, -5.5413818359375, -5.120361328125, -4.6993408203125, -4.2783203125, -3.8572998046875, -3.436279296875, -3.0152587890625, -2.59423828125, -2.1732177734375, -1.752197265625, -1.3311767578125, -0.91015625, -0.4891357421875, -0.068115234375, 0.3529052734375, 0.77392578125, 1.1949462890625, 1.615966796875, 2.0369873046875, 2.4580078125, 2.8790283203125, 3.300048828125, 3.7210693359375, 4.14208984375, 4.5631103515625, 4.984130859375, 5.4051513671875, 5.826171875, 6.2471923828125, 6.668212890625, 7.0892333984375, 7.51025390625, 7.9312744140625, 8.352294921875, 8.7733154296875, 9.1943359375, 9.6153564453125, 10.036376953125, 10.4573974609375, 10.87841796875, 11.2994384765625, 11.720458984375, 12.1414794921875, 12.5625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 10.0, 12.0, 12.0, 14.0, 30.0, 20.0, 38.0, 65.0, 92.0, 162.0, 280.0, 577.0, 1665.0, 10343.0, 151517.0, 2484661.0, 1463661.0, 72905.0, 5960.0, 1200.0, 432.0, 208.0, 133.0, 102.0, 52.0, 39.0, 30.0, 14.0, 18.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.484375, -24.63134765625, -23.7783203125, -22.92529296875, -22.072265625, -21.21923828125, -20.3662109375, -19.51318359375, -18.66015625, -17.80712890625, -16.9541015625, -16.10107421875, -15.248046875, -14.39501953125, -13.5419921875, -12.68896484375, -11.8359375, -10.98291015625, -10.1298828125, -9.27685546875, -8.423828125, -7.57080078125, -6.7177734375, -5.86474609375, -5.01171875, -4.15869140625, -3.3056640625, -2.45263671875, -1.599609375, -0.74658203125, 0.1064453125, 0.95947265625, 1.8125, 2.66552734375, 3.5185546875, 4.37158203125, 5.224609375, 6.07763671875, 6.9306640625, 7.78369140625, 8.63671875, 9.48974609375, 10.3427734375, 11.19580078125, 12.048828125, 12.90185546875, 13.7548828125, 14.60791015625, 15.4609375, 16.31396484375, 17.1669921875, 18.02001953125, 18.873046875, 19.72607421875, 20.5791015625, 21.43212890625, 22.28515625, 23.13818359375, 23.9912109375, 24.84423828125, 25.697265625, 26.55029296875, 27.4033203125, 28.25634765625, 29.109375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 26.0, 33.0, 43.0, 58.0, 96.0, 104.0, 106.0, 112.0, 88.0, 94.0, 74.0, 54.0, 37.0, 33.0, 12.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.86249542236328, -59.87479782104492, -57.88710021972656, -55.89939880371094, -53.91170120239258, -51.92400360107422, -49.93630599975586, -47.9486083984375, -45.960906982421875, -43.973209381103516, -41.985511779785156, -39.99781036376953, -38.01011276245117, -36.02241516113281, -34.03471755981445, -32.047019958496094, -30.059322357177734, -28.071624755859375, -26.083925247192383, -24.096227645874023, -22.10852813720703, -20.120830535888672, -18.133132934570312, -16.145435333251953, -14.157735824584961, -12.170037269592285, -10.18233871459961, -8.19464111328125, -6.206942558288574, -4.219244003295898, -2.231546401977539, -0.24384784698486328, 1.7438507080078125, 3.731549024581909, 5.719247341156006, 7.706945419311523, 9.6946439743042, 11.682342529296875, 13.670040130615234, 15.65773868560791, 17.645437240600586, 19.633134841918945, 21.620834350585938, 23.608531951904297, 25.596229553222656, 27.58392906188965, 29.571626663208008, 31.559326171875, 33.54702377319336, 35.53472137451172, 37.52241897583008, 39.51011657714844, 41.49781799316406, 43.48551559448242, 45.47321319580078, 47.46091079711914, 49.4486083984375, 51.43630599975586, 53.42400360107422, 55.411705017089844, 57.3994026184082, 59.38710021972656, 61.37479782104492, 63.36249542236328, 65.3501968383789]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 10.0, 12.0, 17.0, 21.0, 30.0, 31.0, 27.0, 33.0, 32.0, 49.0, 44.0, 44.0, 52.0, 46.0, 53.0, 53.0, 41.0, 52.0, 53.0, 53.0, 38.0, 32.0, 27.0, 23.0, 24.0, 23.0, 16.0, 12.0, 10.0, 2.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.765010833740234, -47.16758346557617, -45.57015609741211, -43.97272872924805, -42.375301361083984, -40.77787399291992, -39.180450439453125, -37.58302307128906, -35.985595703125, -34.38816833496094, -32.790740966796875, -31.193313598632812, -29.59588623046875, -27.998458862304688, -26.401033401489258, -24.803606033325195, -23.2061767578125, -21.608749389648438, -20.011322021484375, -18.413894653320312, -16.81646728515625, -15.219040870666504, -13.621614456176758, -12.024187088012695, -10.426759719848633, -8.82933235168457, -7.231905460357666, -5.634478569030762, -4.037051200866699, -2.4396238327026367, -0.8421974182128906, 0.7552299499511719, 2.3526573181152344, 3.9500844478607178, 5.547511577606201, 7.1449384689331055, 8.742365837097168, 10.33979320526123, 11.937219619750977, 13.534646987915039, 15.132074356079102, 16.729501724243164, 18.326929092407227, 19.924354553222656, 21.52178192138672, 23.11920928955078, 24.716636657714844, 26.314064025878906, 27.91149139404297, 29.50891876220703, 31.106346130371094, 32.703773498535156, 34.30120086669922, 35.89862823486328, 37.496055603027344, 39.093482971191406, 40.69091033935547, 42.28833770751953, 43.885765075683594, 45.483192443847656, 47.08061981201172, 48.67804718017578, 50.275474548339844, 51.872901916503906, 53.4703254699707]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 16.0, 15.0, 16.0, 26.0, 31.0, 28.0, 31.0, 51.0, 45.0, 46.0, 44.0, 54.0, 65.0, 54.0, 61.0, 50.0, 56.0, 61.0, 46.0, 34.0, 26.0, 17.0, 26.0, 14.0, 24.0, 18.0, 9.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.06195068359375, -5.8387451171875, -5.61553955078125, -5.392333984375, -5.16912841796875, -4.9459228515625, -4.72271728515625, -4.49951171875, -4.27630615234375, -4.0531005859375, -3.82989501953125, -3.606689453125, -3.38348388671875, -3.1602783203125, -2.93707275390625, -2.7138671875, -2.49066162109375, -2.2674560546875, -2.04425048828125, -1.821044921875, -1.59783935546875, -1.3746337890625, -1.15142822265625, -0.92822265625, -0.70501708984375, -0.4818115234375, -0.25860595703125, -0.035400390625, 0.18780517578125, 0.4110107421875, 0.63421630859375, 0.857421875, 1.08062744140625, 1.3038330078125, 1.52703857421875, 1.750244140625, 1.97344970703125, 2.1966552734375, 2.41986083984375, 2.64306640625, 2.86627197265625, 3.0894775390625, 3.31268310546875, 3.535888671875, 3.75909423828125, 3.9822998046875, 4.20550537109375, 4.4287109375, 4.65191650390625, 4.8751220703125, 5.09832763671875, 5.321533203125, 5.54473876953125, 5.7679443359375, 5.99114990234375, 6.21435546875, 6.43756103515625, 6.6607666015625, 6.88397216796875, 7.107177734375, 7.33038330078125, 7.5535888671875, 7.77679443359375, 8.0]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 11.0, 12.0, 16.0, 27.0, 39.0, 58.0, 81.0, 149.0, 238.0, 363.0, 599.0, 998.0, 1584.0, 2610.0, 4182.0, 6807.0, 11488.0, 19224.0, 31073.0, 48858.0, 74588.0, 107011.0, 138367.0, 152041.0, 137916.0, 107063.0, 74515.0, 49013.0, 30984.0, 18991.0, 11650.0, 7117.0, 4262.0, 2612.0, 1553.0, 963.0, 540.0, 337.0, 228.0, 148.0, 80.0, 65.0, 41.0, 15.0, 18.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.1419525146484375, -1.103240966796875, -1.0645294189453125, -1.02581787109375, -0.9871063232421875, -0.948394775390625, -0.9096832275390625, -0.8709716796875, -0.8322601318359375, -0.793548583984375, -0.7548370361328125, -0.71612548828125, -0.6774139404296875, -0.638702392578125, -0.5999908447265625, -0.561279296875, -0.5225677490234375, -0.483856201171875, -0.4451446533203125, -0.40643310546875, -0.3677215576171875, -0.329010009765625, -0.2902984619140625, -0.2515869140625, -0.2128753662109375, -0.174163818359375, -0.1354522705078125, -0.09674072265625, -0.0580291748046875, -0.019317626953125, 0.0193939208984375, 0.05810546875, 0.0968170166015625, 0.135528564453125, 0.1742401123046875, 0.21295166015625, 0.2516632080078125, 0.290374755859375, 0.3290863037109375, 0.3677978515625, 0.4065093994140625, 0.445220947265625, 0.4839324951171875, 0.52264404296875, 0.5613555908203125, 0.600067138671875, 0.6387786865234375, 0.677490234375, 0.7162017822265625, 0.754913330078125, 0.7936248779296875, 0.83233642578125, 0.8710479736328125, 0.909759521484375, 0.9484710693359375, 0.9871826171875, 1.0258941650390625, 1.064605712890625, 1.1033172607421875, 1.14202880859375, 1.1807403564453125, 1.219451904296875, 1.2581634521484375, 1.296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 9.0, 3.0, 2.0, 6.0, 6.0, 11.0, 5.0, 20.0, 17.0, 21.0, 21.0, 20.0, 28.0, 27.0, 28.0, 31.0, 33.0, 32.0, 35.0, 35.0, 38.0, 33.0, 32.0, 1061.0, 39.0, 41.0, 41.0, 23.0, 23.0, 32.0, 22.0, 30.0, 27.0, 21.0, 21.0, 24.0, 16.0, 16.0, 22.0, 11.0, 18.0, 6.0, 8.0, 11.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.830078125, -3.698577880859375, -3.56707763671875, -3.435577392578125, -3.3040771484375, -3.172576904296875, -3.04107666015625, -2.909576416015625, -2.778076171875, -2.646575927734375, -2.51507568359375, -2.383575439453125, -2.2520751953125, -2.120574951171875, -1.98907470703125, -1.857574462890625, -1.72607421875, -1.594573974609375, -1.46307373046875, -1.331573486328125, -1.2000732421875, -1.068572998046875, -0.93707275390625, -0.805572509765625, -0.674072265625, -0.542572021484375, -0.41107177734375, -0.279571533203125, -0.1480712890625, -0.016571044921875, 0.11492919921875, 0.246429443359375, 0.3779296875, 0.509429931640625, 0.64093017578125, 0.772430419921875, 0.9039306640625, 1.035430908203125, 1.16693115234375, 1.298431396484375, 1.429931640625, 1.561431884765625, 1.69293212890625, 1.824432373046875, 1.9559326171875, 2.087432861328125, 2.21893310546875, 2.350433349609375, 2.48193359375, 2.613433837890625, 2.74493408203125, 2.876434326171875, 3.0079345703125, 3.139434814453125, 3.27093505859375, 3.402435302734375, 3.533935546875, 3.665435791015625, 3.79693603515625, 3.928436279296875, 4.0599365234375, 4.191436767578125, 4.32293701171875, 4.454437255859375, 4.5859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 4.0, 4.0, 8.0, 19.0, 18.0, 28.0, 70.0, 101.0, 136.0, 171.0, 286.0, 484.0, 673.0, 979.0, 1579.0, 2358.0, 3823.0, 5843.0, 9353.0, 14836.0, 23006.0, 36322.0, 56650.0, 83662.0, 120238.0, 376758.0, 940019.0, 141318.0, 94511.0, 64926.0, 42926.0, 27467.0, 17519.0, 11187.0, 7152.0, 4487.0, 2848.0, 1825.0, 1195.0, 808.0, 512.0, 359.0, 233.0, 160.0, 97.0, 56.0, 34.0, 17.0, 23.0, 14.0, 5.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.5283203125, -0.51190185546875, -0.4954833984375, -0.47906494140625, -0.462646484375, -0.44622802734375, -0.4298095703125, -0.41339111328125, -0.39697265625, -0.38055419921875, -0.3641357421875, -0.34771728515625, -0.331298828125, -0.31488037109375, -0.2984619140625, -0.28204345703125, -0.265625, -0.24920654296875, -0.2327880859375, -0.21636962890625, -0.199951171875, -0.18353271484375, -0.1671142578125, -0.15069580078125, -0.13427734375, -0.11785888671875, -0.1014404296875, -0.08502197265625, -0.068603515625, -0.05218505859375, -0.0357666015625, -0.01934814453125, -0.0029296875, 0.01348876953125, 0.0299072265625, 0.04632568359375, 0.062744140625, 0.07916259765625, 0.0955810546875, 0.11199951171875, 0.12841796875, 0.14483642578125, 0.1612548828125, 0.17767333984375, 0.194091796875, 0.21051025390625, 0.2269287109375, 0.24334716796875, 0.259765625, 0.27618408203125, 0.2926025390625, 0.30902099609375, 0.325439453125, 0.34185791015625, 0.3582763671875, 0.37469482421875, 0.39111328125, 0.40753173828125, 0.4239501953125, 0.44036865234375, 0.456787109375, 0.47320556640625, 0.4896240234375, 0.50604248046875, 0.5224609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 13.0, 12.0, 9.0, 15.0, 18.0, 21.0, 10.0, 28.0, 30.0, 33.0, 41.0, 44.0, 56.0, 55.0, 73.0, 71.0, 69.0, 52.0, 51.0, 49.0, 33.0, 21.0, 27.0, 19.0, 23.0, 18.0, 16.0, 8.0, 11.0, 12.0, 10.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09014892578125, -0.08749103546142578, -0.08483314514160156, -0.08217525482177734, -0.07951736450195312, -0.0768594741821289, -0.07420158386230469, -0.07154369354248047, -0.06888580322265625, -0.06622791290283203, -0.06357002258300781, -0.060912132263183594, -0.058254241943359375, -0.055596351623535156, -0.05293846130371094, -0.05028057098388672, -0.0476226806640625, -0.04496479034423828, -0.04230690002441406, -0.039649009704589844, -0.036991119384765625, -0.034333229064941406, -0.03167533874511719, -0.02901744842529297, -0.02635955810546875, -0.02370166778564453, -0.021043777465820312, -0.018385887145996094, -0.015727996826171875, -0.013070106506347656, -0.010412216186523438, -0.007754325866699219, -0.005096435546875, -0.0024385452270507812, 0.0002193450927734375, 0.0028772354125976562, 0.005535125732421875, 0.008193016052246094, 0.010850906372070312, 0.013508796691894531, 0.01616668701171875, 0.01882457733154297, 0.021482467651367188, 0.024140357971191406, 0.026798248291015625, 0.029456138610839844, 0.03211402893066406, 0.03477191925048828, 0.0374298095703125, 0.04008769989013672, 0.04274559020996094, 0.045403480529785156, 0.048061370849609375, 0.050719261169433594, 0.05337715148925781, 0.05603504180908203, 0.05869293212890625, 0.06135082244873047, 0.06400871276855469, 0.0666666030883789, 0.06932449340820312, 0.07198238372802734, 0.07464027404785156, 0.07729816436767578, 0.0799560546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 8.0, 6.0, 7.0, 19.0, 24.0, 18.0, 34.0, 43.0, 78.0, 128.0, 377.0, 1804.0, 943418.0, 101202.0, 840.0, 238.0, 107.0, 46.0, 41.0, 26.0, 18.0, 15.0, 14.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.540771484375, -2.45263671875, -2.364501953125, -2.2763671875, -2.188232421875, -2.10009765625, -2.011962890625, -1.923828125, -1.835693359375, -1.74755859375, -1.659423828125, -1.5712890625, -1.483154296875, -1.39501953125, -1.306884765625, -1.21875, -1.130615234375, -1.04248046875, -0.954345703125, -0.8662109375, -0.778076171875, -0.68994140625, -0.601806640625, -0.513671875, -0.425537109375, -0.33740234375, -0.249267578125, -0.1611328125, -0.072998046875, 0.01513671875, 0.103271484375, 0.19140625, 0.279541015625, 0.36767578125, 0.455810546875, 0.5439453125, 0.632080078125, 0.72021484375, 0.808349609375, 0.896484375, 0.984619140625, 1.07275390625, 1.160888671875, 1.2490234375, 1.337158203125, 1.42529296875, 1.513427734375, 1.6015625, 1.689697265625, 1.77783203125, 1.865966796875, 1.9541015625, 2.042236328125, 2.13037109375, 2.218505859375, 2.306640625, 2.394775390625, 2.48291015625, 2.571044921875, 2.6591796875, 2.747314453125, 2.83544921875, 2.923583984375, 3.01171875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 9.0, 11.0, 14.0, 31.0, 32.0, 61.0, 97.0, 158.0, 203.0, 169.0, 82.0, 59.0, 24.0, 18.0, 12.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2366447001695633, -0.22401343286037445, -0.2113821804523468, -0.19875091314315796, -0.18611964583396912, -0.17348839342594147, -0.16085712611675262, -0.14822587370872498, -0.13559460639953613, -0.12296334654092789, -0.11033208668231964, -0.0977008193731308, -0.08506955951452255, -0.0724382996559143, -0.059807032346725464, -0.04717577248811722, -0.03454451262950897, -0.021913250908255577, -0.009281989187002182, 0.0033492743968963623, 0.015980534255504608, 0.028611794114112854, 0.0412430614233017, 0.05387432128190994, 0.06650558114051819, 0.07913684099912643, 0.09176810085773468, 0.10439936816692352, 0.11703062802553177, 0.12966188788414001, 0.14229315519332886, 0.1549244225025177, 0.16755568981170654, 0.18018695712089539, 0.19281820952892303, 0.20544947683811188, 0.21808072924613953, 0.23071199655532837, 0.2433432638645172, 0.25597453117370605, 0.2686057686805725, 0.28123703598976135, 0.2938683032989502, 0.30649954080581665, 0.3191308081150055, 0.33176207542419434, 0.3443933427333832, 0.357024610042572, 0.36965587735176086, 0.3822871446609497, 0.39491841197013855, 0.4075496792793274, 0.42018091678619385, 0.4328121840953827, 0.44544345140457153, 0.4580747187137604, 0.4707059860229492, 0.48333725333213806, 0.4959685206413269, 0.5085997581481934, 0.5212310552597046, 0.533862292766571, 0.5464935302734375, 0.5591248273849487, 0.5717560648918152]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 4.0, 9.0, 6.0, 5.0, 14.0, 9.0, 15.0, 11.0, 13.0, 15.0, 19.0, 29.0, 39.0, 32.0, 43.0, 32.0, 45.0, 47.0, 47.0, 40.0, 48.0, 37.0, 50.0, 34.0, 42.0, 29.0, 31.0, 30.0, 29.0, 25.0, 29.0, 27.0, 19.0, 14.0, 16.0, 8.0, 12.0, 10.0, 14.0, 5.0, 4.0, 4.0, 1.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.11357057094573975, -0.11040318757295609, -0.10723580420017242, -0.10406842827796936, -0.1009010449051857, -0.09773366153240204, -0.09456628561019897, -0.09139890223741531, -0.08823151886463165, -0.08506413549184799, -0.08189675211906433, -0.07872937619686127, -0.0755619928240776, -0.07239460945129395, -0.06922723352909088, -0.06605985015630722, -0.06289246678352356, -0.0597250834107399, -0.056557703763246536, -0.053390324115753174, -0.05022294074296951, -0.04705555737018585, -0.04388817772269249, -0.04072079807519913, -0.037553414702415466, -0.034386031329631805, -0.031218651682138443, -0.02805127017199993, -0.02488388866186142, -0.021716507151722908, -0.018549125641584396, -0.015381744131445885, -0.012214362621307373, -0.009046981111168861, -0.00587959960103035, -0.002712218090891838, 0.0004551634192466736, 0.0036225449293851852, 0.006789926439523697, 0.009957307949662209, 0.01312468945980072, 0.016292070969939232, 0.019459452480077744, 0.022626833990216255, 0.025794215500354767, 0.02896159701049328, 0.03212897852063179, 0.03529635816812515, 0.038463741540908813, 0.041631124913692474, 0.04479850456118584, 0.0479658842086792, 0.05113326758146286, 0.05430065095424652, 0.05746803060173988, 0.060635410249233246, 0.0638027936220169, 0.06697017699480057, 0.07013756036758423, 0.07330493628978729, 0.07647231966257095, 0.07963970303535461, 0.08280707895755768, 0.08597446233034134, 0.089141845703125]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 12.0, 14.0, 13.0, 26.0, 19.0, 31.0, 26.0, 46.0, 34.0, 40.0, 55.0, 44.0, 68.0, 48.0, 57.0, 68.0, 63.0, 40.0, 57.0, 34.0, 42.0, 28.0, 30.0, 20.0, 21.0, 15.0, 12.0, 9.0, 4.0, 10.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.5191650390625, -6.296142578125, -6.0731201171875, -5.85009765625, -5.6270751953125, -5.404052734375, -5.1810302734375, -4.9580078125, -4.7349853515625, -4.511962890625, -4.2889404296875, -4.06591796875, -3.8428955078125, -3.619873046875, -3.3968505859375, -3.173828125, -2.9508056640625, -2.727783203125, -2.5047607421875, -2.28173828125, -2.0587158203125, -1.835693359375, -1.6126708984375, -1.3896484375, -1.1666259765625, -0.943603515625, -0.7205810546875, -0.49755859375, -0.2745361328125, -0.051513671875, 0.1715087890625, 0.39453125, 0.6175537109375, 0.840576171875, 1.0635986328125, 1.28662109375, 1.5096435546875, 1.732666015625, 1.9556884765625, 2.1787109375, 2.4017333984375, 2.624755859375, 2.8477783203125, 3.07080078125, 3.2938232421875, 3.516845703125, 3.7398681640625, 3.962890625, 4.1859130859375, 4.408935546875, 4.6319580078125, 4.85498046875, 5.0780029296875, 5.301025390625, 5.5240478515625, 5.7470703125, 5.9700927734375, 6.193115234375, 6.4161376953125, 6.63916015625, 6.8621826171875, 7.085205078125, 7.3082275390625, 7.53125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 7.0, 4.0, 7.0, 3.0, 11.0, 19.0, 18.0, 37.0, 58.0, 94.0, 172.0, 240.0, 462.0, 886.0, 1713.0, 3409.0, 6753.0, 13693.0, 30071.0, 69091.0, 172533.0, 362687.0, 225657.0, 89326.0, 37646.0, 17345.0, 8268.0, 4020.0, 1966.0, 1013.0, 535.0, 321.0, 176.0, 112.0, 59.0, 38.0, 28.0, 32.0, 14.0, 14.0, 10.0, 2.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3984375, -8.156005859375, -7.91357421875, -7.671142578125, -7.4287109375, -7.186279296875, -6.94384765625, -6.701416015625, -6.458984375, -6.216552734375, -5.97412109375, -5.731689453125, -5.4892578125, -5.246826171875, -5.00439453125, -4.761962890625, -4.51953125, -4.277099609375, -4.03466796875, -3.792236328125, -3.5498046875, -3.307373046875, -3.06494140625, -2.822509765625, -2.580078125, -2.337646484375, -2.09521484375, -1.852783203125, -1.6103515625, -1.367919921875, -1.12548828125, -0.883056640625, -0.640625, -0.398193359375, -0.15576171875, 0.086669921875, 0.3291015625, 0.571533203125, 0.81396484375, 1.056396484375, 1.298828125, 1.541259765625, 1.78369140625, 2.026123046875, 2.2685546875, 2.510986328125, 2.75341796875, 2.995849609375, 3.23828125, 3.480712890625, 3.72314453125, 3.965576171875, 4.2080078125, 4.450439453125, 4.69287109375, 4.935302734375, 5.177734375, 5.420166015625, 5.66259765625, 5.905029296875, 6.1474609375, 6.389892578125, 6.63232421875, 6.874755859375, 7.1171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 11.0, 12.0, 16.0, 22.0, 24.0, 23.0, 19.0, 30.0, 42.0, 39.0, 41.0, 54.0, 78.0, 101.0, 198.0, 1373.0, 311.0, 141.0, 80.0, 65.0, 52.0, 37.0, 37.0, 34.0, 32.0, 19.0, 24.0, 20.0, 28.0, 16.0, 9.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.904052734375, -19.27685546875, -18.649658203125, -18.0224609375, -17.395263671875, -16.76806640625, -16.140869140625, -15.513671875, -14.886474609375, -14.25927734375, -13.632080078125, -13.0048828125, -12.377685546875, -11.75048828125, -11.123291015625, -10.49609375, -9.868896484375, -9.24169921875, -8.614501953125, -7.9873046875, -7.360107421875, -6.73291015625, -6.105712890625, -5.478515625, -4.851318359375, -4.22412109375, -3.596923828125, -2.9697265625, -2.342529296875, -1.71533203125, -1.088134765625, -0.4609375, 0.166259765625, 0.79345703125, 1.420654296875, 2.0478515625, 2.675048828125, 3.30224609375, 3.929443359375, 4.556640625, 5.183837890625, 5.81103515625, 6.438232421875, 7.0654296875, 7.692626953125, 8.31982421875, 8.947021484375, 9.57421875, 10.201416015625, 10.82861328125, 11.455810546875, 12.0830078125, 12.710205078125, 13.33740234375, 13.964599609375, 14.591796875, 15.218994140625, 15.84619140625, 16.473388671875, 17.1005859375, 17.727783203125, 18.35498046875, 18.982177734375, 19.609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 9.0, 11.0, 6.0, 18.0, 17.0, 24.0, 27.0, 45.0, 46.0, 48.0, 68.0, 87.0, 115.0, 166.0, 249.0, 462.0, 1347.0, 10382.0, 456787.0, 2635219.0, 36094.0, 2631.0, 647.0, 330.0, 224.0, 141.0, 111.0, 70.0, 55.0, 47.0, 34.0, 21.0, 33.0, 24.0, 22.0, 19.0, 13.0, 8.0, 5.0, 10.0, 10.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.09375, -34.85791015625, -33.6220703125, -32.38623046875, -31.150390625, -29.91455078125, -28.6787109375, -27.44287109375, -26.20703125, -24.97119140625, -23.7353515625, -22.49951171875, -21.263671875, -20.02783203125, -18.7919921875, -17.55615234375, -16.3203125, -15.08447265625, -13.8486328125, -12.61279296875, -11.376953125, -10.14111328125, -8.9052734375, -7.66943359375, -6.43359375, -5.19775390625, -3.9619140625, -2.72607421875, -1.490234375, -0.25439453125, 0.9814453125, 2.21728515625, 3.453125, 4.68896484375, 5.9248046875, 7.16064453125, 8.396484375, 9.63232421875, 10.8681640625, 12.10400390625, 13.33984375, 14.57568359375, 15.8115234375, 17.04736328125, 18.283203125, 19.51904296875, 20.7548828125, 21.99072265625, 23.2265625, 24.46240234375, 25.6982421875, 26.93408203125, 28.169921875, 29.40576171875, 30.6416015625, 31.87744140625, 33.11328125, 34.34912109375, 35.5849609375, 36.82080078125, 38.056640625, 39.29248046875, 40.5283203125, 41.76416015625, 43.0]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 29.0, 326.0, 536.0, 118.0, 7.0, 2.0], "bins": [-397.85980224609375, -391.2550964355469, -384.650390625, -378.04571533203125, -371.4410095214844, -364.8363037109375, -358.2315979003906, -351.62689208984375, -345.0221862792969, -338.41748046875, -331.8127746582031, -325.20806884765625, -318.6033935546875, -311.9986877441406, -305.39398193359375, -298.7892761230469, -292.1845703125, -285.5798645019531, -278.97515869140625, -272.3704833984375, -265.7657775878906, -259.16107177734375, -252.55636596679688, -245.95166015625, -239.34698486328125, -232.74227905273438, -226.13758850097656, -219.5328826904297, -212.9281768798828, -206.323486328125, -199.71878051757812, -193.11407470703125, -186.50936889648438, -179.9046630859375, -173.2999725341797, -166.6952667236328, -160.09056091308594, -153.48587036132812, -146.88116455078125, -140.27645874023438, -133.67176818847656, -127.06707000732422, -120.46236419677734, -113.857666015625, -107.25296020507812, -100.64826202392578, -94.04356384277344, -87.43885803222656, -80.83415985107422, -74.22946166992188, -67.624755859375, -61.020057678222656, -54.41535568237305, -47.81065368652344, -41.205955505371094, -34.601253509521484, -27.996551513671875, -21.391849517822266, -14.787149429321289, -8.182449340820312, -1.5777473449707031, 5.026954650878906, 11.63165283203125, 18.23635482788086, 24.84105682373047]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 12.0, 16.0, 15.0, 10.0, 7.0, 17.0, 25.0, 25.0, 28.0, 30.0, 31.0, 33.0, 47.0, 47.0, 53.0, 43.0, 48.0, 42.0, 53.0, 52.0, 43.0, 31.0, 39.0, 36.0, 38.0, 26.0, 21.0, 17.0, 27.0, 24.0, 11.0, 12.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.00276184082031, -67.91947937011719, -65.83618927001953, -63.75290298461914, -61.66961669921875, -59.58633041381836, -57.50304412841797, -55.41975784301758, -53.33647155761719, -51.2531852722168, -49.169898986816406, -47.086612701416016, -45.003326416015625, -42.920040130615234, -40.836753845214844, -38.75346755981445, -36.67018127441406, -34.58689498901367, -32.50360870361328, -30.42032241821289, -28.3370361328125, -26.25374984741211, -24.17046356201172, -22.087177276611328, -20.003890991210938, -17.920604705810547, -15.837318420410156, -13.754032135009766, -11.670745849609375, -9.587459564208984, -7.504173278808594, -5.420886993408203, -3.3376007080078125, -1.2543144226074219, 0.8289718627929688, 2.9122581481933594, 4.99554443359375, 7.078830718994141, 9.162117004394531, 11.245403289794922, 13.328689575195312, 15.411975860595703, 17.495262145996094, 19.578548431396484, 21.661834716796875, 23.745121002197266, 25.828407287597656, 27.911693572998047, 29.994979858398438, 32.07826614379883, 34.16155242919922, 36.24483871459961, 38.328125, 40.41141128540039, 42.49469757080078, 44.57798385620117, 46.66127014160156, 48.74455642700195, 50.827842712402344, 52.911128997802734, 54.994415283203125, 57.077701568603516, 59.160987854003906, 61.2442741394043, 63.32756042480469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 19.0, 26.0, 24.0, 24.0, 30.0, 38.0, 38.0, 46.0, 43.0, 60.0, 54.0, 52.0, 56.0, 74.0, 46.0, 48.0, 45.0, 49.0, 36.0, 37.0, 26.0, 29.0, 19.0, 12.0, 12.0, 14.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.44439697265625, -6.1895751953125, -5.93475341796875, -5.679931640625, -5.42510986328125, -5.1702880859375, -4.91546630859375, -4.66064453125, -4.40582275390625, -4.1510009765625, -3.89617919921875, -3.641357421875, -3.38653564453125, -3.1317138671875, -2.87689208984375, -2.6220703125, -2.36724853515625, -2.1124267578125, -1.85760498046875, -1.602783203125, -1.34796142578125, -1.0931396484375, -0.83831787109375, -0.58349609375, -0.32867431640625, -0.0738525390625, 0.18096923828125, 0.435791015625, 0.69061279296875, 0.9454345703125, 1.20025634765625, 1.455078125, 1.70989990234375, 1.9647216796875, 2.21954345703125, 2.474365234375, 2.72918701171875, 2.9840087890625, 3.23883056640625, 3.49365234375, 3.74847412109375, 4.0032958984375, 4.25811767578125, 4.512939453125, 4.76776123046875, 5.0225830078125, 5.27740478515625, 5.5322265625, 5.78704833984375, 6.0418701171875, 6.29669189453125, 6.551513671875, 6.80633544921875, 7.0611572265625, 7.31597900390625, 7.57080078125, 7.82562255859375, 8.0804443359375, 8.33526611328125, 8.590087890625, 8.84490966796875, 9.0997314453125, 9.35455322265625, 9.609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 12.0, 11.0, 14.0, 16.0, 36.0, 47.0, 59.0, 91.0, 129.0, 242.0, 396.0, 869.0, 2282.0, 8240.0, 45244.0, 334536.0, 1798135.0, 1662668.0, 290955.0, 39238.0, 7191.0, 2056.0, 803.0, 376.0, 214.0, 126.0, 75.0, 57.0, 42.0, 30.0, 24.0, 17.0, 10.0, 5.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.066162109375, -10.65576171875, -10.245361328125, -9.8349609375, -9.424560546875, -9.01416015625, -8.603759765625, -8.193359375, -7.782958984375, -7.37255859375, -6.962158203125, -6.5517578125, -6.141357421875, -5.73095703125, -5.320556640625, -4.91015625, -4.499755859375, -4.08935546875, -3.678955078125, -3.2685546875, -2.858154296875, -2.44775390625, -2.037353515625, -1.626953125, -1.216552734375, -0.80615234375, -0.395751953125, 0.0146484375, 0.425048828125, 0.83544921875, 1.245849609375, 1.65625, 2.066650390625, 2.47705078125, 2.887451171875, 3.2978515625, 3.708251953125, 4.11865234375, 4.529052734375, 4.939453125, 5.349853515625, 5.76025390625, 6.170654296875, 6.5810546875, 6.991455078125, 7.40185546875, 7.812255859375, 8.22265625, 8.633056640625, 9.04345703125, 9.453857421875, 9.8642578125, 10.274658203125, 10.68505859375, 11.095458984375, 11.505859375, 11.916259765625, 12.32666015625, 12.737060546875, 13.1474609375, 13.557861328125, 13.96826171875, 14.378662109375, 14.7890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 16.0, 12.0, 17.0, 25.0, 28.0, 28.0, 38.0, 57.0, 60.0, 84.0, 118.0, 127.0, 158.0, 252.0, 290.0, 299.0, 334.0, 363.0, 334.0, 252.0, 239.0, 174.0, 175.0, 112.0, 90.0, 62.0, 71.0, 37.0, 47.0, 35.0, 21.0, 19.0, 13.0, 15.0, 11.0, 8.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.4296875, -10.115478515625, -9.80126953125, -9.487060546875, -9.1728515625, -8.858642578125, -8.54443359375, -8.230224609375, -7.916015625, -7.601806640625, -7.28759765625, -6.973388671875, -6.6591796875, -6.344970703125, -6.03076171875, -5.716552734375, -5.40234375, -5.088134765625, -4.77392578125, -4.459716796875, -4.1455078125, -3.831298828125, -3.51708984375, -3.202880859375, -2.888671875, -2.574462890625, -2.26025390625, -1.946044921875, -1.6318359375, -1.317626953125, -1.00341796875, -0.689208984375, -0.375, -0.060791015625, 0.25341796875, 0.567626953125, 0.8818359375, 1.196044921875, 1.51025390625, 1.824462890625, 2.138671875, 2.452880859375, 2.76708984375, 3.081298828125, 3.3955078125, 3.709716796875, 4.02392578125, 4.338134765625, 4.65234375, 4.966552734375, 5.28076171875, 5.594970703125, 5.9091796875, 6.223388671875, 6.53759765625, 6.851806640625, 7.166015625, 7.480224609375, 7.79443359375, 8.108642578125, 8.4228515625, 8.737060546875, 9.05126953125, 9.365478515625, 9.6796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 16.0, 13.0, 16.0, 25.0, 32.0, 32.0, 42.0, 57.0, 69.0, 85.0, 160.0, 243.0, 389.0, 813.0, 3463.0, 58838.0, 2067139.0, 2000518.0, 57022.0, 3365.0, 816.0, 338.0, 187.0, 141.0, 101.0, 83.0, 42.0, 45.0, 32.0, 24.0, 31.0, 22.0, 8.0, 16.0, 7.0, 7.0, 3.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.25, -31.20947265625, -30.1689453125, -29.12841796875, -28.087890625, -27.04736328125, -26.0068359375, -24.96630859375, -23.92578125, -22.88525390625, -21.8447265625, -20.80419921875, -19.763671875, -18.72314453125, -17.6826171875, -16.64208984375, -15.6015625, -14.56103515625, -13.5205078125, -12.47998046875, -11.439453125, -10.39892578125, -9.3583984375, -8.31787109375, -7.27734375, -6.23681640625, -5.1962890625, -4.15576171875, -3.115234375, -2.07470703125, -1.0341796875, 0.00634765625, 1.046875, 2.08740234375, 3.1279296875, 4.16845703125, 5.208984375, 6.24951171875, 7.2900390625, 8.33056640625, 9.37109375, 10.41162109375, 11.4521484375, 12.49267578125, 13.533203125, 14.57373046875, 15.6142578125, 16.65478515625, 17.6953125, 18.73583984375, 19.7763671875, 20.81689453125, 21.857421875, 22.89794921875, 23.9384765625, 24.97900390625, 26.01953125, 27.06005859375, 28.1005859375, 29.14111328125, 30.181640625, 31.22216796875, 32.2626953125, 33.30322265625, 34.34375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 23.0, 33.0, 53.0, 105.0, 130.0, 151.0, 148.0, 112.0, 115.0, 54.0, 43.0, 15.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-98.87984466552734, -96.21894073486328, -93.55803680419922, -90.89714050292969, -88.23623657226562, -85.57533264160156, -82.9144287109375, -80.25352478027344, -77.5926284790039, -74.93172454833984, -72.27082061767578, -69.60992431640625, -66.94902038574219, -64.28811645507812, -61.62721252441406, -58.966312408447266, -56.3054084777832, -53.64450454711914, -50.983604431152344, -48.32270050048828, -45.661800384521484, -43.00089645385742, -40.339996337890625, -37.67909240722656, -35.0181884765625, -32.35728454589844, -29.69638442993164, -27.035480499267578, -24.37458038330078, -21.71367645263672, -19.05277442932129, -16.39187240600586, -13.730972290039062, -11.070070266723633, -8.409168243408203, -5.748265266418457, -3.0873632431030273, -0.42646121978759766, 2.2344417572021484, 4.895343780517578, 7.556245803833008, 10.217147827148438, 12.878049850463867, 15.538952827453613, 18.19985580444336, 20.860755920410156, 23.52165985107422, 26.18256187438965, 28.843463897705078, 31.504365921020508, 34.16526794433594, 36.826171875, 39.4870719909668, 42.14797592163086, 44.808876037597656, 47.46977996826172, 50.13068389892578, 52.791587829589844, 55.45248794555664, 58.1133918762207, 60.7742919921875, 63.43519592285156, 66.09609985351562, 68.75700378417969, 71.41790008544922]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 3.0, 5.0, 10.0, 8.0, 14.0, 14.0, 15.0, 22.0, 23.0, 25.0, 26.0, 28.0, 25.0, 34.0, 50.0, 42.0, 49.0, 50.0, 41.0, 41.0, 48.0, 37.0, 41.0, 35.0, 36.0, 26.0, 42.0, 23.0, 30.0, 22.0, 22.0, 17.0, 12.0, 11.0, 14.0, 8.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28371047973633, -38.98664093017578, -37.689571380615234, -36.39250183105469, -35.09543228149414, -33.798362731933594, -32.50129318237305, -31.2042236328125, -29.907154083251953, -28.610084533691406, -27.31301498413086, -26.015945434570312, -24.718875885009766, -23.42180633544922, -22.124736785888672, -20.827667236328125, -19.53059959411621, -18.233530044555664, -16.936460494995117, -15.63939094543457, -14.342321395874023, -13.045251846313477, -11.748183250427246, -10.4511137008667, -9.154044151306152, -7.8569746017456055, -6.559905052185059, -5.26283597946167, -3.965766429901123, -2.668696880340576, -1.3716278076171875, -0.07455825805664062, 1.2225112915039062, 2.519580841064453, 3.816650152206421, 5.113719463348389, 6.4107890129089355, 7.707858562469482, 9.004927635192871, 10.301997184753418, 11.599066734313965, 12.896136283874512, 14.193205833435059, 15.490274429321289, 16.787343978881836, 18.084413528442383, 19.38148307800293, 20.678552627563477, 21.975622177124023, 23.27269172668457, 24.569761276245117, 25.866830825805664, 27.16390037536621, 28.460969924926758, 29.758037567138672, 31.05510711669922, 32.352176666259766, 33.64924621582031, 34.94631576538086, 36.243385314941406, 37.54045486450195, 38.8375244140625, 40.13459396362305, 41.431663513183594, 42.72873306274414]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 1.0, 11.0, 7.0, 14.0, 15.0, 19.0, 26.0, 27.0, 27.0, 46.0, 51.0, 48.0, 50.0, 54.0, 51.0, 48.0, 63.0, 55.0, 63.0, 48.0, 45.0, 35.0, 39.0, 23.0, 34.0, 22.0, 20.0, 14.0, 8.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.265380859375, -6.02294921875, -5.780517578125, -5.5380859375, -5.295654296875, -5.05322265625, -4.810791015625, -4.568359375, -4.325927734375, -4.08349609375, -3.841064453125, -3.5986328125, -3.356201171875, -3.11376953125, -2.871337890625, -2.62890625, -2.386474609375, -2.14404296875, -1.901611328125, -1.6591796875, -1.416748046875, -1.17431640625, -0.931884765625, -0.689453125, -0.447021484375, -0.20458984375, 0.037841796875, 0.2802734375, 0.522705078125, 0.76513671875, 1.007568359375, 1.25, 1.492431640625, 1.73486328125, 1.977294921875, 2.2197265625, 2.462158203125, 2.70458984375, 2.947021484375, 3.189453125, 3.431884765625, 3.67431640625, 3.916748046875, 4.1591796875, 4.401611328125, 4.64404296875, 4.886474609375, 5.12890625, 5.371337890625, 5.61376953125, 5.856201171875, 6.0986328125, 6.341064453125, 6.58349609375, 6.825927734375, 7.068359375, 7.310791015625, 7.55322265625, 7.795654296875, 8.0380859375, 8.280517578125, 8.52294921875, 8.765380859375, 9.0078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 9.0, 15.0, 18.0, 31.0, 48.0, 69.0, 105.0, 184.0, 358.0, 524.0, 941.0, 1581.0, 2700.0, 4692.0, 8305.0, 14439.0, 24981.0, 42911.0, 68969.0, 104505.0, 143059.0, 166362.0, 152762.0, 115544.0, 78120.0, 48781.0, 29288.0, 16650.0, 9630.0, 5430.0, 3170.0, 1852.0, 1035.0, 598.0, 382.0, 213.0, 109.0, 68.0, 37.0, 28.0, 21.0, 15.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.03515625, -0.9990081787109375, -0.962860107421875, -0.9267120361328125, -0.89056396484375, -0.8544158935546875, -0.818267822265625, -0.7821197509765625, -0.7459716796875, -0.7098236083984375, -0.673675537109375, -0.6375274658203125, -0.60137939453125, -0.5652313232421875, -0.529083251953125, -0.4929351806640625, -0.456787109375, -0.4206390380859375, -0.384490966796875, -0.3483428955078125, -0.31219482421875, -0.2760467529296875, -0.239898681640625, -0.2037506103515625, -0.1676025390625, -0.1314544677734375, -0.095306396484375, -0.0591583251953125, -0.02301025390625, 0.0131378173828125, 0.049285888671875, 0.0854339599609375, 0.12158203125, 0.1577301025390625, 0.193878173828125, 0.2300262451171875, 0.26617431640625, 0.3023223876953125, 0.338470458984375, 0.3746185302734375, 0.4107666015625, 0.4469146728515625, 0.483062744140625, 0.5192108154296875, 0.55535888671875, 0.5915069580078125, 0.627655029296875, 0.6638031005859375, 0.699951171875, 0.7360992431640625, 0.772247314453125, 0.8083953857421875, 0.84454345703125, 0.8806915283203125, 0.916839599609375, 0.9529876708984375, 0.9891357421875, 1.0252838134765625, 1.061431884765625, 1.0975799560546875, 1.13372802734375, 1.1698760986328125, 1.206024169921875, 1.2421722412109375, 1.2783203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 11.0, 12.0, 13.0, 10.0, 6.0, 15.0, 13.0, 22.0, 19.0, 29.0, 31.0, 24.0, 29.0, 27.0, 41.0, 31.0, 31.0, 34.0, 51.0, 1069.0, 42.0, 39.0, 32.0, 53.0, 25.0, 40.0, 35.0, 27.0, 27.0, 20.0, 18.0, 18.0, 16.0, 16.0, 18.0, 13.0, 11.0, 11.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.897705078125, -4.74853515625, -4.599365234375, -4.4501953125, -4.301025390625, -4.15185546875, -4.002685546875, -3.853515625, -3.704345703125, -3.55517578125, -3.406005859375, -3.2568359375, -3.107666015625, -2.95849609375, -2.809326171875, -2.66015625, -2.510986328125, -2.36181640625, -2.212646484375, -2.0634765625, -1.914306640625, -1.76513671875, -1.615966796875, -1.466796875, -1.317626953125, -1.16845703125, -1.019287109375, -0.8701171875, -0.720947265625, -0.57177734375, -0.422607421875, -0.2734375, -0.124267578125, 0.02490234375, 0.174072265625, 0.3232421875, 0.472412109375, 0.62158203125, 0.770751953125, 0.919921875, 1.069091796875, 1.21826171875, 1.367431640625, 1.5166015625, 1.665771484375, 1.81494140625, 1.964111328125, 2.11328125, 2.262451171875, 2.41162109375, 2.560791015625, 2.7099609375, 2.859130859375, 3.00830078125, 3.157470703125, 3.306640625, 3.455810546875, 3.60498046875, 3.754150390625, 3.9033203125, 4.052490234375, 4.20166015625, 4.350830078125, 4.5]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 12.0, 20.0, 26.0, 39.0, 71.0, 105.0, 156.0, 255.0, 465.0, 788.0, 1217.0, 2175.0, 3741.0, 6935.0, 12967.0, 24334.0, 45116.0, 81900.0, 139541.0, 454561.0, 967306.0, 153697.0, 90802.0, 51067.0, 27480.0, 14598.0, 7838.0, 4216.0, 2286.0, 1424.0, 762.0, 466.0, 264.0, 178.0, 102.0, 68.0, 54.0, 32.0, 19.0, 25.0, 3.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65283203125, -0.6318359375, -0.61083984375, -0.58984375, -0.56884765625, -0.5478515625, -0.52685546875, -0.505859375, -0.48486328125, -0.4638671875, -0.44287109375, -0.421875, -0.40087890625, -0.3798828125, -0.35888671875, -0.337890625, -0.31689453125, -0.2958984375, -0.27490234375, -0.25390625, -0.23291015625, -0.2119140625, -0.19091796875, -0.169921875, -0.14892578125, -0.1279296875, -0.10693359375, -0.0859375, -0.06494140625, -0.0439453125, -0.02294921875, -0.001953125, 0.01904296875, 0.0400390625, 0.06103515625, 0.08203125, 0.10302734375, 0.1240234375, 0.14501953125, 0.166015625, 0.18701171875, 0.2080078125, 0.22900390625, 0.25, 0.27099609375, 0.2919921875, 0.31298828125, 0.333984375, 0.35498046875, 0.3759765625, 0.39697265625, 0.41796875, 0.43896484375, 0.4599609375, 0.48095703125, 0.501953125, 0.52294921875, 0.5439453125, 0.56494140625, 0.5859375, 0.60693359375, 0.6279296875, 0.64892578125, 0.669921875, 0.69091796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 3.0, 7.0, 21.0, 19.0, 20.0, 25.0, 31.0, 46.0, 58.0, 84.0, 99.0, 90.0, 96.0, 65.0, 77.0, 47.0, 28.0, 34.0, 31.0, 12.0, 16.0, 11.0, 11.0, 2.0, 8.0, 5.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15700149536132812, -0.15201568603515625, -0.14702987670898438, -0.1420440673828125, -0.13705825805664062, -0.13207244873046875, -0.12708663940429688, -0.122100830078125, -0.11711502075195312, -0.11212921142578125, -0.10714340209960938, -0.1021575927734375, -0.09717178344726562, -0.09218597412109375, -0.08720016479492188, -0.08221435546875, -0.07722854614257812, -0.07224273681640625, -0.06725692749023438, -0.0622711181640625, -0.057285308837890625, -0.05229949951171875, -0.047313690185546875, -0.042327880859375, -0.037342071533203125, -0.03235626220703125, -0.027370452880859375, -0.0223846435546875, -0.017398834228515625, -0.01241302490234375, -0.007427215576171875, -0.00244140625, 0.002544403076171875, 0.00753021240234375, 0.012516021728515625, 0.0175018310546875, 0.022487640380859375, 0.02747344970703125, 0.032459259033203125, 0.037445068359375, 0.042430877685546875, 0.04741668701171875, 0.052402496337890625, 0.0573883056640625, 0.062374114990234375, 0.06735992431640625, 0.07234573364257812, 0.07733154296875, 0.08231735229492188, 0.08730316162109375, 0.09228897094726562, 0.0972747802734375, 0.10226058959960938, 0.10724639892578125, 0.11223220825195312, 0.117218017578125, 0.12220382690429688, 0.12718963623046875, 0.13217544555664062, 0.1371612548828125, 0.14214706420898438, 0.14713287353515625, 0.15211868286132812, 0.1571044921875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 16.0, 23.0, 13.0, 23.0, 37.0, 58.0, 87.0, 132.0, 242.0, 665.0, 13542.0, 1022892.0, 9550.0, 591.0, 245.0, 139.0, 65.0, 44.0, 38.0, 19.0, 26.0, 10.0, 11.0, 8.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.229888916015625, -3.12384033203125, -3.017791748046875, -2.9117431640625, -2.805694580078125, -2.69964599609375, -2.593597412109375, -2.487548828125, -2.381500244140625, -2.27545166015625, -2.169403076171875, -2.0633544921875, -1.957305908203125, -1.85125732421875, -1.745208740234375, -1.63916015625, -1.533111572265625, -1.42706298828125, -1.321014404296875, -1.2149658203125, -1.108917236328125, -1.00286865234375, -0.896820068359375, -0.790771484375, -0.684722900390625, -0.57867431640625, -0.472625732421875, -0.3665771484375, -0.260528564453125, -0.15447998046875, -0.048431396484375, 0.0576171875, 0.163665771484375, 0.26971435546875, 0.375762939453125, 0.4818115234375, 0.587860107421875, 0.69390869140625, 0.799957275390625, 0.906005859375, 1.012054443359375, 1.11810302734375, 1.224151611328125, 1.3302001953125, 1.436248779296875, 1.54229736328125, 1.648345947265625, 1.75439453125, 1.860443115234375, 1.96649169921875, 2.072540283203125, 2.1785888671875, 2.284637451171875, 2.39068603515625, 2.496734619140625, 2.602783203125, 2.708831787109375, 2.81488037109375, 2.920928955078125, 3.0269775390625, 3.133026123046875, 3.23907470703125, 3.345123291015625, 3.451171875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 21.0, 43.0, 93.0, 359.0, 369.0, 84.0, 17.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45485252141952515, -0.4172830283641815, -0.3797135651111603, -0.34214407205581665, -0.3045746088027954, -0.2670051157474518, -0.22943562269210815, -0.19186615943908691, -0.1542966663837433, -0.11672718822956085, -0.07915770262479782, -0.04158821702003479, -0.004018738865852356, 0.03355073928833008, 0.0711202323436737, 0.10868969559669495, 0.14625918865203857, 0.183828666806221, 0.22139814496040344, 0.25896763801574707, 0.2965371012687683, 0.33410659432411194, 0.37167608737945557, 0.4092455506324768, 0.44681504368782043, 0.48438453674316406, 0.5219539999961853, 0.5595234632492065, 0.5970929861068726, 0.6346624493598938, 0.672231912612915, 0.709801435470581, 0.7473709583282471, 0.7849404215812683, 0.8225099444389343, 0.8600794076919556, 0.8976488709449768, 0.935218334197998, 0.9727878570556641, 1.01035737991333, 1.0479267835617065, 1.0854963064193726, 1.123065710067749, 1.160635232925415, 1.198204755783081, 1.2357741594314575, 1.2733436822891235, 1.3109130859375, 1.348482608795166, 1.386052131652832, 1.4236215353012085, 1.4611910581588745, 1.4987605810165405, 1.536329984664917, 1.573899507522583, 1.611469030380249, 1.649038553237915, 1.686608076095581, 1.7241774797439575, 1.7617470026016235, 1.7993165254592896, 1.836885929107666, 1.874455451965332, 1.912024974822998, 1.9495943784713745]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 10.0, 6.0, 17.0, 11.0, 17.0, 17.0, 16.0, 22.0, 32.0, 29.0, 31.0, 33.0, 28.0, 37.0, 51.0, 56.0, 34.0, 48.0, 56.0, 54.0, 47.0, 35.0, 37.0, 39.0, 30.0, 35.0, 27.0, 28.0, 22.0, 21.0, 12.0, 18.0, 11.0, 5.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28441178798675537, -0.27548426389694214, -0.2665567100048065, -0.2576291859149933, -0.24870163202285767, -0.23977410793304443, -0.23084656894207, -0.22191902995109558, -0.21299149096012115, -0.20406395196914673, -0.1951364129781723, -0.18620887398719788, -0.17728134989738464, -0.16835379600524902, -0.1594262719154358, -0.15049873292446136, -0.14157119393348694, -0.1326436549425125, -0.12371611595153809, -0.11478858441114426, -0.10586104542016983, -0.0969335064291954, -0.08800597488880157, -0.07907843589782715, -0.07015089690685272, -0.061223357915878296, -0.05229582265019417, -0.04336828738451004, -0.034440748393535614, -0.025513209402561188, -0.01658567413687706, -0.007658138871192932, 0.0012694001197814941, 0.010196937248110771, 0.019124474376440048, 0.028052011504769325, 0.0369795486330986, 0.04590708762407303, 0.054834622889757156, 0.06376215815544128, 0.07268969714641571, 0.08161723613739014, 0.09054477512836456, 0.09947230666875839, 0.10839984565973282, 0.11732738465070724, 0.12625491619110107, 0.1351824551820755, 0.14410999417304993, 0.15303753316402435, 0.16196507215499878, 0.1708926111459732, 0.17982015013694763, 0.18874767422676086, 0.1976752132177353, 0.20660275220870972, 0.21553029119968414, 0.22445783019065857, 0.233385369181633, 0.24231290817260742, 0.25124043226242065, 0.2601679861545563, 0.2690955102443695, 0.2780230641365051, 0.28695058822631836]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 8.0, 10.0, 18.0, 17.0, 25.0, 28.0, 35.0, 48.0, 51.0, 50.0, 49.0, 65.0, 43.0, 65.0, 70.0, 63.0, 55.0, 58.0, 39.0, 48.0, 29.0, 30.0, 16.0, 20.0, 18.0, 15.0, 9.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.0172119140625, -6.753173828125, -6.4891357421875, -6.22509765625, -5.9610595703125, -5.697021484375, -5.4329833984375, -5.1689453125, -4.9049072265625, -4.640869140625, -4.3768310546875, -4.11279296875, -3.8487548828125, -3.584716796875, -3.3206787109375, -3.056640625, -2.7926025390625, -2.528564453125, -2.2645263671875, -2.00048828125, -1.7364501953125, -1.472412109375, -1.2083740234375, -0.9443359375, -0.6802978515625, -0.416259765625, -0.1522216796875, 0.11181640625, 0.3758544921875, 0.639892578125, 0.9039306640625, 1.16796875, 1.4320068359375, 1.696044921875, 1.9600830078125, 2.22412109375, 2.4881591796875, 2.752197265625, 3.0162353515625, 3.2802734375, 3.5443115234375, 3.808349609375, 4.0723876953125, 4.33642578125, 4.6004638671875, 4.864501953125, 5.1285400390625, 5.392578125, 5.6566162109375, 5.920654296875, 6.1846923828125, 6.44873046875, 6.7127685546875, 6.976806640625, 7.2408447265625, 7.5048828125, 7.7689208984375, 8.032958984375, 8.2969970703125, 8.56103515625, 8.8250732421875, 9.089111328125, 9.3531494140625, 9.6171875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 6.0, 14.0, 14.0, 21.0, 35.0, 52.0, 88.0, 149.0, 280.0, 503.0, 911.0, 1817.0, 3777.0, 7944.0, 16462.0, 36821.0, 82263.0, 197603.0, 344769.0, 201091.0, 84473.0, 36954.0, 16784.0, 7923.0, 3778.0, 1881.0, 973.0, 484.0, 255.0, 154.0, 91.0, 58.0, 44.0, 25.0, 17.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.28125, -7.0501708984375, -6.819091796875, -6.5880126953125, -6.35693359375, -6.1258544921875, -5.894775390625, -5.6636962890625, -5.4326171875, -5.2015380859375, -4.970458984375, -4.7393798828125, -4.50830078125, -4.2772216796875, -4.046142578125, -3.8150634765625, -3.583984375, -3.3529052734375, -3.121826171875, -2.8907470703125, -2.65966796875, -2.4285888671875, -2.197509765625, -1.9664306640625, -1.7353515625, -1.5042724609375, -1.273193359375, -1.0421142578125, -0.81103515625, -0.5799560546875, -0.348876953125, -0.1177978515625, 0.11328125, 0.3443603515625, 0.575439453125, 0.8065185546875, 1.03759765625, 1.2686767578125, 1.499755859375, 1.7308349609375, 1.9619140625, 2.1929931640625, 2.424072265625, 2.6551513671875, 2.88623046875, 3.1173095703125, 3.348388671875, 3.5794677734375, 3.810546875, 4.0416259765625, 4.272705078125, 4.5037841796875, 4.73486328125, 4.9659423828125, 5.197021484375, 5.4281005859375, 5.6591796875, 5.8902587890625, 6.121337890625, 6.3524169921875, 6.58349609375, 6.8145751953125, 7.045654296875, 7.2767333984375, 7.5078125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 9.0, 8.0, 12.0, 12.0, 17.0, 12.0, 22.0, 23.0, 36.0, 36.0, 31.0, 49.0, 49.0, 52.0, 86.0, 167.0, 324.0, 1375.0, 203.0, 101.0, 68.0, 68.0, 35.0, 38.0, 39.0, 33.0, 26.0, 23.0, 20.0, 19.0, 14.0, 11.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.65625, -23.933349609375, -23.21044921875, -22.487548828125, -21.7646484375, -21.041748046875, -20.31884765625, -19.595947265625, -18.873046875, -18.150146484375, -17.42724609375, -16.704345703125, -15.9814453125, -15.258544921875, -14.53564453125, -13.812744140625, -13.08984375, -12.366943359375, -11.64404296875, -10.921142578125, -10.1982421875, -9.475341796875, -8.75244140625, -8.029541015625, -7.306640625, -6.583740234375, -5.86083984375, -5.137939453125, -4.4150390625, -3.692138671875, -2.96923828125, -2.246337890625, -1.5234375, -0.800537109375, -0.07763671875, 0.645263671875, 1.3681640625, 2.091064453125, 2.81396484375, 3.536865234375, 4.259765625, 4.982666015625, 5.70556640625, 6.428466796875, 7.1513671875, 7.874267578125, 8.59716796875, 9.320068359375, 10.04296875, 10.765869140625, 11.48876953125, 12.211669921875, 12.9345703125, 13.657470703125, 14.38037109375, 15.103271484375, 15.826171875, 16.549072265625, 17.27197265625, 17.994873046875, 18.7177734375, 19.440673828125, 20.16357421875, 20.886474609375, 21.609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 13.0, 15.0, 31.0, 31.0, 59.0, 65.0, 84.0, 146.0, 238.0, 313.0, 537.0, 1461.0, 68544.0, 3046916.0, 24732.0, 1069.0, 462.0, 283.0, 189.0, 125.0, 82.0, 73.0, 54.0, 33.0, 25.0, 20.0, 13.0, 10.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-64.125, -62.26123046875, -60.3974609375, -58.53369140625, -56.669921875, -54.80615234375, -52.9423828125, -51.07861328125, -49.21484375, -47.35107421875, -45.4873046875, -43.62353515625, -41.759765625, -39.89599609375, -38.0322265625, -36.16845703125, -34.3046875, -32.44091796875, -30.5771484375, -28.71337890625, -26.849609375, -24.98583984375, -23.1220703125, -21.25830078125, -19.39453125, -17.53076171875, -15.6669921875, -13.80322265625, -11.939453125, -10.07568359375, -8.2119140625, -6.34814453125, -4.484375, -2.62060546875, -0.7568359375, 1.10693359375, 2.970703125, 4.83447265625, 6.6982421875, 8.56201171875, 10.42578125, 12.28955078125, 14.1533203125, 16.01708984375, 17.880859375, 19.74462890625, 21.6083984375, 23.47216796875, 25.3359375, 27.19970703125, 29.0634765625, 30.92724609375, 32.791015625, 34.65478515625, 36.5185546875, 38.38232421875, 40.24609375, 42.10986328125, 43.9736328125, 45.83740234375, 47.701171875, 49.56494140625, 51.4287109375, 53.29248046875, 55.15625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 24.0, 818.0, 172.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65788650512695, -20.38923454284668, -8.120582580566406, 4.148067474365234, 16.41672134399414, 28.685375213623047, 40.95402145385742, 53.22267532348633, 65.4913330078125, 77.7599868774414, 90.02864074707031, 102.29728698730469, 114.5659408569336, 126.8345947265625, 139.10324096679688, 151.37188720703125, 163.6405487060547, 175.90919494628906, 188.1778564453125, 200.44650268554688, 212.71514892578125, 224.9838104248047, 237.25245666503906, 249.5211181640625, 261.7897644042969, 274.05841064453125, 286.3270568847656, 298.595703125, 310.8643798828125, 323.1330261230469, 335.40167236328125, 347.6703186035156, 359.93896484375, 372.2076110839844, 384.47625732421875, 396.74493408203125, 409.0135803222656, 421.2822265625, 433.5508728027344, 445.81951904296875, 458.08819580078125, 470.3568420410156, 482.62548828125, 494.8941650390625, 507.1628112792969, 519.4314575195312, 531.7000732421875, 543.96875, 556.2374267578125, 568.506103515625, 580.7747192382812, 593.0433959960938, 605.31201171875, 617.5806884765625, 629.849365234375, 642.1179809570312, 654.3865966796875, 666.6552734375, 678.9238891601562, 691.1925659179688, 703.461181640625, 715.7298583984375, 727.99853515625, 740.2671508789062, 752.5358276367188]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 5.0, 6.0, 6.0, 8.0, 7.0, 15.0, 13.0, 14.0, 16.0, 26.0, 23.0, 19.0, 23.0, 29.0, 26.0, 31.0, 36.0, 35.0, 31.0, 31.0, 35.0, 20.0, 41.0, 39.0, 44.0, 43.0, 31.0, 36.0, 35.0, 33.0, 37.0, 26.0, 27.0, 27.0, 18.0, 23.0, 7.0, 15.0, 12.0, 11.0, 6.0, 4.0, 4.0, 5.0, 5.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-50.81249237060547, -49.29574203491211, -47.778987884521484, -46.262237548828125, -44.7454833984375, -43.22873306274414, -41.71198272705078, -40.195228576660156, -38.6784782409668, -37.16172790527344, -35.64497375488281, -34.12822341918945, -32.611473083496094, -31.09471893310547, -29.57796859741211, -28.061216354370117, -26.544464111328125, -25.027711868286133, -23.51095962524414, -21.99420928955078, -20.47745704650879, -18.960704803466797, -17.443954467773438, -15.927202224731445, -14.410449981689453, -12.893697738647461, -11.376946449279785, -9.86019515991211, -8.343442916870117, -6.826691150665283, -5.309939384460449, -3.7931880950927734, -2.276439666748047, -0.7596879005432129, 0.7570638656616211, 2.273815631866455, 3.790567398071289, 5.307319164276123, 6.824070930480957, 8.340822219848633, 9.857574462890625, 11.374326705932617, 12.891077995300293, 14.407829284667969, 15.924581527709961, 17.441333770751953, 18.958084106445312, 20.474836349487305, 21.991588592529297, 23.50834083557129, 25.02509307861328, 26.54184341430664, 28.058595657348633, 29.575347900390625, 31.092098236083984, 32.608848571777344, 34.12560272216797, 35.64235305786133, 37.15910720825195, 38.67585754394531, 40.19261169433594, 41.7093620300293, 43.226112365722656, 44.74286651611328, 46.25961685180664]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 8.0, 11.0, 13.0, 23.0, 22.0, 20.0, 28.0, 42.0, 30.0, 39.0, 39.0, 50.0, 51.0, 52.0, 55.0, 60.0, 56.0, 53.0, 52.0, 37.0, 49.0, 28.0, 28.0, 26.0, 24.0, 18.0, 26.0, 12.0, 17.0, 9.0, 4.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.7655029296875, -7.507568359375, -7.2496337890625, -6.99169921875, -6.7337646484375, -6.475830078125, -6.2178955078125, -5.9599609375, -5.7020263671875, -5.444091796875, -5.1861572265625, -4.92822265625, -4.6702880859375, -4.412353515625, -4.1544189453125, -3.896484375, -3.6385498046875, -3.380615234375, -3.1226806640625, -2.86474609375, -2.6068115234375, -2.348876953125, -2.0909423828125, -1.8330078125, -1.5750732421875, -1.317138671875, -1.0592041015625, -0.80126953125, -0.5433349609375, -0.285400390625, -0.0274658203125, 0.23046875, 0.4884033203125, 0.746337890625, 1.0042724609375, 1.26220703125, 1.5201416015625, 1.778076171875, 2.0360107421875, 2.2939453125, 2.5518798828125, 2.809814453125, 3.0677490234375, 3.32568359375, 3.5836181640625, 3.841552734375, 4.0994873046875, 4.357421875, 4.6153564453125, 4.873291015625, 5.1312255859375, 5.38916015625, 5.6470947265625, 5.905029296875, 6.1629638671875, 6.4208984375, 6.6788330078125, 6.936767578125, 7.1947021484375, 7.45263671875, 7.7105712890625, 7.968505859375, 8.2264404296875, 8.484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 9.0, 20.0, 21.0, 27.0, 33.0, 37.0, 66.0, 104.0, 130.0, 190.0, 309.0, 537.0, 949.0, 1774.0, 3907.0, 9828.0, 29858.0, 107216.0, 404281.0, 1221444.0, 1531721.0, 634535.0, 175435.0, 47522.0, 14407.0, 5189.0, 2159.0, 1027.0, 568.0, 325.0, 189.0, 126.0, 81.0, 82.0, 37.0, 38.0, 31.0, 18.0, 10.0, 11.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.546875, -9.2591552734375, -8.971435546875, -8.6837158203125, -8.39599609375, -8.1082763671875, -7.820556640625, -7.5328369140625, -7.2451171875, -6.9573974609375, -6.669677734375, -6.3819580078125, -6.09423828125, -5.8065185546875, -5.518798828125, -5.2310791015625, -4.943359375, -4.6556396484375, -4.367919921875, -4.0802001953125, -3.79248046875, -3.5047607421875, -3.217041015625, -2.9293212890625, -2.6416015625, -2.3538818359375, -2.066162109375, -1.7784423828125, -1.49072265625, -1.2030029296875, -0.915283203125, -0.6275634765625, -0.33984375, -0.0521240234375, 0.235595703125, 0.5233154296875, 0.81103515625, 1.0987548828125, 1.386474609375, 1.6741943359375, 1.9619140625, 2.2496337890625, 2.537353515625, 2.8250732421875, 3.11279296875, 3.4005126953125, 3.688232421875, 3.9759521484375, 4.263671875, 4.5513916015625, 4.839111328125, 5.1268310546875, 5.41455078125, 5.7022705078125, 5.989990234375, 6.2777099609375, 6.5654296875, 6.8531494140625, 7.140869140625, 7.4285888671875, 7.71630859375, 8.0040283203125, 8.291748046875, 8.5794677734375, 8.8671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 14.0, 23.0, 20.0, 26.0, 34.0, 47.0, 35.0, 71.0, 100.0, 124.0, 172.0, 224.0, 299.0, 355.0, 385.0, 384.0, 361.0, 329.0, 249.0, 188.0, 134.0, 110.0, 95.0, 75.0, 46.0, 36.0, 33.0, 17.0, 26.0, 11.0, 9.0, 13.0, 7.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.5390625, -10.1514892578125, -9.763916015625, -9.3763427734375, -8.98876953125, -8.6011962890625, -8.213623046875, -7.8260498046875, -7.4384765625, -7.0509033203125, -6.663330078125, -6.2757568359375, -5.88818359375, -5.5006103515625, -5.113037109375, -4.7254638671875, -4.337890625, -3.9503173828125, -3.562744140625, -3.1751708984375, -2.78759765625, -2.4000244140625, -2.012451171875, -1.6248779296875, -1.2373046875, -0.8497314453125, -0.462158203125, -0.0745849609375, 0.31298828125, 0.7005615234375, 1.088134765625, 1.4757080078125, 1.86328125, 2.2508544921875, 2.638427734375, 3.0260009765625, 3.41357421875, 3.8011474609375, 4.188720703125, 4.5762939453125, 4.9638671875, 5.3514404296875, 5.739013671875, 6.1265869140625, 6.51416015625, 6.9017333984375, 7.289306640625, 7.6768798828125, 8.064453125, 8.4520263671875, 8.839599609375, 9.2271728515625, 9.61474609375, 10.0023193359375, 10.389892578125, 10.7774658203125, 11.1650390625, 11.5526123046875, 11.940185546875, 12.3277587890625, 12.71533203125, 13.1029052734375, 13.490478515625, 13.8780517578125, 14.265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 8.0, 10.0, 12.0, 13.0, 19.0, 25.0, 22.0, 31.0, 41.0, 75.0, 96.0, 125.0, 162.0, 236.0, 402.0, 1402.0, 22159.0, 1268484.0, 2833620.0, 63275.0, 2597.0, 542.0, 295.0, 176.0, 122.0, 86.0, 51.0, 51.0, 35.0, 26.0, 25.0, 18.0, 17.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.90625, -43.66357421875, -42.4208984375, -41.17822265625, -39.935546875, -38.69287109375, -37.4501953125, -36.20751953125, -34.96484375, -33.72216796875, -32.4794921875, -31.23681640625, -29.994140625, -28.75146484375, -27.5087890625, -26.26611328125, -25.0234375, -23.78076171875, -22.5380859375, -21.29541015625, -20.052734375, -18.81005859375, -17.5673828125, -16.32470703125, -15.08203125, -13.83935546875, -12.5966796875, -11.35400390625, -10.111328125, -8.86865234375, -7.6259765625, -6.38330078125, -5.140625, -3.89794921875, -2.6552734375, -1.41259765625, -0.169921875, 1.07275390625, 2.3154296875, 3.55810546875, 4.80078125, 6.04345703125, 7.2861328125, 8.52880859375, 9.771484375, 11.01416015625, 12.2568359375, 13.49951171875, 14.7421875, 15.98486328125, 17.2275390625, 18.47021484375, 19.712890625, 20.95556640625, 22.1982421875, 23.44091796875, 24.68359375, 25.92626953125, 27.1689453125, 28.41162109375, 29.654296875, 30.89697265625, 32.1396484375, 33.38232421875, 34.625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 19.0, 30.0, 35.0, 68.0, 84.0, 104.0, 127.0, 114.0, 98.0, 86.0, 80.0, 40.0, 44.0, 30.0, 15.0, 4.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.15153121948242, -61.11180114746094, -59.07207107543945, -57.03234100341797, -54.992610931396484, -52.952880859375, -50.913150787353516, -48.87342071533203, -46.83369064331055, -44.79396057128906, -42.75423049926758, -40.714500427246094, -38.67477035522461, -36.635040283203125, -34.59531021118164, -32.555580139160156, -30.515850067138672, -28.476119995117188, -26.436389923095703, -24.39665985107422, -22.356929779052734, -20.31719970703125, -18.277469635009766, -16.23773956298828, -14.198009490966797, -12.158279418945312, -10.118549346923828, -8.078819274902344, -6.039089202880859, -3.999359130859375, -1.9596290588378906, 0.08010101318359375, 2.1198348999023438, 4.159564971923828, 6.1992950439453125, 8.239025115966797, 10.278755187988281, 12.318485260009766, 14.35821533203125, 16.397945404052734, 18.43767547607422, 20.477405548095703, 22.517135620117188, 24.556865692138672, 26.596595764160156, 28.63632583618164, 30.676055908203125, 32.71578598022461, 34.755516052246094, 36.79524612426758, 38.83497619628906, 40.87470626831055, 42.91443634033203, 44.954166412353516, 46.993896484375, 49.033626556396484, 51.07335662841797, 53.11308670043945, 55.15281677246094, 57.19254684448242, 59.232276916503906, 61.27200698852539, 63.311737060546875, 65.35147094726562, 67.39119720458984]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 4.0, 8.0, 15.0, 14.0, 10.0, 17.0, 28.0, 32.0, 24.0, 26.0, 31.0, 40.0, 40.0, 37.0, 48.0, 35.0, 45.0, 38.0, 39.0, 50.0, 45.0, 32.0, 43.0, 41.0, 38.0, 32.0, 29.0, 18.0, 21.0, 23.0, 19.0, 16.0, 11.0, 12.0, 5.0, 10.0, 0.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.09914779663086, -39.69208526611328, -38.28502655029297, -36.87796401977539, -35.47090148925781, -34.063838958740234, -32.656776428222656, -31.249717712402344, -29.842655181884766, -28.435592651367188, -27.028532028198242, -25.621471405029297, -24.21440887451172, -22.80734634399414, -21.400285720825195, -19.99322509765625, -18.586162567138672, -17.179100036621094, -15.772039413452148, -14.364977836608887, -12.957916259765625, -11.550854682922363, -10.143793106079102, -8.73673152923584, -7.329669952392578, -5.922608375549316, -4.515546798706055, -3.108485221862793, -1.7014236450195312, -0.29436206817626953, 1.1126995086669922, 2.519761085510254, 3.9268264770507812, 5.333888053894043, 6.740949630737305, 8.148011207580566, 9.555072784423828, 10.96213436126709, 12.369195938110352, 13.776257514953613, 15.183319091796875, 16.590381622314453, 17.9974422454834, 19.404502868652344, 20.811565399169922, 22.2186279296875, 23.625688552856445, 25.03274917602539, 26.43981170654297, 27.846874237060547, 29.253934860229492, 30.660995483398438, 32.068058013916016, 33.475120544433594, 34.882179260253906, 36.289241790771484, 37.69630432128906, 39.10336685180664, 40.51042938232422, 41.91748809814453, 43.32455062866211, 44.73161315917969, 46.138671875, 47.54573440551758, 48.952796936035156]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 6.0, 9.0, 7.0, 16.0, 15.0, 19.0, 33.0, 24.0, 34.0, 55.0, 43.0, 39.0, 55.0, 49.0, 62.0, 51.0, 54.0, 49.0, 49.0, 47.0, 38.0, 42.0, 39.0, 36.0, 29.0, 15.0, 22.0, 9.0, 8.0, 8.0, 7.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.573486328125, -7.33447265625, -7.095458984375, -6.8564453125, -6.617431640625, -6.37841796875, -6.139404296875, -5.900390625, -5.661376953125, -5.42236328125, -5.183349609375, -4.9443359375, -4.705322265625, -4.46630859375, -4.227294921875, -3.98828125, -3.749267578125, -3.51025390625, -3.271240234375, -3.0322265625, -2.793212890625, -2.55419921875, -2.315185546875, -2.076171875, -1.837158203125, -1.59814453125, -1.359130859375, -1.1201171875, -0.881103515625, -0.64208984375, -0.403076171875, -0.1640625, 0.074951171875, 0.31396484375, 0.552978515625, 0.7919921875, 1.031005859375, 1.27001953125, 1.509033203125, 1.748046875, 1.987060546875, 2.22607421875, 2.465087890625, 2.7041015625, 2.943115234375, 3.18212890625, 3.421142578125, 3.66015625, 3.899169921875, 4.13818359375, 4.377197265625, 4.6162109375, 4.855224609375, 5.09423828125, 5.333251953125, 5.572265625, 5.811279296875, 6.05029296875, 6.289306640625, 6.5283203125, 6.767333984375, 7.00634765625, 7.245361328125, 7.484375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 11.0, 21.0, 15.0, 44.0, 52.0, 90.0, 131.0, 198.0, 355.0, 565.0, 861.0, 1485.0, 2407.0, 3835.0, 6260.0, 10563.0, 17031.0, 27732.0, 43651.0, 66969.0, 97558.0, 129364.0, 151000.0, 143828.0, 114872.0, 82928.0, 54779.0, 34992.0, 21927.0, 13630.0, 8317.0, 4979.0, 3136.0, 1847.0, 1170.0, 653.0, 483.0, 300.0, 172.0, 118.0, 83.0, 57.0, 27.0, 21.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.111328125, -1.0793609619140625, -1.047393798828125, -1.0154266357421875, -0.98345947265625, -0.9514923095703125, -0.919525146484375, -0.8875579833984375, -0.8555908203125, -0.8236236572265625, -0.791656494140625, -0.7596893310546875, -0.72772216796875, -0.6957550048828125, -0.663787841796875, -0.6318206787109375, -0.599853515625, -0.5678863525390625, -0.535919189453125, -0.5039520263671875, -0.47198486328125, -0.4400177001953125, -0.408050537109375, -0.3760833740234375, -0.3441162109375, -0.3121490478515625, -0.280181884765625, -0.2482147216796875, -0.21624755859375, -0.1842803955078125, -0.152313232421875, -0.1203460693359375, -0.08837890625, -0.0564117431640625, -0.024444580078125, 0.0075225830078125, 0.03948974609375, 0.0714569091796875, 0.103424072265625, 0.1353912353515625, 0.1673583984375, 0.1993255615234375, 0.231292724609375, 0.2632598876953125, 0.29522705078125, 0.3271942138671875, 0.359161376953125, 0.3911285400390625, 0.423095703125, 0.4550628662109375, 0.487030029296875, 0.5189971923828125, 0.55096435546875, 0.5829315185546875, 0.614898681640625, 0.6468658447265625, 0.6788330078125, 0.7108001708984375, 0.742767333984375, 0.7747344970703125, 0.80670166015625, 0.8386688232421875, 0.870635986328125, 0.9026031494140625, 0.9345703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 7.0, 8.0, 9.0, 18.0, 16.0, 16.0, 24.0, 32.0, 39.0, 32.0, 31.0, 30.0, 41.0, 45.0, 39.0, 54.0, 41.0, 1056.0, 53.0, 46.0, 52.0, 46.0, 44.0, 35.0, 31.0, 35.0, 27.0, 29.0, 23.0, 10.0, 8.0, 13.0, 8.0, 6.0, 11.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.9605712890625, -4.784423828125, -4.6082763671875, -4.43212890625, -4.2559814453125, -4.079833984375, -3.9036865234375, -3.7275390625, -3.5513916015625, -3.375244140625, -3.1990966796875, -3.02294921875, -2.8468017578125, -2.670654296875, -2.4945068359375, -2.318359375, -2.1422119140625, -1.966064453125, -1.7899169921875, -1.61376953125, -1.4376220703125, -1.261474609375, -1.0853271484375, -0.9091796875, -0.7330322265625, -0.556884765625, -0.3807373046875, -0.20458984375, -0.0284423828125, 0.147705078125, 0.3238525390625, 0.5, 0.6761474609375, 0.852294921875, 1.0284423828125, 1.20458984375, 1.3807373046875, 1.556884765625, 1.7330322265625, 1.9091796875, 2.0853271484375, 2.261474609375, 2.4376220703125, 2.61376953125, 2.7899169921875, 2.966064453125, 3.1422119140625, 3.318359375, 3.4945068359375, 3.670654296875, 3.8468017578125, 4.02294921875, 4.1990966796875, 4.375244140625, 4.5513916015625, 4.7275390625, 4.9036865234375, 5.079833984375, 5.2559814453125, 5.43212890625, 5.6082763671875, 5.784423828125, 5.9605712890625, 6.13671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 14.0, 14.0, 25.0, 51.0, 48.0, 103.0, 124.0, 210.0, 386.0, 634.0, 1126.0, 1777.0, 3401.0, 5948.0, 11126.0, 20995.0, 39932.0, 73348.0, 125665.0, 232776.0, 1201955.0, 158967.0, 98995.0, 55482.0, 29334.0, 15662.0, 8468.0, 4460.0, 2544.0, 1437.0, 821.0, 501.0, 289.0, 173.0, 102.0, 74.0, 45.0, 42.0, 27.0, 18.0, 9.0, 2.0, 6.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6166229248046875, -0.595550537109375, -0.5744781494140625, -0.55340576171875, -0.5323333740234375, -0.511260986328125, -0.4901885986328125, -0.4691162109375, -0.4480438232421875, -0.426971435546875, -0.4058990478515625, -0.38482666015625, -0.3637542724609375, -0.342681884765625, -0.3216094970703125, -0.300537109375, -0.2794647216796875, -0.258392333984375, -0.2373199462890625, -0.21624755859375, -0.1951751708984375, -0.174102783203125, -0.1530303955078125, -0.1319580078125, -0.1108856201171875, -0.089813232421875, -0.0687408447265625, -0.04766845703125, -0.0265960693359375, -0.005523681640625, 0.0155487060546875, 0.03662109375, 0.0576934814453125, 0.078765869140625, 0.0998382568359375, 0.12091064453125, 0.1419830322265625, 0.163055419921875, 0.1841278076171875, 0.2052001953125, 0.2262725830078125, 0.247344970703125, 0.2684173583984375, 0.28948974609375, 0.3105621337890625, 0.331634521484375, 0.3527069091796875, 0.373779296875, 0.3948516845703125, 0.415924072265625, 0.4369964599609375, 0.45806884765625, 0.4791412353515625, 0.500213623046875, 0.5212860107421875, 0.5423583984375, 0.5634307861328125, 0.584503173828125, 0.6055755615234375, 0.62664794921875, 0.6477203369140625, 0.668792724609375, 0.6898651123046875, 0.7109375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 12.0, 16.0, 12.0, 17.0, 23.0, 26.0, 34.0, 56.0, 57.0, 89.0, 109.0, 111.0, 118.0, 71.0, 57.0, 43.0, 35.0, 16.0, 17.0, 18.0, 7.0, 12.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10107421875, -0.09827804565429688, -0.09548187255859375, -0.09268569946289062, -0.0898895263671875, -0.08709335327148438, -0.08429718017578125, -0.08150100708007812, -0.078704833984375, -0.07590866088867188, -0.07311248779296875, -0.07031631469726562, -0.0675201416015625, -0.06472396850585938, -0.06192779541015625, -0.059131622314453125, -0.05633544921875, -0.053539276123046875, -0.05074310302734375, -0.047946929931640625, -0.0451507568359375, -0.042354583740234375, -0.03955841064453125, -0.036762237548828125, -0.033966064453125, -0.031169891357421875, -0.02837371826171875, -0.025577545166015625, -0.0227813720703125, -0.019985198974609375, -0.01718902587890625, -0.014392852783203125, -0.0115966796875, -0.008800506591796875, -0.00600433349609375, -0.003208160400390625, -0.0004119873046875, 0.002384185791015625, 0.00518035888671875, 0.007976531982421875, 0.010772705078125, 0.013568878173828125, 0.01636505126953125, 0.019161224365234375, 0.0219573974609375, 0.024753570556640625, 0.02754974365234375, 0.030345916748046875, 0.03314208984375, 0.035938262939453125, 0.03873443603515625, 0.041530609130859375, 0.0443267822265625, 0.047122955322265625, 0.04991912841796875, 0.052715301513671875, 0.055511474609375, 0.058307647705078125, 0.06110382080078125, 0.06389999389648438, 0.0666961669921875, 0.06949234008789062, 0.07228851318359375, 0.07508468627929688, 0.077880859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 11.0, 11.0, 16.0, 34.0, 32.0, 64.0, 89.0, 164.0, 583.0, 8560.0, 1004212.0, 33074.0, 1187.0, 196.0, 94.0, 55.0, 39.0, 16.0, 21.0, 20.0, 16.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0], "bins": [-1.7392578125, -1.6763763427734375, -1.613494873046875, -1.5506134033203125, -1.48773193359375, -1.4248504638671875, -1.361968994140625, -1.2990875244140625, -1.2362060546875, -1.1733245849609375, -1.110443115234375, -1.0475616455078125, -0.98468017578125, -0.9217987060546875, -0.858917236328125, -0.7960357666015625, -0.733154296875, -0.6702728271484375, -0.607391357421875, -0.5445098876953125, -0.48162841796875, -0.4187469482421875, -0.355865478515625, -0.2929840087890625, -0.2301025390625, -0.1672210693359375, -0.104339599609375, -0.0414581298828125, 0.02142333984375, 0.0843048095703125, 0.147186279296875, 0.2100677490234375, 0.27294921875, 0.3358306884765625, 0.398712158203125, 0.4615936279296875, 0.52447509765625, 0.5873565673828125, 0.650238037109375, 0.7131195068359375, 0.7760009765625, 0.8388824462890625, 0.901763916015625, 0.9646453857421875, 1.02752685546875, 1.0904083251953125, 1.153289794921875, 1.2161712646484375, 1.279052734375, 1.3419342041015625, 1.404815673828125, 1.4676971435546875, 1.53057861328125, 1.5934600830078125, 1.656341552734375, 1.7192230224609375, 1.7821044921875, 1.8449859619140625, 1.907867431640625, 1.9707489013671875, 2.03363037109375, 2.0965118408203125, 2.159393310546875, 2.2222747802734375, 2.28515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 13.0, 31.0, 149.0, 484.0, 276.0, 49.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6079012751579285, -0.5811535716056824, -0.554405927658081, -0.527658224105835, -0.5009105205535889, -0.47416284680366516, -0.44741517305374146, -0.42066746950149536, -0.39391979575157166, -0.36717212200164795, -0.34042441844940186, -0.31367674469947815, -0.28692907094955444, -0.26018136739730835, -0.23343369364738464, -0.20668600499629974, -0.17993831634521484, -0.15319062769412994, -0.12644293904304504, -0.09969526529312134, -0.07294757664203644, -0.04619988799095154, -0.019452214241027832, 0.007295474410057068, 0.03404316306114197, 0.06079084798693657, 0.08753853291273117, 0.11428621411323547, 0.14103390276432037, 0.16778159141540527, 0.19452926516532898, 0.22127695381641388, 0.248024582862854, 0.2747722566127777, 0.3015199601650238, 0.3282676339149475, 0.3550153374671936, 0.3817630112171173, 0.408510684967041, 0.4352583885192871, 0.4620060622692108, 0.4887537360191345, 0.5155014395713806, 0.5422490835189819, 0.568996787071228, 0.5957444906234741, 0.6224921941757202, 0.6492398381233215, 0.6759875416755676, 0.7027352452278137, 0.729482889175415, 0.7562305927276611, 0.7829782962799072, 0.8097259998321533, 0.8364736437797546, 0.8632213473320007, 0.889968991279602, 0.9167166948318481, 0.9434643387794495, 0.9702120423316956, 0.9969597458839417, 1.023707389831543, 1.050455093383789, 1.0772027969360352, 1.1039505004882812]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 11.0, 4.0, 6.0, 11.0, 11.0, 5.0, 11.0, 10.0, 15.0, 12.0, 18.0, 16.0, 20.0, 30.0, 33.0, 23.0, 29.0, 22.0, 33.0, 40.0, 36.0, 45.0, 31.0, 41.0, 47.0, 33.0, 37.0, 34.0, 36.0, 41.0, 34.0, 25.0, 23.0, 20.0, 24.0, 20.0, 27.0, 24.0, 15.0, 7.0, 13.0, 2.0, 5.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1591394543647766, -0.15438105165958405, -0.14962264895439148, -0.14486423134803772, -0.14010582864284515, -0.1353474259376526, -0.13058902323246002, -0.12583062052726746, -0.1210722103714943, -0.11631380766630173, -0.11155539751052856, -0.106796994805336, -0.10203859210014343, -0.09728018194437027, -0.0925217792391777, -0.08776336908340454, -0.08300496637821198, -0.07824656367301941, -0.07348815351724625, -0.06872975081205368, -0.06397134065628052, -0.05921293795108795, -0.054454535245895386, -0.04969612881541252, -0.04493772238492966, -0.04017931595444679, -0.03542090952396393, -0.030662506818771362, -0.025904100388288498, -0.021145693957805634, -0.01638728938996792, -0.011628884822130203, -0.006870478391647339, -0.002112072892487049, 0.0026463326066732407, 0.00740473810583353, 0.01216314360499382, 0.016921550035476685, 0.0216799546033144, 0.026438359171152115, 0.03119676560163498, 0.035955172032117844, 0.04071357846260071, 0.045471981167793274, 0.05023038759827614, 0.054988794028759, 0.05974719673395157, 0.06450560688972473, 0.0692640095949173, 0.07402241230010986, 0.07878082245588303, 0.08353922516107559, 0.08829763531684875, 0.09305603802204132, 0.09781444072723389, 0.10257284343242645, 0.10733125358819962, 0.11208965629339218, 0.11684806644916534, 0.12160646915435791, 0.12636487185955048, 0.13112327456474304, 0.1358816921710968, 0.14064009487628937, 0.14539849758148193]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 13.0, 14.0, 15.0, 22.0, 30.0, 32.0, 42.0, 49.0, 48.0, 49.0, 52.0, 52.0, 60.0, 59.0, 54.0, 57.0, 46.0, 51.0, 40.0, 40.0, 32.0, 23.0, 19.0, 14.0, 20.0, 8.0, 9.0, 9.0, 7.0, 6.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.04876708984375, -6.7967529296875, -6.54473876953125, -6.292724609375, -6.04071044921875, -5.7886962890625, -5.53668212890625, -5.28466796875, -5.03265380859375, -4.7806396484375, -4.52862548828125, -4.276611328125, -4.02459716796875, -3.7725830078125, -3.52056884765625, -3.2685546875, -3.01654052734375, -2.7645263671875, -2.51251220703125, -2.260498046875, -2.00848388671875, -1.7564697265625, -1.50445556640625, -1.25244140625, -1.00042724609375, -0.7484130859375, -0.49639892578125, -0.244384765625, 0.00762939453125, 0.2596435546875, 0.51165771484375, 0.763671875, 1.01568603515625, 1.2677001953125, 1.51971435546875, 1.771728515625, 2.02374267578125, 2.2757568359375, 2.52777099609375, 2.77978515625, 3.03179931640625, 3.2838134765625, 3.53582763671875, 3.787841796875, 4.03985595703125, 4.2918701171875, 4.54388427734375, 4.7958984375, 5.04791259765625, 5.2999267578125, 5.55194091796875, 5.803955078125, 6.05596923828125, 6.3079833984375, 6.55999755859375, 6.81201171875, 7.06402587890625, 7.3160400390625, 7.56805419921875, 7.820068359375, 8.07208251953125, 8.3240966796875, 8.57611083984375, 8.828125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 14.0, 15.0, 22.0, 39.0, 67.0, 112.0, 193.0, 342.0, 580.0, 1064.0, 2114.0, 4022.0, 8668.0, 21366.0, 55283.0, 143263.0, 335038.0, 283062.0, 116428.0, 44697.0, 17533.0, 7265.0, 3465.0, 1719.0, 920.0, 507.0, 306.0, 162.0, 107.0, 59.0, 35.0, 29.0, 14.0, 14.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.619384765625, -8.34033203125, -8.061279296875, -7.7822265625, -7.503173828125, -7.22412109375, -6.945068359375, -6.666015625, -6.386962890625, -6.10791015625, -5.828857421875, -5.5498046875, -5.270751953125, -4.99169921875, -4.712646484375, -4.43359375, -4.154541015625, -3.87548828125, -3.596435546875, -3.3173828125, -3.038330078125, -2.75927734375, -2.480224609375, -2.201171875, -1.922119140625, -1.64306640625, -1.364013671875, -1.0849609375, -0.805908203125, -0.52685546875, -0.247802734375, 0.03125, 0.310302734375, 0.58935546875, 0.868408203125, 1.1474609375, 1.426513671875, 1.70556640625, 1.984619140625, 2.263671875, 2.542724609375, 2.82177734375, 3.100830078125, 3.3798828125, 3.658935546875, 3.93798828125, 4.217041015625, 4.49609375, 4.775146484375, 5.05419921875, 5.333251953125, 5.6123046875, 5.891357421875, 6.17041015625, 6.449462890625, 6.728515625, 7.007568359375, 7.28662109375, 7.565673828125, 7.8447265625, 8.123779296875, 8.40283203125, 8.681884765625, 8.9609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 2.0, 6.0, 11.0, 19.0, 20.0, 22.0, 25.0, 28.0, 31.0, 40.0, 35.0, 47.0, 40.0, 57.0, 89.0, 180.0, 1467.0, 345.0, 122.0, 77.0, 55.0, 54.0, 47.0, 34.0, 22.0, 22.0, 30.0, 23.0, 18.0, 15.0, 12.0, 9.0, 8.0, 8.0, 8.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.515625, -24.7138671875, -23.912109375, -23.1103515625, -22.30859375, -21.5068359375, -20.705078125, -19.9033203125, -19.1015625, -18.2998046875, -17.498046875, -16.6962890625, -15.89453125, -15.0927734375, -14.291015625, -13.4892578125, -12.6875, -11.8857421875, -11.083984375, -10.2822265625, -9.48046875, -8.6787109375, -7.876953125, -7.0751953125, -6.2734375, -5.4716796875, -4.669921875, -3.8681640625, -3.06640625, -2.2646484375, -1.462890625, -0.6611328125, 0.140625, 0.9423828125, 1.744140625, 2.5458984375, 3.34765625, 4.1494140625, 4.951171875, 5.7529296875, 6.5546875, 7.3564453125, 8.158203125, 8.9599609375, 9.76171875, 10.5634765625, 11.365234375, 12.1669921875, 12.96875, 13.7705078125, 14.572265625, 15.3740234375, 16.17578125, 16.9775390625, 17.779296875, 18.5810546875, 19.3828125, 20.1845703125, 20.986328125, 21.7880859375, 22.58984375, 23.3916015625, 24.193359375, 24.9951171875, 25.796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 7.0, 10.0, 16.0, 21.0, 33.0, 50.0, 76.0, 99.0, 144.0, 268.0, 663.0, 2513.0, 403637.0, 2731978.0, 4412.0, 881.0, 371.0, 148.0, 101.0, 88.0, 51.0, 20.0, 35.0, 24.0, 13.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.5, -88.818359375, -86.13671875, -83.455078125, -80.7734375, -78.091796875, -75.41015625, -72.728515625, -70.046875, -67.365234375, -64.68359375, -62.001953125, -59.3203125, -56.638671875, -53.95703125, -51.275390625, -48.59375, -45.912109375, -43.23046875, -40.548828125, -37.8671875, -35.185546875, -32.50390625, -29.822265625, -27.140625, -24.458984375, -21.77734375, -19.095703125, -16.4140625, -13.732421875, -11.05078125, -8.369140625, -5.6875, -3.005859375, -0.32421875, 2.357421875, 5.0390625, 7.720703125, 10.40234375, 13.083984375, 15.765625, 18.447265625, 21.12890625, 23.810546875, 26.4921875, 29.173828125, 31.85546875, 34.537109375, 37.21875, 39.900390625, 42.58203125, 45.263671875, 47.9453125, 50.626953125, 53.30859375, 55.990234375, 58.671875, 61.353515625, 64.03515625, 66.716796875, 69.3984375, 72.080078125, 74.76171875, 77.443359375, 80.125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 33.0, 89.0, 178.0, 225.0, 253.0, 149.0, 59.0, 20.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.248231887817383, -14.765911102294922, -12.283590316772461, -9.80126953125, -7.318948745727539, -4.836627960205078, -2.354307174682617, 0.12801361083984375, 2.6103343963623047, 5.092655181884766, 7.574975967407227, 10.057296752929688, 12.539617538452148, 15.02193832397461, 17.50425910949707, 19.98657989501953, 22.468900680541992, 24.951221466064453, 27.433542251586914, 29.915863037109375, 32.39818572998047, 34.8805046081543, 37.362823486328125, 39.84514617919922, 42.32746887207031, 44.809791564941406, 47.292110443115234, 49.77442932128906, 52.256752014160156, 54.73907470703125, 57.22139358520508, 59.703712463378906, 62.18603515625, 64.6683578491211, 67.15068054199219, 69.63299560546875, 72.11531829833984, 74.59764099121094, 77.0799560546875, 79.5622787475586, 82.04460144042969, 84.52692413330078, 87.00924682617188, 89.49156188964844, 91.97388458251953, 94.45620727539062, 96.93852233886719, 99.42084503173828, 101.90316772460938, 104.38549041748047, 106.86781311035156, 109.35012817382812, 111.83245086669922, 114.31477355957031, 116.79708862304688, 119.27941131591797, 121.76173400878906, 124.24405670166016, 126.72637939453125, 129.2086944580078, 131.69100952148438, 134.17333984375, 136.65565490722656, 139.1379852294922, 141.62030029296875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 3.0, 6.0, 13.0, 6.0, 17.0, 20.0, 19.0, 19.0, 26.0, 22.0, 22.0, 22.0, 35.0, 35.0, 33.0, 46.0, 36.0, 29.0, 35.0, 37.0, 42.0, 44.0, 49.0, 32.0, 44.0, 30.0, 35.0, 35.0, 21.0, 28.0, 17.0, 15.0, 18.0, 22.0, 17.0, 14.0, 8.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-59.61161804199219, -57.921905517578125, -56.2321891784668, -54.54247283935547, -52.852760314941406, -51.163047790527344, -49.473331451416016, -47.78361511230469, -46.093902587890625, -44.40419006347656, -42.714473724365234, -41.024757385253906, -39.335044860839844, -37.64533233642578, -35.95561599731445, -34.265899658203125, -32.57618713378906, -30.886472702026367, -29.196758270263672, -27.507043838500977, -25.81732940673828, -24.127614974975586, -22.43790054321289, -20.748186111450195, -19.0584716796875, -17.368757247924805, -15.67904281616211, -13.989328384399414, -12.299613952636719, -10.609899520874023, -8.920185089111328, -7.230470657348633, -5.5407562255859375, -3.851041793823242, -2.161327362060547, -0.47161293029785156, 1.2181015014648438, 2.907815933227539, 4.597530364990234, 6.28724479675293, 7.976959228515625, 9.66667366027832, 11.356388092041016, 13.046102523803711, 14.735816955566406, 16.4255313873291, 18.115245819091797, 19.804960250854492, 21.494674682617188, 23.184389114379883, 24.874103546142578, 26.563817977905273, 28.25353240966797, 29.943246841430664, 31.63296127319336, 33.32267761230469, 35.01239013671875, 36.70210266113281, 38.39181900024414, 40.08153533935547, 41.77124786376953, 43.460960388183594, 45.15067672729492, 46.84039306640625, 48.53010559082031]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 17.0, 14.0, 14.0, 25.0, 30.0, 46.0, 43.0, 55.0, 47.0, 49.0, 65.0, 60.0, 61.0, 59.0, 60.0, 63.0, 41.0, 46.0, 35.0, 33.0, 35.0, 18.0, 11.0, 9.0, 10.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96484375, -6.67681884765625, -6.3887939453125, -6.10076904296875, -5.812744140625, -5.52471923828125, -5.2366943359375, -4.94866943359375, -4.66064453125, -4.37261962890625, -4.0845947265625, -3.79656982421875, -3.508544921875, -3.22052001953125, -2.9324951171875, -2.64447021484375, -2.3564453125, -2.06842041015625, -1.7803955078125, -1.49237060546875, -1.204345703125, -0.91632080078125, -0.6282958984375, -0.34027099609375, -0.05224609375, 0.23577880859375, 0.5238037109375, 0.81182861328125, 1.099853515625, 1.38787841796875, 1.6759033203125, 1.96392822265625, 2.251953125, 2.53997802734375, 2.8280029296875, 3.11602783203125, 3.404052734375, 3.69207763671875, 3.9801025390625, 4.26812744140625, 4.55615234375, 4.84417724609375, 5.1322021484375, 5.42022705078125, 5.708251953125, 5.99627685546875, 6.2843017578125, 6.57232666015625, 6.8603515625, 7.14837646484375, 7.4364013671875, 7.72442626953125, 8.012451171875, 8.30047607421875, 8.5885009765625, 8.87652587890625, 9.16455078125, 9.45257568359375, 9.7406005859375, 10.02862548828125, 10.316650390625, 10.60467529296875, 10.8927001953125, 11.18072509765625, 11.46875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 10.0, 20.0, 28.0, 33.0, 64.0, 90.0, 179.0, 307.0, 590.0, 1477.0, 4138.0, 15001.0, 75944.0, 456716.0, 1883441.0, 1418822.0, 275451.0, 46604.0, 10161.0, 3012.0, 1082.0, 515.0, 235.0, 107.0, 68.0, 46.0, 37.0, 25.0, 11.0, 15.0, 11.0, 6.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.334716796875, -9.93505859375, -9.535400390625, -9.1357421875, -8.736083984375, -8.33642578125, -7.936767578125, -7.537109375, -7.137451171875, -6.73779296875, -6.338134765625, -5.9384765625, -5.538818359375, -5.13916015625, -4.739501953125, -4.33984375, -3.940185546875, -3.54052734375, -3.140869140625, -2.7412109375, -2.341552734375, -1.94189453125, -1.542236328125, -1.142578125, -0.742919921875, -0.34326171875, 0.056396484375, 0.4560546875, 0.855712890625, 1.25537109375, 1.655029296875, 2.0546875, 2.454345703125, 2.85400390625, 3.253662109375, 3.6533203125, 4.052978515625, 4.45263671875, 4.852294921875, 5.251953125, 5.651611328125, 6.05126953125, 6.450927734375, 6.8505859375, 7.250244140625, 7.64990234375, 8.049560546875, 8.44921875, 8.848876953125, 9.24853515625, 9.648193359375, 10.0478515625, 10.447509765625, 10.84716796875, 11.246826171875, 11.646484375, 12.046142578125, 12.44580078125, 12.845458984375, 13.2451171875, 13.644775390625, 14.04443359375, 14.444091796875, 14.84375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 10.0, 21.0, 11.0, 38.0, 56.0, 73.0, 109.0, 198.0, 245.0, 372.0, 496.0, 562.0, 520.0, 413.0, 256.0, 204.0, 142.0, 93.0, 72.0, 53.0, 39.0, 20.0, 14.0, 11.0, 10.0, 8.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.5625, -10.048828125, -9.53515625, -9.021484375, -8.5078125, -7.994140625, -7.48046875, -6.966796875, -6.453125, -5.939453125, -5.42578125, -4.912109375, -4.3984375, -3.884765625, -3.37109375, -2.857421875, -2.34375, -1.830078125, -1.31640625, -0.802734375, -0.2890625, 0.224609375, 0.73828125, 1.251953125, 1.765625, 2.279296875, 2.79296875, 3.306640625, 3.8203125, 4.333984375, 4.84765625, 5.361328125, 5.875, 6.388671875, 6.90234375, 7.416015625, 7.9296875, 8.443359375, 8.95703125, 9.470703125, 9.984375, 10.498046875, 11.01171875, 11.525390625, 12.0390625, 12.552734375, 13.06640625, 13.580078125, 14.09375, 14.607421875, 15.12109375, 15.634765625, 16.1484375, 16.662109375, 17.17578125, 17.689453125, 18.203125, 18.716796875, 19.23046875, 19.744140625, 20.2578125, 20.771484375, 21.28515625, 21.798828125, 22.3125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 10.0, 14.0, 9.0, 21.0, 31.0, 57.0, 71.0, 93.0, 119.0, 217.0, 302.0, 782.0, 27546.0, 4049390.0, 113550.0, 1089.0, 355.0, 221.0, 138.0, 79.0, 56.0, 39.0, 20.0, 19.0, 12.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-94.75, -92.52587890625, -90.3017578125, -88.07763671875, -85.853515625, -83.62939453125, -81.4052734375, -79.18115234375, -76.95703125, -74.73291015625, -72.5087890625, -70.28466796875, -68.060546875, -65.83642578125, -63.6123046875, -61.38818359375, -59.1640625, -56.93994140625, -54.7158203125, -52.49169921875, -50.267578125, -48.04345703125, -45.8193359375, -43.59521484375, -41.37109375, -39.14697265625, -36.9228515625, -34.69873046875, -32.474609375, -30.25048828125, -28.0263671875, -25.80224609375, -23.578125, -21.35400390625, -19.1298828125, -16.90576171875, -14.681640625, -12.45751953125, -10.2333984375, -8.00927734375, -5.78515625, -3.56103515625, -1.3369140625, 0.88720703125, 3.111328125, 5.33544921875, 7.5595703125, 9.78369140625, 12.0078125, 14.23193359375, 16.4560546875, 18.68017578125, 20.904296875, 23.12841796875, 25.3525390625, 27.57666015625, 29.80078125, 32.02490234375, 34.2490234375, 36.47314453125, 38.697265625, 40.92138671875, 43.1455078125, 45.36962890625, 47.59375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 32.0, 45.0, 98.0, 115.0, 169.0, 162.0, 170.0, 89.0, 67.0, 31.0, 14.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.05191802978516, -111.03495025634766, -108.01797485351562, -105.00100708007812, -101.98403930664062, -98.96707153320312, -95.95010375976562, -92.9331283569336, -89.9161605834961, -86.8991928100586, -83.88221740722656, -80.86524963378906, -77.84828186035156, -74.83131408691406, -71.81434631347656, -68.79737091064453, -65.78040313720703, -62.76343536376953, -59.746463775634766, -56.7294921875, -53.7125244140625, -50.695556640625, -47.678585052490234, -44.66161346435547, -41.64464569091797, -38.62767791748047, -35.6107063293457, -32.59373474121094, -29.576766967773438, -26.559797286987305, -23.542827606201172, -20.52585792541504, -17.508895874023438, -14.491926193237305, -11.474956512451172, -8.457986831665039, -5.441017150878906, -2.4240474700927734, 0.5929222106933594, 3.609891891479492, 6.626861572265625, 9.643831253051758, 12.66080093383789, 15.677770614624023, 18.694740295410156, 21.71170997619629, 24.728679656982422, 27.745649337768555, 30.762619018554688, 33.77958679199219, 36.79655838012695, 39.81352996826172, 42.83049774169922, 45.84746551513672, 48.864437103271484, 51.88140869140625, 54.89837646484375, 57.91534423828125, 60.932315826416016, 63.94928741455078, 66.96625518798828, 69.98322296142578, 73.00019836425781, 76.01716613769531, 79.03413391113281]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 5.0, 5.0, 6.0, 8.0, 8.0, 17.0, 20.0, 20.0, 29.0, 35.0, 28.0, 23.0, 30.0, 38.0, 56.0, 35.0, 43.0, 49.0, 34.0, 42.0, 36.0, 36.0, 46.0, 44.0, 44.0, 34.0, 38.0, 25.0, 23.0, 25.0, 13.0, 11.0, 14.0, 8.0, 16.0, 11.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-52.8895263671875, -51.399253845214844, -49.90898513793945, -48.4187126159668, -46.928443908691406, -45.43817138671875, -43.947898864746094, -42.45762634277344, -40.96735763549805, -39.47708511352539, -37.98681640625, -36.496543884277344, -35.00627136230469, -33.5160026550293, -32.02573013305664, -30.535459518432617, -29.045188903808594, -27.55491828918457, -26.064647674560547, -24.57437515258789, -23.084104537963867, -21.593833923339844, -20.103561401367188, -18.613290786743164, -17.12302017211914, -15.632749557495117, -14.142477989196777, -12.652206420898438, -11.161935806274414, -9.67166519165039, -8.18139362335205, -6.691122055053711, -5.200847625732422, -3.7105765342712402, -2.2203054428100586, -0.730034351348877, 0.7602367401123047, 2.2505078315734863, 3.740778923034668, 5.231050491333008, 6.721321105957031, 8.211591720581055, 9.701863288879395, 11.192134857177734, 12.682405471801758, 14.172676086425781, 15.662947654724121, 17.15321922302246, 18.643489837646484, 20.133760452270508, 21.62403106689453, 23.114303588867188, 24.60457420349121, 26.094844818115234, 27.58511734008789, 29.075387954711914, 30.565658569335938, 32.055931091308594, 33.546199798583984, 35.03647232055664, 36.52674102783203, 38.01701354980469, 39.507286071777344, 40.99755859375, 42.48782730102539]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 9.0, 12.0, 19.0, 16.0, 20.0, 33.0, 34.0, 42.0, 56.0, 37.0, 39.0, 58.0, 45.0, 56.0, 59.0, 48.0, 61.0, 44.0, 55.0, 52.0, 34.0, 32.0, 34.0, 24.0, 17.0, 15.0, 8.0, 7.0, 5.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.9393310546875, -7.683349609375, -7.4273681640625, -7.17138671875, -6.9154052734375, -6.659423828125, -6.4034423828125, -6.1474609375, -5.8914794921875, -5.635498046875, -5.3795166015625, -5.12353515625, -4.8675537109375, -4.611572265625, -4.3555908203125, -4.099609375, -3.8436279296875, -3.587646484375, -3.3316650390625, -3.07568359375, -2.8197021484375, -2.563720703125, -2.3077392578125, -2.0517578125, -1.7957763671875, -1.539794921875, -1.2838134765625, -1.02783203125, -0.7718505859375, -0.515869140625, -0.2598876953125, -0.00390625, 0.2520751953125, 0.508056640625, 0.7640380859375, 1.02001953125, 1.2760009765625, 1.531982421875, 1.7879638671875, 2.0439453125, 2.2999267578125, 2.555908203125, 2.8118896484375, 3.06787109375, 3.3238525390625, 3.579833984375, 3.8358154296875, 4.091796875, 4.3477783203125, 4.603759765625, 4.8597412109375, 5.11572265625, 5.3717041015625, 5.627685546875, 5.8836669921875, 6.1396484375, 6.3956298828125, 6.651611328125, 6.9075927734375, 7.16357421875, 7.4195556640625, 7.675537109375, 7.9315185546875, 8.1875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 9.0, 14.0, 42.0, 48.0, 78.0, 119.0, 239.0, 330.0, 577.0, 893.0, 1492.0, 2584.0, 4307.0, 7366.0, 12953.0, 21551.0, 36096.0, 57737.0, 89767.0, 126399.0, 157505.0, 159375.0, 128961.0, 90257.0, 59472.0, 36703.0, 22162.0, 13065.0, 7499.0, 4470.0, 2601.0, 1586.0, 884.0, 576.0, 319.0, 206.0, 123.0, 69.0, 40.0, 21.0, 18.0, 18.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8886947631835938, -0.8569793701171875, -0.8252639770507812, -0.793548583984375, -0.7618331909179688, -0.7301177978515625, -0.6984024047851562, -0.66668701171875, -0.6349716186523438, -0.6032562255859375, -0.5715408325195312, -0.539825439453125, -0.5081100463867188, -0.4763946533203125, -0.44467926025390625, -0.4129638671875, -0.38124847412109375, -0.3495330810546875, -0.31781768798828125, -0.286102294921875, -0.25438690185546875, -0.2226715087890625, -0.19095611572265625, -0.15924072265625, -0.12752532958984375, -0.0958099365234375, -0.06409454345703125, -0.032379150390625, -0.00066375732421875, 0.0310516357421875, 0.06276702880859375, 0.094482421875, 0.12619781494140625, 0.1579132080078125, 0.18962860107421875, 0.221343994140625, 0.25305938720703125, 0.2847747802734375, 0.31649017333984375, 0.34820556640625, 0.37992095947265625, 0.4116363525390625, 0.44335174560546875, 0.475067138671875, 0.5067825317382812, 0.5384979248046875, 0.5702133178710938, 0.6019287109375, 0.6336441040039062, 0.6653594970703125, 0.6970748901367188, 0.728790283203125, 0.7605056762695312, 0.7922210693359375, 0.8239364624023438, 0.85565185546875, 0.8873672485351562, 0.9190826416015625, 0.9507980346679688, 0.982513427734375, 1.0142288208007812, 1.0459442138671875, 1.0776596069335938, 1.109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 6.0, 16.0, 11.0, 13.0, 17.0, 23.0, 19.0, 19.0, 27.0, 28.0, 27.0, 31.0, 38.0, 39.0, 44.0, 52.0, 49.0, 1068.0, 38.0, 46.0, 40.0, 40.0, 33.0, 37.0, 39.0, 39.0, 33.0, 25.0, 21.0, 17.0, 17.0, 18.0, 16.0, 7.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0078125, -5.82330322265625, -5.6387939453125, -5.45428466796875, -5.269775390625, -5.08526611328125, -4.9007568359375, -4.71624755859375, -4.53173828125, -4.34722900390625, -4.1627197265625, -3.97821044921875, -3.793701171875, -3.60919189453125, -3.4246826171875, -3.24017333984375, -3.0556640625, -2.87115478515625, -2.6866455078125, -2.50213623046875, -2.317626953125, -2.13311767578125, -1.9486083984375, -1.76409912109375, -1.57958984375, -1.39508056640625, -1.2105712890625, -1.02606201171875, -0.841552734375, -0.65704345703125, -0.4725341796875, -0.28802490234375, -0.103515625, 0.08099365234375, 0.2655029296875, 0.45001220703125, 0.634521484375, 0.81903076171875, 1.0035400390625, 1.18804931640625, 1.37255859375, 1.55706787109375, 1.7415771484375, 1.92608642578125, 2.110595703125, 2.29510498046875, 2.4796142578125, 2.66412353515625, 2.8486328125, 3.03314208984375, 3.2176513671875, 3.40216064453125, 3.586669921875, 3.77117919921875, 3.9556884765625, 4.14019775390625, 4.32470703125, 4.50921630859375, 4.6937255859375, 4.87823486328125, 5.062744140625, 5.24725341796875, 5.4317626953125, 5.61627197265625, 5.80078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 14.0, 15.0, 18.0, 24.0, 46.0, 70.0, 107.0, 163.0, 287.0, 447.0, 684.0, 988.0, 1539.0, 2586.0, 4100.0, 6768.0, 11069.0, 17860.0, 28650.0, 45301.0, 69724.0, 101458.0, 147195.0, 1128444.0, 199185.0, 112750.0, 78406.0, 52116.0, 32933.0, 20617.0, 12598.0, 7887.0, 4807.0, 2964.0, 1939.0, 1221.0, 768.0, 501.0, 300.0, 218.0, 138.0, 88.0, 52.0, 27.0, 17.0, 24.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.5419921875, -0.5263519287109375, -0.510711669921875, -0.4950714111328125, -0.47943115234375, -0.4637908935546875, -0.448150634765625, -0.4325103759765625, -0.4168701171875, -0.4012298583984375, -0.385589599609375, -0.3699493408203125, -0.35430908203125, -0.3386688232421875, -0.323028564453125, -0.3073883056640625, -0.291748046875, -0.2761077880859375, -0.260467529296875, -0.2448272705078125, -0.22918701171875, -0.2135467529296875, -0.197906494140625, -0.1822662353515625, -0.1666259765625, -0.1509857177734375, -0.135345458984375, -0.1197052001953125, -0.10406494140625, -0.0884246826171875, -0.072784423828125, -0.0571441650390625, -0.04150390625, -0.0258636474609375, -0.010223388671875, 0.0054168701171875, 0.02105712890625, 0.0366973876953125, 0.052337646484375, 0.0679779052734375, 0.0836181640625, 0.0992584228515625, 0.114898681640625, 0.1305389404296875, 0.14617919921875, 0.1618194580078125, 0.177459716796875, 0.1930999755859375, 0.208740234375, 0.2243804931640625, 0.240020751953125, 0.2556610107421875, 0.27130126953125, 0.2869415283203125, 0.302581787109375, 0.3182220458984375, 0.3338623046875, 0.3495025634765625, 0.365142822265625, 0.3807830810546875, 0.39642333984375, 0.4120635986328125, 0.427703857421875, 0.4433441162109375, 0.458984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 10.0, 13.0, 10.0, 13.0, 13.0, 12.0, 21.0, 33.0, 30.0, 45.0, 55.0, 82.0, 120.0, 121.0, 107.0, 63.0, 50.0, 35.0, 27.0, 26.0, 16.0, 19.0, 14.0, 12.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07858085632324219, -0.07580184936523438, -0.07302284240722656, -0.07024383544921875, -0.06746482849121094, -0.06468582153320312, -0.06190681457519531, -0.0591278076171875, -0.05634880065917969, -0.053569793701171875, -0.05079078674316406, -0.04801177978515625, -0.04523277282714844, -0.042453765869140625, -0.03967475891113281, -0.036895751953125, -0.03411674499511719, -0.031337738037109375, -0.028558731079101562, -0.02577972412109375, -0.023000717163085938, -0.020221710205078125, -0.017442703247070312, -0.0146636962890625, -0.011884689331054688, -0.009105682373046875, -0.0063266754150390625, -0.00354766845703125, -0.0007686614990234375, 0.002010345458984375, 0.0047893524169921875, 0.007568359375, 0.010347366333007812, 0.013126373291015625, 0.015905380249023438, 0.01868438720703125, 0.021463394165039062, 0.024242401123046875, 0.027021408081054688, 0.0298004150390625, 0.03257942199707031, 0.035358428955078125, 0.03813743591308594, 0.04091644287109375, 0.04369544982910156, 0.046474456787109375, 0.04925346374511719, 0.052032470703125, 0.05481147766113281, 0.057590484619140625, 0.06036949157714844, 0.06314849853515625, 0.06592750549316406, 0.06870651245117188, 0.07148551940917969, 0.0742645263671875, 0.07704353332519531, 0.07982254028320312, 0.08260154724121094, 0.08538055419921875, 0.08815956115722656, 0.09093856811523438, 0.09371757507324219, 0.09649658203125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 13.0, 15.0, 16.0, 21.0, 24.0, 35.0, 60.0, 81.0, 158.0, 405.0, 1938.0, 994886.0, 49496.0, 748.0, 247.0, 113.0, 81.0, 49.0, 32.0, 15.0, 20.0, 11.0, 13.0, 16.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.111328125, -2.0506134033203125, -1.989898681640625, -1.9291839599609375, -1.86846923828125, -1.8077545166015625, -1.747039794921875, -1.6863250732421875, -1.6256103515625, -1.5648956298828125, -1.504180908203125, -1.4434661865234375, -1.38275146484375, -1.3220367431640625, -1.261322021484375, -1.2006072998046875, -1.139892578125, -1.0791778564453125, -1.018463134765625, -0.9577484130859375, -0.89703369140625, -0.8363189697265625, -0.775604248046875, -0.7148895263671875, -0.6541748046875, -0.5934600830078125, -0.532745361328125, -0.4720306396484375, -0.41131591796875, -0.3506011962890625, -0.289886474609375, -0.2291717529296875, -0.16845703125, -0.1077423095703125, -0.047027587890625, 0.0136871337890625, 0.07440185546875, 0.1351165771484375, 0.195831298828125, 0.2565460205078125, 0.3172607421875, 0.3779754638671875, 0.438690185546875, 0.4994049072265625, 0.56011962890625, 0.6208343505859375, 0.681549072265625, 0.7422637939453125, 0.802978515625, 0.8636932373046875, 0.924407958984375, 0.9851226806640625, 1.04583740234375, 1.1065521240234375, 1.167266845703125, 1.2279815673828125, 1.2886962890625, 1.3494110107421875, 1.410125732421875, 1.4708404541015625, 1.53155517578125, 1.5922698974609375, 1.652984619140625, 1.7136993408203125, 1.7744140625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 21.0, 37.0, 106.0, 185.0, 308.0, 220.0, 75.0, 26.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.5991914868354797, -0.5879911184310913, -0.5767908096313477, -0.5655904412269592, -0.5543901324272156, -0.5431897640228271, -0.5319894552230835, -0.5207890868186951, -0.5095887184143066, -0.4983883798122406, -0.48718804121017456, -0.4759877026081085, -0.4647873640060425, -0.45358699560165405, -0.442386656999588, -0.431186318397522, -0.4199860095977783, -0.4087856709957123, -0.39758533239364624, -0.3863849937915802, -0.37518465518951416, -0.36398428678512573, -0.3527839481830597, -0.34158360958099365, -0.3303832709789276, -0.3191829323768616, -0.30798259377479553, -0.2967822551727295, -0.28558188676834106, -0.274381548166275, -0.263181209564209, -0.25198087096214294, -0.2407805621623993, -0.22958022356033325, -0.2183798849582672, -0.20717953145503998, -0.19597919285297394, -0.1847788542509079, -0.17357850074768066, -0.16237816214561462, -0.15117782354354858, -0.13997748494148254, -0.1287771463394165, -0.11757679283618927, -0.10637645423412323, -0.09517611563205719, -0.08397576957941055, -0.07277542352676392, -0.061575084924697876, -0.05037474259734154, -0.0391744002699852, -0.02797405794262886, -0.016773715615272522, -0.0055733732879161835, 0.005626969039440155, 0.016827315092086792, 0.028027653694152832, 0.03922799602150917, 0.05042833834886551, 0.06162868067622185, 0.07282902300357819, 0.08402936160564423, 0.09522970765829086, 0.1064300537109375, 0.11763039231300354]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 7.0, 4.0, 6.0, 5.0, 9.0, 13.0, 11.0, 14.0, 18.0, 23.0, 19.0, 18.0, 32.0, 26.0, 31.0, 24.0, 24.0, 40.0, 44.0, 42.0, 33.0, 39.0, 47.0, 37.0, 48.0, 38.0, 47.0, 30.0, 31.0, 30.0, 33.0, 24.0, 30.0, 22.0, 22.0, 17.0, 14.0, 6.0, 8.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.10876572132110596, -0.10518695414066315, -0.10160819441080093, -0.09802943468093872, -0.09445066750049591, -0.0908719003200531, -0.08729314059019089, -0.08371438086032867, -0.08013561367988586, -0.07655684649944305, -0.07297808676958084, -0.06939932703971863, -0.06582055985927582, -0.062241796404123306, -0.058663032948970795, -0.05508426949381828, -0.05150550603866577, -0.04792674258351326, -0.04434797912836075, -0.04076921567320824, -0.037190452218055725, -0.033611688762903214, -0.030032925307750702, -0.02645416185259819, -0.02287539839744568, -0.019296634942293167, -0.015717871487140656, -0.012139108031988144, -0.008560344576835632, -0.004981581121683121, -0.0014028176665306091, 0.0021759457886219025, 0.005754709243774414, 0.009333472698926926, 0.012912236154079437, 0.01649099960923195, 0.02006976306438446, 0.023648526519536972, 0.027227289974689484, 0.030806053429841995, 0.03438481688499451, 0.03796358034014702, 0.04154234379529953, 0.04512110725045204, 0.04869987070560455, 0.052278634160757065, 0.055857397615909576, 0.05943616107106209, 0.0630149245262146, 0.06659369170665741, 0.07017245143651962, 0.07375121116638184, 0.07732997834682465, 0.08090874552726746, 0.08448750525712967, 0.08806626498699188, 0.09164503216743469, 0.0952237993478775, 0.09880255907773972, 0.10238131880760193, 0.10596008598804474, 0.10953885316848755, 0.11311761289834976, 0.11669637262821198, 0.12027513980865479]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 5.0, 4.0, 2.0, 7.0, 12.0, 12.0, 12.0, 19.0, 29.0, 34.0, 29.0, 41.0, 33.0, 37.0, 53.0, 49.0, 50.0, 62.0, 59.0, 47.0, 47.0, 45.0, 49.0, 37.0, 41.0, 36.0, 38.0, 20.0, 27.0, 10.0, 13.0, 12.0, 4.0, 5.0, 12.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0078125, -7.7662353515625, -7.524658203125, -7.2830810546875, -7.04150390625, -6.7999267578125, -6.558349609375, -6.3167724609375, -6.0751953125, -5.8336181640625, -5.592041015625, -5.3504638671875, -5.10888671875, -4.8673095703125, -4.625732421875, -4.3841552734375, -4.142578125, -3.9010009765625, -3.659423828125, -3.4178466796875, -3.17626953125, -2.9346923828125, -2.693115234375, -2.4515380859375, -2.2099609375, -1.9683837890625, -1.726806640625, -1.4852294921875, -1.24365234375, -1.0020751953125, -0.760498046875, -0.5189208984375, -0.27734375, -0.0357666015625, 0.205810546875, 0.4473876953125, 0.68896484375, 0.9305419921875, 1.172119140625, 1.4136962890625, 1.6552734375, 1.8968505859375, 2.138427734375, 2.3800048828125, 2.62158203125, 2.8631591796875, 3.104736328125, 3.3463134765625, 3.587890625, 3.8294677734375, 4.071044921875, 4.3126220703125, 4.55419921875, 4.7957763671875, 5.037353515625, 5.2789306640625, 5.5205078125, 5.7620849609375, 6.003662109375, 6.2452392578125, 6.48681640625, 6.7283935546875, 6.969970703125, 7.2115478515625, 7.453125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 10.0, 7.0, 17.0, 32.0, 34.0, 65.0, 126.0, 204.0, 417.0, 864.0, 2043.0, 4468.0, 9690.0, 22234.0, 56560.0, 158217.0, 396660.0, 250726.0, 87924.0, 32522.0, 14055.0, 6254.0, 2912.0, 1296.0, 544.0, 275.0, 137.0, 78.0, 56.0, 36.0, 24.0, 12.0, 9.0, 16.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2734375, -9.96875, -9.6640625, -9.359375, -9.0546875, -8.75, -8.4453125, -8.140625, -7.8359375, -7.53125, -7.2265625, -6.921875, -6.6171875, -6.3125, -6.0078125, -5.703125, -5.3984375, -5.09375, -4.7890625, -4.484375, -4.1796875, -3.875, -3.5703125, -3.265625, -2.9609375, -2.65625, -2.3515625, -2.046875, -1.7421875, -1.4375, -1.1328125, -0.828125, -0.5234375, -0.21875, 0.0859375, 0.390625, 0.6953125, 1.0, 1.3046875, 1.609375, 1.9140625, 2.21875, 2.5234375, 2.828125, 3.1328125, 3.4375, 3.7421875, 4.046875, 4.3515625, 4.65625, 4.9609375, 5.265625, 5.5703125, 5.875, 6.1796875, 6.484375, 6.7890625, 7.09375, 7.3984375, 7.703125, 8.0078125, 8.3125, 8.6171875, 8.921875, 9.2265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 19.0, 20.0, 26.0, 19.0, 23.0, 37.0, 45.0, 38.0, 53.0, 63.0, 86.0, 168.0, 308.0, 1420.0, 193.0, 95.0, 71.0, 55.0, 50.0, 28.0, 32.0, 28.0, 11.0, 16.0, 21.0, 17.0, 15.0, 6.0, 9.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.296875, -28.509765625, -27.72265625, -26.935546875, -26.1484375, -25.361328125, -24.57421875, -23.787109375, -23.0, -22.212890625, -21.42578125, -20.638671875, -19.8515625, -19.064453125, -18.27734375, -17.490234375, -16.703125, -15.916015625, -15.12890625, -14.341796875, -13.5546875, -12.767578125, -11.98046875, -11.193359375, -10.40625, -9.619140625, -8.83203125, -8.044921875, -7.2578125, -6.470703125, -5.68359375, -4.896484375, -4.109375, -3.322265625, -2.53515625, -1.748046875, -0.9609375, -0.173828125, 0.61328125, 1.400390625, 2.1875, 2.974609375, 3.76171875, 4.548828125, 5.3359375, 6.123046875, 6.91015625, 7.697265625, 8.484375, 9.271484375, 10.05859375, 10.845703125, 11.6328125, 12.419921875, 13.20703125, 13.994140625, 14.78125, 15.568359375, 16.35546875, 17.142578125, 17.9296875, 18.716796875, 19.50390625, 20.291015625, 21.078125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 8.0, 7.0, 12.0, 12.0, 18.0, 21.0, 13.0, 28.0, 21.0, 35.0, 47.0, 60.0, 97.0, 154.0, 202.0, 317.0, 559.0, 2499.0, 100511.0, 2985983.0, 51595.0, 1827.0, 508.0, 313.0, 217.0, 165.0, 94.0, 88.0, 58.0, 49.0, 37.0, 35.0, 20.0, 19.0, 12.0, 9.0, 6.0, 7.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -40.83203125, -39.2265625, -37.62109375, -36.015625, -34.41015625, -32.8046875, -31.19921875, -29.59375, -27.98828125, -26.3828125, -24.77734375, -23.171875, -21.56640625, -19.9609375, -18.35546875, -16.75, -15.14453125, -13.5390625, -11.93359375, -10.328125, -8.72265625, -7.1171875, -5.51171875, -3.90625, -2.30078125, -0.6953125, 0.91015625, 2.515625, 4.12109375, 5.7265625, 7.33203125, 8.9375, 10.54296875, 12.1484375, 13.75390625, 15.359375, 16.96484375, 18.5703125, 20.17578125, 21.78125, 23.38671875, 24.9921875, 26.59765625, 28.203125, 29.80859375, 31.4140625, 33.01953125, 34.625, 36.23046875, 37.8359375, 39.44140625, 41.046875, 42.65234375, 44.2578125, 45.86328125, 47.46875, 49.07421875, 50.6796875, 52.28515625, 53.890625, 55.49609375, 57.1015625, 58.70703125, 60.3125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 209.0, 806.0], "bins": [-1052.1636962890625, -1035.509521484375, -1018.8552856445312, -1002.2010498046875, -985.546875, -968.8926391601562, -952.2384033203125, -935.584228515625, -918.9299926757812, -902.2757568359375, -885.62158203125, -868.9673461914062, -852.3131103515625, -835.658935546875, -819.0046997070312, -802.3505249023438, -785.6962890625, -769.0420532226562, -752.3878784179688, -735.733642578125, -719.0794677734375, -702.4252319335938, -685.77099609375, -669.1168212890625, -652.4625854492188, -635.808349609375, -619.1541748046875, -602.4999389648438, -585.845703125, -569.1915283203125, -552.5372924804688, -535.8831176757812, -519.2288208007812, -502.5746154785156, -485.92041015625, -469.26617431640625, -452.6119689941406, -435.957763671875, -419.30352783203125, -402.6493225097656, -385.9951171875, -369.3409118652344, -352.68670654296875, -336.032470703125, -319.3782653808594, -302.72406005859375, -286.06982421875, -269.4156188964844, -252.76141357421875, -236.10720825195312, -219.45298767089844, -202.79876708984375, -186.14456176757812, -169.4903564453125, -152.8361358642578, -136.18191528320312, -119.5277099609375, -102.87349700927734, -86.21928405761719, -69.56507110595703, -52.910858154296875, -36.25664520263672, -19.602432250976562, -2.9482192993164062, 13.7059907913208]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 6.0, 19.0, 9.0, 18.0, 15.0, 22.0, 29.0, 16.0, 37.0, 22.0, 36.0, 34.0, 35.0, 33.0, 26.0, 53.0, 38.0, 49.0, 50.0, 36.0, 40.0, 35.0, 45.0, 35.0, 34.0, 24.0, 26.0, 26.0, 33.0, 18.0, 18.0, 16.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-65.6315689086914, -63.76346969604492, -61.89536666870117, -60.02726745605469, -58.15916442871094, -56.29106521606445, -54.42296600341797, -52.55486297607422, -50.686763763427734, -48.81866455078125, -46.9505615234375, -45.082462310791016, -43.214359283447266, -41.34626007080078, -39.47815704345703, -37.61005783081055, -35.74195861816406, -33.87385940551758, -32.00575637817383, -30.137657165527344, -28.269556045532227, -26.40145492553711, -24.533353805541992, -22.665252685546875, -20.797149658203125, -18.929048538208008, -17.06094741821289, -15.19284725189209, -13.324747085571289, -11.456645965576172, -9.588544845581055, -7.720444679260254, -5.852344512939453, -3.984243869781494, -2.116142988204956, -0.24804210662841797, 1.620058536529541, 3.4881591796875, 5.356260299682617, 7.224360466003418, 9.092461585998535, 10.960562705993652, 12.828662872314453, 14.69676399230957, 16.564865112304688, 18.432964324951172, 20.301067352294922, 22.169166564941406, 24.037267684936523, 25.90536880493164, 27.773469924926758, 29.641571044921875, 31.50967025756836, 33.377769470214844, 35.245872497558594, 37.11397171020508, 38.98207473754883, 40.85017395019531, 42.71827697753906, 44.58637619018555, 46.4544792175293, 48.32257843017578, 50.19068145751953, 52.058780670166016, 53.9268798828125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 4.0, 11.0, 12.0, 14.0, 17.0, 22.0, 25.0, 27.0, 30.0, 27.0, 31.0, 51.0, 37.0, 40.0, 46.0, 58.0, 59.0, 56.0, 61.0, 46.0, 27.0, 42.0, 43.0, 38.0, 33.0, 30.0, 23.0, 14.0, 19.0, 9.0, 14.0, 6.0, 6.0, 14.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.2076416015625, -7.946533203125, -7.6854248046875, -7.42431640625, -7.1632080078125, -6.902099609375, -6.6409912109375, -6.3798828125, -6.1187744140625, -5.857666015625, -5.5965576171875, -5.33544921875, -5.0743408203125, -4.813232421875, -4.5521240234375, -4.291015625, -4.0299072265625, -3.768798828125, -3.5076904296875, -3.24658203125, -2.9854736328125, -2.724365234375, -2.4632568359375, -2.2021484375, -1.9410400390625, -1.679931640625, -1.4188232421875, -1.15771484375, -0.8966064453125, -0.635498046875, -0.3743896484375, -0.11328125, 0.1478271484375, 0.408935546875, 0.6700439453125, 0.93115234375, 1.1922607421875, 1.453369140625, 1.7144775390625, 1.9755859375, 2.2366943359375, 2.497802734375, 2.7589111328125, 3.02001953125, 3.2811279296875, 3.542236328125, 3.8033447265625, 4.064453125, 4.3255615234375, 4.586669921875, 4.8477783203125, 5.10888671875, 5.3699951171875, 5.631103515625, 5.8922119140625, 6.1533203125, 6.4144287109375, 6.675537109375, 6.9366455078125, 7.19775390625, 7.4588623046875, 7.719970703125, 7.9810791015625, 8.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 11.0, 10.0, 12.0, 23.0, 19.0, 21.0, 38.0, 53.0, 63.0, 110.0, 176.0, 367.0, 852.0, 3063.0, 14276.0, 95048.0, 707576.0, 2308628.0, 912260.0, 127310.0, 18661.0, 3680.0, 991.0, 420.0, 222.0, 112.0, 63.0, 47.0, 45.0, 28.0, 12.0, 16.0, 7.0, 11.0, 12.0, 10.0, 5.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3515625, -13.89697265625, -13.4423828125, -12.98779296875, -12.533203125, -12.07861328125, -11.6240234375, -11.16943359375, -10.71484375, -10.26025390625, -9.8056640625, -9.35107421875, -8.896484375, -8.44189453125, -7.9873046875, -7.53271484375, -7.078125, -6.62353515625, -6.1689453125, -5.71435546875, -5.259765625, -4.80517578125, -4.3505859375, -3.89599609375, -3.44140625, -2.98681640625, -2.5322265625, -2.07763671875, -1.623046875, -1.16845703125, -0.7138671875, -0.25927734375, 0.1953125, 0.64990234375, 1.1044921875, 1.55908203125, 2.013671875, 2.46826171875, 2.9228515625, 3.37744140625, 3.83203125, 4.28662109375, 4.7412109375, 5.19580078125, 5.650390625, 6.10498046875, 6.5595703125, 7.01416015625, 7.46875, 7.92333984375, 8.3779296875, 8.83251953125, 9.287109375, 9.74169921875, 10.1962890625, 10.65087890625, 11.10546875, 11.56005859375, 12.0146484375, 12.46923828125, 12.923828125, 13.37841796875, 13.8330078125, 14.28759765625, 14.7421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 14.0, 16.0, 18.0, 29.0, 27.0, 41.0, 47.0, 70.0, 98.0, 126.0, 144.0, 216.0, 246.0, 325.0, 368.0, 404.0, 384.0, 314.0, 268.0, 222.0, 180.0, 129.0, 92.0, 61.0, 65.0, 41.0, 20.0, 19.0, 14.0, 13.0, 8.0, 10.0, 13.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.578125, -9.2054443359375, -8.832763671875, -8.4600830078125, -8.08740234375, -7.7147216796875, -7.342041015625, -6.9693603515625, -6.5966796875, -6.2239990234375, -5.851318359375, -5.4786376953125, -5.10595703125, -4.7332763671875, -4.360595703125, -3.9879150390625, -3.615234375, -3.2425537109375, -2.869873046875, -2.4971923828125, -2.12451171875, -1.7518310546875, -1.379150390625, -1.0064697265625, -0.6337890625, -0.2611083984375, 0.111572265625, 0.4842529296875, 0.85693359375, 1.2296142578125, 1.602294921875, 1.9749755859375, 2.34765625, 2.7203369140625, 3.093017578125, 3.4656982421875, 3.83837890625, 4.2110595703125, 4.583740234375, 4.9564208984375, 5.3291015625, 5.7017822265625, 6.074462890625, 6.4471435546875, 6.81982421875, 7.1925048828125, 7.565185546875, 7.9378662109375, 8.310546875, 8.6832275390625, 9.055908203125, 9.4285888671875, 9.80126953125, 10.1739501953125, 10.546630859375, 10.9193115234375, 11.2919921875, 11.6646728515625, 12.037353515625, 12.4100341796875, 12.78271484375, 13.1553955078125, 13.528076171875, 13.9007568359375, 14.2734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 8.0, 11.0, 15.0, 19.0, 20.0, 34.0, 57.0, 63.0, 90.0, 116.0, 183.0, 257.0, 360.0, 1219.0, 62348.0, 3753641.0, 371115.0, 3126.0, 496.0, 289.0, 202.0, 157.0, 105.0, 82.0, 55.0, 32.0, 46.0, 20.0, 24.0, 22.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0], "bins": [-62.71875, -61.0966796875, -59.474609375, -57.8525390625, -56.23046875, -54.6083984375, -52.986328125, -51.3642578125, -49.7421875, -48.1201171875, -46.498046875, -44.8759765625, -43.25390625, -41.6318359375, -40.009765625, -38.3876953125, -36.765625, -35.1435546875, -33.521484375, -31.8994140625, -30.27734375, -28.6552734375, -27.033203125, -25.4111328125, -23.7890625, -22.1669921875, -20.544921875, -18.9228515625, -17.30078125, -15.6787109375, -14.056640625, -12.4345703125, -10.8125, -9.1904296875, -7.568359375, -5.9462890625, -4.32421875, -2.7021484375, -1.080078125, 0.5419921875, 2.1640625, 3.7861328125, 5.408203125, 7.0302734375, 8.65234375, 10.2744140625, 11.896484375, 13.5185546875, 15.140625, 16.7626953125, 18.384765625, 20.0068359375, 21.62890625, 23.2509765625, 24.873046875, 26.4951171875, 28.1171875, 29.7392578125, 31.361328125, 32.9833984375, 34.60546875, 36.2275390625, 37.849609375, 39.4716796875, 41.09375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 29.0, 65.0, 112.0, 156.0, 220.0, 165.0, 133.0, 91.0, 24.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.68490600585938, -114.31295776367188, -110.94100952148438, -107.56905364990234, -104.19710540771484, -100.82515716552734, -97.45320129394531, -94.08125305175781, -90.70930480957031, -87.33735656738281, -83.96540832519531, -80.59345245361328, -77.22150421142578, -73.84955596923828, -70.47760009765625, -67.10565185546875, -63.73370361328125, -60.36175537109375, -56.989803314208984, -53.61785125732422, -50.24590301513672, -46.87395477294922, -43.50200271606445, -40.13005065917969, -36.75810241699219, -33.38615417480469, -30.014202117919922, -26.64225196838379, -23.270301818847656, -19.898351669311523, -16.52640151977539, -13.154451370239258, -9.782493591308594, -6.410543441772461, -3.038593292236328, 0.3333568572998047, 3.7053070068359375, 7.07725715637207, 10.449207305908203, 13.821157455444336, 17.19310760498047, 20.5650577545166, 23.937007904052734, 27.308958053588867, 30.680908203125, 34.0528564453125, 37.424808502197266, 40.79676055908203, 44.16870880126953, 47.54065704345703, 50.9126091003418, 54.28456115722656, 57.65650939941406, 61.02845764160156, 64.40040588378906, 67.7723617553711, 71.1443099975586, 74.5162582397461, 77.88821411132812, 81.26016235351562, 84.63211059570312, 88.00405883789062, 91.37600708007812, 94.74796295166016, 98.11991119384766]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 2.0, 9.0, 11.0, 12.0, 8.0, 19.0, 6.0, 16.0, 15.0, 24.0, 20.0, 22.0, 27.0, 20.0, 35.0, 35.0, 40.0, 35.0, 46.0, 32.0, 38.0, 34.0, 33.0, 32.0, 35.0, 38.0, 25.0, 30.0, 42.0, 32.0, 22.0, 38.0, 28.0, 13.0, 16.0, 15.0, 13.0, 12.0, 16.0, 9.0, 12.0, 5.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.139007568359375, -39.90483856201172, -38.67066955566406, -37.436500549316406, -36.20233154296875, -34.96815872192383, -33.73398971557617, -32.499820709228516, -31.26565170288086, -30.031482696533203, -28.797313690185547, -27.563142776489258, -26.3289737701416, -25.094804763793945, -23.860633850097656, -22.62646484375, -21.392295837402344, -20.158126831054688, -18.92395782470703, -17.689786911010742, -16.455617904663086, -15.22144889831543, -13.987278938293457, -12.753108978271484, -11.518939971923828, -10.284770965576172, -9.0506010055542, -7.816431522369385, -6.58226203918457, -5.348092555999756, -4.113923072814941, -2.8797531127929688, -1.6455841064453125, -0.41141462326049805, 0.8227548599243164, 2.056924343109131, 3.2910938262939453, 4.52526330947876, 5.759432792663574, 6.993602752685547, 8.227771759033203, 9.46194076538086, 10.696110725402832, 11.930280685424805, 13.164449691772461, 14.398618698120117, 15.63278865814209, 16.866958618164062, 18.10112762451172, 19.335296630859375, 20.56946563720703, 21.80363655090332, 23.037805557250977, 24.271974563598633, 25.506145477294922, 26.740314483642578, 27.974483489990234, 29.20865249633789, 30.442821502685547, 31.676992416381836, 32.911163330078125, 34.14533233642578, 35.37950134277344, 36.613670349121094, 37.84783935546875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 14.0, 17.0, 18.0, 18.0, 21.0, 24.0, 22.0, 24.0, 32.0, 45.0, 43.0, 45.0, 57.0, 43.0, 39.0, 44.0, 45.0, 52.0, 45.0, 33.0, 39.0, 40.0, 44.0, 33.0, 34.0, 26.0, 21.0, 17.0, 11.0, 13.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -7.0423583984375, -6.811279296875, -6.5802001953125, -6.34912109375, -6.1180419921875, -5.886962890625, -5.6558837890625, -5.4248046875, -5.1937255859375, -4.962646484375, -4.7315673828125, -4.50048828125, -4.2694091796875, -4.038330078125, -3.8072509765625, -3.576171875, -3.3450927734375, -3.114013671875, -2.8829345703125, -2.65185546875, -2.4207763671875, -2.189697265625, -1.9586181640625, -1.7275390625, -1.4964599609375, -1.265380859375, -1.0343017578125, -0.80322265625, -0.5721435546875, -0.341064453125, -0.1099853515625, 0.12109375, 0.3521728515625, 0.583251953125, 0.8143310546875, 1.04541015625, 1.2764892578125, 1.507568359375, 1.7386474609375, 1.9697265625, 2.2008056640625, 2.431884765625, 2.6629638671875, 2.89404296875, 3.1251220703125, 3.356201171875, 3.5872802734375, 3.818359375, 4.0494384765625, 4.280517578125, 4.5115966796875, 4.74267578125, 4.9737548828125, 5.204833984375, 5.4359130859375, 5.6669921875, 5.8980712890625, 6.129150390625, 6.3602294921875, 6.59130859375, 6.8223876953125, 7.053466796875, 7.2845458984375, 7.515625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 4.0, 10.0, 10.0, 22.0, 18.0, 40.0, 55.0, 80.0, 172.0, 235.0, 379.0, 585.0, 890.0, 1292.0, 1975.0, 2823.0, 4280.0, 6195.0, 9084.0, 12879.0, 18377.0, 25667.0, 35257.0, 47812.0, 62860.0, 79136.0, 95188.0, 107404.0, 108745.0, 98119.0, 82976.0, 66277.0, 50896.0, 37548.0, 27411.0, 19497.0, 13931.0, 9565.0, 6787.0, 4586.0, 3120.0, 2154.0, 1427.0, 996.0, 655.0, 386.0, 287.0, 158.0, 105.0, 80.0, 66.0, 23.0, 22.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5899200439453125, -0.570953369140625, -0.5519866943359375, -0.53302001953125, -0.5140533447265625, -0.495086669921875, -0.4761199951171875, -0.4571533203125, -0.4381866455078125, -0.419219970703125, -0.4002532958984375, -0.38128662109375, -0.3623199462890625, -0.343353271484375, -0.3243865966796875, -0.305419921875, -0.2864532470703125, -0.267486572265625, -0.2485198974609375, -0.22955322265625, -0.2105865478515625, -0.191619873046875, -0.1726531982421875, -0.1536865234375, -0.1347198486328125, -0.115753173828125, -0.0967864990234375, -0.07781982421875, -0.0588531494140625, -0.039886474609375, -0.0209197998046875, -0.001953125, 0.0170135498046875, 0.035980224609375, 0.0549468994140625, 0.07391357421875, 0.0928802490234375, 0.111846923828125, 0.1308135986328125, 0.1497802734375, 0.1687469482421875, 0.187713623046875, 0.2066802978515625, 0.22564697265625, 0.2446136474609375, 0.263580322265625, 0.2825469970703125, 0.301513671875, 0.3204803466796875, 0.339447021484375, 0.3584136962890625, 0.37738037109375, 0.3963470458984375, 0.415313720703125, 0.4342803955078125, 0.4532470703125, 0.4722137451171875, 0.491180419921875, 0.5101470947265625, 0.52911376953125, 0.5480804443359375, 0.567047119140625, 0.5860137939453125, 0.60498046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 8.0, 11.0, 19.0, 8.0, 11.0, 21.0, 25.0, 20.0, 17.0, 29.0, 30.0, 35.0, 37.0, 43.0, 39.0, 48.0, 48.0, 30.0, 1070.0, 32.0, 43.0, 39.0, 41.0, 25.0, 42.0, 45.0, 28.0, 21.0, 23.0, 21.0, 13.0, 17.0, 16.0, 10.0, 10.0, 13.0, 4.0, 11.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.64666748046875, -4.4847412109375, -4.32281494140625, -4.160888671875, -3.99896240234375, -3.8370361328125, -3.67510986328125, -3.51318359375, -3.35125732421875, -3.1893310546875, -3.02740478515625, -2.865478515625, -2.70355224609375, -2.5416259765625, -2.37969970703125, -2.2177734375, -2.05584716796875, -1.8939208984375, -1.73199462890625, -1.570068359375, -1.40814208984375, -1.2462158203125, -1.08428955078125, -0.92236328125, -0.76043701171875, -0.5985107421875, -0.43658447265625, -0.274658203125, -0.11273193359375, 0.0491943359375, 0.21112060546875, 0.373046875, 0.53497314453125, 0.6968994140625, 0.85882568359375, 1.020751953125, 1.18267822265625, 1.3446044921875, 1.50653076171875, 1.66845703125, 1.83038330078125, 1.9923095703125, 2.15423583984375, 2.316162109375, 2.47808837890625, 2.6400146484375, 2.80194091796875, 2.9638671875, 3.12579345703125, 3.2877197265625, 3.44964599609375, 3.611572265625, 3.77349853515625, 3.9354248046875, 4.09735107421875, 4.25927734375, 4.42120361328125, 4.5831298828125, 4.74505615234375, 4.906982421875, 5.06890869140625, 5.2308349609375, 5.39276123046875, 5.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 4.0, 12.0, 13.0, 34.0, 47.0, 62.0, 84.0, 147.0, 195.0, 257.0, 441.0, 599.0, 949.0, 1454.0, 2109.0, 3256.0, 4902.0, 7478.0, 10787.0, 16373.0, 24217.0, 34929.0, 49567.0, 67844.0, 88755.0, 113238.0, 931883.0, 346665.0, 104250.0, 82074.0, 62221.0, 44674.0, 31557.0, 21851.0, 14571.0, 9841.0, 6597.0, 4365.0, 2906.0, 1930.0, 1330.0, 864.0, 587.0, 359.0, 287.0, 198.0, 113.0, 89.0, 50.0, 37.0, 29.0, 22.0, 12.0, 9.0, 3.0, 4.0, 3.0], "bins": [-0.3857421875, -0.3743476867675781, -0.36295318603515625, -0.3515586853027344, -0.3401641845703125, -0.3287696838378906, -0.31737518310546875, -0.3059806823730469, -0.294586181640625, -0.2831916809082031, -0.27179718017578125, -0.2604026794433594, -0.2490081787109375, -0.23761367797851562, -0.22621917724609375, -0.21482467651367188, -0.20343017578125, -0.19203567504882812, -0.18064117431640625, -0.16924667358398438, -0.1578521728515625, -0.14645767211914062, -0.13506317138671875, -0.12366867065429688, -0.112274169921875, -0.10087966918945312, -0.08948516845703125, -0.07809066772460938, -0.0666961669921875, -0.055301666259765625, -0.04390716552734375, -0.032512664794921875, -0.0211181640625, -0.009723663330078125, 0.00167083740234375, 0.013065338134765625, 0.0244598388671875, 0.035854339599609375, 0.04724884033203125, 0.058643341064453125, 0.070037841796875, 0.08143234252929688, 0.09282684326171875, 0.10422134399414062, 0.1156158447265625, 0.12701034545898438, 0.13840484619140625, 0.14979934692382812, 0.16119384765625, 0.17258834838867188, 0.18398284912109375, 0.19537734985351562, 0.2067718505859375, 0.21816635131835938, 0.22956085205078125, 0.24095535278320312, 0.252349853515625, 0.2637443542480469, 0.27513885498046875, 0.2865333557128906, 0.2979278564453125, 0.3093223571777344, 0.32071685791015625, 0.3321113586425781, 0.343505859375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 8.0, 9.0, 7.0, 14.0, 8.0, 14.0, 12.0, 13.0, 18.0, 16.0, 26.0, 31.0, 22.0, 40.0, 50.0, 58.0, 69.0, 53.0, 57.0, 56.0, 60.0, 55.0, 42.0, 31.0, 32.0, 22.0, 19.0, 17.0, 23.0, 15.0, 15.0, 12.0, 11.0, 15.0, 6.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.050201416015625, -0.04867696762084961, -0.04715251922607422, -0.04562807083129883, -0.04410362243652344, -0.04257917404174805, -0.041054725646972656, -0.039530277252197266, -0.038005828857421875, -0.036481380462646484, -0.034956932067871094, -0.0334324836730957, -0.03190803527832031, -0.030383586883544922, -0.02885913848876953, -0.02733469009399414, -0.02581024169921875, -0.02428579330444336, -0.02276134490966797, -0.021236896514892578, -0.019712448120117188, -0.018187999725341797, -0.016663551330566406, -0.015139102935791016, -0.013614654541015625, -0.012090206146240234, -0.010565757751464844, -0.009041309356689453, -0.0075168609619140625, -0.005992412567138672, -0.004467964172363281, -0.0029435157775878906, -0.0014190673828125, 0.00010538101196289062, 0.0016298294067382812, 0.003154277801513672, 0.0046787261962890625, 0.006203174591064453, 0.007727622985839844, 0.009252071380615234, 0.010776519775390625, 0.012300968170166016, 0.013825416564941406, 0.015349864959716797, 0.016874313354492188, 0.018398761749267578, 0.01992321014404297, 0.02144765853881836, 0.02297210693359375, 0.02449655532836914, 0.02602100372314453, 0.027545452117919922, 0.029069900512695312, 0.030594348907470703, 0.032118797302246094, 0.033643245697021484, 0.035167694091796875, 0.036692142486572266, 0.038216590881347656, 0.03974103927612305, 0.04126548767089844, 0.04278993606567383, 0.04431438446044922, 0.04583883285522461, 0.04736328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 18.0, 15.0, 12.0, 25.0, 25.0, 24.0, 41.0, 46.0, 66.0, 138.0, 175.0, 340.0, 1237.0, 50274.0, 988454.0, 6304.0, 604.0, 245.0, 139.0, 85.0, 57.0, 37.0, 27.0, 24.0, 19.0, 17.0, 10.0, 18.0, 5.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.0758056640625, -1.040283203125, -1.0047607421875, -0.96923828125, -0.9337158203125, -0.898193359375, -0.8626708984375, -0.8271484375, -0.7916259765625, -0.756103515625, -0.7205810546875, -0.68505859375, -0.6495361328125, -0.614013671875, -0.5784912109375, -0.54296875, -0.5074462890625, -0.471923828125, -0.4364013671875, -0.40087890625, -0.3653564453125, -0.329833984375, -0.2943115234375, -0.2587890625, -0.2232666015625, -0.187744140625, -0.1522216796875, -0.11669921875, -0.0811767578125, -0.045654296875, -0.0101318359375, 0.025390625, 0.0609130859375, 0.096435546875, 0.1319580078125, 0.16748046875, 0.2030029296875, 0.238525390625, 0.2740478515625, 0.3095703125, 0.3450927734375, 0.380615234375, 0.4161376953125, 0.45166015625, 0.4871826171875, 0.522705078125, 0.5582275390625, 0.59375, 0.6292724609375, 0.664794921875, 0.7003173828125, 0.73583984375, 0.7713623046875, 0.806884765625, 0.8424072265625, 0.8779296875, 0.9134521484375, 0.948974609375, 0.9844970703125, 1.02001953125, 1.0555419921875, 1.091064453125, 1.1265869140625, 1.162109375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 38.0, 83.0, 374.0, 375.0, 82.0, 33.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5864637494087219, -0.5701732635498047, -0.5538827776908875, -0.5375922918319702, -0.521301805973053, -0.5050113201141357, -0.4887208342552185, -0.47243034839630127, -0.45613986253738403, -0.4398493766784668, -0.42355889081954956, -0.4072684049606323, -0.3909779191017151, -0.37468743324279785, -0.3583969473838806, -0.3421064615249634, -0.32581600546836853, -0.3095255196094513, -0.29323503375053406, -0.2769445478916168, -0.2606540620326996, -0.24436357617378235, -0.2280731052160263, -0.21178261935710907, -0.19549213349819183, -0.1792016476392746, -0.16291116178035736, -0.14662069082260132, -0.13033020496368408, -0.11403971165418625, -0.09774923324584961, -0.08145874738693237, -0.06516826152801514, -0.0488777756690979, -0.03258729353547096, -0.016296811401844025, -6.32554292678833e-06, 0.016284160315990448, 0.03257463872432709, 0.048865124583244324, 0.06515561044216156, 0.0814460963010788, 0.09773658215999603, 0.11402706056833267, 0.1303175389766693, 0.14660802483558655, 0.16289851069450378, 0.17918899655342102, 0.19547948241233826, 0.2117699682712555, 0.22806045413017273, 0.24435093998908997, 0.2606414258480072, 0.27693191170692444, 0.2932223677635193, 0.3095128536224365, 0.32580333948135376, 0.342093825340271, 0.35838431119918823, 0.37467479705810547, 0.3909652829170227, 0.40725576877593994, 0.4235462546348572, 0.4398367404937744, 0.45612722635269165]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 1.0, 5.0, 11.0, 12.0, 8.0, 11.0, 17.0, 12.0, 24.0, 19.0, 21.0, 22.0, 27.0, 32.0, 35.0, 29.0, 36.0, 38.0, 36.0, 40.0, 45.0, 37.0, 39.0, 38.0, 40.0, 44.0, 38.0, 38.0, 29.0, 34.0, 23.0, 31.0, 21.0, 15.0, 16.0, 8.0, 17.0, 7.0, 12.0, 11.0, 3.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1927649974822998, -0.1873200684785843, -0.18187513947486877, -0.17643019556999207, -0.17098526656627655, -0.16554033756256104, -0.16009539365768433, -0.1546504646539688, -0.1492055356502533, -0.14376060664653778, -0.13831567764282227, -0.13287073373794556, -0.12742580473423004, -0.12198087573051453, -0.11653593927621841, -0.1110910028219223, -0.10564607381820679, -0.10020114481449127, -0.09475620836019516, -0.08931127190589905, -0.08386634290218353, -0.07842141389846802, -0.0729764774441719, -0.0675315409898758, -0.06208661198616028, -0.056641679257154465, -0.05119674652814865, -0.04575181379914284, -0.040306881070137024, -0.03486194834113121, -0.029417015612125397, -0.023972082883119583, -0.01852715015411377, -0.013082217425107956, -0.007637284696102142, -0.0021923519670963287, 0.003252580761909485, 0.008697513490915298, 0.014142446219921112, 0.019587378948926926, 0.02503231167793274, 0.030477244406938553, 0.035922177135944366, 0.04136710986495018, 0.046812042593955994, 0.05225697532296181, 0.05770190805196762, 0.06314684450626373, 0.06859177350997925, 0.07403670251369476, 0.07948163896799088, 0.08492657542228699, 0.0903715044260025, 0.09581643342971802, 0.10126136988401413, 0.10670630633831024, 0.11215123534202576, 0.11759616434574127, 0.12304110080003738, 0.1284860372543335, 0.133930966258049, 0.13937589526176453, 0.14482083916664124, 0.15026576817035675, 0.15571069717407227]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 17.0, 6.0, 13.0, 17.0, 19.0, 21.0, 16.0, 24.0, 28.0, 40.0, 41.0, 36.0, 41.0, 37.0, 43.0, 56.0, 38.0, 51.0, 47.0, 44.0, 45.0, 40.0, 41.0, 35.0, 29.0, 21.0, 44.0, 17.0, 27.0, 20.0, 14.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.046875, -7.81585693359375, -7.5848388671875, -7.35382080078125, -7.122802734375, -6.89178466796875, -6.6607666015625, -6.42974853515625, -6.19873046875, -5.96771240234375, -5.7366943359375, -5.50567626953125, -5.274658203125, -5.04364013671875, -4.8126220703125, -4.58160400390625, -4.3505859375, -4.11956787109375, -3.8885498046875, -3.65753173828125, -3.426513671875, -3.19549560546875, -2.9644775390625, -2.73345947265625, -2.50244140625, -2.27142333984375, -2.0404052734375, -1.80938720703125, -1.578369140625, -1.34735107421875, -1.1163330078125, -0.88531494140625, -0.654296875, -0.42327880859375, -0.1922607421875, 0.03875732421875, 0.269775390625, 0.50079345703125, 0.7318115234375, 0.96282958984375, 1.19384765625, 1.42486572265625, 1.6558837890625, 1.88690185546875, 2.117919921875, 2.34893798828125, 2.5799560546875, 2.81097412109375, 3.0419921875, 3.27301025390625, 3.5040283203125, 3.73504638671875, 3.966064453125, 4.19708251953125, 4.4281005859375, 4.65911865234375, 4.89013671875, 5.12115478515625, 5.3521728515625, 5.58319091796875, 5.814208984375, 6.04522705078125, 6.2762451171875, 6.50726318359375, 6.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 6.0, 14.0, 17.0, 24.0, 40.0, 58.0, 79.0, 102.0, 179.0, 283.0, 443.0, 831.0, 1387.0, 2436.0, 4301.0, 8267.0, 15978.0, 31548.0, 64482.0, 132920.0, 289181.0, 259203.0, 119274.0, 57864.0, 28468.0, 14204.0, 7513.0, 4054.0, 2138.0, 1314.0, 754.0, 445.0, 257.0, 151.0, 103.0, 88.0, 45.0, 28.0, 17.0, 18.0, 13.0, 7.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-7.953125, -7.71868896484375, -7.4842529296875, -7.24981689453125, -7.015380859375, -6.78094482421875, -6.5465087890625, -6.31207275390625, -6.07763671875, -5.84320068359375, -5.6087646484375, -5.37432861328125, -5.139892578125, -4.90545654296875, -4.6710205078125, -4.43658447265625, -4.2021484375, -3.96771240234375, -3.7332763671875, -3.49884033203125, -3.264404296875, -3.02996826171875, -2.7955322265625, -2.56109619140625, -2.32666015625, -2.09222412109375, -1.8577880859375, -1.62335205078125, -1.388916015625, -1.15447998046875, -0.9200439453125, -0.68560791015625, -0.451171875, -0.21673583984375, 0.0177001953125, 0.25213623046875, 0.486572265625, 0.72100830078125, 0.9554443359375, 1.18988037109375, 1.42431640625, 1.65875244140625, 1.8931884765625, 2.12762451171875, 2.362060546875, 2.59649658203125, 2.8309326171875, 3.06536865234375, 3.2998046875, 3.53424072265625, 3.7686767578125, 4.00311279296875, 4.237548828125, 4.47198486328125, 4.7064208984375, 4.94085693359375, 5.17529296875, 5.40972900390625, 5.6441650390625, 5.87860107421875, 6.113037109375, 6.34747314453125, 6.5819091796875, 6.81634521484375, 7.05078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 6.0, 10.0, 6.0, 9.0, 11.0, 15.0, 10.0, 17.0, 19.0, 25.0, 29.0, 38.0, 30.0, 40.0, 34.0, 43.0, 56.0, 72.0, 119.0, 284.0, 1402.0, 238.0, 114.0, 53.0, 50.0, 35.0, 24.0, 34.0, 30.0, 29.0, 28.0, 24.0, 20.0, 24.0, 14.0, 11.0, 8.0, 5.0, 7.0, 10.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -17.004638671875, -16.38427734375, -15.763916015625, -15.1435546875, -14.523193359375, -13.90283203125, -13.282470703125, -12.662109375, -12.041748046875, -11.42138671875, -10.801025390625, -10.1806640625, -9.560302734375, -8.93994140625, -8.319580078125, -7.69921875, -7.078857421875, -6.45849609375, -5.838134765625, -5.2177734375, -4.597412109375, -3.97705078125, -3.356689453125, -2.736328125, -2.115966796875, -1.49560546875, -0.875244140625, -0.2548828125, 0.365478515625, 0.98583984375, 1.606201171875, 2.2265625, 2.846923828125, 3.46728515625, 4.087646484375, 4.7080078125, 5.328369140625, 5.94873046875, 6.569091796875, 7.189453125, 7.809814453125, 8.43017578125, 9.050537109375, 9.6708984375, 10.291259765625, 10.91162109375, 11.531982421875, 12.15234375, 12.772705078125, 13.39306640625, 14.013427734375, 14.6337890625, 15.254150390625, 15.87451171875, 16.494873046875, 17.115234375, 17.735595703125, 18.35595703125, 18.976318359375, 19.5966796875, 20.217041015625, 20.83740234375, 21.457763671875, 22.078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 16.0, 18.0, 22.0, 24.0, 35.0, 43.0, 66.0, 84.0, 127.0, 198.0, 303.0, 705.0, 2518.0, 138768.0, 2987176.0, 12948.0, 1303.0, 497.0, 238.0, 183.0, 110.0, 71.0, 50.0, 47.0, 27.0, 25.0, 17.0, 13.0, 3.0, 11.0, 4.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.1875, -66.138671875, -64.08984375, -62.041015625, -59.9921875, -57.943359375, -55.89453125, -53.845703125, -51.796875, -49.748046875, -47.69921875, -45.650390625, -43.6015625, -41.552734375, -39.50390625, -37.455078125, -35.40625, -33.357421875, -31.30859375, -29.259765625, -27.2109375, -25.162109375, -23.11328125, -21.064453125, -19.015625, -16.966796875, -14.91796875, -12.869140625, -10.8203125, -8.771484375, -6.72265625, -4.673828125, -2.625, -0.576171875, 1.47265625, 3.521484375, 5.5703125, 7.619140625, 9.66796875, 11.716796875, 13.765625, 15.814453125, 17.86328125, 19.912109375, 21.9609375, 24.009765625, 26.05859375, 28.107421875, 30.15625, 32.205078125, 34.25390625, 36.302734375, 38.3515625, 40.400390625, 42.44921875, 44.498046875, 46.546875, 48.595703125, 50.64453125, 52.693359375, 54.7421875, 56.791015625, 58.83984375, 60.888671875, 62.9375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 2.0, 13.0, 27.0, 25.0, 55.0, 99.0, 124.0, 130.0, 140.0, 126.0, 102.0, 81.0, 38.0, 25.0, 10.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.031455993652344, -14.725845336914062, -13.420234680175781, -12.1146240234375, -10.809013366699219, -9.503402709960938, -8.197793006896973, -6.892182350158691, -5.58657169342041, -4.280961036682129, -2.9753506183624268, -1.6697402000427246, -0.36412954330444336, 0.9414811134338379, 2.247091293334961, 3.552701950073242, 4.858312606811523, 6.163923263549805, 7.469533920288086, 8.775144577026367, 10.080755233764648, 11.38636589050293, 12.691975593566895, 13.997586250305176, 15.303196907043457, 16.608806610107422, 17.914417266845703, 19.220027923583984, 20.525638580322266, 21.831249237060547, 23.136859893798828, 24.44247055053711, 25.74808120727539, 27.053691864013672, 28.359302520751953, 29.664913177490234, 30.970523834228516, 32.2761344909668, 33.58174514770508, 34.88735580444336, 36.19296646118164, 37.49857711791992, 38.8041877746582, 40.109798431396484, 41.415409088134766, 42.72101974487305, 44.02663040161133, 45.33224105834961, 46.637847900390625, 47.943458557128906, 49.24906921386719, 50.55467987060547, 51.86029052734375, 53.16590118408203, 54.47151184082031, 55.777122497558594, 57.082733154296875, 58.388343811035156, 59.69395446777344, 60.99956512451172, 62.30517578125, 63.61078643798828, 64.91639709472656, 66.22200775146484, 67.52761840820312]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 7.0, 10.0, 5.0, 11.0, 11.0, 10.0, 18.0, 15.0, 15.0, 20.0, 27.0, 36.0, 36.0, 27.0, 44.0, 33.0, 26.0, 30.0, 37.0, 41.0, 26.0, 44.0, 45.0, 29.0, 38.0, 27.0, 32.0, 33.0, 28.0, 27.0, 23.0, 17.0, 29.0, 21.0, 20.0, 17.0, 7.0, 14.0, 15.0, 6.0, 10.0, 6.0, 4.0, 8.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.43549346923828, -45.97197341918945, -44.508453369140625, -43.04492950439453, -41.5814094543457, -40.117889404296875, -38.65436553955078, -37.19084548950195, -35.727325439453125, -34.2638053894043, -32.80028533935547, -31.336761474609375, -29.873241424560547, -28.40972137451172, -26.946199417114258, -25.482677459716797, -24.01915740966797, -22.55563735961914, -21.09211540222168, -19.62859344482422, -18.16507339477539, -16.701553344726562, -15.238031387329102, -13.774510383605957, -12.310989379882812, -10.847468376159668, -9.383947372436523, -7.920426368713379, -6.456905364990234, -4.99338436126709, -3.5298633575439453, -2.066342353820801, -0.6028175354003906, 0.8607034683227539, 2.3242244720458984, 3.787745475769043, 5.2512664794921875, 6.714787483215332, 8.178308486938477, 9.641829490661621, 11.105350494384766, 12.56887149810791, 14.032392501831055, 15.4959135055542, 16.959434509277344, 18.422954559326172, 19.886476516723633, 21.349998474121094, 22.813518524169922, 24.27703857421875, 25.74056053161621, 27.204082489013672, 28.6676025390625, 30.131122589111328, 31.59464454650879, 33.05816650390625, 34.52168655395508, 35.985206604003906, 37.44873046875, 38.91225051879883, 40.375770568847656, 41.839290618896484, 43.30281066894531, 44.766334533691406, 46.229854583740234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 15.0, 14.0, 13.0, 11.0, 18.0, 19.0, 22.0, 25.0, 33.0, 24.0, 43.0, 40.0, 36.0, 31.0, 47.0, 49.0, 43.0, 52.0, 54.0, 43.0, 42.0, 39.0, 41.0, 28.0, 40.0, 28.0, 26.0, 17.0, 22.0, 12.0, 18.0, 19.0, 10.0, 6.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.160400390625, -6.91455078125, -6.668701171875, -6.4228515625, -6.177001953125, -5.93115234375, -5.685302734375, -5.439453125, -5.193603515625, -4.94775390625, -4.701904296875, -4.4560546875, -4.210205078125, -3.96435546875, -3.718505859375, -3.47265625, -3.226806640625, -2.98095703125, -2.735107421875, -2.4892578125, -2.243408203125, -1.99755859375, -1.751708984375, -1.505859375, -1.260009765625, -1.01416015625, -0.768310546875, -0.5224609375, -0.276611328125, -0.03076171875, 0.215087890625, 0.4609375, 0.706787109375, 0.95263671875, 1.198486328125, 1.4443359375, 1.690185546875, 1.93603515625, 2.181884765625, 2.427734375, 2.673583984375, 2.91943359375, 3.165283203125, 3.4111328125, 3.656982421875, 3.90283203125, 4.148681640625, 4.39453125, 4.640380859375, 4.88623046875, 5.132080078125, 5.3779296875, 5.623779296875, 5.86962890625, 6.115478515625, 6.361328125, 6.607177734375, 6.85302734375, 7.098876953125, 7.3447265625, 7.590576171875, 7.83642578125, 8.082275390625, 8.328125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 1.0, 9.0, 12.0, 10.0, 9.0, 18.0, 12.0, 22.0, 17.0, 28.0, 35.0, 37.0, 79.0, 167.0, 434.0, 1845.0, 12622.0, 126939.0, 1239348.0, 2379400.0, 391272.0, 36084.0, 4417.0, 874.0, 225.0, 110.0, 61.0, 32.0, 31.0, 25.0, 25.0, 14.0, 14.0, 8.0, 13.0, 4.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.714599609375, -15.19482421875, -14.675048828125, -14.1552734375, -13.635498046875, -13.11572265625, -12.595947265625, -12.076171875, -11.556396484375, -11.03662109375, -10.516845703125, -9.9970703125, -9.477294921875, -8.95751953125, -8.437744140625, -7.91796875, -7.398193359375, -6.87841796875, -6.358642578125, -5.8388671875, -5.319091796875, -4.79931640625, -4.279541015625, -3.759765625, -3.239990234375, -2.72021484375, -2.200439453125, -1.6806640625, -1.160888671875, -0.64111328125, -0.121337890625, 0.3984375, 0.918212890625, 1.43798828125, 1.957763671875, 2.4775390625, 2.997314453125, 3.51708984375, 4.036865234375, 4.556640625, 5.076416015625, 5.59619140625, 6.115966796875, 6.6357421875, 7.155517578125, 7.67529296875, 8.195068359375, 8.71484375, 9.234619140625, 9.75439453125, 10.274169921875, 10.7939453125, 11.313720703125, 11.83349609375, 12.353271484375, 12.873046875, 13.392822265625, 13.91259765625, 14.432373046875, 14.9521484375, 15.471923828125, 15.99169921875, 16.511474609375, 17.03125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 12.0, 15.0, 17.0, 21.0, 22.0, 22.0, 45.0, 45.0, 55.0, 91.0, 109.0, 145.0, 182.0, 207.0, 279.0, 338.0, 389.0, 375.0, 367.0, 284.0, 217.0, 185.0, 165.0, 109.0, 65.0, 69.0, 52.0, 43.0, 36.0, 26.0, 18.0, 15.0, 12.0, 5.0, 5.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8294677734375, -8.502685546875, -8.1759033203125, -7.84912109375, -7.5223388671875, -7.195556640625, -6.8687744140625, -6.5419921875, -6.2152099609375, -5.888427734375, -5.5616455078125, -5.23486328125, -4.9080810546875, -4.581298828125, -4.2545166015625, -3.927734375, -3.6009521484375, -3.274169921875, -2.9473876953125, -2.62060546875, -2.2938232421875, -1.967041015625, -1.6402587890625, -1.3134765625, -0.9866943359375, -0.659912109375, -0.3331298828125, -0.00634765625, 0.3204345703125, 0.647216796875, 0.9739990234375, 1.30078125, 1.6275634765625, 1.954345703125, 2.2811279296875, 2.60791015625, 2.9346923828125, 3.261474609375, 3.5882568359375, 3.9150390625, 4.2418212890625, 4.568603515625, 4.8953857421875, 5.22216796875, 5.5489501953125, 5.875732421875, 6.2025146484375, 6.529296875, 6.8560791015625, 7.182861328125, 7.5096435546875, 7.83642578125, 8.1632080078125, 8.489990234375, 8.8167724609375, 9.1435546875, 9.4703369140625, 9.797119140625, 10.1239013671875, 10.45068359375, 10.7774658203125, 11.104248046875, 11.4310302734375, 11.7578125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 7.0, 18.0, 24.0, 25.0, 39.0, 42.0, 48.0, 71.0, 83.0, 135.0, 159.0, 225.0, 346.0, 759.0, 20685.0, 3395661.0, 770540.0, 3784.0, 486.0, 305.0, 193.0, 145.0, 110.0, 96.0, 57.0, 41.0, 36.0, 28.0, 18.0, 21.0, 14.0, 19.0, 11.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.0, -59.296875, -57.59375, -55.890625, -54.1875, -52.484375, -50.78125, -49.078125, -47.375, -45.671875, -43.96875, -42.265625, -40.5625, -38.859375, -37.15625, -35.453125, -33.75, -32.046875, -30.34375, -28.640625, -26.9375, -25.234375, -23.53125, -21.828125, -20.125, -18.421875, -16.71875, -15.015625, -13.3125, -11.609375, -9.90625, -8.203125, -6.5, -4.796875, -3.09375, -1.390625, 0.3125, 2.015625, 3.71875, 5.421875, 7.125, 8.828125, 10.53125, 12.234375, 13.9375, 15.640625, 17.34375, 19.046875, 20.75, 22.453125, 24.15625, 25.859375, 27.5625, 29.265625, 30.96875, 32.671875, 34.375, 36.078125, 37.78125, 39.484375, 41.1875, 42.890625, 44.59375, 46.296875, 48.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 18.0, 42.0, 36.0, 45.0, 54.0, 88.0, 89.0, 92.0, 106.0, 96.0, 77.0, 89.0, 43.0, 44.0, 25.0, 23.0, 13.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.161476135253906, -33.638694763183594, -32.11591339111328, -30.5931339263916, -29.07035255432129, -27.54757308959961, -26.024791717529297, -24.502010345458984, -22.979228973388672, -21.45644760131836, -19.93366813659668, -18.410886764526367, -16.888105392456055, -15.365324974060059, -13.842544555664062, -12.31976318359375, -10.79698371887207, -9.274203300476074, -7.751421928405762, -6.228641510009766, -4.705860614776611, -3.183079719543457, -1.660299301147461, -0.13751792907714844, 1.3852624893188477, 2.908043384552002, 4.430824279785156, 5.953604698181152, 7.476385593414307, 8.999166488647461, 10.521946907043457, 12.04472827911377, 13.567508697509766, 15.090289115905762, 16.613069534301758, 18.13585090637207, 19.658632278442383, 21.181411743164062, 22.704193115234375, 24.226974487304688, 25.749755859375, 27.272537231445312, 28.795316696166992, 30.318098068237305, 31.840879440307617, 33.3636589050293, 34.88644027709961, 36.40922164916992, 37.93199920654297, 39.45478057861328, 40.977561950683594, 42.500343322753906, 44.02312088012695, 45.545902252197266, 47.06868362426758, 48.59146499633789, 50.1142463684082, 51.637027740478516, 53.15980911254883, 54.682586669921875, 56.20536804199219, 57.7281494140625, 59.25093078613281, 60.773712158203125, 62.29649353027344]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 0.0, 1.0, 2.0, 8.0, 8.0, 11.0, 9.0, 15.0, 12.0, 13.0, 14.0, 30.0, 24.0, 28.0, 17.0, 26.0, 38.0, 42.0, 43.0, 47.0, 37.0, 48.0, 28.0, 40.0, 40.0, 44.0, 37.0, 33.0, 27.0, 33.0, 29.0, 29.0, 26.0, 22.0, 23.0, 20.0, 20.0, 12.0, 14.0, 12.0, 3.0, 7.0, 6.0, 5.0, 7.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.899864196777344, -37.698829650878906, -36.49779510498047, -35.29676055908203, -34.095726013183594, -32.89468765258789, -31.693653106689453, -30.492618560791016, -29.291584014892578, -28.09054946899414, -26.889514923095703, -25.688478469848633, -24.487443923950195, -23.286409378051758, -22.085372924804688, -20.88433837890625, -19.683303833007812, -18.482269287109375, -17.281234741210938, -16.080198287963867, -14.87916374206543, -13.678129196166992, -12.477093696594238, -11.276058197021484, -10.075023651123047, -8.87398910522461, -7.6729536056518555, -6.47191858291626, -5.270883560180664, -4.069848537445068, -2.8688135147094727, -1.6677780151367188, -0.4667396545410156, 0.7342953681945801, 1.9353303909301758, 3.1363654136657715, 4.337400436401367, 5.538435459136963, 6.739470481872559, 7.9405059814453125, 9.14154052734375, 10.342575073242188, 11.543610572814941, 12.744646072387695, 13.945680618286133, 15.14671516418457, 16.34775161743164, 17.548786163330078, 18.749820709228516, 19.950855255126953, 21.15188980102539, 22.35292625427246, 23.5539608001709, 24.754995346069336, 25.956031799316406, 27.157066345214844, 28.35810089111328, 29.55913543701172, 30.760169982910156, 31.961206436157227, 33.16223907470703, 34.363277435302734, 35.56431198120117, 36.76534652709961, 37.96638107299805]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 11.0, 15.0, 12.0, 17.0, 10.0, 32.0, 21.0, 31.0, 24.0, 30.0, 23.0, 42.0, 33.0, 54.0, 53.0, 51.0, 45.0, 47.0, 42.0, 40.0, 45.0, 40.0, 33.0, 36.0, 33.0, 32.0, 29.0, 22.0, 15.0, 16.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.51690673828125, -6.2799072265625, -6.04290771484375, -5.805908203125, -5.56890869140625, -5.3319091796875, -5.09490966796875, -4.85791015625, -4.62091064453125, -4.3839111328125, -4.14691162109375, -3.909912109375, -3.67291259765625, -3.4359130859375, -3.19891357421875, -2.9619140625, -2.72491455078125, -2.4879150390625, -2.25091552734375, -2.013916015625, -1.77691650390625, -1.5399169921875, -1.30291748046875, -1.06591796875, -0.82891845703125, -0.5919189453125, -0.35491943359375, -0.117919921875, 0.11907958984375, 0.3560791015625, 0.59307861328125, 0.830078125, 1.06707763671875, 1.3040771484375, 1.54107666015625, 1.778076171875, 2.01507568359375, 2.2520751953125, 2.48907470703125, 2.72607421875, 2.96307373046875, 3.2000732421875, 3.43707275390625, 3.674072265625, 3.91107177734375, 4.1480712890625, 4.38507080078125, 4.6220703125, 4.85906982421875, 5.0960693359375, 5.33306884765625, 5.570068359375, 5.80706787109375, 6.0440673828125, 6.28106689453125, 6.51806640625, 6.75506591796875, 6.9920654296875, 7.22906494140625, 7.466064453125, 7.70306396484375, 7.9400634765625, 8.17706298828125, 8.4140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 9.0, 12.0, 21.0, 30.0, 45.0, 64.0, 88.0, 161.0, 253.0, 370.0, 584.0, 858.0, 1369.0, 1943.0, 2968.0, 4536.0, 6756.0, 10019.0, 14886.0, 21303.0, 30579.0, 42689.0, 57506.0, 75030.0, 94511.0, 109750.0, 117059.0, 107331.0, 90798.0, 72200.0, 54368.0, 40663.0, 28270.0, 20036.0, 13724.0, 9209.0, 6212.0, 4209.0, 2733.0, 1857.0, 1211.0, 772.0, 548.0, 395.0, 223.0, 112.0, 106.0, 61.0, 48.0, 23.0, 20.0, 5.0, 7.0, 7.0, 4.0, 5.0, 2.0], "bins": [-0.67822265625, -0.6579208374023438, -0.6376190185546875, -0.6173171997070312, -0.597015380859375, -0.5767135620117188, -0.5564117431640625, -0.5361099243164062, -0.51580810546875, -0.49550628662109375, -0.4752044677734375, -0.45490264892578125, -0.434600830078125, -0.41429901123046875, -0.3939971923828125, -0.37369537353515625, -0.3533935546875, -0.33309173583984375, -0.3127899169921875, -0.29248809814453125, -0.272186279296875, -0.25188446044921875, -0.2315826416015625, -0.21128082275390625, -0.19097900390625, -0.17067718505859375, -0.1503753662109375, -0.13007354736328125, -0.109771728515625, -0.08946990966796875, -0.0691680908203125, -0.04886627197265625, -0.028564453125, -0.00826263427734375, 0.0120391845703125, 0.03234100341796875, 0.052642822265625, 0.07294464111328125, 0.0932464599609375, 0.11354827880859375, 0.13385009765625, 0.15415191650390625, 0.1744537353515625, 0.19475555419921875, 0.215057373046875, 0.23535919189453125, 0.2556610107421875, 0.27596282958984375, 0.2962646484375, 0.31656646728515625, 0.3368682861328125, 0.35717010498046875, 0.377471923828125, 0.39777374267578125, 0.4180755615234375, 0.43837738037109375, 0.45867919921875, 0.47898101806640625, 0.4992828369140625, 0.5195846557617188, 0.539886474609375, 0.5601882934570312, 0.5804901123046875, 0.6007919311523438, 0.62109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 14.0, 7.0, 15.0, 16.0, 21.0, 31.0, 28.0, 26.0, 34.0, 38.0, 49.0, 41.0, 61.0, 47.0, 49.0, 1086.0, 44.0, 49.0, 37.0, 44.0, 39.0, 33.0, 29.0, 25.0, 23.0, 26.0, 29.0, 15.0, 19.0, 9.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3218994140625, -5.120361328125, -4.9188232421875, -4.71728515625, -4.5157470703125, -4.314208984375, -4.1126708984375, -3.9111328125, -3.7095947265625, -3.508056640625, -3.3065185546875, -3.10498046875, -2.9034423828125, -2.701904296875, -2.5003662109375, -2.298828125, -2.0972900390625, -1.895751953125, -1.6942138671875, -1.49267578125, -1.2911376953125, -1.089599609375, -0.8880615234375, -0.6865234375, -0.4849853515625, -0.283447265625, -0.0819091796875, 0.11962890625, 0.3211669921875, 0.522705078125, 0.7242431640625, 0.92578125, 1.1273193359375, 1.328857421875, 1.5303955078125, 1.73193359375, 1.9334716796875, 2.135009765625, 2.3365478515625, 2.5380859375, 2.7396240234375, 2.941162109375, 3.1427001953125, 3.34423828125, 3.5457763671875, 3.747314453125, 3.9488525390625, 4.150390625, 4.3519287109375, 4.553466796875, 4.7550048828125, 4.95654296875, 5.1580810546875, 5.359619140625, 5.5611572265625, 5.7626953125, 5.9642333984375, 6.165771484375, 6.3673095703125, 6.56884765625, 6.7703857421875, 6.971923828125, 7.1734619140625, 7.375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 22.0, 17.0, 30.0, 42.0, 73.0, 127.0, 200.0, 333.0, 521.0, 848.0, 1391.0, 2309.0, 3830.0, 6312.0, 10303.0, 16828.0, 27305.0, 43845.0, 67501.0, 97569.0, 136790.0, 1069339.0, 261978.0, 117193.0, 83867.0, 55999.0, 35702.0, 22209.0, 13533.0, 8237.0, 5025.0, 3094.0, 1844.0, 1107.0, 652.0, 413.0, 263.0, 176.0, 122.0, 67.0, 40.0, 29.0, 10.0, 6.0, 8.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454345703125, -0.4390907287597656, -0.42383575439453125, -0.4085807800292969, -0.3933258056640625, -0.3780708312988281, -0.36281585693359375, -0.3475608825683594, -0.332305908203125, -0.3170509338378906, -0.30179595947265625, -0.2865409851074219, -0.2712860107421875, -0.2560310363769531, -0.24077606201171875, -0.22552108764648438, -0.21026611328125, -0.19501113891601562, -0.17975616455078125, -0.16450119018554688, -0.1492462158203125, -0.13399124145507812, -0.11873626708984375, -0.10348129272460938, -0.088226318359375, -0.07297134399414062, -0.05771636962890625, -0.042461395263671875, -0.0272064208984375, -0.011951446533203125, 0.00330352783203125, 0.018558502197265625, 0.0338134765625, 0.049068450927734375, 0.06432342529296875, 0.07957839965820312, 0.0948333740234375, 0.11008834838867188, 0.12534332275390625, 0.14059829711914062, 0.155853271484375, 0.17110824584960938, 0.18636322021484375, 0.20161819458007812, 0.2168731689453125, 0.23212814331054688, 0.24738311767578125, 0.2626380920410156, 0.27789306640625, 0.2931480407714844, 0.30840301513671875, 0.3236579895019531, 0.3389129638671875, 0.3541679382324219, 0.36942291259765625, 0.3846778869628906, 0.399932861328125, 0.4151878356933594, 0.43044281005859375, 0.4456977844238281, 0.4609527587890625, 0.4762077331542969, 0.49146270751953125, 0.5067176818847656, 0.52197265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 9.0, 8.0, 11.0, 18.0, 26.0, 27.0, 30.0, 43.0, 55.0, 58.0, 71.0, 77.0, 82.0, 69.0, 79.0, 56.0, 38.0, 27.0, 21.0, 24.0, 22.0, 13.0, 17.0, 13.0, 8.0, 4.0, 10.0, 9.0, 4.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06848716735839844, -0.06580734252929688, -0.06312751770019531, -0.06044769287109375, -0.05776786804199219, -0.055088043212890625, -0.05240821838378906, -0.0497283935546875, -0.04704856872558594, -0.044368743896484375, -0.04168891906738281, -0.03900909423828125, -0.03632926940917969, -0.033649444580078125, -0.030969619750976562, -0.028289794921875, -0.025609970092773438, -0.022930145263671875, -0.020250320434570312, -0.01757049560546875, -0.014890670776367188, -0.012210845947265625, -0.009531021118164062, -0.0068511962890625, -0.0041713714599609375, -0.001491546630859375, 0.0011882781982421875, 0.00386810302734375, 0.0065479278564453125, 0.009227752685546875, 0.011907577514648438, 0.01458740234375, 0.017267227172851562, 0.019947052001953125, 0.022626876831054688, 0.02530670166015625, 0.027986526489257812, 0.030666351318359375, 0.03334617614746094, 0.0360260009765625, 0.03870582580566406, 0.041385650634765625, 0.04406547546386719, 0.04674530029296875, 0.04942512512207031, 0.052104949951171875, 0.05478477478027344, 0.057464599609375, 0.06014442443847656, 0.06282424926757812, 0.06550407409667969, 0.06818389892578125, 0.07086372375488281, 0.07354354858398438, 0.07622337341308594, 0.0789031982421875, 0.08158302307128906, 0.08426284790039062, 0.08694267272949219, 0.08962249755859375, 0.09230232238769531, 0.09498214721679688, 0.09766197204589844, 0.100341796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 10.0, 7.0, 6.0, 11.0, 18.0, 21.0, 23.0, 38.0, 42.0, 43.0, 110.0, 187.0, 317.0, 1031.0, 849798.0, 195109.0, 893.0, 319.0, 179.0, 101.0, 58.0, 48.0, 30.0, 30.0, 19.0, 13.0, 11.0, 11.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-2.25390625, -2.1912078857421875, -2.128509521484375, -2.0658111572265625, -2.00311279296875, -1.9404144287109375, -1.877716064453125, -1.8150177001953125, -1.7523193359375, -1.6896209716796875, -1.626922607421875, -1.5642242431640625, -1.50152587890625, -1.4388275146484375, -1.376129150390625, -1.3134307861328125, -1.250732421875, -1.1880340576171875, -1.125335693359375, -1.0626373291015625, -0.99993896484375, -0.9372406005859375, -0.874542236328125, -0.8118438720703125, -0.7491455078125, -0.6864471435546875, -0.623748779296875, -0.5610504150390625, -0.49835205078125, -0.4356536865234375, -0.372955322265625, -0.3102569580078125, -0.24755859375, -0.1848602294921875, -0.122161865234375, -0.0594635009765625, 0.00323486328125, 0.0659332275390625, 0.128631591796875, 0.1913299560546875, 0.2540283203125, 0.3167266845703125, 0.379425048828125, 0.4421234130859375, 0.50482177734375, 0.5675201416015625, 0.630218505859375, 0.6929168701171875, 0.755615234375, 0.8183135986328125, 0.881011962890625, 0.9437103271484375, 1.00640869140625, 1.0691070556640625, 1.131805419921875, 1.1945037841796875, 1.2572021484375, 1.3199005126953125, 1.382598876953125, 1.4452972412109375, 1.50799560546875, 1.5706939697265625, 1.633392333984375, 1.6960906982421875, 1.7587890625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 12.0, 47.0, 373.0, 495.0, 72.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7394949197769165, -0.718406081199646, -0.6973173022270203, -0.6762284636497498, -0.655139684677124, -0.6340508460998535, -0.612962007522583, -0.5918731689453125, -0.5707843899726868, -0.5496955513954163, -0.5286067724227905, -0.50751793384552, -0.4864291250705719, -0.4653403162956238, -0.44425147771835327, -0.42316266894340515, -0.40207386016845703, -0.3809850513935089, -0.3598962426185608, -0.3388074040412903, -0.31771859526634216, -0.29662978649139404, -0.27554094791412354, -0.2544521391391754, -0.2333633303642273, -0.21227452158927917, -0.19118569791316986, -0.17009687423706055, -0.14900806546211243, -0.1279192566871643, -0.10683043301105499, -0.08574160933494568, -0.06465286016464233, -0.04356404393911362, -0.0224752277135849, -0.0013864114880561829, 0.019702404737472534, 0.04079122096300125, 0.06188003718852997, 0.08296886086463928, 0.1040576696395874, 0.12514647841453552, 0.14623530209064484, 0.16732412576675415, 0.18841293454170227, 0.2095017433166504, 0.2305905669927597, 0.251679390668869, 0.27276819944381714, 0.29385700821876526, 0.3149458169937134, 0.3360346555709839, 0.357123464345932, 0.3782122731208801, 0.39930111169815063, 0.42038992047309875, 0.4414787292480469, 0.462567538022995, 0.4836563467979431, 0.5047451853752136, 0.5258339643478394, 0.5469228029251099, 0.5680116415023804, 0.5891004800796509, 0.6101892590522766]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 12.0, 10.0, 11.0, 20.0, 11.0, 11.0, 17.0, 18.0, 37.0, 28.0, 21.0, 36.0, 42.0, 27.0, 30.0, 50.0, 36.0, 36.0, 32.0, 39.0, 42.0, 33.0, 35.0, 38.0, 36.0, 38.0, 35.0, 26.0, 22.0, 22.0, 18.0, 15.0, 16.0, 16.0, 14.0, 11.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.24797695875167847, -0.240403950214386, -0.2328309267759323, -0.22525791823863983, -0.21768490970134735, -0.21011188626289368, -0.2025388777256012, -0.19496586918830872, -0.18739286065101624, -0.17981985211372375, -0.17224682867527008, -0.1646738201379776, -0.15710081160068512, -0.14952778816223145, -0.14195477962493896, -0.13438177108764648, -0.1268087476491928, -0.11923573166131973, -0.11166272312402725, -0.10408970713615417, -0.0965166985988617, -0.08894368261098862, -0.08137066662311554, -0.07379765808582306, -0.06622464209794998, -0.0586516298353672, -0.051078617572784424, -0.043505601584911346, -0.03593258932232857, -0.02835957705974579, -0.02078656107187271, -0.013213548809289932, -0.005640536546707153, 0.0019324766471982002, 0.009505489841103554, 0.017078503966331482, 0.02465151622891426, 0.03222452849149704, 0.03979754447937012, 0.047370556741952896, 0.054943569004535675, 0.06251658499240875, 0.07008959352970123, 0.07766260951757431, 0.08523562550544739, 0.09280863404273987, 0.10038165003061295, 0.10795466601848602, 0.1155276745557785, 0.12310069054365158, 0.13067370653152466, 0.13824671506881714, 0.14581972360610962, 0.1533927321434021, 0.16096575558185577, 0.16853876411914825, 0.17611178755760193, 0.1836847960948944, 0.19125781953334808, 0.19883082807064056, 0.20640383660793304, 0.21397686004638672, 0.2215498685836792, 0.22912287712097168, 0.23669588565826416]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 7.0, 12.0, 9.0, 13.0, 20.0, 24.0, 26.0, 22.0, 27.0, 32.0, 34.0, 41.0, 35.0, 42.0, 48.0, 53.0, 67.0, 38.0, 40.0, 42.0, 53.0, 35.0, 40.0, 33.0, 39.0, 27.0, 24.0, 24.0, 12.0, 26.0, 10.0, 9.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.578125, -7.3330078125, -7.087890625, -6.8427734375, -6.59765625, -6.3525390625, -6.107421875, -5.8623046875, -5.6171875, -5.3720703125, -5.126953125, -4.8818359375, -4.63671875, -4.3916015625, -4.146484375, -3.9013671875, -3.65625, -3.4111328125, -3.166015625, -2.9208984375, -2.67578125, -2.4306640625, -2.185546875, -1.9404296875, -1.6953125, -1.4501953125, -1.205078125, -0.9599609375, -0.71484375, -0.4697265625, -0.224609375, 0.0205078125, 0.265625, 0.5107421875, 0.755859375, 1.0009765625, 1.24609375, 1.4912109375, 1.736328125, 1.9814453125, 2.2265625, 2.4716796875, 2.716796875, 2.9619140625, 3.20703125, 3.4521484375, 3.697265625, 3.9423828125, 4.1875, 4.4326171875, 4.677734375, 4.9228515625, 5.16796875, 5.4130859375, 5.658203125, 5.9033203125, 6.1484375, 6.3935546875, 6.638671875, 6.8837890625, 7.12890625, 7.3740234375, 7.619140625, 7.8642578125, 8.109375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 8.0, 8.0, 14.0, 14.0, 23.0, 24.0, 41.0, 61.0, 82.0, 118.0, 223.0, 431.0, 1190.0, 3211.0, 9723.0, 27988.0, 83543.0, 291219.0, 431047.0, 133880.0, 42812.0, 14709.0, 5020.0, 1732.0, 671.0, 261.0, 162.0, 84.0, 74.0, 34.0, 28.0, 26.0, 11.0, 14.0, 11.0, 13.0, 11.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.908935546875, -9.59130859375, -9.273681640625, -8.9560546875, -8.638427734375, -8.32080078125, -8.003173828125, -7.685546875, -7.367919921875, -7.05029296875, -6.732666015625, -6.4150390625, -6.097412109375, -5.77978515625, -5.462158203125, -5.14453125, -4.826904296875, -4.50927734375, -4.191650390625, -3.8740234375, -3.556396484375, -3.23876953125, -2.921142578125, -2.603515625, -2.285888671875, -1.96826171875, -1.650634765625, -1.3330078125, -1.015380859375, -0.69775390625, -0.380126953125, -0.0625, 0.255126953125, 0.57275390625, 0.890380859375, 1.2080078125, 1.525634765625, 1.84326171875, 2.160888671875, 2.478515625, 2.796142578125, 3.11376953125, 3.431396484375, 3.7490234375, 4.066650390625, 4.38427734375, 4.701904296875, 5.01953125, 5.337158203125, 5.65478515625, 5.972412109375, 6.2900390625, 6.607666015625, 6.92529296875, 7.242919921875, 7.560546875, 7.878173828125, 8.19580078125, 8.513427734375, 8.8310546875, 9.148681640625, 9.46630859375, 9.783935546875, 10.1015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 4.0, 15.0, 10.0, 8.0, 23.0, 16.0, 17.0, 20.0, 21.0, 32.0, 21.0, 29.0, 32.0, 37.0, 64.0, 73.0, 102.0, 227.0, 1463.0, 228.0, 117.0, 74.0, 53.0, 45.0, 40.0, 37.0, 39.0, 29.0, 25.0, 20.0, 18.0, 13.0, 17.0, 10.0, 9.0, 8.0, 11.0, 8.0, 4.0, 3.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-23.234375, -22.58154296875, -21.9287109375, -21.27587890625, -20.623046875, -19.97021484375, -19.3173828125, -18.66455078125, -18.01171875, -17.35888671875, -16.7060546875, -16.05322265625, -15.400390625, -14.74755859375, -14.0947265625, -13.44189453125, -12.7890625, -12.13623046875, -11.4833984375, -10.83056640625, -10.177734375, -9.52490234375, -8.8720703125, -8.21923828125, -7.56640625, -6.91357421875, -6.2607421875, -5.60791015625, -4.955078125, -4.30224609375, -3.6494140625, -2.99658203125, -2.34375, -1.69091796875, -1.0380859375, -0.38525390625, 0.267578125, 0.92041015625, 1.5732421875, 2.22607421875, 2.87890625, 3.53173828125, 4.1845703125, 4.83740234375, 5.490234375, 6.14306640625, 6.7958984375, 7.44873046875, 8.1015625, 8.75439453125, 9.4072265625, 10.06005859375, 10.712890625, 11.36572265625, 12.0185546875, 12.67138671875, 13.32421875, 13.97705078125, 14.6298828125, 15.28271484375, 15.935546875, 16.58837890625, 17.2412109375, 17.89404296875, 18.546875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 3.0, 11.0, 15.0, 20.0, 11.0, 18.0, 25.0, 23.0, 37.0, 35.0, 48.0, 69.0, 99.0, 166.0, 231.0, 376.0, 1121.0, 8805.0, 2248335.0, 878721.0, 5461.0, 930.0, 370.0, 218.0, 128.0, 93.0, 77.0, 48.0, 32.0, 31.0, 30.0, 27.0, 17.0, 16.0, 13.0, 8.0, 7.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.53125, -45.94287109375, -44.3544921875, -42.76611328125, -41.177734375, -39.58935546875, -38.0009765625, -36.41259765625, -34.82421875, -33.23583984375, -31.6474609375, -30.05908203125, -28.470703125, -26.88232421875, -25.2939453125, -23.70556640625, -22.1171875, -20.52880859375, -18.9404296875, -17.35205078125, -15.763671875, -14.17529296875, -12.5869140625, -10.99853515625, -9.41015625, -7.82177734375, -6.2333984375, -4.64501953125, -3.056640625, -1.46826171875, 0.1201171875, 1.70849609375, 3.296875, 4.88525390625, 6.4736328125, 8.06201171875, 9.650390625, 11.23876953125, 12.8271484375, 14.41552734375, 16.00390625, 17.59228515625, 19.1806640625, 20.76904296875, 22.357421875, 23.94580078125, 25.5341796875, 27.12255859375, 28.7109375, 30.29931640625, 31.8876953125, 33.47607421875, 35.064453125, 36.65283203125, 38.2412109375, 39.82958984375, 41.41796875, 43.00634765625, 44.5947265625, 46.18310546875, 47.771484375, 49.35986328125, 50.9482421875, 52.53662109375, 54.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 10.0, 575.0, 428.0, 4.0, 1.0], "bins": [-576.196533203125, -566.7381591796875, -557.2797241210938, -547.8213500976562, -538.3629760742188, -528.904541015625, -519.4461669921875, -509.98779296875, -500.5293884277344, -491.07098388671875, -481.61260986328125, -472.1542053222656, -462.69580078125, -453.2374267578125, -443.7790222167969, -434.32061767578125, -424.86224365234375, -415.4038391113281, -405.9454650878906, -396.487060546875, -387.0286560058594, -377.5702819824219, -368.11187744140625, -358.65350341796875, -349.195068359375, -339.7366638183594, -330.2782897949219, -320.81988525390625, -311.3614807128906, -301.9031066894531, -292.4447021484375, -282.986328125, -273.5279235839844, -264.06951904296875, -254.6111297607422, -245.15274047851562, -235.69435119628906, -226.2359619140625, -216.77755737304688, -207.3191680908203, -197.8607635498047, -188.40237426757812, -178.9439697265625, -169.48558044433594, -160.02719116210938, -150.56878662109375, -141.1103973388672, -131.65200805664062, -122.19361877441406, -112.73522186279297, -103.2768325805664, -93.81843566894531, -84.36004638671875, -74.90164947509766, -65.44325256347656, -55.98486328125, -46.526466369628906, -37.06807327270508, -27.609678268432617, -18.151283264160156, -8.692890167236328, 0.7655029296875, 10.223899841308594, 19.682289123535156, 29.140687942504883]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 4.0, 14.0, 9.0, 17.0, 11.0, 18.0, 16.0, 25.0, 24.0, 29.0, 36.0, 29.0, 29.0, 29.0, 36.0, 43.0, 46.0, 36.0, 30.0, 48.0, 40.0, 36.0, 38.0, 31.0, 26.0, 25.0, 21.0, 32.0, 30.0, 24.0, 20.0, 25.0, 23.0, 18.0, 9.0, 6.0, 7.0, 13.0, 8.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-56.16048812866211, -54.387813568115234, -52.61513900756836, -50.842464447021484, -49.06978988647461, -47.29711151123047, -45.524436950683594, -43.75176239013672, -41.979087829589844, -40.20641326904297, -38.433738708496094, -36.66106414794922, -34.888389587402344, -33.11571502685547, -31.34303855895996, -29.570362091064453, -27.79768943786621, -26.025014877319336, -24.25234031677246, -22.479663848876953, -20.706989288330078, -18.934314727783203, -17.161640167236328, -15.388964653015137, -13.616290092468262, -11.843615531921387, -10.070940017700195, -8.29826545715332, -6.525590419769287, -4.752915382385254, -2.980240821838379, -1.2075653076171875, 0.5651092529296875, 2.3377842903137207, 4.110459327697754, 5.883133888244629, 7.655808925628662, 9.428483963012695, 11.20115852355957, 12.973834037780762, 14.746508598327637, 16.519184112548828, 18.291858673095703, 20.064533233642578, 21.837207794189453, 23.609882354736328, 25.382556915283203, 27.15523338317871, 28.927907943725586, 30.70058250427246, 32.47325897216797, 34.245933532714844, 36.01860809326172, 37.791282653808594, 39.56395721435547, 41.336631774902344, 43.10930633544922, 44.881980895996094, 46.65465545654297, 48.427330017089844, 50.20000457763672, 51.972679138183594, 53.74535369873047, 55.51803207397461, 57.290706634521484]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 16.0, 10.0, 19.0, 11.0, 13.0, 25.0, 20.0, 27.0, 28.0, 39.0, 38.0, 39.0, 40.0, 35.0, 36.0, 57.0, 48.0, 47.0, 40.0, 44.0, 39.0, 43.0, 32.0, 38.0, 35.0, 28.0, 28.0, 23.0, 13.0, 11.0, 12.0, 11.0, 8.0, 10.0, 6.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.18060302734375, -6.9276123046875, -6.67462158203125, -6.421630859375, -6.16864013671875, -5.9156494140625, -5.66265869140625, -5.40966796875, -5.15667724609375, -4.9036865234375, -4.65069580078125, -4.397705078125, -4.14471435546875, -3.8917236328125, -3.63873291015625, -3.3857421875, -3.13275146484375, -2.8797607421875, -2.62677001953125, -2.373779296875, -2.12078857421875, -1.8677978515625, -1.61480712890625, -1.36181640625, -1.10882568359375, -0.8558349609375, -0.60284423828125, -0.349853515625, -0.09686279296875, 0.1561279296875, 0.40911865234375, 0.662109375, 0.91510009765625, 1.1680908203125, 1.42108154296875, 1.674072265625, 1.92706298828125, 2.1800537109375, 2.43304443359375, 2.68603515625, 2.93902587890625, 3.1920166015625, 3.44500732421875, 3.697998046875, 3.95098876953125, 4.2039794921875, 4.45697021484375, 4.7099609375, 4.96295166015625, 5.2159423828125, 5.46893310546875, 5.721923828125, 5.97491455078125, 6.2279052734375, 6.48089599609375, 6.73388671875, 6.98687744140625, 7.2398681640625, 7.49285888671875, 7.745849609375, 7.99884033203125, 8.2518310546875, 8.50482177734375, 8.7578125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 13.0, 11.0, 22.0, 30.0, 40.0, 52.0, 118.0, 185.0, 324.0, 578.0, 1233.0, 2593.0, 5927.0, 14217.0, 35856.0, 93053.0, 233832.0, 534932.0, 967128.0, 1081660.0, 684678.0, 320605.0, 130521.0, 50684.0, 20306.0, 8283.0, 3719.0, 1729.0, 811.0, 446.0, 253.0, 142.0, 95.0, 47.0, 33.0, 32.0, 19.0, 18.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.828125, -6.615966796875, -6.40380859375, -6.191650390625, -5.9794921875, -5.767333984375, -5.55517578125, -5.343017578125, -5.130859375, -4.918701171875, -4.70654296875, -4.494384765625, -4.2822265625, -4.070068359375, -3.85791015625, -3.645751953125, -3.43359375, -3.221435546875, -3.00927734375, -2.797119140625, -2.5849609375, -2.372802734375, -2.16064453125, -1.948486328125, -1.736328125, -1.524169921875, -1.31201171875, -1.099853515625, -0.8876953125, -0.675537109375, -0.46337890625, -0.251220703125, -0.0390625, 0.173095703125, 0.38525390625, 0.597412109375, 0.8095703125, 1.021728515625, 1.23388671875, 1.446044921875, 1.658203125, 1.870361328125, 2.08251953125, 2.294677734375, 2.5068359375, 2.718994140625, 2.93115234375, 3.143310546875, 3.35546875, 3.567626953125, 3.77978515625, 3.991943359375, 4.2041015625, 4.416259765625, 4.62841796875, 4.840576171875, 5.052734375, 5.264892578125, 5.47705078125, 5.689208984375, 5.9013671875, 6.113525390625, 6.32568359375, 6.537841796875, 6.75]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 8.0, 4.0, 3.0, 7.0, 12.0, 11.0, 25.0, 22.0, 32.0, 41.0, 64.0, 70.0, 103.0, 132.0, 152.0, 210.0, 274.0, 347.0, 413.0, 410.0, 356.0, 340.0, 264.0, 186.0, 147.0, 93.0, 85.0, 81.0, 44.0, 36.0, 22.0, 21.0, 19.0, 13.0, 10.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.1209716796875, -12.726318359375, -12.3316650390625, -11.93701171875, -11.5423583984375, -11.147705078125, -10.7530517578125, -10.3583984375, -9.9637451171875, -9.569091796875, -9.1744384765625, -8.77978515625, -8.3851318359375, -7.990478515625, -7.5958251953125, -7.201171875, -6.8065185546875, -6.411865234375, -6.0172119140625, -5.62255859375, -5.2279052734375, -4.833251953125, -4.4385986328125, -4.0439453125, -3.6492919921875, -3.254638671875, -2.8599853515625, -2.46533203125, -2.0706787109375, -1.676025390625, -1.2813720703125, -0.88671875, -0.4920654296875, -0.097412109375, 0.2972412109375, 0.69189453125, 1.0865478515625, 1.481201171875, 1.8758544921875, 2.2705078125, 2.6651611328125, 3.059814453125, 3.4544677734375, 3.84912109375, 4.2437744140625, 4.638427734375, 5.0330810546875, 5.427734375, 5.8223876953125, 6.217041015625, 6.6116943359375, 7.00634765625, 7.4010009765625, 7.795654296875, 8.1903076171875, 8.5849609375, 8.9796142578125, 9.374267578125, 9.7689208984375, 10.16357421875, 10.5582275390625, 10.952880859375, 11.3475341796875, 11.7421875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 6.0, 13.0, 13.0, 13.0, 20.0, 25.0, 25.0, 47.0, 74.0, 93.0, 103.0, 194.0, 341.0, 651.0, 1526.0, 14322.0, 1685227.0, 2466828.0, 21390.0, 1597.0, 682.0, 377.0, 218.0, 149.0, 92.0, 71.0, 46.0, 35.0, 27.0, 18.0, 17.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.78125, -41.30859375, -39.8359375, -38.36328125, -36.890625, -35.41796875, -33.9453125, -32.47265625, -31.0, -29.52734375, -28.0546875, -26.58203125, -25.109375, -23.63671875, -22.1640625, -20.69140625, -19.21875, -17.74609375, -16.2734375, -14.80078125, -13.328125, -11.85546875, -10.3828125, -8.91015625, -7.4375, -5.96484375, -4.4921875, -3.01953125, -1.546875, -0.07421875, 1.3984375, 2.87109375, 4.34375, 5.81640625, 7.2890625, 8.76171875, 10.234375, 11.70703125, 13.1796875, 14.65234375, 16.125, 17.59765625, 19.0703125, 20.54296875, 22.015625, 23.48828125, 24.9609375, 26.43359375, 27.90625, 29.37890625, 30.8515625, 32.32421875, 33.796875, 35.26953125, 36.7421875, 38.21484375, 39.6875, 41.16015625, 42.6328125, 44.10546875, 45.578125, 47.05078125, 48.5234375, 49.99609375, 51.46875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 30.0, 226.0, 470.0, 239.0, 50.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-371.7904052734375, -363.9750061035156, -356.15960693359375, -348.3442077636719, -340.52880859375, -332.7134094238281, -324.89801025390625, -317.08258056640625, -309.2672119140625, -301.4518127441406, -293.63641357421875, -285.8210144042969, -278.005615234375, -270.1902160644531, -262.37481689453125, -254.5594024658203, -246.74398803710938, -238.9285888671875, -231.11318969726562, -223.29779052734375, -215.48239135742188, -207.6669921875, -199.85157775878906, -192.0361785888672, -184.2207794189453, -176.40538024902344, -168.58998107910156, -160.7745819091797, -152.95916748046875, -145.14376831054688, -137.328369140625, -129.51296997070312, -121.69757080078125, -113.88217163085938, -106.0667724609375, -98.2513656616211, -90.43596649169922, -82.62056732177734, -74.80516052246094, -66.98976135253906, -59.17436218261719, -51.35896301269531, -43.54356002807617, -35.72815704345703, -27.912757873535156, -20.09735870361328, -12.28195571899414, -4.466552734375, 3.348846435546875, 11.164247512817383, 18.97964859008789, 26.7950496673584, 34.610450744628906, 42.42584991455078, 50.24125289916992, 58.05665588378906, 65.87205505371094, 73.68745422363281, 81.50285339355469, 89.3182601928711, 97.13365936279297, 104.94905853271484, 112.76446533203125, 120.57986450195312, 128.395263671875]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 10.0, 8.0, 14.0, 13.0, 12.0, 16.0, 19.0, 21.0, 26.0, 32.0, 34.0, 28.0, 35.0, 29.0, 45.0, 48.0, 53.0, 39.0, 48.0, 29.0, 27.0, 32.0, 38.0, 44.0, 39.0, 35.0, 28.0, 22.0, 31.0, 22.0, 17.0, 13.0, 20.0, 12.0, 7.0, 8.0, 13.0, 8.0, 3.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.00914764404297, -45.561180114746094, -44.11321258544922, -42.665245056152344, -41.21727752685547, -39.769309997558594, -38.32134246826172, -36.873374938964844, -35.42540740966797, -33.977439880371094, -32.52947235107422, -31.081504821777344, -29.63353729248047, -28.185569763183594, -26.73760223388672, -25.289634704589844, -23.841665267944336, -22.39369773864746, -20.945730209350586, -19.49776268005371, -18.049795150756836, -16.60182762145996, -15.15385913848877, -13.705891609191895, -12.25792407989502, -10.809956550598145, -9.36198902130127, -7.914021015167236, -6.466053485870361, -5.018085956573486, -3.570117950439453, -2.122150421142578, -0.6741828918457031, 0.7737847566604614, 2.221752405166626, 3.66972017288208, 5.117687702178955, 6.56565523147583, 8.013623237609863, 9.461590766906738, 10.909558296203613, 12.357525825500488, 13.805493354797363, 15.253461837768555, 16.70142936706543, 18.149396896362305, 19.59736442565918, 21.045331954956055, 22.49329948425293, 23.941267013549805, 25.38923454284668, 26.837202072143555, 28.28516960144043, 29.733137130737305, 31.181106567382812, 32.62907409667969, 34.07704162597656, 35.52500915527344, 36.97297668457031, 38.42094421386719, 39.86891174316406, 41.31687927246094, 42.76484680175781, 44.21281433105469, 45.66078186035156]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 12.0, 11.0, 6.0, 17.0, 21.0, 18.0, 21.0, 19.0, 19.0, 21.0, 35.0, 23.0, 47.0, 31.0, 34.0, 49.0, 48.0, 52.0, 46.0, 40.0, 36.0, 38.0, 43.0, 36.0, 34.0, 22.0, 37.0, 28.0, 33.0, 16.0, 23.0, 14.0, 14.0, 9.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.46875, -7.2418212890625, -7.014892578125, -6.7879638671875, -6.56103515625, -6.3341064453125, -6.107177734375, -5.8802490234375, -5.6533203125, -5.4263916015625, -5.199462890625, -4.9725341796875, -4.74560546875, -4.5186767578125, -4.291748046875, -4.0648193359375, -3.837890625, -3.6109619140625, -3.384033203125, -3.1571044921875, -2.93017578125, -2.7032470703125, -2.476318359375, -2.2493896484375, -2.0224609375, -1.7955322265625, -1.568603515625, -1.3416748046875, -1.11474609375, -0.8878173828125, -0.660888671875, -0.4339599609375, -0.20703125, 0.0198974609375, 0.246826171875, 0.4737548828125, 0.70068359375, 0.9276123046875, 1.154541015625, 1.3814697265625, 1.6083984375, 1.8353271484375, 2.062255859375, 2.2891845703125, 2.51611328125, 2.7430419921875, 2.969970703125, 3.1968994140625, 3.423828125, 3.6507568359375, 3.877685546875, 4.1046142578125, 4.33154296875, 4.5584716796875, 4.785400390625, 5.0123291015625, 5.2392578125, 5.4661865234375, 5.693115234375, 5.9200439453125, 6.14697265625, 6.3739013671875, 6.600830078125, 6.8277587890625, 7.0546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 5.0, 15.0, 19.0, 26.0, 40.0, 54.0, 111.0, 157.0, 249.0, 410.0, 681.0, 1224.0, 1975.0, 3308.0, 5862.0, 10019.0, 16792.0, 28152.0, 47388.0, 74917.0, 111282.0, 146963.0, 164128.0, 143844.0, 107627.0, 72114.0, 44928.0, 27104.0, 16189.0, 9427.0, 5571.0, 3231.0, 1861.0, 1189.0, 642.0, 367.0, 231.0, 168.0, 98.0, 57.0, 36.0, 23.0, 24.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.878326416015625, -0.85040283203125, -0.822479248046875, -0.7945556640625, -0.766632080078125, -0.73870849609375, -0.710784912109375, -0.682861328125, -0.654937744140625, -0.62701416015625, -0.599090576171875, -0.5711669921875, -0.543243408203125, -0.51531982421875, -0.487396240234375, -0.45947265625, -0.431549072265625, -0.40362548828125, -0.375701904296875, -0.3477783203125, -0.319854736328125, -0.29193115234375, -0.264007568359375, -0.236083984375, -0.208160400390625, -0.18023681640625, -0.152313232421875, -0.1243896484375, -0.096466064453125, -0.06854248046875, -0.040618896484375, -0.0126953125, 0.015228271484375, 0.04315185546875, 0.071075439453125, 0.0989990234375, 0.126922607421875, 0.15484619140625, 0.182769775390625, 0.210693359375, 0.238616943359375, 0.26654052734375, 0.294464111328125, 0.3223876953125, 0.350311279296875, 0.37823486328125, 0.406158447265625, 0.43408203125, 0.462005615234375, 0.48992919921875, 0.517852783203125, 0.5457763671875, 0.573699951171875, 0.60162353515625, 0.629547119140625, 0.657470703125, 0.685394287109375, 0.71331787109375, 0.741241455078125, 0.7691650390625, 0.797088623046875, 0.82501220703125, 0.852935791015625, 0.880859375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 8.0, 11.0, 12.0, 16.0, 18.0, 15.0, 13.0, 15.0, 25.0, 33.0, 32.0, 28.0, 33.0, 23.0, 24.0, 26.0, 36.0, 42.0, 41.0, 1051.0, 34.0, 35.0, 41.0, 30.0, 37.0, 32.0, 34.0, 31.0, 35.0, 28.0, 21.0, 13.0, 23.0, 18.0, 11.0, 8.0, 5.0, 12.0, 16.0, 11.0, 7.0, 5.0, 6.0, 2.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.94921875, -4.7908935546875, -4.632568359375, -4.4742431640625, -4.31591796875, -4.1575927734375, -3.999267578125, -3.8409423828125, -3.6826171875, -3.5242919921875, -3.365966796875, -3.2076416015625, -3.04931640625, -2.8909912109375, -2.732666015625, -2.5743408203125, -2.416015625, -2.2576904296875, -2.099365234375, -1.9410400390625, -1.78271484375, -1.6243896484375, -1.466064453125, -1.3077392578125, -1.1494140625, -0.9910888671875, -0.832763671875, -0.6744384765625, -0.51611328125, -0.3577880859375, -0.199462890625, -0.0411376953125, 0.1171875, 0.2755126953125, 0.433837890625, 0.5921630859375, 0.75048828125, 0.9088134765625, 1.067138671875, 1.2254638671875, 1.3837890625, 1.5421142578125, 1.700439453125, 1.8587646484375, 2.01708984375, 2.1754150390625, 2.333740234375, 2.4920654296875, 2.650390625, 2.8087158203125, 2.967041015625, 3.1253662109375, 3.28369140625, 3.4420166015625, 3.600341796875, 3.7586669921875, 3.9169921875, 4.0753173828125, 4.233642578125, 4.3919677734375, 4.55029296875, 4.7086181640625, 4.866943359375, 5.0252685546875, 5.18359375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 10.0, 15.0, 20.0, 38.0, 51.0, 76.0, 143.0, 175.0, 330.0, 559.0, 891.0, 1489.0, 2411.0, 3881.0, 6659.0, 10736.0, 18265.0, 29840.0, 47687.0, 74430.0, 109105.0, 154534.0, 1187629.0, 148656.0, 106613.0, 72403.0, 46579.0, 29087.0, 17687.0, 10529.0, 6519.0, 3889.0, 2467.0, 1400.0, 835.0, 591.0, 316.0, 227.0, 129.0, 87.0, 71.0, 28.0, 15.0, 11.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.57763671875, -0.5613517761230469, -0.5450668334960938, -0.5287818908691406, -0.5124969482421875, -0.4962120056152344, -0.47992706298828125, -0.4636421203613281, -0.447357177734375, -0.4310722351074219, -0.41478729248046875, -0.3985023498535156, -0.3822174072265625, -0.3659324645996094, -0.34964752197265625, -0.3333625793457031, -0.31707763671875, -0.3007926940917969, -0.28450775146484375, -0.2682228088378906, -0.2519378662109375, -0.23565292358398438, -0.21936798095703125, -0.20308303833007812, -0.186798095703125, -0.17051315307617188, -0.15422821044921875, -0.13794326782226562, -0.1216583251953125, -0.10537338256835938, -0.08908843994140625, -0.07280349731445312, -0.0565185546875, -0.040233612060546875, -0.02394866943359375, -0.007663726806640625, 0.0086212158203125, 0.024906158447265625, 0.04119110107421875, 0.057476043701171875, 0.073760986328125, 0.09004592895507812, 0.10633087158203125, 0.12261581420898438, 0.1389007568359375, 0.15518569946289062, 0.17147064208984375, 0.18775558471679688, 0.20404052734375, 0.22032546997070312, 0.23661041259765625, 0.2528953552246094, 0.2691802978515625, 0.2854652404785156, 0.30175018310546875, 0.3180351257324219, 0.334320068359375, 0.3506050109863281, 0.36688995361328125, 0.3831748962402344, 0.3994598388671875, 0.4157447814941406, 0.43202972412109375, 0.4483146667480469, 0.464599609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 2.0, 5.0, 11.0, 8.0, 15.0, 10.0, 17.0, 22.0, 27.0, 19.0, 27.0, 47.0, 48.0, 57.0, 69.0, 86.0, 76.0, 74.0, 73.0, 69.0, 43.0, 26.0, 36.0, 24.0, 13.0, 15.0, 9.0, 9.0, 7.0, 6.0, 3.0, 8.0, 7.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.060262203216552734, -0.05817699432373047, -0.0560917854309082, -0.05400657653808594, -0.05192136764526367, -0.049836158752441406, -0.04775094985961914, -0.045665740966796875, -0.04358053207397461, -0.041495323181152344, -0.03941011428833008, -0.03732490539550781, -0.03523969650268555, -0.03315448760986328, -0.031069278717041016, -0.02898406982421875, -0.026898860931396484, -0.02481365203857422, -0.022728443145751953, -0.020643234252929688, -0.018558025360107422, -0.016472816467285156, -0.01438760757446289, -0.012302398681640625, -0.01021718978881836, -0.008131980895996094, -0.006046772003173828, -0.0039615631103515625, -0.0018763542175292969, 0.00020885467529296875, 0.0022940635681152344, 0.0043792724609375, 0.006464481353759766, 0.008549690246582031, 0.010634899139404297, 0.012720108032226562, 0.014805316925048828, 0.016890525817871094, 0.01897573471069336, 0.021060943603515625, 0.02314615249633789, 0.025231361389160156, 0.027316570281982422, 0.029401779174804688, 0.03148698806762695, 0.03357219696044922, 0.035657405853271484, 0.03774261474609375, 0.039827823638916016, 0.04191303253173828, 0.04399824142456055, 0.04608345031738281, 0.04816865921020508, 0.050253868103027344, 0.05233907699584961, 0.054424285888671875, 0.05650949478149414, 0.058594703674316406, 0.06067991256713867, 0.06276512145996094, 0.0648503303527832, 0.06693553924560547, 0.06902074813842773, 0.07110595703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 11.0, 6.0, 4.0, 10.0, 11.0, 8.0, 14.0, 21.0, 22.0, 41.0, 50.0, 57.0, 93.0, 209.0, 422.0, 2366.0, 1017549.0, 26114.0, 848.0, 226.0, 151.0, 80.0, 53.0, 24.0, 39.0, 28.0, 11.0, 19.0, 18.0, 5.0, 7.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.640625, -1.5920562744140625, -1.543487548828125, -1.4949188232421875, -1.44635009765625, -1.3977813720703125, -1.349212646484375, -1.3006439208984375, -1.2520751953125, -1.2035064697265625, -1.154937744140625, -1.1063690185546875, -1.05780029296875, -1.0092315673828125, -0.960662841796875, -0.9120941162109375, -0.863525390625, -0.8149566650390625, -0.766387939453125, -0.7178192138671875, -0.66925048828125, -0.6206817626953125, -0.572113037109375, -0.5235443115234375, -0.4749755859375, -0.4264068603515625, -0.377838134765625, -0.3292694091796875, -0.28070068359375, -0.2321319580078125, -0.183563232421875, -0.1349945068359375, -0.08642578125, -0.0378570556640625, 0.010711669921875, 0.0592803955078125, 0.10784912109375, 0.1564178466796875, 0.204986572265625, 0.2535552978515625, 0.3021240234375, 0.3506927490234375, 0.399261474609375, 0.4478302001953125, 0.49639892578125, 0.5449676513671875, 0.593536376953125, 0.6421051025390625, 0.690673828125, 0.7392425537109375, 0.787811279296875, 0.8363800048828125, 0.88494873046875, 0.9335174560546875, 0.982086181640625, 1.0306549072265625, 1.0792236328125, 1.1277923583984375, 1.176361083984375, 1.2249298095703125, 1.27349853515625, 1.3220672607421875, 1.370635986328125, 1.4192047119140625, 1.4677734375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 22.0, 107.0, 549.0, 269.0, 51.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7875995635986328, -0.7717677354812622, -0.7559359073638916, -0.740104079246521, -0.7242722511291504, -0.708440363407135, -0.6926085352897644, -0.6767767071723938, -0.6609448790550232, -0.6451130509376526, -0.629281222820282, -0.6134493947029114, -0.597617506980896, -0.5817856788635254, -0.5659538507461548, -0.5501220226287842, -0.5342901945114136, -0.518458366394043, -0.5026265382766724, -0.48679468035697937, -0.47096285223960876, -0.45513102412223816, -0.43929916620254517, -0.42346733808517456, -0.40763550996780396, -0.39180368185043335, -0.37597185373306274, -0.36013999581336975, -0.34430816769599915, -0.32847633957862854, -0.31264448165893555, -0.29681265354156494, -0.28098076581954956, -0.26514893770217896, -0.24931709468364716, -0.23348525166511536, -0.21765342354774475, -0.20182159543037415, -0.18598975241184235, -0.17015790939331055, -0.15432609617710114, -0.13849425315856934, -0.12266242504119873, -0.10683058947324753, -0.09099875390529633, -0.07516691833734512, -0.05933508276939392, -0.04350324720144272, -0.027671411633491516, -0.011839576065540314, 0.003992259502410889, 0.01982409507036209, 0.03565593063831329, 0.051487766206264496, 0.0673196017742157, 0.0831514373421669, 0.0989832729101181, 0.1148151084780693, 0.1306469440460205, 0.1464787721633911, 0.1623106151819229, 0.1781424582004547, 0.19397428631782532, 0.20980611443519592, 0.22563795745372772]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 9.0, 6.0, 10.0, 6.0, 11.0, 7.0, 20.0, 17.0, 25.0, 25.0, 26.0, 27.0, 24.0, 34.0, 25.0, 23.0, 40.0, 47.0, 32.0, 37.0, 32.0, 40.0, 32.0, 39.0, 42.0, 27.0, 39.0, 36.0, 22.0, 33.0, 21.0, 27.0, 20.0, 21.0, 16.0, 23.0, 16.0, 10.0, 15.0, 5.0, 3.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16876286268234253, -0.1630399227142334, -0.15731698274612427, -0.15159404277801514, -0.145871102809906, -0.14014816284179688, -0.13442522287368774, -0.1287022829055786, -0.12297934293746948, -0.11725640296936035, -0.11153346300125122, -0.10581052303314209, -0.10008758306503296, -0.09436464309692383, -0.0886417031288147, -0.08291876316070557, -0.07719582319259644, -0.0714728832244873, -0.06574994325637817, -0.06002700328826904, -0.05430406332015991, -0.04858112335205078, -0.04285818338394165, -0.03713524341583252, -0.03141230344772339, -0.025689363479614258, -0.019966423511505127, -0.014243483543395996, -0.008520543575286865, -0.0027976036071777344, 0.0029253363609313965, 0.008648276329040527, 0.014371216297149658, 0.02009415626525879, 0.02581709623336792, 0.03154003620147705, 0.03726297616958618, 0.04298591613769531, 0.04870885610580444, 0.054431796073913574, 0.060154736042022705, 0.06587767601013184, 0.07160061597824097, 0.0773235559463501, 0.08304649591445923, 0.08876943588256836, 0.09449237585067749, 0.10021531581878662, 0.10593825578689575, 0.11166119575500488, 0.11738413572311401, 0.12310707569122314, 0.12883001565933228, 0.1345529556274414, 0.14027589559555054, 0.14599883556365967, 0.1517217755317688, 0.15744471549987793, 0.16316765546798706, 0.1688905954360962, 0.17461353540420532, 0.18033647537231445, 0.18605941534042358, 0.19178235530853271, 0.19750529527664185]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 7.0, 7.0, 15.0, 7.0, 12.0, 15.0, 12.0, 23.0, 14.0, 16.0, 31.0, 20.0, 34.0, 43.0, 30.0, 43.0, 34.0, 37.0, 49.0, 45.0, 36.0, 37.0, 41.0, 37.0, 36.0, 32.0, 37.0, 35.0, 25.0, 31.0, 32.0, 18.0, 19.0, 14.0, 12.0, 16.0, 10.0, 9.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.7890625, -6.5718994140625, -6.354736328125, -6.1375732421875, -5.92041015625, -5.7032470703125, -5.486083984375, -5.2689208984375, -5.0517578125, -4.8345947265625, -4.617431640625, -4.4002685546875, -4.18310546875, -3.9659423828125, -3.748779296875, -3.5316162109375, -3.314453125, -3.0972900390625, -2.880126953125, -2.6629638671875, -2.44580078125, -2.2286376953125, -2.011474609375, -1.7943115234375, -1.5771484375, -1.3599853515625, -1.142822265625, -0.9256591796875, -0.70849609375, -0.4913330078125, -0.274169921875, -0.0570068359375, 0.16015625, 0.3773193359375, 0.594482421875, 0.8116455078125, 1.02880859375, 1.2459716796875, 1.463134765625, 1.6802978515625, 1.8974609375, 2.1146240234375, 2.331787109375, 2.5489501953125, 2.76611328125, 2.9832763671875, 3.200439453125, 3.4176025390625, 3.634765625, 3.8519287109375, 4.069091796875, 4.2862548828125, 4.50341796875, 4.7205810546875, 4.937744140625, 5.1549072265625, 5.3720703125, 5.5892333984375, 5.806396484375, 6.0235595703125, 6.24072265625, 6.4578857421875, 6.675048828125, 6.8922119140625, 7.109375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 11.0, 12.0, 23.0, 44.0, 58.0, 94.0, 122.0, 214.0, 375.0, 604.0, 1014.0, 1695.0, 2779.0, 4680.0, 7507.0, 12877.0, 21395.0, 36763.0, 68106.0, 133922.0, 247244.0, 235742.0, 124379.0, 63664.0, 34794.0, 20271.0, 11960.0, 7185.0, 4367.0, 2645.0, 1538.0, 921.0, 587.0, 326.0, 232.0, 136.0, 75.0, 51.0, 43.0, 41.0, 13.0, 14.0, 4.0, 7.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.75, -5.5579833984375, -5.365966796875, -5.1739501953125, -4.98193359375, -4.7899169921875, -4.597900390625, -4.4058837890625, -4.2138671875, -4.0218505859375, -3.829833984375, -3.6378173828125, -3.44580078125, -3.2537841796875, -3.061767578125, -2.8697509765625, -2.677734375, -2.4857177734375, -2.293701171875, -2.1016845703125, -1.90966796875, -1.7176513671875, -1.525634765625, -1.3336181640625, -1.1416015625, -0.9495849609375, -0.757568359375, -0.5655517578125, -0.37353515625, -0.1815185546875, 0.010498046875, 0.2025146484375, 0.39453125, 0.5865478515625, 0.778564453125, 0.9705810546875, 1.16259765625, 1.3546142578125, 1.546630859375, 1.7386474609375, 1.9306640625, 2.1226806640625, 2.314697265625, 2.5067138671875, 2.69873046875, 2.8907470703125, 3.082763671875, 3.2747802734375, 3.466796875, 3.6588134765625, 3.850830078125, 4.0428466796875, 4.23486328125, 4.4268798828125, 4.618896484375, 4.8109130859375, 5.0029296875, 5.1949462890625, 5.386962890625, 5.5789794921875, 5.77099609375, 5.9630126953125, 6.155029296875, 6.3470458984375, 6.5390625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 9.0, 8.0, 6.0, 17.0, 13.0, 25.0, 20.0, 18.0, 36.0, 25.0, 32.0, 38.0, 26.0, 50.0, 57.0, 99.0, 167.0, 329.0, 1335.0, 179.0, 104.0, 68.0, 50.0, 51.0, 50.0, 30.0, 23.0, 19.0, 28.0, 15.0, 23.0, 8.0, 19.0, 10.0, 6.0, 4.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-21.046875, -20.389892578125, -19.73291015625, -19.075927734375, -18.4189453125, -17.761962890625, -17.10498046875, -16.447998046875, -15.791015625, -15.134033203125, -14.47705078125, -13.820068359375, -13.1630859375, -12.506103515625, -11.84912109375, -11.192138671875, -10.53515625, -9.878173828125, -9.22119140625, -8.564208984375, -7.9072265625, -7.250244140625, -6.59326171875, -5.936279296875, -5.279296875, -4.622314453125, -3.96533203125, -3.308349609375, -2.6513671875, -1.994384765625, -1.33740234375, -0.680419921875, -0.0234375, 0.633544921875, 1.29052734375, 1.947509765625, 2.6044921875, 3.261474609375, 3.91845703125, 4.575439453125, 5.232421875, 5.889404296875, 6.54638671875, 7.203369140625, 7.8603515625, 8.517333984375, 9.17431640625, 9.831298828125, 10.48828125, 11.145263671875, 11.80224609375, 12.459228515625, 13.1162109375, 13.773193359375, 14.43017578125, 15.087158203125, 15.744140625, 16.401123046875, 17.05810546875, 17.715087890625, 18.3720703125, 19.029052734375, 19.68603515625, 20.343017578125, 21.0]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 5.0, 15.0, 19.0, 9.0, 25.0, 23.0, 38.0, 57.0, 70.0, 95.0, 170.0, 222.0, 381.0, 788.0, 4211.0, 102646.0, 2912844.0, 117490.0, 4599.0, 849.0, 386.0, 226.0, 136.0, 99.0, 60.0, 50.0, 44.0, 30.0, 27.0, 18.0, 10.0, 10.0, 11.0, 7.0, 5.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-47.5625, -46.32763671875, -45.0927734375, -43.85791015625, -42.623046875, -41.38818359375, -40.1533203125, -38.91845703125, -37.68359375, -36.44873046875, -35.2138671875, -33.97900390625, -32.744140625, -31.50927734375, -30.2744140625, -29.03955078125, -27.8046875, -26.56982421875, -25.3349609375, -24.10009765625, -22.865234375, -21.63037109375, -20.3955078125, -19.16064453125, -17.92578125, -16.69091796875, -15.4560546875, -14.22119140625, -12.986328125, -11.75146484375, -10.5166015625, -9.28173828125, -8.046875, -6.81201171875, -5.5771484375, -4.34228515625, -3.107421875, -1.87255859375, -0.6376953125, 0.59716796875, 1.83203125, 3.06689453125, 4.3017578125, 5.53662109375, 6.771484375, 8.00634765625, 9.2412109375, 10.47607421875, 11.7109375, 12.94580078125, 14.1806640625, 15.41552734375, 16.650390625, 17.88525390625, 19.1201171875, 20.35498046875, 21.58984375, 22.82470703125, 24.0595703125, 25.29443359375, 26.529296875, 27.76416015625, 28.9990234375, 30.23388671875, 31.46875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 67.0, 883.0, 68.0], "bins": [-719.5696411132812, -708.0525512695312, -696.5355224609375, -685.0184326171875, -673.5013427734375, -661.9842529296875, -650.4671630859375, -638.9501342773438, -627.4330444335938, -615.9159545898438, -604.39892578125, -592.8818359375, -581.36474609375, -569.84765625, -558.33056640625, -546.8135375976562, -535.2964477539062, -523.7793579101562, -512.2623291015625, -500.7452392578125, -489.2281494140625, -477.7110595703125, -466.1940002441406, -454.67694091796875, -443.15985107421875, -431.64276123046875, -420.1257019042969, -408.608642578125, -397.091552734375, -385.574462890625, -374.0574035644531, -362.54034423828125, -351.0232849121094, -339.5062255859375, -327.9891357421875, -316.4720458984375, -304.9549865722656, -293.43792724609375, -281.92083740234375, -270.40374755859375, -258.8866882324219, -247.36961364746094, -235.8525390625, -224.33546447753906, -212.81838989257812, -201.3013153076172, -189.78424072265625, -178.2671661376953, -166.75009155273438, -155.23301696777344, -143.7159423828125, -132.19886779785156, -120.68179321289062, -109.16471862792969, -97.64764404296875, -86.13056945800781, -74.61349487304688, -63.09642028808594, -51.579345703125, -40.06227111816406, -28.545196533203125, -17.028121948242188, -5.51104736328125, 6.0060272216796875, 17.523101806640625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 4.0, 7.0, 12.0, 14.0, 6.0, 12.0, 20.0, 18.0, 22.0, 22.0, 24.0, 29.0, 28.0, 43.0, 39.0, 29.0, 35.0, 54.0, 41.0, 31.0, 52.0, 44.0, 34.0, 33.0, 39.0, 27.0, 40.0, 33.0, 28.0, 17.0, 18.0, 31.0, 19.0, 12.0, 23.0, 15.0, 3.0, 4.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.15851974487305, -49.51762390136719, -47.87672424316406, -46.2358283996582, -44.59492874145508, -42.95403289794922, -41.313133239746094, -39.672237396240234, -38.031341552734375, -36.390445709228516, -34.74954605102539, -33.10865020751953, -31.46775245666504, -29.826854705810547, -28.185956954956055, -26.545059204101562, -24.90416145324707, -23.263263702392578, -21.622365951538086, -19.981468200683594, -18.340572357177734, -16.699674606323242, -15.05877685546875, -13.417880058288574, -11.776982307434082, -10.13608455657959, -8.495187759399414, -6.854290008544922, -5.213392734527588, -3.572495460510254, -1.9315977096557617, -0.29070091247558594, 1.3501968383789062, 2.9910941123962402, 4.631991386413574, 6.272889137268066, 7.9137864112854, 9.554683685302734, 11.195581436157227, 12.836478233337402, 14.477375984191895, 16.11827278137207, 17.759170532226562, 19.400068283081055, 21.040966033935547, 22.681861877441406, 24.32276153564453, 25.96365737915039, 27.604555130004883, 29.245452880859375, 30.886350631713867, 32.52724838256836, 34.16814422607422, 35.809043884277344, 37.4499397277832, 39.09083557128906, 40.73173522949219, 42.37263107299805, 44.01353073120117, 45.65442657470703, 47.295326232910156, 48.936222076416016, 50.577117919921875, 52.218017578125, 53.85891342163086]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 5.0, 8.0, 13.0, 16.0, 16.0, 27.0, 30.0, 28.0, 33.0, 35.0, 40.0, 41.0, 31.0, 42.0, 40.0, 44.0, 35.0, 48.0, 48.0, 61.0, 52.0, 49.0, 34.0, 37.0, 30.0, 22.0, 30.0, 18.0, 17.0, 19.0, 14.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.2991943359375, -8.035888671875, -7.7725830078125, -7.50927734375, -7.2459716796875, -6.982666015625, -6.7193603515625, -6.4560546875, -6.1927490234375, -5.929443359375, -5.6661376953125, -5.40283203125, -5.1395263671875, -4.876220703125, -4.6129150390625, -4.349609375, -4.0863037109375, -3.822998046875, -3.5596923828125, -3.29638671875, -3.0330810546875, -2.769775390625, -2.5064697265625, -2.2431640625, -1.9798583984375, -1.716552734375, -1.4532470703125, -1.18994140625, -0.9266357421875, -0.663330078125, -0.4000244140625, -0.13671875, 0.1265869140625, 0.389892578125, 0.6531982421875, 0.91650390625, 1.1798095703125, 1.443115234375, 1.7064208984375, 1.9697265625, 2.2330322265625, 2.496337890625, 2.7596435546875, 3.02294921875, 3.2862548828125, 3.549560546875, 3.8128662109375, 4.076171875, 4.3394775390625, 4.602783203125, 4.8660888671875, 5.12939453125, 5.3927001953125, 5.656005859375, 5.9193115234375, 6.1826171875, 6.4459228515625, 6.709228515625, 6.9725341796875, 7.23583984375, 7.4991455078125, 7.762451171875, 8.0257568359375, 8.2890625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 13.0, 10.0, 20.0, 20.0, 14.0, 21.0, 21.0, 33.0, 37.0, 50.0, 79.0, 155.0, 497.0, 2898.0, 32069.0, 436261.0, 2714286.0, 930834.0, 69571.0, 5954.0, 816.0, 234.0, 92.0, 61.0, 53.0, 40.0, 26.0, 30.0, 21.0, 11.0, 11.0, 7.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -16.989501953125, -16.41650390625, -15.843505859375, -15.2705078125, -14.697509765625, -14.12451171875, -13.551513671875, -12.978515625, -12.405517578125, -11.83251953125, -11.259521484375, -10.6865234375, -10.113525390625, -9.54052734375, -8.967529296875, -8.39453125, -7.821533203125, -7.24853515625, -6.675537109375, -6.1025390625, -5.529541015625, -4.95654296875, -4.383544921875, -3.810546875, -3.237548828125, -2.66455078125, -2.091552734375, -1.5185546875, -0.945556640625, -0.37255859375, 0.200439453125, 0.7734375, 1.346435546875, 1.91943359375, 2.492431640625, 3.0654296875, 3.638427734375, 4.21142578125, 4.784423828125, 5.357421875, 5.930419921875, 6.50341796875, 7.076416015625, 7.6494140625, 8.222412109375, 8.79541015625, 9.368408203125, 9.94140625, 10.514404296875, 11.08740234375, 11.660400390625, 12.2333984375, 12.806396484375, 13.37939453125, 13.952392578125, 14.525390625, 15.098388671875, 15.67138671875, 16.244384765625, 16.8173828125, 17.390380859375, 17.96337890625, 18.536376953125, 19.109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 8.0, 2.0, 5.0, 8.0, 16.0, 24.0, 33.0, 37.0, 56.0, 62.0, 75.0, 105.0, 175.0, 213.0, 275.0, 343.0, 380.0, 442.0, 391.0, 337.0, 283.0, 194.0, 169.0, 116.0, 84.0, 66.0, 49.0, 33.0, 26.0, 33.0, 11.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.1951904296875, -8.835693359375, -8.4761962890625, -8.11669921875, -7.7572021484375, -7.397705078125, -7.0382080078125, -6.6787109375, -6.3192138671875, -5.959716796875, -5.6002197265625, -5.24072265625, -4.8812255859375, -4.521728515625, -4.1622314453125, -3.802734375, -3.4432373046875, -3.083740234375, -2.7242431640625, -2.36474609375, -2.0052490234375, -1.645751953125, -1.2862548828125, -0.9267578125, -0.5672607421875, -0.207763671875, 0.1517333984375, 0.51123046875, 0.8707275390625, 1.230224609375, 1.5897216796875, 1.94921875, 2.3087158203125, 2.668212890625, 3.0277099609375, 3.38720703125, 3.7467041015625, 4.106201171875, 4.4656982421875, 4.8251953125, 5.1846923828125, 5.544189453125, 5.9036865234375, 6.26318359375, 6.6226806640625, 6.982177734375, 7.3416748046875, 7.701171875, 8.0606689453125, 8.420166015625, 8.7796630859375, 9.13916015625, 9.4986572265625, 9.858154296875, 10.2176513671875, 10.5771484375, 10.9366455078125, 11.296142578125, 11.6556396484375, 12.01513671875, 12.3746337890625, 12.734130859375, 13.0936279296875, 13.453125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 15.0, 16.0, 29.0, 33.0, 44.0, 57.0, 95.0, 133.0, 253.0, 387.0, 786.0, 3348.0, 119195.0, 3544494.0, 514201.0, 8704.0, 1131.0, 504.0, 295.0, 185.0, 91.0, 81.0, 56.0, 42.0, 30.0, 23.0, 15.0, 10.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5, -47.21240234375, -45.9248046875, -44.63720703125, -43.349609375, -42.06201171875, -40.7744140625, -39.48681640625, -38.19921875, -36.91162109375, -35.6240234375, -34.33642578125, -33.048828125, -31.76123046875, -30.4736328125, -29.18603515625, -27.8984375, -26.61083984375, -25.3232421875, -24.03564453125, -22.748046875, -21.46044921875, -20.1728515625, -18.88525390625, -17.59765625, -16.31005859375, -15.0224609375, -13.73486328125, -12.447265625, -11.15966796875, -9.8720703125, -8.58447265625, -7.296875, -6.00927734375, -4.7216796875, -3.43408203125, -2.146484375, -0.85888671875, 0.4287109375, 1.71630859375, 3.00390625, 4.29150390625, 5.5791015625, 6.86669921875, 8.154296875, 9.44189453125, 10.7294921875, 12.01708984375, 13.3046875, 14.59228515625, 15.8798828125, 17.16748046875, 18.455078125, 19.74267578125, 21.0302734375, 22.31787109375, 23.60546875, 24.89306640625, 26.1806640625, 27.46826171875, 28.755859375, 30.04345703125, 31.3310546875, 32.61865234375, 33.90625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 10.0, 47.0, 85.0, 160.0, 205.0, 185.0, 159.0, 84.0, 43.0, 21.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84935760498047, -38.89195251464844, -35.934547424316406, -32.97713851928711, -30.019733428955078, -27.062328338623047, -24.104921340942383, -21.14751434326172, -18.190109252929688, -15.23270320892334, -12.275297164916992, -9.317891120910645, -6.360485076904297, -3.403079032897949, -0.44567298889160156, 2.5117340087890625, 5.469139099121094, 8.426545143127441, 11.383951187133789, 14.341357231140137, 17.298763275146484, 20.256168365478516, 23.21357536315918, 26.170982360839844, 29.128387451171875, 32.085792541503906, 35.04319763183594, 38.000606536865234, 40.958011627197266, 43.9154167175293, 46.872825622558594, 49.830230712890625, 52.78764343261719, 55.74504852294922, 58.70245361328125, 61.65986251831055, 64.61726379394531, 67.57467651367188, 70.5320816040039, 73.48948669433594, 76.44689178466797, 79.404296875, 82.36170196533203, 85.31910705566406, 88.27651977539062, 91.23392486572266, 94.19132995605469, 97.14873504638672, 100.10614013671875, 103.06354522705078, 106.02095031738281, 108.97835540771484, 111.93576049804688, 114.89317321777344, 117.85057830810547, 120.8079833984375, 123.76538848876953, 126.72279357910156, 129.68020629882812, 132.63760375976562, 135.5950164794922, 138.5524139404297, 141.50982666015625, 144.46722412109375, 147.4246368408203]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 9.0, 11.0, 8.0, 14.0, 17.0, 16.0, 30.0, 21.0, 23.0, 25.0, 36.0, 28.0, 30.0, 46.0, 41.0, 37.0, 35.0, 45.0, 38.0, 35.0, 40.0, 29.0, 23.0, 35.0, 31.0, 38.0, 41.0, 31.0, 18.0, 27.0, 24.0, 12.0, 16.0, 9.0, 12.0, 8.0, 5.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.54390335083008, -37.37818908691406, -36.21247482299805, -35.04676055908203, -33.881046295166016, -32.71533203125, -31.54961585998535, -30.383901596069336, -29.21818733215332, -28.052473068237305, -26.88675880432129, -25.721044540405273, -24.555328369140625, -23.38961410522461, -22.223899841308594, -21.058185577392578, -19.892471313476562, -18.726757049560547, -17.56104278564453, -16.395328521728516, -15.229613304138184, -14.063899040222168, -12.898183822631836, -11.73246955871582, -10.566755294799805, -9.401041030883789, -8.235326766967773, -7.069611549377441, -5.903897285461426, -4.73818302154541, -3.5724682807922363, -2.4067535400390625, -1.2410392761230469, -0.07532477378845215, 1.0903897285461426, 2.2561042308807373, 3.421818733215332, 4.587532997131348, 5.7532477378845215, 6.918962478637695, 8.084676742553711, 9.250391006469727, 10.416105270385742, 11.581820487976074, 12.74753475189209, 13.913249015808105, 15.078964233398438, 16.244678497314453, 17.41039276123047, 18.576107025146484, 19.7418212890625, 20.907535552978516, 22.07324981689453, 23.238964080810547, 24.404680252075195, 25.57039451599121, 26.736108779907227, 27.901823043823242, 29.067537307739258, 30.233251571655273, 31.398967742919922, 32.56468200683594, 33.73039627075195, 34.89611053466797, 36.061824798583984]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 11.0, 15.0, 12.0, 13.0, 17.0, 25.0, 17.0, 19.0, 31.0, 22.0, 23.0, 30.0, 26.0, 32.0, 41.0, 35.0, 53.0, 41.0, 32.0, 33.0, 45.0, 39.0, 43.0, 36.0, 32.0, 28.0, 27.0, 27.0, 22.0, 23.0, 20.0, 21.0, 16.0, 9.0, 10.0, 11.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.671875, -6.458251953125, -6.24462890625, -6.031005859375, -5.8173828125, -5.603759765625, -5.39013671875, -5.176513671875, -4.962890625, -4.749267578125, -4.53564453125, -4.322021484375, -4.1083984375, -3.894775390625, -3.68115234375, -3.467529296875, -3.25390625, -3.040283203125, -2.82666015625, -2.613037109375, -2.3994140625, -2.185791015625, -1.97216796875, -1.758544921875, -1.544921875, -1.331298828125, -1.11767578125, -0.904052734375, -0.6904296875, -0.476806640625, -0.26318359375, -0.049560546875, 0.1640625, 0.377685546875, 0.59130859375, 0.804931640625, 1.0185546875, 1.232177734375, 1.44580078125, 1.659423828125, 1.873046875, 2.086669921875, 2.30029296875, 2.513916015625, 2.7275390625, 2.941162109375, 3.15478515625, 3.368408203125, 3.58203125, 3.795654296875, 4.00927734375, 4.222900390625, 4.4365234375, 4.650146484375, 4.86376953125, 5.077392578125, 5.291015625, 5.504638671875, 5.71826171875, 5.931884765625, 6.1455078125, 6.359130859375, 6.57275390625, 6.786376953125, 7.0]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 26.0, 32.0, 62.0, 83.0, 144.0, 204.0, 330.0, 522.0, 900.0, 1345.0, 2262.0, 3630.0, 5721.0, 9181.0, 15030.0, 23071.0, 35577.0, 53604.0, 76617.0, 104224.0, 127929.0, 139316.0, 126211.0, 101342.0, 74745.0, 51886.0, 34474.0, 22238.0, 14477.0, 8805.0, 5522.0, 3375.0, 2100.0, 1323.0, 807.0, 510.0, 336.0, 210.0, 136.0, 90.0, 46.0, 33.0, 23.0, 14.0, 11.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.53448486328125, -0.5142822265625, -0.49407958984375, -0.473876953125, -0.45367431640625, -0.4334716796875, -0.41326904296875, -0.39306640625, -0.37286376953125, -0.3526611328125, -0.33245849609375, -0.312255859375, -0.29205322265625, -0.2718505859375, -0.25164794921875, -0.2314453125, -0.21124267578125, -0.1910400390625, -0.17083740234375, -0.150634765625, -0.13043212890625, -0.1102294921875, -0.09002685546875, -0.06982421875, -0.04962158203125, -0.0294189453125, -0.00921630859375, 0.010986328125, 0.03118896484375, 0.0513916015625, 0.07159423828125, 0.091796875, 0.11199951171875, 0.1322021484375, 0.15240478515625, 0.172607421875, 0.19281005859375, 0.2130126953125, 0.23321533203125, 0.25341796875, 0.27362060546875, 0.2938232421875, 0.31402587890625, 0.334228515625, 0.35443115234375, 0.3746337890625, 0.39483642578125, 0.4150390625, 0.43524169921875, 0.4554443359375, 0.47564697265625, 0.495849609375, 0.51605224609375, 0.5362548828125, 0.55645751953125, 0.57666015625, 0.59686279296875, 0.6170654296875, 0.63726806640625, 0.657470703125, 0.67767333984375, 0.6978759765625, 0.71807861328125, 0.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 3.0, 7.0, 5.0, 10.0, 12.0, 17.0, 26.0, 27.0, 15.0, 21.0, 36.0, 30.0, 46.0, 28.0, 40.0, 28.0, 41.0, 44.0, 46.0, 1067.0, 45.0, 45.0, 32.0, 35.0, 38.0, 38.0, 37.0, 32.0, 24.0, 18.0, 16.0, 19.0, 8.0, 12.0, 12.0, 12.0, 11.0, 8.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.86370849609375, -4.6844482421875, -4.50518798828125, -4.325927734375, -4.14666748046875, -3.9674072265625, -3.78814697265625, -3.60888671875, -3.42962646484375, -3.2503662109375, -3.07110595703125, -2.891845703125, -2.71258544921875, -2.5333251953125, -2.35406494140625, -2.1748046875, -1.99554443359375, -1.8162841796875, -1.63702392578125, -1.457763671875, -1.27850341796875, -1.0992431640625, -0.91998291015625, -0.74072265625, -0.56146240234375, -0.3822021484375, -0.20294189453125, -0.023681640625, 0.15557861328125, 0.3348388671875, 0.51409912109375, 0.693359375, 0.87261962890625, 1.0518798828125, 1.23114013671875, 1.410400390625, 1.58966064453125, 1.7689208984375, 1.94818115234375, 2.12744140625, 2.30670166015625, 2.4859619140625, 2.66522216796875, 2.844482421875, 3.02374267578125, 3.2030029296875, 3.38226318359375, 3.5615234375, 3.74078369140625, 3.9200439453125, 4.09930419921875, 4.278564453125, 4.45782470703125, 4.6370849609375, 4.81634521484375, 4.99560546875, 5.17486572265625, 5.3541259765625, 5.53338623046875, 5.712646484375, 5.89190673828125, 6.0711669921875, 6.25042724609375, 6.4296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 6.0, 7.0, 13.0, 18.0, 26.0, 44.0, 65.0, 103.0, 163.0, 273.0, 418.0, 752.0, 1142.0, 2040.0, 3473.0, 5827.0, 9625.0, 16113.0, 26678.0, 42690.0, 67327.0, 98556.0, 133585.0, 1116103.0, 226321.0, 117946.0, 84154.0, 55422.0, 34890.0, 21387.0, 12846.0, 7648.0, 4539.0, 2715.0, 1621.0, 1004.0, 627.0, 345.0, 222.0, 142.0, 96.0, 62.0, 33.0, 22.0, 21.0, 10.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.469482421875, -0.45516204833984375, -0.4408416748046875, -0.42652130126953125, -0.412200927734375, -0.39788055419921875, -0.3835601806640625, -0.36923980712890625, -0.35491943359375, -0.34059906005859375, -0.3262786865234375, -0.31195831298828125, -0.297637939453125, -0.28331756591796875, -0.2689971923828125, -0.25467681884765625, -0.2403564453125, -0.22603607177734375, -0.2117156982421875, -0.19739532470703125, -0.183074951171875, -0.16875457763671875, -0.1544342041015625, -0.14011383056640625, -0.12579345703125, -0.11147308349609375, -0.0971527099609375, -0.08283233642578125, -0.068511962890625, -0.05419158935546875, -0.0398712158203125, -0.02555084228515625, -0.01123046875, 0.00308990478515625, 0.0174102783203125, 0.03173065185546875, 0.046051025390625, 0.06037139892578125, 0.0746917724609375, 0.08901214599609375, 0.10333251953125, 0.11765289306640625, 0.1319732666015625, 0.14629364013671875, 0.160614013671875, 0.17493438720703125, 0.1892547607421875, 0.20357513427734375, 0.2178955078125, 0.23221588134765625, 0.2465362548828125, 0.26085662841796875, 0.275177001953125, 0.28949737548828125, 0.3038177490234375, 0.31813812255859375, 0.33245849609375, 0.34677886962890625, 0.3610992431640625, 0.37541961669921875, 0.389739990234375, 0.40406036376953125, 0.4183807373046875, 0.43270111083984375, 0.447021484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 9.0, 11.0, 8.0, 13.0, 14.0, 22.0, 35.0, 35.0, 43.0, 44.0, 52.0, 63.0, 70.0, 53.0, 75.0, 66.0, 64.0, 59.0, 52.0, 49.0, 39.0, 30.0, 19.0, 12.0, 14.0, 13.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04779052734375, -0.04622650146484375, -0.0446624755859375, -0.04309844970703125, -0.041534423828125, -0.03997039794921875, -0.0384063720703125, -0.03684234619140625, -0.0352783203125, -0.03371429443359375, -0.0321502685546875, -0.03058624267578125, -0.029022216796875, -0.02745819091796875, -0.0258941650390625, -0.02433013916015625, -0.02276611328125, -0.02120208740234375, -0.0196380615234375, -0.01807403564453125, -0.016510009765625, -0.01494598388671875, -0.0133819580078125, -0.01181793212890625, -0.01025390625, -0.00868988037109375, -0.0071258544921875, -0.00556182861328125, -0.003997802734375, -0.00243377685546875, -0.0008697509765625, 0.00069427490234375, 0.00225830078125, 0.00382232666015625, 0.0053863525390625, 0.00695037841796875, 0.008514404296875, 0.01007843017578125, 0.0116424560546875, 0.01320648193359375, 0.0147705078125, 0.01633453369140625, 0.0178985595703125, 0.01946258544921875, 0.021026611328125, 0.02259063720703125, 0.0241546630859375, 0.02571868896484375, 0.02728271484375, 0.02884674072265625, 0.0304107666015625, 0.03197479248046875, 0.033538818359375, 0.03510284423828125, 0.0366668701171875, 0.03823089599609375, 0.039794921875, 0.04135894775390625, 0.0429229736328125, 0.04448699951171875, 0.046051025390625, 0.04761505126953125, 0.0491790771484375, 0.05074310302734375, 0.05230712890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 12.0, 20.0, 11.0, 21.0, 36.0, 40.0, 61.0, 80.0, 130.0, 209.0, 428.0, 1848.0, 1041694.0, 2844.0, 491.0, 222.0, 110.0, 72.0, 58.0, 35.0, 28.0, 20.0, 13.0, 15.0, 12.0, 8.0, 4.0, 8.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1729736328125, -1.136962890625, -1.1009521484375, -1.06494140625, -1.0289306640625, -0.992919921875, -0.9569091796875, -0.9208984375, -0.8848876953125, -0.848876953125, -0.8128662109375, -0.77685546875, -0.7408447265625, -0.704833984375, -0.6688232421875, -0.6328125, -0.5968017578125, -0.560791015625, -0.5247802734375, -0.48876953125, -0.4527587890625, -0.416748046875, -0.3807373046875, -0.3447265625, -0.3087158203125, -0.272705078125, -0.2366943359375, -0.20068359375, -0.1646728515625, -0.128662109375, -0.0926513671875, -0.056640625, -0.0206298828125, 0.015380859375, 0.0513916015625, 0.08740234375, 0.1234130859375, 0.159423828125, 0.1954345703125, 0.2314453125, 0.2674560546875, 0.303466796875, 0.3394775390625, 0.37548828125, 0.4114990234375, 0.447509765625, 0.4835205078125, 0.51953125, 0.5555419921875, 0.591552734375, 0.6275634765625, 0.66357421875, 0.6995849609375, 0.735595703125, 0.7716064453125, 0.8076171875, 0.8436279296875, 0.879638671875, 0.9156494140625, 0.95166015625, 0.9876708984375, 1.023681640625, 1.0596923828125, 1.095703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 72.0, 822.0, 102.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9391686916351318, -0.9213151335716248, -0.9034616351127625, -0.8856080770492554, -0.8677545785903931, -0.849901020526886, -0.8320474624633789, -0.8141939640045166, -0.7963404059410095, -0.7784868478775024, -0.7606333494186401, -0.7427797913551331, -0.7249262928962708, -0.7070727348327637, -0.6892192363739014, -0.6713656783103943, -0.6535121202468872, -0.6356585621833801, -0.6178050637245178, -0.5999515056610107, -0.5820980072021484, -0.5642444491386414, -0.5463908910751343, -0.528537392616272, -0.5106838941574097, -0.492830365896225, -0.4749768376350403, -0.4571232795715332, -0.4392697513103485, -0.4214162230491638, -0.4035626947879791, -0.38570916652679443, -0.36785560846328735, -0.35000208020210266, -0.33214855194091797, -0.3142949938774109, -0.2964414656162262, -0.2785879373550415, -0.2607344090938568, -0.24288088083267212, -0.22502735257148743, -0.20717382431030273, -0.18932028114795685, -0.17146675288677216, -0.15361320972442627, -0.13575968146324158, -0.11790615320205688, -0.1000526174902916, -0.0821990817785263, -0.06434554606676102, -0.046492014080286026, -0.028638482093811035, -0.010784946382045746, 0.0070685893297195435, 0.024922117590904236, 0.042775653302669525, 0.060629189014434814, 0.0784827247262001, 0.0963362604379654, 0.11418978869915009, 0.13204333186149597, 0.14989686012268066, 0.16775038838386536, 0.18560391664505005, 0.20345745980739594]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 7.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 13.0, 19.0, 28.0, 19.0, 24.0, 30.0, 47.0, 31.0, 38.0, 52.0, 50.0, 63.0, 52.0, 56.0, 57.0, 33.0, 27.0, 43.0, 33.0, 40.0, 34.0, 32.0, 25.0, 22.0, 20.0, 16.0, 10.0, 8.0, 10.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15506339073181152, -0.14997737109661102, -0.14489135146141052, -0.13980533182621002, -0.13471931219100952, -0.12963330745697021, -0.12454728782176971, -0.11946126818656921, -0.11437524855136871, -0.10928922891616821, -0.10420320928096771, -0.09911719709634781, -0.09403117746114731, -0.08894515782594681, -0.0838591456413269, -0.0787731260061264, -0.0736871063709259, -0.0686010867357254, -0.0635150671005249, -0.058429054915905, -0.0533430352807045, -0.048257015645504, -0.043170999735593796, -0.038084983825683594, -0.03299896419048309, -0.027912946417927742, -0.02282692864537239, -0.01774091087281704, -0.012654893100261688, -0.007568875327706337, -0.0024828575551509857, 0.0026031583547592163, 0.007689177989959717, 0.012775195762515068, 0.01786121353507042, 0.02294723130762577, 0.028033249080181122, 0.03311926871538162, 0.038205284625291824, 0.043291300535202026, 0.04837732017040253, 0.05346333980560303, 0.05854935571551323, 0.06363537162542343, 0.06872139126062393, 0.07380741089582443, 0.07889342308044434, 0.08397944271564484, 0.08906546235084534, 0.09415148198604584, 0.09923750162124634, 0.10432351380586624, 0.10940953344106674, 0.11449555307626724, 0.11958156526088715, 0.12466758489608765, 0.12975360453128815, 0.13483962416648865, 0.13992564380168915, 0.14501166343688965, 0.15009766817092896, 0.15518368780612946, 0.16026970744132996, 0.16535572707653046, 0.17044174671173096]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 13.0, 8.0, 12.0, 13.0, 21.0, 22.0, 26.0, 26.0, 20.0, 23.0, 45.0, 29.0, 34.0, 32.0, 30.0, 41.0, 40.0, 47.0, 44.0, 36.0, 42.0, 45.0, 46.0, 40.0, 34.0, 29.0, 30.0, 34.0, 20.0, 10.0, 15.0, 13.0, 14.0, 10.0, 13.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.7890625, -7.5589599609375, -7.328857421875, -7.0987548828125, -6.86865234375, -6.6385498046875, -6.408447265625, -6.1783447265625, -5.9482421875, -5.7181396484375, -5.488037109375, -5.2579345703125, -5.02783203125, -4.7977294921875, -4.567626953125, -4.3375244140625, -4.107421875, -3.8773193359375, -3.647216796875, -3.4171142578125, -3.18701171875, -2.9569091796875, -2.726806640625, -2.4967041015625, -2.2666015625, -2.0364990234375, -1.806396484375, -1.5762939453125, -1.34619140625, -1.1160888671875, -0.885986328125, -0.6558837890625, -0.42578125, -0.1956787109375, 0.034423828125, 0.2645263671875, 0.49462890625, 0.7247314453125, 0.954833984375, 1.1849365234375, 1.4150390625, 1.6451416015625, 1.875244140625, 2.1053466796875, 2.33544921875, 2.5655517578125, 2.795654296875, 3.0257568359375, 3.255859375, 3.4859619140625, 3.716064453125, 3.9461669921875, 4.17626953125, 4.4063720703125, 4.636474609375, 4.8665771484375, 5.0966796875, 5.3267822265625, 5.556884765625, 5.7869873046875, 6.01708984375, 6.2471923828125, 6.477294921875, 6.7073974609375, 6.9375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 9.0, 11.0, 20.0, 8.0, 14.0, 34.0, 30.0, 44.0, 62.0, 64.0, 93.0, 155.0, 305.0, 577.0, 1285.0, 2930.0, 6711.0, 15698.0, 41122.0, 147903.0, 440800.0, 275960.0, 72785.0, 24060.0, 9754.0, 4241.0, 1957.0, 811.0, 455.0, 211.0, 126.0, 77.0, 47.0, 39.0, 39.0, 18.0, 19.0, 21.0, 12.0, 13.0, 5.0, 7.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 4.0], "bins": [-12.2578125, -11.914794921875, -11.57177734375, -11.228759765625, -10.8857421875, -10.542724609375, -10.19970703125, -9.856689453125, -9.513671875, -9.170654296875, -8.82763671875, -8.484619140625, -8.1416015625, -7.798583984375, -7.45556640625, -7.112548828125, -6.76953125, -6.426513671875, -6.08349609375, -5.740478515625, -5.3974609375, -5.054443359375, -4.71142578125, -4.368408203125, -4.025390625, -3.682373046875, -3.33935546875, -2.996337890625, -2.6533203125, -2.310302734375, -1.96728515625, -1.624267578125, -1.28125, -0.938232421875, -0.59521484375, -0.252197265625, 0.0908203125, 0.433837890625, 0.77685546875, 1.119873046875, 1.462890625, 1.805908203125, 2.14892578125, 2.491943359375, 2.8349609375, 3.177978515625, 3.52099609375, 3.864013671875, 4.20703125, 4.550048828125, 4.89306640625, 5.236083984375, 5.5791015625, 5.922119140625, 6.26513671875, 6.608154296875, 6.951171875, 7.294189453125, 7.63720703125, 7.980224609375, 8.3232421875, 8.666259765625, 9.00927734375, 9.352294921875, 9.6953125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 4.0, 11.0, 16.0, 7.0, 23.0, 17.0, 27.0, 27.0, 37.0, 47.0, 38.0, 55.0, 64.0, 93.0, 154.0, 1505.0, 337.0, 127.0, 82.0, 53.0, 38.0, 35.0, 33.0, 31.0, 26.0, 24.0, 17.0, 15.0, 18.0, 18.0, 8.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.51171875, -23.7421875, -22.97265625, -22.203125, -21.43359375, -20.6640625, -19.89453125, -19.125, -18.35546875, -17.5859375, -16.81640625, -16.046875, -15.27734375, -14.5078125, -13.73828125, -12.96875, -12.19921875, -11.4296875, -10.66015625, -9.890625, -9.12109375, -8.3515625, -7.58203125, -6.8125, -6.04296875, -5.2734375, -4.50390625, -3.734375, -2.96484375, -2.1953125, -1.42578125, -0.65625, 0.11328125, 0.8828125, 1.65234375, 2.421875, 3.19140625, 3.9609375, 4.73046875, 5.5, 6.26953125, 7.0390625, 7.80859375, 8.578125, 9.34765625, 10.1171875, 10.88671875, 11.65625, 12.42578125, 13.1953125, 13.96484375, 14.734375, 15.50390625, 16.2734375, 17.04296875, 17.8125, 18.58203125, 19.3515625, 20.12109375, 20.890625, 21.66015625, 22.4296875, 23.19921875, 23.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 5.0, 7.0, 7.0, 8.0, 13.0, 17.0, 23.0, 37.0, 31.0, 50.0, 48.0, 82.0, 117.0, 176.0, 328.0, 872.0, 5860.0, 308191.0, 2803321.0, 23638.0, 1613.0, 439.0, 252.0, 140.0, 127.0, 62.0, 47.0, 42.0, 35.0, 24.0, 18.0, 19.0, 11.0, 9.0, 9.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.0, -46.55517578125, -45.1103515625, -43.66552734375, -42.220703125, -40.77587890625, -39.3310546875, -37.88623046875, -36.44140625, -34.99658203125, -33.5517578125, -32.10693359375, -30.662109375, -29.21728515625, -27.7724609375, -26.32763671875, -24.8828125, -23.43798828125, -21.9931640625, -20.54833984375, -19.103515625, -17.65869140625, -16.2138671875, -14.76904296875, -13.32421875, -11.87939453125, -10.4345703125, -8.98974609375, -7.544921875, -6.10009765625, -4.6552734375, -3.21044921875, -1.765625, -0.32080078125, 1.1240234375, 2.56884765625, 4.013671875, 5.45849609375, 6.9033203125, 8.34814453125, 9.79296875, 11.23779296875, 12.6826171875, 14.12744140625, 15.572265625, 17.01708984375, 18.4619140625, 19.90673828125, 21.3515625, 22.79638671875, 24.2412109375, 25.68603515625, 27.130859375, 28.57568359375, 30.0205078125, 31.46533203125, 32.91015625, 34.35498046875, 35.7998046875, 37.24462890625, 38.689453125, 40.13427734375, 41.5791015625, 43.02392578125, 44.46875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 287.0, 726.0], "bins": [-859.6781005859375, -846.0603637695312, -832.442626953125, -818.8248901367188, -805.2070922851562, -791.58935546875, -777.9716186523438, -764.3538818359375, -750.7361450195312, -737.118408203125, -723.5006713867188, -709.8829345703125, -696.26513671875, -682.6473999023438, -669.0296630859375, -655.4119262695312, -641.794189453125, -628.1764526367188, -614.5587158203125, -600.9409790039062, -587.3231811523438, -573.7054443359375, -560.0877075195312, -546.469970703125, -532.8522338867188, -519.2344970703125, -505.6167297363281, -491.9989929199219, -478.3812561035156, -464.76348876953125, -451.145751953125, -437.52801513671875, -423.91021728515625, -410.29248046875, -396.6747131347656, -383.0569763183594, -369.4392395019531, -355.82147216796875, -342.2037353515625, -328.58599853515625, -314.96826171875, -301.35052490234375, -287.7327575683594, -274.1150207519531, -260.4972839355469, -246.87953186035156, -233.26177978515625, -219.64404296875, -206.0262908935547, -192.40853881835938, -178.79080200195312, -165.1730499267578, -151.55531311035156, -137.93756103515625, -124.31981658935547, -110.70207214355469, -97.08433532714844, -83.46659088134766, -69.84884643554688, -56.23109817504883, -42.61335372924805, -28.99560546875, -15.377861022949219, -1.7601165771484375, 11.857630729675293]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 14.0, 13.0, 12.0, 19.0, 19.0, 21.0, 29.0, 27.0, 26.0, 30.0, 32.0, 32.0, 37.0, 38.0, 39.0, 30.0, 42.0, 33.0, 41.0, 41.0, 27.0, 42.0, 28.0, 41.0, 31.0, 26.0, 29.0, 21.0, 20.0, 15.0, 20.0, 17.0, 13.0, 16.0, 10.0, 12.0, 8.0, 1.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.64727020263672, -48.03639602661133, -46.4255256652832, -44.81465148925781, -43.20378112792969, -41.5929069519043, -39.98203659057617, -38.37116241455078, -36.760292053222656, -35.149417877197266, -33.53854751586914, -31.927675247192383, -30.316802978515625, -28.705928802490234, -27.09505844116211, -25.48418426513672, -23.87331199645996, -22.262439727783203, -20.651567459106445, -19.040695190429688, -17.42982292175293, -15.818949699401855, -14.208077430725098, -12.59720516204834, -10.986332893371582, -9.375460624694824, -7.764588356018066, -6.15371561050415, -4.542843341827393, -2.9319705963134766, -1.3210983276367188, 0.28977394104003906, 1.9006462097167969, 3.5115184783935547, 5.1223907470703125, 6.7332634925842285, 8.344135284423828, 9.955008506774902, 11.56588077545166, 13.176753044128418, 14.787625312805176, 16.39849853515625, 18.009370803833008, 19.620243072509766, 21.231115341186523, 22.84198760986328, 24.45285987854004, 26.063732147216797, 27.674604415893555, 29.285476684570312, 30.89634895324707, 32.50722122192383, 34.11809539794922, 35.728965759277344, 37.339839935302734, 38.95071029663086, 40.56158447265625, 42.17245864868164, 43.783329010009766, 45.394203186035156, 47.00507354736328, 48.61594772338867, 50.2268180847168, 51.83769226074219, 53.44856262207031]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 13.0, 5.0, 5.0, 14.0, 8.0, 5.0, 23.0, 12.0, 26.0, 16.0, 15.0, 31.0, 25.0, 32.0, 34.0, 32.0, 55.0, 30.0, 36.0, 40.0, 44.0, 26.0, 32.0, 37.0, 47.0, 39.0, 33.0, 40.0, 37.0, 27.0, 26.0, 20.0, 21.0, 16.0, 24.0, 15.0, 10.0, 12.0, 8.0, 9.0, 10.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.0390625, -7.802734375, -7.56640625, -7.330078125, -7.09375, -6.857421875, -6.62109375, -6.384765625, -6.1484375, -5.912109375, -5.67578125, -5.439453125, -5.203125, -4.966796875, -4.73046875, -4.494140625, -4.2578125, -4.021484375, -3.78515625, -3.548828125, -3.3125, -3.076171875, -2.83984375, -2.603515625, -2.3671875, -2.130859375, -1.89453125, -1.658203125, -1.421875, -1.185546875, -0.94921875, -0.712890625, -0.4765625, -0.240234375, -0.00390625, 0.232421875, 0.46875, 0.705078125, 0.94140625, 1.177734375, 1.4140625, 1.650390625, 1.88671875, 2.123046875, 2.359375, 2.595703125, 2.83203125, 3.068359375, 3.3046875, 3.541015625, 3.77734375, 4.013671875, 4.25, 4.486328125, 4.72265625, 4.958984375, 5.1953125, 5.431640625, 5.66796875, 5.904296875, 6.140625, 6.376953125, 6.61328125, 6.849609375, 7.0859375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 2.0, 6.0, 11.0, 6.0, 14.0, 13.0, 17.0, 16.0, 24.0, 23.0, 45.0, 79.0, 105.0, 244.0, 562.0, 1617.0, 6034.0, 26802.0, 149731.0, 828422.0, 2088218.0, 891311.0, 162119.0, 29091.0, 6558.0, 1832.0, 689.0, 255.0, 139.0, 77.0, 54.0, 34.0, 21.0, 14.0, 23.0, 24.0, 10.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.21875, -12.824462890625, -12.43017578125, -12.035888671875, -11.6416015625, -11.247314453125, -10.85302734375, -10.458740234375, -10.064453125, -9.670166015625, -9.27587890625, -8.881591796875, -8.4873046875, -8.093017578125, -7.69873046875, -7.304443359375, -6.91015625, -6.515869140625, -6.12158203125, -5.727294921875, -5.3330078125, -4.938720703125, -4.54443359375, -4.150146484375, -3.755859375, -3.361572265625, -2.96728515625, -2.572998046875, -2.1787109375, -1.784423828125, -1.39013671875, -0.995849609375, -0.6015625, -0.207275390625, 0.18701171875, 0.581298828125, 0.9755859375, 1.369873046875, 1.76416015625, 2.158447265625, 2.552734375, 2.947021484375, 3.34130859375, 3.735595703125, 4.1298828125, 4.524169921875, 4.91845703125, 5.312744140625, 5.70703125, 6.101318359375, 6.49560546875, 6.889892578125, 7.2841796875, 7.678466796875, 8.07275390625, 8.467041015625, 8.861328125, 9.255615234375, 9.64990234375, 10.044189453125, 10.4384765625, 10.832763671875, 11.22705078125, 11.621337890625, 12.015625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 14.0, 19.0, 19.0, 40.0, 47.0, 65.0, 93.0, 135.0, 182.0, 243.0, 386.0, 457.0, 473.0, 463.0, 372.0, 276.0, 222.0, 168.0, 109.0, 91.0, 50.0, 31.0, 36.0, 21.0, 16.0, 12.0, 9.0, 6.0, 10.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.08642578125, -11.6806640625, -11.27490234375, -10.869140625, -10.46337890625, -10.0576171875, -9.65185546875, -9.24609375, -8.84033203125, -8.4345703125, -8.02880859375, -7.623046875, -7.21728515625, -6.8115234375, -6.40576171875, -6.0, -5.59423828125, -5.1884765625, -4.78271484375, -4.376953125, -3.97119140625, -3.5654296875, -3.15966796875, -2.75390625, -2.34814453125, -1.9423828125, -1.53662109375, -1.130859375, -0.72509765625, -0.3193359375, 0.08642578125, 0.4921875, 0.89794921875, 1.3037109375, 1.70947265625, 2.115234375, 2.52099609375, 2.9267578125, 3.33251953125, 3.73828125, 4.14404296875, 4.5498046875, 4.95556640625, 5.361328125, 5.76708984375, 6.1728515625, 6.57861328125, 6.984375, 7.39013671875, 7.7958984375, 8.20166015625, 8.607421875, 9.01318359375, 9.4189453125, 9.82470703125, 10.23046875, 10.63623046875, 11.0419921875, 11.44775390625, 11.853515625, 12.25927734375, 12.6650390625, 13.07080078125, 13.4765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 14.0, 12.0, 17.0, 24.0, 35.0, 46.0, 61.0, 134.0, 189.0, 314.0, 570.0, 1258.0, 6682.0, 101962.0, 2479250.0, 1539577.0, 57243.0, 4527.0, 1052.0, 497.0, 293.0, 175.0, 112.0, 74.0, 62.0, 32.0, 21.0, 10.0, 9.0, 8.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.25, -33.268798828125, -32.28759765625, -31.306396484375, -30.3251953125, -29.343994140625, -28.36279296875, -27.381591796875, -26.400390625, -25.419189453125, -24.43798828125, -23.456787109375, -22.4755859375, -21.494384765625, -20.51318359375, -19.531982421875, -18.55078125, -17.569580078125, -16.58837890625, -15.607177734375, -14.6259765625, -13.644775390625, -12.66357421875, -11.682373046875, -10.701171875, -9.719970703125, -8.73876953125, -7.757568359375, -6.7763671875, -5.795166015625, -4.81396484375, -3.832763671875, -2.8515625, -1.870361328125, -0.88916015625, 0.092041015625, 1.0732421875, 2.054443359375, 3.03564453125, 4.016845703125, 4.998046875, 5.979248046875, 6.96044921875, 7.941650390625, 8.9228515625, 9.904052734375, 10.88525390625, 11.866455078125, 12.84765625, 13.828857421875, 14.81005859375, 15.791259765625, 16.7724609375, 17.753662109375, 18.73486328125, 19.716064453125, 20.697265625, 21.678466796875, 22.65966796875, 23.640869140625, 24.6220703125, 25.603271484375, 26.58447265625, 27.565673828125, 28.546875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 34.0, 145.0, 332.0, 338.0, 130.0, 24.0, 9.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.7858123779297, -221.11129760742188, -215.43679809570312, -209.7622833251953, -204.0877685546875, -198.41326904296875, -192.73875427246094, -187.06423950195312, -181.38973999023438, -175.71522521972656, -170.0407257080078, -164.3662109375, -158.69171142578125, -153.01719665527344, -147.34268188476562, -141.66818237304688, -135.99366760253906, -130.31915283203125, -124.6446533203125, -118.97013854980469, -113.2956314086914, -107.62112426757812, -101.94660949707031, -96.27210235595703, -90.59759521484375, -84.92308807373047, -79.24858093261719, -73.57406616210938, -67.8995590209961, -62.22505187988281, -56.550540924072266, -50.87602996826172, -45.2015380859375, -39.52703094482422, -33.85251998901367, -28.178010940551758, -22.503501892089844, -16.82899284362793, -11.154483795166016, -5.479972839355469, 0.1945343017578125, 5.869043350219727, 11.54355239868164, 17.218061447143555, 22.89257049560547, 28.567079544067383, 34.2415885925293, 39.916099548339844, 45.590606689453125, 51.265113830566406, 56.93962478637695, 62.6141357421875, 68.28864288330078, 73.96315002441406, 79.63766479492188, 85.31217193603516, 90.98667907714844, 96.66118621826172, 102.335693359375, 108.01020812988281, 113.6847152709961, 119.35922241210938, 125.03373718261719, 130.708251953125, 136.38275146484375]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 14.0, 10.0, 13.0, 16.0, 19.0, 14.0, 17.0, 15.0, 21.0, 26.0, 32.0, 23.0, 27.0, 47.0, 42.0, 46.0, 30.0, 43.0, 30.0, 44.0, 46.0, 41.0, 32.0, 29.0, 38.0, 35.0, 28.0, 28.0, 22.0, 14.0, 18.0, 14.0, 16.0, 14.0, 8.0, 13.0, 8.0, 11.0, 8.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.63477325439453, -31.51970863342285, -30.40464210510254, -29.28957748413086, -28.174510955810547, -27.059446334838867, -25.944381713867188, -24.829315185546875, -23.714250564575195, -22.599185943603516, -21.484119415283203, -20.369054794311523, -19.253990173339844, -18.13892364501953, -17.02385902404785, -15.908793449401855, -14.79372787475586, -13.678662300109863, -12.563596725463867, -11.448532104492188, -10.333466529846191, -9.218400955200195, -8.103336334228516, -6.9882707595825195, -5.873205184936523, -4.758139610290527, -3.6430745124816895, -2.5280091762542725, -1.4129438400268555, -0.2978782653808594, 0.8171868324279785, 1.9322519302368164, 3.0473175048828125, 4.162383079528809, 5.2774481773376465, 6.392513275146484, 7.5075788497924805, 8.622644424438477, 9.737709045410156, 10.852774620056152, 11.967840194702148, 13.082905769348145, 14.19797134399414, 15.31303596496582, 16.4281005859375, 17.543167114257812, 18.658231735229492, 19.773296356201172, 20.888362884521484, 22.003427505493164, 23.118494033813477, 24.233558654785156, 25.34862518310547, 26.46368980407715, 27.578754425048828, 28.69382095336914, 29.80888557434082, 30.9239501953125, 32.03901672363281, 33.154083251953125, 34.26914596557617, 35.384212493896484, 36.4992790222168, 37.614341735839844, 38.729408264160156]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 9.0, 9.0, 12.0, 13.0, 11.0, 15.0, 13.0, 19.0, 17.0, 21.0, 25.0, 18.0, 22.0, 22.0, 26.0, 27.0, 33.0, 38.0, 41.0, 43.0, 41.0, 35.0, 56.0, 57.0, 30.0, 34.0, 45.0, 26.0, 31.0, 21.0, 25.0, 19.0, 13.0, 16.0, 15.0, 14.0, 14.0, 12.0, 17.0, 5.0, 9.0, 5.0, 5.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0], "bins": [-6.8046875, -6.59197998046875, -6.3792724609375, -6.16656494140625, -5.953857421875, -5.74114990234375, -5.5284423828125, -5.31573486328125, -5.10302734375, -4.89031982421875, -4.6776123046875, -4.46490478515625, -4.252197265625, -4.03948974609375, -3.8267822265625, -3.61407470703125, -3.4013671875, -3.18865966796875, -2.9759521484375, -2.76324462890625, -2.550537109375, -2.33782958984375, -2.1251220703125, -1.91241455078125, -1.69970703125, -1.48699951171875, -1.2742919921875, -1.06158447265625, -0.848876953125, -0.63616943359375, -0.4234619140625, -0.21075439453125, 0.001953125, 0.21466064453125, 0.4273681640625, 0.64007568359375, 0.852783203125, 1.06549072265625, 1.2781982421875, 1.49090576171875, 1.70361328125, 1.91632080078125, 2.1290283203125, 2.34173583984375, 2.554443359375, 2.76715087890625, 2.9798583984375, 3.19256591796875, 3.4052734375, 3.61798095703125, 3.8306884765625, 4.04339599609375, 4.256103515625, 4.46881103515625, 4.6815185546875, 4.89422607421875, 5.10693359375, 5.31964111328125, 5.5323486328125, 5.74505615234375, 5.957763671875, 6.17047119140625, 6.3831787109375, 6.59588623046875, 6.80859375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 6.0, 19.0, 17.0, 31.0, 50.0, 75.0, 121.0, 186.0, 270.0, 405.0, 601.0, 877.0, 1313.0, 2015.0, 2843.0, 4180.0, 6116.0, 8778.0, 12964.0, 18413.0, 26072.0, 36334.0, 49126.0, 64405.0, 81089.0, 97229.0, 107364.0, 107635.0, 97824.0, 82029.0, 65807.0, 50152.0, 36898.0, 26499.0, 18663.0, 13108.0, 9096.0, 6390.0, 4385.0, 3012.0, 1983.0, 1414.0, 932.0, 598.0, 407.0, 299.0, 201.0, 122.0, 80.0, 56.0, 34.0, 12.0, 17.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49286651611328125, -0.4764556884765625, -0.46004486083984375, -0.443634033203125, -0.42722320556640625, -0.4108123779296875, -0.39440155029296875, -0.37799072265625, -0.36157989501953125, -0.3451690673828125, -0.32875823974609375, -0.312347412109375, -0.29593658447265625, -0.2795257568359375, -0.26311492919921875, -0.2467041015625, -0.23029327392578125, -0.2138824462890625, -0.19747161865234375, -0.181060791015625, -0.16464996337890625, -0.1482391357421875, -0.13182830810546875, -0.11541748046875, -0.09900665283203125, -0.0825958251953125, -0.06618499755859375, -0.049774169921875, -0.03336334228515625, -0.0169525146484375, -0.00054168701171875, 0.015869140625, 0.03227996826171875, 0.0486907958984375, 0.06510162353515625, 0.081512451171875, 0.09792327880859375, 0.1143341064453125, 0.13074493408203125, 0.14715576171875, 0.16356658935546875, 0.1799774169921875, 0.19638824462890625, 0.212799072265625, 0.22920989990234375, 0.2456207275390625, 0.26203155517578125, 0.2784423828125, 0.29485321044921875, 0.3112640380859375, 0.32767486572265625, 0.344085693359375, 0.36049652099609375, 0.3769073486328125, 0.39331817626953125, 0.40972900390625, 0.42613983154296875, 0.4425506591796875, 0.45896148681640625, 0.475372314453125, 0.49178314208984375, 0.5081939697265625, 0.5246047973632812, 0.541015625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 5.0, 13.0, 16.0, 9.0, 23.0, 16.0, 33.0, 38.0, 29.0, 38.0, 31.0, 43.0, 38.0, 46.0, 41.0, 1074.0, 51.0, 54.0, 45.0, 34.0, 40.0, 38.0, 40.0, 39.0, 35.0, 25.0, 24.0, 12.0, 13.0, 14.0, 9.0, 11.0, 6.0, 5.0, 5.0, 11.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.74090576171875, -6.5364990234375, -6.33209228515625, -6.127685546875, -5.92327880859375, -5.7188720703125, -5.51446533203125, -5.31005859375, -5.10565185546875, -4.9012451171875, -4.69683837890625, -4.492431640625, -4.28802490234375, -4.0836181640625, -3.87921142578125, -3.6748046875, -3.47039794921875, -3.2659912109375, -3.06158447265625, -2.857177734375, -2.65277099609375, -2.4483642578125, -2.24395751953125, -2.03955078125, -1.83514404296875, -1.6307373046875, -1.42633056640625, -1.221923828125, -1.01751708984375, -0.8131103515625, -0.60870361328125, -0.404296875, -0.19989013671875, 0.0045166015625, 0.20892333984375, 0.413330078125, 0.61773681640625, 0.8221435546875, 1.02655029296875, 1.23095703125, 1.43536376953125, 1.6397705078125, 1.84417724609375, 2.048583984375, 2.25299072265625, 2.4573974609375, 2.66180419921875, 2.8662109375, 3.07061767578125, 3.2750244140625, 3.47943115234375, 3.683837890625, 3.88824462890625, 4.0926513671875, 4.29705810546875, 4.50146484375, 4.70587158203125, 4.9102783203125, 5.11468505859375, 5.319091796875, 5.52349853515625, 5.7279052734375, 5.93231201171875, 6.13671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 11.0, 11.0, 14.0, 18.0, 34.0, 53.0, 69.0, 131.0, 171.0, 280.0, 448.0, 676.0, 1017.0, 1687.0, 2505.0, 4117.0, 6352.0, 10259.0, 16045.0, 25542.0, 39444.0, 58262.0, 84190.0, 111877.0, 237847.0, 1079289.0, 123752.0, 95026.0, 68342.0, 46290.0, 30245.0, 19513.0, 12352.0, 7763.0, 4875.0, 3183.0, 1926.0, 1253.0, 849.0, 493.0, 306.0, 217.0, 134.0, 93.0, 52.0, 49.0, 20.0, 12.0, 15.0, 10.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.449462890625, -0.4355049133300781, -0.42154693603515625, -0.4075889587402344, -0.3936309814453125, -0.3796730041503906, -0.36571502685546875, -0.3517570495605469, -0.337799072265625, -0.3238410949707031, -0.30988311767578125, -0.2959251403808594, -0.2819671630859375, -0.2680091857910156, -0.25405120849609375, -0.24009323120117188, -0.22613525390625, -0.21217727661132812, -0.19821929931640625, -0.18426132202148438, -0.1703033447265625, -0.15634536743164062, -0.14238739013671875, -0.12842941284179688, -0.114471435546875, -0.10051345825195312, -0.08655548095703125, -0.07259750366210938, -0.0586395263671875, -0.044681549072265625, -0.03072357177734375, -0.016765594482421875, -0.0028076171875, 0.011150360107421875, 0.02510833740234375, 0.039066314697265625, 0.0530242919921875, 0.06698226928710938, 0.08094024658203125, 0.09489822387695312, 0.108856201171875, 0.12281417846679688, 0.13677215576171875, 0.15073013305664062, 0.1646881103515625, 0.17864608764648438, 0.19260406494140625, 0.20656204223632812, 0.22052001953125, 0.23447799682617188, 0.24843597412109375, 0.2623939514160156, 0.2763519287109375, 0.2903099060058594, 0.30426788330078125, 0.3182258605957031, 0.332183837890625, 0.3461418151855469, 0.36009979248046875, 0.3740577697753906, 0.3880157470703125, 0.4019737243652344, 0.41593170166015625, 0.4298896789550781, 0.44384765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 11.0, 16.0, 15.0, 16.0, 26.0, 18.0, 37.0, 43.0, 66.0, 93.0, 139.0, 117.0, 98.0, 61.0, 54.0, 47.0, 29.0, 18.0, 20.0, 14.0, 9.0, 9.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05780029296875, -0.05587577819824219, -0.053951263427734375, -0.05202674865722656, -0.05010223388671875, -0.04817771911621094, -0.046253204345703125, -0.04432868957519531, -0.0424041748046875, -0.04047966003417969, -0.038555145263671875, -0.03663063049316406, -0.03470611572265625, -0.03278160095214844, -0.030857086181640625, -0.028932571411132812, -0.027008056640625, -0.025083541870117188, -0.023159027099609375, -0.021234512329101562, -0.01930999755859375, -0.017385482788085938, -0.015460968017578125, -0.013536453247070312, -0.0116119384765625, -0.009687423706054688, -0.007762908935546875, -0.0058383941650390625, -0.00391387939453125, -0.0019893646240234375, -6.4849853515625e-05, 0.0018596649169921875, 0.0037841796875, 0.0057086944580078125, 0.007633209228515625, 0.009557723999023438, 0.01148223876953125, 0.013406753540039062, 0.015331268310546875, 0.017255783081054688, 0.0191802978515625, 0.021104812622070312, 0.023029327392578125, 0.024953842163085938, 0.02687835693359375, 0.028802871704101562, 0.030727386474609375, 0.03265190124511719, 0.034576416015625, 0.03650093078613281, 0.038425445556640625, 0.04034996032714844, 0.04227447509765625, 0.04419898986816406, 0.046123504638671875, 0.04804801940917969, 0.0499725341796875, 0.05189704895019531, 0.053821563720703125, 0.05574607849121094, 0.05767059326171875, 0.05959510803222656, 0.061519622802734375, 0.06344413757324219, 0.06536865234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 9.0, 9.0, 10.0, 16.0, 16.0, 34.0, 40.0, 78.0, 124.0, 252.0, 788.0, 1015425.0, 30741.0, 540.0, 189.0, 99.0, 47.0, 35.0, 28.0, 11.0, 19.0, 13.0, 7.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6272430419921875, -1.577728271484375, -1.5282135009765625, -1.47869873046875, -1.4291839599609375, -1.379669189453125, -1.3301544189453125, -1.2806396484375, -1.2311248779296875, -1.181610107421875, -1.1320953369140625, -1.08258056640625, -1.0330657958984375, -0.983551025390625, -0.9340362548828125, -0.884521484375, -0.8350067138671875, -0.785491943359375, -0.7359771728515625, -0.68646240234375, -0.6369476318359375, -0.587432861328125, -0.5379180908203125, -0.4884033203125, -0.4388885498046875, -0.389373779296875, -0.3398590087890625, -0.29034423828125, -0.2408294677734375, -0.191314697265625, -0.1417999267578125, -0.09228515625, -0.0427703857421875, 0.006744384765625, 0.0562591552734375, 0.10577392578125, 0.1552886962890625, 0.204803466796875, 0.2543182373046875, 0.3038330078125, 0.3533477783203125, 0.402862548828125, 0.4523773193359375, 0.50189208984375, 0.5514068603515625, 0.600921630859375, 0.6504364013671875, 0.699951171875, 0.7494659423828125, 0.798980712890625, 0.8484954833984375, 0.89801025390625, 0.9475250244140625, 0.997039794921875, 1.0465545654296875, 1.0960693359375, 1.1455841064453125, 1.195098876953125, 1.2446136474609375, 1.29412841796875, 1.3436431884765625, 1.393157958984375, 1.4426727294921875, 1.4921875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 40.0, 801.0, 152.0, 14.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8977954387664795, -0.8807346820831299, -0.8636739253997803, -0.8466131687164307, -0.829552412033081, -0.8124916553497314, -0.7954308986663818, -0.7783701419830322, -0.7613093852996826, -0.744248628616333, -0.7271878719329834, -0.7101271152496338, -0.6930663585662842, -0.6760056018829346, -0.658944845199585, -0.6418840885162354, -0.6248233318328857, -0.6077625751495361, -0.5907018184661865, -0.5736410617828369, -0.5565803050994873, -0.5395195484161377, -0.5224587917327881, -0.5053980350494385, -0.4883372187614441, -0.4712764620780945, -0.4542157053947449, -0.43715494871139526, -0.42009419202804565, -0.40303343534469604, -0.38597267866134644, -0.3689119219779968, -0.3518511950969696, -0.33479043841362, -0.3177296817302704, -0.3006689250469208, -0.28360816836357117, -0.26654741168022156, -0.24948664009571075, -0.23242588341236115, -0.21536512672901154, -0.19830437004566193, -0.18124361336231232, -0.1641828417778015, -0.1471220850944519, -0.1300613284111023, -0.11300057172775269, -0.09593981504440308, -0.07887905836105347, -0.06181830167770386, -0.04475754126906395, -0.027696780860424042, -0.010636024177074432, 0.006424732506275177, 0.023485496640205383, 0.04054625332355499, 0.0576070100069046, 0.07466776669025421, 0.09172852337360382, 0.10878928750753403, 0.12585005164146423, 0.14291080832481384, 0.15997156500816345, 0.17703232169151306, 0.19409307837486267]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 8.0, 6.0, 3.0, 11.0, 15.0, 16.0, 20.0, 23.0, 27.0, 22.0, 24.0, 44.0, 33.0, 28.0, 35.0, 42.0, 36.0, 48.0, 40.0, 45.0, 47.0, 38.0, 43.0, 32.0, 34.0, 43.0, 24.0, 32.0, 24.0, 24.0, 19.0, 29.0, 16.0, 14.0, 13.0, 6.0, 2.0, 11.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11979502439498901, -0.11590801179409027, -0.11202099174261093, -0.10813397914171219, -0.10424695909023285, -0.1003599464893341, -0.09647293388843536, -0.09258592128753662, -0.08869890123605728, -0.08481188863515854, -0.0809248685836792, -0.07703785598278046, -0.07315084338188171, -0.06926382333040237, -0.06537681072950363, -0.06148979440331459, -0.05760277807712555, -0.05371576175093651, -0.04982874542474747, -0.045941732823848724, -0.04205471649765968, -0.03816770017147064, -0.0342806875705719, -0.03039367124438286, -0.026506654918193817, -0.022619638592004776, -0.018732624128460884, -0.014845608733594418, -0.010958593338727951, -0.00707157701253891, -0.003184562548995018, 0.0007024519145488739, 0.004589468240737915, 0.008476483635604382, 0.012363499030470848, 0.01625051349401474, 0.02013752982020378, 0.024024546146392822, 0.027911560609936714, 0.031798575073480606, 0.03568559139966965, 0.03957260772585869, 0.04345962405204773, 0.04734663665294647, 0.05123365297913551, 0.055120669305324554, 0.0590076819062233, 0.06289470195770264, 0.06678171455860138, 0.07066872715950012, 0.07455574721097946, 0.0784427598118782, 0.08232977986335754, 0.08621679246425629, 0.09010380506515503, 0.09399081766605377, 0.09787783771753311, 0.10176485031843185, 0.1056518703699112, 0.10953888297080994, 0.11342589557170868, 0.11731291562318802, 0.12119992822408676, 0.1250869482755661, 0.12897396087646484]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 8.0, 11.0, 11.0, 14.0, 11.0, 16.0, 20.0, 21.0, 16.0, 22.0, 22.0, 25.0, 25.0, 30.0, 39.0, 30.0, 35.0, 35.0, 41.0, 38.0, 43.0, 34.0, 42.0, 44.0, 34.0, 36.0, 31.0, 32.0, 35.0, 22.0, 30.0, 19.0, 15.0, 17.0, 13.0, 20.0, 7.0, 8.0, 8.0, 10.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.8671875, -6.647705078125, -6.42822265625, -6.208740234375, -5.9892578125, -5.769775390625, -5.55029296875, -5.330810546875, -5.111328125, -4.891845703125, -4.67236328125, -4.452880859375, -4.2333984375, -4.013916015625, -3.79443359375, -3.574951171875, -3.35546875, -3.135986328125, -2.91650390625, -2.697021484375, -2.4775390625, -2.258056640625, -2.03857421875, -1.819091796875, -1.599609375, -1.380126953125, -1.16064453125, -0.941162109375, -0.7216796875, -0.502197265625, -0.28271484375, -0.063232421875, 0.15625, 0.375732421875, 0.59521484375, 0.814697265625, 1.0341796875, 1.253662109375, 1.47314453125, 1.692626953125, 1.912109375, 2.131591796875, 2.35107421875, 2.570556640625, 2.7900390625, 3.009521484375, 3.22900390625, 3.448486328125, 3.66796875, 3.887451171875, 4.10693359375, 4.326416015625, 4.5458984375, 4.765380859375, 4.98486328125, 5.204345703125, 5.423828125, 5.643310546875, 5.86279296875, 6.082275390625, 6.3017578125, 6.521240234375, 6.74072265625, 6.960205078125, 7.1796875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 12.0, 13.0, 27.0, 27.0, 39.0, 40.0, 55.0, 76.0, 102.0, 127.0, 235.0, 370.0, 714.0, 1586.0, 3635.0, 8371.0, 19907.0, 53531.0, 268193.0, 550267.0, 90666.0, 28857.0, 11903.0, 5196.0, 2225.0, 1006.0, 489.0, 265.0, 170.0, 117.0, 75.0, 50.0, 44.0, 33.0, 20.0, 22.0, 18.0, 14.0, 15.0, 6.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.9161376953125, -12.488525390625, -12.0609130859375, -11.63330078125, -11.2056884765625, -10.778076171875, -10.3504638671875, -9.9228515625, -9.4952392578125, -9.067626953125, -8.6400146484375, -8.21240234375, -7.7847900390625, -7.357177734375, -6.9295654296875, -6.501953125, -6.0743408203125, -5.646728515625, -5.2191162109375, -4.79150390625, -4.3638916015625, -3.936279296875, -3.5086669921875, -3.0810546875, -2.6534423828125, -2.225830078125, -1.7982177734375, -1.37060546875, -0.9429931640625, -0.515380859375, -0.0877685546875, 0.33984375, 0.7674560546875, 1.195068359375, 1.6226806640625, 2.05029296875, 2.4779052734375, 2.905517578125, 3.3331298828125, 3.7607421875, 4.1883544921875, 4.615966796875, 5.0435791015625, 5.47119140625, 5.8988037109375, 6.326416015625, 6.7540283203125, 7.181640625, 7.6092529296875, 8.036865234375, 8.4644775390625, 8.89208984375, 9.3197021484375, 9.747314453125, 10.1749267578125, 10.6025390625, 11.0301513671875, 11.457763671875, 11.8853759765625, 12.31298828125, 12.7406005859375, 13.168212890625, 13.5958251953125, 14.0234375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 14.0, 15.0, 20.0, 22.0, 32.0, 28.0, 30.0, 44.0, 38.0, 54.0, 54.0, 75.0, 152.0, 1444.0, 403.0, 118.0, 76.0, 58.0, 41.0, 46.0, 42.0, 21.0, 34.0, 23.0, 16.0, 22.0, 15.0, 13.0, 14.0, 11.0, 11.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.8125, -25.114013671875, -24.41552734375, -23.717041015625, -23.0185546875, -22.320068359375, -21.62158203125, -20.923095703125, -20.224609375, -19.526123046875, -18.82763671875, -18.129150390625, -17.4306640625, -16.732177734375, -16.03369140625, -15.335205078125, -14.63671875, -13.938232421875, -13.23974609375, -12.541259765625, -11.8427734375, -11.144287109375, -10.44580078125, -9.747314453125, -9.048828125, -8.350341796875, -7.65185546875, -6.953369140625, -6.2548828125, -5.556396484375, -4.85791015625, -4.159423828125, -3.4609375, -2.762451171875, -2.06396484375, -1.365478515625, -0.6669921875, 0.031494140625, 0.72998046875, 1.428466796875, 2.126953125, 2.825439453125, 3.52392578125, 4.222412109375, 4.9208984375, 5.619384765625, 6.31787109375, 7.016357421875, 7.71484375, 8.413330078125, 9.11181640625, 9.810302734375, 10.5087890625, 11.207275390625, 11.90576171875, 12.604248046875, 13.302734375, 14.001220703125, 14.69970703125, 15.398193359375, 16.0966796875, 16.795166015625, 17.49365234375, 18.192138671875, 18.890625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 17.0, 11.0, 26.0, 19.0, 37.0, 40.0, 52.0, 67.0, 86.0, 156.0, 220.0, 339.0, 1075.0, 7779.0, 205998.0, 2885205.0, 40041.0, 2923.0, 645.0, 297.0, 184.0, 125.0, 97.0, 55.0, 35.0, 33.0, 27.0, 26.0, 16.0, 14.0, 10.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-42.75, -41.3837890625, -40.017578125, -38.6513671875, -37.28515625, -35.9189453125, -34.552734375, -33.1865234375, -31.8203125, -30.4541015625, -29.087890625, -27.7216796875, -26.35546875, -24.9892578125, -23.623046875, -22.2568359375, -20.890625, -19.5244140625, -18.158203125, -16.7919921875, -15.42578125, -14.0595703125, -12.693359375, -11.3271484375, -9.9609375, -8.5947265625, -7.228515625, -5.8623046875, -4.49609375, -3.1298828125, -1.763671875, -0.3974609375, 0.96875, 2.3349609375, 3.701171875, 5.0673828125, 6.43359375, 7.7998046875, 9.166015625, 10.5322265625, 11.8984375, 13.2646484375, 14.630859375, 15.9970703125, 17.36328125, 18.7294921875, 20.095703125, 21.4619140625, 22.828125, 24.1943359375, 25.560546875, 26.9267578125, 28.29296875, 29.6591796875, 31.025390625, 32.3916015625, 33.7578125, 35.1240234375, 36.490234375, 37.8564453125, 39.22265625, 40.5888671875, 41.955078125, 43.3212890625, 44.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 6.0, 42.0, 131.0, 240.0, 263.0, 198.0, 94.0, 31.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11930847167969, -66.83709716796875, -64.55488586425781, -62.272674560546875, -59.99046325683594, -57.708251953125, -55.42604064941406, -53.143829345703125, -50.86161804199219, -48.57940673828125, -46.29719543457031, -44.014984130859375, -41.73277282714844, -39.4505615234375, -37.16835021972656, -34.886138916015625, -32.60392379760742, -30.321712493896484, -28.039501190185547, -25.75728988647461, -23.475078582763672, -21.192867279052734, -18.910654067993164, -16.628442764282227, -14.346231460571289, -12.064020156860352, -9.781808853149414, -7.49959659576416, -5.217385292053223, -2.935173988342285, -0.6529617309570312, 1.6292495727539062, 3.9114608764648438, 6.193672180175781, 8.475883483886719, 10.758095741271973, 13.04030704498291, 15.322518348693848, 17.6047306060791, 19.88694190979004, 22.169153213500977, 24.451364517211914, 26.73357582092285, 29.015789031982422, 31.29800033569336, 33.5802116394043, 35.862422943115234, 38.14463424682617, 40.42684555053711, 42.70905685424805, 44.991268157958984, 47.27347946166992, 49.55569076538086, 51.8379020690918, 54.1201171875, 56.40232849121094, 58.684539794921875, 60.96675109863281, 63.24896240234375, 65.53117370605469, 67.81338500976562, 70.09559631347656, 72.3778076171875, 74.66001892089844, 76.94223022460938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 10.0, 10.0, 8.0, 13.0, 18.0, 15.0, 17.0, 30.0, 19.0, 23.0, 22.0, 34.0, 38.0, 48.0, 31.0, 34.0, 35.0, 45.0, 30.0, 50.0, 35.0, 41.0, 34.0, 29.0, 47.0, 26.0, 37.0, 31.0, 25.0, 16.0, 22.0, 15.0, 23.0, 12.0, 9.0, 11.0, 13.0, 7.0, 1.0, 3.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.43474578857422, -44.89057922363281, -43.346412658691406, -41.80224609375, -40.258079528808594, -38.71391296386719, -37.16974639892578, -35.625579833984375, -34.08141326904297, -32.53724670410156, -30.993080139160156, -29.44891357421875, -27.904747009277344, -26.360580444335938, -24.8164119720459, -23.272245407104492, -21.728076934814453, -20.183910369873047, -18.63974380493164, -17.095577239990234, -15.551409721374512, -14.007243156433105, -12.463075637817383, -10.918909072875977, -9.37474250793457, -7.830575942993164, -6.2864089012146, -4.742241859436035, -3.198075294494629, -1.6539087295532227, -0.1097412109375, 1.4344253540039062, 2.9785919189453125, 4.522758483886719, 6.066925525665283, 7.611092567443848, 9.155259132385254, 10.69942569732666, 12.243593215942383, 13.787759780883789, 15.331926345825195, 16.8760929107666, 18.420259475708008, 19.964427947998047, 21.508594512939453, 23.05276107788086, 24.596927642822266, 26.141094207763672, 27.685260772705078, 29.229427337646484, 30.77359390258789, 32.3177604675293, 33.8619270324707, 35.40609359741211, 36.95026397705078, 38.49443054199219, 40.038597106933594, 41.582763671875, 43.126930236816406, 44.67109680175781, 46.21526336669922, 47.759429931640625, 49.30359649658203, 50.84776306152344, 52.391929626464844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 12.0, 11.0, 17.0, 24.0, 21.0, 15.0, 23.0, 20.0, 23.0, 20.0, 28.0, 22.0, 33.0, 31.0, 42.0, 35.0, 42.0, 42.0, 36.0, 38.0, 46.0, 37.0, 30.0, 34.0, 27.0, 31.0, 26.0, 30.0, 16.0, 24.0, 12.0, 15.0, 11.0, 17.0, 13.0, 16.0, 9.0, 4.0, 8.0, 6.0, 5.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.66796875, -6.45208740234375, -6.2362060546875, -6.02032470703125, -5.804443359375, -5.58856201171875, -5.3726806640625, -5.15679931640625, -4.94091796875, -4.72503662109375, -4.5091552734375, -4.29327392578125, -4.077392578125, -3.86151123046875, -3.6456298828125, -3.42974853515625, -3.2138671875, -2.99798583984375, -2.7821044921875, -2.56622314453125, -2.350341796875, -2.13446044921875, -1.9185791015625, -1.70269775390625, -1.48681640625, -1.27093505859375, -1.0550537109375, -0.83917236328125, -0.623291015625, -0.40740966796875, -0.1915283203125, 0.02435302734375, 0.240234375, 0.45611572265625, 0.6719970703125, 0.88787841796875, 1.103759765625, 1.31964111328125, 1.5355224609375, 1.75140380859375, 1.96728515625, 2.18316650390625, 2.3990478515625, 2.61492919921875, 2.830810546875, 3.04669189453125, 3.2625732421875, 3.47845458984375, 3.6943359375, 3.91021728515625, 4.1260986328125, 4.34197998046875, 4.557861328125, 4.77374267578125, 4.9896240234375, 5.20550537109375, 5.42138671875, 5.63726806640625, 5.8531494140625, 6.06903076171875, 6.284912109375, 6.50079345703125, 6.7166748046875, 6.93255615234375, 7.1484375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 1.0, 5.0, 6.0, 11.0, 14.0, 16.0, 16.0, 19.0, 30.0, 70.0, 84.0, 94.0, 188.0, 404.0, 807.0, 2001.0, 5600.0, 17976.0, 64439.0, 246626.0, 860564.0, 1675608.0, 940800.0, 275674.0, 72561.0, 20266.0, 6413.0, 2099.0, 883.0, 393.0, 204.0, 130.0, 101.0, 50.0, 28.0, 22.0, 22.0, 12.0, 14.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4765625, -9.1761474609375, -8.875732421875, -8.5753173828125, -8.27490234375, -7.9744873046875, -7.674072265625, -7.3736572265625, -7.0732421875, -6.7728271484375, -6.472412109375, -6.1719970703125, -5.87158203125, -5.5711669921875, -5.270751953125, -4.9703369140625, -4.669921875, -4.3695068359375, -4.069091796875, -3.7686767578125, -3.46826171875, -3.1678466796875, -2.867431640625, -2.5670166015625, -2.2666015625, -1.9661865234375, -1.665771484375, -1.3653564453125, -1.06494140625, -0.7645263671875, -0.464111328125, -0.1636962890625, 0.13671875, 0.4371337890625, 0.737548828125, 1.0379638671875, 1.33837890625, 1.6387939453125, 1.939208984375, 2.2396240234375, 2.5400390625, 2.8404541015625, 3.140869140625, 3.4412841796875, 3.74169921875, 4.0421142578125, 4.342529296875, 4.6429443359375, 4.943359375, 5.2437744140625, 5.544189453125, 5.8446044921875, 6.14501953125, 6.4454345703125, 6.745849609375, 7.0462646484375, 7.3466796875, 7.6470947265625, 7.947509765625, 8.2479248046875, 8.54833984375, 8.8487548828125, 9.149169921875, 9.4495849609375, 9.75]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 10.0, 10.0, 9.0, 23.0, 27.0, 39.0, 46.0, 85.0, 102.0, 121.0, 160.0, 264.0, 278.0, 357.0, 405.0, 415.0, 416.0, 322.0, 251.0, 184.0, 130.0, 116.0, 87.0, 66.0, 37.0, 25.0, 26.0, 15.0, 8.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.4732666015625, -10.126220703125, -9.7791748046875, -9.43212890625, -9.0850830078125, -8.738037109375, -8.3909912109375, -8.0439453125, -7.6968994140625, -7.349853515625, -7.0028076171875, -6.65576171875, -6.3087158203125, -5.961669921875, -5.6146240234375, -5.267578125, -4.9205322265625, -4.573486328125, -4.2264404296875, -3.87939453125, -3.5323486328125, -3.185302734375, -2.8382568359375, -2.4912109375, -2.1441650390625, -1.797119140625, -1.4500732421875, -1.10302734375, -0.7559814453125, -0.408935546875, -0.0618896484375, 0.28515625, 0.6322021484375, 0.979248046875, 1.3262939453125, 1.67333984375, 2.0203857421875, 2.367431640625, 2.7144775390625, 3.0615234375, 3.4085693359375, 3.755615234375, 4.1026611328125, 4.44970703125, 4.7967529296875, 5.143798828125, 5.4908447265625, 5.837890625, 6.1849365234375, 6.531982421875, 6.8790283203125, 7.22607421875, 7.5731201171875, 7.920166015625, 8.2672119140625, 8.6142578125, 8.9613037109375, 9.308349609375, 9.6553955078125, 10.00244140625, 10.3494873046875, 10.696533203125, 11.0435791015625, 11.390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 12.0, 13.0, 14.0, 37.0, 39.0, 77.0, 100.0, 151.0, 222.0, 372.0, 743.0, 1707.0, 8071.0, 85963.0, 1724274.0, 2241718.0, 116724.0, 10002.0, 2094.0, 776.0, 416.0, 223.0, 161.0, 100.0, 67.0, 58.0, 36.0, 18.0, 19.0, 20.0, 8.0, 5.0, 9.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.453125, -26.5966796875, -25.740234375, -24.8837890625, -24.02734375, -23.1708984375, -22.314453125, -21.4580078125, -20.6015625, -19.7451171875, -18.888671875, -18.0322265625, -17.17578125, -16.3193359375, -15.462890625, -14.6064453125, -13.75, -12.8935546875, -12.037109375, -11.1806640625, -10.32421875, -9.4677734375, -8.611328125, -7.7548828125, -6.8984375, -6.0419921875, -5.185546875, -4.3291015625, -3.47265625, -2.6162109375, -1.759765625, -0.9033203125, -0.046875, 0.8095703125, 1.666015625, 2.5224609375, 3.37890625, 4.2353515625, 5.091796875, 5.9482421875, 6.8046875, 7.6611328125, 8.517578125, 9.3740234375, 10.23046875, 11.0869140625, 11.943359375, 12.7998046875, 13.65625, 14.5126953125, 15.369140625, 16.2255859375, 17.08203125, 17.9384765625, 18.794921875, 19.6513671875, 20.5078125, 21.3642578125, 22.220703125, 23.0771484375, 23.93359375, 24.7900390625, 25.646484375, 26.5029296875, 27.359375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 15.0, 168.0, 574.0, 235.0, 22.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-476.984375, -468.5560607910156, -460.1277770996094, -451.699462890625, -443.27117919921875, -434.8428649902344, -426.4145812988281, -417.98626708984375, -409.5579833984375, -401.1296691894531, -392.7013854980469, -384.2730712890625, -375.84478759765625, -367.4164733886719, -358.9881896972656, -350.55987548828125, -342.1315612792969, -333.7032470703125, -325.27496337890625, -316.8466491699219, -308.4183654785156, -299.99005126953125, -291.561767578125, -283.1334533691406, -274.70513916015625, -266.2768249511719, -257.8485412597656, -249.4202423095703, -240.991943359375, -232.56362915039062, -224.1353302001953, -215.70703125, -207.27871704101562, -198.8504180908203, -190.422119140625, -181.9938201904297, -173.56552124023438, -165.13720703125, -156.7089080810547, -148.28060913085938, -139.85231018066406, -131.42401123046875, -122.99571228027344, -114.5674057006836, -106.13910675048828, -97.71080780029297, -89.28250122070312, -80.85420227050781, -72.4259033203125, -63.99760437011719, -55.56930160522461, -47.14099884033203, -38.71269989013672, -30.284400939941406, -21.856098175048828, -13.42779541015625, -4.9994964599609375, 3.428804397583008, 11.857105255126953, 20.2854061126709, 28.713706970214844, 37.142005920410156, 45.570308685302734, 53.99861145019531, 62.426910400390625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 5.0, 6.0, 3.0, 7.0, 3.0, 4.0, 7.0, 8.0, 13.0, 5.0, 13.0, 14.0, 8.0, 15.0, 21.0, 26.0, 17.0, 15.0, 31.0, 39.0, 33.0, 29.0, 37.0, 34.0, 36.0, 31.0, 45.0, 34.0, 41.0, 60.0, 45.0, 28.0, 31.0, 28.0, 14.0, 29.0, 32.0, 24.0, 18.0, 19.0, 13.0, 14.0, 14.0, 4.0, 10.0, 9.0, 3.0, 3.0, 7.0, 6.0, 1.0, 6.0, 2.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-34.54085922241211, -33.45721435546875, -32.37356948852539, -31.289926528930664, -30.206283569335938, -29.122638702392578, -28.03899383544922, -26.95534896850586, -25.871706008911133, -24.788061141967773, -23.704418182373047, -22.620773315429688, -21.537128448486328, -20.4534854888916, -19.369840621948242, -18.286197662353516, -17.202552795410156, -16.118907928466797, -15.03526496887207, -13.951620101928711, -12.867976188659668, -11.784332275390625, -10.700687408447266, -9.617043495178223, -8.53339958190918, -7.449755668640137, -6.3661112785339355, -5.282466888427734, -4.198822975158691, -3.1151790618896484, -2.0315346717834473, -0.9478902816772461, 0.13575363159179688, 1.219397783279419, 2.303041934967041, 3.386686086654663, 4.470330238342285, 5.553974151611328, 6.637618541717529, 7.7212629318237305, 8.804906845092773, 9.888550758361816, 10.97219467163086, 12.055839538574219, 13.139483451843262, 14.223127365112305, 15.306772232055664, 16.39041519165039, 17.47406005859375, 18.55770492553711, 19.641347885131836, 20.724992752075195, 21.808635711669922, 22.89228057861328, 23.97592544555664, 25.0595703125, 26.143213272094727, 27.226858139038086, 28.310501098632812, 29.394145965576172, 30.47779083251953, 31.561433792114258, 32.645076751708984, 33.728721618652344, 34.8123664855957]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 1.0, 3.0, 12.0, 8.0, 4.0, 4.0, 9.0, 7.0, 18.0, 19.0, 21.0, 25.0, 22.0, 22.0, 30.0, 31.0, 31.0, 51.0, 31.0, 34.0, 40.0, 60.0, 46.0, 47.0, 39.0, 34.0, 32.0, 36.0, 44.0, 41.0, 35.0, 23.0, 11.0, 21.0, 21.0, 15.0, 11.0, 14.0, 8.0, 8.0, 5.0, 5.0, 5.0, 8.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-8.5, -8.25909423828125, -8.0181884765625, -7.77728271484375, -7.536376953125, -7.29547119140625, -7.0545654296875, -6.81365966796875, -6.57275390625, -6.33184814453125, -6.0909423828125, -5.85003662109375, -5.609130859375, -5.36822509765625, -5.1273193359375, -4.88641357421875, -4.6455078125, -4.40460205078125, -4.1636962890625, -3.92279052734375, -3.681884765625, -3.44097900390625, -3.2000732421875, -2.95916748046875, -2.71826171875, -2.47735595703125, -2.2364501953125, -1.99554443359375, -1.754638671875, -1.51373291015625, -1.2728271484375, -1.03192138671875, -0.791015625, -0.55010986328125, -0.3092041015625, -0.06829833984375, 0.172607421875, 0.41351318359375, 0.6544189453125, 0.89532470703125, 1.13623046875, 1.37713623046875, 1.6180419921875, 1.85894775390625, 2.099853515625, 2.34075927734375, 2.5816650390625, 2.82257080078125, 3.0634765625, 3.30438232421875, 3.5452880859375, 3.78619384765625, 4.027099609375, 4.26800537109375, 4.5089111328125, 4.74981689453125, 4.99072265625, 5.23162841796875, 5.4725341796875, 5.71343994140625, 5.954345703125, 6.19525146484375, 6.4361572265625, 6.67706298828125, 6.91796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 5.0, 12.0, 19.0, 19.0, 34.0, 42.0, 82.0, 127.0, 178.0, 309.0, 517.0, 873.0, 1403.0, 2385.0, 3776.0, 6202.0, 10155.0, 16438.0, 26501.0, 41962.0, 63771.0, 91934.0, 124251.0, 146372.0, 143995.0, 117965.0, 87126.0, 59404.0, 39148.0, 24366.0, 15366.0, 9294.0, 5706.0, 3438.0, 2081.0, 1233.0, 783.0, 495.0, 311.0, 179.0, 99.0, 71.0, 42.0, 33.0, 18.0, 8.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.71484375, -0.69244384765625, -0.6700439453125, -0.64764404296875, -0.625244140625, -0.60284423828125, -0.5804443359375, -0.55804443359375, -0.53564453125, -0.51324462890625, -0.4908447265625, -0.46844482421875, -0.446044921875, -0.42364501953125, -0.4012451171875, -0.37884521484375, -0.3564453125, -0.33404541015625, -0.3116455078125, -0.28924560546875, -0.266845703125, -0.24444580078125, -0.2220458984375, -0.19964599609375, -0.17724609375, -0.15484619140625, -0.1324462890625, -0.11004638671875, -0.087646484375, -0.06524658203125, -0.0428466796875, -0.02044677734375, 0.001953125, 0.02435302734375, 0.0467529296875, 0.06915283203125, 0.091552734375, 0.11395263671875, 0.1363525390625, 0.15875244140625, 0.18115234375, 0.20355224609375, 0.2259521484375, 0.24835205078125, 0.270751953125, 0.29315185546875, 0.3155517578125, 0.33795166015625, 0.3603515625, 0.38275146484375, 0.4051513671875, 0.42755126953125, 0.449951171875, 0.47235107421875, 0.4947509765625, 0.51715087890625, 0.53955078125, 0.56195068359375, 0.5843505859375, 0.60675048828125, 0.629150390625, 0.65155029296875, 0.6739501953125, 0.69635009765625, 0.71875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 10.0, 8.0, 9.0, 12.0, 22.0, 25.0, 15.0, 29.0, 35.0, 31.0, 32.0, 40.0, 36.0, 34.0, 44.0, 49.0, 36.0, 38.0, 1060.0, 41.0, 33.0, 41.0, 39.0, 43.0, 22.0, 31.0, 24.0, 25.0, 19.0, 14.0, 14.0, 16.0, 10.0, 11.0, 14.0, 8.0, 7.0, 9.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.203125, -5.03717041015625, -4.8712158203125, -4.70526123046875, -4.539306640625, -4.37335205078125, -4.2073974609375, -4.04144287109375, -3.87548828125, -3.70953369140625, -3.5435791015625, -3.37762451171875, -3.211669921875, -3.04571533203125, -2.8797607421875, -2.71380615234375, -2.5478515625, -2.38189697265625, -2.2159423828125, -2.04998779296875, -1.884033203125, -1.71807861328125, -1.5521240234375, -1.38616943359375, -1.22021484375, -1.05426025390625, -0.8883056640625, -0.72235107421875, -0.556396484375, -0.39044189453125, -0.2244873046875, -0.05853271484375, 0.107421875, 0.27337646484375, 0.4393310546875, 0.60528564453125, 0.771240234375, 0.93719482421875, 1.1031494140625, 1.26910400390625, 1.43505859375, 1.60101318359375, 1.7669677734375, 1.93292236328125, 2.098876953125, 2.26483154296875, 2.4307861328125, 2.59674072265625, 2.7626953125, 2.92864990234375, 3.0946044921875, 3.26055908203125, 3.426513671875, 3.59246826171875, 3.7584228515625, 3.92437744140625, 4.09033203125, 4.25628662109375, 4.4222412109375, 4.58819580078125, 4.754150390625, 4.92010498046875, 5.0860595703125, 5.25201416015625, 5.41796875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 12.0, 27.0, 40.0, 61.0, 86.0, 117.0, 199.0, 293.0, 431.0, 575.0, 972.0, 1501.0, 2044.0, 3223.0, 4689.0, 6996.0, 10582.0, 15184.0, 22340.0, 32718.0, 46312.0, 63267.0, 83755.0, 104089.0, 413425.0, 870660.0, 106416.0, 86141.0, 66210.0, 47947.0, 34203.0, 23290.0, 16056.0, 10884.0, 7417.0, 4902.0, 3360.0, 2210.0, 1510.0, 999.0, 670.0, 466.0, 283.0, 175.0, 151.0, 81.0, 56.0, 36.0, 19.0, 23.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0], "bins": [-0.371826171875, -0.3602294921875, -0.3486328125, -0.3370361328125, -0.325439453125, -0.3138427734375, -0.30224609375, -0.2906494140625, -0.279052734375, -0.2674560546875, -0.255859375, -0.2442626953125, -0.232666015625, -0.2210693359375, -0.20947265625, -0.1978759765625, -0.186279296875, -0.1746826171875, -0.1630859375, -0.1514892578125, -0.139892578125, -0.1282958984375, -0.11669921875, -0.1051025390625, -0.093505859375, -0.0819091796875, -0.0703125, -0.0587158203125, -0.047119140625, -0.0355224609375, -0.02392578125, -0.0123291015625, -0.000732421875, 0.0108642578125, 0.0224609375, 0.0340576171875, 0.045654296875, 0.0572509765625, 0.06884765625, 0.0804443359375, 0.092041015625, 0.1036376953125, 0.115234375, 0.1268310546875, 0.138427734375, 0.1500244140625, 0.16162109375, 0.1732177734375, 0.184814453125, 0.1964111328125, 0.2080078125, 0.2196044921875, 0.231201171875, 0.2427978515625, 0.25439453125, 0.2659912109375, 0.277587890625, 0.2891845703125, 0.30078125, 0.3123779296875, 0.323974609375, 0.3355712890625, 0.34716796875, 0.3587646484375, 0.370361328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 9.0, 8.0, 17.0, 14.0, 29.0, 25.0, 45.0, 44.0, 53.0, 53.0, 90.0, 75.0, 84.0, 74.0, 78.0, 66.0, 46.0, 27.0, 24.0, 22.0, 23.0, 16.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0350341796875, -0.03401446342468262, -0.032994747161865234, -0.03197503089904785, -0.03095531463623047, -0.029935598373413086, -0.028915882110595703, -0.02789616584777832, -0.026876449584960938, -0.025856733322143555, -0.024837017059326172, -0.02381730079650879, -0.022797584533691406, -0.021777868270874023, -0.02075815200805664, -0.019738435745239258, -0.018718719482421875, -0.017699003219604492, -0.01667928695678711, -0.015659570693969727, -0.014639854431152344, -0.013620138168334961, -0.012600421905517578, -0.011580705642700195, -0.010560989379882812, -0.00954127311706543, -0.008521556854248047, -0.007501840591430664, -0.006482124328613281, -0.0054624080657958984, -0.004442691802978516, -0.003422975540161133, -0.00240325927734375, -0.0013835430145263672, -0.0003638267517089844, 0.0006558895111083984, 0.0016756057739257812, 0.002695322036743164, 0.003715038299560547, 0.00473475456237793, 0.0057544708251953125, 0.006774187088012695, 0.007793903350830078, 0.008813619613647461, 0.009833335876464844, 0.010853052139282227, 0.01187276840209961, 0.012892484664916992, 0.013912200927734375, 0.014931917190551758, 0.01595163345336914, 0.016971349716186523, 0.017991065979003906, 0.01901078224182129, 0.020030498504638672, 0.021050214767456055, 0.022069931030273438, 0.02308964729309082, 0.024109363555908203, 0.025129079818725586, 0.02614879608154297, 0.02716851234436035, 0.028188228607177734, 0.029207944869995117, 0.0302276611328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 15.0, 24.0, 33.0, 47.0, 64.0, 64.0, 134.0, 241.0, 619.0, 9050.0, 1035138.0, 1976.0, 417.0, 248.0, 119.0, 81.0, 68.0, 43.0, 31.0, 23.0, 19.0, 15.0, 6.0, 7.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6747665405273438, -0.6517791748046875, -0.6287918090820312, -0.605804443359375, -0.5828170776367188, -0.5598297119140625, -0.5368423461914062, -0.51385498046875, -0.49086761474609375, -0.4678802490234375, -0.44489288330078125, -0.421905517578125, -0.39891815185546875, -0.3759307861328125, -0.35294342041015625, -0.3299560546875, -0.30696868896484375, -0.2839813232421875, -0.26099395751953125, -0.238006591796875, -0.21501922607421875, -0.1920318603515625, -0.16904449462890625, -0.14605712890625, -0.12306976318359375, -0.1000823974609375, -0.07709503173828125, -0.054107666015625, -0.03112030029296875, -0.0081329345703125, 0.01485443115234375, 0.037841796875, 0.06082916259765625, 0.0838165283203125, 0.10680389404296875, 0.129791259765625, 0.15277862548828125, 0.1757659912109375, 0.19875335693359375, 0.22174072265625, 0.24472808837890625, 0.2677154541015625, 0.29070281982421875, 0.313690185546875, 0.33667755126953125, 0.3596649169921875, 0.38265228271484375, 0.4056396484375, 0.42862701416015625, 0.4516143798828125, 0.47460174560546875, 0.497589111328125, 0.5205764770507812, 0.5435638427734375, 0.5665512084960938, 0.58953857421875, 0.6125259399414062, 0.6355133056640625, 0.6585006713867188, 0.681488037109375, 0.7044754028320312, 0.7274627685546875, 0.7504501342773438, 0.7734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 138.0, 718.0, 113.0, 26.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4119504392147064, -0.40395405888557434, -0.3959576487541199, -0.3879612684249878, -0.3799648582935333, -0.37196847796440125, -0.3639720678329468, -0.3559756875038147, -0.3479793071746826, -0.33998292684555054, -0.33198651671409607, -0.323990136384964, -0.3159937262535095, -0.30799734592437744, -0.30000096559524536, -0.2920045554637909, -0.2840081453323364, -0.27601176500320435, -0.2680153548717499, -0.2600189745426178, -0.25202256441116333, -0.24402618408203125, -0.23602978885173798, -0.2280333936214447, -0.22003701329231262, -0.21204061806201935, -0.20404422283172607, -0.196047842502594, -0.18805144727230072, -0.18005505204200745, -0.17205865681171417, -0.1640622615814209, -0.15606586635112762, -0.14806947112083435, -0.14007307589054108, -0.1320766806602478, -0.12408030033111572, -0.11608390510082245, -0.10808750987052917, -0.1000911146402359, -0.09209472686052322, -0.08409833163022995, -0.07610194385051727, -0.068105548620224, -0.060109157115221024, -0.05211276561021805, -0.044116370379924774, -0.0361199788749218, -0.028123587369918823, -0.020127195864915848, -0.012130802497267723, -0.004134409129619598, 0.003861982375383377, 0.011858373880386353, 0.019854769110679626, 0.027851160615682602, 0.03584755212068558, 0.04384394362568855, 0.05184033513069153, 0.0598367303609848, 0.06783312559127808, 0.07582951337099075, 0.08382590860128403, 0.0918222963809967, 0.09981869161128998]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 9.0, 13.0, 12.0, 12.0, 13.0, 20.0, 22.0, 26.0, 17.0, 34.0, 26.0, 39.0, 41.0, 37.0, 47.0, 48.0, 46.0, 69.0, 42.0, 46.0, 21.0, 43.0, 43.0, 33.0, 38.0, 31.0, 21.0, 23.0, 21.0, 8.0, 18.0, 11.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05651211738586426, -0.05446071922779083, -0.05240932106971741, -0.05035792291164398, -0.04830652475357056, -0.04625512659549713, -0.044203728437423706, -0.04215233027935028, -0.040100932121276855, -0.03804953396320343, -0.035998135805130005, -0.03394673764705658, -0.031895339488983154, -0.02984394133090973, -0.027792543172836304, -0.02574114501476288, -0.023689746856689453, -0.021638348698616028, -0.019586950540542603, -0.017535552382469177, -0.015484154224395752, -0.013432756066322327, -0.011381357908248901, -0.009329959750175476, -0.007278561592102051, -0.0052271634340286255, -0.0031757652759552, -0.001124367117881775, 0.0009270310401916504, 0.0029784291982650757, 0.005029827356338501, 0.007081225514411926, 0.009132623672485352, 0.011184021830558777, 0.013235419988632202, 0.015286818146705627, 0.017338216304779053, 0.019389614462852478, 0.021441012620925903, 0.02349241077899933, 0.025543808937072754, 0.02759520709514618, 0.029646605253219604, 0.03169800341129303, 0.033749401569366455, 0.03580079972743988, 0.037852197885513306, 0.03990359604358673, 0.041954994201660156, 0.04400639235973358, 0.04605779051780701, 0.04810918867588043, 0.05016058683395386, 0.05221198499202728, 0.05426338315010071, 0.05631478130817413, 0.05836617946624756, 0.060417577624320984, 0.06246897578239441, 0.06452037394046783, 0.06657177209854126, 0.06862317025661469, 0.07067456841468811, 0.07272596657276154, 0.07477736473083496]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 3.0, 6.0, 7.0, 5.0, 13.0, 13.0, 12.0, 12.0, 13.0, 17.0, 22.0, 20.0, 20.0, 36.0, 27.0, 32.0, 43.0, 42.0, 40.0, 50.0, 44.0, 48.0, 39.0, 45.0, 30.0, 42.0, 39.0, 43.0, 31.0, 29.0, 27.0, 18.0, 15.0, 18.0, 18.0, 14.0, 6.0, 8.0, 10.0, 7.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.71875, -7.47955322265625, -7.2403564453125, -7.00115966796875, -6.761962890625, -6.52276611328125, -6.2835693359375, -6.04437255859375, -5.80517578125, -5.56597900390625, -5.3267822265625, -5.08758544921875, -4.848388671875, -4.60919189453125, -4.3699951171875, -4.13079833984375, -3.8916015625, -3.65240478515625, -3.4132080078125, -3.17401123046875, -2.934814453125, -2.69561767578125, -2.4564208984375, -2.21722412109375, -1.97802734375, -1.73883056640625, -1.4996337890625, -1.26043701171875, -1.021240234375, -0.78204345703125, -0.5428466796875, -0.30364990234375, -0.064453125, 0.17474365234375, 0.4139404296875, 0.65313720703125, 0.892333984375, 1.13153076171875, 1.3707275390625, 1.60992431640625, 1.84912109375, 2.08831787109375, 2.3275146484375, 2.56671142578125, 2.805908203125, 3.04510498046875, 3.2843017578125, 3.52349853515625, 3.7626953125, 4.00189208984375, 4.2410888671875, 4.48028564453125, 4.719482421875, 4.95867919921875, 5.1978759765625, 5.43707275390625, 5.67626953125, 5.91546630859375, 6.1546630859375, 6.39385986328125, 6.633056640625, 6.87225341796875, 7.1114501953125, 7.35064697265625, 7.58984375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 11.0, 19.0, 38.0, 52.0, 90.0, 152.0, 250.0, 429.0, 797.0, 1494.0, 2966.0, 5891.0, 11731.0, 23915.0, 49196.0, 106672.0, 251048.0, 316961.0, 148635.0, 65948.0, 31120.0, 15331.0, 7639.0, 3842.0, 1912.0, 1022.0, 596.0, 331.0, 170.0, 114.0, 65.0, 46.0, 20.0, 13.0, 5.0, 10.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.6690673828125, -8.361572265625, -8.0540771484375, -7.74658203125, -7.4390869140625, -7.131591796875, -6.8240966796875, -6.5166015625, -6.2091064453125, -5.901611328125, -5.5941162109375, -5.28662109375, -4.9791259765625, -4.671630859375, -4.3641357421875, -4.056640625, -3.7491455078125, -3.441650390625, -3.1341552734375, -2.82666015625, -2.5191650390625, -2.211669921875, -1.9041748046875, -1.5966796875, -1.2891845703125, -0.981689453125, -0.6741943359375, -0.36669921875, -0.0592041015625, 0.248291015625, 0.5557861328125, 0.86328125, 1.1707763671875, 1.478271484375, 1.7857666015625, 2.09326171875, 2.4007568359375, 2.708251953125, 3.0157470703125, 3.3232421875, 3.6307373046875, 3.938232421875, 4.2457275390625, 4.55322265625, 4.8607177734375, 5.168212890625, 5.4757080078125, 5.783203125, 6.0906982421875, 6.398193359375, 6.7056884765625, 7.01318359375, 7.3206787109375, 7.628173828125, 7.9356689453125, 8.2431640625, 8.5506591796875, 8.858154296875, 9.1656494140625, 9.47314453125, 9.7806396484375, 10.088134765625, 10.3956298828125, 10.703125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 13.0, 12.0, 7.0, 12.0, 15.0, 17.0, 17.0, 22.0, 23.0, 22.0, 24.0, 36.0, 31.0, 47.0, 42.0, 55.0, 97.0, 158.0, 279.0, 1360.0, 188.0, 99.0, 80.0, 57.0, 41.0, 42.0, 34.0, 29.0, 24.0, 20.0, 22.0, 17.0, 13.0, 16.0, 16.0, 8.0, 8.0, 8.0, 3.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.484375, -18.878662109375, -18.27294921875, -17.667236328125, -17.0615234375, -16.455810546875, -15.85009765625, -15.244384765625, -14.638671875, -14.032958984375, -13.42724609375, -12.821533203125, -12.2158203125, -11.610107421875, -11.00439453125, -10.398681640625, -9.79296875, -9.187255859375, -8.58154296875, -7.975830078125, -7.3701171875, -6.764404296875, -6.15869140625, -5.552978515625, -4.947265625, -4.341552734375, -3.73583984375, -3.130126953125, -2.5244140625, -1.918701171875, -1.31298828125, -0.707275390625, -0.1015625, 0.504150390625, 1.10986328125, 1.715576171875, 2.3212890625, 2.927001953125, 3.53271484375, 4.138427734375, 4.744140625, 5.349853515625, 5.95556640625, 6.561279296875, 7.1669921875, 7.772705078125, 8.37841796875, 8.984130859375, 9.58984375, 10.195556640625, 10.80126953125, 11.406982421875, 12.0126953125, 12.618408203125, 13.22412109375, 13.829833984375, 14.435546875, 15.041259765625, 15.64697265625, 16.252685546875, 16.8583984375, 17.464111328125, 18.06982421875, 18.675537109375, 19.28125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 11.0, 10.0, 12.0, 15.0, 14.0, 24.0, 38.0, 48.0, 87.0, 148.0, 250.0, 457.0, 1051.0, 6898.0, 115111.0, 2786874.0, 221055.0, 10967.0, 1406.0, 518.0, 255.0, 151.0, 102.0, 68.0, 45.0, 33.0, 18.0, 5.0, 14.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.5234375, -32.390625, -31.2578125, -30.125, -28.9921875, -27.859375, -26.7265625, -25.59375, -24.4609375, -23.328125, -22.1953125, -21.0625, -19.9296875, -18.796875, -17.6640625, -16.53125, -15.3984375, -14.265625, -13.1328125, -12.0, -10.8671875, -9.734375, -8.6015625, -7.46875, -6.3359375, -5.203125, -4.0703125, -2.9375, -1.8046875, -0.671875, 0.4609375, 1.59375, 2.7265625, 3.859375, 4.9921875, 6.125, 7.2578125, 8.390625, 9.5234375, 10.65625, 11.7890625, 12.921875, 14.0546875, 15.1875, 16.3203125, 17.453125, 18.5859375, 19.71875, 20.8515625, 21.984375, 23.1171875, 24.25, 25.3828125, 26.515625, 27.6484375, 28.78125, 29.9140625, 31.046875, 32.1796875, 33.3125, 34.4453125, 35.578125, 36.7109375, 37.84375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 37.0, 58.0, 123.0, 182.0, 204.0, 172.0, 116.0, 56.0, 37.0, 12.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.272377014160156, -43.33911895751953, -41.40585708618164, -39.472599029541016, -37.53934097290039, -35.6060791015625, -33.672821044921875, -31.73956298828125, -29.806303024291992, -27.873043060302734, -25.93978500366211, -24.00652503967285, -22.073265075683594, -20.14000701904297, -18.20674705505371, -16.273487091064453, -14.340229034423828, -12.406970024108887, -10.473711013793945, -8.540451049804688, -6.607192039489746, -4.673933029174805, -2.740673065185547, -0.8074140548706055, 1.125844955444336, 3.0591042041778564, 4.992363452911377, 6.925622940063477, 8.858881950378418, 10.79214096069336, 12.725400924682617, 14.658659934997559, 16.5919189453125, 18.525178909301758, 20.458436965942383, 22.39169692993164, 24.324954986572266, 26.258214950561523, 28.19147491455078, 30.124732971191406, 32.05799102783203, 33.991249084472656, 35.92451095581055, 37.85776901245117, 39.7910270690918, 41.72428894042969, 43.65754699707031, 45.59080505371094, 47.52406692504883, 49.45732498168945, 51.390586853027344, 53.32384490966797, 55.257102966308594, 57.19036102294922, 59.12362289428711, 61.056880950927734, 62.990142822265625, 64.92340087890625, 66.85665893554688, 68.7899169921875, 70.72318267822266, 72.65644073486328, 74.5896987915039, 76.52295684814453, 78.45621490478516]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 2.0, 11.0, 4.0, 9.0, 5.0, 8.0, 14.0, 13.0, 19.0, 25.0, 18.0, 30.0, 16.0, 27.0, 50.0, 41.0, 27.0, 38.0, 31.0, 39.0, 45.0, 42.0, 30.0, 44.0, 42.0, 39.0, 45.0, 31.0, 32.0, 39.0, 26.0, 19.0, 21.0, 17.0, 21.0, 12.0, 13.0, 9.0, 8.0, 7.0, 6.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.930152893066406, -46.48430252075195, -45.038448333740234, -43.59259796142578, -42.14674758911133, -40.700897216796875, -39.255043029785156, -37.8091926574707, -36.36334228515625, -34.9174919128418, -33.47163772583008, -32.025787353515625, -30.579936981201172, -29.134084701538086, -27.688232421875, -26.242382049560547, -24.79652976989746, -23.350677490234375, -21.904827117919922, -20.458974838256836, -19.013124465942383, -17.567272186279297, -16.121421813964844, -14.675569534301758, -13.229718208312988, -11.783866882324219, -10.33801555633545, -8.89216423034668, -7.446312427520752, -6.000461101531982, -4.554609298706055, -3.108757972717285, -1.6629066467285156, -0.21705520153045654, 1.2287962436676025, 2.674647808074951, 4.120499134063721, 5.56635046005249, 7.012202262878418, 8.458053588867188, 9.903904914855957, 11.349756240844727, 12.795607566833496, 14.241458892822266, 15.687311172485352, 17.133161544799805, 18.57901382446289, 20.024864196777344, 21.47071647644043, 22.916568756103516, 24.36241912841797, 25.808271408081055, 27.254121780395508, 28.699974060058594, 30.145824432373047, 31.591676712036133, 33.03752899169922, 34.48337936401367, 35.92923355102539, 37.375083923339844, 38.8209342956543, 40.26678466796875, 41.71263885498047, 43.15848922729492, 44.604339599609375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 4.0, 8.0, 2.0, 9.0, 16.0, 16.0, 19.0, 26.0, 18.0, 20.0, 28.0, 26.0, 33.0, 33.0, 46.0, 43.0, 52.0, 59.0, 36.0, 30.0, 48.0, 43.0, 30.0, 53.0, 31.0, 38.0, 28.0, 32.0, 28.0, 14.0, 16.0, 20.0, 12.0, 14.0, 9.0, 5.0, 10.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.453125, -8.19940185546875, -7.9456787109375, -7.69195556640625, -7.438232421875, -7.18450927734375, -6.9307861328125, -6.67706298828125, -6.42333984375, -6.16961669921875, -5.9158935546875, -5.66217041015625, -5.408447265625, -5.15472412109375, -4.9010009765625, -4.64727783203125, -4.3935546875, -4.13983154296875, -3.8861083984375, -3.63238525390625, -3.378662109375, -3.12493896484375, -2.8712158203125, -2.61749267578125, -2.36376953125, -2.11004638671875, -1.8563232421875, -1.60260009765625, -1.348876953125, -1.09515380859375, -0.8414306640625, -0.58770751953125, -0.333984375, -0.08026123046875, 0.1734619140625, 0.42718505859375, 0.680908203125, 0.93463134765625, 1.1883544921875, 1.44207763671875, 1.69580078125, 1.94952392578125, 2.2032470703125, 2.45697021484375, 2.710693359375, 2.96441650390625, 3.2181396484375, 3.47186279296875, 3.7255859375, 3.97930908203125, 4.2330322265625, 4.48675537109375, 4.740478515625, 4.99420166015625, 5.2479248046875, 5.50164794921875, 5.75537109375, 6.00909423828125, 6.2628173828125, 6.51654052734375, 6.770263671875, 7.02398681640625, 7.2777099609375, 7.53143310546875, 7.78515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 10.0, 5.0, 12.0, 16.0, 17.0, 33.0, 22.0, 35.0, 48.0, 62.0, 72.0, 74.0, 108.0, 201.0, 440.0, 3491.0, 1348303.0, 2833314.0, 6748.0, 497.0, 217.0, 109.0, 92.0, 65.0, 45.0, 50.0, 39.0, 25.0, 30.0, 24.0, 17.0, 11.0, 7.0, 5.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.03125, -56.328125, -54.625, -52.921875, -51.21875, -49.515625, -47.8125, -46.109375, -44.40625, -42.703125, -41.0, -39.296875, -37.59375, -35.890625, -34.1875, -32.484375, -30.78125, -29.078125, -27.375, -25.671875, -23.96875, -22.265625, -20.5625, -18.859375, -17.15625, -15.453125, -13.75, -12.046875, -10.34375, -8.640625, -6.9375, -5.234375, -3.53125, -1.828125, -0.125, 1.578125, 3.28125, 4.984375, 6.6875, 8.390625, 10.09375, 11.796875, 13.5, 15.203125, 16.90625, 18.609375, 20.3125, 22.015625, 23.71875, 25.421875, 27.125, 28.828125, 30.53125, 32.234375, 33.9375, 35.640625, 37.34375, 39.046875, 40.75, 42.453125, 44.15625, 45.859375, 47.5625, 49.265625, 50.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 7.0, 7.0, 16.0, 11.0, 15.0, 12.0, 17.0, 50.0, 56.0, 59.0, 97.0, 124.0, 160.0, 248.0, 293.0, 413.0, 450.0, 474.0, 373.0, 316.0, 215.0, 172.0, 139.0, 84.0, 68.0, 39.0, 55.0, 19.0, 25.0, 16.0, 7.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.2117919921875, -7.868896484375, -7.5260009765625, -7.18310546875, -6.8402099609375, -6.497314453125, -6.1544189453125, -5.8115234375, -5.4686279296875, -5.125732421875, -4.7828369140625, -4.43994140625, -4.0970458984375, -3.754150390625, -3.4112548828125, -3.068359375, -2.7254638671875, -2.382568359375, -2.0396728515625, -1.69677734375, -1.3538818359375, -1.010986328125, -0.6680908203125, -0.3251953125, 0.0177001953125, 0.360595703125, 0.7034912109375, 1.04638671875, 1.3892822265625, 1.732177734375, 2.0750732421875, 2.41796875, 2.7608642578125, 3.103759765625, 3.4466552734375, 3.78955078125, 4.1324462890625, 4.475341796875, 4.8182373046875, 5.1611328125, 5.5040283203125, 5.846923828125, 6.1898193359375, 6.53271484375, 6.8756103515625, 7.218505859375, 7.5614013671875, 7.904296875, 8.2471923828125, 8.590087890625, 8.9329833984375, 9.27587890625, 9.6187744140625, 9.961669921875, 10.3045654296875, 10.6474609375, 10.9903564453125, 11.333251953125, 11.6761474609375, 12.01904296875, 12.3619384765625, 12.704833984375, 13.0477294921875, 13.390625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 4.0, 11.0, 30.0, 29.0, 21.0, 49.0, 77.0, 145.0, 402.0, 2103.0, 62504.0, 3794643.0, 327744.0, 5336.0, 631.0, 206.0, 91.0, 62.0, 31.0, 26.0, 19.0, 13.0, 18.0, 15.0, 5.0, 8.0, 3.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.1875, -46.6162109375, -45.044921875, -43.4736328125, -41.90234375, -40.3310546875, -38.759765625, -37.1884765625, -35.6171875, -34.0458984375, -32.474609375, -30.9033203125, -29.33203125, -27.7607421875, -26.189453125, -24.6181640625, -23.046875, -21.4755859375, -19.904296875, -18.3330078125, -16.76171875, -15.1904296875, -13.619140625, -12.0478515625, -10.4765625, -8.9052734375, -7.333984375, -5.7626953125, -4.19140625, -2.6201171875, -1.048828125, 0.5224609375, 2.09375, 3.6650390625, 5.236328125, 6.8076171875, 8.37890625, 9.9501953125, 11.521484375, 13.0927734375, 14.6640625, 16.2353515625, 17.806640625, 19.3779296875, 20.94921875, 22.5205078125, 24.091796875, 25.6630859375, 27.234375, 28.8056640625, 30.376953125, 31.9482421875, 33.51953125, 35.0908203125, 36.662109375, 38.2333984375, 39.8046875, 41.3759765625, 42.947265625, 44.5185546875, 46.08984375, 47.6611328125, 49.232421875, 50.8037109375, 52.375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 51.0, 505.0, 429.0, 31.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-478.3664855957031, -468.5836181640625, -458.80072021484375, -449.017822265625, -439.2349548339844, -429.45208740234375, -419.669189453125, -409.88629150390625, -400.1034240722656, -390.320556640625, -380.53765869140625, -370.7547607421875, -360.9718933105469, -351.18902587890625, -341.4061279296875, -331.62322998046875, -321.8403625488281, -312.0574951171875, -302.27459716796875, -292.49169921875, -282.7088317871094, -272.92596435546875, -263.14306640625, -253.3601837158203, -243.57730102539062, -233.79441833496094, -224.01153564453125, -214.22865295410156, -204.44577026367188, -194.6628875732422, -184.8800048828125, -175.0971221923828, -165.31423950195312, -155.53135681152344, -145.74847412109375, -135.96559143066406, -126.18270874023438, -116.39982604980469, -106.616943359375, -96.83406066894531, -87.05117797851562, -77.26829528808594, -67.48541259765625, -57.70252990722656, -47.919647216796875, -38.13676452636719, -28.3538818359375, -18.570999145507812, -8.788116455078125, 0.9947662353515625, 10.77764892578125, 20.560531616210938, 30.343414306640625, 40.12629699707031, 49.9091796875, 59.69206237792969, 69.47494506835938, 79.25782775878906, 89.04071044921875, 98.82359313964844, 108.60647583007812, 118.38935852050781, 128.1722412109375, 137.9551239013672, 147.73800659179688]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 4.0, 1.0, 7.0, 9.0, 8.0, 19.0, 21.0, 23.0, 23.0, 33.0, 16.0, 21.0, 33.0, 38.0, 33.0, 40.0, 38.0, 40.0, 42.0, 47.0, 53.0, 46.0, 38.0, 37.0, 37.0, 35.0, 28.0, 28.0, 19.0, 21.0, 23.0, 24.0, 24.0, 22.0, 15.0, 13.0, 12.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-41.50874328613281, -40.334983825683594, -39.161224365234375, -37.987464904785156, -36.81370544433594, -35.63994598388672, -34.4661865234375, -33.29242706298828, -32.11866760253906, -30.944908142089844, -29.771148681640625, -28.597389221191406, -27.423629760742188, -26.24987030029297, -25.076112747192383, -23.902353286743164, -22.728595733642578, -21.55483627319336, -20.38107681274414, -19.207317352294922, -18.033557891845703, -16.859798431396484, -15.686040878295898, -14.51228141784668, -13.338521957397461, -12.164762496948242, -10.991003036499023, -9.817244529724121, -8.643485069274902, -7.469725608825684, -6.295966625213623, -5.1222076416015625, -3.948444366455078, -2.7746851444244385, -1.6009259223937988, -0.4271667003631592, 0.7465925216674805, 1.9203519821166992, 3.0941109657287598, 4.26786994934082, 5.441629409790039, 6.615388870239258, 7.789147853851318, 8.962906837463379, 10.136666297912598, 11.310425758361816, 12.484184265136719, 13.657943725585938, 14.831703186035156, 16.005462646484375, 17.179222106933594, 18.352981567382812, 19.52674102783203, 20.70050048828125, 21.874258041381836, 23.048017501831055, 24.221776962280273, 25.395536422729492, 26.56929588317871, 27.74305534362793, 28.916812896728516, 30.090572357177734, 31.264331817626953, 32.43809127807617, 33.61185073852539]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 6.0, 4.0, 2.0, 12.0, 8.0, 14.0, 14.0, 19.0, 19.0, 25.0, 25.0, 32.0, 35.0, 27.0, 33.0, 37.0, 36.0, 46.0, 43.0, 33.0, 41.0, 40.0, 44.0, 33.0, 44.0, 33.0, 33.0, 29.0, 32.0, 27.0, 20.0, 23.0, 14.0, 20.0, 19.0, 17.0, 5.0, 9.0, 7.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.609375, -7.3665771484375, -7.123779296875, -6.8809814453125, -6.63818359375, -6.3953857421875, -6.152587890625, -5.9097900390625, -5.6669921875, -5.4241943359375, -5.181396484375, -4.9385986328125, -4.69580078125, -4.4530029296875, -4.210205078125, -3.9674072265625, -3.724609375, -3.4818115234375, -3.239013671875, -2.9962158203125, -2.75341796875, -2.5106201171875, -2.267822265625, -2.0250244140625, -1.7822265625, -1.5394287109375, -1.296630859375, -1.0538330078125, -0.81103515625, -0.5682373046875, -0.325439453125, -0.0826416015625, 0.16015625, 0.4029541015625, 0.645751953125, 0.8885498046875, 1.13134765625, 1.3741455078125, 1.616943359375, 1.8597412109375, 2.1025390625, 2.3453369140625, 2.588134765625, 2.8309326171875, 3.07373046875, 3.3165283203125, 3.559326171875, 3.8021240234375, 4.044921875, 4.2877197265625, 4.530517578125, 4.7733154296875, 5.01611328125, 5.2589111328125, 5.501708984375, 5.7445068359375, 5.9873046875, 6.2301025390625, 6.472900390625, 6.7156982421875, 6.95849609375, 7.2012939453125, 7.444091796875, 7.6868896484375, 7.9296875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 10.0, 19.0, 20.0, 51.0, 75.0, 119.0, 174.0, 290.0, 514.0, 843.0, 1275.0, 2247.0, 3849.0, 6387.0, 10714.0, 18524.0, 30564.0, 50934.0, 80263.0, 119010.0, 153596.0, 163456.0, 139457.0, 99761.0, 65782.0, 40865.0, 24272.0, 14361.0, 8568.0, 5102.0, 2971.0, 1774.0, 1080.0, 600.0, 408.0, 234.0, 147.0, 76.0, 53.0, 34.0, 19.0, 18.0, 18.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.8016433715820312, -0.7751617431640625, -0.7486801147460938, -0.722198486328125, -0.6957168579101562, -0.6692352294921875, -0.6427536010742188, -0.61627197265625, -0.5897903442382812, -0.5633087158203125, -0.5368270874023438, -0.510345458984375, -0.48386383056640625, -0.4573822021484375, -0.43090057373046875, -0.4044189453125, -0.37793731689453125, -0.3514556884765625, -0.32497406005859375, -0.298492431640625, -0.27201080322265625, -0.2455291748046875, -0.21904754638671875, -0.19256591796875, -0.16608428955078125, -0.1396026611328125, -0.11312103271484375, -0.086639404296875, -0.06015777587890625, -0.0336761474609375, -0.00719451904296875, 0.019287109375, 0.04576873779296875, 0.0722503662109375, 0.09873199462890625, 0.125213623046875, 0.15169525146484375, 0.1781768798828125, 0.20465850830078125, 0.23114013671875, 0.25762176513671875, 0.2841033935546875, 0.31058502197265625, 0.337066650390625, 0.36354827880859375, 0.3900299072265625, 0.41651153564453125, 0.4429931640625, 0.46947479248046875, 0.4959564208984375, 0.5224380493164062, 0.548919677734375, 0.5754013061523438, 0.6018829345703125, 0.6283645629882812, 0.65484619140625, 0.6813278198242188, 0.7078094482421875, 0.7342910766601562, 0.760772705078125, 0.7872543334960938, 0.8137359619140625, 0.8402175903320312, 0.86669921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 5.0, 7.0, 15.0, 8.0, 11.0, 17.0, 16.0, 18.0, 30.0, 29.0, 30.0, 31.0, 36.0, 36.0, 27.0, 49.0, 35.0, 46.0, 31.0, 1057.0, 43.0, 34.0, 43.0, 41.0, 29.0, 36.0, 33.0, 32.0, 27.0, 19.0, 27.0, 18.0, 19.0, 14.0, 13.0, 14.0, 10.0, 5.0, 9.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.78802490234375, -4.6033935546875, -4.41876220703125, -4.234130859375, -4.04949951171875, -3.8648681640625, -3.68023681640625, -3.49560546875, -3.31097412109375, -3.1263427734375, -2.94171142578125, -2.757080078125, -2.57244873046875, -2.3878173828125, -2.20318603515625, -2.0185546875, -1.83392333984375, -1.6492919921875, -1.46466064453125, -1.280029296875, -1.09539794921875, -0.9107666015625, -0.72613525390625, -0.54150390625, -0.35687255859375, -0.1722412109375, 0.01239013671875, 0.197021484375, 0.38165283203125, 0.5662841796875, 0.75091552734375, 0.935546875, 1.12017822265625, 1.3048095703125, 1.48944091796875, 1.674072265625, 1.85870361328125, 2.0433349609375, 2.22796630859375, 2.41259765625, 2.59722900390625, 2.7818603515625, 2.96649169921875, 3.151123046875, 3.33575439453125, 3.5203857421875, 3.70501708984375, 3.8896484375, 4.07427978515625, 4.2589111328125, 4.44354248046875, 4.628173828125, 4.81280517578125, 4.9974365234375, 5.18206787109375, 5.36669921875, 5.55133056640625, 5.7359619140625, 5.92059326171875, 6.105224609375, 6.28985595703125, 6.4744873046875, 6.65911865234375, 6.84375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 17.0, 23.0, 47.0, 72.0, 98.0, 165.0, 245.0, 372.0, 537.0, 816.0, 1271.0, 1883.0, 3010.0, 4501.0, 7136.0, 10684.0, 16365.0, 25231.0, 36885.0, 53507.0, 75284.0, 99957.0, 131410.0, 1159295.0, 130293.0, 99971.0, 75433.0, 53639.0, 36907.0, 24607.0, 16423.0, 10663.0, 7102.0, 4591.0, 2966.0, 1939.0, 1345.0, 827.0, 548.0, 366.0, 243.0, 160.0, 96.0, 60.0, 46.0, 22.0, 19.0, 23.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.433349609375, -0.4195899963378906, -0.40583038330078125, -0.3920707702636719, -0.3783111572265625, -0.3645515441894531, -0.35079193115234375, -0.3370323181152344, -0.323272705078125, -0.3095130920410156, -0.29575347900390625, -0.2819938659667969, -0.2682342529296875, -0.2544746398925781, -0.24071502685546875, -0.22695541381835938, -0.21319580078125, -0.19943618774414062, -0.18567657470703125, -0.17191696166992188, -0.1581573486328125, -0.14439773559570312, -0.13063812255859375, -0.11687850952148438, -0.103118896484375, -0.08935928344726562, -0.07559967041015625, -0.061840057373046875, -0.0480804443359375, -0.034320831298828125, -0.02056121826171875, -0.006801605224609375, 0.0069580078125, 0.020717620849609375, 0.03447723388671875, 0.048236846923828125, 0.0619964599609375, 0.07575607299804688, 0.08951568603515625, 0.10327529907226562, 0.117034912109375, 0.13079452514648438, 0.14455413818359375, 0.15831375122070312, 0.1720733642578125, 0.18583297729492188, 0.19959259033203125, 0.21335220336914062, 0.22711181640625, 0.24087142944335938, 0.25463104248046875, 0.2683906555175781, 0.2821502685546875, 0.2959098815917969, 0.30966949462890625, 0.3234291076660156, 0.337188720703125, 0.3509483337402344, 0.36470794677734375, 0.3784675598144531, 0.3922271728515625, 0.4059867858886719, 0.41974639892578125, 0.4335060119628906, 0.447265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 11.0, 14.0, 19.0, 26.0, 49.0, 80.0, 147.0, 241.0, 150.0, 75.0, 70.0, 29.0, 26.0, 14.0, 10.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1046142578125, -0.10140609741210938, -0.09819793701171875, -0.09498977661132812, -0.0917816162109375, -0.08857345581054688, -0.08536529541015625, -0.08215713500976562, -0.078948974609375, -0.07574081420898438, -0.07253265380859375, -0.06932449340820312, -0.0661163330078125, -0.06290817260742188, -0.05970001220703125, -0.056491851806640625, -0.05328369140625, -0.050075531005859375, -0.04686737060546875, -0.043659210205078125, -0.0404510498046875, -0.037242889404296875, -0.03403472900390625, -0.030826568603515625, -0.027618408203125, -0.024410247802734375, -0.02120208740234375, -0.017993927001953125, -0.0147857666015625, -0.011577606201171875, -0.00836944580078125, -0.005161285400390625, -0.001953125, 0.001255035400390625, 0.00446319580078125, 0.007671356201171875, 0.0108795166015625, 0.014087677001953125, 0.01729583740234375, 0.020503997802734375, 0.023712158203125, 0.026920318603515625, 0.03012847900390625, 0.033336639404296875, 0.0365447998046875, 0.039752960205078125, 0.04296112060546875, 0.046169281005859375, 0.04937744140625, 0.052585601806640625, 0.05579376220703125, 0.059001922607421875, 0.0622100830078125, 0.06541824340820312, 0.06862640380859375, 0.07183456420898438, 0.075042724609375, 0.07825088500976562, 0.08145904541015625, 0.08466720581054688, 0.0878753662109375, 0.09108352661132812, 0.09429168701171875, 0.09749984741210938, 0.1007080078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 10.0, 22.0, 30.0, 35.0, 75.0, 166.0, 371.0, 8225.0, 1038306.0, 823.0, 203.0, 88.0, 58.0, 36.0, 29.0, 20.0, 9.0, 4.0, 5.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.174163818359375, -2.10223388671875, -2.030303955078125, -1.9583740234375, -1.886444091796875, -1.81451416015625, -1.742584228515625, -1.670654296875, -1.598724365234375, -1.52679443359375, -1.454864501953125, -1.3829345703125, -1.311004638671875, -1.23907470703125, -1.167144775390625, -1.09521484375, -1.023284912109375, -0.95135498046875, -0.879425048828125, -0.8074951171875, -0.735565185546875, -0.66363525390625, -0.591705322265625, -0.519775390625, -0.447845458984375, -0.37591552734375, -0.303985595703125, -0.2320556640625, -0.160125732421875, -0.08819580078125, -0.016265869140625, 0.0556640625, 0.127593994140625, 0.19952392578125, 0.271453857421875, 0.3433837890625, 0.415313720703125, 0.48724365234375, 0.559173583984375, 0.631103515625, 0.703033447265625, 0.77496337890625, 0.846893310546875, 0.9188232421875, 0.990753173828125, 1.06268310546875, 1.134613037109375, 1.20654296875, 1.278472900390625, 1.35040283203125, 1.422332763671875, 1.4942626953125, 1.566192626953125, 1.63812255859375, 1.710052490234375, 1.781982421875, 1.853912353515625, 1.92584228515625, 1.997772216796875, 2.0697021484375, 2.141632080078125, 2.21356201171875, 2.285491943359375, 2.357421875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 30.0, 381.0, 541.0, 46.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8438287973403931, -0.8276101350784302, -0.8113914728164673, -0.7951728105545044, -0.7789541482925415, -0.7627354860305786, -0.7465168237686157, -0.7302981615066528, -0.7140794992446899, -0.697860836982727, -0.6816421747207642, -0.6654235124588013, -0.6492048501968384, -0.6329861879348755, -0.6167675256729126, -0.6005488634109497, -0.5843302011489868, -0.5681115388870239, -0.551892876625061, -0.5356742143630981, -0.5194555521011353, -0.5032368898391724, -0.4870182275772095, -0.4707995653152466, -0.4545809030532837, -0.4383622407913208, -0.4221435785293579, -0.405924916267395, -0.38970625400543213, -0.37348759174346924, -0.35726892948150635, -0.34105026721954346, -0.32483160495758057, -0.3086129426956177, -0.2923942804336548, -0.2761756181716919, -0.259956955909729, -0.2437382936477661, -0.22751963138580322, -0.21130096912384033, -0.19508230686187744, -0.17886364459991455, -0.16264498233795166, -0.14642632007598877, -0.13020765781402588, -0.11398899555206299, -0.0977703332901001, -0.08155167102813721, -0.06533300876617432, -0.049114346504211426, -0.032895684242248535, -0.016677021980285645, -0.0004583597183227539, 0.015760302543640137, 0.03197896480560303, 0.04819762706756592, 0.06441628932952881, 0.0806349515914917, 0.09685361385345459, 0.11307227611541748, 0.12929093837738037, 0.14550960063934326, 0.16172826290130615, 0.17794692516326904, 0.19416558742523193]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 10.0, 8.0, 9.0, 7.0, 11.0, 17.0, 21.0, 24.0, 29.0, 24.0, 32.0, 31.0, 31.0, 29.0, 33.0, 45.0, 38.0, 39.0, 41.0, 46.0, 45.0, 37.0, 31.0, 51.0, 44.0, 20.0, 37.0, 31.0, 21.0, 20.0, 23.0, 21.0, 13.0, 12.0, 12.0, 12.0, 9.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492423415184021, -0.14463026821613312, -0.14001819491386414, -0.13540612161159515, -0.13079404830932617, -0.1261819750070572, -0.12156990170478821, -0.11695782840251923, -0.11234575510025024, -0.10773368179798126, -0.10312160849571228, -0.0985095351934433, -0.09389746189117432, -0.08928538858890533, -0.08467331528663635, -0.08006124198436737, -0.07544916868209839, -0.0708370953798294, -0.06622502207756042, -0.06161294877529144, -0.05700087547302246, -0.05238880217075348, -0.0477767288684845, -0.043164655566215515, -0.03855258226394653, -0.03394050896167755, -0.02932843565940857, -0.024716362357139587, -0.020104289054870605, -0.015492215752601624, -0.010880142450332642, -0.00626806914806366, -0.0016559958457946777, 0.002956077456474304, 0.007568150758743286, 0.012180224061012268, 0.01679229736328125, 0.021404370665550232, 0.026016443967819214, 0.030628517270088196, 0.03524059057235718, 0.03985266387462616, 0.04446473717689514, 0.049076810479164124, 0.053688883781433105, 0.05830095708370209, 0.06291303038597107, 0.06752510368824005, 0.07213717699050903, 0.07674925029277802, 0.081361323595047, 0.08597339689731598, 0.09058547019958496, 0.09519754350185394, 0.09980961680412292, 0.1044216901063919, 0.10903376340866089, 0.11364583671092987, 0.11825791001319885, 0.12286998331546783, 0.12748205661773682, 0.1320941299200058, 0.13670620322227478, 0.14131827652454376, 0.14593034982681274]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 6.0, 8.0, 5.0, 10.0, 13.0, 15.0, 19.0, 18.0, 12.0, 24.0, 28.0, 40.0, 38.0, 33.0, 40.0, 56.0, 33.0, 42.0, 42.0, 40.0, 37.0, 35.0, 38.0, 32.0, 40.0, 44.0, 36.0, 31.0, 23.0, 19.0, 16.0, 17.0, 23.0, 17.0, 11.0, 10.0, 11.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5078125, -7.254150390625, -7.00048828125, -6.746826171875, -6.4931640625, -6.239501953125, -5.98583984375, -5.732177734375, -5.478515625, -5.224853515625, -4.97119140625, -4.717529296875, -4.4638671875, -4.210205078125, -3.95654296875, -3.702880859375, -3.44921875, -3.195556640625, -2.94189453125, -2.688232421875, -2.4345703125, -2.180908203125, -1.92724609375, -1.673583984375, -1.419921875, -1.166259765625, -0.91259765625, -0.658935546875, -0.4052734375, -0.151611328125, 0.10205078125, 0.355712890625, 0.609375, 0.863037109375, 1.11669921875, 1.370361328125, 1.6240234375, 1.877685546875, 2.13134765625, 2.385009765625, 2.638671875, 2.892333984375, 3.14599609375, 3.399658203125, 3.6533203125, 3.906982421875, 4.16064453125, 4.414306640625, 4.66796875, 4.921630859375, 5.17529296875, 5.428955078125, 5.6826171875, 5.936279296875, 6.18994140625, 6.443603515625, 6.697265625, 6.950927734375, 7.20458984375, 7.458251953125, 7.7119140625, 7.965576171875, 8.21923828125, 8.472900390625, 8.7265625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 11.0, 9.0, 16.0, 16.0, 25.0, 45.0, 47.0, 73.0, 107.0, 136.0, 216.0, 436.0, 704.0, 1399.0, 2661.0, 5402.0, 11025.0, 22944.0, 49508.0, 113547.0, 266293.0, 312481.0, 144028.0, 61957.0, 28359.0, 13436.0, 6611.0, 3232.0, 1706.0, 790.0, 520.0, 287.0, 166.0, 117.0, 80.0, 53.0, 28.0, 19.0, 21.0, 15.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.4296875, -10.0947265625, -9.759765625, -9.4248046875, -9.08984375, -8.7548828125, -8.419921875, -8.0849609375, -7.75, -7.4150390625, -7.080078125, -6.7451171875, -6.41015625, -6.0751953125, -5.740234375, -5.4052734375, -5.0703125, -4.7353515625, -4.400390625, -4.0654296875, -3.73046875, -3.3955078125, -3.060546875, -2.7255859375, -2.390625, -2.0556640625, -1.720703125, -1.3857421875, -1.05078125, -0.7158203125, -0.380859375, -0.0458984375, 0.2890625, 0.6240234375, 0.958984375, 1.2939453125, 1.62890625, 1.9638671875, 2.298828125, 2.6337890625, 2.96875, 3.3037109375, 3.638671875, 3.9736328125, 4.30859375, 4.6435546875, 4.978515625, 5.3134765625, 5.6484375, 5.9833984375, 6.318359375, 6.6533203125, 6.98828125, 7.3232421875, 7.658203125, 7.9931640625, 8.328125, 8.6630859375, 8.998046875, 9.3330078125, 9.66796875, 10.0029296875, 10.337890625, 10.6728515625, 11.0078125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 9.0, 6.0, 16.0, 11.0, 24.0, 14.0, 23.0, 25.0, 28.0, 41.0, 34.0, 60.0, 56.0, 96.0, 134.0, 291.0, 1437.0, 205.0, 117.0, 83.0, 57.0, 49.0, 41.0, 35.0, 38.0, 25.0, 13.0, 19.0, 13.0, 15.0, 5.0, 7.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.9375, -19.11376953125, -18.2900390625, -17.46630859375, -16.642578125, -15.81884765625, -14.9951171875, -14.17138671875, -13.34765625, -12.52392578125, -11.7001953125, -10.87646484375, -10.052734375, -9.22900390625, -8.4052734375, -7.58154296875, -6.7578125, -5.93408203125, -5.1103515625, -4.28662109375, -3.462890625, -2.63916015625, -1.8154296875, -0.99169921875, -0.16796875, 0.65576171875, 1.4794921875, 2.30322265625, 3.126953125, 3.95068359375, 4.7744140625, 5.59814453125, 6.421875, 7.24560546875, 8.0693359375, 8.89306640625, 9.716796875, 10.54052734375, 11.3642578125, 12.18798828125, 13.01171875, 13.83544921875, 14.6591796875, 15.48291015625, 16.306640625, 17.13037109375, 17.9541015625, 18.77783203125, 19.6015625, 20.42529296875, 21.2490234375, 22.07275390625, 22.896484375, 23.72021484375, 24.5439453125, 25.36767578125, 26.19140625, 27.01513671875, 27.8388671875, 28.66259765625, 29.486328125, 30.31005859375, 31.1337890625, 31.95751953125, 32.78125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 12.0, 19.0, 24.0, 32.0, 37.0, 42.0, 73.0, 140.0, 222.0, 341.0, 696.0, 2546.0, 40422.0, 2828098.0, 263472.0, 7230.0, 1078.0, 462.0, 277.0, 188.0, 88.0, 50.0, 48.0, 35.0, 15.0, 6.0, 10.0, 8.0, 5.0, 3.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -48.001953125, -46.53515625, -45.068359375, -43.6015625, -42.134765625, -40.66796875, -39.201171875, -37.734375, -36.267578125, -34.80078125, -33.333984375, -31.8671875, -30.400390625, -28.93359375, -27.466796875, -26.0, -24.533203125, -23.06640625, -21.599609375, -20.1328125, -18.666015625, -17.19921875, -15.732421875, -14.265625, -12.798828125, -11.33203125, -9.865234375, -8.3984375, -6.931640625, -5.46484375, -3.998046875, -2.53125, -1.064453125, 0.40234375, 1.869140625, 3.3359375, 4.802734375, 6.26953125, 7.736328125, 9.203125, 10.669921875, 12.13671875, 13.603515625, 15.0703125, 16.537109375, 18.00390625, 19.470703125, 20.9375, 22.404296875, 23.87109375, 25.337890625, 26.8046875, 28.271484375, 29.73828125, 31.205078125, 32.671875, 34.138671875, 35.60546875, 37.072265625, 38.5390625, 40.005859375, 41.47265625, 42.939453125, 44.40625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 76.0, 661.0, 274.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.8414306640625, -305.5087890625, -296.1761474609375, -286.843505859375, -277.5108642578125, -268.1781921386719, -258.8455505371094, -249.51290893554688, -240.18026733398438, -230.84762573242188, -221.51498413085938, -212.1823272705078, -202.8496856689453, -193.5170440673828, -184.18438720703125, -174.85174560546875, -165.51910400390625, -156.18646240234375, -146.85382080078125, -137.5211639404297, -128.1885223388672, -118.85588073730469, -109.52323150634766, -100.19058227539062, -90.85794067382812, -81.52529907226562, -72.1926498413086, -62.86000442504883, -53.52735900878906, -44.1947135925293, -34.86206817626953, -25.5294189453125, -16.196746826171875, -6.864101409912109, 2.4685440063476562, 11.801189422607422, 21.133834838867188, 30.466480255126953, 39.79912567138672, 49.13177490234375, 58.46441650390625, 67.79705810546875, 77.12970733642578, 86.46235656738281, 95.79499816894531, 105.12763977050781, 114.46028900146484, 123.79293823242188, 133.12557983398438, 142.45822143554688, 151.79086303710938, 161.12351989746094, 170.45616149902344, 179.78880310058594, 189.1214599609375, 198.4541015625, 207.7867431640625, 217.119384765625, 226.4520263671875, 235.78468322753906, 245.11732482910156, 254.44996643066406, 263.7826232910156, 273.1152648925781, 282.4479064941406]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 11.0, 6.0, 16.0, 18.0, 16.0, 17.0, 15.0, 19.0, 27.0, 29.0, 36.0, 31.0, 42.0, 33.0, 43.0, 42.0, 26.0, 44.0, 34.0, 49.0, 46.0, 42.0, 40.0, 30.0, 32.0, 32.0, 23.0, 36.0, 25.0, 27.0, 18.0, 21.0, 15.0, 11.0, 11.0, 10.0, 7.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.81560134887695, -54.20024108886719, -52.58488464355469, -50.96952438354492, -49.35416793823242, -47.738807678222656, -46.123451232910156, -44.50809097290039, -42.892730712890625, -41.27737045288086, -39.66201400756836, -38.046653747558594, -36.431297302246094, -34.81593704223633, -33.20057678222656, -31.585220336914062, -29.969863891601562, -28.35450553894043, -26.739147186279297, -25.12378692626953, -23.50843048095703, -21.893070220947266, -20.277711868286133, -18.662353515625, -17.046995162963867, -15.431636810302734, -13.816278457641602, -12.200919151306152, -10.58556079864502, -8.970202445983887, -7.3548431396484375, -5.739484786987305, -4.1241302490234375, -2.5087716579437256, -0.8934130668640137, 0.7219457626342773, 2.33730411529541, 3.952662467956543, 5.568021774291992, 7.183380126953125, 8.798738479614258, 10.41409683227539, 12.029455184936523, 13.644814491271973, 15.260172843933105, 16.875530242919922, 18.490890502929688, 20.10624885559082, 21.721607208251953, 23.336965560913086, 24.95232391357422, 26.567684173583984, 28.183040618896484, 29.79840087890625, 31.413759231567383, 33.029117584228516, 34.64447784423828, 36.25983810424805, 37.87519454956055, 39.49055480957031, 41.10591125488281, 42.72127151489258, 44.336631774902344, 45.951988220214844, 47.567344665527344]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 4.0, 5.0, 5.0, 10.0, 8.0, 14.0, 17.0, 21.0, 23.0, 11.0, 19.0, 29.0, 36.0, 44.0, 39.0, 33.0, 46.0, 32.0, 54.0, 49.0, 39.0, 49.0, 48.0, 33.0, 22.0, 37.0, 38.0, 39.0, 30.0, 22.0, 17.0, 7.0, 27.0, 16.0, 17.0, 12.0, 10.0, 7.0, 5.0, 2.0, 4.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9921875, -8.7265625, -8.4609375, -8.1953125, -7.9296875, -7.6640625, -7.3984375, -7.1328125, -6.8671875, -6.6015625, -6.3359375, -6.0703125, -5.8046875, -5.5390625, -5.2734375, -5.0078125, -4.7421875, -4.4765625, -4.2109375, -3.9453125, -3.6796875, -3.4140625, -3.1484375, -2.8828125, -2.6171875, -2.3515625, -2.0859375, -1.8203125, -1.5546875, -1.2890625, -1.0234375, -0.7578125, -0.4921875, -0.2265625, 0.0390625, 0.3046875, 0.5703125, 0.8359375, 1.1015625, 1.3671875, 1.6328125, 1.8984375, 2.1640625, 2.4296875, 2.6953125, 2.9609375, 3.2265625, 3.4921875, 3.7578125, 4.0234375, 4.2890625, 4.5546875, 4.8203125, 5.0859375, 5.3515625, 5.6171875, 5.8828125, 6.1484375, 6.4140625, 6.6796875, 6.9453125, 7.2109375, 7.4765625, 7.7421875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 7.0, 9.0, 16.0, 21.0, 25.0, 17.0, 24.0, 38.0, 41.0, 65.0, 75.0, 112.0, 105.0, 159.0, 238.0, 313.0, 456.0, 3454.0, 3114505.0, 1070986.0, 1907.0, 424.0, 327.0, 220.0, 182.0, 108.0, 86.0, 47.0, 75.0, 41.0, 39.0, 25.0, 18.0, 13.0, 15.0, 22.0, 9.0, 6.0, 12.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-77.0625, -74.7216796875, -72.380859375, -70.0400390625, -67.69921875, -65.3583984375, -63.017578125, -60.6767578125, -58.3359375, -55.9951171875, -53.654296875, -51.3134765625, -48.97265625, -46.6318359375, -44.291015625, -41.9501953125, -39.609375, -37.2685546875, -34.927734375, -32.5869140625, -30.24609375, -27.9052734375, -25.564453125, -23.2236328125, -20.8828125, -18.5419921875, -16.201171875, -13.8603515625, -11.51953125, -9.1787109375, -6.837890625, -4.4970703125, -2.15625, 0.1845703125, 2.525390625, 4.8662109375, 7.20703125, 9.5478515625, 11.888671875, 14.2294921875, 16.5703125, 18.9111328125, 21.251953125, 23.5927734375, 25.93359375, 28.2744140625, 30.615234375, 32.9560546875, 35.296875, 37.6376953125, 39.978515625, 42.3193359375, 44.66015625, 47.0009765625, 49.341796875, 51.6826171875, 54.0234375, 56.3642578125, 58.705078125, 61.0458984375, 63.38671875, 65.7275390625, 68.068359375, 70.4091796875, 72.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 13.0, 9.0, 23.0, 18.0, 23.0, 25.0, 34.0, 50.0, 68.0, 90.0, 120.0, 153.0, 229.0, 307.0, 380.0, 510.0, 512.0, 382.0, 279.0, 233.0, 151.0, 98.0, 93.0, 65.0, 48.0, 36.0, 21.0, 22.0, 19.0, 12.0, 10.0, 9.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.297607421875, -8.93896484375, -8.580322265625, -8.2216796875, -7.863037109375, -7.50439453125, -7.145751953125, -6.787109375, -6.428466796875, -6.06982421875, -5.711181640625, -5.3525390625, -4.993896484375, -4.63525390625, -4.276611328125, -3.91796875, -3.559326171875, -3.20068359375, -2.842041015625, -2.4833984375, -2.124755859375, -1.76611328125, -1.407470703125, -1.048828125, -0.690185546875, -0.33154296875, 0.027099609375, 0.3857421875, 0.744384765625, 1.10302734375, 1.461669921875, 1.8203125, 2.178955078125, 2.53759765625, 2.896240234375, 3.2548828125, 3.613525390625, 3.97216796875, 4.330810546875, 4.689453125, 5.048095703125, 5.40673828125, 5.765380859375, 6.1240234375, 6.482666015625, 6.84130859375, 7.199951171875, 7.55859375, 7.917236328125, 8.27587890625, 8.634521484375, 8.9931640625, 9.351806640625, 9.71044921875, 10.069091796875, 10.427734375, 10.786376953125, 11.14501953125, 11.503662109375, 11.8623046875, 12.220947265625, 12.57958984375, 12.938232421875, 13.296875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 5.0, 4.0, 11.0, 12.0, 15.0, 16.0, 12.0, 25.0, 52.0, 52.0, 90.0, 150.0, 292.0, 712.0, 4580.0, 76759.0, 3037924.0, 1040171.0, 29825.0, 2349.0, 502.0, 241.0, 143.0, 95.0, 39.0, 34.0, 28.0, 21.0, 30.0, 13.0, 7.0, 15.0, 10.0, 10.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-36.5, -35.31689453125, -34.1337890625, -32.95068359375, -31.767578125, -30.58447265625, -29.4013671875, -28.21826171875, -27.03515625, -25.85205078125, -24.6689453125, -23.48583984375, -22.302734375, -21.11962890625, -19.9365234375, -18.75341796875, -17.5703125, -16.38720703125, -15.2041015625, -14.02099609375, -12.837890625, -11.65478515625, -10.4716796875, -9.28857421875, -8.10546875, -6.92236328125, -5.7392578125, -4.55615234375, -3.373046875, -2.18994140625, -1.0068359375, 0.17626953125, 1.359375, 2.54248046875, 3.7255859375, 4.90869140625, 6.091796875, 7.27490234375, 8.4580078125, 9.64111328125, 10.82421875, 12.00732421875, 13.1904296875, 14.37353515625, 15.556640625, 16.73974609375, 17.9228515625, 19.10595703125, 20.2890625, 21.47216796875, 22.6552734375, 23.83837890625, 25.021484375, 26.20458984375, 27.3876953125, 28.57080078125, 29.75390625, 30.93701171875, 32.1201171875, 33.30322265625, 34.486328125, 35.66943359375, 36.8525390625, 38.03564453125, 39.21875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 15.0, 44.0, 102.0, 149.0, 208.0, 198.0, 148.0, 91.0, 37.0, 12.0, 5.0, 2.0], "bins": [-164.15582275390625, -161.27142333984375, -158.3870086669922, -155.5026092529297, -152.6182098388672, -149.73379516601562, -146.84939575195312, -143.96499633789062, -141.08059692382812, -138.19619750976562, -135.31178283691406, -132.42738342285156, -129.54298400878906, -126.65857696533203, -123.774169921875, -120.8897705078125, -118.00535583496094, -115.1209487915039, -112.2365493774414, -109.35214233398438, -106.46774291992188, -103.58333587646484, -100.69892883300781, -97.81452941894531, -94.93012237548828, -92.04571533203125, -89.16131591796875, -86.27690887451172, -83.39250183105469, -80.50810241699219, -77.62369537353516, -74.73928833007812, -71.85488891601562, -68.9704818725586, -66.0860824584961, -63.20167541503906, -60.3172721862793, -57.43286895751953, -54.5484619140625, -51.664058685302734, -48.779659271240234, -45.89525604248047, -43.01084899902344, -40.12644577026367, -37.242042541503906, -34.35763931274414, -31.473234176635742, -28.588829040527344, -25.704425811767578, -22.820022583007812, -19.935617446899414, -17.051212310791016, -14.16680908203125, -11.282404899597168, -8.398000717163086, -5.5135955810546875, -2.629192352294922, 0.25521183013916016, 3.139616012573242, 6.024020195007324, 8.908424377441406, 11.792828559875488, 14.67723274230957, 17.56163787841797, 20.446041107177734]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 10.0, 11.0, 17.0, 25.0, 13.0, 20.0, 20.0, 25.0, 27.0, 21.0, 39.0, 36.0, 45.0, 50.0, 42.0, 50.0, 48.0, 57.0, 42.0, 50.0, 43.0, 36.0, 42.0, 27.0, 38.0, 34.0, 25.0, 16.0, 16.0, 9.0, 16.0, 7.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.233428955078125, -47.84324264526367, -46.45305633544922, -45.06287384033203, -43.67268753051758, -42.282501220703125, -40.89231491088867, -39.50212860107422, -38.11194610595703, -36.72175979614258, -35.331573486328125, -33.94139099121094, -32.551204681396484, -31.16101837158203, -29.770832061767578, -28.380645751953125, -26.990459442138672, -25.60027313232422, -24.2100887298584, -22.819902420043945, -21.429718017578125, -20.039531707763672, -18.64934539794922, -17.259159088134766, -15.868974685668945, -14.478789329528809, -13.088603973388672, -11.698417663574219, -10.308232307434082, -8.918046951293945, -7.527860641479492, -6.1376752853393555, -4.747493743896484, -3.3573081493377686, -1.9671225547790527, -0.5769367218017578, 0.8132486343383789, 2.2034339904785156, 3.5936203002929688, 4.9838056564331055, 6.373991012573242, 7.764176368713379, 9.154361724853516, 10.544548034667969, 11.934733390808105, 13.324918746948242, 14.715105056762695, 16.105289459228516, 17.49547576904297, 18.885662078857422, 20.275846481323242, 21.666032791137695, 23.056217193603516, 24.44640350341797, 25.836589813232422, 27.226776123046875, 28.616960525512695, 30.00714683532715, 31.39733123779297, 32.78751754760742, 34.177703857421875, 35.56788635253906, 36.95807647705078, 38.34825897216797, 39.73844528198242]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 8.0, 5.0, 14.0, 9.0, 11.0, 14.0, 10.0, 22.0, 21.0, 15.0, 19.0, 25.0, 19.0, 34.0, 28.0, 42.0, 23.0, 27.0, 24.0, 40.0, 38.0, 36.0, 33.0, 43.0, 53.0, 42.0, 45.0, 35.0, 32.0, 22.0, 23.0, 32.0, 24.0, 24.0, 12.0, 12.0, 16.0, 15.0, 8.0, 9.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.53515625, -7.29449462890625, -7.0538330078125, -6.81317138671875, -6.572509765625, -6.33184814453125, -6.0911865234375, -5.85052490234375, -5.60986328125, -5.36920166015625, -5.1285400390625, -4.88787841796875, -4.647216796875, -4.40655517578125, -4.1658935546875, -3.92523193359375, -3.6845703125, -3.44390869140625, -3.2032470703125, -2.96258544921875, -2.721923828125, -2.48126220703125, -2.2406005859375, -1.99993896484375, -1.75927734375, -1.51861572265625, -1.2779541015625, -1.03729248046875, -0.796630859375, -0.55596923828125, -0.3153076171875, -0.07464599609375, 0.166015625, 0.40667724609375, 0.6473388671875, 0.88800048828125, 1.128662109375, 1.36932373046875, 1.6099853515625, 1.85064697265625, 2.09130859375, 2.33197021484375, 2.5726318359375, 2.81329345703125, 3.053955078125, 3.29461669921875, 3.5352783203125, 3.77593994140625, 4.0166015625, 4.25726318359375, 4.4979248046875, 4.73858642578125, 4.979248046875, 5.21990966796875, 5.4605712890625, 5.70123291015625, 5.94189453125, 6.18255615234375, 6.4232177734375, 6.66387939453125, 6.904541015625, 7.14520263671875, 7.3858642578125, 7.62652587890625, 7.8671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 9.0, 22.0, 35.0, 36.0, 60.0, 94.0, 142.0, 205.0, 261.0, 405.0, 656.0, 983.0, 1413.0, 2083.0, 3002.0, 4459.0, 6440.0, 9785.0, 14343.0, 21420.0, 30553.0, 43630.0, 59400.0, 78493.0, 98060.0, 113535.0, 117598.0, 108251.0, 89559.0, 70286.0, 52771.0, 37971.0, 26085.0, 18346.0, 12374.0, 8502.0, 5688.0, 3817.0, 2581.0, 1713.0, 1097.0, 784.0, 511.0, 363.0, 222.0, 156.0, 96.0, 81.0, 66.0, 33.0, 26.0, 20.0, 10.0, 3.0, 3.0, 4.0, 3.0], "bins": [-0.65380859375, -0.6341705322265625, -0.614532470703125, -0.5948944091796875, -0.57525634765625, -0.5556182861328125, -0.535980224609375, -0.5163421630859375, -0.4967041015625, -0.4770660400390625, -0.457427978515625, -0.4377899169921875, -0.41815185546875, -0.3985137939453125, -0.378875732421875, -0.3592376708984375, -0.339599609375, -0.3199615478515625, -0.300323486328125, -0.2806854248046875, -0.26104736328125, -0.2414093017578125, -0.221771240234375, -0.2021331787109375, -0.1824951171875, -0.1628570556640625, -0.143218994140625, -0.1235809326171875, -0.10394287109375, -0.0843048095703125, -0.064666748046875, -0.0450286865234375, -0.025390625, -0.0057525634765625, 0.013885498046875, 0.0335235595703125, 0.05316162109375, 0.0727996826171875, 0.092437744140625, 0.1120758056640625, 0.1317138671875, 0.1513519287109375, 0.170989990234375, 0.1906280517578125, 0.21026611328125, 0.2299041748046875, 0.249542236328125, 0.2691802978515625, 0.288818359375, 0.3084564208984375, 0.328094482421875, 0.3477325439453125, 0.36737060546875, 0.3870086669921875, 0.406646728515625, 0.4262847900390625, 0.4459228515625, 0.4655609130859375, 0.485198974609375, 0.5048370361328125, 0.52447509765625, 0.5441131591796875, 0.563751220703125, 0.5833892822265625, 0.60302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 7.0, 5.0, 10.0, 17.0, 9.0, 18.0, 23.0, 20.0, 17.0, 26.0, 17.0, 15.0, 31.0, 25.0, 29.0, 33.0, 38.0, 34.0, 25.0, 34.0, 40.0, 1065.0, 41.0, 36.0, 35.0, 39.0, 30.0, 25.0, 26.0, 42.0, 20.0, 21.0, 19.0, 20.0, 23.0, 16.0, 11.0, 9.0, 13.0, 10.0, 6.0, 4.0, 6.0, 4.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.6484375, -5.47845458984375, -5.3084716796875, -5.13848876953125, -4.968505859375, -4.79852294921875, -4.6285400390625, -4.45855712890625, -4.28857421875, -4.11859130859375, -3.9486083984375, -3.77862548828125, -3.608642578125, -3.43865966796875, -3.2686767578125, -3.09869384765625, -2.9287109375, -2.75872802734375, -2.5887451171875, -2.41876220703125, -2.248779296875, -2.07879638671875, -1.9088134765625, -1.73883056640625, -1.56884765625, -1.39886474609375, -1.2288818359375, -1.05889892578125, -0.888916015625, -0.71893310546875, -0.5489501953125, -0.37896728515625, -0.208984375, -0.03900146484375, 0.1309814453125, 0.30096435546875, 0.470947265625, 0.64093017578125, 0.8109130859375, 0.98089599609375, 1.15087890625, 1.32086181640625, 1.4908447265625, 1.66082763671875, 1.830810546875, 2.00079345703125, 2.1707763671875, 2.34075927734375, 2.5107421875, 2.68072509765625, 2.8507080078125, 3.02069091796875, 3.190673828125, 3.36065673828125, 3.5306396484375, 3.70062255859375, 3.87060546875, 4.04058837890625, 4.2105712890625, 4.38055419921875, 4.550537109375, 4.72052001953125, 4.8905029296875, 5.06048583984375, 5.23046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 12.0, 16.0, 27.0, 35.0, 75.0, 118.0, 149.0, 222.0, 352.0, 485.0, 723.0, 1055.0, 1684.0, 2542.0, 3693.0, 5477.0, 8166.0, 12247.0, 18013.0, 26130.0, 37677.0, 53305.0, 72164.0, 93078.0, 119520.0, 1123754.0, 150731.0, 98295.0, 77410.0, 57691.0, 41480.0, 29264.0, 19900.0, 13550.0, 9070.0, 6274.0, 4237.0, 2826.0, 1846.0, 1236.0, 795.0, 590.0, 409.0, 273.0, 181.0, 128.0, 89.0, 59.0, 29.0, 19.0, 12.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.427001953125, -0.4135017395019531, -0.40000152587890625, -0.3865013122558594, -0.3730010986328125, -0.3595008850097656, -0.34600067138671875, -0.3325004577636719, -0.319000244140625, -0.3055000305175781, -0.29199981689453125, -0.2784996032714844, -0.2649993896484375, -0.2514991760253906, -0.23799896240234375, -0.22449874877929688, -0.21099853515625, -0.19749832153320312, -0.18399810791015625, -0.17049789428710938, -0.1569976806640625, -0.14349746704101562, -0.12999725341796875, -0.11649703979492188, -0.102996826171875, -0.08949661254882812, -0.07599639892578125, -0.062496185302734375, -0.0489959716796875, -0.035495758056640625, -0.02199554443359375, -0.008495330810546875, 0.0050048828125, 0.018505096435546875, 0.03200531005859375, 0.045505523681640625, 0.0590057373046875, 0.07250595092773438, 0.08600616455078125, 0.09950637817382812, 0.113006591796875, 0.12650680541992188, 0.14000701904296875, 0.15350723266601562, 0.1670074462890625, 0.18050765991210938, 0.19400787353515625, 0.20750808715820312, 0.22100830078125, 0.23450851440429688, 0.24800872802734375, 0.2615089416503906, 0.2750091552734375, 0.2885093688964844, 0.30200958251953125, 0.3155097961425781, 0.329010009765625, 0.3425102233886719, 0.35601043701171875, 0.3695106506347656, 0.3830108642578125, 0.3965110778808594, 0.41001129150390625, 0.4235115051269531, 0.43701171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 11.0, 16.0, 25.0, 41.0, 53.0, 78.0, 119.0, 135.0, 118.0, 111.0, 78.0, 42.0, 52.0, 26.0, 20.0, 14.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.11138916015625, -0.10860538482666016, -0.10582160949707031, -0.10303783416748047, -0.10025405883789062, -0.09747028350830078, -0.09468650817871094, -0.0919027328491211, -0.08911895751953125, -0.0863351821899414, -0.08355140686035156, -0.08076763153076172, -0.07798385620117188, -0.07520008087158203, -0.07241630554199219, -0.06963253021240234, -0.0668487548828125, -0.06406497955322266, -0.06128120422363281, -0.05849742889404297, -0.055713653564453125, -0.05292987823486328, -0.05014610290527344, -0.047362327575683594, -0.04457855224609375, -0.041794776916503906, -0.03901100158691406, -0.03622722625732422, -0.033443450927734375, -0.03065967559814453, -0.027875900268554688, -0.025092124938964844, -0.022308349609375, -0.019524574279785156, -0.016740798950195312, -0.013957023620605469, -0.011173248291015625, -0.008389472961425781, -0.0056056976318359375, -0.0028219223022460938, -3.814697265625e-05, 0.0027456283569335938, 0.0055294036865234375, 0.008313179016113281, 0.011096954345703125, 0.013880729675292969, 0.016664505004882812, 0.019448280334472656, 0.0222320556640625, 0.025015830993652344, 0.027799606323242188, 0.03058338165283203, 0.033367156982421875, 0.03615093231201172, 0.03893470764160156, 0.041718482971191406, 0.04450225830078125, 0.047286033630371094, 0.05006980895996094, 0.05285358428955078, 0.055637359619140625, 0.05842113494873047, 0.06120491027832031, 0.06398868560791016, 0.0667724609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 5.0, 15.0, 16.0, 22.0, 41.0, 62.0, 107.0, 182.0, 363.0, 1449.0, 1029798.0, 15149.0, 669.0, 289.0, 122.0, 73.0, 36.0, 34.0, 26.0, 24.0, 7.0, 13.0, 8.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.25, -1.197418212890625, -1.14483642578125, -1.092254638671875, -1.0396728515625, -0.987091064453125, -0.93450927734375, -0.881927490234375, -0.829345703125, -0.776763916015625, -0.72418212890625, -0.671600341796875, -0.6190185546875, -0.566436767578125, -0.51385498046875, -0.461273193359375, -0.40869140625, -0.356109619140625, -0.30352783203125, -0.250946044921875, -0.1983642578125, -0.145782470703125, -0.09320068359375, -0.040618896484375, 0.011962890625, 0.064544677734375, 0.11712646484375, 0.169708251953125, 0.2222900390625, 0.274871826171875, 0.32745361328125, 0.380035400390625, 0.4326171875, 0.485198974609375, 0.53778076171875, 0.590362548828125, 0.6429443359375, 0.695526123046875, 0.74810791015625, 0.800689697265625, 0.853271484375, 0.905853271484375, 0.95843505859375, 1.011016845703125, 1.0635986328125, 1.116180419921875, 1.16876220703125, 1.221343994140625, 1.27392578125, 1.326507568359375, 1.37908935546875, 1.431671142578125, 1.4842529296875, 1.536834716796875, 1.58941650390625, 1.641998291015625, 1.694580078125, 1.747161865234375, 1.79974365234375, 1.852325439453125, 1.9049072265625, 1.957489013671875, 2.01007080078125, 2.062652587890625, 2.115234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 13.0, 50.0, 421.0, 492.0, 29.0, 5.0, 1.0, 1.0], "bins": [-0.7726542949676514, -0.7595790028572083, -0.7465036511421204, -0.7334283590316772, -0.7203530073165894, -0.7072777152061462, -0.6942023634910583, -0.6811270713806152, -0.6680517196655273, -0.6549764275550842, -0.6419010758399963, -0.6288257837295532, -0.6157504320144653, -0.6026751399040222, -0.5895997881889343, -0.5765244960784912, -0.5634491443634033, -0.5503738522529602, -0.5372985005378723, -0.5242232084274292, -0.5111478567123413, -0.4980725347995758, -0.4849972128868103, -0.4719218909740448, -0.4588465988636017, -0.4457712769508362, -0.4326959550380707, -0.4196206331253052, -0.4065453112125397, -0.39346998929977417, -0.38039466738700867, -0.36731934547424316, -0.35424402356147766, -0.34116870164871216, -0.32809337973594666, -0.31501805782318115, -0.30194273591041565, -0.28886741399765015, -0.27579209208488464, -0.26271677017211914, -0.24964146316051483, -0.23656614124774933, -0.22349081933498383, -0.21041549742221832, -0.19734017550945282, -0.1842648684978485, -0.171189546585083, -0.1581142246723175, -0.145038902759552, -0.1319635808467865, -0.118888258934021, -0.1058129370212555, -0.09273761510848999, -0.07966230064630508, -0.06658697873353958, -0.05351165682077408, -0.04043632745742798, -0.027361005544662476, -0.014285685494542122, -0.0012103654444217682, 0.011864956468343735, 0.02494027465581894, 0.03801559656858444, 0.051090918481349945, 0.06416624039411545]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 5.0, 15.0, 13.0, 12.0, 17.0, 25.0, 23.0, 42.0, 25.0, 32.0, 37.0, 33.0, 33.0, 42.0, 43.0, 38.0, 49.0, 29.0, 33.0, 45.0, 39.0, 47.0, 35.0, 32.0, 31.0, 23.0, 32.0, 26.0, 19.0, 20.0, 15.0, 14.0, 8.0, 10.0, 13.0, 5.0, 8.0, 2.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10916274785995483, -0.10536446422338486, -0.10156618803739548, -0.0977679044008255, -0.09396962821483612, -0.09017134457826614, -0.08637306094169617, -0.08257478475570679, -0.07877650111913681, -0.07497821748256683, -0.07117994129657745, -0.06738165766000748, -0.0635833740234375, -0.05978509783744812, -0.05598681420087814, -0.052188534289598465, -0.04839025437831879, -0.04459197446703911, -0.04079369455575943, -0.03699541091918945, -0.033197131007909775, -0.029398851096630096, -0.02560056932270527, -0.02180228754878044, -0.018004007637500763, -0.01420572679489851, -0.010407445952296257, -0.006609165109694004, -0.002810884267091751, 0.0009873956441879272, 0.004785677418112755, 0.008583959192037582, 0.01238223910331726, 0.01618051901459694, 0.019978800788521767, 0.023777082562446594, 0.027575362473726273, 0.03137364238500595, 0.03517192602157593, 0.038970205932855606, 0.042768485844135284, 0.04656676575541496, 0.05036504566669464, 0.05416332930326462, 0.057961609214544296, 0.061759889125823975, 0.06555817276239395, 0.06935645639896393, 0.07315473258495331, 0.07695301622152328, 0.08075129240751266, 0.08454957604408264, 0.08834785223007202, 0.092146135866642, 0.09594441950321198, 0.09974269568920135, 0.10354097932577133, 0.10733926296234131, 0.11113753914833069, 0.11493582278490067, 0.11873410642147064, 0.12253238260746002, 0.1263306587934494, 0.13012894988059998, 0.13392722606658936]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 0.0, 5.0, 5.0, 2.0, 8.0, 10.0, 4.0, 12.0, 18.0, 13.0, 17.0, 16.0, 25.0, 20.0, 21.0, 37.0, 30.0, 34.0, 29.0, 36.0, 32.0, 26.0, 35.0, 43.0, 44.0, 35.0, 50.0, 38.0, 41.0, 28.0, 38.0, 36.0, 27.0, 27.0, 22.0, 20.0, 17.0, 10.0, 13.0, 22.0, 7.0, 11.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.0859375, -7.84228515625, -7.5986328125, -7.35498046875, -7.111328125, -6.86767578125, -6.6240234375, -6.38037109375, -6.13671875, -5.89306640625, -5.6494140625, -5.40576171875, -5.162109375, -4.91845703125, -4.6748046875, -4.43115234375, -4.1875, -3.94384765625, -3.7001953125, -3.45654296875, -3.212890625, -2.96923828125, -2.7255859375, -2.48193359375, -2.23828125, -1.99462890625, -1.7509765625, -1.50732421875, -1.263671875, -1.02001953125, -0.7763671875, -0.53271484375, -0.2890625, -0.04541015625, 0.1982421875, 0.44189453125, 0.685546875, 0.92919921875, 1.1728515625, 1.41650390625, 1.66015625, 1.90380859375, 2.1474609375, 2.39111328125, 2.634765625, 2.87841796875, 3.1220703125, 3.36572265625, 3.609375, 3.85302734375, 4.0966796875, 4.34033203125, 4.583984375, 4.82763671875, 5.0712890625, 5.31494140625, 5.55859375, 5.80224609375, 6.0458984375, 6.28955078125, 6.533203125, 6.77685546875, 7.0205078125, 7.26416015625, 7.5078125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 6.0, 6.0, 8.0, 7.0, 9.0, 20.0, 13.0, 14.0, 31.0, 39.0, 64.0, 64.0, 83.0, 154.0, 195.0, 291.0, 436.0, 668.0, 1123.0, 2031.0, 3906.0, 7701.0, 16175.0, 33540.0, 72871.0, 166343.0, 304833.0, 237051.0, 106971.0, 48055.0, 22647.0, 10813.0, 5470.0, 2790.0, 1569.0, 880.0, 543.0, 305.0, 241.0, 154.0, 112.0, 88.0, 58.0, 46.0, 23.0, 29.0, 21.0, 17.0, 15.0, 9.0, 8.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.71875, -8.425537109375, -8.13232421875, -7.839111328125, -7.5458984375, -7.252685546875, -6.95947265625, -6.666259765625, -6.373046875, -6.079833984375, -5.78662109375, -5.493408203125, -5.2001953125, -4.906982421875, -4.61376953125, -4.320556640625, -4.02734375, -3.734130859375, -3.44091796875, -3.147705078125, -2.8544921875, -2.561279296875, -2.26806640625, -1.974853515625, -1.681640625, -1.388427734375, -1.09521484375, -0.802001953125, -0.5087890625, -0.215576171875, 0.07763671875, 0.370849609375, 0.6640625, 0.957275390625, 1.25048828125, 1.543701171875, 1.8369140625, 2.130126953125, 2.42333984375, 2.716552734375, 3.009765625, 3.302978515625, 3.59619140625, 3.889404296875, 4.1826171875, 4.475830078125, 4.76904296875, 5.062255859375, 5.35546875, 5.648681640625, 5.94189453125, 6.235107421875, 6.5283203125, 6.821533203125, 7.11474609375, 7.407958984375, 7.701171875, 7.994384765625, 8.28759765625, 8.580810546875, 8.8740234375, 9.167236328125, 9.46044921875, 9.753662109375, 10.046875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 15.0, 23.0, 14.0, 22.0, 26.0, 20.0, 37.0, 37.0, 31.0, 45.0, 40.0, 57.0, 122.0, 232.0, 1415.0, 285.0, 132.0, 84.0, 52.0, 49.0, 33.0, 43.0, 34.0, 26.0, 22.0, 14.0, 23.0, 15.0, 19.0, 12.0, 11.0, 8.0, 7.0, 4.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.59375, -19.9443359375, -19.294921875, -18.6455078125, -17.99609375, -17.3466796875, -16.697265625, -16.0478515625, -15.3984375, -14.7490234375, -14.099609375, -13.4501953125, -12.80078125, -12.1513671875, -11.501953125, -10.8525390625, -10.203125, -9.5537109375, -8.904296875, -8.2548828125, -7.60546875, -6.9560546875, -6.306640625, -5.6572265625, -5.0078125, -4.3583984375, -3.708984375, -3.0595703125, -2.41015625, -1.7607421875, -1.111328125, -0.4619140625, 0.1875, 0.8369140625, 1.486328125, 2.1357421875, 2.78515625, 3.4345703125, 4.083984375, 4.7333984375, 5.3828125, 6.0322265625, 6.681640625, 7.3310546875, 7.98046875, 8.6298828125, 9.279296875, 9.9287109375, 10.578125, 11.2275390625, 11.876953125, 12.5263671875, 13.17578125, 13.8251953125, 14.474609375, 15.1240234375, 15.7734375, 16.4228515625, 17.072265625, 17.7216796875, 18.37109375, 19.0205078125, 19.669921875, 20.3193359375, 20.96875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 7.0, 3.0, 6.0, 12.0, 16.0, 17.0, 25.0, 28.0, 39.0, 65.0, 82.0, 136.0, 216.0, 340.0, 669.0, 1456.0, 68928.0, 3067941.0, 3553.0, 863.0, 486.0, 230.0, 149.0, 110.0, 83.0, 50.0, 38.0, 26.0, 24.0, 20.0, 16.0, 8.0, 13.0, 3.0, 9.0, 3.0, 1.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-97.75, -95.1259765625, -92.501953125, -89.8779296875, -87.25390625, -84.6298828125, -82.005859375, -79.3818359375, -76.7578125, -74.1337890625, -71.509765625, -68.8857421875, -66.26171875, -63.6376953125, -61.013671875, -58.3896484375, -55.765625, -53.1416015625, -50.517578125, -47.8935546875, -45.26953125, -42.6455078125, -40.021484375, -37.3974609375, -34.7734375, -32.1494140625, -29.525390625, -26.9013671875, -24.27734375, -21.6533203125, -19.029296875, -16.4052734375, -13.78125, -11.1572265625, -8.533203125, -5.9091796875, -3.28515625, -0.6611328125, 1.962890625, 4.5869140625, 7.2109375, 9.8349609375, 12.458984375, 15.0830078125, 17.70703125, 20.3310546875, 22.955078125, 25.5791015625, 28.203125, 30.8271484375, 33.451171875, 36.0751953125, 38.69921875, 41.3232421875, 43.947265625, 46.5712890625, 49.1953125, 51.8193359375, 54.443359375, 57.0673828125, 59.69140625, 62.3154296875, 64.939453125, 67.5634765625, 70.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 13.0, 34.0, 77.0, 181.0, 263.0, 234.0, 133.0, 50.0, 20.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3770751953125, -64.41552734375, -61.45398712158203, -58.4924430847168, -55.53089904785156, -52.56935501098633, -49.607810974121094, -46.646263122558594, -43.684722900390625, -40.72317886352539, -37.761634826660156, -34.80009078979492, -31.838546752929688, -28.877002716064453, -25.915456771850586, -22.95391273498535, -19.992366790771484, -17.03082275390625, -14.069278717041016, -11.107733726501465, -8.14618968963623, -5.184645652770996, -2.2231006622314453, 0.7384433746337891, 3.6999874114990234, 6.661531448364258, 9.623075485229492, 12.584620475769043, 15.546164512634277, 18.507709503173828, 21.469253540039062, 24.430797576904297, 27.39234161376953, 30.353885650634766, 33.3154296875, 36.276973724365234, 39.23851776123047, 42.2000617980957, 45.16160583496094, 48.12315368652344, 51.084693908691406, 54.04623794555664, 57.007781982421875, 59.96932601928711, 62.930870056152344, 65.89241790771484, 68.85395812988281, 71.81550598144531, 74.77705383300781, 77.73860168457031, 80.70014190673828, 83.66168975830078, 86.62322998046875, 89.58477783203125, 92.54631805419922, 95.50786590576172, 98.46940612792969, 101.43095397949219, 104.39249420166016, 107.35404205322266, 110.31558227539062, 113.27713012695312, 116.2386703491211, 119.2002182006836, 122.16175842285156]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 17.0, 11.0, 13.0, 16.0, 13.0, 13.0, 15.0, 20.0, 30.0, 24.0, 22.0, 27.0, 35.0, 33.0, 34.0, 33.0, 45.0, 34.0, 32.0, 38.0, 37.0, 35.0, 38.0, 36.0, 34.0, 36.0, 26.0, 26.0, 30.0, 27.0, 16.0, 28.0, 17.0, 18.0, 14.0, 12.0, 7.0, 7.0, 10.0, 4.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-49.549407958984375, -48.026283264160156, -46.50315856933594, -44.98003387451172, -43.4569091796875, -41.93378448486328, -40.41065979003906, -38.887535095214844, -37.364410400390625, -35.841285705566406, -34.31816101074219, -32.79503631591797, -31.27191162109375, -29.74878692626953, -28.225664138793945, -26.702539443969727, -25.17941665649414, -23.656291961669922, -22.133167266845703, -20.610042572021484, -19.086917877197266, -17.563793182373047, -16.04067039489746, -14.517545700073242, -12.994421005249023, -11.471296310424805, -9.948171615600586, -8.425047874450684, -6.901923179626465, -5.378798484802246, -3.8556747436523438, -2.332550048828125, -0.8094215393066406, 0.713702917098999, 2.2368273735046387, 3.759951591491699, 5.283076286315918, 6.806200981140137, 8.329324722290039, 9.852449417114258, 11.375574111938477, 12.898698806762695, 14.421823501586914, 15.944947242736816, 17.46807098388672, 18.991195678710938, 20.514320373535156, 22.037445068359375, 23.560569763183594, 25.083694458007812, 26.60681915283203, 28.12994384765625, 29.65306854248047, 31.176193237304688, 32.699317932128906, 34.222442626953125, 35.745567321777344, 37.26869201660156, 38.79181671142578, 40.31494140625, 41.83806610107422, 43.36119079589844, 44.884315490722656, 46.407440185546875, 47.93056106567383]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 5.0, 15.0, 16.0, 24.0, 12.0, 20.0, 29.0, 27.0, 33.0, 27.0, 30.0, 25.0, 36.0, 33.0, 36.0, 40.0, 27.0, 37.0, 45.0, 41.0, 42.0, 36.0, 41.0, 40.0, 37.0, 26.0, 30.0, 22.0, 14.0, 22.0, 18.0, 13.0, 9.0, 14.0, 9.0, 7.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.850341796875, -7.59912109375, -7.347900390625, -7.0966796875, -6.845458984375, -6.59423828125, -6.343017578125, -6.091796875, -5.840576171875, -5.58935546875, -5.338134765625, -5.0869140625, -4.835693359375, -4.58447265625, -4.333251953125, -4.08203125, -3.830810546875, -3.57958984375, -3.328369140625, -3.0771484375, -2.825927734375, -2.57470703125, -2.323486328125, -2.072265625, -1.821044921875, -1.56982421875, -1.318603515625, -1.0673828125, -0.816162109375, -0.56494140625, -0.313720703125, -0.0625, 0.188720703125, 0.43994140625, 0.691162109375, 0.9423828125, 1.193603515625, 1.44482421875, 1.696044921875, 1.947265625, 2.198486328125, 2.44970703125, 2.700927734375, 2.9521484375, 3.203369140625, 3.45458984375, 3.705810546875, 3.95703125, 4.208251953125, 4.45947265625, 4.710693359375, 4.9619140625, 5.213134765625, 5.46435546875, 5.715576171875, 5.966796875, 6.218017578125, 6.46923828125, 6.720458984375, 6.9716796875, 7.222900390625, 7.47412109375, 7.725341796875, 7.9765625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 15.0, 19.0, 32.0, 52.0, 61.0, 103.0, 188.0, 295.0, 485.0, 984.0, 1946.0, 4491.0, 11308.0, 37140.0, 159790.0, 676333.0, 1828106.0, 1087235.0, 291561.0, 64620.0, 17551.0, 6337.0, 2691.0, 1323.0, 641.0, 377.0, 208.0, 138.0, 84.0, 64.0, 41.0, 19.0, 17.0, 4.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.057373046875, -10.68505859375, -10.312744140625, -9.9404296875, -9.568115234375, -9.19580078125, -8.823486328125, -8.451171875, -8.078857421875, -7.70654296875, -7.334228515625, -6.9619140625, -6.589599609375, -6.21728515625, -5.844970703125, -5.47265625, -5.100341796875, -4.72802734375, -4.355712890625, -3.9833984375, -3.611083984375, -3.23876953125, -2.866455078125, -2.494140625, -2.121826171875, -1.74951171875, -1.377197265625, -1.0048828125, -0.632568359375, -0.26025390625, 0.112060546875, 0.484375, 0.856689453125, 1.22900390625, 1.601318359375, 1.9736328125, 2.345947265625, 2.71826171875, 3.090576171875, 3.462890625, 3.835205078125, 4.20751953125, 4.579833984375, 4.9521484375, 5.324462890625, 5.69677734375, 6.069091796875, 6.44140625, 6.813720703125, 7.18603515625, 7.558349609375, 7.9306640625, 8.302978515625, 8.67529296875, 9.047607421875, 9.419921875, 9.792236328125, 10.16455078125, 10.536865234375, 10.9091796875, 11.281494140625, 11.65380859375, 12.026123046875, 12.3984375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 11.0, 19.0, 31.0, 41.0, 65.0, 84.0, 144.0, 183.0, 236.0, 341.0, 497.0, 662.0, 555.0, 352.0, 247.0, 187.0, 114.0, 105.0, 56.0, 51.0, 32.0, 16.0, 10.0, 15.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.234375, -21.6998291015625, -21.165283203125, -20.6307373046875, -20.09619140625, -19.5616455078125, -19.027099609375, -18.4925537109375, -17.9580078125, -17.4234619140625, -16.888916015625, -16.3543701171875, -15.81982421875, -15.2852783203125, -14.750732421875, -14.2161865234375, -13.681640625, -13.1470947265625, -12.612548828125, -12.0780029296875, -11.54345703125, -11.0089111328125, -10.474365234375, -9.9398193359375, -9.4052734375, -8.8707275390625, -8.336181640625, -7.8016357421875, -7.26708984375, -6.7325439453125, -6.197998046875, -5.6634521484375, -5.12890625, -4.5943603515625, -4.059814453125, -3.5252685546875, -2.99072265625, -2.4561767578125, -1.921630859375, -1.3870849609375, -0.8525390625, -0.3179931640625, 0.216552734375, 0.7510986328125, 1.28564453125, 1.8201904296875, 2.354736328125, 2.8892822265625, 3.423828125, 3.9583740234375, 4.492919921875, 5.0274658203125, 5.56201171875, 6.0965576171875, 6.631103515625, 7.1656494140625, 7.7001953125, 8.2347412109375, 8.769287109375, 9.3038330078125, 9.83837890625, 10.3729248046875, 10.907470703125, 11.4420166015625, 11.9765625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 10.0, 17.0, 30.0, 50.0, 95.0, 201.0, 402.0, 896.0, 2743.0, 16656.0, 381694.0, 3481768.0, 291691.0, 13852.0, 2503.0, 875.0, 384.0, 177.0, 120.0, 52.0, 28.0, 19.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.515625, -30.513916015625, -29.51220703125, -28.510498046875, -27.5087890625, -26.507080078125, -25.50537109375, -24.503662109375, -23.501953125, -22.500244140625, -21.49853515625, -20.496826171875, -19.4951171875, -18.493408203125, -17.49169921875, -16.489990234375, -15.48828125, -14.486572265625, -13.48486328125, -12.483154296875, -11.4814453125, -10.479736328125, -9.47802734375, -8.476318359375, -7.474609375, -6.472900390625, -5.47119140625, -4.469482421875, -3.4677734375, -2.466064453125, -1.46435546875, -0.462646484375, 0.5390625, 1.540771484375, 2.54248046875, 3.544189453125, 4.5458984375, 5.547607421875, 6.54931640625, 7.551025390625, 8.552734375, 9.554443359375, 10.55615234375, 11.557861328125, 12.5595703125, 13.561279296875, 14.56298828125, 15.564697265625, 16.56640625, 17.568115234375, 18.56982421875, 19.571533203125, 20.5732421875, 21.574951171875, 22.57666015625, 23.578369140625, 24.580078125, 25.581787109375, 26.58349609375, 27.585205078125, 28.5869140625, 29.588623046875, 30.59033203125, 31.592041015625, 32.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 31.0, 666.0, 318.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-622.9430541992188, -608.049560546875, -593.156005859375, -578.2625122070312, -563.3689575195312, -548.4754638671875, -533.5819091796875, -518.6884155273438, -503.7948913574219, -488.9013671875, -474.0078430175781, -459.11431884765625, -444.2208251953125, -429.3273010253906, -414.43377685546875, -399.5402526855469, -384.646728515625, -369.7532043457031, -354.85968017578125, -339.9661865234375, -325.0726623535156, -310.17913818359375, -295.2856140136719, -280.39208984375, -265.49859619140625, -250.60507202148438, -235.71156311035156, -220.8180389404297, -205.9245147705078, -191.031005859375, -176.13748168945312, -161.24395751953125, -146.35043334960938, -131.4569091796875, -116.56339263916016, -101.66987609863281, -86.77635192871094, -71.8828353881836, -56.98931884765625, -42.095794677734375, -27.20227813720703, -12.308758735656738, 2.5847606658935547, 17.47827911376953, 32.37179946899414, 47.26531982421875, 62.158836364746094, 77.05236053466797, 91.94587707519531, 106.83939361572266, 121.73291778564453, 136.62643432617188, 151.51995849609375, 166.41348266601562, 181.30699157714844, 196.2005157470703, 211.09402465820312, 225.987548828125, 240.8810577392578, 255.7745819091797, 270.6680908203125, 285.5616149902344, 300.45513916015625, 315.3486633300781, 330.2421875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 12.0, 2.0, 5.0, 9.0, 5.0, 9.0, 14.0, 15.0, 13.0, 20.0, 26.0, 26.0, 30.0, 39.0, 20.0, 30.0, 51.0, 37.0, 31.0, 40.0, 36.0, 48.0, 39.0, 54.0, 49.0, 49.0, 46.0, 25.0, 28.0, 29.0, 22.0, 26.0, 18.0, 24.0, 18.0, 10.0, 16.0, 15.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.45050048828125, -47.84785461425781, -46.24520492553711, -44.64255905151367, -43.039913177490234, -41.43726348876953, -39.834617614746094, -38.231971740722656, -36.62932586669922, -35.02667999267578, -33.42403030395508, -31.82138442993164, -30.218738555908203, -28.616090774536133, -27.013442993164062, -25.410797119140625, -23.808147430419922, -22.20549964904785, -20.602853775024414, -19.000205993652344, -17.397560119628906, -15.794912338256836, -14.192264556884766, -12.589617729187012, -10.986970901489258, -9.384324073791504, -7.781676769256592, -6.17902946472168, -4.576382637023926, -2.973735809326172, -1.3710880279541016, 0.23155879974365234, 1.8342056274414062, 3.4368526935577393, 5.039499759674072, 6.642147064208984, 8.244793891906738, 9.847440719604492, 11.450088500976562, 13.052735328674316, 14.65538215637207, 16.25802993774414, 17.860675811767578, 19.46332359313965, 21.06597137451172, 22.668617248535156, 24.271265029907227, 25.873912811279297, 27.476558685302734, 29.079206466674805, 30.681852340698242, 32.28450012207031, 33.88714599609375, 35.48979187011719, 37.09244155883789, 38.69508743286133, 40.29773712158203, 41.90038299560547, 43.50303268432617, 45.10567855834961, 46.70832443237305, 48.31097412109375, 49.91361999511719, 51.516265869140625, 53.11891174316406]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 12.0, 8.0, 10.0, 18.0, 12.0, 17.0, 28.0, 29.0, 30.0, 26.0, 33.0, 32.0, 41.0, 43.0, 44.0, 45.0, 45.0, 40.0, 47.0, 43.0, 29.0, 36.0, 38.0, 37.0, 32.0, 32.0, 25.0, 27.0, 21.0, 17.0, 17.0, 12.0, 13.0, 14.0, 6.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08203125, -6.85565185546875, -6.6292724609375, -6.40289306640625, -6.176513671875, -5.95013427734375, -5.7237548828125, -5.49737548828125, -5.27099609375, -5.04461669921875, -4.8182373046875, -4.59185791015625, -4.365478515625, -4.13909912109375, -3.9127197265625, -3.68634033203125, -3.4599609375, -3.23358154296875, -3.0072021484375, -2.78082275390625, -2.554443359375, -2.32806396484375, -2.1016845703125, -1.87530517578125, -1.64892578125, -1.42254638671875, -1.1961669921875, -0.96978759765625, -0.743408203125, -0.51702880859375, -0.2906494140625, -0.06427001953125, 0.162109375, 0.38848876953125, 0.6148681640625, 0.84124755859375, 1.067626953125, 1.29400634765625, 1.5203857421875, 1.74676513671875, 1.97314453125, 2.19952392578125, 2.4259033203125, 2.65228271484375, 2.878662109375, 3.10504150390625, 3.3314208984375, 3.55780029296875, 3.7841796875, 4.01055908203125, 4.2369384765625, 4.46331787109375, 4.689697265625, 4.91607666015625, 5.1424560546875, 5.36883544921875, 5.59521484375, 5.82159423828125, 6.0479736328125, 6.27435302734375, 6.500732421875, 6.72711181640625, 6.9534912109375, 7.17987060546875, 7.40625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 5.0, 13.0, 17.0, 33.0, 43.0, 44.0, 97.0, 115.0, 195.0, 250.0, 423.0, 614.0, 846.0, 1255.0, 1936.0, 2754.0, 4098.0, 5780.0, 8403.0, 12007.0, 17512.0, 24555.0, 34763.0, 47822.0, 64428.0, 82710.0, 99946.0, 112018.0, 112555.0, 100178.0, 83068.0, 64849.0, 48298.0, 34875.0, 24975.0, 17533.0, 12391.0, 8522.0, 5891.0, 4001.0, 2734.0, 1943.0, 1289.0, 867.0, 618.0, 393.0, 289.0, 197.0, 135.0, 114.0, 53.0, 36.0, 33.0, 15.0, 13.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.424072265625, -0.409942626953125, -0.39581298828125, -0.381683349609375, -0.3675537109375, -0.353424072265625, -0.33929443359375, -0.325164794921875, -0.31103515625, -0.296905517578125, -0.28277587890625, -0.268646240234375, -0.2545166015625, -0.240386962890625, -0.22625732421875, -0.212127685546875, -0.197998046875, -0.183868408203125, -0.16973876953125, -0.155609130859375, -0.1414794921875, -0.127349853515625, -0.11322021484375, -0.099090576171875, -0.0849609375, -0.070831298828125, -0.05670166015625, -0.042572021484375, -0.0284423828125, -0.014312744140625, -0.00018310546875, 0.013946533203125, 0.028076171875, 0.042205810546875, 0.05633544921875, 0.070465087890625, 0.0845947265625, 0.098724365234375, 0.11285400390625, 0.126983642578125, 0.14111328125, 0.155242919921875, 0.16937255859375, 0.183502197265625, 0.1976318359375, 0.211761474609375, 0.22589111328125, 0.240020751953125, 0.254150390625, 0.268280029296875, 0.28240966796875, 0.296539306640625, 0.3106689453125, 0.324798583984375, 0.33892822265625, 0.353057861328125, 0.3671875, 0.381317138671875, 0.39544677734375, 0.409576416015625, 0.4237060546875, 0.437835693359375, 0.45196533203125, 0.466094970703125, 0.480224609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 6.0, 10.0, 4.0, 13.0, 13.0, 21.0, 19.0, 18.0, 20.0, 28.0, 26.0, 29.0, 27.0, 40.0, 23.0, 36.0, 54.0, 44.0, 42.0, 1053.0, 40.0, 46.0, 34.0, 47.0, 38.0, 26.0, 33.0, 33.0, 23.0, 30.0, 25.0, 19.0, 18.0, 17.0, 16.0, 8.0, 14.0, 9.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.12420654296875, -4.9671630859375, -4.81011962890625, -4.653076171875, -4.49603271484375, -4.3389892578125, -4.18194580078125, -4.02490234375, -3.86785888671875, -3.7108154296875, -3.55377197265625, -3.396728515625, -3.23968505859375, -3.0826416015625, -2.92559814453125, -2.7685546875, -2.61151123046875, -2.4544677734375, -2.29742431640625, -2.140380859375, -1.98333740234375, -1.8262939453125, -1.66925048828125, -1.51220703125, -1.35516357421875, -1.1981201171875, -1.04107666015625, -0.884033203125, -0.72698974609375, -0.5699462890625, -0.41290283203125, -0.255859375, -0.09881591796875, 0.0582275390625, 0.21527099609375, 0.372314453125, 0.52935791015625, 0.6864013671875, 0.84344482421875, 1.00048828125, 1.15753173828125, 1.3145751953125, 1.47161865234375, 1.628662109375, 1.78570556640625, 1.9427490234375, 2.09979248046875, 2.2568359375, 2.41387939453125, 2.5709228515625, 2.72796630859375, 2.885009765625, 3.04205322265625, 3.1990966796875, 3.35614013671875, 3.51318359375, 3.67022705078125, 3.8272705078125, 3.98431396484375, 4.141357421875, 4.29840087890625, 4.4554443359375, 4.61248779296875, 4.76953125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 8.0, 7.0, 23.0, 27.0, 58.0, 85.0, 106.0, 185.0, 273.0, 394.0, 597.0, 920.0, 1473.0, 2177.0, 3313.0, 5010.0, 7422.0, 11399.0, 17164.0, 25363.0, 36690.0, 52175.0, 71257.0, 93080.0, 113236.0, 1146335.0, 140063.0, 100561.0, 78796.0, 58935.0, 41838.0, 29102.0, 19841.0, 13346.0, 8796.0, 5882.0, 3887.0, 2506.0, 1627.0, 1027.0, 700.0, 490.0, 348.0, 210.0, 131.0, 106.0, 64.0, 48.0, 19.0, 16.0, 5.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.32861328125, -0.3182411193847656, -0.30786895751953125, -0.2974967956542969, -0.2871246337890625, -0.2767524719238281, -0.26638031005859375, -0.2560081481933594, -0.245635986328125, -0.23526382446289062, -0.22489166259765625, -0.21451950073242188, -0.2041473388671875, -0.19377517700195312, -0.18340301513671875, -0.17303085327148438, -0.16265869140625, -0.15228652954101562, -0.14191436767578125, -0.13154220581054688, -0.1211700439453125, -0.11079788208007812, -0.10042572021484375, -0.09005355834960938, -0.079681396484375, -0.06930923461914062, -0.05893707275390625, -0.048564910888671875, -0.0381927490234375, -0.027820587158203125, -0.01744842529296875, -0.007076263427734375, 0.0032958984375, 0.013668060302734375, 0.02404022216796875, 0.034412384033203125, 0.0447845458984375, 0.055156707763671875, 0.06552886962890625, 0.07590103149414062, 0.086273193359375, 0.09664535522460938, 0.10701751708984375, 0.11738967895507812, 0.1277618408203125, 0.13813400268554688, 0.14850616455078125, 0.15887832641601562, 0.16925048828125, 0.17962265014648438, 0.18999481201171875, 0.20036697387695312, 0.2107391357421875, 0.22111129760742188, 0.23148345947265625, 0.24185562133789062, 0.252227783203125, 0.2625999450683594, 0.27297210693359375, 0.2833442687988281, 0.2937164306640625, 0.3040885925292969, 0.31446075439453125, 0.3248329162597656, 0.335205078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 5.0, 2.0, 11.0, 6.0, 5.0, 6.0, 11.0, 8.0, 10.0, 15.0, 29.0, 28.0, 46.0, 53.0, 54.0, 80.0, 68.0, 68.0, 61.0, 71.0, 58.0, 68.0, 37.0, 43.0, 25.0, 30.0, 13.0, 11.0, 10.0, 8.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01318359375, -0.012781262397766113, -0.012378931045532227, -0.01197659969329834, -0.011574268341064453, -0.011171936988830566, -0.01076960563659668, -0.010367274284362793, -0.009964942932128906, -0.00956261157989502, -0.009160280227661133, -0.008757948875427246, -0.00835561752319336, -0.007953286170959473, -0.007550954818725586, -0.007148623466491699, -0.0067462921142578125, -0.006343960762023926, -0.005941629409790039, -0.005539298057556152, -0.005136966705322266, -0.004734635353088379, -0.004332304000854492, -0.0039299726486206055, -0.0035276412963867188, -0.003125309944152832, -0.0027229785919189453, -0.0023206472396850586, -0.0019183158874511719, -0.0015159845352172852, -0.0011136531829833984, -0.0007113218307495117, -0.000308990478515625, 9.334087371826172e-05, 0.0004956722259521484, 0.0008980035781860352, 0.0013003349304199219, 0.0017026662826538086, 0.0021049976348876953, 0.002507328987121582, 0.0029096603393554688, 0.0033119916915893555, 0.003714323043823242, 0.004116654396057129, 0.004518985748291016, 0.004921317100524902, 0.005323648452758789, 0.005725979804992676, 0.0061283111572265625, 0.006530642509460449, 0.006932973861694336, 0.007335305213928223, 0.007737636566162109, 0.008139967918395996, 0.008542299270629883, 0.00894463062286377, 0.009346961975097656, 0.009749293327331543, 0.01015162467956543, 0.010553956031799316, 0.010956287384033203, 0.01135861873626709, 0.011760950088500977, 0.012163281440734863, 0.01256561279296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 8.0, 7.0, 5.0, 11.0, 9.0, 12.0, 17.0, 15.0, 20.0, 24.0, 29.0, 51.0, 65.0, 111.0, 150.0, 216.0, 393.0, 801.0, 5233.0, 1013914.0, 25099.0, 1059.0, 435.0, 247.0, 164.0, 101.0, 81.0, 52.0, 46.0, 27.0, 24.0, 19.0, 17.0, 16.0, 10.0, 11.0, 10.0, 6.0, 4.0, 11.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.2412700653076172, -0.23339462280273438, -0.22551918029785156, -0.21764373779296875, -0.20976829528808594, -0.20189285278320312, -0.1940174102783203, -0.1861419677734375, -0.1782665252685547, -0.17039108276367188, -0.16251564025878906, -0.15464019775390625, -0.14676475524902344, -0.13888931274414062, -0.1310138702392578, -0.123138427734375, -0.11526298522949219, -0.10738754272460938, -0.09951210021972656, -0.09163665771484375, -0.08376121520996094, -0.07588577270507812, -0.06801033020019531, -0.0601348876953125, -0.05225944519042969, -0.044384002685546875, -0.03650856018066406, -0.02863311767578125, -0.020757675170898438, -0.012882232666015625, -0.0050067901611328125, 0.00286865234375, 0.010744094848632812, 0.018619537353515625, 0.026494979858398438, 0.03437042236328125, 0.04224586486816406, 0.050121307373046875, 0.05799674987792969, 0.0658721923828125, 0.07374763488769531, 0.08162307739257812, 0.08949851989746094, 0.09737396240234375, 0.10524940490722656, 0.11312484741210938, 0.12100028991699219, 0.128875732421875, 0.1367511749267578, 0.14462661743164062, 0.15250205993652344, 0.16037750244140625, 0.16825294494628906, 0.17612838745117188, 0.1840038299560547, 0.1918792724609375, 0.1997547149658203, 0.20763015747070312, 0.21550559997558594, 0.22338104248046875, 0.23125648498535156, 0.23913192749023438, 0.2470073699951172, 0.2548828125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 37.0, 756.0, 208.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3463728427886963, -0.33992746472358704, -0.3334820866584778, -0.3270367383956909, -0.32059136033058167, -0.3141459822654724, -0.30770063400268555, -0.3012552559375763, -0.29480987787246704, -0.2883644998073578, -0.28191912174224854, -0.27547377347946167, -0.2690283954143524, -0.26258301734924316, -0.2561376690864563, -0.24969229102134705, -0.2432469129562378, -0.23680153489112854, -0.23035617172718048, -0.22391080856323242, -0.21746543049812317, -0.21102005243301392, -0.20457468926906586, -0.1981293261051178, -0.19168394804000854, -0.1852385699748993, -0.17879320681095123, -0.17234784364700317, -0.16590246558189392, -0.15945708751678467, -0.1530117243528366, -0.14656636118888855, -0.1401209682226181, -0.13367560505867004, -0.1272302269935608, -0.12078485637903214, -0.11433948576450348, -0.10789411514997482, -0.10144874453544617, -0.09500337392091751, -0.08855800330638885, -0.0821126326918602, -0.07566726207733154, -0.06922189146280289, -0.06277652084827423, -0.056331150233745575, -0.04988577961921692, -0.04344040900468826, -0.03699503839015961, -0.03054966777563095, -0.024104297161102295, -0.01765892654657364, -0.011213555932044983, -0.004768185317516327, 0.001677185297012329, 0.008122555911540985, 0.014567926526069641, 0.021013297140598297, 0.027458667755126953, 0.03390403836965561, 0.040349408984184265, 0.04679477959871292, 0.05324015021324158, 0.05968552082777023, 0.06613089144229889]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 7.0, 3.0, 12.0, 10.0, 7.0, 7.0, 9.0, 20.0, 23.0, 22.0, 25.0, 24.0, 35.0, 41.0, 26.0, 45.0, 43.0, 48.0, 38.0, 37.0, 47.0, 41.0, 33.0, 43.0, 39.0, 27.0, 42.0, 32.0, 30.0, 23.0, 21.0, 28.0, 21.0, 21.0, 11.0, 11.0, 11.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01814413070678711, -0.017520586028695107, -0.016897041350603104, -0.0162734966725111, -0.015649951994419098, -0.015026407316327095, -0.014402862638235092, -0.01377931796014309, -0.013155773282051086, -0.012532228603959084, -0.01190868392586708, -0.011285139247775078, -0.010661594569683075, -0.010038049891591072, -0.00941450521349907, -0.008790960535407066, -0.008167415857315063, -0.007543871179223061, -0.006920326501131058, -0.006296781823039055, -0.005673237144947052, -0.005049692466855049, -0.004426147788763046, -0.0038026031106710434, -0.0031790584325790405, -0.0025555137544870377, -0.0019319690763950348, -0.001308424398303032, -0.000684879720211029, -6.133504211902618e-05, 0.0005622096359729767, 0.0011857543140649796, 0.0018092989921569824, 0.0024328436702489853, 0.003056388348340988, 0.003679933026432991, 0.004303477704524994, 0.004927022382616997, 0.005550567060709, 0.0061741117388010025, 0.006797656416893005, 0.007421201094985008, 0.008044745773077011, 0.008668290451169014, 0.009291835129261017, 0.00991537980735302, 0.010538924485445023, 0.011162469163537025, 0.011786013841629028, 0.012409558519721031, 0.013033103197813034, 0.013656647875905037, 0.01428019255399704, 0.014903737232089043, 0.015527281910181046, 0.01615082658827305, 0.01677437126636505, 0.017397915944457054, 0.018021460622549057, 0.01864500530064106, 0.019268549978733063, 0.019892094656825066, 0.02051563933491707, 0.02113918401300907, 0.021762728691101074]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 17.0, 10.0, 14.0, 13.0, 15.0, 18.0, 25.0, 24.0, 27.0, 23.0, 29.0, 26.0, 41.0, 33.0, 39.0, 37.0, 43.0, 43.0, 38.0, 45.0, 49.0, 45.0, 25.0, 38.0, 32.0, 33.0, 40.0, 19.0, 27.0, 20.0, 14.0, 14.0, 12.0, 11.0, 7.0, 13.0, 6.0, 2.0, 2.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.46673583984375, -6.2420654296875, -6.01739501953125, -5.792724609375, -5.56805419921875, -5.3433837890625, -5.11871337890625, -4.89404296875, -4.66937255859375, -4.4447021484375, -4.22003173828125, -3.995361328125, -3.77069091796875, -3.5460205078125, -3.32135009765625, -3.0966796875, -2.87200927734375, -2.6473388671875, -2.42266845703125, -2.197998046875, -1.97332763671875, -1.7486572265625, -1.52398681640625, -1.29931640625, -1.07464599609375, -0.8499755859375, -0.62530517578125, -0.400634765625, -0.17596435546875, 0.0487060546875, 0.27337646484375, 0.498046875, 0.72271728515625, 0.9473876953125, 1.17205810546875, 1.396728515625, 1.62139892578125, 1.8460693359375, 2.07073974609375, 2.29541015625, 2.52008056640625, 2.7447509765625, 2.96942138671875, 3.194091796875, 3.41876220703125, 3.6434326171875, 3.86810302734375, 4.0927734375, 4.31744384765625, 4.5421142578125, 4.76678466796875, 4.991455078125, 5.21612548828125, 5.4407958984375, 5.66546630859375, 5.89013671875, 6.11480712890625, 6.3394775390625, 6.56414794921875, 6.788818359375, 7.01348876953125, 7.2381591796875, 7.46282958984375, 7.6875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 14.0, 14.0, 30.0, 30.0, 33.0, 46.0, 60.0, 79.0, 141.0, 152.0, 188.0, 273.0, 375.0, 497.0, 755.0, 1152.0, 1869.0, 3647.0, 8688.0, 24380.0, 76604.0, 282867.0, 451762.0, 130268.0, 38872.0, 13437.0, 5244.0, 2529.0, 1323.0, 895.0, 622.0, 415.0, 313.0, 249.0, 178.0, 130.0, 113.0, 68.0, 47.0, 47.0, 42.0, 26.0, 16.0, 13.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-11.6328125, -11.2825927734375, -10.932373046875, -10.5821533203125, -10.23193359375, -9.8817138671875, -9.531494140625, -9.1812744140625, -8.8310546875, -8.4808349609375, -8.130615234375, -7.7803955078125, -7.43017578125, -7.0799560546875, -6.729736328125, -6.3795166015625, -6.029296875, -5.6790771484375, -5.328857421875, -4.9786376953125, -4.62841796875, -4.2781982421875, -3.927978515625, -3.5777587890625, -3.2275390625, -2.8773193359375, -2.527099609375, -2.1768798828125, -1.82666015625, -1.4764404296875, -1.126220703125, -0.7760009765625, -0.42578125, -0.0755615234375, 0.274658203125, 0.6248779296875, 0.97509765625, 1.3253173828125, 1.675537109375, 2.0257568359375, 2.3759765625, 2.7261962890625, 3.076416015625, 3.4266357421875, 3.77685546875, 4.1270751953125, 4.477294921875, 4.8275146484375, 5.177734375, 5.5279541015625, 5.878173828125, 6.2283935546875, 6.57861328125, 6.9288330078125, 7.279052734375, 7.6292724609375, 7.9794921875, 8.3297119140625, 8.679931640625, 9.0301513671875, 9.38037109375, 9.7305908203125, 10.080810546875, 10.4310302734375, 10.78125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 9.0, 10.0, 5.0, 8.0, 14.0, 18.0, 19.0, 18.0, 16.0, 11.0, 26.0, 30.0, 53.0, 38.0, 53.0, 69.0, 102.0, 228.0, 1449.0, 256.0, 158.0, 81.0, 49.0, 38.0, 37.0, 42.0, 31.0, 27.0, 20.0, 23.0, 24.0, 20.0, 11.0, 4.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-18.953125, -18.4207763671875, -17.888427734375, -17.3560791015625, -16.82373046875, -16.2913818359375, -15.759033203125, -15.2266845703125, -14.6943359375, -14.1619873046875, -13.629638671875, -13.0972900390625, -12.56494140625, -12.0325927734375, -11.500244140625, -10.9678955078125, -10.435546875, -9.9031982421875, -9.370849609375, -8.8385009765625, -8.30615234375, -7.7738037109375, -7.241455078125, -6.7091064453125, -6.1767578125, -5.6444091796875, -5.112060546875, -4.5797119140625, -4.04736328125, -3.5150146484375, -2.982666015625, -2.4503173828125, -1.91796875, -1.3856201171875, -0.853271484375, -0.3209228515625, 0.21142578125, 0.7437744140625, 1.276123046875, 1.8084716796875, 2.3408203125, 2.8731689453125, 3.405517578125, 3.9378662109375, 4.47021484375, 5.0025634765625, 5.534912109375, 6.0672607421875, 6.599609375, 7.1319580078125, 7.664306640625, 8.1966552734375, 8.72900390625, 9.2613525390625, 9.793701171875, 10.3260498046875, 10.8583984375, 11.3907470703125, 11.923095703125, 12.4554443359375, 12.98779296875, 13.5201416015625, 14.052490234375, 14.5848388671875, 15.1171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 13.0, 4.0, 7.0, 16.0, 19.0, 24.0, 34.0, 33.0, 36.0, 57.0, 90.0, 134.0, 156.0, 281.0, 424.0, 775.0, 1920.0, 48949.0, 3081654.0, 7936.0, 1342.0, 582.0, 358.0, 233.0, 168.0, 113.0, 72.0, 53.0, 49.0, 35.0, 17.0, 24.0, 9.0, 10.0, 6.0, 5.0, 14.0, 11.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-51.5625, -49.9677734375, -48.373046875, -46.7783203125, -45.18359375, -43.5888671875, -41.994140625, -40.3994140625, -38.8046875, -37.2099609375, -35.615234375, -34.0205078125, -32.42578125, -30.8310546875, -29.236328125, -27.6416015625, -26.046875, -24.4521484375, -22.857421875, -21.2626953125, -19.66796875, -18.0732421875, -16.478515625, -14.8837890625, -13.2890625, -11.6943359375, -10.099609375, -8.5048828125, -6.91015625, -5.3154296875, -3.720703125, -2.1259765625, -0.53125, 1.0634765625, 2.658203125, 4.2529296875, 5.84765625, 7.4423828125, 9.037109375, 10.6318359375, 12.2265625, 13.8212890625, 15.416015625, 17.0107421875, 18.60546875, 20.2001953125, 21.794921875, 23.3896484375, 24.984375, 26.5791015625, 28.173828125, 29.7685546875, 31.36328125, 32.9580078125, 34.552734375, 36.1474609375, 37.7421875, 39.3369140625, 40.931640625, 42.5263671875, 44.12109375, 45.7158203125, 47.310546875, 48.9052734375, 50.5]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 32.0, 201.0, 468.0, 265.0, 37.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.81341552734375, -227.34735107421875, -221.88128662109375, -216.41522216796875, -210.94915771484375, -205.48309326171875, -200.01702880859375, -194.5509490966797, -189.0848846435547, -183.6188201904297, -178.1527557373047, -172.6866912841797, -167.2206268310547, -161.75454711914062, -156.28848266601562, -150.82241821289062, -145.35635375976562, -139.89028930664062, -134.42422485351562, -128.95816040039062, -123.4920883178711, -118.0260238647461, -112.5599594116211, -107.09388732910156, -101.62783813476562, -96.16177368164062, -90.69570922851562, -85.22964477539062, -79.7635726928711, -74.2975082397461, -68.8314437866211, -63.36537551879883, -57.899314880371094, -52.433250427246094, -46.96718215942383, -41.50111770629883, -36.03504943847656, -30.568984985351562, -25.102920532226562, -19.636852264404297, -14.170787811279297, -8.704721450805664, -3.2386560440063477, 2.2274093627929688, 7.693475723266602, 13.159542083740234, 18.625606536865234, 24.0916748046875, 29.5577392578125, 35.0238037109375, 40.489871978759766, 45.955936431884766, 51.42200469970703, 56.88806915283203, 62.35413360595703, 67.82020568847656, 73.28627014160156, 78.75233459472656, 84.21839904785156, 89.68446350097656, 95.1505355834961, 100.6166000366211, 106.0826644897461, 111.54873657226562, 117.0147933959961]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 13.0, 6.0, 11.0, 9.0, 11.0, 12.0, 16.0, 24.0, 27.0, 24.0, 25.0, 38.0, 33.0, 38.0, 29.0, 55.0, 39.0, 40.0, 42.0, 38.0, 43.0, 35.0, 42.0, 49.0, 30.0, 33.0, 25.0, 22.0, 26.0, 25.0, 21.0, 19.0, 15.0, 12.0, 9.0, 14.0, 10.0, 10.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.91911315917969, -45.438594818115234, -43.95808029174805, -42.477561950683594, -40.997047424316406, -39.51652908325195, -38.036014556884766, -36.55549621582031, -35.074981689453125, -33.59446334838867, -32.113948822021484, -30.633432388305664, -29.152915954589844, -27.672399520874023, -26.191883087158203, -24.71136474609375, -23.23084831237793, -21.75033187866211, -20.26981544494629, -18.78929901123047, -17.30878257751465, -15.828266143798828, -14.347748756408691, -12.867232322692871, -11.38671588897705, -9.90619945526123, -8.42568302154541, -6.945166110992432, -5.464649677276611, -3.984133243560791, -2.5036163330078125, -1.0230998992919922, 0.4574165344238281, 1.937933087348938, 3.418449640274048, 4.898966312408447, 6.379482746124268, 7.859999179840088, 9.340516090393066, 10.821032524108887, 12.301548957824707, 13.782065391540527, 15.262581825256348, 16.743099212646484, 18.223615646362305, 19.704132080078125, 21.184648513793945, 22.665164947509766, 24.145681381225586, 25.626197814941406, 27.106714248657227, 28.587230682373047, 30.067747116088867, 31.548263549804688, 33.02878189086914, 34.50929641723633, 35.98981475830078, 37.470333099365234, 38.95084762573242, 40.431365966796875, 41.91188049316406, 43.392398834228516, 44.8729133605957, 46.353431701660156, 47.833946228027344]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 6.0, 7.0, 10.0, 11.0, 12.0, 23.0, 23.0, 24.0, 25.0, 14.0, 20.0, 32.0, 28.0, 24.0, 28.0, 38.0, 49.0, 35.0, 27.0, 32.0, 39.0, 44.0, 31.0, 46.0, 43.0, 29.0, 38.0, 40.0, 34.0, 32.0, 22.0, 12.0, 14.0, 14.0, 11.0, 16.0, 10.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.0, -6.78704833984375, -6.5740966796875, -6.36114501953125, -6.148193359375, -5.93524169921875, -5.7222900390625, -5.50933837890625, -5.29638671875, -5.08343505859375, -4.8704833984375, -4.65753173828125, -4.444580078125, -4.23162841796875, -4.0186767578125, -3.80572509765625, -3.5927734375, -3.37982177734375, -3.1668701171875, -2.95391845703125, -2.740966796875, -2.52801513671875, -2.3150634765625, -2.10211181640625, -1.88916015625, -1.67620849609375, -1.4632568359375, -1.25030517578125, -1.037353515625, -0.82440185546875, -0.6114501953125, -0.39849853515625, -0.185546875, 0.02740478515625, 0.2403564453125, 0.45330810546875, 0.666259765625, 0.87921142578125, 1.0921630859375, 1.30511474609375, 1.51806640625, 1.73101806640625, 1.9439697265625, 2.15692138671875, 2.369873046875, 2.58282470703125, 2.7957763671875, 3.00872802734375, 3.2216796875, 3.43463134765625, 3.6475830078125, 3.86053466796875, 4.073486328125, 4.28643798828125, 4.4993896484375, 4.71234130859375, 4.92529296875, 5.13824462890625, 5.3511962890625, 5.56414794921875, 5.777099609375, 5.99005126953125, 6.2030029296875, 6.41595458984375, 6.62890625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 15.0, 29.0, 73.0, 95.0, 168.0, 277.0, 465.0, 865.0, 1572.0, 3036.0, 6205.0, 15255.0, 50678.0, 255777.0, 1161382.0, 1923568.0, 611946.0, 116953.0, 27283.0, 9636.0, 4205.0, 2047.0, 1151.0, 642.0, 399.0, 210.0, 123.0, 74.0, 57.0, 36.0, 19.0, 16.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3359375, -12.957763671875, -12.57958984375, -12.201416015625, -11.8232421875, -11.445068359375, -11.06689453125, -10.688720703125, -10.310546875, -9.932373046875, -9.55419921875, -9.176025390625, -8.7978515625, -8.419677734375, -8.04150390625, -7.663330078125, -7.28515625, -6.906982421875, -6.52880859375, -6.150634765625, -5.7724609375, -5.394287109375, -5.01611328125, -4.637939453125, -4.259765625, -3.881591796875, -3.50341796875, -3.125244140625, -2.7470703125, -2.368896484375, -1.99072265625, -1.612548828125, -1.234375, -0.856201171875, -0.47802734375, -0.099853515625, 0.2783203125, 0.656494140625, 1.03466796875, 1.412841796875, 1.791015625, 2.169189453125, 2.54736328125, 2.925537109375, 3.3037109375, 3.681884765625, 4.06005859375, 4.438232421875, 4.81640625, 5.194580078125, 5.57275390625, 5.950927734375, 6.3291015625, 6.707275390625, 7.08544921875, 7.463623046875, 7.841796875, 8.219970703125, 8.59814453125, 8.976318359375, 9.3544921875, 9.732666015625, 10.11083984375, 10.489013671875, 10.8671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 10.0, 12.0, 10.0, 34.0, 40.0, 59.0, 106.0, 139.0, 191.0, 207.0, 336.0, 447.0, 517.0, 509.0, 371.0, 323.0, 228.0, 159.0, 124.0, 78.0, 56.0, 41.0, 21.0, 14.0, 8.0, 6.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.3292236328125, -11.916259765625, -11.5032958984375, -11.09033203125, -10.6773681640625, -10.264404296875, -9.8514404296875, -9.4384765625, -9.0255126953125, -8.612548828125, -8.1995849609375, -7.78662109375, -7.3736572265625, -6.960693359375, -6.5477294921875, -6.134765625, -5.7218017578125, -5.308837890625, -4.8958740234375, -4.48291015625, -4.0699462890625, -3.656982421875, -3.2440185546875, -2.8310546875, -2.4180908203125, -2.005126953125, -1.5921630859375, -1.17919921875, -0.7662353515625, -0.353271484375, 0.0596923828125, 0.47265625, 0.8856201171875, 1.298583984375, 1.7115478515625, 2.12451171875, 2.5374755859375, 2.950439453125, 3.3634033203125, 3.7763671875, 4.1893310546875, 4.602294921875, 5.0152587890625, 5.42822265625, 5.8411865234375, 6.254150390625, 6.6671142578125, 7.080078125, 7.4930419921875, 7.906005859375, 8.3189697265625, 8.73193359375, 9.1448974609375, 9.557861328125, 9.9708251953125, 10.3837890625, 10.7967529296875, 11.209716796875, 11.6226806640625, 12.03564453125, 12.4486083984375, 12.861572265625, 13.2745361328125, 13.6875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 15.0, 16.0, 6.0, 14.0, 13.0, 30.0, 62.0, 95.0, 144.0, 327.0, 575.0, 1528.0, 6043.0, 88126.0, 3407025.0, 669247.0, 16422.0, 2782.0, 891.0, 414.0, 218.0, 125.0, 64.0, 46.0, 23.0, 14.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.203125, -30.25, -29.296875, -28.34375, -27.390625, -26.4375, -25.484375, -24.53125, -23.578125, -22.625, -21.671875, -20.71875, -19.765625, -18.8125, -17.859375, -16.90625, -15.953125, -15.0, -14.046875, -13.09375, -12.140625, -11.1875, -10.234375, -9.28125, -8.328125, -7.375, -6.421875, -5.46875, -4.515625, -3.5625, -2.609375, -1.65625, -0.703125, 0.25, 1.203125, 2.15625, 3.109375, 4.0625, 5.015625, 5.96875, 6.921875, 7.875, 8.828125, 9.78125, 10.734375, 11.6875, 12.640625, 13.59375, 14.546875, 15.5, 16.453125, 17.40625, 18.359375, 19.3125, 20.265625, 21.21875, 22.171875, 23.125, 24.078125, 25.03125, 25.984375, 26.9375, 27.890625, 28.84375, 29.796875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 48.0, 233.0, 374.0, 262.0, 71.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-264.3870849609375, -258.7138671875, -253.04067993164062, -247.36746215820312, -241.6942596435547, -236.02105712890625, -230.3478546142578, -224.67465209960938, -219.00143432617188, -213.32823181152344, -207.655029296875, -201.9818115234375, -196.30860900878906, -190.63540649414062, -184.9622039794922, -179.28900146484375, -173.61578369140625, -167.9425811767578, -162.26937866210938, -156.59616088867188, -150.92295837402344, -145.249755859375, -139.57655334472656, -133.90335083007812, -128.2301483154297, -122.55694580078125, -116.88373565673828, -111.21053314208984, -105.53732299804688, -99.86412048339844, -94.19091796875, -88.51770782470703, -82.84449005126953, -77.1712875366211, -71.49807739257812, -65.82487487792969, -60.15166473388672, -54.47846221923828, -48.80525588989258, -43.132049560546875, -37.45884323120117, -31.78563690185547, -26.112430572509766, -20.439226150512695, -14.766019821166992, -9.092813491821289, -3.4196090698242188, 2.2535972595214844, 7.9268035888671875, 13.60000991821289, 19.273216247558594, 24.946420669555664, 30.619626998901367, 36.29283142089844, 41.96603775024414, 47.639244079589844, 53.31245040893555, 58.98565673828125, 64.65885925292969, 70.33206939697266, 76.0052719116211, 81.67848205566406, 87.3516845703125, 93.02488708496094, 98.6980972290039]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 7.0, 11.0, 5.0, 11.0, 17.0, 11.0, 18.0, 17.0, 29.0, 22.0, 29.0, 31.0, 48.0, 39.0, 49.0, 33.0, 59.0, 48.0, 41.0, 45.0, 34.0, 47.0, 27.0, 28.0, 26.0, 42.0, 25.0, 31.0, 26.0, 18.0, 15.0, 21.0, 11.0, 6.0, 13.0, 9.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.8281364440918, -40.54194259643555, -39.25574493408203, -37.96955108642578, -36.683353424072266, -35.397159576416016, -34.1109619140625, -32.82476806640625, -31.538572311401367, -30.252376556396484, -28.9661808013916, -27.67998504638672, -26.39379119873047, -25.107593536376953, -23.821399688720703, -22.53520393371582, -21.249008178710938, -19.962812423706055, -18.676616668701172, -17.39042091369629, -16.104225158691406, -14.81803035736084, -13.531835556030273, -12.24563980102539, -10.959444046020508, -9.673248291015625, -8.387052536010742, -7.100857734680176, -5.814661979675293, -4.52846622467041, -3.2422709465026855, -1.956075668334961, -0.6698837280273438, 0.61631178855896, 1.9025073051452637, 3.1887028217315674, 4.474898338317871, 5.761094093322754, 7.0472893714904785, 8.333484649658203, 9.619680404663086, 10.905876159667969, 12.192071914672852, 13.478266716003418, 14.7644624710083, 16.0506591796875, 17.33685302734375, 18.623048782348633, 19.909244537353516, 21.1954402923584, 22.48163604736328, 23.767831802368164, 25.054027557373047, 26.340221405029297, 27.62641716003418, 28.912612915039062, 30.198808670043945, 31.485004425048828, 32.77119827270508, 34.057395935058594, 35.343589782714844, 36.62978744506836, 37.91598129272461, 39.202178955078125, 40.488372802734375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 4.0, 14.0, 9.0, 14.0, 15.0, 17.0, 13.0, 14.0, 18.0, 25.0, 19.0, 13.0, 24.0, 31.0, 28.0, 37.0, 44.0, 43.0, 44.0, 36.0, 20.0, 32.0, 38.0, 32.0, 39.0, 34.0, 35.0, 34.0, 28.0, 33.0, 26.0, 24.0, 20.0, 18.0, 13.0, 15.0, 20.0, 9.0, 8.0, 4.0, 7.0, 7.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.32421875, -5.15167236328125, -4.9791259765625, -4.80657958984375, -4.634033203125, -4.46148681640625, -4.2889404296875, -4.11639404296875, -3.94384765625, -3.77130126953125, -3.5987548828125, -3.42620849609375, -3.253662109375, -3.08111572265625, -2.9085693359375, -2.73602294921875, -2.5634765625, -2.39093017578125, -2.2183837890625, -2.04583740234375, -1.873291015625, -1.70074462890625, -1.5281982421875, -1.35565185546875, -1.18310546875, -1.01055908203125, -0.8380126953125, -0.66546630859375, -0.492919921875, -0.32037353515625, -0.1478271484375, 0.02471923828125, 0.197265625, 0.36981201171875, 0.5423583984375, 0.71490478515625, 0.887451171875, 1.05999755859375, 1.2325439453125, 1.40509033203125, 1.57763671875, 1.75018310546875, 1.9227294921875, 2.09527587890625, 2.267822265625, 2.44036865234375, 2.6129150390625, 2.78546142578125, 2.9580078125, 3.13055419921875, 3.3031005859375, 3.47564697265625, 3.648193359375, 3.82073974609375, 3.9932861328125, 4.16583251953125, 4.33837890625, 4.51092529296875, 4.6834716796875, 4.85601806640625, 5.028564453125, 5.20111083984375, 5.3736572265625, 5.54620361328125, 5.71875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 4.0, 14.0, 20.0, 18.0, 40.0, 50.0, 67.0, 102.0, 149.0, 232.0, 312.0, 497.0, 713.0, 1115.0, 1640.0, 2367.0, 3648.0, 5668.0, 8888.0, 13995.0, 21835.0, 33985.0, 51450.0, 76268.0, 104134.0, 131266.0, 144645.0, 129828.0, 101359.0, 73067.0, 49505.0, 32745.0, 20766.0, 13461.0, 8590.0, 5423.0, 3533.0, 2366.0, 1575.0, 1018.0, 699.0, 461.0, 315.0, 212.0, 183.0, 98.0, 88.0, 50.0, 34.0, 17.0, 24.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0], "bins": [-0.51708984375, -0.5016326904296875, -0.486175537109375, -0.4707183837890625, -0.45526123046875, -0.4398040771484375, -0.424346923828125, -0.4088897705078125, -0.3934326171875, -0.3779754638671875, -0.362518310546875, -0.3470611572265625, -0.33160400390625, -0.3161468505859375, -0.300689697265625, -0.2852325439453125, -0.269775390625, -0.2543182373046875, -0.238861083984375, -0.2234039306640625, -0.20794677734375, -0.1924896240234375, -0.177032470703125, -0.1615753173828125, -0.1461181640625, -0.1306610107421875, -0.115203857421875, -0.0997467041015625, -0.08428955078125, -0.0688323974609375, -0.053375244140625, -0.0379180908203125, -0.0224609375, -0.0070037841796875, 0.008453369140625, 0.0239105224609375, 0.03936767578125, 0.0548248291015625, 0.070281982421875, 0.0857391357421875, 0.1011962890625, 0.1166534423828125, 0.132110595703125, 0.1475677490234375, 0.16302490234375, 0.1784820556640625, 0.193939208984375, 0.2093963623046875, 0.224853515625, 0.2403106689453125, 0.255767822265625, 0.2712249755859375, 0.28668212890625, 0.3021392822265625, 0.317596435546875, 0.3330535888671875, 0.3485107421875, 0.3639678955078125, 0.379425048828125, 0.3948822021484375, 0.41033935546875, 0.4257965087890625, 0.441253662109375, 0.4567108154296875, 0.47216796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 6.0, 8.0, 3.0, 12.0, 10.0, 16.0, 31.0, 16.0, 17.0, 15.0, 26.0, 23.0, 32.0, 22.0, 25.0, 27.0, 34.0, 31.0, 36.0, 37.0, 1058.0, 51.0, 33.0, 34.0, 38.0, 33.0, 31.0, 30.0, 32.0, 27.0, 23.0, 26.0, 18.0, 25.0, 26.0, 13.0, 17.0, 11.0, 7.0, 10.0, 3.0, 8.0, 6.0, 4.0, 6.0, 0.0, 4.0, 2.0, 0.0, 3.0], "bins": [-4.0625, -3.94561767578125, -3.8287353515625, -3.71185302734375, -3.594970703125, -3.47808837890625, -3.3612060546875, -3.24432373046875, -3.12744140625, -3.01055908203125, -2.8936767578125, -2.77679443359375, -2.659912109375, -2.54302978515625, -2.4261474609375, -2.30926513671875, -2.1923828125, -2.07550048828125, -1.9586181640625, -1.84173583984375, -1.724853515625, -1.60797119140625, -1.4910888671875, -1.37420654296875, -1.25732421875, -1.14044189453125, -1.0235595703125, -0.90667724609375, -0.789794921875, -0.67291259765625, -0.5560302734375, -0.43914794921875, -0.322265625, -0.20538330078125, -0.0885009765625, 0.02838134765625, 0.145263671875, 0.26214599609375, 0.3790283203125, 0.49591064453125, 0.61279296875, 0.72967529296875, 0.8465576171875, 0.96343994140625, 1.080322265625, 1.19720458984375, 1.3140869140625, 1.43096923828125, 1.5478515625, 1.66473388671875, 1.7816162109375, 1.89849853515625, 2.015380859375, 2.13226318359375, 2.2491455078125, 2.36602783203125, 2.48291015625, 2.59979248046875, 2.7166748046875, 2.83355712890625, 2.950439453125, 3.06732177734375, 3.1842041015625, 3.30108642578125, 3.41796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 2.0, 7.0, 14.0, 17.0, 29.0, 35.0, 50.0, 74.0, 114.0, 202.0, 300.0, 422.0, 685.0, 1125.0, 1826.0, 2926.0, 4798.0, 8228.0, 13657.0, 22318.0, 37297.0, 60100.0, 92735.0, 132092.0, 1012122.0, 352268.0, 125029.0, 86544.0, 55991.0, 34038.0, 20670.0, 12058.0, 7660.0, 4385.0, 2764.0, 1615.0, 1054.0, 640.0, 442.0, 290.0, 151.0, 107.0, 78.0, 57.0, 36.0, 27.0, 24.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.419921875, -0.40716552734375, -0.3944091796875, -0.38165283203125, -0.368896484375, -0.35614013671875, -0.3433837890625, -0.33062744140625, -0.31787109375, -0.30511474609375, -0.2923583984375, -0.27960205078125, -0.266845703125, -0.25408935546875, -0.2413330078125, -0.22857666015625, -0.2158203125, -0.20306396484375, -0.1903076171875, -0.17755126953125, -0.164794921875, -0.15203857421875, -0.1392822265625, -0.12652587890625, -0.11376953125, -0.10101318359375, -0.0882568359375, -0.07550048828125, -0.062744140625, -0.04998779296875, -0.0372314453125, -0.02447509765625, -0.01171875, 0.00103759765625, 0.0137939453125, 0.02655029296875, 0.039306640625, 0.05206298828125, 0.0648193359375, 0.07757568359375, 0.09033203125, 0.10308837890625, 0.1158447265625, 0.12860107421875, 0.141357421875, 0.15411376953125, 0.1668701171875, 0.17962646484375, 0.1923828125, 0.20513916015625, 0.2178955078125, 0.23065185546875, 0.243408203125, 0.25616455078125, 0.2689208984375, 0.28167724609375, 0.29443359375, 0.30718994140625, 0.3199462890625, 0.33270263671875, 0.345458984375, 0.35821533203125, 0.3709716796875, 0.38372802734375, 0.396484375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 11.0, 6.0, 5.0, 5.0, 9.0, 17.0, 11.0, 18.0, 24.0, 30.0, 42.0, 98.0, 145.0, 193.0, 110.0, 68.0, 40.0, 31.0, 21.0, 24.0, 17.0, 11.0, 12.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0301513671875, -0.029125690460205078, -0.028100013732910156, -0.027074337005615234, -0.026048660278320312, -0.02502298355102539, -0.02399730682373047, -0.022971630096435547, -0.021945953369140625, -0.020920276641845703, -0.01989459991455078, -0.01886892318725586, -0.017843246459960938, -0.016817569732666016, -0.015791893005371094, -0.014766216278076172, -0.01374053955078125, -0.012714862823486328, -0.011689186096191406, -0.010663509368896484, -0.009637832641601562, -0.00861215591430664, -0.007586479187011719, -0.006560802459716797, -0.005535125732421875, -0.004509449005126953, -0.0034837722778320312, -0.0024580955505371094, -0.0014324188232421875, -0.0004067420959472656, 0.0006189346313476562, 0.0016446113586425781, 0.0026702880859375, 0.003695964813232422, 0.004721641540527344, 0.005747318267822266, 0.0067729949951171875, 0.007798671722412109, 0.008824348449707031, 0.009850025177001953, 0.010875701904296875, 0.011901378631591797, 0.012927055358886719, 0.01395273208618164, 0.014978408813476562, 0.016004085540771484, 0.017029762268066406, 0.018055438995361328, 0.01908111572265625, 0.020106792449951172, 0.021132469177246094, 0.022158145904541016, 0.023183822631835938, 0.02420949935913086, 0.02523517608642578, 0.026260852813720703, 0.027286529541015625, 0.028312206268310547, 0.02933788299560547, 0.03036355972290039, 0.03138923645019531, 0.032414913177490234, 0.033440589904785156, 0.03446626663208008, 0.035491943359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 1.0, 3.0, 5.0, 7.0, 10.0, 16.0, 16.0, 32.0, 36.0, 39.0, 73.0, 120.0, 265.0, 698.0, 998091.0, 47963.0, 575.0, 263.0, 98.0, 57.0, 47.0, 29.0, 21.0, 17.0, 10.0, 11.0, 15.0, 11.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9134979248046875, -0.886566162109375, -0.8596343994140625, -0.83270263671875, -0.8057708740234375, -0.778839111328125, -0.7519073486328125, -0.7249755859375, -0.6980438232421875, -0.671112060546875, -0.6441802978515625, -0.61724853515625, -0.5903167724609375, -0.563385009765625, -0.5364532470703125, -0.509521484375, -0.4825897216796875, -0.455657958984375, -0.4287261962890625, -0.40179443359375, -0.3748626708984375, -0.347930908203125, -0.3209991455078125, -0.2940673828125, -0.2671356201171875, -0.240203857421875, -0.2132720947265625, -0.18634033203125, -0.1594085693359375, -0.132476806640625, -0.1055450439453125, -0.07861328125, -0.0516815185546875, -0.024749755859375, 0.0021820068359375, 0.02911376953125, 0.0560455322265625, 0.082977294921875, 0.1099090576171875, 0.1368408203125, 0.1637725830078125, 0.190704345703125, 0.2176361083984375, 0.24456787109375, 0.2714996337890625, 0.298431396484375, 0.3253631591796875, 0.352294921875, 0.3792266845703125, 0.406158447265625, 0.4330902099609375, 0.46002197265625, 0.4869537353515625, 0.513885498046875, 0.5408172607421875, 0.5677490234375, 0.5946807861328125, 0.621612548828125, 0.6485443115234375, 0.67547607421875, 0.7024078369140625, 0.729339599609375, 0.7562713623046875, 0.783203125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 986.0, 19.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24320267140865326, -0.2293393313884735, -0.21547599136829376, -0.201612651348114, -0.18774931132793427, -0.17388597130775452, -0.16002261638641357, -0.14615929126739502, -0.13229593634605408, -0.11843259632587433, -0.10456925630569458, -0.09070591628551483, -0.07684257626533508, -0.06297922879457474, -0.04911588877439499, -0.03525254875421524, -0.02138921618461609, -0.007525875233113766, 0.0063374657183885574, 0.020200807601213455, 0.034064147621393204, 0.04792749136686325, 0.061790831387043, 0.07565417140722275, 0.0895175114274025, 0.10338085144758224, 0.117244191467762, 0.13110753893852234, 0.1449708789587021, 0.15883421897888184, 0.17269755899906158, 0.18656089901924133, 0.2004242241382599, 0.21428756415843964, 0.22815090417861938, 0.24201424419879913, 0.2558775842189789, 0.2697409391403198, 0.2836042642593384, 0.2974676191806793, 0.3113309442996979, 0.3251942992210388, 0.3390576243400574, 0.3529209792613983, 0.36678430438041687, 0.3806476593017578, 0.39451098442077637, 0.4083743393421173, 0.42223769426345825, 0.4361010491847992, 0.44996437430381775, 0.4638277292251587, 0.47769105434417725, 0.4915544092655182, 0.5054177641868591, 0.5192810893058777, 0.5331444144248962, 0.5470077395439148, 0.5608711242675781, 0.5747344493865967, 0.5885977745056152, 0.6024610996246338, 0.6163244843482971, 0.6301878094673157, 0.6440511345863342]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 12.0, 9.0, 19.0, 30.0, 29.0, 33.0, 46.0, 45.0, 49.0, 77.0, 68.0, 60.0, 61.0, 77.0, 75.0, 58.0, 48.0, 42.0, 35.0, 25.0, 27.0, 16.0, 16.0, 14.0, 9.0, 10.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046648263931274414, -0.04503614082932472, -0.04342401772737503, -0.04181189835071564, -0.040199775248765945, -0.038587652146816254, -0.03697553277015686, -0.03536340966820717, -0.03375128656625748, -0.032139163464307785, -0.030527042225003242, -0.0289149209856987, -0.027302797883749008, -0.025690674781799316, -0.024078553542494774, -0.02246643230319023, -0.02085430920124054, -0.019242186099290848, -0.017630064859986305, -0.016017943620681763, -0.014405820518732071, -0.012793698348104954, -0.011181576177477837, -0.00956945400685072, -0.007957331836223602, -0.006345209665596485, -0.004733087494969368, -0.003120965324342251, -0.0015088431537151337, 0.00010327901691198349, 0.0017154011875391006, 0.003327523358166218, 0.004939645528793335, 0.006551767699420452, 0.00816388987004757, 0.009776012040674686, 0.011388134211301804, 0.01300025638192892, 0.014612378552556038, 0.01622449979186058, 0.017836622893810272, 0.019448745995759964, 0.021060867235064507, 0.02267298847436905, 0.02428511157631874, 0.025897234678268433, 0.027509355917572975, 0.029121477156877518, 0.03073360025882721, 0.0323457233607769, 0.03395784646272659, 0.035569965839385986, 0.03718208894133568, 0.03879421204328537, 0.04040633141994476, 0.042018454521894455, 0.04363057762384415, 0.04524270072579384, 0.04685482382774353, 0.048466943204402924, 0.050079066306352615, 0.05169118940830231, 0.0533033087849617, 0.05491543188691139, 0.056527554988861084]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 6.0, 10.0, 6.0, 14.0, 13.0, 17.0, 18.0, 14.0, 21.0, 19.0, 21.0, 33.0, 26.0, 32.0, 43.0, 34.0, 37.0, 46.0, 32.0, 35.0, 40.0, 33.0, 41.0, 44.0, 35.0, 33.0, 38.0, 35.0, 26.0, 21.0, 28.0, 28.0, 20.0, 16.0, 12.0, 13.0, 14.0, 7.0, 5.0, 7.0, 12.0, 2.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.609375, -6.4173583984375, -6.225341796875, -6.0333251953125, -5.84130859375, -5.6492919921875, -5.457275390625, -5.2652587890625, -5.0732421875, -4.8812255859375, -4.689208984375, -4.4971923828125, -4.30517578125, -4.1131591796875, -3.921142578125, -3.7291259765625, -3.537109375, -3.3450927734375, -3.153076171875, -2.9610595703125, -2.76904296875, -2.5770263671875, -2.385009765625, -2.1929931640625, -2.0009765625, -1.8089599609375, -1.616943359375, -1.4249267578125, -1.23291015625, -1.0408935546875, -0.848876953125, -0.6568603515625, -0.46484375, -0.2728271484375, -0.080810546875, 0.1112060546875, 0.30322265625, 0.4952392578125, 0.687255859375, 0.8792724609375, 1.0712890625, 1.2633056640625, 1.455322265625, 1.6473388671875, 1.83935546875, 2.0313720703125, 2.223388671875, 2.4154052734375, 2.607421875, 2.7994384765625, 2.991455078125, 3.1834716796875, 3.37548828125, 3.5675048828125, 3.759521484375, 3.9515380859375, 4.1435546875, 4.3355712890625, 4.527587890625, 4.7196044921875, 4.91162109375, 5.1036376953125, 5.295654296875, 5.4876708984375, 5.6796875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 20.0, 20.0, 33.0, 45.0, 62.0, 75.0, 116.0, 156.0, 197.0, 284.0, 424.0, 718.0, 1095.0, 2140.0, 4934.0, 13303.0, 45689.0, 201760.0, 502370.0, 205000.0, 46289.0, 13442.0, 4909.0, 2161.0, 1176.0, 631.0, 427.0, 281.0, 193.0, 133.0, 116.0, 71.0, 60.0, 47.0, 44.0, 32.0, 24.0, 14.0, 12.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.5625, -9.268310546875, -8.97412109375, -8.679931640625, -8.3857421875, -8.091552734375, -7.79736328125, -7.503173828125, -7.208984375, -6.914794921875, -6.62060546875, -6.326416015625, -6.0322265625, -5.738037109375, -5.44384765625, -5.149658203125, -4.85546875, -4.561279296875, -4.26708984375, -3.972900390625, -3.6787109375, -3.384521484375, -3.09033203125, -2.796142578125, -2.501953125, -2.207763671875, -1.91357421875, -1.619384765625, -1.3251953125, -1.031005859375, -0.73681640625, -0.442626953125, -0.1484375, 0.145751953125, 0.43994140625, 0.734130859375, 1.0283203125, 1.322509765625, 1.61669921875, 1.910888671875, 2.205078125, 2.499267578125, 2.79345703125, 3.087646484375, 3.3818359375, 3.676025390625, 3.97021484375, 4.264404296875, 4.55859375, 4.852783203125, 5.14697265625, 5.441162109375, 5.7353515625, 6.029541015625, 6.32373046875, 6.617919921875, 6.912109375, 7.206298828125, 7.50048828125, 7.794677734375, 8.0888671875, 8.383056640625, 8.67724609375, 8.971435546875, 9.265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 6.0, 14.0, 5.0, 9.0, 16.0, 29.0, 32.0, 25.0, 30.0, 36.0, 44.0, 39.0, 71.0, 97.0, 235.0, 1494.0, 284.0, 157.0, 82.0, 47.0, 47.0, 42.0, 29.0, 32.0, 24.0, 26.0, 12.0, 14.0, 12.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.3564453125, -16.791015625, -16.2255859375, -15.66015625, -15.0947265625, -14.529296875, -13.9638671875, -13.3984375, -12.8330078125, -12.267578125, -11.7021484375, -11.13671875, -10.5712890625, -10.005859375, -9.4404296875, -8.875, -8.3095703125, -7.744140625, -7.1787109375, -6.61328125, -6.0478515625, -5.482421875, -4.9169921875, -4.3515625, -3.7861328125, -3.220703125, -2.6552734375, -2.08984375, -1.5244140625, -0.958984375, -0.3935546875, 0.171875, 0.7373046875, 1.302734375, 1.8681640625, 2.43359375, 2.9990234375, 3.564453125, 4.1298828125, 4.6953125, 5.2607421875, 5.826171875, 6.3916015625, 6.95703125, 7.5224609375, 8.087890625, 8.6533203125, 9.21875, 9.7841796875, 10.349609375, 10.9150390625, 11.48046875, 12.0458984375, 12.611328125, 13.1767578125, 13.7421875, 14.3076171875, 14.873046875, 15.4384765625, 16.00390625, 16.5693359375, 17.134765625, 17.7001953125, 18.265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 8.0, 6.0, 11.0, 11.0, 8.0, 18.0, 31.0, 27.0, 31.0, 31.0, 46.0, 83.0, 113.0, 124.0, 187.0, 318.0, 620.0, 1569.0, 24353.0, 3046320.0, 67773.0, 2068.0, 741.0, 373.0, 224.0, 135.0, 112.0, 72.0, 56.0, 50.0, 25.0, 40.0, 21.0, 21.0, 18.0, 12.0, 10.0, 9.0, 10.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-28.796875, -27.885498046875, -26.97412109375, -26.062744140625, -25.1513671875, -24.239990234375, -23.32861328125, -22.417236328125, -21.505859375, -20.594482421875, -19.68310546875, -18.771728515625, -17.8603515625, -16.948974609375, -16.03759765625, -15.126220703125, -14.21484375, -13.303466796875, -12.39208984375, -11.480712890625, -10.5693359375, -9.657958984375, -8.74658203125, -7.835205078125, -6.923828125, -6.012451171875, -5.10107421875, -4.189697265625, -3.2783203125, -2.366943359375, -1.45556640625, -0.544189453125, 0.3671875, 1.278564453125, 2.18994140625, 3.101318359375, 4.0126953125, 4.924072265625, 5.83544921875, 6.746826171875, 7.658203125, 8.569580078125, 9.48095703125, 10.392333984375, 11.3037109375, 12.215087890625, 13.12646484375, 14.037841796875, 14.94921875, 15.860595703125, 16.77197265625, 17.683349609375, 18.5947265625, 19.506103515625, 20.41748046875, 21.328857421875, 22.240234375, 23.151611328125, 24.06298828125, 24.974365234375, 25.8857421875, 26.797119140625, 27.70849609375, 28.619873046875, 29.53125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 411.0, 585.0, 13.0, 0.0, 1.0], "bins": [-485.3941345214844, -477.3116760253906, -469.2292175292969, -461.146728515625, -453.06427001953125, -444.9818115234375, -436.89935302734375, -428.81689453125, -420.73443603515625, -412.6519775390625, -404.56951904296875, -396.487060546875, -388.4045715332031, -380.3221130371094, -372.2396545410156, -364.1571960449219, -356.07470703125, -347.99224853515625, -339.9097900390625, -331.82733154296875, -323.7448425292969, -315.6623840332031, -307.5799255371094, -299.4974670410156, -291.4150085449219, -283.3325500488281, -275.2500915527344, -267.1676025390625, -259.08514404296875, -251.002685546875, -242.92022705078125, -234.8377685546875, -226.75534057617188, -218.67288208007812, -210.5904083251953, -202.50794982910156, -194.4254913330078, -186.343017578125, -178.26055908203125, -170.1781005859375, -162.0956268310547, -154.01316833496094, -145.93069458007812, -137.84823608398438, -129.76577758789062, -121.68331146240234, -113.60084533691406, -105.51838684082031, -97.43592834472656, -89.35346221923828, -81.27100372314453, -73.18853759765625, -65.1060791015625, -57.02361297607422, -48.94114685058594, -40.85868453979492, -32.77621841430664, -24.693756103515625, -16.611291885375977, -8.528827667236328, -0.4463653564453125, 7.636096954345703, 15.718563079833984, 23.801025390625, 31.883487701416016]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 6.0, 16.0, 6.0, 12.0, 16.0, 17.0, 27.0, 31.0, 31.0, 33.0, 34.0, 44.0, 41.0, 51.0, 42.0, 41.0, 38.0, 35.0, 36.0, 41.0, 48.0, 37.0, 34.0, 40.0, 30.0, 32.0, 24.0, 24.0, 26.0, 19.0, 16.0, 9.0, 12.0, 12.0, 4.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.23396301269531, -38.97794723510742, -37.72193145751953, -36.465911865234375, -35.209896087646484, -33.953880310058594, -32.69786071777344, -31.441844940185547, -30.185829162597656, -28.929813385009766, -27.673795700073242, -26.41777801513672, -25.161762237548828, -23.905746459960938, -22.649728775024414, -21.39371109008789, -20.1376953125, -18.88167953491211, -17.625661849975586, -16.369644165039062, -15.113628387451172, -13.857611656188965, -12.601594924926758, -11.34557819366455, -10.089561462402344, -8.833544731140137, -7.57752799987793, -6.321511268615723, -5.065494537353516, -3.8094778060913086, -2.5534610748291016, -1.2974443435668945, -0.0414276123046875, 1.2145891189575195, 2.4706058502197266, 3.7266225814819336, 4.982639312744141, 6.238656044006348, 7.494672775268555, 8.750689506530762, 10.006706237792969, 11.262722969055176, 12.518739700317383, 13.77475643157959, 15.030773162841797, 16.286788940429688, 17.54280662536621, 18.798824310302734, 20.054840087890625, 21.310855865478516, 22.56687355041504, 23.822891235351562, 25.078907012939453, 26.334922790527344, 27.590940475463867, 28.84695816040039, 30.10297393798828, 31.358989715576172, 32.61500549316406, 33.87102508544922, 35.12704086303711, 36.383056640625, 37.639076232910156, 38.89509201049805, 40.15110778808594]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 8.0, 6.0, 4.0, 11.0, 17.0, 15.0, 17.0, 28.0, 28.0, 29.0, 30.0, 55.0, 38.0, 26.0, 31.0, 45.0, 36.0, 47.0, 47.0, 39.0, 45.0, 57.0, 38.0, 37.0, 50.0, 41.0, 23.0, 20.0, 19.0, 16.0, 25.0, 14.0, 19.0, 12.0, 4.0, 9.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.34375, -8.09271240234375, -7.8416748046875, -7.59063720703125, -7.339599609375, -7.08856201171875, -6.8375244140625, -6.58648681640625, -6.33544921875, -6.08441162109375, -5.8333740234375, -5.58233642578125, -5.331298828125, -5.08026123046875, -4.8292236328125, -4.57818603515625, -4.3271484375, -4.07611083984375, -3.8250732421875, -3.57403564453125, -3.322998046875, -3.07196044921875, -2.8209228515625, -2.56988525390625, -2.31884765625, -2.06781005859375, -1.8167724609375, -1.56573486328125, -1.314697265625, -1.06365966796875, -0.8126220703125, -0.56158447265625, -0.310546875, -0.05950927734375, 0.1915283203125, 0.44256591796875, 0.693603515625, 0.94464111328125, 1.1956787109375, 1.44671630859375, 1.69775390625, 1.94879150390625, 2.1998291015625, 2.45086669921875, 2.701904296875, 2.95294189453125, 3.2039794921875, 3.45501708984375, 3.7060546875, 3.95709228515625, 4.2081298828125, 4.45916748046875, 4.710205078125, 4.96124267578125, 5.2122802734375, 5.46331787109375, 5.71435546875, 5.96539306640625, 6.2164306640625, 6.46746826171875, 6.718505859375, 6.96954345703125, 7.2205810546875, 7.47161865234375, 7.72265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 4.0, 4.0, 11.0, 15.0, 19.0, 22.0, 40.0, 56.0, 85.0, 112.0, 152.0, 242.0, 292.0, 459.0, 663.0, 1165.0, 3303.0, 27550.0, 768321.0, 3114455.0, 259282.0, 12717.0, 2275.0, 1009.0, 650.0, 417.0, 264.0, 202.0, 141.0, 106.0, 73.0, 44.0, 30.0, 32.0, 17.0, 11.0, 7.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -31.06982421875, -30.0458984375, -29.02197265625, -27.998046875, -26.97412109375, -25.9501953125, -24.92626953125, -23.90234375, -22.87841796875, -21.8544921875, -20.83056640625, -19.806640625, -18.78271484375, -17.7587890625, -16.73486328125, -15.7109375, -14.68701171875, -13.6630859375, -12.63916015625, -11.615234375, -10.59130859375, -9.5673828125, -8.54345703125, -7.51953125, -6.49560546875, -5.4716796875, -4.44775390625, -3.423828125, -2.39990234375, -1.3759765625, -0.35205078125, 0.671875, 1.69580078125, 2.7197265625, 3.74365234375, 4.767578125, 5.79150390625, 6.8154296875, 7.83935546875, 8.86328125, 9.88720703125, 10.9111328125, 11.93505859375, 12.958984375, 13.98291015625, 15.0068359375, 16.03076171875, 17.0546875, 18.07861328125, 19.1025390625, 20.12646484375, 21.150390625, 22.17431640625, 23.1982421875, 24.22216796875, 25.24609375, 26.27001953125, 27.2939453125, 28.31787109375, 29.341796875, 30.36572265625, 31.3896484375, 32.41357421875, 33.4375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 15.0, 15.0, 21.0, 24.0, 46.0, 64.0, 77.0, 85.0, 126.0, 183.0, 232.0, 253.0, 329.0, 354.0, 379.0, 359.0, 328.0, 256.0, 222.0, 187.0, 143.0, 102.0, 67.0, 59.0, 41.0, 22.0, 17.0, 19.0, 8.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.4703369140625, -13.065673828125, -12.6610107421875, -12.25634765625, -11.8516845703125, -11.447021484375, -11.0423583984375, -10.6376953125, -10.2330322265625, -9.828369140625, -9.4237060546875, -9.01904296875, -8.6143798828125, -8.209716796875, -7.8050537109375, -7.400390625, -6.9957275390625, -6.591064453125, -6.1864013671875, -5.78173828125, -5.3770751953125, -4.972412109375, -4.5677490234375, -4.1630859375, -3.7584228515625, -3.353759765625, -2.9490966796875, -2.54443359375, -2.1397705078125, -1.735107421875, -1.3304443359375, -0.92578125, -0.5211181640625, -0.116455078125, 0.2882080078125, 0.69287109375, 1.0975341796875, 1.502197265625, 1.9068603515625, 2.3115234375, 2.7161865234375, 3.120849609375, 3.5255126953125, 3.93017578125, 4.3348388671875, 4.739501953125, 5.1441650390625, 5.548828125, 5.9534912109375, 6.358154296875, 6.7628173828125, 7.16748046875, 7.5721435546875, 7.976806640625, 8.3814697265625, 8.7861328125, 9.1907958984375, 9.595458984375, 10.0001220703125, 10.40478515625, 10.8094482421875, 11.214111328125, 11.6187744140625, 12.0234375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 13.0, 18.0, 32.0, 51.0, 86.0, 132.0, 241.0, 489.0, 995.0, 2221.0, 5483.0, 17705.0, 81885.0, 448466.0, 1783642.0, 1456209.0, 316768.0, 58146.0, 13622.0, 4335.0, 1856.0, 858.0, 486.0, 211.0, 128.0, 66.0, 55.0, 30.0, 16.0, 13.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.8875732421875, -12.470458984375, -12.0533447265625, -11.63623046875, -11.2191162109375, -10.802001953125, -10.3848876953125, -9.9677734375, -9.5506591796875, -9.133544921875, -8.7164306640625, -8.29931640625, -7.8822021484375, -7.465087890625, -7.0479736328125, -6.630859375, -6.2137451171875, -5.796630859375, -5.3795166015625, -4.96240234375, -4.5452880859375, -4.128173828125, -3.7110595703125, -3.2939453125, -2.8768310546875, -2.459716796875, -2.0426025390625, -1.62548828125, -1.2083740234375, -0.791259765625, -0.3741455078125, 0.04296875, 0.4600830078125, 0.877197265625, 1.2943115234375, 1.71142578125, 2.1285400390625, 2.545654296875, 2.9627685546875, 3.3798828125, 3.7969970703125, 4.214111328125, 4.6312255859375, 5.04833984375, 5.4654541015625, 5.882568359375, 6.2996826171875, 6.716796875, 7.1339111328125, 7.551025390625, 7.9681396484375, 8.38525390625, 8.8023681640625, 9.219482421875, 9.6365966796875, 10.0537109375, 10.4708251953125, 10.887939453125, 11.3050537109375, 11.72216796875, 12.1392822265625, 12.556396484375, 12.9735107421875, 13.390625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 8.0, 10.0, 20.0, 31.0, 31.0, 37.0, 39.0, 41.0, 36.0, 55.0, 66.0, 66.0, 54.0, 60.0, 62.0, 52.0, 53.0, 38.0, 45.0, 31.0, 32.0, 24.0, 24.0, 22.0, 13.0, 12.0, 4.0, 0.0, 4.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-55.11027908325195, -52.86919403076172, -50.62810516357422, -48.387020111083984, -46.14593505859375, -43.90484619140625, -41.663761138916016, -39.42267608642578, -37.18158721923828, -34.94050216674805, -32.69941329956055, -30.458328247070312, -28.217241287231445, -25.976154327392578, -23.735069274902344, -21.493982315063477, -19.25289535522461, -17.011808395385742, -14.770722389221191, -12.52963638305664, -10.288549423217773, -8.047462463378906, -5.8063764572143555, -3.5652904510498047, -1.3242034912109375, 0.9168829917907715, 3.1579694747924805, 5.3990559577941895, 7.640142440795898, 9.881229400634766, 12.122315406799316, 14.363401412963867, 16.6044921875, 18.845579147338867, 21.086666107177734, 23.32775115966797, 25.568838119506836, 27.809925079345703, 30.051010131835938, 32.29209899902344, 34.53318405151367, 36.774269104003906, 39.015357971191406, 41.25644302368164, 43.497528076171875, 45.738616943359375, 47.97970199584961, 50.220787048339844, 52.461875915527344, 54.70296096801758, 56.94404983520508, 59.18513488769531, 61.42622375488281, 63.66730880737305, 65.90839385986328, 68.14948272705078, 70.39056396484375, 72.63165283203125, 74.87273406982422, 77.11382293701172, 79.35491180419922, 81.59599304199219, 83.83708190917969, 86.07817077636719, 88.31925964355469]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 5.0, 7.0, 2.0, 10.0, 9.0, 12.0, 15.0, 8.0, 12.0, 21.0, 16.0, 25.0, 31.0, 39.0, 26.0, 43.0, 44.0, 49.0, 52.0, 46.0, 42.0, 45.0, 42.0, 39.0, 29.0, 42.0, 30.0, 30.0, 39.0, 30.0, 22.0, 21.0, 19.0, 16.0, 17.0, 11.0, 13.0, 6.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.25094985961914, -60.30513381958008, -58.359317779541016, -56.41350555419922, -54.467689514160156, -52.521873474121094, -50.57605743408203, -48.63024139404297, -46.68442916870117, -44.73861312866211, -42.79279708862305, -40.84698486328125, -38.90116882324219, -36.955352783203125, -35.00953674316406, -33.063720703125, -31.11790657043457, -29.172090530395508, -27.226276397705078, -25.280460357666016, -23.334646224975586, -21.388830184936523, -19.443016052246094, -17.49720001220703, -15.551384925842285, -13.605569839477539, -11.659754753112793, -9.713939666748047, -7.768124103546143, -5.822308540344238, -3.876493453979492, -1.930678367614746, 0.01513671875, 1.9609519243240356, 3.9067671298980713, 5.8525824546813965, 7.798397541046143, 9.744213104248047, 11.690028190612793, 13.635843276977539, 15.581658363342285, 17.52747344970703, 19.473289489746094, 21.419103622436523, 23.364919662475586, 25.310733795166016, 27.256549835205078, 29.20236587524414, 31.14818000793457, 33.093994140625, 35.03981018066406, 36.985626220703125, 38.93144226074219, 40.87725830078125, 42.82307052612305, 44.76888656616211, 46.71470260620117, 48.660518646240234, 50.6063346862793, 52.552146911621094, 54.497962951660156, 56.44377899169922, 58.38959503173828, 60.335411071777344, 62.28122329711914]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 12.0, 9.0, 7.0, 11.0, 13.0, 11.0, 16.0, 18.0, 23.0, 22.0, 20.0, 34.0, 26.0, 42.0, 47.0, 53.0, 42.0, 31.0, 47.0, 38.0, 47.0, 44.0, 41.0, 39.0, 38.0, 30.0, 24.0, 31.0, 33.0, 22.0, 19.0, 15.0, 14.0, 7.0, 12.0, 9.0, 11.0, 8.0, 4.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-98.625, -95.3486328125, -92.072265625, -88.7958984375, -85.51953125, -82.2431640625, -78.966796875, -75.6904296875, -72.4140625, -69.1376953125, -65.861328125, -62.5849609375, -59.30859375, -56.0322265625, -52.755859375, -49.4794921875, -46.203125, -42.9267578125, -39.650390625, -36.3740234375, -33.09765625, -29.8212890625, -26.544921875, -23.2685546875, -19.9921875, -16.7158203125, -13.439453125, -10.1630859375, -6.88671875, -3.6103515625, -0.333984375, 2.9423828125, 6.21875, 9.4951171875, 12.771484375, 16.0478515625, 19.32421875, 22.6005859375, 25.876953125, 29.1533203125, 32.4296875, 35.7060546875, 38.982421875, 42.2587890625, 45.53515625, 48.8115234375, 52.087890625, 55.3642578125, 58.640625, 61.9169921875, 65.193359375, 68.4697265625, 71.74609375, 75.0224609375, 78.298828125, 81.5751953125, 84.8515625, 88.1279296875, 91.404296875, 94.6806640625, 97.95703125, 101.2333984375, 104.509765625, 107.7861328125, 111.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 15.0, 26.0, 26.0, 72.0, 75.0, 131.0, 177.0, 241.0, 486.0, 750.0, 1059.0, 1760.0, 2610.0, 4001.0, 5889.0, 9241.0, 14329.0, 22051.0, 33198.0, 49724.0, 71420.0, 97976.0, 124516.0, 138419.0, 129436.0, 104141.0, 76930.0, 54135.0, 36499.0, 23895.0, 15847.0, 10189.0, 6689.0, 4426.0, 2756.0, 1936.0, 1182.0, 811.0, 552.0, 326.0, 204.0, 136.0, 91.0, 76.0, 40.0, 27.0, 13.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-4.57421875, -4.4339599609375, -4.293701171875, -4.1534423828125, -4.01318359375, -3.8729248046875, -3.732666015625, -3.5924072265625, -3.4521484375, -3.3118896484375, -3.171630859375, -3.0313720703125, -2.89111328125, -2.7508544921875, -2.610595703125, -2.4703369140625, -2.330078125, -2.1898193359375, -2.049560546875, -1.9093017578125, -1.76904296875, -1.6287841796875, -1.488525390625, -1.3482666015625, -1.2080078125, -1.0677490234375, -0.927490234375, -0.7872314453125, -0.64697265625, -0.5067138671875, -0.366455078125, -0.2261962890625, -0.0859375, 0.0543212890625, 0.194580078125, 0.3348388671875, 0.47509765625, 0.6153564453125, 0.755615234375, 0.8958740234375, 1.0361328125, 1.1763916015625, 1.316650390625, 1.4569091796875, 1.59716796875, 1.7374267578125, 1.877685546875, 2.0179443359375, 2.158203125, 2.2984619140625, 2.438720703125, 2.5789794921875, 2.71923828125, 2.8594970703125, 2.999755859375, 3.1400146484375, 3.2802734375, 3.4205322265625, 3.560791015625, 3.7010498046875, 3.84130859375, 3.9815673828125, 4.121826171875, 4.2620849609375, 4.40234375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 4.0, 6.0, 7.0, 11.0, 14.0, 14.0, 16.0, 29.0, 29.0, 22.0, 30.0, 20.0, 32.0, 39.0, 40.0, 45.0, 40.0, 52.0, 48.0, 1067.0, 32.0, 44.0, 44.0, 29.0, 35.0, 35.0, 38.0, 31.0, 19.0, 22.0, 17.0, 21.0, 22.0, 16.0, 14.0, 6.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -62.33203125, -60.2890625, -58.24609375, -56.203125, -54.16015625, -52.1171875, -50.07421875, -48.03125, -45.98828125, -43.9453125, -41.90234375, -39.859375, -37.81640625, -35.7734375, -33.73046875, -31.6875, -29.64453125, -27.6015625, -25.55859375, -23.515625, -21.47265625, -19.4296875, -17.38671875, -15.34375, -13.30078125, -11.2578125, -9.21484375, -7.171875, -5.12890625, -3.0859375, -1.04296875, 1.0, 3.04296875, 5.0859375, 7.12890625, 9.171875, 11.21484375, 13.2578125, 15.30078125, 17.34375, 19.38671875, 21.4296875, 23.47265625, 25.515625, 27.55859375, 29.6015625, 31.64453125, 33.6875, 35.73046875, 37.7734375, 39.81640625, 41.859375, 43.90234375, 45.9453125, 47.98828125, 50.03125, 52.07421875, 54.1171875, 56.16015625, 58.203125, 60.24609375, 62.2890625, 64.33203125, 66.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 10.0, 10.0, 45.0, 60.0, 91.0, 145.0, 222.0, 416.0, 651.0, 1132.0, 1883.0, 3188.0, 5332.0, 9061.0, 15320.0, 25712.0, 41487.0, 65114.0, 95851.0, 130520.0, 1163763.0, 184309.0, 120018.0, 86314.0, 57024.0, 35623.0, 21758.0, 13060.0, 7741.0, 4550.0, 2648.0, 1632.0, 949.0, 598.0, 340.0, 239.0, 138.0, 68.0, 50.0, 16.0, 22.0, 8.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.7991943359375, -4.653076171875, -4.5069580078125, -4.36083984375, -4.2147216796875, -4.068603515625, -3.9224853515625, -3.7763671875, -3.6302490234375, -3.484130859375, -3.3380126953125, -3.19189453125, -3.0457763671875, -2.899658203125, -2.7535400390625, -2.607421875, -2.4613037109375, -2.315185546875, -2.1690673828125, -2.02294921875, -1.8768310546875, -1.730712890625, -1.5845947265625, -1.4384765625, -1.2923583984375, -1.146240234375, -1.0001220703125, -0.85400390625, -0.7078857421875, -0.561767578125, -0.4156494140625, -0.26953125, -0.1234130859375, 0.022705078125, 0.1688232421875, 0.31494140625, 0.4610595703125, 0.607177734375, 0.7532958984375, 0.8994140625, 1.0455322265625, 1.191650390625, 1.3377685546875, 1.48388671875, 1.6300048828125, 1.776123046875, 1.9222412109375, 2.068359375, 2.2144775390625, 2.360595703125, 2.5067138671875, 2.65283203125, 2.7989501953125, 2.945068359375, 3.0911865234375, 3.2373046875, 3.3834228515625, 3.529541015625, 3.6756591796875, 3.82177734375, 3.9678955078125, 4.114013671875, 4.2601318359375, 4.40625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 10.0, 7.0, 5.0, 12.0, 11.0, 12.0, 24.0, 30.0, 28.0, 39.0, 43.0, 38.0, 38.0, 41.0, 37.0, 49.0, 48.0, 54.0, 58.0, 45.0, 62.0, 52.0, 36.0, 40.0, 24.0, 20.0, 24.0, 17.0, 9.0, 15.0, 11.0, 12.0, 4.0, 10.0, 7.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440673828125, -0.04256486892700195, -0.041062355041503906, -0.03955984115600586, -0.03805732727050781, -0.036554813385009766, -0.03505229949951172, -0.03354978561401367, -0.032047271728515625, -0.030544757843017578, -0.02904224395751953, -0.027539730072021484, -0.026037216186523438, -0.02453470230102539, -0.023032188415527344, -0.021529674530029297, -0.02002716064453125, -0.018524646759033203, -0.017022132873535156, -0.01551961898803711, -0.014017105102539062, -0.012514591217041016, -0.011012077331542969, -0.009509563446044922, -0.008007049560546875, -0.006504535675048828, -0.005002021789550781, -0.0034995079040527344, -0.0019969940185546875, -0.0004944801330566406, 0.0010080337524414062, 0.002510547637939453, 0.0040130615234375, 0.005515575408935547, 0.007018089294433594, 0.00852060317993164, 0.010023117065429688, 0.011525630950927734, 0.013028144836425781, 0.014530658721923828, 0.016033172607421875, 0.017535686492919922, 0.01903820037841797, 0.020540714263916016, 0.022043228149414062, 0.02354574203491211, 0.025048255920410156, 0.026550769805908203, 0.02805328369140625, 0.029555797576904297, 0.031058311462402344, 0.03256082534790039, 0.03406333923339844, 0.035565853118896484, 0.03706836700439453, 0.03857088088989258, 0.040073394775390625, 0.04157590866088867, 0.04307842254638672, 0.044580936431884766, 0.04608345031738281, 0.04758596420288086, 0.049088478088378906, 0.05059099197387695, 0.052093505859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 18.0, 26.0, 28.0, 36.0, 38.0, 66.0, 83.0, 125.0, 173.0, 262.0, 383.0, 605.0, 1035.0, 1849.0, 3678.0, 7584.0, 17265.0, 38538.0, 85028.0, 166356.0, 248119.0, 225300.0, 133346.0, 64418.0, 28730.0, 12825.0, 5869.0, 2825.0, 1488.0, 829.0, 487.0, 337.0, 244.0, 136.0, 111.0, 91.0, 59.0, 50.0, 30.0, 21.0, 18.0, 9.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.1711406707763672, -0.16540145874023438, -0.15966224670410156, -0.15392303466796875, -0.14818382263183594, -0.14244461059570312, -0.1367053985595703, -0.1309661865234375, -0.1252269744873047, -0.11948776245117188, -0.11374855041503906, -0.10800933837890625, -0.10227012634277344, -0.09653091430664062, -0.09079170227050781, -0.085052490234375, -0.07931327819824219, -0.07357406616210938, -0.06783485412597656, -0.06209564208984375, -0.05635643005371094, -0.050617218017578125, -0.04487800598144531, -0.0391387939453125, -0.03339958190917969, -0.027660369873046875, -0.021921157836914062, -0.01618194580078125, -0.010442733764648438, -0.004703521728515625, 0.0010356903076171875, 0.00677490234375, 0.012514114379882812, 0.018253326416015625, 0.023992538452148438, 0.02973175048828125, 0.03547096252441406, 0.041210174560546875, 0.04694938659667969, 0.0526885986328125, 0.05842781066894531, 0.06416702270507812, 0.06990623474121094, 0.07564544677734375, 0.08138465881347656, 0.08712387084960938, 0.09286308288574219, 0.098602294921875, 0.10434150695800781, 0.11008071899414062, 0.11581993103027344, 0.12155914306640625, 0.12729835510253906, 0.13303756713867188, 0.1387767791748047, 0.1445159912109375, 0.1502552032470703, 0.15599441528320312, 0.16173362731933594, 0.16747283935546875, 0.17321205139160156, 0.17895126342773438, 0.1846904754638672, 0.1904296875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 30.0, 37.0, 63.0, 60.0, 88.0, 94.0, 104.0, 92.0, 91.0, 85.0, 56.0, 42.0, 30.0, 16.0, 23.0, 15.0, 12.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04940366744995117, -0.04590730741620064, -0.042410947382450104, -0.03891458734869957, -0.035418227314949036, -0.0319218710064888, -0.028425509110093117, -0.024929149076342583, -0.02143278904259205, -0.017936429008841515, -0.01444006897509098, -0.010943709872663021, -0.007447349838912487, -0.003950990736484528, -0.00045463070273399353, 0.0030417293310165405, 0.006538089364767075, 0.010034449398517609, 0.013530809432268143, 0.017027169466018677, 0.02052352949976921, 0.024019887670874596, 0.02751624770462513, 0.031012607738375664, 0.03450896590948105, 0.03800532594323158, 0.04150168597698212, 0.04499804601073265, 0.048494406044483185, 0.05199076235294342, 0.05548712611198425, 0.05898348242044449, 0.06247984617948532, 0.06597620248794556, 0.06947256624698639, 0.07296892255544662, 0.07646528631448746, 0.07996164262294769, 0.08345800638198853, 0.08695436269044876, 0.0904507264494896, 0.09394708275794983, 0.09744344651699066, 0.1009398028254509, 0.10443616658449173, 0.10793252289295197, 0.1114288866519928, 0.11492524296045303, 0.11842159926891327, 0.1219179555773735, 0.12541431188583374, 0.12891067564487457, 0.1324070394039154, 0.13590340316295624, 0.13939975202083588, 0.1428961157798767, 0.14639247953891754, 0.14988884329795837, 0.153385192155838, 0.15688155591487885, 0.16037791967391968, 0.1638742834329605, 0.16737063229084015, 0.17086699604988098, 0.17436335980892181]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 9.0, 11.0, 8.0, 5.0, 9.0, 10.0, 9.0, 22.0, 21.0, 24.0, 22.0, 25.0, 26.0, 28.0, 27.0, 25.0, 35.0, 26.0, 20.0, 30.0, 37.0, 23.0, 45.0, 45.0, 37.0, 34.0, 27.0, 34.0, 28.0, 34.0, 36.0, 25.0, 29.0, 22.0, 21.0, 23.0, 18.0, 15.0, 16.0, 9.0, 9.0, 9.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.050896406173706055, -0.04933762177824974, -0.047778837382793427, -0.04622005298733711, -0.0446612685918808, -0.043102484196424484, -0.04154369980096817, -0.039984915405511856, -0.03842613101005554, -0.03686734661459923, -0.035308562219142914, -0.0337497778236866, -0.032190993428230286, -0.03063220903277397, -0.029073424637317657, -0.027514640241861343, -0.02595585584640503, -0.024397071450948715, -0.0228382870554924, -0.021279502660036087, -0.019720718264579773, -0.01816193386912346, -0.016603149473667145, -0.01504436507821083, -0.013485580682754517, -0.011926796287298203, -0.010368011891841888, -0.008809227496385574, -0.00725044310092926, -0.005691658705472946, -0.004132874310016632, -0.002574089914560318, -0.001015305519104004, 0.0005434788763523102, 0.0021022632718086243, 0.0036610476672649384, 0.0052198320627212524, 0.0067786164581775665, 0.00833740085363388, 0.009896185249090195, 0.011454969644546509, 0.013013754040002823, 0.014572538435459137, 0.01613132283091545, 0.017690107226371765, 0.01924889162182808, 0.020807676017284393, 0.022366460412740707, 0.02392524480819702, 0.025484029203653336, 0.02704281359910965, 0.028601597994565964, 0.030160382390022278, 0.03171916678547859, 0.033277951180934906, 0.03483673557639122, 0.036395519971847534, 0.03795430436730385, 0.03951308876276016, 0.041071873158216476, 0.04263065755367279, 0.044189441949129105, 0.04574822634458542, 0.04730701074004173, 0.04886579513549805]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 10.0, 6.0, 14.0, 11.0, 20.0, 17.0, 14.0, 20.0, 19.0, 26.0, 34.0, 37.0, 35.0, 26.0, 39.0, 50.0, 48.0, 45.0, 53.0, 36.0, 51.0, 45.0, 38.0, 32.0, 24.0, 33.0, 21.0, 23.0, 35.0, 19.0, 20.0, 13.0, 14.0, 10.0, 5.0, 9.0, 9.0, 9.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.3125, -93.986328125, -90.66015625, -87.333984375, -84.0078125, -80.681640625, -77.35546875, -74.029296875, -70.703125, -67.376953125, -64.05078125, -60.724609375, -57.3984375, -54.072265625, -50.74609375, -47.419921875, -44.09375, -40.767578125, -37.44140625, -34.115234375, -30.7890625, -27.462890625, -24.13671875, -20.810546875, -17.484375, -14.158203125, -10.83203125, -7.505859375, -4.1796875, -0.853515625, 2.47265625, 5.798828125, 9.125, 12.451171875, 15.77734375, 19.103515625, 22.4296875, 25.755859375, 29.08203125, 32.408203125, 35.734375, 39.060546875, 42.38671875, 45.712890625, 49.0390625, 52.365234375, 55.69140625, 59.017578125, 62.34375, 65.669921875, 68.99609375, 72.322265625, 75.6484375, 78.974609375, 82.30078125, 85.626953125, 88.953125, 92.279296875, 95.60546875, 98.931640625, 102.2578125, 105.583984375, 108.91015625, 112.236328125, 115.5625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 8.0, 10.0, 14.0, 13.0, 15.0, 18.0, 23.0, 28.0, 35.0, 48.0, 90.0, 117.0, 224.0, 382.0, 960.0, 4012.0, 25396.0, 192836.0, 590543.0, 201384.0, 26223.0, 4095.0, 1046.0, 378.0, 210.0, 113.0, 70.0, 59.0, 56.0, 30.0, 25.0, 19.0, 11.0, 10.0, 8.0, 9.0, 5.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.341064453125, -17.69775390625, -17.054443359375, -16.4111328125, -15.767822265625, -15.12451171875, -14.481201171875, -13.837890625, -13.194580078125, -12.55126953125, -11.907958984375, -11.2646484375, -10.621337890625, -9.97802734375, -9.334716796875, -8.69140625, -8.048095703125, -7.40478515625, -6.761474609375, -6.1181640625, -5.474853515625, -4.83154296875, -4.188232421875, -3.544921875, -2.901611328125, -2.25830078125, -1.614990234375, -0.9716796875, -0.328369140625, 0.31494140625, 0.958251953125, 1.6015625, 2.244873046875, 2.88818359375, 3.531494140625, 4.1748046875, 4.818115234375, 5.46142578125, 6.104736328125, 6.748046875, 7.391357421875, 8.03466796875, 8.677978515625, 9.3212890625, 9.964599609375, 10.60791015625, 11.251220703125, 11.89453125, 12.537841796875, 13.18115234375, 13.824462890625, 14.4677734375, 15.111083984375, 15.75439453125, 16.397705078125, 17.041015625, 17.684326171875, 18.32763671875, 18.970947265625, 19.6142578125, 20.257568359375, 20.90087890625, 21.544189453125, 22.1875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 7.0, 9.0, 5.0, 8.0, 8.0, 10.0, 20.0, 20.0, 30.0, 36.0, 44.0, 56.0, 47.0, 61.0, 78.0, 183.0, 2013.0, 52.0, 46.0, 53.0, 57.0, 51.0, 46.0, 25.0, 21.0, 24.0, 15.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-217.5, -211.12109375, -204.7421875, -198.36328125, -191.984375, -185.60546875, -179.2265625, -172.84765625, -166.46875, -160.08984375, -153.7109375, -147.33203125, -140.953125, -134.57421875, -128.1953125, -121.81640625, -115.4375, -109.05859375, -102.6796875, -96.30078125, -89.921875, -83.54296875, -77.1640625, -70.78515625, -64.40625, -58.02734375, -51.6484375, -45.26953125, -38.890625, -32.51171875, -26.1328125, -19.75390625, -13.375, -6.99609375, -0.6171875, 5.76171875, 12.140625, 18.51953125, 24.8984375, 31.27734375, 37.65625, 44.03515625, 50.4140625, 56.79296875, 63.171875, 69.55078125, 75.9296875, 82.30859375, 88.6875, 95.06640625, 101.4453125, 107.82421875, 114.203125, 120.58203125, 126.9609375, 133.33984375, 139.71875, 146.09765625, 152.4765625, 158.85546875, 165.234375, 171.61328125, 177.9921875, 184.37109375, 190.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 1.0, 7.0, 9.0, 25.0, 37.0, 42.0, 70.0, 104.0, 233.0, 420.0, 824.0, 2118.0, 9587.0, 178737.0, 2872665.0, 72283.0, 5439.0, 1589.0, 667.0, 336.0, 177.0, 97.0, 57.0, 50.0, 33.0, 22.0, 17.0, 16.0, 9.0, 9.0, 6.0, 6.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.265625, -25.400634765625, -24.53564453125, -23.670654296875, -22.8056640625, -21.940673828125, -21.07568359375, -20.210693359375, -19.345703125, -18.480712890625, -17.61572265625, -16.750732421875, -15.8857421875, -15.020751953125, -14.15576171875, -13.290771484375, -12.42578125, -11.560791015625, -10.69580078125, -9.830810546875, -8.9658203125, -8.100830078125, -7.23583984375, -6.370849609375, -5.505859375, -4.640869140625, -3.77587890625, -2.910888671875, -2.0458984375, -1.180908203125, -0.31591796875, 0.549072265625, 1.4140625, 2.279052734375, 3.14404296875, 4.009033203125, 4.8740234375, 5.739013671875, 6.60400390625, 7.468994140625, 8.333984375, 9.198974609375, 10.06396484375, 10.928955078125, 11.7939453125, 12.658935546875, 13.52392578125, 14.388916015625, 15.25390625, 16.118896484375, 16.98388671875, 17.848876953125, 18.7138671875, 19.578857421875, 20.44384765625, 21.308837890625, 22.173828125, 23.038818359375, 23.90380859375, 24.768798828125, 25.6337890625, 26.498779296875, 27.36376953125, 28.228759765625, 29.09375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 9.0, 8.0, 8.0, 23.0, 45.0, 80.0, 124.0, 201.0, 188.0, 142.0, 81.0, 36.0, 22.0, 6.0, 4.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.8191223144531, -348.33062744140625, -339.8421325683594, -331.3536376953125, -322.8651428222656, -314.37664794921875, -305.8881530761719, -297.399658203125, -288.9111633300781, -280.42266845703125, -271.9341735839844, -263.4456787109375, -254.95718383789062, -246.46868896484375, -237.98019409179688, -229.49169921875, -221.00318908691406, -212.5146942138672, -204.0261993408203, -195.53770446777344, -187.04920959472656, -178.5607147216797, -170.07220458984375, -161.58370971679688, -153.09521484375, -144.60671997070312, -136.11822509765625, -127.62973022460938, -119.1412353515625, -110.65274047851562, -102.16423797607422, -93.67574310302734, -85.187255859375, -76.69876098632812, -68.21026611328125, -59.72176742553711, -51.233272552490234, -42.74477767944336, -34.25627899169922, -25.767784118652344, -17.27928924560547, -8.790793418884277, -0.30229759216308594, 8.186199188232422, 16.674694061279297, 25.163188934326172, 33.65168762207031, 42.14018249511719, 50.62867736816406, 59.11717224121094, 67.60566711425781, 76.09416198730469, 84.58265686035156, 93.07115173339844, 101.55965423583984, 110.04814910888672, 118.5366439819336, 127.02513885498047, 135.51364135742188, 144.00213623046875, 152.49063110351562, 160.9791259765625, 169.46762084960938, 177.95611572265625, 186.44461059570312]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 8.0, 6.0, 9.0, 17.0, 28.0, 14.0, 18.0, 24.0, 13.0, 26.0, 34.0, 27.0, 35.0, 51.0, 47.0, 46.0, 39.0, 42.0, 32.0, 42.0, 50.0, 42.0, 45.0, 46.0, 29.0, 24.0, 24.0, 28.0, 16.0, 18.0, 16.0, 15.0, 13.0, 15.0, 8.0, 7.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-204.6805419921875, -198.47418212890625, -192.267822265625, -186.06146240234375, -179.8551025390625, -173.64874267578125, -167.4423828125, -161.23602294921875, -155.0296630859375, -148.82330322265625, -142.616943359375, -136.41058349609375, -130.2042236328125, -123.99786376953125, -117.79151153564453, -111.58515167236328, -105.37879943847656, -99.17243957519531, -92.96607971191406, -86.75971984863281, -80.55335998535156, -74.34700012207031, -68.1406478881836, -61.934288024902344, -55.727928161621094, -49.521568298339844, -43.315208435058594, -37.10885238647461, -30.90249252319336, -24.69613265991211, -18.489776611328125, -12.283416748046875, -6.0770416259765625, 0.1293172836303711, 6.335676193237305, 12.542034149169922, 18.748394012451172, 24.954753875732422, 31.161109924316406, 37.367469787597656, 43.573829650878906, 49.780189514160156, 55.986549377441406, 62.19290542602539, 68.39926147460938, 74.60562133789062, 80.81198120117188, 87.01834106445312, 93.22470092773438, 99.43106079101562, 105.63742065429688, 111.84378051757812, 118.05014038085938, 124.25650024414062, 130.46286010742188, 136.66921997070312, 142.87557983398438, 149.08193969726562, 155.28829956054688, 161.49465942382812, 167.70101928710938, 173.90737915039062, 180.11373901367188, 186.32009887695312, 192.5264434814453]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 9.0, 9.0, 19.0, 28.0, 26.0, 45.0, 73.0, 85.0, 134.0, 157.0, 231.0, 312.0, 389.0, 563.0, 852.0, 1230.0, 1801.0, 2883.0, 4639.0, 7540.0, 1009998.0, 6135.0, 3795.0, 2404.0, 1545.0, 1060.0, 732.0, 515.0, 373.0, 267.0, 197.0, 120.0, 106.0, 95.0, 57.0, 31.0, 30.0, 22.0, 16.0, 7.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.06478500366211, -32.90257263183594, -31.740360260009766, -30.578147888183594, -29.415935516357422, -28.25372314453125, -27.091510772705078, -25.929298400878906, -24.767086029052734, -23.604873657226562, -22.44266128540039, -21.28044891357422, -20.118236541748047, -18.956024169921875, -17.793811798095703, -16.63159942626953, -15.469385147094727, -14.307172775268555, -13.144960403442383, -11.982748031616211, -10.820535659790039, -9.658323287963867, -8.496109962463379, -7.333897590637207, -6.171685218811035, -5.009472846984863, -3.8472602367401123, -2.6850476264953613, -1.5228352546691895, -0.3606228828430176, 0.8015899658203125, 1.9638023376464844, 3.1260147094726562, 4.288227081298828, 5.450439453125, 6.61265230178833, 7.774864673614502, 8.937076568603516, 10.099289894104004, 11.261502265930176, 12.423714637756348, 13.58592700958252, 14.748139381408691, 15.91035270690918, 17.07256507873535, 18.234777450561523, 19.396989822387695, 20.559202194213867, 21.72141456604004, 22.88362693786621, 24.045839309692383, 25.208051681518555, 26.370264053344727, 27.5324764251709, 28.694690704345703, 29.856903076171875, 31.019115447998047, 32.18132781982422, 33.34354019165039, 34.50575256347656, 35.667964935302734, 36.830177307128906, 37.99238967895508, 39.15460205078125, 40.31681442260742]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 4.0, 10.0, 12.0, 15.0, 31.0, 46.0, 91.0, 194.0, 7810.0, 51454540.0, 243.0, 60.0, 32.0, 27.0, 14.0, 8.0, 3.0, 6.0, 9.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2362.27099609375, -2278.351318359375, -2194.431884765625, -2110.51220703125, -2026.592529296875, -1942.6729736328125, -1858.75341796875, -1774.833740234375, -1690.9141845703125, -1606.99462890625, -1523.074951171875, -1439.1553955078125, -1355.23583984375, -1271.316162109375, -1187.3966064453125, -1103.47705078125, -1019.557373046875, -935.6377563476562, -851.7181396484375, -767.798583984375, -683.8789672851562, -599.9593505859375, -516.039794921875, -432.12017822265625, -348.2005615234375, -264.28094482421875, -180.36135864257812, -96.44175720214844, -12.52215576171875, 71.3974609375, 155.31704711914062, 239.23663330078125, 323.156494140625, 407.07611083984375, 490.9956970214844, 574.915283203125, 658.8348999023438, 742.7545166015625, 826.674072265625, 910.5936889648438, 994.5133056640625, 1078.432861328125, 1162.3525390625, 1246.2720947265625, 1330.191650390625, 1414.111328125, 1498.0308837890625, 1581.950439453125, 1665.8701171875, 1749.7896728515625, 1833.7093505859375, 1917.62890625, 2001.548583984375, 2085.46826171875, 2169.3876953125, 2253.307373046875, 2337.22705078125, 2421.146728515625, 2505.066162109375, 2588.98583984375, 2672.905517578125, 2756.8251953125, 2840.74462890625, 2924.664306640625, 3008.583740234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 11.0, 24.0, 34.0, 34.0, 67.0, 76.0, 112.0, 188.0, 300.0, 446.0, 733.0, 1131.0, 1762.0, 2919.0, 5014.0, 8500.0, 14903.0, 26104.0, 47216.0, 86384.0, 158534.0, 283759.0, 469168.0, 3488476.0, 812460.0, 383346.0, 222875.0, 122794.0, 67034.0, 36986.0, 20836.0, 11766.0, 6885.0, 4123.0, 2420.0, 1527.0, 918.0, 543.0, 354.0, 227.0, 133.0, 107.0, 67.0, 39.0, 27.0, 22.0, 22.0, 11.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.4609375, -3.355377197265625, -3.24981689453125, -3.144256591796875, -3.0386962890625, -2.933135986328125, -2.82757568359375, -2.722015380859375, -2.616455078125, -2.510894775390625, -2.40533447265625, -2.299774169921875, -2.1942138671875, -2.088653564453125, -1.98309326171875, -1.877532958984375, -1.77197265625, -1.666412353515625, -1.56085205078125, -1.455291748046875, -1.3497314453125, -1.244171142578125, -1.13861083984375, -1.033050537109375, -0.927490234375, -0.821929931640625, -0.71636962890625, -0.610809326171875, -0.5052490234375, -0.399688720703125, -0.29412841796875, -0.188568115234375, -0.0830078125, 0.022552490234375, 0.12811279296875, 0.233673095703125, 0.3392333984375, 0.444793701171875, 0.55035400390625, 0.655914306640625, 0.761474609375, 0.867034912109375, 0.97259521484375, 1.078155517578125, 1.1837158203125, 1.289276123046875, 1.39483642578125, 1.500396728515625, 1.60595703125, 1.711517333984375, 1.81707763671875, 1.922637939453125, 2.0281982421875, 2.133758544921875, 2.23931884765625, 2.344879150390625, 2.450439453125, 2.555999755859375, 2.66156005859375, 2.767120361328125, 2.8726806640625, 2.978240966796875, 3.08380126953125, 3.189361572265625, 3.294921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 2.0, 4.0, 5.0, 7.0, 20.0, 19.0, 19.0, 16.0, 15.0, 15.0, 19.0, 20.0, 30.0, 27.0, 37.0, 36.0, 46.0, 48.0, 47.0, 768.0, 337.0, 46.0, 31.0, 47.0, 46.0, 46.0, 38.0, 33.0, 26.0, 23.0, 27.0, 13.0, 21.0, 12.0, 18.0, 9.0, 8.0, 6.0, 9.0, 3.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-59.5, -57.84033203125, -56.1806640625, -54.52099609375, -52.861328125, -51.20166015625, -49.5419921875, -47.88232421875, -46.22265625, -44.56298828125, -42.9033203125, -41.24365234375, -39.583984375, -37.92431640625, -36.2646484375, -34.60498046875, -32.9453125, -31.28564453125, -29.6259765625, -27.96630859375, -26.306640625, -24.64697265625, -22.9873046875, -21.32763671875, -19.66796875, -18.00830078125, -16.3486328125, -14.68896484375, -13.029296875, -11.36962890625, -9.7099609375, -8.05029296875, -6.390625, -4.73095703125, -3.0712890625, -1.41162109375, 0.248046875, 1.90771484375, 3.5673828125, 5.22705078125, 6.88671875, 8.54638671875, 10.2060546875, 11.86572265625, 13.525390625, 15.18505859375, 16.8447265625, 18.50439453125, 20.1640625, 21.82373046875, 23.4833984375, 25.14306640625, 26.802734375, 28.46240234375, 30.1220703125, 31.78173828125, 33.44140625, 35.10107421875, 36.7607421875, 38.42041015625, 40.080078125, 41.73974609375, 43.3994140625, 45.05908203125, 46.71875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 10.0, 18.0, 22.0, 47.0, 50.0, 86.0, 119.0, 168.0, 223.0, 433.0, 613.0, 1102.0, 1715.0, 3124.0, 5559.0, 10213.0, 20035.0, 42474.0, 98458.0, 240489.0, 572405.0, 4033053.0, 714092.0, 313264.0, 126891.0, 54200.0, 25064.0, 12106.0, 6455.0, 3519.0, 2124.0, 1238.0, 705.0, 453.0, 280.0, 196.0, 105.0, 94.0, 66.0, 47.0, 26.0, 17.0, 17.0, 14.0, 13.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.728515625, -4.57421875, -4.419921875, -4.265625, -4.111328125, -3.95703125, -3.802734375, -3.6484375, -3.494140625, -3.33984375, -3.185546875, -3.03125, -2.876953125, -2.72265625, -2.568359375, -2.4140625, -2.259765625, -2.10546875, -1.951171875, -1.796875, -1.642578125, -1.48828125, -1.333984375, -1.1796875, -1.025390625, -0.87109375, -0.716796875, -0.5625, -0.408203125, -0.25390625, -0.099609375, 0.0546875, 0.208984375, 0.36328125, 0.517578125, 0.671875, 0.826171875, 0.98046875, 1.134765625, 1.2890625, 1.443359375, 1.59765625, 1.751953125, 1.90625, 2.060546875, 2.21484375, 2.369140625, 2.5234375, 2.677734375, 2.83203125, 2.986328125, 3.140625, 3.294921875, 3.44921875, 3.603515625, 3.7578125, 3.912109375, 4.06640625, 4.220703125, 4.375, 4.529296875, 4.68359375, 4.837890625, 4.9921875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 3.0, 4.0, 4.0, 13.0, 12.0, 13.0, 22.0, 27.0, 24.0, 43.0, 55.0, 73.0, 79.0, 118.0, 1089.0, 83.0, 82.0, 69.0, 51.0, 25.0, 28.0, 22.0, 17.0, 9.0, 10.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-98.375, -95.3232421875, -92.271484375, -89.2197265625, -86.16796875, -83.1162109375, -80.064453125, -77.0126953125, -73.9609375, -70.9091796875, -67.857421875, -64.8056640625, -61.75390625, -58.7021484375, -55.650390625, -52.5986328125, -49.546875, -46.4951171875, -43.443359375, -40.3916015625, -37.33984375, -34.2880859375, -31.236328125, -28.1845703125, -25.1328125, -22.0810546875, -19.029296875, -15.9775390625, -12.92578125, -9.8740234375, -6.822265625, -3.7705078125, -0.71875, 2.3330078125, 5.384765625, 8.4365234375, 11.48828125, 14.5400390625, 17.591796875, 20.6435546875, 23.6953125, 26.7470703125, 29.798828125, 32.8505859375, 35.90234375, 38.9541015625, 42.005859375, 45.0576171875, 48.109375, 51.1611328125, 54.212890625, 57.2646484375, 60.31640625, 63.3681640625, 66.419921875, 69.4716796875, 72.5234375, 75.5751953125, 78.626953125, 81.6787109375, 84.73046875, 87.7822265625, 90.833984375, 93.8857421875, 96.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 10.0, 22.0, 32.0, 35.0, 56.0, 45.0, 54.0, 86.0, 106.0, 192.0, 254.0, 464.0, 781.0, 1547.0, 3481.0, 8875.0, 29898.0, 126422.0, 5904893.0, 159477.0, 36175.0, 10478.0, 3948.0, 1730.0, 906.0, 506.0, 263.0, 156.0, 116.0, 107.0, 60.0, 57.0, 48.0, 43.0, 31.0, 12.0, 7.0, 9.0, 10.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.984375, -21.156982421875, -20.32958984375, -19.502197265625, -18.6748046875, -17.847412109375, -17.02001953125, -16.192626953125, -15.365234375, -14.537841796875, -13.71044921875, -12.883056640625, -12.0556640625, -11.228271484375, -10.40087890625, -9.573486328125, -8.74609375, -7.918701171875, -7.09130859375, -6.263916015625, -5.4365234375, -4.609130859375, -3.78173828125, -2.954345703125, -2.126953125, -1.299560546875, -0.47216796875, 0.355224609375, 1.1826171875, 2.010009765625, 2.83740234375, 3.664794921875, 4.4921875, 5.319580078125, 6.14697265625, 6.974365234375, 7.8017578125, 8.629150390625, 9.45654296875, 10.283935546875, 11.111328125, 11.938720703125, 12.76611328125, 13.593505859375, 14.4208984375, 15.248291015625, 16.07568359375, 16.903076171875, 17.73046875, 18.557861328125, 19.38525390625, 20.212646484375, 21.0400390625, 21.867431640625, 22.69482421875, 23.522216796875, 24.349609375, 25.177001953125, 26.00439453125, 26.831787109375, 27.6591796875, 28.486572265625, 29.31396484375, 30.141357421875, 30.96875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 17.0, 15.0, 22.0, 32.0, 26.0, 39.0, 50.0, 57.0, 53.0, 76.0, 154.0, 1044.0, 71.0, 57.0, 58.0, 49.0, 41.0, 27.0, 27.0, 18.0, 29.0, 13.0, 9.0, 7.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-130.875, -126.66796875, -122.4609375, -118.25390625, -114.046875, -109.83984375, -105.6328125, -101.42578125, -97.21875, -93.01171875, -88.8046875, -84.59765625, -80.390625, -76.18359375, -71.9765625, -67.76953125, -63.5625, -59.35546875, -55.1484375, -50.94140625, -46.734375, -42.52734375, -38.3203125, -34.11328125, -29.90625, -25.69921875, -21.4921875, -17.28515625, -13.078125, -8.87109375, -4.6640625, -0.45703125, 3.75, 7.95703125, 12.1640625, 16.37109375, 20.578125, 24.78515625, 28.9921875, 33.19921875, 37.40625, 41.61328125, 45.8203125, 50.02734375, 54.234375, 58.44140625, 62.6484375, 66.85546875, 71.0625, 75.26953125, 79.4765625, 83.68359375, 87.890625, 92.09765625, 96.3046875, 100.51171875, 104.71875, 108.92578125, 113.1328125, 117.33984375, 121.546875, 125.75390625, 129.9609375, 134.16796875, 138.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 13.0, 42.0, 291.0, 532.0, 80.0, 22.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-433.836181640625, -423.2879943847656, -412.7398376464844, -402.191650390625, -391.64349365234375, -381.0953063964844, -370.547119140625, -359.99896240234375, -349.4507751464844, -338.902587890625, -328.35443115234375, -317.8062438964844, -307.258056640625, -296.70989990234375, -286.1617126464844, -275.613525390625, -265.06536865234375, -254.51719665527344, -243.96902465820312, -233.42083740234375, -222.87266540527344, -212.32449340820312, -201.77630615234375, -191.22813415527344, -180.67996215820312, -170.1317901611328, -159.5836181640625, -149.03543090820312, -138.4872589111328, -127.9390869140625, -117.39090728759766, -106.84272766113281, -96.29452514648438, -85.74635314941406, -75.19817352294922, -64.64999389648438, -54.10182189941406, -43.553646087646484, -33.005470275878906, -22.457290649414062, -11.90911865234375, -1.3609428405761719, 9.187232971191406, 19.735408782958984, 30.283584594726562, 40.83176040649414, 51.37993621826172, 61.92811584472656, 72.47628784179688, 83.02445983886719, 93.57263946533203, 104.12081909179688, 114.66899108886719, 125.2171630859375, 135.76535034179688, 146.3135223388672, 156.8616943359375, 167.4098663330078, 177.95803833007812, 188.5062255859375, 199.0543975830078, 209.60256958007812, 220.1507568359375, 230.6989288330078, 241.24710083007812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 5.0, 8.0, 15.0, 14.0, 25.0, 60.0, 125.0, 189.0, 217.0, 151.0, 85.0, 40.0, 21.0, 15.0, 4.0, 3.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.3887939453125, -619.57861328125, -603.7684326171875, -587.9581909179688, -572.1480102539062, -556.3378295898438, -540.5276489257812, -524.7174072265625, -508.9072265625, -493.0970458984375, -477.2868347167969, -461.4766540527344, -445.66644287109375, -429.85626220703125, -414.0460510253906, -398.2358703613281, -382.4256591796875, -366.615478515625, -350.8052673339844, -334.9950866699219, -319.18487548828125, -303.37469482421875, -287.5644836425781, -271.7543029785156, -255.94412231445312, -240.13392639160156, -224.32373046875, -208.51353454589844, -192.70333862304688, -176.89315795898438, -161.08294677734375, -145.27276611328125, -129.46255493164062, -113.65235900878906, -97.8421630859375, -82.03196716308594, -66.22177124023438, -50.411582946777344, -34.60138702392578, -18.79119110107422, -2.9809951782226562, 12.82919979095459, 28.639394760131836, 44.449588775634766, 60.25978469848633, 76.06997680664062, 91.88017272949219, 107.69036865234375, 123.50056457519531, 139.31076049804688, 155.12095642089844, 170.93115234375, 186.74134826660156, 202.55154418945312, 218.36172485351562, 234.17193603515625, 249.98211669921875, 265.79229736328125, 281.6025085449219, 297.4126892089844, 313.222900390625, 329.0330810546875, 344.8432922363281, 360.6534729003906, 376.46368408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 5.0, 5.0, 17.0, 21.0, 24.0, 31.0, 49.0, 74.0, 90.0, 170.0, 226.0, 436.0, 825.0, 1569.0, 3650.0, 11221.0, 68567.0, 4030834.0, 59219.0, 10186.0, 3540.0, 1576.0, 768.0, 437.0, 278.0, 148.0, 95.0, 62.0, 40.0, 29.0, 28.0, 11.0, 14.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1796875, -1.145477294921875, -1.11126708984375, -1.077056884765625, -1.0428466796875, -1.008636474609375, -0.97442626953125, -0.940216064453125, -0.906005859375, -0.871795654296875, -0.83758544921875, -0.803375244140625, -0.7691650390625, -0.734954833984375, -0.70074462890625, -0.666534423828125, -0.63232421875, -0.598114013671875, -0.56390380859375, -0.529693603515625, -0.4954833984375, -0.461273193359375, -0.42706298828125, -0.392852783203125, -0.358642578125, -0.324432373046875, -0.29022216796875, -0.256011962890625, -0.2218017578125, -0.187591552734375, -0.15338134765625, -0.119171142578125, -0.0849609375, -0.050750732421875, -0.01654052734375, 0.017669677734375, 0.0518798828125, 0.086090087890625, 0.12030029296875, 0.154510498046875, 0.188720703125, 0.222930908203125, 0.25714111328125, 0.291351318359375, 0.3255615234375, 0.359771728515625, 0.39398193359375, 0.428192138671875, 0.46240234375, 0.496612548828125, 0.53082275390625, 0.565032958984375, 0.5992431640625, 0.633453369140625, 0.66766357421875, 0.701873779296875, 0.736083984375, 0.770294189453125, 0.80450439453125, 0.838714599609375, 0.8729248046875, 0.907135009765625, 0.94134521484375, 0.975555419921875, 1.009765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 9.0, 12.0, 12.0, 13.0, 15.0, 18.0, 784.0, 21.0, 23.0, 7.0, 12.0, 4.0, 9.0, 9.0, 8.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.02984619140625, -0.9962158203125, -0.96258544921875, -0.928955078125, -0.89532470703125, -0.8616943359375, -0.82806396484375, -0.79443359375, -0.76080322265625, -0.7271728515625, -0.69354248046875, -0.659912109375, -0.62628173828125, -0.5926513671875, -0.55902099609375, -0.525390625, -0.49176025390625, -0.4581298828125, -0.42449951171875, -0.390869140625, -0.35723876953125, -0.3236083984375, -0.28997802734375, -0.25634765625, -0.22271728515625, -0.1890869140625, -0.15545654296875, -0.121826171875, -0.08819580078125, -0.0545654296875, -0.02093505859375, 0.0126953125, 0.04632568359375, 0.0799560546875, 0.11358642578125, 0.147216796875, 0.18084716796875, 0.2144775390625, 0.24810791015625, 0.28173828125, 0.31536865234375, 0.3489990234375, 0.38262939453125, 0.416259765625, 0.44989013671875, 0.4835205078125, 0.51715087890625, 0.55078125, 0.58441162109375, 0.6180419921875, 0.65167236328125, 0.685302734375, 0.71893310546875, 0.7525634765625, 0.78619384765625, 0.81982421875, 0.85345458984375, 0.8870849609375, 0.92071533203125, 0.954345703125, 0.98797607421875, 1.0216064453125, 1.05523681640625, 1.0888671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 11.0, 13.0, 16.0, 34.0, 58.0, 80.0, 191.0, 418.0, 1208.0, 5847.0, 113533.0, 4022387.0, 43808.0, 4088.0, 1176.0, 570.0, 320.0, 150.0, 123.0, 77.0, 36.0, 26.0, 20.0, 19.0, 13.0, 7.0, 16.0, 6.0, 2.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.068359375, -2.00244140625, -1.9365234375, -1.87060546875, -1.8046875, -1.73876953125, -1.6728515625, -1.60693359375, -1.541015625, -1.47509765625, -1.4091796875, -1.34326171875, -1.27734375, -1.21142578125, -1.1455078125, -1.07958984375, -1.013671875, -0.94775390625, -0.8818359375, -0.81591796875, -0.75, -0.68408203125, -0.6181640625, -0.55224609375, -0.486328125, -0.42041015625, -0.3544921875, -0.28857421875, -0.22265625, -0.15673828125, -0.0908203125, -0.02490234375, 0.041015625, 0.10693359375, 0.1728515625, 0.23876953125, 0.3046875, 0.37060546875, 0.4365234375, 0.50244140625, 0.568359375, 0.63427734375, 0.7001953125, 0.76611328125, 0.83203125, 0.89794921875, 0.9638671875, 1.02978515625, 1.095703125, 1.16162109375, 1.2275390625, 1.29345703125, 1.359375, 1.42529296875, 1.4912109375, 1.55712890625, 1.623046875, 1.68896484375, 1.7548828125, 1.82080078125, 1.88671875, 1.95263671875, 2.0185546875, 2.08447265625, 2.150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 12.0, 21.0, 41.0, 69.0, 180.0, 707.0, 2449.0, 348.0, 116.0, 56.0, 28.0, 20.0, 10.0, 5.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.51806640625, -0.48816680908203125, -0.4582672119140625, -0.42836761474609375, -0.398468017578125, -0.36856842041015625, -0.3386688232421875, -0.30876922607421875, -0.27886962890625, -0.24897003173828125, -0.2190704345703125, -0.18917083740234375, -0.159271240234375, -0.12937164306640625, -0.0994720458984375, -0.06957244873046875, -0.0396728515625, -0.00977325439453125, 0.0201263427734375, 0.05002593994140625, 0.079925537109375, 0.10982513427734375, 0.1397247314453125, 0.16962432861328125, 0.19952392578125, 0.22942352294921875, 0.2593231201171875, 0.28922271728515625, 0.319122314453125, 0.34902191162109375, 0.3789215087890625, 0.40882110595703125, 0.438720703125, 0.46862030029296875, 0.4985198974609375, 0.5284194946289062, 0.558319091796875, 0.5882186889648438, 0.6181182861328125, 0.6480178833007812, 0.67791748046875, 0.7078170776367188, 0.7377166748046875, 0.7676162719726562, 0.797515869140625, 0.8274154663085938, 0.8573150634765625, 0.8872146606445312, 0.9171142578125, 0.9470138549804688, 0.9769134521484375, 1.0068130493164062, 1.036712646484375, 1.0666122436523438, 1.0965118408203125, 1.1264114379882812, 1.15631103515625, 1.1862106323242188, 1.2161102294921875, 1.2460098266601562, 1.275909423828125, 1.3058090209960938, 1.3357086181640625, 1.3656082153320312, 1.3955078125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 7.0, 35.0, 541.0, 393.0, 25.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3236536979675293, -2.0313642024993896, -1.73907470703125, -1.4467853307724, -1.1544958353042603, -0.8622063398361206, -0.5699169635772705, -0.27762746810913086, 0.014662027359008789, 0.30695149302482605, 0.5992409586906433, 0.8915303945541382, 1.1838198900222778, 1.4761093854904175, 1.7683987617492676, 2.0606882572174072, 2.352977752685547, 2.6452672481536865, 2.937556743621826, 3.2298460006713867, 3.5221357345581055, 3.814424991607666, 4.106714248657227, 4.399003982543945, 4.691293716430664, 4.983582973480225, 5.275872707366943, 5.568161964416504, 5.860451698303223, 6.152740955352783, 6.445030212402344, 6.7373199462890625, 7.029608726501465, 7.321897983551025, 7.614187717437744, 7.906476974487305, 8.198766708374023, 8.491056442260742, 8.783345222473145, 9.075634956359863, 9.367924690246582, 9.6602144241333, 9.952503204345703, 10.244792938232422, 10.53708267211914, 10.82937240600586, 11.121661186218262, 11.41395092010498, 11.706239700317383, 11.998529434204102, 12.290818214416504, 12.583107948303223, 12.875397682189941, 13.16768741607666, 13.459976196289062, 13.752265930175781, 14.0445556640625, 14.336845397949219, 14.629134178161621, 14.92142391204834, 15.213713645935059, 15.506003379821777, 15.79829216003418, 16.0905818939209, 16.382871627807617]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 5.0, 6.0, 7.0, 9.0, 9.0, 14.0, 35.0, 44.0, 76.0, 108.0, 131.0, 120.0, 120.0, 91.0, 72.0, 43.0, 19.0, 16.0, 16.0, 7.0, 9.0, 5.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1069557666778564, -2.985807418823242, -2.864659309387207, -2.7435109615325928, -2.6223628520965576, -2.5012145042419434, -2.380066394805908, -2.258918046951294, -2.1377696990966797, -2.0166213512420654, -1.8954732418060303, -1.774324893951416, -1.6531767845153809, -1.5320284366607666, -1.410880208015442, -1.2897319793701172, -1.168583869934082, -1.0474356412887573, -0.9262874126434326, -0.8051391243934631, -0.6839908957481384, -0.5628426671028137, -0.44169437885284424, -0.32054615020751953, -0.19939792156219482, -0.07824967801570892, 0.04289856553077698, 0.16404682397842407, 0.2851950526237488, 0.4063432812690735, 0.527491569519043, 0.6486397981643677, 0.7697882652282715, 0.8909364938735962, 1.012084722518921, 1.1332330703735352, 1.2543811798095703, 1.3755295276641846, 1.4966777563095093, 1.617825984954834, 1.7389742136001587, 1.8601224422454834, 1.981270670890808, 2.102418899536133, 2.223567247390747, 2.3447153568267822, 2.4658637046813965, 2.5870118141174316, 2.708160161972046, 2.82930850982666, 2.9504566192626953, 3.0716049671173096, 3.1927530765533447, 3.313901424407959, 3.435049533843994, 3.5561978816986084, 3.6773462295532227, 3.798494577407837, 3.919642686843872, 4.040791034698486, 4.1619391441345215, 4.283087253570557, 4.40423583984375, 4.525383949279785, 4.64653205871582]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 5.0, 6.0, 11.0, 18.0, 18.0, 28.0, 61.0, 80.0, 115.0, 193.0, 344.0, 567.0, 995.0, 1822.0, 3610.0, 7740.0, 20026.0, 90863.0, 880096.0, 24093.0, 9020.0, 4080.0, 2038.0, 1092.0, 640.0, 382.0, 212.0, 146.0, 94.0, 46.0, 34.0, 16.0, 22.0, 14.0, 5.0, 9.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.6485595703125, -4.508056640625, -4.3675537109375, -4.22705078125, -4.0865478515625, -3.946044921875, -3.8055419921875, -3.6650390625, -3.5245361328125, -3.384033203125, -3.2435302734375, -3.10302734375, -2.9625244140625, -2.822021484375, -2.6815185546875, -2.541015625, -2.4005126953125, -2.260009765625, -2.1195068359375, -1.97900390625, -1.8385009765625, -1.697998046875, -1.5574951171875, -1.4169921875, -1.2764892578125, -1.135986328125, -0.9954833984375, -0.85498046875, -0.7144775390625, -0.573974609375, -0.4334716796875, -0.29296875, -0.1524658203125, -0.011962890625, 0.1285400390625, 0.26904296875, 0.4095458984375, 0.550048828125, 0.6905517578125, 0.8310546875, 0.9715576171875, 1.112060546875, 1.2525634765625, 1.39306640625, 1.5335693359375, 1.674072265625, 1.8145751953125, 1.955078125, 2.0955810546875, 2.236083984375, 2.3765869140625, 2.51708984375, 2.6575927734375, 2.798095703125, 2.9385986328125, 3.0791015625, 3.2196044921875, 3.360107421875, 3.5006103515625, 3.64111328125, 3.7816162109375, 3.922119140625, 4.0626220703125, 4.203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 11.0, 13.0, 13.0, 9.0, 12.0, 14.0, 163.0, 645.0, 19.0, 19.0, 9.0, 8.0, 3.0, 14.0, 6.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9659271240234375, -0.933807373046875, -0.9016876220703125, -0.86956787109375, -0.8374481201171875, -0.805328369140625, -0.7732086181640625, -0.7410888671875, -0.7089691162109375, -0.676849365234375, -0.6447296142578125, -0.61260986328125, -0.5804901123046875, -0.548370361328125, -0.5162506103515625, -0.484130859375, -0.4520111083984375, -0.419891357421875, -0.3877716064453125, -0.35565185546875, -0.3235321044921875, -0.291412353515625, -0.2592926025390625, -0.2271728515625, -0.1950531005859375, -0.162933349609375, -0.1308135986328125, -0.09869384765625, -0.0665740966796875, -0.034454345703125, -0.0023345947265625, 0.02978515625, 0.0619049072265625, 0.094024658203125, 0.1261444091796875, 0.15826416015625, 0.1903839111328125, 0.222503662109375, 0.2546234130859375, 0.2867431640625, 0.3188629150390625, 0.350982666015625, 0.3831024169921875, 0.41522216796875, 0.4473419189453125, 0.479461669921875, 0.5115814208984375, 0.543701171875, 0.5758209228515625, 0.607940673828125, 0.6400604248046875, 0.67218017578125, 0.7042999267578125, 0.736419677734375, 0.7685394287109375, 0.8006591796875, 0.8327789306640625, 0.864898681640625, 0.8970184326171875, 0.92913818359375, 0.9612579345703125, 0.993377685546875, 1.0254974365234375, 1.0576171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 13.0, 18.0, 22.0, 36.0, 55.0, 76.0, 92.0, 134.0, 196.0, 243.0, 423.0, 652.0, 1515.0, 4284.0, 14743.0, 66668.0, 482137.0, 400705.0, 56579.0, 12811.0, 3866.0, 1444.0, 644.0, 350.0, 251.0, 152.0, 107.0, 97.0, 61.0, 37.0, 46.0, 27.0, 22.0, 7.0, 16.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.2234954833984375, -2.159881591796875, -2.0962677001953125, -2.03265380859375, -1.9690399169921875, -1.905426025390625, -1.8418121337890625, -1.7781982421875, -1.7145843505859375, -1.650970458984375, -1.5873565673828125, -1.52374267578125, -1.4601287841796875, -1.396514892578125, -1.3329010009765625, -1.269287109375, -1.2056732177734375, -1.142059326171875, -1.0784454345703125, -1.01483154296875, -0.9512176513671875, -0.887603759765625, -0.8239898681640625, -0.7603759765625, -0.6967620849609375, -0.633148193359375, -0.5695343017578125, -0.50592041015625, -0.4423065185546875, -0.378692626953125, -0.3150787353515625, -0.25146484375, -0.1878509521484375, -0.124237060546875, -0.0606231689453125, 0.00299072265625, 0.0666046142578125, 0.130218505859375, 0.1938323974609375, 0.2574462890625, 0.3210601806640625, 0.384674072265625, 0.4482879638671875, 0.51190185546875, 0.5755157470703125, 0.639129638671875, 0.7027435302734375, 0.766357421875, 0.8299713134765625, 0.893585205078125, 0.9571990966796875, 1.02081298828125, 1.0844268798828125, 1.148040771484375, 1.2116546630859375, 1.2752685546875, 1.3388824462890625, 1.402496337890625, 1.4661102294921875, 1.52972412109375, 1.5933380126953125, 1.656951904296875, 1.7205657958984375, 1.7841796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 6.0, 3.0, 16.0, 15.0, 12.0, 15.0, 16.0, 23.0, 20.0, 23.0, 34.0, 30.0, 33.0, 40.0, 50.0, 42.0, 46.0, 42.0, 46.0, 49.0, 53.0, 45.0, 42.0, 39.0, 28.0, 27.0, 25.0, 30.0, 25.0, 22.0, 22.0, 23.0, 9.0, 9.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.34375, -2.264617919921875, -2.18548583984375, -2.106353759765625, -2.0272216796875, -1.948089599609375, -1.86895751953125, -1.789825439453125, -1.710693359375, -1.631561279296875, -1.55242919921875, -1.473297119140625, -1.3941650390625, -1.315032958984375, -1.23590087890625, -1.156768798828125, -1.07763671875, -0.998504638671875, -0.91937255859375, -0.840240478515625, -0.7611083984375, -0.681976318359375, -0.60284423828125, -0.523712158203125, -0.444580078125, -0.365447998046875, -0.28631591796875, -0.207183837890625, -0.1280517578125, -0.048919677734375, 0.03021240234375, 0.109344482421875, 0.1884765625, 0.267608642578125, 0.34674072265625, 0.425872802734375, 0.5050048828125, 0.584136962890625, 0.66326904296875, 0.742401123046875, 0.821533203125, 0.900665283203125, 0.97979736328125, 1.058929443359375, 1.1380615234375, 1.217193603515625, 1.29632568359375, 1.375457763671875, 1.45458984375, 1.533721923828125, 1.61285400390625, 1.691986083984375, 1.7711181640625, 1.850250244140625, 1.92938232421875, 2.008514404296875, 2.087646484375, 2.166778564453125, 2.24591064453125, 2.325042724609375, 2.4041748046875, 2.483306884765625, 2.56243896484375, 2.641571044921875, 2.720703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 12.0, 9.0, 21.0, 22.0, 60.0, 130.0, 316.0, 1017.0, 6693.0, 964147.0, 72429.0, 2749.0, 569.0, 195.0, 86.0, 33.0, 18.0, 14.0, 13.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.69140625, -3.578857421875, -3.46630859375, -3.353759765625, -3.2412109375, -3.128662109375, -3.01611328125, -2.903564453125, -2.791015625, -2.678466796875, -2.56591796875, -2.453369140625, -2.3408203125, -2.228271484375, -2.11572265625, -2.003173828125, -1.890625, -1.778076171875, -1.66552734375, -1.552978515625, -1.4404296875, -1.327880859375, -1.21533203125, -1.102783203125, -0.990234375, -0.877685546875, -0.76513671875, -0.652587890625, -0.5400390625, -0.427490234375, -0.31494140625, -0.202392578125, -0.08984375, 0.022705078125, 0.13525390625, 0.247802734375, 0.3603515625, 0.472900390625, 0.58544921875, 0.697998046875, 0.810546875, 0.923095703125, 1.03564453125, 1.148193359375, 1.2607421875, 1.373291015625, 1.48583984375, 1.598388671875, 1.7109375, 1.823486328125, 1.93603515625, 2.048583984375, 2.1611328125, 2.273681640625, 2.38623046875, 2.498779296875, 2.611328125, 2.723876953125, 2.83642578125, 2.948974609375, 3.0615234375, 3.174072265625, 3.28662109375, 3.399169921875, 3.51171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 8.0, 5.0, 7.0, 3.0, 11.0, 18.0, 18.0, 40.0, 46.0, 80.0, 109.0, 133.0, 140.0, 118.0, 95.0, 70.0, 35.0, 25.0, 15.0, 15.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56978988647461e-05, -7.341429591178894e-05, -7.113069295883179e-05, -6.884709000587463e-05, -6.656348705291748e-05, -6.427988409996033e-05, -6.199628114700317e-05, -5.971267819404602e-05, -5.742907524108887e-05, -5.5145472288131714e-05, -5.286186933517456e-05, -5.057826638221741e-05, -4.8294663429260254e-05, -4.60110604763031e-05, -4.372745752334595e-05, -4.1443854570388794e-05, -3.916025161743164e-05, -3.687664866447449e-05, -3.4593045711517334e-05, -3.230944275856018e-05, -3.0025839805603027e-05, -2.7742236852645874e-05, -2.545863389968872e-05, -2.3175030946731567e-05, -2.0891427993774414e-05, -1.860782504081726e-05, -1.6324222087860107e-05, -1.4040619134902954e-05, -1.17570161819458e-05, -9.473413228988647e-06, -7.189810276031494e-06, -4.906207323074341e-06, -2.6226043701171875e-06, -3.390014171600342e-07, 1.944601535797119e-06, 4.2282044887542725e-06, 6.511807441711426e-06, 8.795410394668579e-06, 1.1079013347625732e-05, 1.3362616300582886e-05, 1.564621925354004e-05, 1.7929822206497192e-05, 2.0213425159454346e-05, 2.24970281124115e-05, 2.4780631065368652e-05, 2.7064234018325806e-05, 2.934783697128296e-05, 3.163143992424011e-05, 3.3915042877197266e-05, 3.619864583015442e-05, 3.848224878311157e-05, 4.0765851736068726e-05, 4.304945468902588e-05, 4.533305764198303e-05, 4.7616660594940186e-05, 4.990026354789734e-05, 5.218386650085449e-05, 5.4467469453811646e-05, 5.67510724067688e-05, 5.903467535972595e-05, 6.13182783126831e-05, 6.360188126564026e-05, 6.588548421859741e-05, 6.816908717155457e-05, 7.045269012451172e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 8.0, 23.0, 19.0, 29.0, 47.0, 120.0, 212.0, 451.0, 1316.0, 4566.0, 40342.0, 908867.0, 83347.0, 6582.0, 1538.0, 570.0, 223.0, 117.0, 70.0, 31.0, 27.0, 7.0, 11.0, 10.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0713348388671875, -1.016693115234375, -0.9620513916015625, -0.90740966796875, -0.8527679443359375, -0.798126220703125, -0.7434844970703125, -0.6888427734375, -0.6342010498046875, -0.579559326171875, -0.5249176025390625, -0.47027587890625, -0.4156341552734375, -0.360992431640625, -0.3063507080078125, -0.251708984375, -0.1970672607421875, -0.142425537109375, -0.0877838134765625, -0.03314208984375, 0.0214996337890625, 0.076141357421875, 0.1307830810546875, 0.1854248046875, 0.2400665283203125, 0.294708251953125, 0.3493499755859375, 0.40399169921875, 0.4586334228515625, 0.513275146484375, 0.5679168701171875, 0.62255859375, 0.6772003173828125, 0.731842041015625, 0.7864837646484375, 0.84112548828125, 0.8957672119140625, 0.950408935546875, 1.0050506591796875, 1.0596923828125, 1.1143341064453125, 1.168975830078125, 1.2236175537109375, 1.27825927734375, 1.3329010009765625, 1.387542724609375, 1.4421844482421875, 1.496826171875, 1.5514678955078125, 1.606109619140625, 1.6607513427734375, 1.71539306640625, 1.7700347900390625, 1.824676513671875, 1.8793182373046875, 1.9339599609375, 1.9886016845703125, 2.043243408203125, 2.0978851318359375, 2.15252685546875, 2.2071685791015625, 2.261810302734375, 2.3164520263671875, 2.37109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 9.0, 10.0, 16.0, 21.0, 39.0, 53.0, 80.0, 117.0, 105.0, 150.0, 101.0, 83.0, 66.0, 47.0, 37.0, 15.0, 8.0, 15.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5184478759765625, -1.466583251953125, -1.4147186279296875, -1.36285400390625, -1.3109893798828125, -1.259124755859375, -1.2072601318359375, -1.1553955078125, -1.1035308837890625, -1.051666259765625, -0.9998016357421875, -0.94793701171875, -0.8960723876953125, -0.844207763671875, -0.7923431396484375, -0.740478515625, -0.6886138916015625, -0.636749267578125, -0.5848846435546875, -0.53302001953125, -0.4811553955078125, -0.429290771484375, -0.3774261474609375, -0.3255615234375, -0.2736968994140625, -0.221832275390625, -0.1699676513671875, -0.11810302734375, -0.0662384033203125, -0.014373779296875, 0.0374908447265625, 0.08935546875, 0.1412200927734375, 0.193084716796875, 0.2449493408203125, 0.29681396484375, 0.3486785888671875, 0.400543212890625, 0.4524078369140625, 0.5042724609375, 0.5561370849609375, 0.608001708984375, 0.6598663330078125, 0.71173095703125, 0.7635955810546875, 0.815460205078125, 0.8673248291015625, 0.919189453125, 0.9710540771484375, 1.022918701171875, 1.0747833251953125, 1.12664794921875, 1.1785125732421875, 1.230377197265625, 1.2822418212890625, 1.3341064453125, 1.3859710693359375, 1.437835693359375, 1.4897003173828125, 1.54156494140625, 1.5934295654296875, 1.645294189453125, 1.6971588134765625, 1.7490234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 12.0, 30.0, 197.0, 584.0, 135.0, 35.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.98435592651367, -33.486873626708984, -31.98939323425293, -30.491910934448242, -28.994430541992188, -27.4969482421875, -25.999465942382812, -24.501983642578125, -23.00450325012207, -21.507020950317383, -20.009540557861328, -18.51205825805664, -17.014575958251953, -15.517095565795898, -14.019613265991211, -12.52213191986084, -11.024650573730469, -9.527169227600098, -8.029687881469727, -6.532205581665039, -5.034724235534668, -3.537242889404297, -2.0397605895996094, -0.5422792434692383, 0.9552021026611328, 2.452683687210083, 3.950165271759033, 5.4476470947265625, 6.945128440856934, 8.442609786987305, 9.940092086791992, 11.437573432922363, 12.935050964355469, 14.43253231048584, 15.930013656616211, 17.4274959564209, 18.924976348876953, 20.42245864868164, 21.919940948486328, 23.417423248291016, 24.91490364074707, 26.412385940551758, 27.909866333007812, 29.4073486328125, 30.904830932617188, 32.402313232421875, 33.89979553222656, 35.397274017333984, 36.89475631713867, 38.39223861694336, 39.88972091674805, 41.38719940185547, 42.884681701660156, 44.382164001464844, 45.87964630126953, 47.37712860107422, 48.874610900878906, 50.372093200683594, 51.86957550048828, 53.36705780029297, 54.86453628540039, 56.36201858520508, 57.859500885009766, 59.35698318481445, 60.854461669921875]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 10.0, 7.0, 24.0, 47.0, 60.0, 98.0, 156.0, 151.0, 132.0, 98.0, 70.0, 40.0, 19.0, 9.0, 9.0, 3.0, 10.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.204833984375, -46.62118911743164, -45.037540435791016, -43.453895568847656, -41.87024688720703, -40.28660202026367, -38.70295715332031, -37.11930847167969, -35.53566360473633, -33.95201873779297, -32.368370056152344, -30.784725189208984, -29.201078414916992, -27.617431640625, -26.033784866333008, -24.450138092041016, -22.866491317749023, -21.28284454345703, -19.69919776916504, -18.115550994873047, -16.531906127929688, -14.948259353637695, -13.364612579345703, -11.780966758728027, -10.197319984436035, -8.613673210144043, -7.030027389526367, -5.446380615234375, -3.862734317779541, -2.279088020324707, -0.6954412460327148, 0.8882045745849609, 2.471851348876953, 4.055497646331787, 5.639143943786621, 7.222790718078613, 8.806436538696289, 10.390083312988281, 11.973730087280273, 13.55737590789795, 15.141022682189941, 16.724668502807617, 18.30831527709961, 19.8919620513916, 21.475608825683594, 23.059253692626953, 24.642902374267578, 26.226547241210938, 27.81019401550293, 29.393840789794922, 30.977487564086914, 32.561134338378906, 34.144779205322266, 35.728424072265625, 37.31207275390625, 38.89571762084961, 40.479366302490234, 42.063011169433594, 43.64665985107422, 45.23030471801758, 46.8139533996582, 48.39759826660156, 49.98124694824219, 51.56489181518555, 53.148536682128906]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 20.0, 15.0, 29.0, 47.0, 78.0, 138.0, 316.0, 809.0, 2263.0, 8748.0, 54234.0, 4029918.0, 80124.0, 11503.0, 3399.0, 1325.0, 578.0, 301.0, 174.0, 90.0, 65.0, 32.0, 22.0, 14.0, 11.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -8.0067138671875, -7.716552734375, -7.4263916015625, -7.13623046875, -6.8460693359375, -6.555908203125, -6.2657470703125, -5.9755859375, -5.6854248046875, -5.395263671875, -5.1051025390625, -4.81494140625, -4.5247802734375, -4.234619140625, -3.9444580078125, -3.654296875, -3.3641357421875, -3.073974609375, -2.7838134765625, -2.49365234375, -2.2034912109375, -1.913330078125, -1.6231689453125, -1.3330078125, -1.0428466796875, -0.752685546875, -0.4625244140625, -0.17236328125, 0.1177978515625, 0.407958984375, 0.6981201171875, 0.98828125, 1.2784423828125, 1.568603515625, 1.8587646484375, 2.14892578125, 2.4390869140625, 2.729248046875, 3.0194091796875, 3.3095703125, 3.5997314453125, 3.889892578125, 4.1800537109375, 4.47021484375, 4.7603759765625, 5.050537109375, 5.3406982421875, 5.630859375, 5.9210205078125, 6.211181640625, 6.5013427734375, 6.79150390625, 7.0816650390625, 7.371826171875, 7.6619873046875, 7.9521484375, 8.2423095703125, 8.532470703125, 8.8226318359375, 9.11279296875, 9.4029541015625, 9.693115234375, 9.9832763671875, 10.2734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 14.0, 14.0, 12.0, 20.0, 19.0, 22.0, 214.0, 548.0, 48.0, 17.0, 21.0, 9.0, 7.0, 4.0, 11.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9599075317382812, -0.9281158447265625, -0.8963241577148438, -0.864532470703125, -0.8327407836914062, -0.8009490966796875, -0.7691574096679688, -0.73736572265625, -0.7055740356445312, -0.6737823486328125, -0.6419906616210938, -0.610198974609375, -0.5784072875976562, -0.5466156005859375, -0.5148239135742188, -0.4830322265625, -0.45124053955078125, -0.4194488525390625, -0.38765716552734375, -0.355865478515625, -0.32407379150390625, -0.2922821044921875, -0.26049041748046875, -0.22869873046875, -0.19690704345703125, -0.1651153564453125, -0.13332366943359375, -0.101531982421875, -0.06974029541015625, -0.0379486083984375, -0.00615692138671875, 0.025634765625, 0.05742645263671875, 0.0892181396484375, 0.12100982666015625, 0.152801513671875, 0.18459320068359375, 0.2163848876953125, 0.24817657470703125, 0.27996826171875, 0.31175994873046875, 0.3435516357421875, 0.37534332275390625, 0.407135009765625, 0.43892669677734375, 0.4707183837890625, 0.5025100708007812, 0.5343017578125, 0.5660934448242188, 0.5978851318359375, 0.6296768188476562, 0.661468505859375, 0.6932601928710938, 0.7250518798828125, 0.7568435668945312, 0.78863525390625, 0.8204269409179688, 0.8522186279296875, 0.8840103149414062, 0.915802001953125, 0.9475936889648438, 0.9793853759765625, 1.0111770629882812, 1.04296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 7.0, 18.0, 15.0, 20.0, 26.0, 41.0, 52.0, 73.0, 94.0, 143.0, 267.0, 488.0, 940.0, 2123.0, 5540.0, 20720.0, 151888.0, 3610067.0, 357207.0, 32723.0, 7284.0, 2403.0, 963.0, 476.0, 263.0, 150.0, 83.0, 48.0, 52.0, 36.0, 15.0, 11.0, 6.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.79296875, -2.7099609375, -2.626953125, -2.5439453125, -2.4609375, -2.3779296875, -2.294921875, -2.2119140625, -2.12890625, -2.0458984375, -1.962890625, -1.8798828125, -1.796875, -1.7138671875, -1.630859375, -1.5478515625, -1.46484375, -1.3818359375, -1.298828125, -1.2158203125, -1.1328125, -1.0498046875, -0.966796875, -0.8837890625, -0.80078125, -0.7177734375, -0.634765625, -0.5517578125, -0.46875, -0.3857421875, -0.302734375, -0.2197265625, -0.13671875, -0.0537109375, 0.029296875, 0.1123046875, 0.1953125, 0.2783203125, 0.361328125, 0.4443359375, 0.52734375, 0.6103515625, 0.693359375, 0.7763671875, 0.859375, 0.9423828125, 1.025390625, 1.1083984375, 1.19140625, 1.2744140625, 1.357421875, 1.4404296875, 1.5234375, 1.6064453125, 1.689453125, 1.7724609375, 1.85546875, 1.9384765625, 2.021484375, 2.1044921875, 2.1875, 2.2705078125, 2.353515625, 2.4365234375, 2.51953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 27.0, 39.0, 56.0, 73.0, 161.0, 279.0, 635.0, 1452.0, 659.0, 275.0, 134.0, 82.0, 49.0, 38.0, 22.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5604476928710938, -0.5393524169921875, -0.5182571411132812, -0.497161865234375, -0.47606658935546875, -0.4549713134765625, -0.43387603759765625, -0.41278076171875, -0.39168548583984375, -0.3705902099609375, -0.34949493408203125, -0.328399658203125, -0.30730438232421875, -0.2862091064453125, -0.26511383056640625, -0.2440185546875, -0.22292327880859375, -0.2018280029296875, -0.18073272705078125, -0.159637451171875, -0.13854217529296875, -0.1174468994140625, -0.09635162353515625, -0.07525634765625, -0.05416107177734375, -0.0330657958984375, -0.01197052001953125, 0.009124755859375, 0.03022003173828125, 0.0513153076171875, 0.07241058349609375, 0.093505859375, 0.11460113525390625, 0.1356964111328125, 0.15679168701171875, 0.177886962890625, 0.19898223876953125, 0.2200775146484375, 0.24117279052734375, 0.26226806640625, 0.28336334228515625, 0.3044586181640625, 0.32555389404296875, 0.346649169921875, 0.36774444580078125, 0.3888397216796875, 0.40993499755859375, 0.4310302734375, 0.45212554931640625, 0.4732208251953125, 0.49431610107421875, 0.515411376953125, 0.5365066528320312, 0.5576019287109375, 0.5786972045898438, 0.59979248046875, 0.6208877563476562, 0.6419830322265625, 0.6630783081054688, 0.684173583984375, 0.7052688598632812, 0.7263641357421875, 0.7474594116210938, 0.7685546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 16.0, 60.0, 566.0, 339.0, 12.0, 5.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.457021713256836, -18.095115661621094, -17.73320960998535, -17.37130355834961, -17.0093994140625, -16.647493362426758, -16.285587310791016, -15.923681259155273, -15.561775207519531, -15.199869155883789, -14.837963104248047, -14.476058006286621, -14.114151954650879, -13.752245903015137, -13.390340805053711, -13.028434753417969, -12.666528701782227, -12.304622650146484, -11.942716598510742, -11.580811500549316, -11.218905448913574, -10.856999397277832, -10.495094299316406, -10.133188247680664, -9.771282196044922, -9.40937614440918, -9.047470092773438, -8.685564994812012, -8.32365894317627, -7.961752891540527, -7.599847316741943, -7.237941741943359, -6.876036643981934, -6.514130592346191, -6.152225017547607, -5.790319442749023, -5.428413391113281, -5.066507339477539, -4.704601764678955, -4.342696189880371, -3.980790138244629, -3.618884325027466, -3.2569785118103027, -2.8950726985931396, -2.5331668853759766, -2.1712610721588135, -1.8093552589416504, -1.4474494457244873, -1.0855436325073242, -0.7236378192901611, -0.36173200607299805, 0.00017380714416503906, 0.3620796203613281, 0.7239854335784912, 1.0858912467956543, 1.4477970600128174, 1.8097028732299805, 2.1716086864471436, 2.5335144996643066, 2.8954203128814697, 3.257326126098633, 3.619231939315796, 3.981137752532959, 4.343043327331543, 4.704949378967285]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 12.0, 16.0, 30.0, 38.0, 28.0, 31.0, 39.0, 46.0, 52.0, 49.0, 60.0, 55.0, 62.0, 49.0, 63.0, 57.0, 54.0, 37.0, 39.0, 19.0, 33.0, 18.0, 21.0, 15.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4080607891082764, -2.331099510192871, -2.254138469696045, -2.1771774291992188, -2.1002161502838135, -2.023254871368408, -1.946293830871582, -1.8693326711654663, -1.7923715114593506, -1.7154103517532349, -1.6384491920471191, -1.5614880323410034, -1.4845268726348877, -1.407565712928772, -1.3306045532226562, -1.2536433935165405, -1.1766822338104248, -1.099721074104309, -1.0227599143981934, -0.9457987546920776, -0.8688375949859619, -0.7918764352798462, -0.7149152755737305, -0.6379541158676147, -0.560992956161499, -0.4840317964553833, -0.4070706367492676, -0.33010947704315186, -0.25314831733703613, -0.1761871576309204, -0.09922599792480469, -0.022264838218688965, 0.054696083068847656, 0.13165724277496338, 0.2086184024810791, 0.2855795621871948, 0.36254072189331055, 0.43950188159942627, 0.516463041305542, 0.5934242010116577, 0.6703853607177734, 0.7473465204238892, 0.8243076801300049, 0.9012688398361206, 0.9782299995422363, 1.055191159248352, 1.1321523189544678, 1.2091134786605835, 1.2860746383666992, 1.363035798072815, 1.4399969577789307, 1.5169581174850464, 1.593919277191162, 1.6708804368972778, 1.7478415966033936, 1.8248027563095093, 1.901763916015625, 1.9787250757217407, 2.0556862354278564, 2.1326475143432617, 2.209608554840088, 2.286569595336914, 2.3635308742523193, 2.4404921531677246, 2.517453193664551]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 7.0, 7.0, 7.0, 13.0, 19.0, 14.0, 32.0, 26.0, 50.0, 87.0, 121.0, 159.0, 257.0, 421.0, 793.0, 1546.0, 3270.0, 7534.0, 22209.0, 305267.0, 665754.0, 25283.0, 8589.0, 3445.0, 1549.0, 803.0, 452.0, 267.0, 194.0, 110.0, 68.0, 43.0, 48.0, 34.0, 13.0, 15.0, 12.0, 11.0, 5.0, 4.0, 7.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.80859375, -5.62152099609375, -5.4344482421875, -5.24737548828125, -5.060302734375, -4.87322998046875, -4.6861572265625, -4.49908447265625, -4.31201171875, -4.12493896484375, -3.9378662109375, -3.75079345703125, -3.563720703125, -3.37664794921875, -3.1895751953125, -3.00250244140625, -2.8154296875, -2.62835693359375, -2.4412841796875, -2.25421142578125, -2.067138671875, -1.88006591796875, -1.6929931640625, -1.50592041015625, -1.31884765625, -1.13177490234375, -0.9447021484375, -0.75762939453125, -0.570556640625, -0.38348388671875, -0.1964111328125, -0.00933837890625, 0.177734375, 0.36480712890625, 0.5518798828125, 0.73895263671875, 0.926025390625, 1.11309814453125, 1.3001708984375, 1.48724365234375, 1.67431640625, 1.86138916015625, 2.0484619140625, 2.23553466796875, 2.422607421875, 2.60968017578125, 2.7967529296875, 2.98382568359375, 3.1708984375, 3.35797119140625, 3.5450439453125, 3.73211669921875, 3.919189453125, 4.10626220703125, 4.2933349609375, 4.48040771484375, 4.66748046875, 4.85455322265625, 5.0416259765625, 5.22869873046875, 5.415771484375, 5.60284423828125, 5.7899169921875, 5.97698974609375, 6.1640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 10.0, 11.0, 11.0, 18.0, 12.0, 19.0, 66.0, 492.0, 268.0, 26.0, 18.0, 17.0, 4.0, 7.0, 5.0, 5.0, 7.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.998809814453125, -0.96636962890625, -0.933929443359375, -0.9014892578125, -0.869049072265625, -0.83660888671875, -0.804168701171875, -0.771728515625, -0.739288330078125, -0.70684814453125, -0.674407958984375, -0.6419677734375, -0.609527587890625, -0.57708740234375, -0.544647216796875, -0.51220703125, -0.479766845703125, -0.44732666015625, -0.414886474609375, -0.3824462890625, -0.350006103515625, -0.31756591796875, -0.285125732421875, -0.252685546875, -0.220245361328125, -0.18780517578125, -0.155364990234375, -0.1229248046875, -0.090484619140625, -0.05804443359375, -0.025604248046875, 0.0068359375, 0.039276123046875, 0.07171630859375, 0.104156494140625, 0.1365966796875, 0.169036865234375, 0.20147705078125, 0.233917236328125, 0.266357421875, 0.298797607421875, 0.33123779296875, 0.363677978515625, 0.3961181640625, 0.428558349609375, 0.46099853515625, 0.493438720703125, 0.52587890625, 0.558319091796875, 0.59075927734375, 0.623199462890625, 0.6556396484375, 0.688079833984375, 0.72052001953125, 0.752960205078125, 0.785400390625, 0.817840576171875, 0.85028076171875, 0.882720947265625, 0.9151611328125, 0.947601318359375, 0.98004150390625, 1.012481689453125, 1.044921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 18.0, 40.0, 108.0, 379.0, 1660.0, 23285.0, 944278.0, 75327.0, 2755.0, 479.0, 126.0, 42.0, 19.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6468505859375, -6.414794921875, -6.1827392578125, -5.95068359375, -5.7186279296875, -5.486572265625, -5.2545166015625, -5.0224609375, -4.7904052734375, -4.558349609375, -4.3262939453125, -4.09423828125, -3.8621826171875, -3.630126953125, -3.3980712890625, -3.166015625, -2.9339599609375, -2.701904296875, -2.4698486328125, -2.23779296875, -2.0057373046875, -1.773681640625, -1.5416259765625, -1.3095703125, -1.0775146484375, -0.845458984375, -0.6134033203125, -0.38134765625, -0.1492919921875, 0.082763671875, 0.3148193359375, 0.546875, 0.7789306640625, 1.010986328125, 1.2430419921875, 1.47509765625, 1.7071533203125, 1.939208984375, 2.1712646484375, 2.4033203125, 2.6353759765625, 2.867431640625, 3.0994873046875, 3.33154296875, 3.5635986328125, 3.795654296875, 4.0277099609375, 4.259765625, 4.4918212890625, 4.723876953125, 4.9559326171875, 5.18798828125, 5.4200439453125, 5.652099609375, 5.8841552734375, 6.1162109375, 6.3482666015625, 6.580322265625, 6.8123779296875, 7.04443359375, 7.2764892578125, 7.508544921875, 7.7406005859375, 7.97265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 6.0, 21.0, 12.0, 24.0, 22.0, 25.0, 26.0, 37.0, 50.0, 39.0, 41.0, 57.0, 59.0, 65.0, 58.0, 57.0, 52.0, 44.0, 42.0, 42.0, 43.0, 36.0, 27.0, 25.0, 12.0, 15.0, 8.0, 12.0, 8.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.943206787109375, -1.87664794921875, -1.810089111328125, -1.7435302734375, -1.676971435546875, -1.61041259765625, -1.543853759765625, -1.477294921875, -1.410736083984375, -1.34417724609375, -1.277618408203125, -1.2110595703125, -1.144500732421875, -1.07794189453125, -1.011383056640625, -0.94482421875, -0.878265380859375, -0.81170654296875, -0.745147705078125, -0.6785888671875, -0.612030029296875, -0.54547119140625, -0.478912353515625, -0.412353515625, -0.345794677734375, -0.27923583984375, -0.212677001953125, -0.1461181640625, -0.079559326171875, -0.01300048828125, 0.053558349609375, 0.1201171875, 0.186676025390625, 0.25323486328125, 0.319793701171875, 0.3863525390625, 0.452911376953125, 0.51947021484375, 0.586029052734375, 0.652587890625, 0.719146728515625, 0.78570556640625, 0.852264404296875, 0.9188232421875, 0.985382080078125, 1.05194091796875, 1.118499755859375, 1.18505859375, 1.251617431640625, 1.31817626953125, 1.384735107421875, 1.4512939453125, 1.517852783203125, 1.58441162109375, 1.650970458984375, 1.717529296875, 1.784088134765625, 1.85064697265625, 1.917205810546875, 1.9837646484375, 2.050323486328125, 2.11688232421875, 2.183441162109375, 2.25]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 2.0, 12.0, 7.0, 11.0, 22.0, 29.0, 57.0, 85.0, 174.0, 293.0, 734.0, 1968.0, 12969.0, 903882.0, 119582.0, 6278.0, 1403.0, 515.0, 230.0, 107.0, 71.0, 36.0, 25.0, 15.0, 12.0, 13.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5762939453125, -9.293212890625, -9.0101318359375, -8.72705078125, -8.4439697265625, -8.160888671875, -7.8778076171875, -7.5947265625, -7.3116455078125, -7.028564453125, -6.7454833984375, -6.46240234375, -6.1793212890625, -5.896240234375, -5.6131591796875, -5.330078125, -5.0469970703125, -4.763916015625, -4.4808349609375, -4.19775390625, -3.9146728515625, -3.631591796875, -3.3485107421875, -3.0654296875, -2.7823486328125, -2.499267578125, -2.2161865234375, -1.93310546875, -1.6500244140625, -1.366943359375, -1.0838623046875, -0.80078125, -0.5177001953125, -0.234619140625, 0.0484619140625, 0.33154296875, 0.6146240234375, 0.897705078125, 1.1807861328125, 1.4638671875, 1.7469482421875, 2.030029296875, 2.3131103515625, 2.59619140625, 2.8792724609375, 3.162353515625, 3.4454345703125, 3.728515625, 4.0115966796875, 4.294677734375, 4.5777587890625, 4.86083984375, 5.1439208984375, 5.427001953125, 5.7100830078125, 5.9931640625, 6.2762451171875, 6.559326171875, 6.8424072265625, 7.12548828125, 7.4085693359375, 7.691650390625, 7.9747314453125, 8.2578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 15.0, 15.0, 34.0, 65.0, 95.0, 210.0, 247.0, 122.0, 70.0, 45.0, 21.0, 22.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003764629364013672, -0.0003651231527328491, -0.00035378336906433105, -0.000342443585395813, -0.0003311038017272949, -0.00031976401805877686, -0.0003084242343902588, -0.0002970844507217407, -0.00028574466705322266, -0.0002744048833847046, -0.0002630650997161865, -0.00025172531604766846, -0.0002403855323791504, -0.00022904574871063232, -0.00021770596504211426, -0.0002063661813735962, -0.00019502639770507812, -0.00018368661403656006, -0.000172346830368042, -0.00016100704669952393, -0.00014966726303100586, -0.0001383274793624878, -0.00012698769569396973, -0.00011564791202545166, -0.0001043081283569336, -9.296834468841553e-05, -8.162856101989746e-05, -7.02887773513794e-05, -5.894899368286133e-05, -4.760921001434326e-05, -3.6269426345825195e-05, -2.492964267730713e-05, -1.3589859008789062e-05, -2.250075340270996e-06, 9.08970832824707e-06, 2.0429491996765137e-05, 3.17692756652832e-05, 4.310905933380127e-05, 5.4448843002319336e-05, 6.57886266708374e-05, 7.712841033935547e-05, 8.846819400787354e-05, 9.98079776763916e-05, 0.00011114776134490967, 0.00012248754501342773, 0.0001338273286819458, 0.00014516711235046387, 0.00015650689601898193, 0.0001678466796875, 0.00017918646335601807, 0.00019052624702453613, 0.0002018660306930542, 0.00021320581436157227, 0.00022454559803009033, 0.0002358853816986084, 0.00024722516536712646, 0.00025856494903564453, 0.0002699047327041626, 0.00028124451637268066, 0.00029258430004119873, 0.0003039240837097168, 0.00031526386737823486, 0.00032660365104675293, 0.000337943434715271, 0.00034928321838378906]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 14.0, 8.0, 21.0, 23.0, 59.0, 77.0, 137.0, 279.0, 593.0, 1662.0, 6348.0, 62879.0, 932458.0, 36776.0, 4753.0, 1305.0, 509.0, 248.0, 155.0, 101.0, 45.0, 30.0, 23.0, 13.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0057373046875, -4.816162109375, -4.6265869140625, -4.43701171875, -4.2474365234375, -4.057861328125, -3.8682861328125, -3.6787109375, -3.4891357421875, -3.299560546875, -3.1099853515625, -2.92041015625, -2.7308349609375, -2.541259765625, -2.3516845703125, -2.162109375, -1.9725341796875, -1.782958984375, -1.5933837890625, -1.40380859375, -1.2142333984375, -1.024658203125, -0.8350830078125, -0.6455078125, -0.4559326171875, -0.266357421875, -0.0767822265625, 0.11279296875, 0.3023681640625, 0.491943359375, 0.6815185546875, 0.87109375, 1.0606689453125, 1.250244140625, 1.4398193359375, 1.62939453125, 1.8189697265625, 2.008544921875, 2.1981201171875, 2.3876953125, 2.5772705078125, 2.766845703125, 2.9564208984375, 3.14599609375, 3.3355712890625, 3.525146484375, 3.7147216796875, 3.904296875, 4.0938720703125, 4.283447265625, 4.4730224609375, 4.66259765625, 4.8521728515625, 5.041748046875, 5.2313232421875, 5.4208984375, 5.6104736328125, 5.800048828125, 5.9896240234375, 6.17919921875, 6.3687744140625, 6.558349609375, 6.7479248046875, 6.9375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 40.0, 57.0, 124.0, 247.0, 224.0, 96.0, 48.0, 41.0, 17.0, 12.0, 11.0, 12.0, 6.0, 6.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.519378662109375, -4.38641357421875, -4.253448486328125, -4.1204833984375, -3.987518310546875, -3.85455322265625, -3.721588134765625, -3.588623046875, -3.455657958984375, -3.32269287109375, -3.189727783203125, -3.0567626953125, -2.923797607421875, -2.79083251953125, -2.657867431640625, -2.52490234375, -2.391937255859375, -2.25897216796875, -2.126007080078125, -1.9930419921875, -1.860076904296875, -1.72711181640625, -1.594146728515625, -1.461181640625, -1.328216552734375, -1.19525146484375, -1.062286376953125, -0.9293212890625, -0.796356201171875, -0.66339111328125, -0.530426025390625, -0.3974609375, -0.264495849609375, -0.13153076171875, 0.001434326171875, 0.1343994140625, 0.267364501953125, 0.40032958984375, 0.533294677734375, 0.666259765625, 0.799224853515625, 0.93218994140625, 1.065155029296875, 1.1981201171875, 1.331085205078125, 1.46405029296875, 1.597015380859375, 1.72998046875, 1.862945556640625, 1.99591064453125, 2.128875732421875, 2.2618408203125, 2.394805908203125, 2.52777099609375, 2.660736083984375, 2.793701171875, 2.926666259765625, 3.05963134765625, 3.192596435546875, 3.3255615234375, 3.458526611328125, 3.59149169921875, 3.724456787109375, 3.857421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 72.0, 595.0, 284.0, 28.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25328826904297, -33.36487579345703, -31.476465225219727, -29.588054656982422, -27.699642181396484, -25.81123161315918, -23.922821044921875, -22.034408569335938, -20.14599609375, -18.257585525512695, -16.369173049926758, -14.480762481689453, -12.592350006103516, -10.703939437866211, -8.81552791595459, -6.927116394042969, -5.038705825805664, -3.150294303894043, -1.261883020401001, 0.626528263092041, 2.514939785003662, 4.403350830078125, 6.291762351989746, 8.180173873901367, 10.068585395812988, 11.95699691772461, 13.84540843963623, 15.733819961547852, 17.622230529785156, 19.510643005371094, 21.3990535736084, 23.287464141845703, 25.17587661743164, 27.064287185668945, 28.952699661254883, 30.841110229492188, 32.729522705078125, 34.61793518066406, 36.506343841552734, 38.39475631713867, 40.28316879272461, 42.17158126831055, 44.05998992919922, 45.948402404785156, 47.836814880371094, 49.72522735595703, 51.6136360168457, 53.50204849243164, 55.39045715332031, 57.27886962890625, 59.16727828979492, 61.05569076538086, 62.9441032409668, 64.83251190185547, 66.7209243774414, 68.60933685302734, 70.49774932861328, 72.38616180419922, 74.27457427978516, 76.1629867553711, 78.0513916015625, 79.93980407714844, 81.82821655273438, 83.71662902832031, 85.60504150390625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 6.0, 7.0, 10.0, 16.0, 19.0, 27.0, 35.0, 60.0, 67.0, 89.0, 80.0, 95.0, 99.0, 76.0, 87.0, 41.0, 50.0, 33.0, 22.0, 15.0, 6.0, 4.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.466697692871094, -24.712675094604492, -23.95865249633789, -23.204631805419922, -22.45060920715332, -21.69658660888672, -20.942564010620117, -20.188541412353516, -19.434520721435547, -18.680498123168945, -17.926475524902344, -17.172454833984375, -16.418432235717773, -15.664409637451172, -14.91038703918457, -14.156364440917969, -13.402341842651367, -12.648319244384766, -11.89429759979248, -11.140275001525879, -10.386253356933594, -9.632230758666992, -8.87820816040039, -8.124185562133789, -7.370163917541504, -6.6161417961120605, -5.862119674682617, -5.108097076416016, -4.354074954986572, -3.600052833557129, -2.8460302352905273, -2.092008113861084, -1.3379859924316406, -0.5839637517929077, 0.1700584888458252, 0.9240808486938477, 1.678102970123291, 2.4321250915527344, 3.186147689819336, 3.9401698112487793, 4.694191932678223, 5.448214054107666, 6.202236175537109, 6.956258773803711, 7.710280895233154, 8.464303016662598, 9.2183256149292, 9.972347259521484, 10.726369857788086, 11.480392456054688, 12.234414100646973, 12.988436698913574, 13.74245834350586, 14.496480941772461, 15.250503540039062, 16.004526138305664, 16.758548736572266, 17.512571334838867, 18.26659393310547, 19.020614624023438, 19.77463722229004, 20.52865982055664, 21.282682418823242, 22.036705017089844, 22.790725708007812]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 13.0, 19.0, 30.0, 42.0, 49.0, 99.0, 129.0, 223.0, 378.0, 725.0, 1522.0, 4228.0, 26839.0, 4131002.0, 22709.0, 3262.0, 1150.0, 612.0, 343.0, 255.0, 159.0, 104.0, 79.0, 50.0, 47.0, 33.0, 28.0, 23.0, 15.0, 20.0, 10.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.7374267578125, -12.217041015625, -11.6966552734375, -11.17626953125, -10.6558837890625, -10.135498046875, -9.6151123046875, -9.0947265625, -8.5743408203125, -8.053955078125, -7.5335693359375, -7.01318359375, -6.4927978515625, -5.972412109375, -5.4520263671875, -4.931640625, -4.4112548828125, -3.890869140625, -3.3704833984375, -2.85009765625, -2.3297119140625, -1.809326171875, -1.2889404296875, -0.7685546875, -0.2481689453125, 0.272216796875, 0.7926025390625, 1.31298828125, 1.8333740234375, 2.353759765625, 2.8741455078125, 3.39453125, 3.9149169921875, 4.435302734375, 4.9556884765625, 5.47607421875, 5.9964599609375, 6.516845703125, 7.0372314453125, 7.5576171875, 8.0780029296875, 8.598388671875, 9.1187744140625, 9.63916015625, 10.1595458984375, 10.679931640625, 11.2003173828125, 11.720703125, 12.2410888671875, 12.761474609375, 13.2818603515625, 13.80224609375, 14.3226318359375, 14.843017578125, 15.3634033203125, 15.8837890625, 16.4041748046875, 16.924560546875, 17.4449462890625, 17.96533203125, 18.4857177734375, 19.006103515625, 19.5264892578125, 20.046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 6.0, 10.0, 32.0, 37.0, 115.0, 376.0, 289.0, 63.0, 24.0, 13.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93310546875, -0.9017715454101562, -0.8704376220703125, -0.8391036987304688, -0.807769775390625, -0.7764358520507812, -0.7451019287109375, -0.7137680053710938, -0.68243408203125, -0.6511001586914062, -0.6197662353515625, -0.5884323120117188, -0.557098388671875, -0.5257644653320312, -0.4944305419921875, -0.46309661865234375, -0.4317626953125, -0.40042877197265625, -0.3690948486328125, -0.33776092529296875, -0.306427001953125, -0.27509307861328125, -0.2437591552734375, -0.21242523193359375, -0.18109130859375, -0.14975738525390625, -0.1184234619140625, -0.08708953857421875, -0.055755615234375, -0.02442169189453125, 0.0069122314453125, 0.03824615478515625, 0.069580078125, 0.10091400146484375, 0.1322479248046875, 0.16358184814453125, 0.194915771484375, 0.22624969482421875, 0.2575836181640625, 0.28891754150390625, 0.32025146484375, 0.35158538818359375, 0.3829193115234375, 0.41425323486328125, 0.445587158203125, 0.47692108154296875, 0.5082550048828125, 0.5395889282226562, 0.5709228515625, 0.6022567749023438, 0.6335906982421875, 0.6649246215820312, 0.696258544921875, 0.7275924682617188, 0.7589263916015625, 0.7902603149414062, 0.82159423828125, 0.8529281616210938, 0.8842620849609375, 0.9155960083007812, 0.946929931640625, 0.9782638549804688, 1.0095977783203125, 1.0409317016601562, 1.072265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 3.0, 5.0, 8.0, 12.0, 14.0, 25.0, 43.0, 66.0, 145.0, 305.0, 1317.0, 12279.0, 3954951.0, 218947.0, 4871.0, 764.0, 230.0, 96.0, 58.0, 31.0, 31.0, 11.0, 18.0, 7.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.796875, -11.4849853515625, -11.173095703125, -10.8612060546875, -10.54931640625, -10.2374267578125, -9.925537109375, -9.6136474609375, -9.3017578125, -8.9898681640625, -8.677978515625, -8.3660888671875, -8.05419921875, -7.7423095703125, -7.430419921875, -7.1185302734375, -6.806640625, -6.4947509765625, -6.182861328125, -5.8709716796875, -5.55908203125, -5.2471923828125, -4.935302734375, -4.6234130859375, -4.3115234375, -3.9996337890625, -3.687744140625, -3.3758544921875, -3.06396484375, -2.7520751953125, -2.440185546875, -2.1282958984375, -1.81640625, -1.5045166015625, -1.192626953125, -0.8807373046875, -0.56884765625, -0.2569580078125, 0.054931640625, 0.3668212890625, 0.6787109375, 0.9906005859375, 1.302490234375, 1.6143798828125, 1.92626953125, 2.2381591796875, 2.550048828125, 2.8619384765625, 3.173828125, 3.4857177734375, 3.797607421875, 4.1094970703125, 4.42138671875, 4.7332763671875, 5.045166015625, 5.3570556640625, 5.6689453125, 5.9808349609375, 6.292724609375, 6.6046142578125, 6.91650390625, 7.2283935546875, 7.540283203125, 7.8521728515625, 8.1640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 7.0, 9.0, 13.0, 16.0, 27.0, 30.0, 49.0, 63.0, 105.0, 242.0, 632.0, 1674.0, 589.0, 260.0, 113.0, 68.0, 43.0, 27.0, 17.0, 17.0, 9.0, 14.0, 8.0, 1.0, 2.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5403213500976562, -0.5191192626953125, -0.49791717529296875, -0.476715087890625, -0.45551300048828125, -0.4343109130859375, -0.41310882568359375, -0.39190673828125, -0.37070465087890625, -0.3495025634765625, -0.32830047607421875, -0.307098388671875, -0.28589630126953125, -0.2646942138671875, -0.24349212646484375, -0.2222900390625, -0.20108795166015625, -0.1798858642578125, -0.15868377685546875, -0.137481689453125, -0.11627960205078125, -0.0950775146484375, -0.07387542724609375, -0.05267333984375, -0.03147125244140625, -0.0102691650390625, 0.01093292236328125, 0.032135009765625, 0.05333709716796875, 0.0745391845703125, 0.09574127197265625, 0.116943359375, 0.13814544677734375, 0.1593475341796875, 0.18054962158203125, 0.201751708984375, 0.22295379638671875, 0.2441558837890625, 0.26535797119140625, 0.28656005859375, 0.30776214599609375, 0.3289642333984375, 0.35016632080078125, 0.371368408203125, 0.39257049560546875, 0.4137725830078125, 0.43497467041015625, 0.4561767578125, 0.47737884521484375, 0.4985809326171875, 0.5197830200195312, 0.540985107421875, 0.5621871948242188, 0.5833892822265625, 0.6045913696289062, 0.62579345703125, 0.6469955444335938, 0.6681976318359375, 0.6893997192382812, 0.710601806640625, 0.7318038940429688, 0.7530059814453125, 0.7742080688476562, 0.79541015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 39.0, 219.0, 495.0, 192.0, 39.0, 10.0, 0.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.517908096313477, -10.263758659362793, -10.009608268737793, -9.75545883178711, -9.501309394836426, -9.247159004211426, -8.993009567260742, -8.738860130310059, -8.484709739685059, -8.230560302734375, -7.976410388946533, -7.722260475158691, -7.46811056137085, -7.213960647583008, -6.959811210632324, -6.705661296844482, -6.451511859893799, -6.197361946105957, -5.943212509155273, -5.689062595367432, -5.43491268157959, -5.180763244628906, -4.9266133308410645, -4.672463417053223, -4.418313980102539, -4.164164066314697, -3.9100143909454346, -3.655864715576172, -3.40171480178833, -3.1475651264190674, -2.8934154510498047, -2.639265537261963, -2.385115623474121, -2.1309659481048584, -1.8768160343170166, -1.622666358947754, -1.3685165643692017, -1.1143667697906494, -0.8602170944213867, -0.6060672998428345, -0.3519175052642822, -0.09776774048805237, 0.1563820242881775, 0.41053175926208496, 0.6646815538406372, 0.9188313484191895, 1.1729810237884521, 1.4271308183670044, 1.6812806129455566, 1.9354304075241089, 2.189580202102661, 2.443729877471924, 2.6978797912597656, 2.9520294666290283, 3.206179141998291, 3.460329055786133, 3.7144787311553955, 3.968628406524658, 4.2227783203125, 4.476927757263184, 4.731077671051025, 4.985227584838867, 5.239377021789551, 5.493526935577393, 5.747676849365234]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 24.0, 20.0, 15.0, 41.0, 43.0, 57.0, 57.0, 48.0, 68.0, 65.0, 69.0, 69.0, 58.0, 48.0, 52.0, 41.0, 41.0, 30.0, 25.0, 13.0, 13.0, 17.0, 4.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.776867151260376, -2.6947848796844482, -2.6127028465270996, -2.530620574951172, -2.4485385417938232, -2.3664562702178955, -2.284374237060547, -2.202291965484619, -2.1202096939086914, -2.0381274223327637, -1.956045389175415, -1.8739632368087769, -1.7918810844421387, -1.709798812866211, -1.6277166604995728, -1.5456345081329346, -1.463552474975586, -1.3814703226089478, -1.2993881702423096, -1.2173060178756714, -1.1352238655090332, -1.0531415939331055, -0.9710594415664673, -0.8889772891998291, -0.8068951368331909, -0.7248129844665527, -0.6427308320999146, -0.5606486201286316, -0.4785664677619934, -0.3964843153953552, -0.31440213322639465, -0.23231995105743408, -0.1502377986907959, -0.06815563142299652, 0.013926535844802856, 0.09600870311260223, 0.1780908703804016, 0.2601730227470398, 0.34225520491600037, 0.42433738708496094, 0.5064195394515991, 0.5885016918182373, 0.6705838441848755, 0.7526660561561584, 0.8347482085227966, 0.9168303608894348, 0.9989125728607178, 1.080994725227356, 1.1630768775939941, 1.2451590299606323, 1.3272411823272705, 1.4093233346939087, 1.4914054870605469, 1.5734877586364746, 1.6555699110031128, 1.737652063369751, 1.8197342157363892, 1.9018163681030273, 1.9838985204696655, 2.0659806728363037, 2.1480629444122314, 2.23014497756958, 2.312227249145508, 2.3943095207214355, 2.476391553878784]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 9.0, 11.0, 19.0, 28.0, 34.0, 58.0, 74.0, 139.0, 218.0, 345.0, 729.0, 1568.0, 4611.0, 25082.0, 923023.0, 80909.0, 7370.0, 2225.0, 973.0, 470.0, 232.0, 149.0, 93.0, 60.0, 30.0, 23.0, 27.0, 6.0, 14.0, 5.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.48828125, -7.25909423828125, -7.0299072265625, -6.80072021484375, -6.571533203125, -6.34234619140625, -6.1131591796875, -5.88397216796875, -5.65478515625, -5.42559814453125, -5.1964111328125, -4.96722412109375, -4.738037109375, -4.50885009765625, -4.2796630859375, -4.05047607421875, -3.8212890625, -3.59210205078125, -3.3629150390625, -3.13372802734375, -2.904541015625, -2.67535400390625, -2.4461669921875, -2.21697998046875, -1.98779296875, -1.75860595703125, -1.5294189453125, -1.30023193359375, -1.071044921875, -0.84185791015625, -0.6126708984375, -0.38348388671875, -0.154296875, 0.07489013671875, 0.3040771484375, 0.53326416015625, 0.762451171875, 0.99163818359375, 1.2208251953125, 1.45001220703125, 1.67919921875, 1.90838623046875, 2.1375732421875, 2.36676025390625, 2.595947265625, 2.82513427734375, 3.0543212890625, 3.28350830078125, 3.5126953125, 3.74188232421875, 3.9710693359375, 4.20025634765625, 4.429443359375, 4.65863037109375, 4.8878173828125, 5.11700439453125, 5.34619140625, 5.57537841796875, 5.8045654296875, 6.03375244140625, 6.262939453125, 6.49212646484375, 6.7213134765625, 6.95050048828125, 7.1796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 7.0, 6.0, 6.0, 10.0, 16.0, 48.0, 133.0, 377.0, 269.0, 94.0, 16.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.8643646240234375, -0.833221435546875, -0.8020782470703125, -0.77093505859375, -0.7397918701171875, -0.708648681640625, -0.6775054931640625, -0.6463623046875, -0.6152191162109375, -0.584075927734375, -0.5529327392578125, -0.52178955078125, -0.4906463623046875, -0.459503173828125, -0.4283599853515625, -0.397216796875, -0.3660736083984375, -0.334930419921875, -0.3037872314453125, -0.27264404296875, -0.2415008544921875, -0.210357666015625, -0.1792144775390625, -0.1480712890625, -0.1169281005859375, -0.085784912109375, -0.0546417236328125, -0.02349853515625, 0.0076446533203125, 0.038787841796875, 0.0699310302734375, 0.10107421875, 0.1322174072265625, 0.163360595703125, 0.1945037841796875, 0.22564697265625, 0.2567901611328125, 0.287933349609375, 0.3190765380859375, 0.3502197265625, 0.3813629150390625, 0.412506103515625, 0.4436492919921875, 0.47479248046875, 0.5059356689453125, 0.537078857421875, 0.5682220458984375, 0.599365234375, 0.6305084228515625, 0.661651611328125, 0.6927947998046875, 0.72393798828125, 0.7550811767578125, 0.786224365234375, 0.8173675537109375, 0.8485107421875, 0.8796539306640625, 0.910797119140625, 0.9419403076171875, 0.97308349609375, 1.0042266845703125, 1.035369873046875, 1.0665130615234375, 1.09765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 10.0, 8.0, 13.0, 20.0, 35.0, 26.0, 52.0, 73.0, 92.0, 150.0, 248.0, 408.0, 722.0, 1515.0, 4319.0, 19055.0, 159149.0, 702302.0, 135816.0, 17055.0, 4010.0, 1539.0, 736.0, 441.0, 264.0, 169.0, 107.0, 66.0, 40.0, 36.0, 23.0, 13.0, 9.0, 6.0, 6.0, 11.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -3.001800537109375, -2.88836669921875, -2.774932861328125, -2.6614990234375, -2.548065185546875, -2.43463134765625, -2.321197509765625, -2.207763671875, -2.094329833984375, -1.98089599609375, -1.867462158203125, -1.7540283203125, -1.640594482421875, -1.52716064453125, -1.413726806640625, -1.30029296875, -1.186859130859375, -1.07342529296875, -0.959991455078125, -0.8465576171875, -0.733123779296875, -0.61968994140625, -0.506256103515625, -0.392822265625, -0.279388427734375, -0.16595458984375, -0.052520751953125, 0.0609130859375, 0.174346923828125, 0.28778076171875, 0.401214599609375, 0.5146484375, 0.628082275390625, 0.74151611328125, 0.854949951171875, 0.9683837890625, 1.081817626953125, 1.19525146484375, 1.308685302734375, 1.422119140625, 1.535552978515625, 1.64898681640625, 1.762420654296875, 1.8758544921875, 1.989288330078125, 2.10272216796875, 2.216156005859375, 2.32958984375, 2.443023681640625, 2.55645751953125, 2.669891357421875, 2.7833251953125, 2.896759033203125, 3.01019287109375, 3.123626708984375, 3.237060546875, 3.350494384765625, 3.46392822265625, 3.577362060546875, 3.6907958984375, 3.804229736328125, 3.91766357421875, 4.031097412109375, 4.14453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 2.0, 7.0, 6.0, 12.0, 9.0, 14.0, 16.0, 16.0, 19.0, 15.0, 33.0, 29.0, 20.0, 35.0, 44.0, 33.0, 47.0, 49.0, 48.0, 45.0, 40.0, 58.0, 61.0, 44.0, 48.0, 36.0, 34.0, 23.0, 33.0, 17.0, 20.0, 19.0, 12.0, 15.0, 11.0, 7.0, 1.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.89202880859375, -1.8289794921875, -1.76593017578125, -1.702880859375, -1.63983154296875, -1.5767822265625, -1.51373291015625, -1.45068359375, -1.38763427734375, -1.3245849609375, -1.26153564453125, -1.198486328125, -1.13543701171875, -1.0723876953125, -1.00933837890625, -0.9462890625, -0.88323974609375, -0.8201904296875, -0.75714111328125, -0.694091796875, -0.63104248046875, -0.5679931640625, -0.50494384765625, -0.44189453125, -0.37884521484375, -0.3157958984375, -0.25274658203125, -0.189697265625, -0.12664794921875, -0.0635986328125, -0.00054931640625, 0.0625, 0.12554931640625, 0.1885986328125, 0.25164794921875, 0.314697265625, 0.37774658203125, 0.4407958984375, 0.50384521484375, 0.56689453125, 0.62994384765625, 0.6929931640625, 0.75604248046875, 0.819091796875, 0.88214111328125, 0.9451904296875, 1.00823974609375, 1.0712890625, 1.13433837890625, 1.1973876953125, 1.26043701171875, 1.323486328125, 1.38653564453125, 1.4495849609375, 1.51263427734375, 1.57568359375, 1.63873291015625, 1.7017822265625, 1.76483154296875, 1.827880859375, 1.89093017578125, 1.9539794921875, 2.01702880859375, 2.080078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 6.0, 11.0, 17.0, 18.0, 42.0, 63.0, 95.0, 151.0, 303.0, 704.0, 2030.0, 7496.0, 50725.0, 729510.0, 232625.0, 18675.0, 3901.0, 1156.0, 483.0, 252.0, 115.0, 64.0, 48.0, 21.0, 11.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8140869140625, -2.737548828125, -2.6610107421875, -2.58447265625, -2.5079345703125, -2.431396484375, -2.3548583984375, -2.2783203125, -2.2017822265625, -2.125244140625, -2.0487060546875, -1.97216796875, -1.8956298828125, -1.819091796875, -1.7425537109375, -1.666015625, -1.5894775390625, -1.512939453125, -1.4364013671875, -1.35986328125, -1.2833251953125, -1.206787109375, -1.1302490234375, -1.0537109375, -0.9771728515625, -0.900634765625, -0.8240966796875, -0.74755859375, -0.6710205078125, -0.594482421875, -0.5179443359375, -0.44140625, -0.3648681640625, -0.288330078125, -0.2117919921875, -0.13525390625, -0.0587158203125, 0.017822265625, 0.0943603515625, 0.1708984375, 0.2474365234375, 0.323974609375, 0.4005126953125, 0.47705078125, 0.5535888671875, 0.630126953125, 0.7066650390625, 0.783203125, 0.8597412109375, 0.936279296875, 1.0128173828125, 1.08935546875, 1.1658935546875, 1.242431640625, 1.3189697265625, 1.3955078125, 1.4720458984375, 1.548583984375, 1.6251220703125, 1.70166015625, 1.7781982421875, 1.854736328125, 1.9312744140625, 2.0078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 6.0, 3.0, 9.0, 14.0, 19.0, 16.0, 28.0, 34.0, 38.0, 47.0, 57.0, 81.0, 92.0, 111.0, 104.0, 84.0, 63.0, 47.0, 36.0, 25.0, 22.0, 18.0, 10.0, 6.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018465518951416016, -0.00017815269529819489, -0.00017165020108222961, -0.00016514770686626434, -0.00015864521265029907, -0.0001521427184343338, -0.00014564022421836853, -0.00013913773000240326, -0.000132635235786438, -0.00012613274157047272, -0.00011963024735450745, -0.00011312775313854218, -0.0001066252589225769, -0.00010012276470661163, -9.362027049064636e-05, -8.711777627468109e-05, -8.061528205871582e-05, -7.411278784275055e-05, -6.761029362678528e-05, -6.110779941082001e-05, -5.4605305194854736e-05, -4.8102810978889465e-05, -4.1600316762924194e-05, -3.509782254695892e-05, -2.8595328330993652e-05, -2.209283411502838e-05, -1.559033989906311e-05, -9.08784568309784e-06, -2.5853514671325684e-06, 3.917142748832703e-06, 1.0419636964797974e-05, 1.6922131180763245e-05, 2.3424625396728516e-05, 2.9927119612693787e-05, 3.642961382865906e-05, 4.293210804462433e-05, 4.94346022605896e-05, 5.593709647655487e-05, 6.243959069252014e-05, 6.894208490848541e-05, 7.544457912445068e-05, 8.194707334041595e-05, 8.844956755638123e-05, 9.49520617723465e-05, 0.00010145455598831177, 0.00010795705020427704, 0.00011445954442024231, 0.00012096203863620758, 0.00012746453285217285, 0.00013396702706813812, 0.0001404695212841034, 0.00014697201550006866, 0.00015347450971603394, 0.0001599770039319992, 0.00016647949814796448, 0.00017298199236392975, 0.00017948448657989502, 0.0001859869807958603, 0.00019248947501182556, 0.00019899196922779083, 0.0002054944634437561, 0.00021199695765972137, 0.00021849945187568665, 0.00022500194609165192, 0.0002315044403076172]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 10.0, 9.0, 13.0, 34.0, 47.0, 79.0, 171.0, 355.0, 1000.0, 3560.0, 27020.0, 809195.0, 194769.0, 9361.0, 1845.0, 574.0, 235.0, 101.0, 56.0, 29.0, 17.0, 9.0, 10.0, 5.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.890625, -2.790191650390625, -2.68975830078125, -2.589324951171875, -2.4888916015625, -2.388458251953125, -2.28802490234375, -2.187591552734375, -2.087158203125, -1.986724853515625, -1.88629150390625, -1.785858154296875, -1.6854248046875, -1.584991455078125, -1.48455810546875, -1.384124755859375, -1.28369140625, -1.183258056640625, -1.08282470703125, -0.982391357421875, -0.8819580078125, -0.781524658203125, -0.68109130859375, -0.580657958984375, -0.480224609375, -0.379791259765625, -0.27935791015625, -0.178924560546875, -0.0784912109375, 0.021942138671875, 0.12237548828125, 0.222808837890625, 0.3232421875, 0.423675537109375, 0.52410888671875, 0.624542236328125, 0.7249755859375, 0.825408935546875, 0.92584228515625, 1.026275634765625, 1.126708984375, 1.227142333984375, 1.32757568359375, 1.428009033203125, 1.5284423828125, 1.628875732421875, 1.72930908203125, 1.829742431640625, 1.93017578125, 2.030609130859375, 2.13104248046875, 2.231475830078125, 2.3319091796875, 2.432342529296875, 2.53277587890625, 2.633209228515625, 2.733642578125, 2.834075927734375, 2.93450927734375, 3.034942626953125, 3.1353759765625, 3.235809326171875, 3.33624267578125, 3.436676025390625, 3.537109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 11.0, 25.0, 29.0, 23.0, 66.0, 99.0, 133.0, 160.0, 152.0, 111.0, 63.0, 43.0, 24.0, 21.0, 12.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.58294677734375, -1.5330810546875, -1.48321533203125, -1.433349609375, -1.38348388671875, -1.3336181640625, -1.28375244140625, -1.23388671875, -1.18402099609375, -1.1341552734375, -1.08428955078125, -1.034423828125, -0.98455810546875, -0.9346923828125, -0.88482666015625, -0.8349609375, -0.78509521484375, -0.7352294921875, -0.68536376953125, -0.635498046875, -0.58563232421875, -0.5357666015625, -0.48590087890625, -0.43603515625, -0.38616943359375, -0.3363037109375, -0.28643798828125, -0.236572265625, -0.18670654296875, -0.1368408203125, -0.08697509765625, -0.037109375, 0.01275634765625, 0.0626220703125, 0.11248779296875, 0.162353515625, 0.21221923828125, 0.2620849609375, 0.31195068359375, 0.36181640625, 0.41168212890625, 0.4615478515625, 0.51141357421875, 0.561279296875, 0.61114501953125, 0.6610107421875, 0.71087646484375, 0.7607421875, 0.81060791015625, 0.8604736328125, 0.91033935546875, 0.960205078125, 1.01007080078125, 1.0599365234375, 1.10980224609375, 1.15966796875, 1.20953369140625, 1.2593994140625, 1.30926513671875, 1.359130859375, 1.40899658203125, 1.4588623046875, 1.50872802734375, 1.55859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 10.0, 47.0, 304.0, 536.0, 90.0, 13.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.76063537597656, -50.82050323486328, -48.880374908447266, -46.94024658203125, -45.00011444091797, -43.05998229980469, -41.11985397338867, -39.179725646972656, -37.239593505859375, -35.299461364746094, -33.35933303833008, -31.41920280456543, -29.47907257080078, -27.538942337036133, -25.598812103271484, -23.658681869506836, -21.718551635742188, -19.77842140197754, -17.83829116821289, -15.898160934448242, -13.958030700683594, -12.017900466918945, -10.077770233154297, -8.137639999389648, -6.197509765625, -4.257379531860352, -2.317249298095703, -0.3771190643310547, 1.5630111694335938, 3.503141403198242, 5.443271636962891, 7.383401870727539, 9.323532104492188, 11.263662338256836, 13.203792572021484, 15.143922805786133, 17.08405303955078, 19.02418327331543, 20.964313507080078, 22.904443740844727, 24.844573974609375, 26.784704208374023, 28.724834442138672, 30.66496467590332, 32.60509490966797, 34.54522705078125, 36.485355377197266, 38.42548370361328, 40.36561584472656, 42.305747985839844, 44.24587631225586, 46.186004638671875, 48.126136779785156, 50.06626892089844, 52.00639724731445, 53.94652557373047, 55.88665771484375, 57.82678985595703, 59.76691818237305, 61.70704650878906, 63.647178649902344, 65.58731079101562, 67.52743530273438, 69.46756744384766, 71.40769958496094]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 22.0, 24.0, 25.0, 37.0, 53.0, 64.0, 74.0, 64.0, 87.0, 65.0, 70.0, 66.0, 59.0, 63.0, 43.0, 39.0, 28.0, 34.0, 13.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.177108764648438, -23.47942352294922, -22.78173828125, -22.08405303955078, -21.386367797851562, -20.688682556152344, -19.990997314453125, -19.293310165405273, -18.595624923706055, -17.897939682006836, -17.200254440307617, -16.5025691986084, -15.804883003234863, -15.107197761535645, -14.409512519836426, -13.71182632446289, -13.014142036437988, -12.31645679473877, -11.61877155303955, -10.921085357666016, -10.223400115966797, -9.525714874267578, -8.82802963256836, -8.13034439086914, -7.432658672332764, -6.734973430633545, -6.037287712097168, -5.339602470397949, -4.6419172286987305, -3.9442315101623535, -3.2465462684631348, -2.548860549926758, -1.851175308227539, -1.1534898281097412, -0.4558044672012329, 0.2418808937072754, 0.9395663738250732, 1.637251853942871, 2.33493709564209, 3.032622814178467, 3.7303080558776855, 4.427993297576904, 5.125679016113281, 5.8233642578125, 6.521049499511719, 7.218735218048096, 7.9164204597473145, 8.614106178283691, 9.31179141998291, 10.009476661682129, 10.707161903381348, 11.404848098754883, 12.102533340454102, 12.80021858215332, 13.497903823852539, 14.195589065551758, 14.893274307250977, 15.590959548950195, 16.288644790649414, 16.986330032348633, 17.68401527404785, 18.381702423095703, 19.079387664794922, 19.77707290649414, 20.47475814819336]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 9.0, 11.0, 34.0, 86.0, 272.0, 1785.0, 4174263.0, 16741.0, 725.0, 201.0, 70.0, 38.0, 13.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25, -39.8642578125, -38.478515625, -37.0927734375, -35.70703125, -34.3212890625, -32.935546875, -31.5498046875, -30.1640625, -28.7783203125, -27.392578125, -26.0068359375, -24.62109375, -23.2353515625, -21.849609375, -20.4638671875, -19.078125, -17.6923828125, -16.306640625, -14.9208984375, -13.53515625, -12.1494140625, -10.763671875, -9.3779296875, -7.9921875, -6.6064453125, -5.220703125, -3.8349609375, -2.44921875, -1.0634765625, 0.322265625, 1.7080078125, 3.09375, 4.4794921875, 5.865234375, 7.2509765625, 8.63671875, 10.0224609375, 11.408203125, 12.7939453125, 14.1796875, 15.5654296875, 16.951171875, 18.3369140625, 19.72265625, 21.1083984375, 22.494140625, 23.8798828125, 25.265625, 26.6513671875, 28.037109375, 29.4228515625, 30.80859375, 32.1943359375, 33.580078125, 34.9658203125, 36.3515625, 37.7373046875, 39.123046875, 40.5087890625, 41.89453125, 43.2802734375, 44.666015625, 46.0517578125, 47.4375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 25.0, 60.0, 145.0, 237.0, 237.0, 168.0, 64.0, 20.0, 10.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.10833740234375, -1.0701904296875, -1.03204345703125, -0.993896484375, -0.95574951171875, -0.9176025390625, -0.87945556640625, -0.84130859375, -0.80316162109375, -0.7650146484375, -0.72686767578125, -0.688720703125, -0.65057373046875, -0.6124267578125, -0.57427978515625, -0.5361328125, -0.49798583984375, -0.4598388671875, -0.42169189453125, -0.383544921875, -0.34539794921875, -0.3072509765625, -0.26910400390625, -0.23095703125, -0.19281005859375, -0.1546630859375, -0.11651611328125, -0.078369140625, -0.04022216796875, -0.0020751953125, 0.03607177734375, 0.07421875, 0.11236572265625, 0.1505126953125, 0.18865966796875, 0.226806640625, 0.26495361328125, 0.3031005859375, 0.34124755859375, 0.37939453125, 0.41754150390625, 0.4556884765625, 0.49383544921875, 0.531982421875, 0.57012939453125, 0.6082763671875, 0.64642333984375, 0.6845703125, 0.72271728515625, 0.7608642578125, 0.79901123046875, 0.837158203125, 0.87530517578125, 0.9134521484375, 0.95159912109375, 0.98974609375, 1.02789306640625, 1.0660400390625, 1.10418701171875, 1.142333984375, 1.18048095703125, 1.2186279296875, 1.25677490234375, 1.294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 9.0, 11.0, 12.0, 9.0, 13.0, 19.0, 22.0, 29.0, 57.0, 79.0, 161.0, 282.0, 497.0, 989.0, 2254.0, 6309.0, 26340.0, 256580.0, 3704776.0, 165166.0, 21479.0, 5437.0, 1959.0, 844.0, 375.0, 202.0, 127.0, 79.0, 49.0, 28.0, 26.0, 15.0, 7.0, 11.0, 11.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.458984375, -3.355499267578125, -3.25201416015625, -3.148529052734375, -3.0450439453125, -2.941558837890625, -2.83807373046875, -2.734588623046875, -2.631103515625, -2.527618408203125, -2.42413330078125, -2.320648193359375, -2.2171630859375, -2.113677978515625, -2.01019287109375, -1.906707763671875, -1.80322265625, -1.699737548828125, -1.59625244140625, -1.492767333984375, -1.3892822265625, -1.285797119140625, -1.18231201171875, -1.078826904296875, -0.975341796875, -0.871856689453125, -0.76837158203125, -0.664886474609375, -0.5614013671875, -0.457916259765625, -0.35443115234375, -0.250946044921875, -0.1474609375, -0.043975830078125, 0.05950927734375, 0.162994384765625, 0.2664794921875, 0.369964599609375, 0.47344970703125, 0.576934814453125, 0.680419921875, 0.783905029296875, 0.88739013671875, 0.990875244140625, 1.0943603515625, 1.197845458984375, 1.30133056640625, 1.404815673828125, 1.50830078125, 1.611785888671875, 1.71527099609375, 1.818756103515625, 1.9222412109375, 2.025726318359375, 2.12921142578125, 2.232696533203125, 2.336181640625, 2.439666748046875, 2.54315185546875, 2.646636962890625, 2.7501220703125, 2.853607177734375, 2.95709228515625, 3.060577392578125, 3.1640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 27.0, 22.0, 30.0, 66.0, 144.0, 235.0, 562.0, 1528.0, 713.0, 299.0, 145.0, 70.0, 53.0, 35.0, 23.0, 16.0, 13.0, 10.0, 10.0, 5.0, 1.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7641830444335938, -0.7407684326171875, -0.7173538208007812, -0.693939208984375, -0.6705245971679688, -0.6471099853515625, -0.6236953735351562, -0.60028076171875, -0.5768661499023438, -0.5534515380859375, -0.5300369262695312, -0.506622314453125, -0.48320770263671875, -0.4597930908203125, -0.43637847900390625, -0.4129638671875, -0.38954925537109375, -0.3661346435546875, -0.34272003173828125, -0.319305419921875, -0.29589080810546875, -0.2724761962890625, -0.24906158447265625, -0.22564697265625, -0.20223236083984375, -0.1788177490234375, -0.15540313720703125, -0.131988525390625, -0.10857391357421875, -0.0851593017578125, -0.06174468994140625, -0.038330078125, -0.01491546630859375, 0.0084991455078125, 0.03191375732421875, 0.055328369140625, 0.07874298095703125, 0.1021575927734375, 0.12557220458984375, 0.14898681640625, 0.17240142822265625, 0.1958160400390625, 0.21923065185546875, 0.242645263671875, 0.26605987548828125, 0.2894744873046875, 0.31288909912109375, 0.3363037109375, 0.35971832275390625, 0.3831329345703125, 0.40654754638671875, 0.429962158203125, 0.45337677001953125, 0.4767913818359375, 0.5002059936523438, 0.52362060546875, 0.5470352172851562, 0.5704498291015625, 0.5938644409179688, 0.617279052734375, 0.6406936645507812, 0.6641082763671875, 0.6875228881835938, 0.7109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 26.0, 58.0, 119.0, 227.0, 264.0, 178.0, 64.0, 28.0, 9.0, 12.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.540773391723633, -4.360532760620117, -4.180291652679443, -4.000051021575928, -3.819810152053833, -3.6395692825317383, -3.4593286514282227, -3.279087781906128, -3.098846912384033, -2.9186060428619385, -2.7383651733398438, -2.558124542236328, -2.3778836727142334, -2.1976428031921387, -2.017402172088623, -1.8371613025665283, -1.6569204330444336, -1.4766795635223389, -1.2964388132095337, -1.1161980628967285, -0.9359571933746338, -0.7557163834571838, -0.5754755735397339, -0.3952348232269287, -0.21499395370483398, -0.03475314378738403, 0.14548766613006592, 0.32572847604751587, 0.5059692859649658, 0.6862100958824158, 0.8664509057998657, 1.046691656112671, 1.2269330024719238, 1.4071738719940186, 1.5874146223068237, 1.767655372619629, 1.9478962421417236, 2.1281371116638184, 2.308377742767334, 2.4886186122894287, 2.6688594818115234, 2.849100351333618, 3.029341220855713, 3.2095818519592285, 3.3898227214813232, 3.570063591003418, 3.7503042221069336, 3.9305450916290283, 4.110785961151123, 4.291026592254639, 4.4712677001953125, 4.651508331298828, 4.831748962402344, 5.011990070343018, 5.192230701446533, 5.372471809387207, 5.552712440490723, 5.732953071594238, 5.913194179534912, 6.093434810638428, 6.273675918579102, 6.453916549682617, 6.634157180786133, 6.814397811889648, 6.994638919830322]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 12.0, 17.0, 28.0, 33.0, 44.0, 69.0, 66.0, 74.0, 53.0, 93.0, 80.0, 80.0, 62.0, 62.0, 56.0, 33.0, 26.0, 22.0, 28.0, 15.0, 12.0, 8.0, 7.0, 4.0, 2.0, 3.0], "bins": [-5.878988265991211, -5.755491733551025, -5.631995677947998, -5.5084991455078125, -5.385002613067627, -5.261506080627441, -5.138010025024414, -5.0145134925842285, -4.891016960144043, -4.767520427703857, -4.64402437210083, -4.5205278396606445, -4.397031307220459, -4.273534774780273, -4.150038719177246, -4.0265421867370605, -3.903046131134033, -3.7795498371124268, -3.656053304672241, -3.5325570106506348, -3.409060478210449, -3.2855641841888428, -3.1620678901672363, -3.038571357727051, -2.9150748252868652, -2.791578531265259, -2.6680819988250732, -2.544585704803467, -2.4210891723632812, -2.297592878341675, -2.1740965843200684, -2.050600051879883, -1.9271037578582764, -1.8036073446273804, -1.6801109313964844, -1.556614637374878, -1.433118224143982, -1.309621810913086, -1.18612539768219, -1.062628984451294, -0.9391326308250427, -0.8156362175941467, -0.6921398639678955, -0.5686434507369995, -0.4451470673084259, -0.3216506838798523, -0.1981542706489563, -0.07465791702270508, 0.04883849620819092, 0.17233487963676453, 0.29583126306533813, 0.41932767629623413, 0.5428240299224854, 0.6663204431533813, 0.7898168563842773, 0.9133132100105286, 1.0368096828460693, 1.1603060960769653, 1.2838025093078613, 1.4072988033294678, 1.5307952165603638, 1.6542916297912598, 1.7777880430221558, 1.9012844562530518, 2.024780750274658]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 8.0, 14.0, 17.0, 32.0, 34.0, 77.0, 111.0, 216.0, 434.0, 1063.0, 3453.0, 21993.0, 913887.0, 98267.0, 6057.0, 1606.0, 627.0, 273.0, 142.0, 87.0, 46.0, 33.0, 21.0, 15.0, 9.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.72613525390625, -6.5069580078125, -6.28778076171875, -6.068603515625, -5.84942626953125, -5.6302490234375, -5.41107177734375, -5.19189453125, -4.97271728515625, -4.7535400390625, -4.53436279296875, -4.315185546875, -4.09600830078125, -3.8768310546875, -3.65765380859375, -3.4384765625, -3.21929931640625, -3.0001220703125, -2.78094482421875, -2.561767578125, -2.34259033203125, -2.1234130859375, -1.90423583984375, -1.68505859375, -1.46588134765625, -1.2467041015625, -1.02752685546875, -0.808349609375, -0.58917236328125, -0.3699951171875, -0.15081787109375, 0.068359375, 0.28753662109375, 0.5067138671875, 0.72589111328125, 0.945068359375, 1.16424560546875, 1.3834228515625, 1.60260009765625, 1.82177734375, 2.04095458984375, 2.2601318359375, 2.47930908203125, 2.698486328125, 2.91766357421875, 3.1368408203125, 3.35601806640625, 3.5751953125, 3.79437255859375, 4.0135498046875, 4.23272705078125, 4.451904296875, 4.67108154296875, 4.8902587890625, 5.10943603515625, 5.32861328125, 5.54779052734375, 5.7669677734375, 5.98614501953125, 6.205322265625, 6.42449951171875, 6.6436767578125, 6.86285400390625, 7.08203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 12.0, 31.0, 80.0, 163.0, 257.0, 217.0, 131.0, 62.0, 16.0, 7.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.089447021484375, -1.05291748046875, -1.016387939453125, -0.9798583984375, -0.943328857421875, -0.90679931640625, -0.870269775390625, -0.833740234375, -0.797210693359375, -0.76068115234375, -0.724151611328125, -0.6876220703125, -0.651092529296875, -0.61456298828125, -0.578033447265625, -0.54150390625, -0.504974365234375, -0.46844482421875, -0.431915283203125, -0.3953857421875, -0.358856201171875, -0.32232666015625, -0.285797119140625, -0.249267578125, -0.212738037109375, -0.17620849609375, -0.139678955078125, -0.1031494140625, -0.066619873046875, -0.03009033203125, 0.006439208984375, 0.04296875, 0.079498291015625, 0.11602783203125, 0.152557373046875, 0.1890869140625, 0.225616455078125, 0.26214599609375, 0.298675537109375, 0.335205078125, 0.371734619140625, 0.40826416015625, 0.444793701171875, 0.4813232421875, 0.517852783203125, 0.55438232421875, 0.590911865234375, 0.62744140625, 0.663970947265625, 0.70050048828125, 0.737030029296875, 0.7735595703125, 0.810089111328125, 0.84661865234375, 0.883148193359375, 0.919677734375, 0.956207275390625, 0.99273681640625, 1.029266357421875, 1.0657958984375, 1.102325439453125, 1.13885498046875, 1.175384521484375, 1.2119140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 13.0, 15.0, 13.0, 21.0, 34.0, 42.0, 49.0, 70.0, 106.0, 159.0, 179.0, 326.0, 485.0, 738.0, 1210.0, 2624.0, 6806.0, 25976.0, 146327.0, 548160.0, 254875.0, 42843.0, 10007.0, 3333.0, 1566.0, 841.0, 539.0, 370.0, 224.0, 158.0, 113.0, 90.0, 55.0, 55.0, 28.0, 23.0, 28.0, 14.0, 8.0, 11.0, 6.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.755859375, -2.67633056640625, -2.5968017578125, -2.51727294921875, -2.437744140625, -2.35821533203125, -2.2786865234375, -2.19915771484375, -2.11962890625, -2.04010009765625, -1.9605712890625, -1.88104248046875, -1.801513671875, -1.72198486328125, -1.6424560546875, -1.56292724609375, -1.4833984375, -1.40386962890625, -1.3243408203125, -1.24481201171875, -1.165283203125, -1.08575439453125, -1.0062255859375, -0.92669677734375, -0.84716796875, -0.76763916015625, -0.6881103515625, -0.60858154296875, -0.529052734375, -0.44952392578125, -0.3699951171875, -0.29046630859375, -0.2109375, -0.13140869140625, -0.0518798828125, 0.02764892578125, 0.107177734375, 0.18670654296875, 0.2662353515625, 0.34576416015625, 0.42529296875, 0.50482177734375, 0.5843505859375, 0.66387939453125, 0.743408203125, 0.82293701171875, 0.9024658203125, 0.98199462890625, 1.0615234375, 1.14105224609375, 1.2205810546875, 1.30010986328125, 1.379638671875, 1.45916748046875, 1.5386962890625, 1.61822509765625, 1.69775390625, 1.77728271484375, 1.8568115234375, 1.93634033203125, 2.015869140625, 2.09539794921875, 2.1749267578125, 2.25445556640625, 2.333984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 5.0, 16.0, 13.0, 17.0, 24.0, 25.0, 34.0, 43.0, 28.0, 37.0, 41.0, 55.0, 52.0, 52.0, 59.0, 50.0, 56.0, 51.0, 51.0, 37.0, 42.0, 33.0, 25.0, 24.0, 23.0, 25.0, 10.0, 8.0, 14.0, 10.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.54229736328125, -2.4635009765625, -2.38470458984375, -2.305908203125, -2.22711181640625, -2.1483154296875, -2.06951904296875, -1.99072265625, -1.91192626953125, -1.8331298828125, -1.75433349609375, -1.675537109375, -1.59674072265625, -1.5179443359375, -1.43914794921875, -1.3603515625, -1.28155517578125, -1.2027587890625, -1.12396240234375, -1.045166015625, -0.96636962890625, -0.8875732421875, -0.80877685546875, -0.72998046875, -0.65118408203125, -0.5723876953125, -0.49359130859375, -0.414794921875, -0.33599853515625, -0.2572021484375, -0.17840576171875, -0.099609375, -0.02081298828125, 0.0579833984375, 0.13677978515625, 0.215576171875, 0.29437255859375, 0.3731689453125, 0.45196533203125, 0.53076171875, 0.60955810546875, 0.6883544921875, 0.76715087890625, 0.845947265625, 0.92474365234375, 1.0035400390625, 1.08233642578125, 1.1611328125, 1.23992919921875, 1.3187255859375, 1.39752197265625, 1.476318359375, 1.55511474609375, 1.6339111328125, 1.71270751953125, 1.79150390625, 1.87030029296875, 1.9490966796875, 2.02789306640625, 2.106689453125, 2.18548583984375, 2.2642822265625, 2.34307861328125, 2.421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 9.0, 10.0, 13.0, 29.0, 51.0, 135.0, 365.0, 1989.0, 27929.0, 955019.0, 59307.0, 2870.0, 498.0, 157.0, 61.0, 42.0, 20.0, 11.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.91009521484375, -2.8006591796875, -2.69122314453125, -2.581787109375, -2.47235107421875, -2.3629150390625, -2.25347900390625, -2.14404296875, -2.03460693359375, -1.9251708984375, -1.81573486328125, -1.706298828125, -1.59686279296875, -1.4874267578125, -1.37799072265625, -1.2685546875, -1.15911865234375, -1.0496826171875, -0.94024658203125, -0.830810546875, -0.72137451171875, -0.6119384765625, -0.50250244140625, -0.39306640625, -0.28363037109375, -0.1741943359375, -0.06475830078125, 0.044677734375, 0.15411376953125, 0.2635498046875, 0.37298583984375, 0.482421875, 0.59185791015625, 0.7012939453125, 0.81072998046875, 0.920166015625, 1.02960205078125, 1.1390380859375, 1.24847412109375, 1.35791015625, 1.46734619140625, 1.5767822265625, 1.68621826171875, 1.795654296875, 1.90509033203125, 2.0145263671875, 2.12396240234375, 2.2333984375, 2.34283447265625, 2.4522705078125, 2.56170654296875, 2.671142578125, 2.78057861328125, 2.8900146484375, 2.99945068359375, 3.10888671875, 3.21832275390625, 3.3277587890625, 3.43719482421875, 3.546630859375, 3.65606689453125, 3.7655029296875, 3.87493896484375, 3.984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 4.0, 8.0, 4.0, 10.0, 6.0, 15.0, 18.0, 13.0, 18.0, 23.0, 30.0, 35.0, 49.0, 70.0, 73.0, 98.0, 88.0, 83.0, 61.0, 55.0, 34.0, 31.0, 26.0, 29.0, 23.0, 18.0, 13.0, 11.0, 7.0, 5.0, 5.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00014591217041015625, -0.00014179013669490814, -0.00013766810297966003, -0.00013354606926441193, -0.00012942403554916382, -0.0001253020018339157, -0.0001211799681186676, -0.0001170579344034195, -0.00011293590068817139, -0.00010881386697292328, -0.00010469183325767517, -0.00010056979954242706, -9.644776582717896e-05, -9.232573211193085e-05, -8.820369839668274e-05, -8.408166468143463e-05, -7.995963096618652e-05, -7.583759725093842e-05, -7.171556353569031e-05, -6.75935298204422e-05, -6.347149610519409e-05, -5.9349462389945984e-05, -5.5227428674697876e-05, -5.110539495944977e-05, -4.698336124420166e-05, -4.286132752895355e-05, -3.8739293813705444e-05, -3.4617260098457336e-05, -3.049522638320923e-05, -2.637319266796112e-05, -2.2251158952713013e-05, -1.8129125237464905e-05, -1.4007091522216797e-05, -9.885057806968689e-06, -5.763024091720581e-06, -1.6409903764724731e-06, 2.4810433387756348e-06, 6.603077054023743e-06, 1.072511076927185e-05, 1.4847144484519958e-05, 1.8969178199768066e-05, 2.3091211915016174e-05, 2.7213245630264282e-05, 3.133527934551239e-05, 3.54573130607605e-05, 3.9579346776008606e-05, 4.3701380491256714e-05, 4.782341420650482e-05, 5.194544792175293e-05, 5.606748163700104e-05, 6.0189515352249146e-05, 6.431154906749725e-05, 6.843358278274536e-05, 7.255561649799347e-05, 7.667765021324158e-05, 8.079968392848969e-05, 8.492171764373779e-05, 8.90437513589859e-05, 9.316578507423401e-05, 9.728781878948212e-05, 0.00010140985250473022, 0.00010553188621997833, 0.00010965391993522644, 0.00011377595365047455, 0.00011789798736572266]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 10.0, 18.0, 30.0, 32.0, 66.0, 112.0, 241.0, 622.0, 2038.0, 13178.0, 576583.0, 441321.0, 11335.0, 1817.0, 576.0, 245.0, 115.0, 69.0, 51.0, 26.0, 11.0, 11.0, 9.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0], "bins": [-3.751953125, -3.660369873046875, -3.56878662109375, -3.477203369140625, -3.3856201171875, -3.294036865234375, -3.20245361328125, -3.110870361328125, -3.019287109375, -2.927703857421875, -2.83612060546875, -2.744537353515625, -2.6529541015625, -2.561370849609375, -2.46978759765625, -2.378204345703125, -2.28662109375, -2.195037841796875, -2.10345458984375, -2.011871337890625, -1.9202880859375, -1.828704833984375, -1.73712158203125, -1.645538330078125, -1.553955078125, -1.462371826171875, -1.37078857421875, -1.279205322265625, -1.1876220703125, -1.096038818359375, -1.00445556640625, -0.912872314453125, -0.8212890625, -0.729705810546875, -0.63812255859375, -0.546539306640625, -0.4549560546875, -0.363372802734375, -0.27178955078125, -0.180206298828125, -0.088623046875, 0.002960205078125, 0.09454345703125, 0.186126708984375, 0.2777099609375, 0.369293212890625, 0.46087646484375, 0.552459716796875, 0.64404296875, 0.735626220703125, 0.82720947265625, 0.918792724609375, 1.0103759765625, 1.101959228515625, 1.19354248046875, 1.285125732421875, 1.376708984375, 1.468292236328125, 1.55987548828125, 1.651458740234375, 1.7430419921875, 1.834625244140625, 1.92620849609375, 2.017791748046875, 2.109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 10.0, 16.0, 25.0, 41.0, 85.0, 104.0, 140.0, 145.0, 151.0, 89.0, 53.0, 47.0, 22.0, 22.0, 12.0, 13.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.43402099609375, -1.3885498046875, -1.34307861328125, -1.297607421875, -1.25213623046875, -1.2066650390625, -1.16119384765625, -1.11572265625, -1.07025146484375, -1.0247802734375, -0.97930908203125, -0.933837890625, -0.88836669921875, -0.8428955078125, -0.79742431640625, -0.751953125, -0.70648193359375, -0.6610107421875, -0.61553955078125, -0.570068359375, -0.52459716796875, -0.4791259765625, -0.43365478515625, -0.38818359375, -0.34271240234375, -0.2972412109375, -0.25177001953125, -0.206298828125, -0.16082763671875, -0.1153564453125, -0.06988525390625, -0.0244140625, 0.02105712890625, 0.0665283203125, 0.11199951171875, 0.157470703125, 0.20294189453125, 0.2484130859375, 0.29388427734375, 0.33935546875, 0.38482666015625, 0.4302978515625, 0.47576904296875, 0.521240234375, 0.56671142578125, 0.6121826171875, 0.65765380859375, 0.703125, 0.74859619140625, 0.7940673828125, 0.83953857421875, 0.885009765625, 0.93048095703125, 0.9759521484375, 1.02142333984375, 1.06689453125, 1.11236572265625, 1.1578369140625, 1.20330810546875, 1.248779296875, 1.29425048828125, 1.3397216796875, 1.38519287109375, 1.4306640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 17.0, 13.0, 32.0, 63.0, 135.0, 172.0, 198.0, 147.0, 91.0, 54.0, 36.0, 7.0, 10.0, 10.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.320911407470703, -8.837846755981445, -8.354782104492188, -7.87171745300293, -7.388652801513672, -6.905588150024414, -6.422523021697998, -5.93945837020874, -5.456393718719482, -4.973329067230225, -4.490264415740967, -4.007199287414551, -3.524134874343872, -3.0410702228546143, -2.5580053329467773, -2.0749406814575195, -1.5918760299682617, -1.108811378479004, -0.6257466077804565, -0.14268183708190918, 0.34038281440734863, 0.8234474658966064, 1.3065123558044434, 1.7895770072937012, 2.272641658782959, 2.755706310272217, 3.2387709617614746, 3.7218358516693115, 4.204900741577148, 4.687965393066406, 5.171030044555664, 5.654094696044922, 6.13715934753418, 6.6202239990234375, 7.103288650512695, 7.586353302001953, 8.069417953491211, 8.552482604980469, 9.035547256469727, 9.518611907958984, 10.001676559448242, 10.4847412109375, 10.967805862426758, 11.450870513916016, 11.933935165405273, 12.416999816894531, 12.900064468383789, 13.383129119873047, 13.866194725036621, 14.349259376525879, 14.832324028015137, 15.315388679504395, 15.798453330993652, 16.281518936157227, 16.764583587646484, 17.247648239135742, 17.730712890625, 18.213777542114258, 18.696842193603516, 19.179906845092773, 19.66297149658203, 20.14603614807129, 20.629100799560547, 21.112165451049805, 21.595230102539062]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 6.0, 4.0, 10.0, 9.0, 8.0, 14.0, 17.0, 11.0, 32.0, 25.0, 31.0, 35.0, 40.0, 40.0, 40.0, 47.0, 47.0, 37.0, 42.0, 59.0, 42.0, 34.0, 36.0, 38.0, 38.0, 27.0, 34.0, 24.0, 24.0, 20.0, 15.0, 20.0, 20.0, 11.0, 8.0, 9.0, 8.0, 4.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.24370288848877, -12.820619583129883, -12.39753532409668, -11.974452018737793, -11.551368713378906, -11.128284454345703, -10.705201148986816, -10.28211784362793, -9.859033584594727, -9.43595027923584, -9.012866020202637, -8.58978271484375, -8.166699409484863, -7.743615627288818, -7.320531845092773, -6.897448539733887, -6.474365234375, -6.051281452178955, -5.628198146820068, -5.205114364624023, -4.782031059265137, -4.358947277069092, -3.935863494873047, -3.512779951095581, -3.0896964073181152, -2.6666128635406494, -2.2435293197631836, -1.8204455375671387, -1.3973619937896729, -0.974278450012207, -0.5511946678161621, -0.1281111240386963, 0.2949714660644531, 0.7180550694465637, 1.1411386728286743, 1.5642223358154297, 1.9873058795928955, 2.4103894233703613, 2.8334732055664062, 3.256556749343872, 3.679640293121338, 4.102724075317383, 4.5258073806762695, 4.9488911628723145, 5.371974945068359, 5.795058250427246, 6.218142032623291, 6.641225814819336, 7.064309120178223, 7.487392902374268, 7.910476207733154, 8.3335599899292, 8.756643295288086, 9.179727554321289, 9.602810859680176, 10.025894165039062, 10.448978424072266, 10.872061729431152, 11.295145988464355, 11.718229293823242, 12.141312599182129, 12.564395904541016, 12.987480163574219, 13.410563468933105, 13.833646774291992]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 15.0, 17.0, 22.0, 51.0, 113.0, 249.0, 696.0, 3210.0, 114871.0, 4064521.0, 8411.0, 1351.0, 408.0, 149.0, 80.0, 41.0, 19.0, 16.0, 5.0, 8.0, 7.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.267333984375, -10.91748046875, -10.567626953125, -10.2177734375, -9.867919921875, -9.51806640625, -9.168212890625, -8.818359375, -8.468505859375, -8.11865234375, -7.768798828125, -7.4189453125, -7.069091796875, -6.71923828125, -6.369384765625, -6.01953125, -5.669677734375, -5.31982421875, -4.969970703125, -4.6201171875, -4.270263671875, -3.92041015625, -3.570556640625, -3.220703125, -2.870849609375, -2.52099609375, -2.171142578125, -1.8212890625, -1.471435546875, -1.12158203125, -0.771728515625, -0.421875, -0.072021484375, 0.27783203125, 0.627685546875, 0.9775390625, 1.327392578125, 1.67724609375, 2.027099609375, 2.376953125, 2.726806640625, 3.07666015625, 3.426513671875, 3.7763671875, 4.126220703125, 4.47607421875, 4.825927734375, 5.17578125, 5.525634765625, 5.87548828125, 6.225341796875, 6.5751953125, 6.925048828125, 7.27490234375, 7.624755859375, 7.974609375, 8.324462890625, 8.67431640625, 9.024169921875, 9.3740234375, 9.723876953125, 10.07373046875, 10.423583984375, 10.7734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 11.0, 15.0, 28.0, 42.0, 100.0, 130.0, 187.0, 173.0, 129.0, 73.0, 59.0, 25.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0848388671875, -1.048583984375, -1.0123291015625, -0.97607421875, -0.9398193359375, -0.903564453125, -0.8673095703125, -0.8310546875, -0.7947998046875, -0.758544921875, -0.7222900390625, -0.68603515625, -0.6497802734375, -0.613525390625, -0.5772705078125, -0.541015625, -0.5047607421875, -0.468505859375, -0.4322509765625, -0.39599609375, -0.3597412109375, -0.323486328125, -0.2872314453125, -0.2509765625, -0.2147216796875, -0.178466796875, -0.1422119140625, -0.10595703125, -0.0697021484375, -0.033447265625, 0.0028076171875, 0.0390625, 0.0753173828125, 0.111572265625, 0.1478271484375, 0.18408203125, 0.2203369140625, 0.256591796875, 0.2928466796875, 0.3291015625, 0.3653564453125, 0.401611328125, 0.4378662109375, 0.47412109375, 0.5103759765625, 0.546630859375, 0.5828857421875, 0.619140625, 0.6553955078125, 0.691650390625, 0.7279052734375, 0.76416015625, 0.8004150390625, 0.836669921875, 0.8729248046875, 0.9091796875, 0.9454345703125, 0.981689453125, 1.0179443359375, 1.05419921875, 1.0904541015625, 1.126708984375, 1.1629638671875, 1.19921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 21.0, 39.0, 90.0, 299.0, 857.0, 5027.0, 497598.0, 3679884.0, 8720.0, 1166.0, 318.0, 123.0, 69.0, 40.0, 13.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.630859375, -3.405426025390625, -3.17999267578125, -2.954559326171875, -2.7291259765625, -2.503692626953125, -2.27825927734375, -2.052825927734375, -1.827392578125, -1.601959228515625, -1.37652587890625, -1.151092529296875, -0.9256591796875, -0.700225830078125, -0.47479248046875, -0.249359130859375, -0.02392578125, 0.201507568359375, 0.42694091796875, 0.652374267578125, 0.8778076171875, 1.103240966796875, 1.32867431640625, 1.554107666015625, 1.779541015625, 2.004974365234375, 2.23040771484375, 2.455841064453125, 2.6812744140625, 2.906707763671875, 3.13214111328125, 3.357574462890625, 3.5830078125, 3.808441162109375, 4.03387451171875, 4.259307861328125, 4.4847412109375, 4.710174560546875, 4.93560791015625, 5.161041259765625, 5.386474609375, 5.611907958984375, 5.83734130859375, 6.062774658203125, 6.2882080078125, 6.513641357421875, 6.73907470703125, 6.964508056640625, 7.18994140625, 7.415374755859375, 7.64080810546875, 7.866241455078125, 8.0916748046875, 8.317108154296875, 8.54254150390625, 8.767974853515625, 8.993408203125, 9.218841552734375, 9.44427490234375, 9.669708251953125, 9.8951416015625, 10.120574951171875, 10.34600830078125, 10.571441650390625, 10.796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 11.0, 34.0, 64.0, 134.0, 442.0, 1835.0, 1044.0, 257.0, 119.0, 57.0, 19.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -0.9988250732421875, -0.958587646484375, -0.9183502197265625, -0.87811279296875, -0.8378753662109375, -0.797637939453125, -0.7574005126953125, -0.7171630859375, -0.6769256591796875, -0.636688232421875, -0.5964508056640625, -0.55621337890625, -0.5159759521484375, -0.475738525390625, -0.4355010986328125, -0.395263671875, -0.3550262451171875, -0.314788818359375, -0.2745513916015625, -0.23431396484375, -0.1940765380859375, -0.153839111328125, -0.1136016845703125, -0.0733642578125, -0.0331268310546875, 0.007110595703125, 0.0473480224609375, 0.08758544921875, 0.1278228759765625, 0.168060302734375, 0.2082977294921875, 0.24853515625, 0.2887725830078125, 0.329010009765625, 0.3692474365234375, 0.40948486328125, 0.4497222900390625, 0.489959716796875, 0.5301971435546875, 0.5704345703125, 0.6106719970703125, 0.650909423828125, 0.6911468505859375, 0.73138427734375, 0.7716217041015625, 0.811859130859375, 0.8520965576171875, 0.892333984375, 0.9325714111328125, 0.972808837890625, 1.0130462646484375, 1.05328369140625, 1.0935211181640625, 1.133758544921875, 1.1739959716796875, 1.2142333984375, 1.2544708251953125, 1.294708251953125, 1.3349456787109375, 1.37518310546875, 1.4154205322265625, 1.455657958984375, 1.4958953857421875, 1.5361328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 18.0, 48.0, 166.0, 290.0, 263.0, 136.0, 45.0, 15.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669973373413086, -2.4633448123931885, -2.256716251373291, -2.0500874519348145, -1.843458890914917, -1.6368303298950195, -1.430201768875122, -1.223573088645935, -1.0169445276260376, -0.8103159070014954, -0.6036872863769531, -0.39705872535705566, -0.19043010473251343, 0.01619851589202881, 0.22282707691192627, 0.4294557571411133, 0.6360843181610107, 0.842712938785553, 1.0493415594100952, 1.2559701204299927, 1.4625988006591797, 1.6692273616790771, 1.8758559226989746, 2.082484722137451, 2.2891130447387695, 2.495741605758667, 2.7023701667785645, 2.908998966217041, 3.1156275272369385, 3.322256088256836, 3.5288846492767334, 3.735513210296631, 3.9421420097351074, 4.148770809173584, 4.355399131774902, 4.562027931213379, 4.768656253814697, 4.975285053253174, 5.181913375854492, 5.388542175292969, 5.595170974731445, 5.801799774169922, 6.00842809677124, 6.215056896209717, 6.421685218811035, 6.628314018249512, 6.834942817687988, 7.041571140289307, 7.248199462890625, 7.454828262329102, 7.66145658493042, 7.8680853843688965, 8.074713706970215, 8.281342506408691, 8.487971305847168, 8.694600105285645, 8.901228904724121, 9.107857704162598, 9.314486503601074, 9.521114349365234, 9.727743148803711, 9.934371948242188, 10.141000747680664, 10.34762954711914, 10.5542573928833]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 5.0, 7.0, 4.0, 0.0, 4.0, 5.0, 5.0, 8.0, 8.0, 9.0, 8.0, 15.0, 15.0, 16.0, 21.0, 19.0, 16.0, 27.0, 41.0, 40.0, 39.0, 40.0, 46.0, 45.0, 44.0, 40.0, 45.0, 44.0, 40.0, 31.0, 30.0, 33.0, 35.0, 19.0, 27.0, 16.0, 30.0, 19.0, 26.0, 20.0, 9.0, 12.0, 10.0, 9.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.435965061187744, -2.364072799682617, -2.2921805381774902, -2.2202882766723633, -2.1483960151672363, -2.0765037536621094, -2.0046114921569824, -1.9327192306518555, -1.8608269691467285, -1.7889347076416016, -1.7170424461364746, -1.6451501846313477, -1.5732579231262207, -1.5013656616210938, -1.4294734001159668, -1.3575811386108398, -1.285688877105713, -1.213796615600586, -1.141904354095459, -1.070012092590332, -0.9981198310852051, -0.9262275695800781, -0.8543353080749512, -0.7824430465698242, -0.7105507850646973, -0.6386585235595703, -0.5667662620544434, -0.4948740005493164, -0.42298173904418945, -0.3510894775390625, -0.27919721603393555, -0.2073049545288086, -0.13541245460510254, -0.06352019309997559, 0.008372068405151367, 0.08026432991027832, 0.15215659141540527, 0.22404885292053223, 0.2959411144256592, 0.36783337593078613, 0.4397256374359131, 0.51161789894104, 0.583510160446167, 0.655402421951294, 0.7272946834564209, 0.7991869449615479, 0.8710792064666748, 0.9429714679718018, 1.0148637294769287, 1.0867559909820557, 1.1586482524871826, 1.2305405139923096, 1.3024327754974365, 1.3743250370025635, 1.4462172985076904, 1.5181095600128174, 1.5900018215179443, 1.6618940830230713, 1.7337863445281982, 1.8056786060333252, 1.8775708675384521, 1.949463129043579, 2.021355390548706, 2.093247652053833, 2.16513991355896]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 11.0, 12.0, 10.0, 13.0, 14.0, 25.0, 53.0, 55.0, 74.0, 99.0, 156.0, 206.0, 317.0, 446.0, 758.0, 1347.0, 2590.0, 6493.0, 24153.0, 143561.0, 557266.0, 253869.0, 40159.0, 9246.0, 3430.0, 1543.0, 860.0, 551.0, 353.0, 286.0, 146.0, 124.0, 86.0, 62.0, 52.0, 42.0, 21.0, 17.0, 18.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0235595703125, -1.955322265625, -1.8870849609375, -1.81884765625, -1.7506103515625, -1.682373046875, -1.6141357421875, -1.5458984375, -1.4776611328125, -1.409423828125, -1.3411865234375, -1.27294921875, -1.2047119140625, -1.136474609375, -1.0682373046875, -1.0, -0.9317626953125, -0.863525390625, -0.7952880859375, -0.72705078125, -0.6588134765625, -0.590576171875, -0.5223388671875, -0.4541015625, -0.3858642578125, -0.317626953125, -0.2493896484375, -0.18115234375, -0.1129150390625, -0.044677734375, 0.0235595703125, 0.091796875, 0.1600341796875, 0.228271484375, 0.2965087890625, 0.36474609375, 0.4329833984375, 0.501220703125, 0.5694580078125, 0.6376953125, 0.7059326171875, 0.774169921875, 0.8424072265625, 0.91064453125, 0.9788818359375, 1.047119140625, 1.1153564453125, 1.18359375, 1.2518310546875, 1.320068359375, 1.3883056640625, 1.45654296875, 1.5247802734375, 1.593017578125, 1.6612548828125, 1.7294921875, 1.7977294921875, 1.865966796875, 1.9342041015625, 2.00244140625, 2.0706787109375, 2.138916015625, 2.2071533203125, 2.275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 17.0, 39.0, 66.0, 91.0, 126.0, 177.0, 164.0, 122.0, 89.0, 44.0, 22.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.0489044189453125, -1.014801025390625, -0.9806976318359375, -0.94659423828125, -0.9124908447265625, -0.878387451171875, -0.8442840576171875, -0.8101806640625, -0.7760772705078125, -0.741973876953125, -0.7078704833984375, -0.67376708984375, -0.6396636962890625, -0.605560302734375, -0.5714569091796875, -0.537353515625, -0.5032501220703125, -0.469146728515625, -0.4350433349609375, -0.40093994140625, -0.3668365478515625, -0.332733154296875, -0.2986297607421875, -0.2645263671875, -0.2304229736328125, -0.196319580078125, -0.1622161865234375, -0.12811279296875, -0.0940093994140625, -0.059906005859375, -0.0258026123046875, 0.00830078125, 0.0424041748046875, 0.076507568359375, 0.1106109619140625, 0.14471435546875, 0.1788177490234375, 0.212921142578125, 0.2470245361328125, 0.2811279296875, 0.3152313232421875, 0.349334716796875, 0.3834381103515625, 0.41754150390625, 0.4516448974609375, 0.485748291015625, 0.5198516845703125, 0.553955078125, 0.5880584716796875, 0.622161865234375, 0.6562652587890625, 0.69036865234375, 0.7244720458984375, 0.758575439453125, 0.7926788330078125, 0.8267822265625, 0.8608856201171875, 0.894989013671875, 0.9290924072265625, 0.96319580078125, 0.9972991943359375, 1.031402587890625, 1.0655059814453125, 1.099609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 10.0, 13.0, 19.0, 23.0, 28.0, 56.0, 58.0, 99.0, 117.0, 201.0, 283.0, 409.0, 697.0, 1365.0, 3017.0, 9309.0, 44009.0, 285627.0, 540324.0, 130834.0, 21885.0, 5500.0, 2041.0, 998.0, 546.0, 352.0, 227.0, 148.0, 116.0, 63.0, 51.0, 37.0, 20.0, 16.0, 11.0, 4.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.35479736328125, -2.2818603515625, -2.20892333984375, -2.135986328125, -2.06304931640625, -1.9901123046875, -1.91717529296875, -1.84423828125, -1.77130126953125, -1.6983642578125, -1.62542724609375, -1.552490234375, -1.47955322265625, -1.4066162109375, -1.33367919921875, -1.2607421875, -1.18780517578125, -1.1148681640625, -1.04193115234375, -0.968994140625, -0.89605712890625, -0.8231201171875, -0.75018310546875, -0.67724609375, -0.60430908203125, -0.5313720703125, -0.45843505859375, -0.385498046875, -0.31256103515625, -0.2396240234375, -0.16668701171875, -0.09375, -0.02081298828125, 0.0521240234375, 0.12506103515625, 0.197998046875, 0.27093505859375, 0.3438720703125, 0.41680908203125, 0.48974609375, 0.56268310546875, 0.6356201171875, 0.70855712890625, 0.781494140625, 0.85443115234375, 0.9273681640625, 1.00030517578125, 1.0732421875, 1.14617919921875, 1.2191162109375, 1.29205322265625, 1.364990234375, 1.43792724609375, 1.5108642578125, 1.58380126953125, 1.65673828125, 1.72967529296875, 1.8026123046875, 1.87554931640625, 1.948486328125, 2.02142333984375, 2.0943603515625, 2.16729736328125, 2.240234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 10.0, 13.0, 6.0, 13.0, 19.0, 18.0, 12.0, 19.0, 21.0, 17.0, 34.0, 41.0, 37.0, 46.0, 44.0, 45.0, 54.0, 43.0, 58.0, 60.0, 54.0, 31.0, 35.0, 29.0, 36.0, 33.0, 28.0, 27.0, 20.0, 18.0, 15.0, 10.0, 10.0, 9.0, 7.0, 11.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.62109375, -2.548309326171875, -2.47552490234375, -2.402740478515625, -2.3299560546875, -2.257171630859375, -2.18438720703125, -2.111602783203125, -2.038818359375, -1.966033935546875, -1.89324951171875, -1.820465087890625, -1.7476806640625, -1.674896240234375, -1.60211181640625, -1.529327392578125, -1.45654296875, -1.383758544921875, -1.31097412109375, -1.238189697265625, -1.1654052734375, -1.092620849609375, -1.01983642578125, -0.947052001953125, -0.874267578125, -0.801483154296875, -0.72869873046875, -0.655914306640625, -0.5831298828125, -0.510345458984375, -0.43756103515625, -0.364776611328125, -0.2919921875, -0.219207763671875, -0.14642333984375, -0.073638916015625, -0.0008544921875, 0.071929931640625, 0.14471435546875, 0.217498779296875, 0.290283203125, 0.363067626953125, 0.43585205078125, 0.508636474609375, 0.5814208984375, 0.654205322265625, 0.72698974609375, 0.799774169921875, 0.87255859375, 0.945343017578125, 1.01812744140625, 1.090911865234375, 1.1636962890625, 1.236480712890625, 1.30926513671875, 1.382049560546875, 1.454833984375, 1.527618408203125, 1.60040283203125, 1.673187255859375, 1.7459716796875, 1.818756103515625, 1.89154052734375, 1.964324951171875, 2.037109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 9.0, 14.0, 13.0, 18.0, 23.0, 34.0, 54.0, 82.0, 144.0, 257.0, 490.0, 1071.0, 2895.0, 9344.0, 45902.0, 338916.0, 540573.0, 86602.0, 15150.0, 4129.0, 1378.0, 639.0, 340.0, 161.0, 107.0, 69.0, 36.0, 23.0, 21.0, 10.0, 15.0, 7.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6982421875, -0.6743011474609375, -0.650360107421875, -0.6264190673828125, -0.60247802734375, -0.5785369873046875, -0.554595947265625, -0.5306549072265625, -0.5067138671875, -0.4827728271484375, -0.458831787109375, -0.4348907470703125, -0.41094970703125, -0.3870086669921875, -0.363067626953125, -0.3391265869140625, -0.315185546875, -0.2912445068359375, -0.267303466796875, -0.2433624267578125, -0.21942138671875, -0.1954803466796875, -0.171539306640625, -0.1475982666015625, -0.1236572265625, -0.0997161865234375, -0.075775146484375, -0.0518341064453125, -0.02789306640625, -0.0039520263671875, 0.019989013671875, 0.0439300537109375, 0.06787109375, 0.0918121337890625, 0.115753173828125, 0.1396942138671875, 0.16363525390625, 0.1875762939453125, 0.211517333984375, 0.2354583740234375, 0.2593994140625, 0.2833404541015625, 0.307281494140625, 0.3312225341796875, 0.35516357421875, 0.3791046142578125, 0.403045654296875, 0.4269866943359375, 0.450927734375, 0.4748687744140625, 0.498809814453125, 0.5227508544921875, 0.54669189453125, 0.5706329345703125, 0.594573974609375, 0.6185150146484375, 0.6424560546875, 0.6663970947265625, 0.690338134765625, 0.7142791748046875, 0.73822021484375, 0.7621612548828125, 0.786102294921875, 0.8100433349609375, 0.833984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 12.0, 9.0, 20.0, 21.0, 27.0, 42.0, 54.0, 58.0, 93.0, 136.0, 134.0, 87.0, 73.0, 57.0, 39.0, 29.0, 27.0, 20.0, 16.0, 9.0, 10.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00020575523376464844, -0.00020063575357198715, -0.00019551627337932587, -0.00019039679318666458, -0.0001852773129940033, -0.000180157832801342, -0.00017503835260868073, -0.00016991887241601944, -0.00016479939222335815, -0.00015967991203069687, -0.00015456043183803558, -0.0001494409516453743, -0.000144321471452713, -0.00013920199126005173, -0.00013408251106739044, -0.00012896303087472916, -0.00012384355068206787, -0.00011872407048940659, -0.0001136045902967453, -0.00010848511010408401, -0.00010336562991142273, -9.824614971876144e-05, -9.312666952610016e-05, -8.800718933343887e-05, -8.288770914077759e-05, -7.77682289481163e-05, -7.264874875545502e-05, -6.752926856279373e-05, -6.240978837013245e-05, -5.729030817747116e-05, -5.2170827984809875e-05, -4.705134779214859e-05, -4.1931867599487305e-05, -3.681238740682602e-05, -3.1692907214164734e-05, -2.657342702150345e-05, -2.1453946828842163e-05, -1.6334466636180878e-05, -1.1214986443519592e-05, -6.095506250858307e-06, -9.760260581970215e-07, 4.143454134464264e-06, 9.26293432712555e-06, 1.4382414519786835e-05, 1.950189471244812e-05, 2.4621374905109406e-05, 2.974085509777069e-05, 3.4860335290431976e-05, 3.997981548309326e-05, 4.509929567575455e-05, 5.021877586841583e-05, 5.533825606107712e-05, 6.04577362537384e-05, 6.557721644639969e-05, 7.069669663906097e-05, 7.581617683172226e-05, 8.093565702438354e-05, 8.605513721704483e-05, 9.117461740970612e-05, 9.62940976023674e-05, 0.00010141357779502869, 0.00010653305798768997, 0.00011165253818035126, 0.00011677201837301254, 0.00012189149856567383]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 7.0, 15.0, 14.0, 25.0, 53.0, 103.0, 186.0, 378.0, 794.0, 2462.0, 11833.0, 142391.0, 785058.0, 92617.0, 8900.0, 2155.0, 806.0, 315.0, 174.0, 104.0, 45.0, 27.0, 27.0, 18.0, 12.0, 13.0, 4.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9951171875, -0.960113525390625, -0.92510986328125, -0.890106201171875, -0.8551025390625, -0.820098876953125, -0.78509521484375, -0.750091552734375, -0.715087890625, -0.680084228515625, -0.64508056640625, -0.610076904296875, -0.5750732421875, -0.540069580078125, -0.50506591796875, -0.470062255859375, -0.43505859375, -0.400054931640625, -0.36505126953125, -0.330047607421875, -0.2950439453125, -0.260040283203125, -0.22503662109375, -0.190032958984375, -0.155029296875, -0.120025634765625, -0.08502197265625, -0.050018310546875, -0.0150146484375, 0.019989013671875, 0.05499267578125, 0.089996337890625, 0.125, 0.160003662109375, 0.19500732421875, 0.230010986328125, 0.2650146484375, 0.300018310546875, 0.33502197265625, 0.370025634765625, 0.405029296875, 0.440032958984375, 0.47503662109375, 0.510040283203125, 0.5450439453125, 0.580047607421875, 0.61505126953125, 0.650054931640625, 0.68505859375, 0.720062255859375, 0.75506591796875, 0.790069580078125, 0.8250732421875, 0.860076904296875, 0.89508056640625, 0.930084228515625, 0.965087890625, 1.000091552734375, 1.03509521484375, 1.070098876953125, 1.1051025390625, 1.140106201171875, 1.17510986328125, 1.210113525390625, 1.2451171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 14.0, 20.0, 27.0, 28.0, 64.0, 65.0, 98.0, 101.0, 83.0, 103.0, 108.0, 72.0, 54.0, 43.0, 28.0, 28.0, 22.0, 6.0, 8.0, 10.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7948989868164062, -0.7719268798828125, -0.7489547729492188, -0.725982666015625, -0.7030105590820312, -0.6800384521484375, -0.6570663452148438, -0.63409423828125, -0.6111221313476562, -0.5881500244140625, -0.5651779174804688, -0.542205810546875, -0.5192337036132812, -0.4962615966796875, -0.47328948974609375, -0.4503173828125, -0.42734527587890625, -0.4043731689453125, -0.38140106201171875, -0.358428955078125, -0.33545684814453125, -0.3124847412109375, -0.28951263427734375, -0.26654052734375, -0.24356842041015625, -0.2205963134765625, -0.19762420654296875, -0.174652099609375, -0.15167999267578125, -0.1287078857421875, -0.10573577880859375, -0.082763671875, -0.05979156494140625, -0.0368194580078125, -0.01384735107421875, 0.009124755859375, 0.03209686279296875, 0.0550689697265625, 0.07804107666015625, 0.10101318359375, 0.12398529052734375, 0.1469573974609375, 0.16992950439453125, 0.192901611328125, 0.21587371826171875, 0.2388458251953125, 0.26181793212890625, 0.2847900390625, 0.30776214599609375, 0.3307342529296875, 0.35370635986328125, 0.376678466796875, 0.39965057373046875, 0.4226226806640625, 0.44559478759765625, 0.46856689453125, 0.49153900146484375, 0.5145111083984375, 0.5374832153320312, 0.560455322265625, 0.5834274291992188, 0.6063995361328125, 0.6293716430664062, 0.65234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 17.0, 75.0, 479.0, 398.0, 38.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.771095275878906, -22.180673599243164, -20.590253829956055, -18.999832153320312, -17.409412384033203, -15.818990707397461, -14.228569984436035, -12.63814926147461, -11.047728538513184, -9.457307815551758, -7.866887092590332, -6.276465892791748, -4.686045169830322, -3.0956244468688965, -1.5052032470703125, 0.08521747589111328, 1.675638198852539, 3.266058921813965, 4.856479644775391, 6.446900844573975, 8.037321090698242, 9.627742767333984, 11.21816349029541, 12.808584213256836, 14.399004936218262, 15.989425659179688, 17.57984733581543, 19.17026710510254, 20.76068878173828, 22.35110855102539, 23.941530227661133, 25.531951904296875, 27.122371673583984, 28.712793350219727, 30.303213119506836, 31.893634796142578, 33.48405456542969, 35.0744743347168, 36.66489791870117, 38.25531768798828, 39.84573745727539, 41.4361572265625, 43.026580810546875, 44.617000579833984, 46.207420349121094, 47.7978401184082, 49.38826370239258, 50.97868347167969, 52.56910705566406, 54.15952682495117, 55.74995040893555, 57.340370178222656, 58.930789947509766, 60.521209716796875, 62.11163330078125, 63.70205307006836, 65.29247283935547, 66.88289642333984, 68.47331237792969, 70.06373596191406, 71.65415954589844, 73.24457550048828, 74.83499908447266, 76.4254150390625, 78.01583862304688]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 15.0, 12.0, 16.0, 20.0, 19.0, 22.0, 23.0, 27.0, 26.0, 34.0, 33.0, 38.0, 35.0, 40.0, 36.0, 54.0, 47.0, 44.0, 56.0, 41.0, 39.0, 37.0, 38.0, 36.0, 37.0, 27.0, 22.0, 19.0, 15.0, 16.0, 17.0, 14.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.140039443969727, -11.767104148864746, -11.394168853759766, -11.021232604980469, -10.648297309875488, -10.275362014770508, -9.902426719665527, -9.529491424560547, -9.15655517578125, -8.78361988067627, -8.410684585571289, -8.037748336791992, -7.664813041687012, -7.291877746582031, -6.918942451477051, -6.54600715637207, -6.17307186126709, -5.800136566162109, -5.427200794219971, -5.05426549911499, -4.681329727172852, -4.308394432067871, -3.9354591369628906, -3.562523603439331, -3.1895880699157715, -2.816652536392212, -2.4437170028686523, -2.070781707763672, -1.6978461742401123, -1.3249106407165527, -0.9519753456115723, -0.5790398120880127, -0.20610427856445312, 0.16683119535446167, 0.5397666692733765, 0.9127020835876465, 1.285637617111206, 1.6585731506347656, 2.031508445739746, 2.4044439792633057, 2.7773795127868652, 3.150315046310425, 3.5232505798339844, 3.896185874938965, 4.269121170043945, 4.642056941986084, 5.0149922370910645, 5.387928009033203, 5.760863304138184, 6.133798599243164, 6.506734371185303, 6.879669666290283, 7.252605438232422, 7.625540733337402, 7.998476028442383, 8.371411323547363, 8.744346618652344, 9.117281913757324, 9.490217208862305, 9.863153457641602, 10.236088752746582, 10.609024047851562, 10.981959342956543, 11.354894638061523, 11.72783088684082]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 5.0, 4.0, 8.0, 15.0, 31.0, 64.0, 91.0, 176.0, 367.0, 922.0, 3153.0, 19525.0, 3704030.0, 450623.0, 11423.0, 2401.0, 702.0, 315.0, 162.0, 96.0, 49.0, 40.0, 20.0, 12.0, 11.0, 7.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.837005615234375, -3.69940185546875, -3.561798095703125, -3.4241943359375, -3.286590576171875, -3.14898681640625, -3.011383056640625, -2.873779296875, -2.736175537109375, -2.59857177734375, -2.460968017578125, -2.3233642578125, -2.185760498046875, -2.04815673828125, -1.910552978515625, -1.77294921875, -1.635345458984375, -1.49774169921875, -1.360137939453125, -1.2225341796875, -1.084930419921875, -0.94732666015625, -0.809722900390625, -0.672119140625, -0.534515380859375, -0.39691162109375, -0.259307861328125, -0.1217041015625, 0.015899658203125, 0.15350341796875, 0.291107177734375, 0.4287109375, 0.566314697265625, 0.70391845703125, 0.841522216796875, 0.9791259765625, 1.116729736328125, 1.25433349609375, 1.391937255859375, 1.529541015625, 1.667144775390625, 1.80474853515625, 1.942352294921875, 2.0799560546875, 2.217559814453125, 2.35516357421875, 2.492767333984375, 2.63037109375, 2.767974853515625, 2.90557861328125, 3.043182373046875, 3.1807861328125, 3.318389892578125, 3.45599365234375, 3.593597412109375, 3.731201171875, 3.868804931640625, 4.00640869140625, 4.144012451171875, 4.2816162109375, 4.419219970703125, 4.55682373046875, 4.694427490234375, 4.83203125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 9.0, 17.0, 24.0, 43.0, 64.0, 94.0, 127.0, 134.0, 153.0, 111.0, 77.0, 68.0, 45.0, 13.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.0091400146484375, -0.975311279296875, -0.9414825439453125, -0.90765380859375, -0.8738250732421875, -0.839996337890625, -0.8061676025390625, -0.7723388671875, -0.7385101318359375, -0.704681396484375, -0.6708526611328125, -0.63702392578125, -0.6031951904296875, -0.569366455078125, -0.5355377197265625, -0.501708984375, -0.4678802490234375, -0.434051513671875, -0.4002227783203125, -0.36639404296875, -0.3325653076171875, -0.298736572265625, -0.2649078369140625, -0.2310791015625, -0.1972503662109375, -0.163421630859375, -0.1295928955078125, -0.09576416015625, -0.0619354248046875, -0.028106689453125, 0.0057220458984375, 0.03955078125, 0.0733795166015625, 0.107208251953125, 0.1410369873046875, 0.17486572265625, 0.2086944580078125, 0.242523193359375, 0.2763519287109375, 0.3101806640625, 0.3440093994140625, 0.377838134765625, 0.4116668701171875, 0.44549560546875, 0.4793243408203125, 0.513153076171875, 0.5469818115234375, 0.580810546875, 0.6146392822265625, 0.648468017578125, 0.6822967529296875, 0.71612548828125, 0.7499542236328125, 0.783782958984375, 0.8176116943359375, 0.8514404296875, 0.8852691650390625, 0.919097900390625, 0.9529266357421875, 0.98675537109375, 1.0205841064453125, 1.054412841796875, 1.0882415771484375, 1.1220703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 15.0, 17.0, 22.0, 35.0, 71.0, 157.0, 335.0, 933.0, 3293.0, 17282.0, 302208.0, 3772034.0, 85292.0, 8825.0, 2281.0, 809.0, 330.0, 145.0, 61.0, 35.0, 17.0, 11.0, 12.0, 9.0, 4.0, 7.0, 4.0, 4.0, 9.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.3577880859375, -2.280029296875, -2.2022705078125, -2.12451171875, -2.0467529296875, -1.968994140625, -1.8912353515625, -1.8134765625, -1.7357177734375, -1.657958984375, -1.5802001953125, -1.50244140625, -1.4246826171875, -1.346923828125, -1.2691650390625, -1.19140625, -1.1136474609375, -1.035888671875, -0.9581298828125, -0.88037109375, -0.8026123046875, -0.724853515625, -0.6470947265625, -0.5693359375, -0.4915771484375, -0.413818359375, -0.3360595703125, -0.25830078125, -0.1805419921875, -0.102783203125, -0.0250244140625, 0.052734375, 0.1304931640625, 0.208251953125, 0.2860107421875, 0.36376953125, 0.4415283203125, 0.519287109375, 0.5970458984375, 0.6748046875, 0.7525634765625, 0.830322265625, 0.9080810546875, 0.98583984375, 1.0635986328125, 1.141357421875, 1.2191162109375, 1.296875, 1.3746337890625, 1.452392578125, 1.5301513671875, 1.60791015625, 1.6856689453125, 1.763427734375, 1.8411865234375, 1.9189453125, 1.9967041015625, 2.074462890625, 2.1522216796875, 2.22998046875, 2.3077392578125, 2.385498046875, 2.4632568359375, 2.541015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 19.0, 24.0, 43.0, 75.0, 141.0, 219.0, 640.0, 1587.0, 688.0, 256.0, 137.0, 75.0, 41.0, 34.0, 12.0, 17.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48798370361328125, -0.4696197509765625, -0.45125579833984375, -0.432891845703125, -0.41452789306640625, -0.3961639404296875, -0.37779998779296875, -0.35943603515625, -0.34107208251953125, -0.3227081298828125, -0.30434417724609375, -0.285980224609375, -0.26761627197265625, -0.2492523193359375, -0.23088836669921875, -0.2125244140625, -0.19416046142578125, -0.1757965087890625, -0.15743255615234375, -0.139068603515625, -0.12070465087890625, -0.1023406982421875, -0.08397674560546875, -0.06561279296875, -0.04724884033203125, -0.0288848876953125, -0.01052093505859375, 0.007843017578125, 0.02620697021484375, 0.0445709228515625, 0.06293487548828125, 0.081298828125, 0.09966278076171875, 0.1180267333984375, 0.13639068603515625, 0.154754638671875, 0.17311859130859375, 0.1914825439453125, 0.20984649658203125, 0.22821044921875, 0.24657440185546875, 0.2649383544921875, 0.28330230712890625, 0.301666259765625, 0.32003021240234375, 0.3383941650390625, 0.35675811767578125, 0.3751220703125, 0.39348602294921875, 0.4118499755859375, 0.43021392822265625, 0.448577880859375, 0.46694183349609375, 0.4853057861328125, 0.5036697387695312, 0.52203369140625, 0.5403976440429688, 0.5587615966796875, 0.5771255493164062, 0.595489501953125, 0.6138534545898438, 0.6322174072265625, 0.6505813598632812, 0.6689453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 16.0, 61.0, 149.0, 252.0, 271.0, 161.0, 57.0, 19.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8399262428283691, -1.6879849433898926, -1.5360437631607056, -1.3841025829315186, -1.232161283493042, -1.0802199840545654, -0.9282788038253784, -0.7763376235961914, -0.6243963241577148, -0.47245508432388306, -0.32051384449005127, -0.16857260465621948, -0.016631364822387695, 0.1353098750114441, 0.2872511148452759, 0.4391922950744629, 0.5911335945129395, 0.7430748343467712, 0.895016074180603, 1.04695725440979, 1.1988985538482666, 1.3508398532867432, 1.5027810335159302, 1.6547222137451172, 1.8066635131835938, 1.9586048126220703, 2.110546112060547, 2.2624871730804443, 2.414428472518921, 2.5663697719573975, 2.718310832977295, 2.8702521324157715, 3.02219295501709, 3.1741342544555664, 3.326075553894043, 3.4780166149139404, 3.629957914352417, 3.7818992137908936, 3.933840274810791, 4.085781574249268, 4.237722873687744, 4.389664173126221, 4.541605472564697, 4.693546772003174, 4.845487594604492, 4.997428894042969, 5.149370193481445, 5.301311492919922, 5.453252792358398, 5.605194091796875, 5.757135391235352, 5.909076690673828, 6.061017990112305, 6.212958812713623, 6.3649001121521, 6.516841411590576, 6.668782711029053, 6.820724010467529, 6.972665309906006, 7.124606609344482, 7.276547431945801, 7.428488731384277, 7.580430030822754, 7.7323713302612305, 7.884312629699707]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 6.0, 6.0, 4.0, 6.0, 9.0, 7.0, 12.0, 12.0, 8.0, 22.0, 31.0, 25.0, 39.0, 34.0, 46.0, 39.0, 46.0, 40.0, 32.0, 55.0, 47.0, 39.0, 49.0, 41.0, 46.0, 44.0, 29.0, 32.0, 33.0, 21.0, 23.0, 22.0, 13.0, 11.0, 12.0, 13.0, 12.0, 6.0, 11.0, 8.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4630053043365479, -1.4120441675186157, -1.361082911491394, -1.310121774673462, -1.2591606378555298, -1.2081995010375977, -1.157238245010376, -1.1062771081924438, -1.0553159713745117, -1.0043548345565796, -0.9533936381340027, -0.9024324417114258, -0.8514713048934937, -0.8005101084709167, -0.7495489120483398, -0.6985877752304077, -0.647626519203186, -0.5966653227806091, -0.545704185962677, -0.4947429895401001, -0.4437818229198456, -0.39282065629959106, -0.34185945987701416, -0.29089829325675964, -0.23993712663650513, -0.1889759600162506, -0.1380147784948349, -0.08705359697341919, -0.03609243035316467, 0.014868736267089844, 0.06582993268966675, 0.11679109930992126, 0.16775226593017578, 0.2187134325504303, 0.2696745991706848, 0.3206357955932617, 0.37159696221351624, 0.42255812883377075, 0.47351932525634766, 0.5244804620742798, 0.5754416584968567, 0.6264028549194336, 0.6773639917373657, 0.7283251881599426, 0.7792863845825195, 0.8302475214004517, 0.8812087178230286, 0.9321699142456055, 0.9831310510635376, 1.0340921878814697, 1.0850534439086914, 1.1360145807266235, 1.1869757175445557, 1.2379369735717773, 1.2888981103897095, 1.3398592472076416, 1.3908205032348633, 1.4417816400527954, 1.492742896080017, 1.5437040328979492, 1.5946651697158813, 1.6456263065338135, 1.6965875625610352, 1.7475486993789673, 1.7985098361968994]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 23.0, 39.0, 62.0, 83.0, 190.0, 338.0, 703.0, 1517.0, 4756.0, 29963.0, 413017.0, 546546.0, 42016.0, 6015.0, 1727.0, 737.0, 347.0, 204.0, 114.0, 67.0, 28.0, 18.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.20703125, -3.10382080078125, -3.0006103515625, -2.89739990234375, -2.794189453125, -2.69097900390625, -2.5877685546875, -2.48455810546875, -2.38134765625, -2.27813720703125, -2.1749267578125, -2.07171630859375, -1.968505859375, -1.86529541015625, -1.7620849609375, -1.65887451171875, -1.5556640625, -1.45245361328125, -1.3492431640625, -1.24603271484375, -1.142822265625, -1.03961181640625, -0.9364013671875, -0.83319091796875, -0.72998046875, -0.62677001953125, -0.5235595703125, -0.42034912109375, -0.317138671875, -0.21392822265625, -0.1107177734375, -0.00750732421875, 0.095703125, 0.19891357421875, 0.3021240234375, 0.40533447265625, 0.508544921875, 0.61175537109375, 0.7149658203125, 0.81817626953125, 0.92138671875, 1.02459716796875, 1.1278076171875, 1.23101806640625, 1.334228515625, 1.43743896484375, 1.5406494140625, 1.64385986328125, 1.7470703125, 1.85028076171875, 1.9534912109375, 2.05670166015625, 2.159912109375, 2.26312255859375, 2.3663330078125, 2.46954345703125, 2.57275390625, 2.67596435546875, 2.7791748046875, 2.88238525390625, 2.985595703125, 3.08880615234375, 3.1920166015625, 3.29522705078125, 3.3984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 21.0, 25.0, 42.0, 55.0, 85.0, 125.0, 132.0, 156.0, 110.0, 77.0, 79.0, 45.0, 16.0, 11.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.994140625, -0.9609375, -0.927734375, -0.89453125, -0.861328125, -0.828125, -0.794921875, -0.76171875, -0.728515625, -0.6953125, -0.662109375, -0.62890625, -0.595703125, -0.5625, -0.529296875, -0.49609375, -0.462890625, -0.4296875, -0.396484375, -0.36328125, -0.330078125, -0.296875, -0.263671875, -0.23046875, -0.197265625, -0.1640625, -0.130859375, -0.09765625, -0.064453125, -0.03125, 0.001953125, 0.03515625, 0.068359375, 0.1015625, 0.134765625, 0.16796875, 0.201171875, 0.234375, 0.267578125, 0.30078125, 0.333984375, 0.3671875, 0.400390625, 0.43359375, 0.466796875, 0.5, 0.533203125, 0.56640625, 0.599609375, 0.6328125, 0.666015625, 0.69921875, 0.732421875, 0.765625, 0.798828125, 0.83203125, 0.865234375, 0.8984375, 0.931640625, 0.96484375, 0.998046875, 1.03125, 1.064453125, 1.09765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 16.0, 22.0, 24.0, 45.0, 33.0, 64.0, 80.0, 116.0, 139.0, 178.0, 264.0, 403.0, 512.0, 886.0, 1672.0, 4154.0, 13835.0, 66447.0, 320884.0, 467716.0, 133374.0, 25324.0, 6444.0, 2381.0, 1136.0, 676.0, 471.0, 295.0, 238.0, 143.0, 122.0, 105.0, 77.0, 52.0, 49.0, 20.0, 31.0, 29.0, 16.0, 8.0, 15.0, 8.0, 2.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.90625, -1.848846435546875, -1.79144287109375, -1.734039306640625, -1.6766357421875, -1.619232177734375, -1.56182861328125, -1.504425048828125, -1.447021484375, -1.389617919921875, -1.33221435546875, -1.274810791015625, -1.2174072265625, -1.160003662109375, -1.10260009765625, -1.045196533203125, -0.98779296875, -0.930389404296875, -0.87298583984375, -0.815582275390625, -0.7581787109375, -0.700775146484375, -0.64337158203125, -0.585968017578125, -0.528564453125, -0.471160888671875, -0.41375732421875, -0.356353759765625, -0.2989501953125, -0.241546630859375, -0.18414306640625, -0.126739501953125, -0.0693359375, -0.011932373046875, 0.04547119140625, 0.102874755859375, 0.1602783203125, 0.217681884765625, 0.27508544921875, 0.332489013671875, 0.389892578125, 0.447296142578125, 0.50469970703125, 0.562103271484375, 0.6195068359375, 0.676910400390625, 0.73431396484375, 0.791717529296875, 0.84912109375, 0.906524658203125, 0.96392822265625, 1.021331787109375, 1.0787353515625, 1.136138916015625, 1.19354248046875, 1.250946044921875, 1.308349609375, 1.365753173828125, 1.42315673828125, 1.480560302734375, 1.5379638671875, 1.595367431640625, 1.65277099609375, 1.710174560546875, 1.767578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 13.0, 23.0, 10.0, 17.0, 26.0, 22.0, 24.0, 42.0, 28.0, 39.0, 48.0, 56.0, 43.0, 47.0, 49.0, 52.0, 46.0, 44.0, 33.0, 37.0, 33.0, 27.0, 31.0, 34.0, 25.0, 19.0, 14.0, 18.0, 12.0, 15.0, 7.0, 7.0, 6.0, 8.0, 6.0, 2.0, 2.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.171875, -2.1069183349609375, -2.041961669921875, -1.9770050048828125, -1.91204833984375, -1.8470916748046875, -1.782135009765625, -1.7171783447265625, -1.6522216796875, -1.5872650146484375, -1.522308349609375, -1.4573516845703125, -1.39239501953125, -1.3274383544921875, -1.262481689453125, -1.1975250244140625, -1.132568359375, -1.0676116943359375, -1.002655029296875, -0.9376983642578125, -0.87274169921875, -0.8077850341796875, -0.742828369140625, -0.6778717041015625, -0.6129150390625, -0.5479583740234375, -0.483001708984375, -0.4180450439453125, -0.35308837890625, -0.2881317138671875, -0.223175048828125, -0.1582183837890625, -0.09326171875, -0.0283050537109375, 0.036651611328125, 0.1016082763671875, 0.16656494140625, 0.2315216064453125, 0.296478271484375, 0.3614349365234375, 0.4263916015625, 0.4913482666015625, 0.556304931640625, 0.6212615966796875, 0.68621826171875, 0.7511749267578125, 0.816131591796875, 0.8810882568359375, 0.946044921875, 1.0110015869140625, 1.075958251953125, 1.1409149169921875, 1.20587158203125, 1.2708282470703125, 1.335784912109375, 1.4007415771484375, 1.4656982421875, 1.5306549072265625, 1.595611572265625, 1.6605682373046875, 1.72552490234375, 1.7904815673828125, 1.855438232421875, 1.9203948974609375, 1.9853515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 6.0, 9.0, 10.0, 13.0, 31.0, 41.0, 72.0, 94.0, 148.0, 296.0, 511.0, 1030.0, 2187.0, 5486.0, 18297.0, 84287.0, 421199.0, 406973.0, 80408.0, 17666.0, 5547.0, 2064.0, 894.0, 498.0, 273.0, 158.0, 121.0, 70.0, 46.0, 24.0, 24.0, 21.0, 12.0, 12.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4755859375, -0.4579620361328125, -0.440338134765625, -0.4227142333984375, -0.40509033203125, -0.3874664306640625, -0.369842529296875, -0.3522186279296875, -0.3345947265625, -0.3169708251953125, -0.299346923828125, -0.2817230224609375, -0.26409912109375, -0.2464752197265625, -0.228851318359375, -0.2112274169921875, -0.193603515625, -0.1759796142578125, -0.158355712890625, -0.1407318115234375, -0.12310791015625, -0.1054840087890625, -0.087860107421875, -0.0702362060546875, -0.0526123046875, -0.0349884033203125, -0.017364501953125, 0.0002593994140625, 0.01788330078125, 0.0355072021484375, 0.053131103515625, 0.0707550048828125, 0.08837890625, 0.1060028076171875, 0.123626708984375, 0.1412506103515625, 0.15887451171875, 0.1764984130859375, 0.194122314453125, 0.2117462158203125, 0.2293701171875, 0.2469940185546875, 0.264617919921875, 0.2822418212890625, 0.29986572265625, 0.3174896240234375, 0.335113525390625, 0.3527374267578125, 0.370361328125, 0.3879852294921875, 0.405609130859375, 0.4232330322265625, 0.44085693359375, 0.4584808349609375, 0.476104736328125, 0.4937286376953125, 0.5113525390625, 0.5289764404296875, 0.546600341796875, 0.5642242431640625, 0.58184814453125, 0.5994720458984375, 0.617095947265625, 0.6347198486328125, 0.65234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 8.0, 1.0, 6.0, 1.0, 13.0, 15.0, 11.0, 18.0, 7.0, 21.0, 24.0, 29.0, 27.0, 30.0, 71.0, 72.0, 79.0, 87.0, 107.0, 66.0, 60.0, 48.0, 39.0, 29.0, 25.0, 20.0, 14.0, 19.0, 11.0, 5.0, 8.0, 8.0, 8.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011491775512695312, -0.0001110658049583435, -0.00010721385478973389, -0.00010336190462112427, -9.950995445251465e-05, -9.565800428390503e-05, -9.180605411529541e-05, -8.795410394668579e-05, -8.410215377807617e-05, -8.025020360946655e-05, -7.639825344085693e-05, -7.254630327224731e-05, -6.86943531036377e-05, -6.484240293502808e-05, -6.099045276641846e-05, -5.713850259780884e-05, -5.328655242919922e-05, -4.94346022605896e-05, -4.558265209197998e-05, -4.173070192337036e-05, -3.787875175476074e-05, -3.402680158615112e-05, -3.0174851417541504e-05, -2.6322901248931885e-05, -2.2470951080322266e-05, -1.8619000911712646e-05, -1.4767050743103027e-05, -1.0915100574493408e-05, -7.063150405883789e-06, -3.21120023727417e-06, 6.407499313354492e-07, 4.492700099945068e-06, 8.344650268554688e-06, 1.2196600437164307e-05, 1.6048550605773926e-05, 1.9900500774383545e-05, 2.3752450942993164e-05, 2.7604401111602783e-05, 3.14563512802124e-05, 3.530830144882202e-05, 3.916025161743164e-05, 4.301220178604126e-05, 4.686415195465088e-05, 5.07161021232605e-05, 5.456805229187012e-05, 5.8420002460479736e-05, 6.227195262908936e-05, 6.612390279769897e-05, 6.99758529663086e-05, 7.382780313491821e-05, 7.767975330352783e-05, 8.153170347213745e-05, 8.538365364074707e-05, 8.923560380935669e-05, 9.308755397796631e-05, 9.693950414657593e-05, 0.00010079145431518555, 0.00010464340448379517, 0.00010849535465240479, 0.0001123473048210144, 0.00011619925498962402, 0.00012005120515823364, 0.00012390315532684326, 0.00012775510549545288, 0.0001316070556640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 10.0, 22.0, 38.0, 61.0, 71.0, 105.0, 167.0, 315.0, 561.0, 1146.0, 2699.0, 8680.0, 42277.0, 330276.0, 553629.0, 87291.0, 14319.0, 3758.0, 1445.0, 689.0, 360.0, 217.0, 132.0, 88.0, 60.0, 47.0, 29.0, 16.0, 11.0, 8.0, 9.0, 0.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4921875, -0.4726409912109375, -0.453094482421875, -0.4335479736328125, -0.41400146484375, -0.3944549560546875, -0.374908447265625, -0.3553619384765625, -0.3358154296875, -0.3162689208984375, -0.296722412109375, -0.2771759033203125, -0.25762939453125, -0.2380828857421875, -0.218536376953125, -0.1989898681640625, -0.179443359375, -0.1598968505859375, -0.140350341796875, -0.1208038330078125, -0.10125732421875, -0.0817108154296875, -0.062164306640625, -0.0426177978515625, -0.0230712890625, -0.0035247802734375, 0.016021728515625, 0.0355682373046875, 0.05511474609375, 0.0746612548828125, 0.094207763671875, 0.1137542724609375, 0.13330078125, 0.1528472900390625, 0.172393798828125, 0.1919403076171875, 0.21148681640625, 0.2310333251953125, 0.250579833984375, 0.2701263427734375, 0.2896728515625, 0.3092193603515625, 0.328765869140625, 0.3483123779296875, 0.36785888671875, 0.3874053955078125, 0.406951904296875, 0.4264984130859375, 0.446044921875, 0.4655914306640625, 0.485137939453125, 0.5046844482421875, 0.52423095703125, 0.5437774658203125, 0.563323974609375, 0.5828704833984375, 0.6024169921875, 0.6219635009765625, 0.641510009765625, 0.6610565185546875, 0.68060302734375, 0.7001495361328125, 0.719696044921875, 0.7392425537109375, 0.7587890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 17.0, 14.0, 24.0, 36.0, 31.0, 43.0, 58.0, 70.0, 76.0, 70.0, 84.0, 83.0, 75.0, 59.0, 56.0, 42.0, 41.0, 30.0, 24.0, 16.0, 11.0, 5.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45263671875, -0.4362335205078125, -0.419830322265625, -0.4034271240234375, -0.38702392578125, -0.3706207275390625, -0.354217529296875, -0.3378143310546875, -0.3214111328125, -0.3050079345703125, -0.288604736328125, -0.2722015380859375, -0.25579833984375, -0.2393951416015625, -0.222991943359375, -0.2065887451171875, -0.190185546875, -0.1737823486328125, -0.157379150390625, -0.1409759521484375, -0.12457275390625, -0.1081695556640625, -0.091766357421875, -0.0753631591796875, -0.0589599609375, -0.0425567626953125, -0.026153564453125, -0.0097503662109375, 0.00665283203125, 0.0230560302734375, 0.039459228515625, 0.0558624267578125, 0.072265625, 0.0886688232421875, 0.105072021484375, 0.1214752197265625, 0.13787841796875, 0.1542816162109375, 0.170684814453125, 0.1870880126953125, 0.2034912109375, 0.2198944091796875, 0.236297607421875, 0.2527008056640625, 0.26910400390625, 0.2855072021484375, 0.301910400390625, 0.3183135986328125, 0.334716796875, 0.3511199951171875, 0.367523193359375, 0.3839263916015625, 0.40032958984375, 0.4167327880859375, 0.433135986328125, 0.4495391845703125, 0.4659423828125, 0.4823455810546875, 0.498748779296875, 0.5151519775390625, 0.53155517578125, 0.5479583740234375, 0.564361572265625, 0.5807647705078125, 0.59716796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 10.0, 26.0, 43.0, 102.0, 183.0, 226.0, 203.0, 110.0, 47.0, 30.0, 13.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796490669250488, -9.27469539642334, -8.752901077270508, -8.23110580444336, -7.709310531616211, -7.1875152587890625, -6.665720462799072, -6.143925666809082, -5.622130393981934, -5.100335121154785, -4.578540325164795, -4.056745529174805, -3.5349502563476562, -3.013155221939087, -2.4913601875305176, -1.9695651531219482, -1.447770118713379, -0.9259750843048096, -0.40418004989624023, 0.1176149845123291, 0.6394100189208984, 1.1612050533294678, 1.683000087738037, 2.2047951221466064, 2.726590156555176, 3.248385190963745, 3.7701802253723145, 4.291975021362305, 4.813770294189453, 5.335565567016602, 5.857360363006592, 6.379155158996582, 6.900949478149414, 7.4227447509765625, 7.944539546966553, 8.466334342956543, 8.988129615783691, 9.50992488861084, 10.031719207763672, 10.55351448059082, 11.075309753417969, 11.597105026245117, 12.118900299072266, 12.640694618225098, 13.162489891052246, 13.684285163879395, 14.206079483032227, 14.727874755859375, 15.249670028686523, 15.771465301513672, 16.29326057434082, 16.81505584716797, 17.336849212646484, 17.858644485473633, 18.38043975830078, 18.90223503112793, 19.424030303955078, 19.945825576782227, 20.467620849609375, 20.989416122436523, 21.511211395263672, 22.033004760742188, 22.554800033569336, 23.076595306396484, 23.598390579223633]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 6.0, 11.0, 13.0, 16.0, 18.0, 27.0, 26.0, 37.0, 41.0, 46.0, 72.0, 53.0, 73.0, 59.0, 86.0, 68.0, 64.0, 59.0, 55.0, 43.0, 41.0, 23.0, 13.0, 10.0, 8.0, 6.0, 7.0, 8.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.31768035888672, -16.80611228942871, -16.294544219970703, -15.782975196838379, -15.271406173706055, -14.759838104248047, -14.248270034790039, -13.736701965332031, -13.225132942199707, -12.7135648727417, -12.201995849609375, -11.690427780151367, -11.17885971069336, -10.667290687561035, -10.155722618103027, -9.644153594970703, -9.132585525512695, -8.621017456054688, -8.109448432922363, -7.5978803634643555, -7.0863118171691895, -6.574743270874023, -6.063175201416016, -5.55160665512085, -5.040038108825684, -4.528469562530518, -4.016901016235352, -3.5053329467773438, -2.9937644004821777, -2.4821958541870117, -1.9706275463104248, -1.459059238433838, -0.9474906921386719, -0.4359222650527954, 0.07564616203308105, 0.5872145891189575, 1.098783016204834, 1.6103515625, 2.121919870376587, 2.633488178253174, 3.14505672454834, 3.656625270843506, 4.168193817138672, 4.67976188659668, 5.191330432891846, 5.702898979187012, 6.2144670486450195, 6.7260355949401855, 7.237604141235352, 7.749172687530518, 8.260741233825684, 8.772309303283691, 9.283878326416016, 9.795446395874023, 10.307014465332031, 10.818582534790039, 11.330151557922363, 11.841719627380371, 12.353288650512695, 12.864856719970703, 13.376424789428711, 13.887993812561035, 14.399561882019043, 14.911130905151367, 15.422698974609375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 10.0, 17.0, 27.0, 43.0, 100.0, 154.0, 334.0, 757.0, 2078.0, 9767.0, 147174.0, 3959475.0, 64609.0, 6549.0, 1826.0, 685.0, 297.0, 140.0, 85.0, 41.0, 30.0, 16.0, 19.0, 12.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.8914794921875, -3.763427734375, -3.6353759765625, -3.50732421875, -3.3792724609375, -3.251220703125, -3.1231689453125, -2.9951171875, -2.8670654296875, -2.739013671875, -2.6109619140625, -2.48291015625, -2.3548583984375, -2.226806640625, -2.0987548828125, -1.970703125, -1.8426513671875, -1.714599609375, -1.5865478515625, -1.45849609375, -1.3304443359375, -1.202392578125, -1.0743408203125, -0.9462890625, -0.8182373046875, -0.690185546875, -0.5621337890625, -0.43408203125, -0.3060302734375, -0.177978515625, -0.0499267578125, 0.078125, 0.2061767578125, 0.334228515625, 0.4622802734375, 0.59033203125, 0.7183837890625, 0.846435546875, 0.9744873046875, 1.1025390625, 1.2305908203125, 1.358642578125, 1.4866943359375, 1.61474609375, 1.7427978515625, 1.870849609375, 1.9989013671875, 2.126953125, 2.2550048828125, 2.383056640625, 2.5111083984375, 2.63916015625, 2.7672119140625, 2.895263671875, 3.0233154296875, 3.1513671875, 3.2794189453125, 3.407470703125, 3.5355224609375, 3.66357421875, 3.7916259765625, 3.919677734375, 4.0477294921875, 4.17578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 11.0, 16.0, 30.0, 49.0, 57.0, 91.0, 140.0, 131.0, 139.0, 101.0, 82.0, 72.0, 37.0, 15.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.0478057861328125, -1.012603759765625, -0.9774017333984375, -0.94219970703125, -0.9069976806640625, -0.871795654296875, -0.8365936279296875, -0.8013916015625, -0.7661895751953125, -0.730987548828125, -0.6957855224609375, -0.66058349609375, -0.6253814697265625, -0.590179443359375, -0.5549774169921875, -0.519775390625, -0.4845733642578125, -0.449371337890625, -0.4141693115234375, -0.37896728515625, -0.3437652587890625, -0.308563232421875, -0.2733612060546875, -0.2381591796875, -0.2029571533203125, -0.167755126953125, -0.1325531005859375, -0.09735107421875, -0.0621490478515625, -0.026947021484375, 0.0082550048828125, 0.04345703125, 0.0786590576171875, 0.113861083984375, 0.1490631103515625, 0.18426513671875, 0.2194671630859375, 0.254669189453125, 0.2898712158203125, 0.3250732421875, 0.3602752685546875, 0.395477294921875, 0.4306793212890625, 0.46588134765625, 0.5010833740234375, 0.536285400390625, 0.5714874267578125, 0.606689453125, 0.6418914794921875, 0.677093505859375, 0.7122955322265625, 0.74749755859375, 0.7826995849609375, 0.817901611328125, 0.8531036376953125, 0.8883056640625, 0.9235076904296875, 0.958709716796875, 0.9939117431640625, 1.02911376953125, 1.0643157958984375, 1.099517822265625, 1.1347198486328125, 1.169921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 12.0, 16.0, 14.0, 24.0, 36.0, 58.0, 108.0, 154.0, 246.0, 448.0, 802.0, 1857.0, 5528.0, 30972.0, 920837.0, 3160507.0, 59855.0, 8360.0, 2339.0, 947.0, 488.0, 247.0, 132.0, 106.0, 44.0, 33.0, 21.0, 25.0, 14.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34375, -2.265960693359375, -2.18817138671875, -2.110382080078125, -2.0325927734375, -1.954803466796875, -1.87701416015625, -1.799224853515625, -1.721435546875, -1.643646240234375, -1.56585693359375, -1.488067626953125, -1.4102783203125, -1.332489013671875, -1.25469970703125, -1.176910400390625, -1.09912109375, -1.021331787109375, -0.94354248046875, -0.865753173828125, -0.7879638671875, -0.710174560546875, -0.63238525390625, -0.554595947265625, -0.476806640625, -0.399017333984375, -0.32122802734375, -0.243438720703125, -0.1656494140625, -0.087860107421875, -0.01007080078125, 0.067718505859375, 0.1455078125, 0.223297119140625, 0.30108642578125, 0.378875732421875, 0.4566650390625, 0.534454345703125, 0.61224365234375, 0.690032958984375, 0.767822265625, 0.845611572265625, 0.92340087890625, 1.001190185546875, 1.0789794921875, 1.156768798828125, 1.23455810546875, 1.312347412109375, 1.39013671875, 1.467926025390625, 1.54571533203125, 1.623504638671875, 1.7012939453125, 1.779083251953125, 1.85687255859375, 1.934661865234375, 2.012451171875, 2.090240478515625, 2.16802978515625, 2.245819091796875, 2.3236083984375, 2.401397705078125, 2.47918701171875, 2.556976318359375, 2.634765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 8.0, 9.0, 15.0, 25.0, 45.0, 109.0, 243.0, 744.0, 1863.0, 598.0, 213.0, 87.0, 42.0, 27.0, 20.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5771484375, -1.532623291015625, -1.48809814453125, -1.443572998046875, -1.3990478515625, -1.354522705078125, -1.30999755859375, -1.265472412109375, -1.220947265625, -1.176422119140625, -1.13189697265625, -1.087371826171875, -1.0428466796875, -0.998321533203125, -0.95379638671875, -0.909271240234375, -0.86474609375, -0.820220947265625, -0.77569580078125, -0.731170654296875, -0.6866455078125, -0.642120361328125, -0.59759521484375, -0.553070068359375, -0.508544921875, -0.464019775390625, -0.41949462890625, -0.374969482421875, -0.3304443359375, -0.285919189453125, -0.24139404296875, -0.196868896484375, -0.15234375, -0.107818603515625, -0.06329345703125, -0.018768310546875, 0.0257568359375, 0.070281982421875, 0.11480712890625, 0.159332275390625, 0.203857421875, 0.248382568359375, 0.29290771484375, 0.337432861328125, 0.3819580078125, 0.426483154296875, 0.47100830078125, 0.515533447265625, 0.56005859375, 0.604583740234375, 0.64910888671875, 0.693634033203125, 0.7381591796875, 0.782684326171875, 0.82720947265625, 0.871734619140625, 0.916259765625, 0.960784912109375, 1.00531005859375, 1.049835205078125, 1.0943603515625, 1.138885498046875, 1.18341064453125, 1.227935791015625, 1.2724609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 11.0, 14.0, 46.0, 105.0, 154.0, 240.0, 182.0, 121.0, 58.0, 30.0, 10.0, 9.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.393188953399658, -3.2116799354553223, -3.0301706790924072, -2.848661422729492, -2.6671524047851562, -2.4856433868408203, -2.3041341304779053, -2.1226248741149902, -1.9411158561706543, -1.7596067190170288, -1.5780975818634033, -1.3965884447097778, -1.2150793075561523, -1.0335701704025269, -0.8520610332489014, -0.6705518960952759, -0.4890427589416504, -0.3075336217880249, -0.12602448463439941, 0.055484652519226074, 0.23699378967285156, 0.41850292682647705, 0.6000120639801025, 0.781521201133728, 0.9630303382873535, 1.144539475440979, 1.3260486125946045, 1.50755774974823, 1.6890668869018555, 1.870576024055481, 2.0520851612091064, 2.2335944175720215, 2.4151039123535156, 2.5966129302978516, 2.7781221866607666, 2.9596314430236816, 3.1411404609680176, 3.3226494789123535, 3.5041587352752686, 3.6856679916381836, 3.8671770095825195, 4.0486860275268555, 4.230195045471191, 4.4117045402526855, 4.5932135581970215, 4.774722576141357, 4.956232070922852, 5.1377410888671875, 5.319250106811523, 5.500759124755859, 5.682268142700195, 5.8637776374816895, 6.045286655426025, 6.226795673370361, 6.4083051681518555, 6.589814186096191, 6.771323204040527, 6.952832221984863, 7.134341239929199, 7.315850734710693, 7.497359752655029, 7.678868770599365, 7.860378265380859, 8.041887283325195, 8.223396301269531]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 16.0, 18.0, 19.0, 30.0, 42.0, 55.0, 51.0, 61.0, 90.0, 91.0, 78.0, 86.0, 74.0, 50.0, 48.0, 46.0, 35.0, 34.0, 26.0, 20.0, 4.0, 4.0, 5.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-7.319561958312988, -7.157339572906494, -6.9951171875, -6.832894802093506, -6.670672416687012, -6.508449554443359, -6.346227645874023, -6.184004783630371, -6.021782398223877, -5.859560012817383, -5.697337627410889, -5.5351152420043945, -5.3728928565979, -5.210670471191406, -5.048447608947754, -4.88622522354126, -4.724002838134766, -4.5617804527282715, -4.399558067321777, -4.237335681915283, -4.075113296508789, -3.912890672683716, -3.7506682872772217, -3.5884456634521484, -3.4262237548828125, -3.2640013694763184, -3.101778984069824, -2.93955659866333, -2.777333974838257, -2.6151115894317627, -2.4528892040252686, -2.2906665802001953, -2.128444194793701, -1.966221809387207, -1.8039993047714233, -1.6417769193649292, -1.4795544147491455, -1.3173320293426514, -1.1551096439361572, -0.9928871393203735, -0.8306647539138794, -0.6684423089027405, -0.5062198638916016, -0.3439974784851074, -0.1817750334739685, -0.01955258846282959, 0.14266979694366455, 0.30489230155944824, 0.4671146869659424, 0.6293371319770813, 0.7915595769882202, 0.9537819623947144, 1.116004467010498, 1.2782268524169922, 1.4404492378234863, 1.60267174243927, 1.7648941278457642, 1.9271165132522583, 2.089339017868042, 2.251561403274536, 2.4137837886810303, 2.5760064125061035, 2.7382287979125977, 2.900451183319092, 3.062673568725586]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 16.0, 17.0, 23.0, 26.0, 49.0, 114.0, 159.0, 309.0, 570.0, 1190.0, 2961.0, 10011.0, 68723.0, 587650.0, 333497.0, 32835.0, 6325.0, 2081.0, 924.0, 469.0, 234.0, 136.0, 80.0, 53.0, 25.0, 18.0, 17.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123046875, -3.024932861328125, -2.92681884765625, -2.828704833984375, -2.7305908203125, -2.632476806640625, -2.53436279296875, -2.436248779296875, -2.338134765625, -2.240020751953125, -2.14190673828125, -2.043792724609375, -1.9456787109375, -1.847564697265625, -1.74945068359375, -1.651336669921875, -1.55322265625, -1.455108642578125, -1.35699462890625, -1.258880615234375, -1.1607666015625, -1.062652587890625, -0.96453857421875, -0.866424560546875, -0.768310546875, -0.670196533203125, -0.57208251953125, -0.473968505859375, -0.3758544921875, -0.277740478515625, -0.17962646484375, -0.081512451171875, 0.0166015625, 0.114715576171875, 0.21282958984375, 0.310943603515625, 0.4090576171875, 0.507171630859375, 0.60528564453125, 0.703399658203125, 0.801513671875, 0.899627685546875, 0.99774169921875, 1.095855712890625, 1.1939697265625, 1.292083740234375, 1.39019775390625, 1.488311767578125, 1.58642578125, 1.684539794921875, 1.78265380859375, 1.880767822265625, 1.9788818359375, 2.076995849609375, 2.17510986328125, 2.273223876953125, 2.371337890625, 2.469451904296875, 2.56756591796875, 2.665679931640625, 2.7637939453125, 2.861907958984375, 2.96002197265625, 3.058135986328125, 3.15625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 20.0, 45.0, 52.0, 48.0, 102.0, 146.0, 135.0, 118.0, 95.0, 86.0, 68.0, 24.0, 17.0, 10.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0050048828125, -0.970947265625, -0.9368896484375, -0.90283203125, -0.8687744140625, -0.834716796875, -0.8006591796875, -0.7666015625, -0.7325439453125, -0.698486328125, -0.6644287109375, -0.63037109375, -0.5963134765625, -0.562255859375, -0.5281982421875, -0.494140625, -0.4600830078125, -0.426025390625, -0.3919677734375, -0.35791015625, -0.3238525390625, -0.289794921875, -0.2557373046875, -0.2216796875, -0.1876220703125, -0.153564453125, -0.1195068359375, -0.08544921875, -0.0513916015625, -0.017333984375, 0.0167236328125, 0.05078125, 0.0848388671875, 0.118896484375, 0.1529541015625, 0.18701171875, 0.2210693359375, 0.255126953125, 0.2891845703125, 0.3232421875, 0.3572998046875, 0.391357421875, 0.4254150390625, 0.45947265625, 0.4935302734375, 0.527587890625, 0.5616455078125, 0.595703125, 0.6297607421875, 0.663818359375, 0.6978759765625, 0.73193359375, 0.7659912109375, 0.800048828125, 0.8341064453125, 0.8681640625, 0.9022216796875, 0.936279296875, 0.9703369140625, 1.00439453125, 1.0384521484375, 1.072509765625, 1.1065673828125, 1.140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 9.0, 8.0, 24.0, 21.0, 30.0, 60.0, 106.0, 113.0, 179.0, 259.0, 457.0, 893.0, 2195.0, 7008.0, 40635.0, 288021.0, 554214.0, 129396.0, 17625.0, 4058.0, 1437.0, 666.0, 411.0, 227.0, 146.0, 91.0, 75.0, 51.0, 32.0, 21.0, 16.0, 15.0, 16.0, 9.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.40234375, -2.32794189453125, -2.2535400390625, -2.17913818359375, -2.104736328125, -2.03033447265625, -1.9559326171875, -1.88153076171875, -1.80712890625, -1.73272705078125, -1.6583251953125, -1.58392333984375, -1.509521484375, -1.43511962890625, -1.3607177734375, -1.28631591796875, -1.2119140625, -1.13751220703125, -1.0631103515625, -0.98870849609375, -0.914306640625, -0.83990478515625, -0.7655029296875, -0.69110107421875, -0.61669921875, -0.54229736328125, -0.4678955078125, -0.39349365234375, -0.319091796875, -0.24468994140625, -0.1702880859375, -0.09588623046875, -0.021484375, 0.05291748046875, 0.1273193359375, 0.20172119140625, 0.276123046875, 0.35052490234375, 0.4249267578125, 0.49932861328125, 0.57373046875, 0.64813232421875, 0.7225341796875, 0.79693603515625, 0.871337890625, 0.94573974609375, 1.0201416015625, 1.09454345703125, 1.1689453125, 1.24334716796875, 1.3177490234375, 1.39215087890625, 1.466552734375, 1.54095458984375, 1.6153564453125, 1.68975830078125, 1.76416015625, 1.83856201171875, 1.9129638671875, 1.98736572265625, 2.061767578125, 2.13616943359375, 2.2105712890625, 2.28497314453125, 2.359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 6.0, 15.0, 6.0, 18.0, 37.0, 29.0, 24.0, 28.0, 43.0, 47.0, 40.0, 55.0, 45.0, 48.0, 60.0, 61.0, 43.0, 44.0, 52.0, 41.0, 45.0, 37.0, 28.0, 24.0, 31.0, 19.0, 15.0, 13.0, 8.0, 7.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.512969970703125, -2.43023681640625, -2.347503662109375, -2.2647705078125, -2.182037353515625, -2.09930419921875, -2.016571044921875, -1.933837890625, -1.851104736328125, -1.76837158203125, -1.685638427734375, -1.6029052734375, -1.520172119140625, -1.43743896484375, -1.354705810546875, -1.27197265625, -1.189239501953125, -1.10650634765625, -1.023773193359375, -0.9410400390625, -0.858306884765625, -0.77557373046875, -0.692840576171875, -0.610107421875, -0.527374267578125, -0.44464111328125, -0.361907958984375, -0.2791748046875, -0.196441650390625, -0.11370849609375, -0.030975341796875, 0.0517578125, 0.134490966796875, 0.21722412109375, 0.299957275390625, 0.3826904296875, 0.465423583984375, 0.54815673828125, 0.630889892578125, 0.713623046875, 0.796356201171875, 0.87908935546875, 0.961822509765625, 1.0445556640625, 1.127288818359375, 1.21002197265625, 1.292755126953125, 1.37548828125, 1.458221435546875, 1.54095458984375, 1.623687744140625, 1.7064208984375, 1.789154052734375, 1.87188720703125, 1.954620361328125, 2.037353515625, 2.120086669921875, 2.20281982421875, 2.285552978515625, 2.3682861328125, 2.451019287109375, 2.53375244140625, 2.616485595703125, 2.69921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 6.0, 14.0, 7.0, 6.0, 18.0, 20.0, 25.0, 37.0, 56.0, 109.0, 210.0, 409.0, 1070.0, 3551.0, 16181.0, 237048.0, 740982.0, 39601.0, 6159.0, 1814.0, 588.0, 259.0, 142.0, 77.0, 49.0, 26.0, 21.0, 9.0, 13.0, 10.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.6416015625, -1.6007766723632812, -1.5599517822265625, -1.5191268920898438, -1.478302001953125, -1.4374771118164062, -1.3966522216796875, -1.3558273315429688, -1.31500244140625, -1.2741775512695312, -1.2333526611328125, -1.1925277709960938, -1.151702880859375, -1.1108779907226562, -1.0700531005859375, -1.0292282104492188, -0.9884033203125, -0.9475784301757812, -0.9067535400390625, -0.8659286499023438, -0.825103759765625, -0.7842788696289062, -0.7434539794921875, -0.7026290893554688, -0.66180419921875, -0.6209793090820312, -0.5801544189453125, -0.5393295288085938, -0.498504638671875, -0.45767974853515625, -0.4168548583984375, -0.37602996826171875, -0.335205078125, -0.29438018798828125, -0.2535552978515625, -0.21273040771484375, -0.171905517578125, -0.13108062744140625, -0.0902557373046875, -0.04943084716796875, -0.00860595703125, 0.03221893310546875, 0.0730438232421875, 0.11386871337890625, 0.154693603515625, 0.19551849365234375, 0.2363433837890625, 0.27716827392578125, 0.3179931640625, 0.35881805419921875, 0.3996429443359375, 0.44046783447265625, 0.481292724609375, 0.5221176147460938, 0.5629425048828125, 0.6037673950195312, 0.64459228515625, 0.6854171752929688, 0.7262420654296875, 0.7670669555664062, 0.807891845703125, 0.8487167358398438, 0.8895416259765625, 0.9303665161132812, 0.97119140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 13.0, 9.0, 21.0, 30.0, 45.0, 59.0, 74.0, 115.0, 140.0, 130.0, 98.0, 64.0, 47.0, 26.0, 25.0, 16.0, 20.0, 15.0, 12.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014138221740722656, -0.00013689883053302765, -0.00013241544365882874, -0.00012793205678462982, -0.0001234486699104309, -0.000118965283036232, -0.00011448189616203308, -0.00010999850928783417, -0.00010551512241363525, -0.00010103173553943634, -9.654834866523743e-05, -9.206496179103851e-05, -8.75815749168396e-05, -8.309818804264069e-05, -7.861480116844177e-05, -7.413141429424286e-05, -6.964802742004395e-05, -6.516464054584503e-05, -6.068125367164612e-05, -5.6197866797447205e-05, -5.171447992324829e-05, -4.723109304904938e-05, -4.2747706174850464e-05, -3.826431930065155e-05, -3.378093242645264e-05, -2.9297545552253723e-05, -2.481415867805481e-05, -2.0330771803855896e-05, -1.5847384929656982e-05, -1.1363998055458069e-05, -6.880611181259155e-06, -2.3972243070602417e-06, 2.086162567138672e-06, 6.5695494413375854e-06, 1.1052936315536499e-05, 1.5536323189735413e-05, 2.0019710063934326e-05, 2.450309693813324e-05, 2.8986483812332153e-05, 3.346987068653107e-05, 3.795325756072998e-05, 4.2436644434928894e-05, 4.692003130912781e-05, 5.140341818332672e-05, 5.5886805057525635e-05, 6.037019193172455e-05, 6.485357880592346e-05, 6.933696568012238e-05, 7.382035255432129e-05, 7.83037394285202e-05, 8.278712630271912e-05, 8.727051317691803e-05, 9.175390005111694e-05, 9.623728692531586e-05, 0.00010072067379951477, 0.00010520406067371368, 0.0001096874475479126, 0.00011417083442211151, 0.00011865422129631042, 0.00012313760817050934, 0.00012762099504470825, 0.00013210438191890717, 0.00013658776879310608, 0.000141071155667305, 0.0001455545425415039]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 8.0, 10.0, 15.0, 17.0, 22.0, 37.0, 60.0, 73.0, 139.0, 273.0, 597.0, 1564.0, 4973.0, 26700.0, 586490.0, 400886.0, 20116.0, 4078.0, 1321.0, 522.0, 245.0, 126.0, 63.0, 56.0, 47.0, 19.0, 18.0, 15.0, 10.0, 12.0, 6.0, 6.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1806640625, -1.139862060546875, -1.09906005859375, -1.058258056640625, -1.0174560546875, -0.976654052734375, -0.93585205078125, -0.895050048828125, -0.854248046875, -0.813446044921875, -0.77264404296875, -0.731842041015625, -0.6910400390625, -0.650238037109375, -0.60943603515625, -0.568634033203125, -0.52783203125, -0.487030029296875, -0.44622802734375, -0.405426025390625, -0.3646240234375, -0.323822021484375, -0.28302001953125, -0.242218017578125, -0.201416015625, -0.160614013671875, -0.11981201171875, -0.079010009765625, -0.0382080078125, 0.002593994140625, 0.04339599609375, 0.084197998046875, 0.125, 0.165802001953125, 0.20660400390625, 0.247406005859375, 0.2882080078125, 0.329010009765625, 0.36981201171875, 0.410614013671875, 0.451416015625, 0.492218017578125, 0.53302001953125, 0.573822021484375, 0.6146240234375, 0.655426025390625, 0.69622802734375, 0.737030029296875, 0.77783203125, 0.818634033203125, 0.85943603515625, 0.900238037109375, 0.9410400390625, 0.981842041015625, 1.02264404296875, 1.063446044921875, 1.104248046875, 1.145050048828125, 1.18585205078125, 1.226654052734375, 1.2674560546875, 1.308258056640625, 1.34906005859375, 1.389862060546875, 1.4306640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 20.0, 35.0, 57.0, 79.0, 109.0, 177.0, 181.0, 113.0, 78.0, 45.0, 23.0, 15.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 7.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9677734375, -0.931793212890625, -0.89581298828125, -0.859832763671875, -0.8238525390625, -0.787872314453125, -0.75189208984375, -0.715911865234375, -0.679931640625, -0.643951416015625, -0.60797119140625, -0.571990966796875, -0.5360107421875, -0.500030517578125, -0.46405029296875, -0.428070068359375, -0.39208984375, -0.356109619140625, -0.32012939453125, -0.284149169921875, -0.2481689453125, -0.212188720703125, -0.17620849609375, -0.140228271484375, -0.104248046875, -0.068267822265625, -0.03228759765625, 0.003692626953125, 0.0396728515625, 0.075653076171875, 0.11163330078125, 0.147613525390625, 0.18359375, 0.219573974609375, 0.25555419921875, 0.291534423828125, 0.3275146484375, 0.363494873046875, 0.39947509765625, 0.435455322265625, 0.471435546875, 0.507415771484375, 0.54339599609375, 0.579376220703125, 0.6153564453125, 0.651336669921875, 0.68731689453125, 0.723297119140625, 0.75927734375, 0.795257568359375, 0.83123779296875, 0.867218017578125, 0.9031982421875, 0.939178466796875, 0.97515869140625, 1.011138916015625, 1.047119140625, 1.083099365234375, 1.11907958984375, 1.155059814453125, 1.1910400390625, 1.227020263671875, 1.26300048828125, 1.298980712890625, 1.3349609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 14.0, 29.0, 45.0, 78.0, 116.0, 160.0, 159.0, 140.0, 108.0, 58.0, 32.0, 17.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.490825653076172, -10.090806007385254, -9.690787315368652, -9.290767669677734, -8.890748023986816, -8.490729331970215, -8.090709686279297, -7.690690517425537, -7.290671348571777, -6.890652179718018, -6.4906325340271, -6.09061336517334, -5.69059419631958, -5.29057502746582, -4.890555381774902, -4.490536212921143, -4.090516567230225, -3.6904971599578857, -3.290477991104126, -2.890458583831787, -2.4904394149780273, -2.0904200077056885, -1.6904006004333496, -1.2903814315795898, -0.890362024307251, -0.4903427064418793, -0.09032338857650757, 0.3096959590911865, 0.7097152471542358, 1.1097345352172852, 1.509753942489624, 1.9097731113433838, 2.3097925186157227, 2.7098119258880615, 3.1098310947418213, 3.50985050201416, 3.90986967086792, 4.30988883972168, 4.709908485412598, 5.109927654266357, 5.509946823120117, 5.909965991973877, 6.309985637664795, 6.710004806518555, 7.1100239753723145, 7.510043144226074, 7.910062789916992, 8.310081481933594, 8.710102081298828, 9.110121726989746, 9.510140419006348, 9.910160064697266, 10.310179710388184, 10.710198402404785, 11.110218048095703, 11.510236740112305, 11.910256385803223, 12.31027603149414, 12.710294723510742, 13.11031436920166, 13.510334014892578, 13.91035270690918, 14.310372352600098, 14.710391998291016, 15.110410690307617]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 8.0, 5.0, 9.0, 13.0, 16.0, 18.0, 18.0, 21.0, 31.0, 40.0, 38.0, 53.0, 60.0, 66.0, 52.0, 43.0, 57.0, 39.0, 49.0, 48.0, 54.0, 31.0, 43.0, 38.0, 22.0, 26.0, 28.0, 21.0, 13.0, 7.0, 10.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.935736656188965, -15.460702896118164, -14.985669136047363, -14.510635375976562, -14.035600662231445, -13.560566902160645, -13.085533142089844, -12.610499382019043, -12.135465621948242, -11.660431861877441, -11.18539810180664, -10.710363388061523, -10.235329627990723, -9.760295867919922, -9.285262107849121, -8.81022834777832, -8.335193634033203, -7.860159873962402, -7.385125637054443, -6.910091876983643, -6.435057640075684, -5.960023880004883, -5.484990119934082, -5.009956359863281, -4.534922122955322, -4.0598883628845215, -3.5848541259765625, -3.1098203659057617, -2.634786367416382, -2.159752368927002, -1.6847186088562012, -1.2096846103668213, -0.7346515655517578, -0.2596176266670227, 0.2154163122177124, 0.6904501914978027, 1.1654841899871826, 1.6405181884765625, 2.1155519485473633, 2.590585947036743, 3.065619945526123, 3.540653944015503, 4.015687942504883, 4.490721702575684, 4.965755462646484, 5.440789699554443, 5.915823459625244, 6.390857696533203, 6.865891456604004, 7.340925216674805, 7.815959453582764, 8.290992736816406, 8.766027450561523, 9.241061210632324, 9.716094970703125, 10.191128730773926, 10.666162490844727, 11.141196250915527, 11.616230010986328, 12.091264724731445, 12.566298484802246, 13.041332244873047, 13.516366004943848, 13.991399765014648, 14.466434478759766]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 13.0, 19.0, 29.0, 41.0, 64.0, 110.0, 236.0, 390.0, 903.0, 2223.0, 7088.0, 37159.0, 3388704.0, 723142.0, 25376.0, 5361.0, 1738.0, 733.0, 399.0, 202.0, 118.0, 71.0, 38.0, 33.0, 18.0, 14.0, 20.0, 8.0, 11.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.847076416015625, -2.76055908203125, -2.674041748046875, -2.5875244140625, -2.501007080078125, -2.41448974609375, -2.327972412109375, -2.241455078125, -2.154937744140625, -2.06842041015625, -1.981903076171875, -1.8953857421875, -1.808868408203125, -1.72235107421875, -1.635833740234375, -1.54931640625, -1.462799072265625, -1.37628173828125, -1.289764404296875, -1.2032470703125, -1.116729736328125, -1.03021240234375, -0.943695068359375, -0.857177734375, -0.770660400390625, -0.68414306640625, -0.597625732421875, -0.5111083984375, -0.424591064453125, -0.33807373046875, -0.251556396484375, -0.1650390625, -0.078521728515625, 0.00799560546875, 0.094512939453125, 0.1810302734375, 0.267547607421875, 0.35406494140625, 0.440582275390625, 0.527099609375, 0.613616943359375, 0.70013427734375, 0.786651611328125, 0.8731689453125, 0.959686279296875, 1.04620361328125, 1.132720947265625, 1.21923828125, 1.305755615234375, 1.39227294921875, 1.478790283203125, 1.5653076171875, 1.651824951171875, 1.73834228515625, 1.824859619140625, 1.911376953125, 1.997894287109375, 2.08441162109375, 2.170928955078125, 2.2574462890625, 2.343963623046875, 2.43048095703125, 2.516998291015625, 2.603515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 22.0, 23.0, 37.0, 55.0, 73.0, 83.0, 111.0, 115.0, 118.0, 116.0, 73.0, 54.0, 40.0, 25.0, 11.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9281768798828125, -0.894439697265625, -0.8607025146484375, -0.82696533203125, -0.7932281494140625, -0.759490966796875, -0.7257537841796875, -0.6920166015625, -0.6582794189453125, -0.624542236328125, -0.5908050537109375, -0.55706787109375, -0.5233306884765625, -0.489593505859375, -0.4558563232421875, -0.422119140625, -0.3883819580078125, -0.354644775390625, -0.3209075927734375, -0.28717041015625, -0.2534332275390625, -0.219696044921875, -0.1859588623046875, -0.1522216796875, -0.1184844970703125, -0.084747314453125, -0.0510101318359375, -0.01727294921875, 0.0164642333984375, 0.050201416015625, 0.0839385986328125, 0.11767578125, 0.1514129638671875, 0.185150146484375, 0.2188873291015625, 0.25262451171875, 0.2863616943359375, 0.320098876953125, 0.3538360595703125, 0.3875732421875, 0.4213104248046875, 0.455047607421875, 0.4887847900390625, 0.52252197265625, 0.5562591552734375, 0.589996337890625, 0.6237335205078125, 0.657470703125, 0.6912078857421875, 0.724945068359375, 0.7586822509765625, 0.79241943359375, 0.8261566162109375, 0.859893798828125, 0.8936309814453125, 0.9273681640625, 0.9611053466796875, 0.994842529296875, 1.0285797119140625, 1.06231689453125, 1.0960540771484375, 1.129791259765625, 1.1635284423828125, 1.197265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 10.0, 23.0, 45.0, 126.0, 347.0, 2306.0, 118940.0, 4059463.0, 11728.0, 896.0, 220.0, 86.0, 43.0, 24.0, 12.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.01177978515625, -1.8477783203125, -1.68377685546875, -1.519775390625, -1.35577392578125, -1.1917724609375, -1.02777099609375, -0.86376953125, -0.69976806640625, -0.5357666015625, -0.37176513671875, -0.207763671875, -0.04376220703125, 0.1202392578125, 0.28424072265625, 0.4482421875, 0.61224365234375, 0.7762451171875, 0.94024658203125, 1.104248046875, 1.26824951171875, 1.4322509765625, 1.59625244140625, 1.76025390625, 1.92425537109375, 2.0882568359375, 2.25225830078125, 2.416259765625, 2.58026123046875, 2.7442626953125, 2.90826416015625, 3.072265625, 3.23626708984375, 3.4002685546875, 3.56427001953125, 3.728271484375, 3.89227294921875, 4.0562744140625, 4.22027587890625, 4.38427734375, 4.54827880859375, 4.7122802734375, 4.87628173828125, 5.040283203125, 5.20428466796875, 5.3682861328125, 5.53228759765625, 5.6962890625, 5.86029052734375, 6.0242919921875, 6.18829345703125, 6.352294921875, 6.51629638671875, 6.6802978515625, 6.84429931640625, 7.00830078125, 7.17230224609375, 7.3363037109375, 7.50030517578125, 7.664306640625, 7.82830810546875, 7.9923095703125, 8.15631103515625, 8.3203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 26.0, 40.0, 106.0, 263.0, 1268.0, 1740.0, 342.0, 130.0, 57.0, 35.0, 21.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.6973648071289062, -0.6608428955078125, -0.6243209838867188, -0.587799072265625, -0.5512771606445312, -0.5147552490234375, -0.47823333740234375, -0.44171142578125, -0.40518951416015625, -0.3686676025390625, -0.33214569091796875, -0.295623779296875, -0.25910186767578125, -0.2225799560546875, -0.18605804443359375, -0.1495361328125, -0.11301422119140625, -0.0764923095703125, -0.03997039794921875, -0.003448486328125, 0.03307342529296875, 0.0695953369140625, 0.10611724853515625, 0.14263916015625, 0.17916107177734375, 0.2156829833984375, 0.25220489501953125, 0.288726806640625, 0.32524871826171875, 0.3617706298828125, 0.39829254150390625, 0.434814453125, 0.47133636474609375, 0.5078582763671875, 0.5443801879882812, 0.580902099609375, 0.6174240112304688, 0.6539459228515625, 0.6904678344726562, 0.72698974609375, 0.7635116577148438, 0.8000335693359375, 0.8365554809570312, 0.873077392578125, 0.9095993041992188, 0.9461212158203125, 0.9826431274414062, 1.0191650390625, 1.0556869506835938, 1.0922088623046875, 1.1287307739257812, 1.165252685546875, 1.2017745971679688, 1.2382965087890625, 1.2748184204101562, 1.31134033203125, 1.3478622436523438, 1.3843841552734375, 1.4209060668945312, 1.457427978515625, 1.4939498901367188, 1.5304718017578125, 1.5669937133789062, 1.603515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 25.0, 54.0, 84.0, 131.0, 161.0, 138.0, 136.0, 94.0, 65.0, 43.0, 21.0, 13.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.3084025382995605, -3.204294204711914, -3.1001861095428467, -2.9960777759552, -2.891969680786133, -2.7878613471984863, -2.68375301361084, -2.5796449184417725, -2.475536823272705, -2.3714284896850586, -2.267320394515991, -2.1632120609283447, -2.0591039657592773, -1.9549956321716309, -1.850887417793274, -1.746779203414917, -1.6426708698272705, -1.5385626554489136, -1.4344544410705566, -1.3303461074829102, -1.2262380123138428, -1.1221296787261963, -1.0180214643478394, -0.9139132499694824, -0.8098050355911255, -0.7056968212127686, -0.6015886068344116, -0.4974803328514099, -0.393372118473053, -0.28926390409469604, -0.18515563011169434, -0.0810474157333374, 0.023061037063598633, 0.12716926634311676, 0.2312774956226349, 0.3353857398033142, 0.43949395418167114, 0.5436021685600281, 0.6477104425430298, 0.7518186569213867, 0.8559268712997437, 0.9600350856781006, 1.0641433000564575, 1.1682515144348145, 1.272359848022461, 1.3764679431915283, 1.4805762767791748, 1.5846844911575317, 1.6887927055358887, 1.7929009199142456, 1.8970091342926025, 2.001117467880249, 2.1052255630493164, 2.209333896636963, 2.3134422302246094, 2.4175503253936768, 2.521658420562744, 2.6257667541503906, 2.729874849319458, 2.8339831829071045, 2.938091278076172, 3.0421996116638184, 3.146307945251465, 3.2504160404205322, 3.3545243740081787]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 8.0, 7.0, 14.0, 8.0, 5.0, 9.0, 17.0, 22.0, 19.0, 23.0, 14.0, 28.0, 26.0, 19.0, 31.0, 35.0, 38.0, 37.0, 48.0, 46.0, 37.0, 42.0, 34.0, 53.0, 27.0, 48.0, 29.0, 30.0, 32.0, 29.0, 32.0, 25.0, 27.0, 17.0, 16.0, 15.0, 8.0, 7.0, 9.0, 8.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1050379276275635, -2.041447639465332, -1.9778574705123901, -1.9142673015594482, -1.8506771326065063, -1.7870869636535645, -1.723496675491333, -1.6599065065383911, -1.5963163375854492, -1.5327261686325073, -1.4691358804702759, -1.405545711517334, -1.341955542564392, -1.2783653736114502, -1.2147750854492188, -1.1511849164962769, -1.0875946283340454, -1.0240044593811035, -0.9604142308235168, -0.8968240022659302, -0.8332338333129883, -0.7696436047554016, -0.7060533761978149, -0.642463207244873, -0.5788729786872864, -0.5152827501296997, -0.4516925811767578, -0.38810235261917114, -0.32451215386390686, -0.2609219551086426, -0.1973317265510559, -0.13374152779579163, -0.07015132904052734, -0.006561122834682465, 0.057029083371162415, 0.12061929702758789, 0.18420949578285217, 0.24779969453811646, 0.3113899230957031, 0.3749801218509674, 0.4385703206062317, 0.5021605491638184, 0.5657507181167603, 0.6293409466743469, 0.6929311752319336, 0.7565213441848755, 0.8201115727424622, 0.8837018013000488, 0.9472919702529907, 1.0108821392059326, 1.074472427368164, 1.138062596321106, 1.2016527652740479, 1.2652430534362793, 1.3288332223892212, 1.392423391342163, 1.4560136795043945, 1.5196038484573364, 1.5831941366195679, 1.6467843055725098, 1.7103744745254517, 1.7739646434783936, 1.837554931640625, 1.901145100593567, 1.9647352695465088]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 6.0, 6.0, 26.0, 19.0, 26.0, 35.0, 44.0, 61.0, 105.0, 108.0, 181.0, 251.0, 416.0, 668.0, 1079.0, 1953.0, 3787.0, 8871.0, 24711.0, 77443.0, 239092.0, 394183.0, 198046.0, 62019.0, 20130.0, 7443.0, 3280.0, 1752.0, 972.0, 578.0, 385.0, 270.0, 189.0, 121.0, 89.0, 57.0, 46.0, 30.0, 24.0, 15.0, 14.0, 8.0, 5.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5858306884765625, -1.536895751953125, -1.4879608154296875, -1.43902587890625, -1.3900909423828125, -1.341156005859375, -1.2922210693359375, -1.2432861328125, -1.1943511962890625, -1.145416259765625, -1.0964813232421875, -1.04754638671875, -0.9986114501953125, -0.949676513671875, -0.9007415771484375, -0.851806640625, -0.8028717041015625, -0.753936767578125, -0.7050018310546875, -0.65606689453125, -0.6071319580078125, -0.558197021484375, -0.5092620849609375, -0.4603271484375, -0.4113922119140625, -0.362457275390625, -0.3135223388671875, -0.26458740234375, -0.2156524658203125, -0.166717529296875, -0.1177825927734375, -0.06884765625, -0.0199127197265625, 0.029022216796875, 0.0779571533203125, 0.12689208984375, 0.1758270263671875, 0.224761962890625, 0.2736968994140625, 0.3226318359375, 0.3715667724609375, 0.420501708984375, 0.4694366455078125, 0.51837158203125, 0.5673065185546875, 0.616241455078125, 0.6651763916015625, 0.714111328125, 0.7630462646484375, 0.811981201171875, 0.8609161376953125, 0.90985107421875, 0.9587860107421875, 1.007720947265625, 1.0566558837890625, 1.1055908203125, 1.1545257568359375, 1.203460693359375, 1.2523956298828125, 1.30133056640625, 1.3502655029296875, 1.399200439453125, 1.4481353759765625, 1.4970703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 12.0, 14.0, 30.0, 37.0, 47.0, 69.0, 85.0, 106.0, 117.0, 105.0, 114.0, 87.0, 60.0, 42.0, 26.0, 12.0, 4.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9094696044921875, -0.876556396484375, -0.8436431884765625, -0.81072998046875, -0.7778167724609375, -0.744903564453125, -0.7119903564453125, -0.6790771484375, -0.6461639404296875, -0.613250732421875, -0.5803375244140625, -0.54742431640625, -0.5145111083984375, -0.481597900390625, -0.4486846923828125, -0.415771484375, -0.3828582763671875, -0.349945068359375, -0.3170318603515625, -0.28411865234375, -0.2512054443359375, -0.218292236328125, -0.1853790283203125, -0.1524658203125, -0.1195526123046875, -0.086639404296875, -0.0537261962890625, -0.02081298828125, 0.0121002197265625, 0.045013427734375, 0.0779266357421875, 0.11083984375, 0.1437530517578125, 0.176666259765625, 0.2095794677734375, 0.24249267578125, 0.2754058837890625, 0.308319091796875, 0.3412322998046875, 0.3741455078125, 0.4070587158203125, 0.439971923828125, 0.4728851318359375, 0.50579833984375, 0.5387115478515625, 0.571624755859375, 0.6045379638671875, 0.637451171875, 0.6703643798828125, 0.703277587890625, 0.7361907958984375, 0.76910400390625, 0.8020172119140625, 0.834930419921875, 0.8678436279296875, 0.9007568359375, 0.9336700439453125, 0.966583251953125, 0.9994964599609375, 1.03240966796875, 1.0653228759765625, 1.098236083984375, 1.1311492919921875, 1.1640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 4.0, 14.0, 9.0, 19.0, 19.0, 20.0, 20.0, 38.0, 58.0, 71.0, 90.0, 118.0, 143.0, 173.0, 235.0, 329.0, 492.0, 720.0, 1481.0, 3456.0, 11884.0, 54764.0, 256747.0, 477305.0, 186988.0, 38008.0, 8884.0, 2817.0, 1247.0, 698.0, 422.0, 306.0, 230.0, 159.0, 127.0, 106.0, 68.0, 65.0, 46.0, 35.0, 29.0, 28.0, 21.0, 13.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.796875, -1.7396240234375, -1.682373046875, -1.6251220703125, -1.56787109375, -1.5106201171875, -1.453369140625, -1.3961181640625, -1.3388671875, -1.2816162109375, -1.224365234375, -1.1671142578125, -1.10986328125, -1.0526123046875, -0.995361328125, -0.9381103515625, -0.880859375, -0.8236083984375, -0.766357421875, -0.7091064453125, -0.65185546875, -0.5946044921875, -0.537353515625, -0.4801025390625, -0.4228515625, -0.3656005859375, -0.308349609375, -0.2510986328125, -0.19384765625, -0.1365966796875, -0.079345703125, -0.0220947265625, 0.03515625, 0.0924072265625, 0.149658203125, 0.2069091796875, 0.26416015625, 0.3214111328125, 0.378662109375, 0.4359130859375, 0.4931640625, 0.5504150390625, 0.607666015625, 0.6649169921875, 0.72216796875, 0.7794189453125, 0.836669921875, 0.8939208984375, 0.951171875, 1.0084228515625, 1.065673828125, 1.1229248046875, 1.18017578125, 1.2374267578125, 1.294677734375, 1.3519287109375, 1.4091796875, 1.4664306640625, 1.523681640625, 1.5809326171875, 1.63818359375, 1.6954345703125, 1.752685546875, 1.8099365234375, 1.8671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 8.0, 6.0, 11.0, 17.0, 13.0, 22.0, 19.0, 41.0, 25.0, 35.0, 33.0, 45.0, 39.0, 46.0, 49.0, 43.0, 44.0, 54.0, 56.0, 38.0, 40.0, 39.0, 37.0, 29.0, 39.0, 17.0, 22.0, 19.0, 17.0, 20.0, 19.0, 17.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.13525390625, -2.0615234375, -1.98779296875, -1.9140625, -1.84033203125, -1.7666015625, -1.69287109375, -1.619140625, -1.54541015625, -1.4716796875, -1.39794921875, -1.32421875, -1.25048828125, -1.1767578125, -1.10302734375, -1.029296875, -0.95556640625, -0.8818359375, -0.80810546875, -0.734375, -0.66064453125, -0.5869140625, -0.51318359375, -0.439453125, -0.36572265625, -0.2919921875, -0.21826171875, -0.14453125, -0.07080078125, 0.0029296875, 0.07666015625, 0.150390625, 0.22412109375, 0.2978515625, 0.37158203125, 0.4453125, 0.51904296875, 0.5927734375, 0.66650390625, 0.740234375, 0.81396484375, 0.8876953125, 0.96142578125, 1.03515625, 1.10888671875, 1.1826171875, 1.25634765625, 1.330078125, 1.40380859375, 1.4775390625, 1.55126953125, 1.625, 1.69873046875, 1.7724609375, 1.84619140625, 1.919921875, 1.99365234375, 2.0673828125, 2.14111328125, 2.21484375, 2.28857421875, 2.3623046875, 2.43603515625, 2.509765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 11.0, 6.0, 17.0, 15.0, 21.0, 50.0, 88.0, 179.0, 404.0, 1014.0, 3294.0, 14876.0, 130369.0, 715892.0, 159643.0, 17017.0, 3622.0, 1134.0, 461.0, 201.0, 99.0, 50.0, 35.0, 18.0, 12.0, 13.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0601272583007812, -1.0294342041015625, -0.9987411499023438, -0.968048095703125, -0.9373550415039062, -0.9066619873046875, -0.8759689331054688, -0.84527587890625, -0.8145828247070312, -0.7838897705078125, -0.7531967163085938, -0.722503662109375, -0.6918106079101562, -0.6611175537109375, -0.6304244995117188, -0.5997314453125, -0.5690383911132812, -0.5383453369140625, -0.5076522827148438, -0.476959228515625, -0.44626617431640625, -0.4155731201171875, -0.38488006591796875, -0.35418701171875, -0.32349395751953125, -0.2928009033203125, -0.26210784912109375, -0.231414794921875, -0.20072174072265625, -0.1700286865234375, -0.13933563232421875, -0.108642578125, -0.07794952392578125, -0.0472564697265625, -0.01656341552734375, 0.014129638671875, 0.04482269287109375, 0.0755157470703125, 0.10620880126953125, 0.13690185546875, 0.16759490966796875, 0.1982879638671875, 0.22898101806640625, 0.259674072265625, 0.29036712646484375, 0.3210601806640625, 0.35175323486328125, 0.3824462890625, 0.41313934326171875, 0.4438323974609375, 0.47452545166015625, 0.505218505859375, 0.5359115600585938, 0.5666046142578125, 0.5972976684570312, 0.62799072265625, 0.6586837768554688, 0.6893768310546875, 0.7200698852539062, 0.750762939453125, 0.7814559936523438, 0.8121490478515625, 0.8428421020507812, 0.87353515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 10.0, 10.0, 16.0, 13.0, 21.0, 22.0, 27.0, 29.0, 43.0, 54.0, 86.0, 115.0, 117.0, 92.0, 65.0, 64.0, 46.0, 36.0, 22.0, 26.0, 15.0, 14.0, 11.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010156631469726562, -9.737908840179443e-05, -9.319186210632324e-05, -8.900463581085205e-05, -8.481740951538086e-05, -8.063018321990967e-05, -7.644295692443848e-05, -7.225573062896729e-05, -6.80685043334961e-05, -6.38812780380249e-05, -5.969405174255371e-05, -5.550682544708252e-05, -5.131959915161133e-05, -4.713237285614014e-05, -4.2945146560668945e-05, -3.8757920265197754e-05, -3.457069396972656e-05, -3.038346767425537e-05, -2.619624137878418e-05, -2.2009015083312988e-05, -1.7821788787841797e-05, -1.3634562492370605e-05, -9.447336196899414e-06, -5.260109901428223e-06, -1.0728836059570312e-06, 3.11434268951416e-06, 7.3015689849853516e-06, 1.1488795280456543e-05, 1.5676021575927734e-05, 1.9863247871398926e-05, 2.4050474166870117e-05, 2.823770046234131e-05, 3.24249267578125e-05, 3.661215305328369e-05, 4.079937934875488e-05, 4.4986605644226074e-05, 4.9173831939697266e-05, 5.336105823516846e-05, 5.754828453063965e-05, 6.173551082611084e-05, 6.592273712158203e-05, 7.010996341705322e-05, 7.429718971252441e-05, 7.84844160079956e-05, 8.26716423034668e-05, 8.685886859893799e-05, 9.104609489440918e-05, 9.523332118988037e-05, 9.942054748535156e-05, 0.00010360777378082275, 0.00010779500007629395, 0.00011198222637176514, 0.00011616945266723633, 0.00012035667896270752, 0.0001245439052581787, 0.0001287311315536499, 0.0001329183578491211, 0.00013710558414459229, 0.00014129281044006348, 0.00014548003673553467, 0.00014966726303100586, 0.00015385448932647705, 0.00015804171562194824, 0.00016222894191741943, 0.00016641616821289062]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 7.0, 18.0, 27.0, 34.0, 56.0, 74.0, 103.0, 198.0, 403.0, 855.0, 2426.0, 9578.0, 83747.0, 736043.0, 192545.0, 16795.0, 3412.0, 1121.0, 494.0, 226.0, 118.0, 78.0, 50.0, 28.0, 27.0, 23.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7425308227539062, -0.7111358642578125, -0.6797409057617188, -0.648345947265625, -0.6169509887695312, -0.5855560302734375, -0.5541610717773438, -0.52276611328125, -0.49137115478515625, -0.4599761962890625, -0.42858123779296875, -0.397186279296875, -0.36579132080078125, -0.3343963623046875, -0.30300140380859375, -0.2716064453125, -0.24021148681640625, -0.2088165283203125, -0.17742156982421875, -0.146026611328125, -0.11463165283203125, -0.0832366943359375, -0.05184173583984375, -0.02044677734375, 0.01094818115234375, 0.0423431396484375, 0.07373809814453125, 0.105133056640625, 0.13652801513671875, 0.1679229736328125, 0.19931793212890625, 0.230712890625, 0.26210784912109375, 0.2935028076171875, 0.32489776611328125, 0.356292724609375, 0.38768768310546875, 0.4190826416015625, 0.45047760009765625, 0.48187255859375, 0.5132675170898438, 0.5446624755859375, 0.5760574340820312, 0.607452392578125, 0.6388473510742188, 0.6702423095703125, 0.7016372680664062, 0.7330322265625, 0.7644271850585938, 0.7958221435546875, 0.8272171020507812, 0.858612060546875, 0.8900070190429688, 0.9214019775390625, 0.9527969360351562, 0.98419189453125, 1.0155868530273438, 1.0469818115234375, 1.0783767700195312, 1.109771728515625, 1.1411666870117188, 1.1725616455078125, 1.2039566040039062, 1.2353515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 5.0, 7.0, 13.0, 8.0, 14.0, 21.0, 33.0, 29.0, 57.0, 70.0, 93.0, 90.0, 99.0, 101.0, 88.0, 81.0, 51.0, 41.0, 23.0, 11.0, 11.0, 13.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.83935546875, -0.8156890869140625, -0.792022705078125, -0.7683563232421875, -0.74468994140625, -0.7210235595703125, -0.697357177734375, -0.6736907958984375, -0.6500244140625, -0.6263580322265625, -0.602691650390625, -0.5790252685546875, -0.55535888671875, -0.5316925048828125, -0.508026123046875, -0.4843597412109375, -0.460693359375, -0.4370269775390625, -0.413360595703125, -0.3896942138671875, -0.36602783203125, -0.3423614501953125, -0.318695068359375, -0.2950286865234375, -0.2713623046875, -0.2476959228515625, -0.224029541015625, -0.2003631591796875, -0.17669677734375, -0.1530303955078125, -0.129364013671875, -0.1056976318359375, -0.08203125, -0.0583648681640625, -0.034698486328125, -0.0110321044921875, 0.01263427734375, 0.0363006591796875, 0.059967041015625, 0.0836334228515625, 0.1072998046875, 0.1309661865234375, 0.154632568359375, 0.1782989501953125, 0.20196533203125, 0.2256317138671875, 0.249298095703125, 0.2729644775390625, 0.296630859375, 0.3202972412109375, 0.343963623046875, 0.3676300048828125, 0.39129638671875, 0.4149627685546875, 0.438629150390625, 0.4622955322265625, 0.4859619140625, 0.5096282958984375, 0.533294677734375, 0.5569610595703125, 0.58062744140625, 0.6042938232421875, 0.627960205078125, 0.6516265869140625, 0.67529296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 11.0, 22.0, 50.0, 78.0, 163.0, 192.0, 200.0, 128.0, 68.0, 42.0, 23.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.68433952331543, -20.142208099365234, -19.600074768066406, -19.05794334411621, -18.515811920166016, -17.97368049621582, -17.431547164916992, -16.889415740966797, -16.3472843170166, -15.80515193939209, -15.263020515441895, -14.720888137817383, -14.178756713867188, -13.636624336242676, -13.094491958618164, -12.552360534667969, -12.010228157043457, -11.468095779418945, -10.92596435546875, -10.383831977844238, -9.841700553894043, -9.299568176269531, -8.757436752319336, -8.215304374694824, -7.673172473907471, -7.131040573120117, -6.588908672332764, -6.04677677154541, -5.504644393920898, -4.962512969970703, -4.420380592346191, -3.878248691558838, -3.3361167907714844, -2.793984889984131, -2.2518529891967773, -1.7097208499908447, -1.1675889492034912, -0.6254570484161377, -0.08332490921020508, 0.45880699157714844, 1.000938892364502, 1.5430707931518555, 2.085202693939209, 2.6273348331451416, 3.169466733932495, 3.7115986347198486, 4.253730773925781, 4.795862674713135, 5.337994575500488, 5.880126476287842, 6.422258377075195, 6.964390754699707, 7.506522178649902, 8.048654556274414, 8.59078598022461, 9.132918357849121, 9.675050735473633, 10.217183113098145, 10.75931453704834, 11.301446914672852, 11.843578338623047, 12.385710716247559, 12.92784309387207, 13.469974517822266, 14.012105941772461]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 4.0, 8.0, 9.0, 10.0, 17.0, 20.0, 20.0, 24.0, 18.0, 29.0, 39.0, 25.0, 43.0, 27.0, 35.0, 41.0, 51.0, 38.0, 46.0, 41.0, 51.0, 30.0, 49.0, 39.0, 37.0, 35.0, 28.0, 23.0, 23.0, 16.0, 22.0, 18.0, 13.0, 10.0, 10.0, 11.0, 4.0, 5.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.724607467651367, -13.31413745880127, -12.903668403625488, -12.49319839477539, -12.082728385925293, -11.672258377075195, -11.261789321899414, -10.851319313049316, -10.440849304199219, -10.030379295349121, -9.61991024017334, -9.209440231323242, -8.798970222473145, -8.388500213623047, -7.978031158447266, -7.567561149597168, -7.157092094421387, -6.746622562408447, -6.33615255355835, -5.92568302154541, -5.5152130126953125, -5.104743480682373, -4.694273948669434, -4.283803939819336, -3.8733344078063965, -3.462864637374878, -3.0523948669433594, -2.64192533493042, -2.2314555644989014, -1.8209857940673828, -1.4105162620544434, -1.0000464916229248, -0.5895767211914062, -0.17910701036453247, 0.2313627004623413, 0.6418323516845703, 1.0523021221160889, 1.4627718925476074, 1.8732414245605469, 2.2837111949920654, 2.694180965423584, 3.1046507358551025, 3.515120506286621, 3.9255900382995605, 4.3360595703125, 4.746529579162598, 5.156999111175537, 5.567468643188477, 5.977938652038574, 6.388408184051514, 6.798878192901611, 7.209347724914551, 7.619817733764648, 8.03028678894043, 8.440756797790527, 8.851226806640625, 9.261695861816406, 9.672165870666504, 10.082634925842285, 10.493104934692383, 10.90357494354248, 11.314044952392578, 11.72451400756836, 12.134984016418457, 12.545454025268555]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 7.0, 21.0, 23.0, 42.0, 61.0, 72.0, 130.0, 219.0, 382.0, 686.0, 1485.0, 3513.0, 11201.0, 55000.0, 3360339.0, 712482.0, 35262.0, 8091.0, 2688.0, 1162.0, 576.0, 315.0, 173.0, 89.0, 81.0, 50.0, 29.0, 18.0, 16.0, 17.0, 14.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.14947509765625, -2.0723876953125, -1.99530029296875, -1.918212890625, -1.84112548828125, -1.7640380859375, -1.68695068359375, -1.60986328125, -1.53277587890625, -1.4556884765625, -1.37860107421875, -1.301513671875, -1.22442626953125, -1.1473388671875, -1.07025146484375, -0.9931640625, -0.91607666015625, -0.8389892578125, -0.76190185546875, -0.684814453125, -0.60772705078125, -0.5306396484375, -0.45355224609375, -0.37646484375, -0.29937744140625, -0.2222900390625, -0.14520263671875, -0.068115234375, 0.00897216796875, 0.0860595703125, 0.16314697265625, 0.240234375, 0.31732177734375, 0.3944091796875, 0.47149658203125, 0.548583984375, 0.62567138671875, 0.7027587890625, 0.77984619140625, 0.85693359375, 0.93402099609375, 1.0111083984375, 1.08819580078125, 1.165283203125, 1.24237060546875, 1.3194580078125, 1.39654541015625, 1.4736328125, 1.55072021484375, 1.6278076171875, 1.70489501953125, 1.781982421875, 1.85906982421875, 1.9361572265625, 2.01324462890625, 2.09033203125, 2.16741943359375, 2.2445068359375, 2.32159423828125, 2.398681640625, 2.47576904296875, 2.5528564453125, 2.62994384765625, 2.70703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 7.0, 4.0, 7.0, 16.0, 16.0, 17.0, 27.0, 39.0, 54.0, 72.0, 91.0, 87.0, 100.0, 95.0, 92.0, 78.0, 61.0, 47.0, 31.0, 20.0, 12.0, 10.0, 11.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9013748168945312, -0.8686676025390625, -0.8359603881835938, -0.803253173828125, -0.7705459594726562, -0.7378387451171875, -0.7051315307617188, -0.67242431640625, -0.6397171020507812, -0.6070098876953125, -0.5743026733398438, -0.541595458984375, -0.5088882446289062, -0.4761810302734375, -0.44347381591796875, -0.4107666015625, -0.37805938720703125, -0.3453521728515625, -0.31264495849609375, -0.279937744140625, -0.24723052978515625, -0.2145233154296875, -0.18181610107421875, -0.14910888671875, -0.11640167236328125, -0.0836944580078125, -0.05098724365234375, -0.018280029296875, 0.01442718505859375, 0.0471343994140625, 0.07984161376953125, 0.112548828125, 0.14525604248046875, 0.1779632568359375, 0.21067047119140625, 0.243377685546875, 0.27608489990234375, 0.3087921142578125, 0.34149932861328125, 0.37420654296875, 0.40691375732421875, 0.4396209716796875, 0.47232818603515625, 0.505035400390625, 0.5377426147460938, 0.5704498291015625, 0.6031570434570312, 0.6358642578125, 0.6685714721679688, 0.7012786865234375, 0.7339859008789062, 0.766693115234375, 0.7994003295898438, 0.8321075439453125, 0.8648147583007812, 0.89752197265625, 0.9302291870117188, 0.9629364013671875, 0.9956436157226562, 1.028350830078125, 1.0610580444335938, 1.0937652587890625, 1.1264724731445312, 1.1591796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 8.0, 10.0, 20.0, 34.0, 77.0, 198.0, 537.0, 1691.0, 6533.0, 38230.0, 2001266.0, 2097607.0, 38747.0, 6612.0, 1739.0, 544.0, 225.0, 72.0, 40.0, 26.0, 17.0, 12.0, 3.0, 9.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.705078125, -2.6319732666015625, -2.558868408203125, -2.4857635498046875, -2.41265869140625, -2.3395538330078125, -2.266448974609375, -2.1933441162109375, -2.1202392578125, -2.0471343994140625, -1.974029541015625, -1.9009246826171875, -1.82781982421875, -1.7547149658203125, -1.681610107421875, -1.6085052490234375, -1.535400390625, -1.4622955322265625, -1.389190673828125, -1.3160858154296875, -1.24298095703125, -1.1698760986328125, -1.096771240234375, -1.0236663818359375, -0.9505615234375, -0.8774566650390625, -0.804351806640625, -0.7312469482421875, -0.65814208984375, -0.5850372314453125, -0.511932373046875, -0.4388275146484375, -0.36572265625, -0.2926177978515625, -0.219512939453125, -0.1464080810546875, -0.07330322265625, -0.0001983642578125, 0.072906494140625, 0.1460113525390625, 0.2191162109375, 0.2922210693359375, 0.365325927734375, 0.4384307861328125, 0.51153564453125, 0.5846405029296875, 0.657745361328125, 0.7308502197265625, 0.803955078125, 0.8770599365234375, 0.950164794921875, 1.0232696533203125, 1.09637451171875, 1.1694793701171875, 1.242584228515625, 1.3156890869140625, 1.3887939453125, 1.4618988037109375, 1.535003662109375, 1.6081085205078125, 1.68121337890625, 1.7543182373046875, 1.827423095703125, 1.9005279541015625, 1.9736328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 5.0, 3.0, 13.0, 8.0, 7.0, 15.0, 26.0, 31.0, 52.0, 115.0, 225.0, 590.0, 1550.0, 802.0, 271.0, 136.0, 67.0, 44.0, 21.0, 22.0, 19.0, 10.0, 4.0, 5.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0087890625, -0.981964111328125, -0.95513916015625, -0.928314208984375, -0.9014892578125, -0.874664306640625, -0.84783935546875, -0.821014404296875, -0.794189453125, -0.767364501953125, -0.74053955078125, -0.713714599609375, -0.6868896484375, -0.660064697265625, -0.63323974609375, -0.606414794921875, -0.57958984375, -0.552764892578125, -0.52593994140625, -0.499114990234375, -0.4722900390625, -0.445465087890625, -0.41864013671875, -0.391815185546875, -0.364990234375, -0.338165283203125, -0.31134033203125, -0.284515380859375, -0.2576904296875, -0.230865478515625, -0.20404052734375, -0.177215576171875, -0.150390625, -0.123565673828125, -0.09674072265625, -0.069915771484375, -0.0430908203125, -0.016265869140625, 0.01055908203125, 0.037384033203125, 0.064208984375, 0.091033935546875, 0.11785888671875, 0.144683837890625, 0.1715087890625, 0.198333740234375, 0.22515869140625, 0.251983642578125, 0.27880859375, 0.305633544921875, 0.33245849609375, 0.359283447265625, 0.3861083984375, 0.412933349609375, 0.43975830078125, 0.466583251953125, 0.493408203125, 0.520233154296875, 0.54705810546875, 0.573883056640625, 0.6007080078125, 0.627532958984375, 0.65435791015625, 0.681182861328125, 0.7080078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 21.0, 84.0, 246.0, 348.0, 198.0, 71.0, 16.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.857562065124512, -4.604931354522705, -4.352300643920898, -4.099669456481934, -3.847038745880127, -3.5944080352783203, -3.3417770862579346, -3.089146137237549, -2.836515426635742, -2.5838847160339355, -2.33125376701355, -2.078622817993164, -1.8259921073913574, -1.5733612775802612, -1.320730447769165, -1.0680996179580688, -0.8154687881469727, -0.5628379583358765, -0.3102071285247803, -0.05757629871368408, 0.1950545310974121, 0.4476853609085083, 0.7003161907196045, 0.9529470205307007, 1.2055778503417969, 1.458208680152893, 1.7108395099639893, 1.9634703397750854, 2.2161011695861816, 2.4687318801879883, 2.721362829208374, 2.9739937782287598, 3.2266244888305664, 3.479255199432373, 3.731886148452759, 3.9845170974731445, 4.237147808074951, 4.489778518676758, 4.742409706115723, 4.995040416717529, 5.247671127319336, 5.500301837921143, 5.752932548522949, 6.005563735961914, 6.258194446563721, 6.510825157165527, 6.763456344604492, 7.016087055206299, 7.2687177658081055, 7.521348476409912, 7.773979187011719, 8.026610374450684, 8.279241561889648, 8.531871795654297, 8.784502983093262, 9.03713321685791, 9.289764404296875, 9.54239559173584, 9.795025825500488, 10.047657012939453, 10.300287246704102, 10.552918434143066, 10.805549621582031, 11.05817985534668, 11.310811042785645]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 9.0, 11.0, 17.0, 11.0, 16.0, 16.0, 15.0, 21.0, 24.0, 27.0, 34.0, 34.0, 46.0, 37.0, 31.0, 37.0, 35.0, 36.0, 47.0, 34.0, 45.0, 41.0, 42.0, 27.0, 35.0, 28.0, 30.0, 34.0, 23.0, 28.0, 16.0, 13.0, 10.0, 9.0, 9.0, 8.0, 8.0, 10.0, 4.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.3183841705322266, -2.2475078105926514, -2.176631450653076, -2.105755090713501, -2.034878730773926, -1.9640023708343506, -1.8931260108947754, -1.8222496509552002, -1.751373291015625, -1.6804969310760498, -1.6096205711364746, -1.5387442111968994, -1.4678678512573242, -1.396991491317749, -1.3261151313781738, -1.2552387714385986, -1.1843622922897339, -1.1134859323501587, -1.0426095724105835, -0.9717332124710083, -0.9008568525314331, -0.8299804925918579, -0.7591040730476379, -0.6882277131080627, -0.6173513531684875, -0.5464749932289124, -0.47559863328933716, -0.4047222435474396, -0.3338458836078644, -0.2629695236682892, -0.1920931339263916, -0.1212167739868164, -0.05034041404724121, 0.02053595334291458, 0.09141232073307037, 0.16228869557380676, 0.23316505551338196, 0.30404141545295715, 0.37491780519485474, 0.44579416513442993, 0.5166705250740051, 0.5875468850135803, 0.6584232449531555, 0.7292996644973755, 0.8001760244369507, 0.8710523843765259, 0.9419287443161011, 1.0128051042556763, 1.0836814641952515, 1.1545578241348267, 1.2254341840744019, 1.296310544013977, 1.3671869039535522, 1.4380632638931274, 1.5089397430419922, 1.5798161029815674, 1.6506924629211426, 1.7215688228607178, 1.792445182800293, 1.8633215427398682, 1.9341979026794434, 2.0050742626190186, 2.0759506225585938, 2.146826982498169, 2.217703342437744]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 12.0, 20.0, 23.0, 46.0, 58.0, 80.0, 126.0, 201.0, 321.0, 535.0, 1099.0, 2260.0, 5716.0, 19361.0, 93975.0, 525201.0, 326163.0, 52808.0, 12537.0, 4243.0, 1702.0, 842.0, 452.0, 265.0, 162.0, 114.0, 62.0, 34.0, 41.0, 30.0, 13.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.274627685546875, -2.19573974609375, -2.116851806640625, -2.0379638671875, -1.959075927734375, -1.88018798828125, -1.801300048828125, -1.722412109375, -1.643524169921875, -1.56463623046875, -1.485748291015625, -1.4068603515625, -1.327972412109375, -1.24908447265625, -1.170196533203125, -1.09130859375, -1.012420654296875, -0.93353271484375, -0.854644775390625, -0.7757568359375, -0.696868896484375, -0.61798095703125, -0.539093017578125, -0.460205078125, -0.381317138671875, -0.30242919921875, -0.223541259765625, -0.1446533203125, -0.065765380859375, 0.01312255859375, 0.092010498046875, 0.1708984375, 0.249786376953125, 0.32867431640625, 0.407562255859375, 0.4864501953125, 0.565338134765625, 0.64422607421875, 0.723114013671875, 0.802001953125, 0.880889892578125, 0.95977783203125, 1.038665771484375, 1.1175537109375, 1.196441650390625, 1.27532958984375, 1.354217529296875, 1.43310546875, 1.511993408203125, 1.59088134765625, 1.669769287109375, 1.7486572265625, 1.827545166015625, 1.90643310546875, 1.985321044921875, 2.064208984375, 2.143096923828125, 2.22198486328125, 2.300872802734375, 2.3797607421875, 2.458648681640625, 2.53753662109375, 2.616424560546875, 2.6953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 13.0, 22.0, 25.0, 35.0, 39.0, 67.0, 90.0, 104.0, 101.0, 89.0, 96.0, 95.0, 61.0, 50.0, 35.0, 21.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9285125732421875, -0.895111083984375, -0.8617095947265625, -0.82830810546875, -0.7949066162109375, -0.761505126953125, -0.7281036376953125, -0.6947021484375, -0.6613006591796875, -0.627899169921875, -0.5944976806640625, -0.56109619140625, -0.5276947021484375, -0.494293212890625, -0.4608917236328125, -0.427490234375, -0.3940887451171875, -0.360687255859375, -0.3272857666015625, -0.29388427734375, -0.2604827880859375, -0.227081298828125, -0.1936798095703125, -0.1602783203125, -0.1268768310546875, -0.093475341796875, -0.0600738525390625, -0.02667236328125, 0.0067291259765625, 0.040130615234375, 0.0735321044921875, 0.10693359375, 0.1403350830078125, 0.173736572265625, 0.2071380615234375, 0.24053955078125, 0.2739410400390625, 0.307342529296875, 0.3407440185546875, 0.3741455078125, 0.4075469970703125, 0.440948486328125, 0.4743499755859375, 0.50775146484375, 0.5411529541015625, 0.574554443359375, 0.6079559326171875, 0.641357421875, 0.6747589111328125, 0.708160400390625, 0.7415618896484375, 0.77496337890625, 0.8083648681640625, 0.841766357421875, 0.8751678466796875, 0.9085693359375, 0.9419708251953125, 0.975372314453125, 1.0087738037109375, 1.04217529296875, 1.0755767822265625, 1.108978271484375, 1.1423797607421875, 1.17578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 5.0, 5.0, 9.0, 18.0, 30.0, 26.0, 45.0, 53.0, 62.0, 72.0, 134.0, 138.0, 224.0, 367.0, 547.0, 1136.0, 3134.0, 14244.0, 111635.0, 640837.0, 239749.0, 27501.0, 4920.0, 1503.0, 716.0, 396.0, 294.0, 185.0, 144.0, 93.0, 78.0, 54.0, 37.0, 30.0, 26.0, 22.0, 13.0, 9.0, 16.0, 10.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.619140625, -2.538970947265625, -2.45880126953125, -2.378631591796875, -2.2984619140625, -2.218292236328125, -2.13812255859375, -2.057952880859375, -1.977783203125, -1.897613525390625, -1.81744384765625, -1.737274169921875, -1.6571044921875, -1.576934814453125, -1.49676513671875, -1.416595458984375, -1.33642578125, -1.256256103515625, -1.17608642578125, -1.095916748046875, -1.0157470703125, -0.935577392578125, -0.85540771484375, -0.775238037109375, -0.695068359375, -0.614898681640625, -0.53472900390625, -0.454559326171875, -0.3743896484375, -0.294219970703125, -0.21405029296875, -0.133880615234375, -0.0537109375, 0.026458740234375, 0.10662841796875, 0.186798095703125, 0.2669677734375, 0.347137451171875, 0.42730712890625, 0.507476806640625, 0.587646484375, 0.667816162109375, 0.74798583984375, 0.828155517578125, 0.9083251953125, 0.988494873046875, 1.06866455078125, 1.148834228515625, 1.22900390625, 1.309173583984375, 1.38934326171875, 1.469512939453125, 1.5496826171875, 1.629852294921875, 1.71002197265625, 1.790191650390625, 1.870361328125, 1.950531005859375, 2.03070068359375, 2.110870361328125, 2.1910400390625, 2.271209716796875, 2.35137939453125, 2.431549072265625, 2.51171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 4.0, 11.0, 15.0, 9.0, 18.0, 21.0, 22.0, 27.0, 39.0, 38.0, 32.0, 46.0, 44.0, 49.0, 57.0, 46.0, 75.0, 58.0, 38.0, 41.0, 49.0, 37.0, 30.0, 39.0, 31.0, 21.0, 20.0, 15.0, 9.0, 10.0, 4.0, 4.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.650787353515625, -2.57110595703125, -2.491424560546875, -2.4117431640625, -2.332061767578125, -2.25238037109375, -2.172698974609375, -2.093017578125, -2.013336181640625, -1.93365478515625, -1.853973388671875, -1.7742919921875, -1.694610595703125, -1.61492919921875, -1.535247802734375, -1.45556640625, -1.375885009765625, -1.29620361328125, -1.216522216796875, -1.1368408203125, -1.057159423828125, -0.97747802734375, -0.897796630859375, -0.818115234375, -0.738433837890625, -0.65875244140625, -0.579071044921875, -0.4993896484375, -0.419708251953125, -0.34002685546875, -0.260345458984375, -0.1806640625, -0.100982666015625, -0.02130126953125, 0.058380126953125, 0.1380615234375, 0.217742919921875, 0.29742431640625, 0.377105712890625, 0.456787109375, 0.536468505859375, 0.61614990234375, 0.695831298828125, 0.7755126953125, 0.855194091796875, 0.93487548828125, 1.014556884765625, 1.09423828125, 1.173919677734375, 1.25360107421875, 1.333282470703125, 1.4129638671875, 1.492645263671875, 1.57232666015625, 1.652008056640625, 1.731689453125, 1.811370849609375, 1.89105224609375, 1.970733642578125, 2.0504150390625, 2.130096435546875, 2.20977783203125, 2.289459228515625, 2.369140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 3.0, 20.0, 24.0, 41.0, 86.0, 192.0, 403.0, 1460.0, 7602.0, 75254.0, 867516.0, 85440.0, 8198.0, 1531.0, 424.0, 163.0, 81.0, 44.0, 32.0, 17.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82080078125, -0.7826614379882812, -0.7445220947265625, -0.7063827514648438, -0.668243408203125, -0.6301040649414062, -0.5919647216796875, -0.5538253784179688, -0.51568603515625, -0.47754669189453125, -0.4394073486328125, -0.40126800537109375, -0.363128662109375, -0.32498931884765625, -0.2868499755859375, -0.24871063232421875, -0.2105712890625, -0.17243194580078125, -0.1342926025390625, -0.09615325927734375, -0.058013916015625, -0.01987457275390625, 0.0182647705078125, 0.05640411376953125, 0.09454345703125, 0.13268280029296875, 0.1708221435546875, 0.20896148681640625, 0.247100830078125, 0.28524017333984375, 0.3233795166015625, 0.36151885986328125, 0.399658203125, 0.43779754638671875, 0.4759368896484375, 0.5140762329101562, 0.552215576171875, 0.5903549194335938, 0.6284942626953125, 0.6666336059570312, 0.70477294921875, 0.7429122924804688, 0.7810516357421875, 0.8191909790039062, 0.857330322265625, 0.8954696655273438, 0.9336090087890625, 0.9717483520507812, 1.0098876953125, 1.0480270385742188, 1.0861663818359375, 1.1243057250976562, 1.162445068359375, 1.2005844116210938, 1.2387237548828125, 1.2768630981445312, 1.31500244140625, 1.3531417846679688, 1.3912811279296875, 1.4294204711914062, 1.467559814453125, 1.5056991577148438, 1.5438385009765625, 1.5819778442382812, 1.6201171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 10.0, 5.0, 8.0, 10.0, 20.0, 22.0, 25.0, 31.0, 41.0, 77.0, 144.0, 184.0, 146.0, 81.0, 45.0, 26.0, 17.0, 19.0, 16.0, 12.0, 11.0, 9.0, 7.0, 5.0, 1.0, 7.0, 0.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001761913299560547, -0.0001709330826997757, -0.0001656748354434967, -0.0001604165881872177, -0.00015515834093093872, -0.00014990009367465973, -0.00014464184641838074, -0.00013938359916210175, -0.00013412535190582275, -0.00012886710464954376, -0.00012360885739326477, -0.00011835061013698578, -0.00011309236288070679, -0.0001078341156244278, -0.0001025758683681488, -9.731762111186981e-05, -9.205937385559082e-05, -8.680112659931183e-05, -8.154287934303284e-05, -7.628463208675385e-05, -7.102638483047485e-05, -6.576813757419586e-05, -6.050989031791687e-05, -5.525164306163788e-05, -4.999339580535889e-05, -4.4735148549079895e-05, -3.94769012928009e-05, -3.421865403652191e-05, -2.896040678024292e-05, -2.3702159523963928e-05, -1.8443912267684937e-05, -1.3185665011405945e-05, -7.927417755126953e-06, -2.6691704988479614e-06, 2.5890767574310303e-06, 7.847324013710022e-06, 1.3105571269989014e-05, 1.8363818526268005e-05, 2.3622065782546997e-05, 2.888031303882599e-05, 3.413856029510498e-05, 3.939680755138397e-05, 4.4655054807662964e-05, 4.9913302063941956e-05, 5.517154932022095e-05, 6.042979657649994e-05, 6.568804383277893e-05, 7.094629108905792e-05, 7.620453834533691e-05, 8.14627856016159e-05, 8.67210328578949e-05, 9.197928011417389e-05, 9.723752737045288e-05, 0.00010249577462673187, 0.00010775402188301086, 0.00011301226913928986, 0.00011827051639556885, 0.00012352876365184784, 0.00012878701090812683, 0.00013404525816440582, 0.00013930350542068481, 0.0001445617526769638, 0.0001498199999332428, 0.0001550782471895218, 0.00016033649444580078]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 14.0, 21.0, 26.0, 58.0, 68.0, 114.0, 259.0, 535.0, 1617.0, 8625.0, 128962.0, 864997.0, 37505.0, 3853.0, 1004.0, 366.0, 232.0, 99.0, 61.0, 36.0, 21.0, 15.0, 11.0, 9.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.233062744140625, -1.19366455078125, -1.154266357421875, -1.1148681640625, -1.075469970703125, -1.03607177734375, -0.996673583984375, -0.957275390625, -0.917877197265625, -0.87847900390625, -0.839080810546875, -0.7996826171875, -0.760284423828125, -0.72088623046875, -0.681488037109375, -0.64208984375, -0.602691650390625, -0.56329345703125, -0.523895263671875, -0.4844970703125, -0.445098876953125, -0.40570068359375, -0.366302490234375, -0.326904296875, -0.287506103515625, -0.24810791015625, -0.208709716796875, -0.1693115234375, -0.129913330078125, -0.09051513671875, -0.051116943359375, -0.01171875, 0.027679443359375, 0.06707763671875, 0.106475830078125, 0.1458740234375, 0.185272216796875, 0.22467041015625, 0.264068603515625, 0.303466796875, 0.342864990234375, 0.38226318359375, 0.421661376953125, 0.4610595703125, 0.500457763671875, 0.53985595703125, 0.579254150390625, 0.61865234375, 0.658050537109375, 0.69744873046875, 0.736846923828125, 0.7762451171875, 0.815643310546875, 0.85504150390625, 0.894439697265625, 0.933837890625, 0.973236083984375, 1.01263427734375, 1.052032470703125, 1.0914306640625, 1.130828857421875, 1.17022705078125, 1.209625244140625, 1.2490234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 10.0, 4.0, 7.0, 10.0, 11.0, 20.0, 19.0, 31.0, 48.0, 71.0, 98.0, 107.0, 115.0, 96.0, 98.0, 67.0, 50.0, 32.0, 13.0, 18.0, 13.0, 14.0, 9.0, 7.0, 12.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.51611328125, -0.498046875, -0.47998046875, -0.4619140625, -0.44384765625, -0.42578125, -0.40771484375, -0.3896484375, -0.37158203125, -0.353515625, -0.33544921875, -0.3173828125, -0.29931640625, -0.28125, -0.26318359375, -0.2451171875, -0.22705078125, -0.208984375, -0.19091796875, -0.1728515625, -0.15478515625, -0.13671875, -0.11865234375, -0.1005859375, -0.08251953125, -0.064453125, -0.04638671875, -0.0283203125, -0.01025390625, 0.0078125, 0.02587890625, 0.0439453125, 0.06201171875, 0.080078125, 0.09814453125, 0.1162109375, 0.13427734375, 0.15234375, 0.17041015625, 0.1884765625, 0.20654296875, 0.224609375, 0.24267578125, 0.2607421875, 0.27880859375, 0.296875, 0.31494140625, 0.3330078125, 0.35107421875, 0.369140625, 0.38720703125, 0.4052734375, 0.42333984375, 0.44140625, 0.45947265625, 0.4775390625, 0.49560546875, 0.513671875, 0.53173828125, 0.5498046875, 0.56787109375, 0.5859375, 0.60400390625, 0.6220703125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 29.0, 63.0, 218.0, 342.0, 225.0, 92.0, 22.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.154958724975586, -20.29647445678711, -19.43798828125, -18.579504013061523, -17.721019744873047, -16.862533569335938, -16.00404930114746, -15.145564079284668, -14.287078857421875, -13.428593635559082, -12.570108413696289, -11.711624145507812, -10.85313892364502, -9.994653701782227, -9.13616943359375, -8.277684211730957, -7.419198989868164, -6.560713768005371, -5.702229022979736, -4.843744277954102, -3.9852590560913086, -3.1267738342285156, -2.268289089202881, -1.409804344177246, -0.5513191223144531, 0.30716586112976074, 1.1656508445739746, 2.0241358280181885, 2.8826208114624023, 3.7411060333251953, 4.59959077835083, 5.458075523376465, 6.316558837890625, 7.175044059753418, 8.033529281616211, 8.892013549804688, 9.75049877166748, 10.608983993530273, 11.46746826171875, 12.325953483581543, 13.184438705444336, 14.042923927307129, 14.901409149169922, 15.759893417358398, 16.618377685546875, 17.476863861083984, 18.33534812927246, 19.193832397460938, 20.052318572998047, 20.910802841186523, 21.769289016723633, 22.62777328491211, 23.48625946044922, 24.344743728637695, 25.203227996826172, 26.06171417236328, 26.920198440551758, 27.778682708740234, 28.637168884277344, 29.49565315246582, 30.354137420654297, 31.212623596191406, 32.071109771728516, 32.92959213256836, 33.78807830810547]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 9.0, 10.0, 16.0, 20.0, 21.0, 19.0, 22.0, 36.0, 44.0, 42.0, 37.0, 41.0, 52.0, 37.0, 40.0, 35.0, 47.0, 49.0, 49.0, 36.0, 39.0, 34.0, 33.0, 30.0, 39.0, 22.0, 20.0, 19.0, 15.0, 12.0, 10.0, 10.0, 11.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.42428207397461, -14.031539916992188, -13.638798713684082, -13.24605655670166, -12.853315353393555, -12.460573196411133, -12.067831039428711, -11.675089836120605, -11.282347679138184, -10.889605522155762, -10.496864318847656, -10.104122161865234, -9.711380958557129, -9.318638801574707, -8.925897598266602, -8.53315544128418, -8.140413284301758, -7.747671604156494, -7.3549299240112305, -6.962187767028809, -6.569446086883545, -6.176704406738281, -5.783962726593018, -5.391221046447754, -4.998479843139648, -4.605738162994385, -4.212996482849121, -3.8202545642852783, -3.4275126457214355, -3.034770965576172, -2.642029285430908, -2.2492873668670654, -1.8565454483032227, -1.4638036489486694, -1.0710618495941162, -0.6783201694488525, -0.2855783700942993, 0.1071634292602539, 0.4999051094055176, 0.8926470279693604, 1.285388708114624, 1.6781305074691772, 2.0708723068237305, 2.463613986968994, 2.856355667114258, 3.2490975856781006, 3.6418392658233643, 4.034581184387207, 4.427322864532471, 4.820064544677734, 5.212806224822998, 5.605547904968262, 5.998290061950684, 6.391031742095947, 6.783773422241211, 7.176515579223633, 7.569256782531738, 7.961998462677002, 8.354740142822266, 8.747482299804688, 9.140223503112793, 9.532965660095215, 9.92570686340332, 10.318449020385742, 10.711191177368164]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 8.0, 3.0, 14.0, 12.0, 18.0, 34.0, 38.0, 63.0, 86.0, 130.0, 241.0, 382.0, 727.0, 1362.0, 3068.0, 7530.0, 25819.0, 214233.0, 3802029.0, 109262.0, 18736.0, 5781.0, 2318.0, 1039.0, 499.0, 308.0, 185.0, 121.0, 64.0, 40.0, 36.0, 21.0, 20.0, 12.0, 13.0, 8.0, 5.0, 9.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.23828125, -2.169158935546875, -2.10003662109375, -2.030914306640625, -1.9617919921875, -1.892669677734375, -1.82354736328125, -1.754425048828125, -1.685302734375, -1.616180419921875, -1.54705810546875, -1.477935791015625, -1.4088134765625, -1.339691162109375, -1.27056884765625, -1.201446533203125, -1.13232421875, -1.063201904296875, -0.99407958984375, -0.924957275390625, -0.8558349609375, -0.786712646484375, -0.71759033203125, -0.648468017578125, -0.579345703125, -0.510223388671875, -0.44110107421875, -0.371978759765625, -0.3028564453125, -0.233734130859375, -0.16461181640625, -0.095489501953125, -0.0263671875, 0.042755126953125, 0.11187744140625, 0.180999755859375, 0.2501220703125, 0.319244384765625, 0.38836669921875, 0.457489013671875, 0.526611328125, 0.595733642578125, 0.66485595703125, 0.733978271484375, 0.8031005859375, 0.872222900390625, 0.94134521484375, 1.010467529296875, 1.07958984375, 1.148712158203125, 1.21783447265625, 1.286956787109375, 1.3560791015625, 1.425201416015625, 1.49432373046875, 1.563446044921875, 1.632568359375, 1.701690673828125, 1.77081298828125, 1.839935302734375, 1.9090576171875, 1.978179931640625, 2.04730224609375, 2.116424560546875, 2.185546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 13.0, 19.0, 27.0, 41.0, 60.0, 57.0, 86.0, 94.0, 113.0, 107.0, 79.0, 81.0, 61.0, 45.0, 36.0, 16.0, 20.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1225128173828125, -1.085845947265625, -1.0491790771484375, -1.01251220703125, -0.9758453369140625, -0.939178466796875, -0.9025115966796875, -0.8658447265625, -0.8291778564453125, -0.792510986328125, -0.7558441162109375, -0.71917724609375, -0.6825103759765625, -0.645843505859375, -0.6091766357421875, -0.572509765625, -0.5358428955078125, -0.499176025390625, -0.4625091552734375, -0.42584228515625, -0.3891754150390625, -0.352508544921875, -0.3158416748046875, -0.2791748046875, -0.2425079345703125, -0.205841064453125, -0.1691741943359375, -0.13250732421875, -0.0958404541015625, -0.059173583984375, -0.0225067138671875, 0.01416015625, 0.0508270263671875, 0.087493896484375, 0.1241607666015625, 0.16082763671875, 0.1974945068359375, 0.234161376953125, 0.2708282470703125, 0.3074951171875, 0.3441619873046875, 0.380828857421875, 0.4174957275390625, 0.45416259765625, 0.4908294677734375, 0.527496337890625, 0.5641632080078125, 0.600830078125, 0.6374969482421875, 0.674163818359375, 0.7108306884765625, 0.74749755859375, 0.7841644287109375, 0.820831298828125, 0.8574981689453125, 0.8941650390625, 0.9308319091796875, 0.967498779296875, 1.0041656494140625, 1.04083251953125, 1.0774993896484375, 1.114166259765625, 1.1508331298828125, 1.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 24.0, 27.0, 43.0, 92.0, 172.0, 390.0, 1670.0, 13322.0, 1667219.0, 2493786.0, 14864.0, 1890.0, 452.0, 131.0, 83.0, 46.0, 26.0, 15.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.816162109375, -4.69873046875, -4.581298828125, -4.4638671875, -4.346435546875, -4.22900390625, -4.111572265625, -3.994140625, -3.876708984375, -3.75927734375, -3.641845703125, -3.5244140625, -3.406982421875, -3.28955078125, -3.172119140625, -3.0546875, -2.937255859375, -2.81982421875, -2.702392578125, -2.5849609375, -2.467529296875, -2.35009765625, -2.232666015625, -2.115234375, -1.997802734375, -1.88037109375, -1.762939453125, -1.6455078125, -1.528076171875, -1.41064453125, -1.293212890625, -1.17578125, -1.058349609375, -0.94091796875, -0.823486328125, -0.7060546875, -0.588623046875, -0.47119140625, -0.353759765625, -0.236328125, -0.118896484375, -0.00146484375, 0.115966796875, 0.2333984375, 0.350830078125, 0.46826171875, 0.585693359375, 0.703125, 0.820556640625, 0.93798828125, 1.055419921875, 1.1728515625, 1.290283203125, 1.40771484375, 1.525146484375, 1.642578125, 1.760009765625, 1.87744140625, 1.994873046875, 2.1123046875, 2.229736328125, 2.34716796875, 2.464599609375, 2.58203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 15.0, 43.0, 76.0, 200.0, 1268.0, 2043.0, 247.0, 77.0, 35.0, 20.0, 11.0, 8.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.966796875, -1.92218017578125, -1.8775634765625, -1.83294677734375, -1.788330078125, -1.74371337890625, -1.6990966796875, -1.65447998046875, -1.60986328125, -1.56524658203125, -1.5206298828125, -1.47601318359375, -1.431396484375, -1.38677978515625, -1.3421630859375, -1.29754638671875, -1.2529296875, -1.20831298828125, -1.1636962890625, -1.11907958984375, -1.074462890625, -1.02984619140625, -0.9852294921875, -0.94061279296875, -0.89599609375, -0.85137939453125, -0.8067626953125, -0.76214599609375, -0.717529296875, -0.67291259765625, -0.6282958984375, -0.58367919921875, -0.5390625, -0.49444580078125, -0.4498291015625, -0.40521240234375, -0.360595703125, -0.31597900390625, -0.2713623046875, -0.22674560546875, -0.18212890625, -0.13751220703125, -0.0928955078125, -0.04827880859375, -0.003662109375, 0.04095458984375, 0.0855712890625, 0.13018798828125, 0.1748046875, 0.21942138671875, 0.2640380859375, 0.30865478515625, 0.353271484375, 0.39788818359375, 0.4425048828125, 0.48712158203125, 0.53173828125, 0.57635498046875, 0.6209716796875, 0.66558837890625, 0.710205078125, 0.75482177734375, 0.7994384765625, 0.84405517578125, 0.888671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 38.0, 117.0, 233.0, 275.0, 176.0, 105.0, 27.0, 15.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.992796421051025, -6.801046371459961, -6.609296798706055, -6.417547225952148, -6.225797176361084, -6.0340471267700195, -5.842297554016113, -5.650547981262207, -5.458797931671143, -5.267047882080078, -5.075298309326172, -4.883548736572266, -4.691798686981201, -4.500048637390137, -4.3082990646362305, -4.116549491882324, -3.9247994422912598, -3.7330496311187744, -3.541299819946289, -3.3495500087738037, -3.1578001976013184, -2.966050386428833, -2.7743005752563477, -2.5825507640838623, -2.390800952911377, -2.1990511417388916, -2.0073013305664062, -1.815551519393921, -1.6238017082214355, -1.4320518970489502, -1.2403020858764648, -1.0485522747039795, -0.8568029403686523, -0.665053129196167, -0.47330331802368164, -0.2815535068511963, -0.08980369567871094, 0.10194611549377441, 0.29369592666625977, 0.4854457378387451, 0.6771955490112305, 0.8689453601837158, 1.0606951713562012, 1.2524449825286865, 1.4441947937011719, 1.6359446048736572, 1.8276944160461426, 2.019444227218628, 2.2111940383911133, 2.4029438495635986, 2.594693660736084, 2.7864434719085693, 2.9781932830810547, 3.16994309425354, 3.3616929054260254, 3.5534427165985107, 3.745192527770996, 3.9369423389434814, 4.128692150115967, 4.320442199707031, 4.5121917724609375, 4.703941345214844, 4.895691394805908, 5.087441444396973, 5.279191017150879]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 13.0, 22.0, 22.0, 22.0, 27.0, 32.0, 41.0, 52.0, 36.0, 39.0, 42.0, 63.0, 49.0, 46.0, 64.0, 44.0, 35.0, 49.0, 47.0, 35.0, 43.0, 37.0, 27.0, 14.0, 15.0, 12.0, 12.0, 5.0, 6.0, 3.0, 4.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7964301109313965, -2.7224783897399902, -2.648526668548584, -2.5745749473571777, -2.5006232261657715, -2.4266717433929443, -2.352720022201538, -2.278768301010132, -2.2048165798187256, -2.1308648586273193, -2.056913137435913, -1.9829615354537964, -1.9090098142623901, -1.8350580930709839, -1.7611064910888672, -1.687154769897461, -1.6132030487060547, -1.5392513275146484, -1.4652996063232422, -1.3913480043411255, -1.3173962831497192, -1.243444561958313, -1.1694929599761963, -1.09554123878479, -1.0215895175933838, -0.9476377964019775, -0.8736861348152161, -0.7997344732284546, -0.7257827520370483, -0.6518310308456421, -0.5778793692588806, -0.5039277076721191, -0.4299759864807129, -0.35602429509162903, -0.28207260370254517, -0.2081209123134613, -0.13416922092437744, -0.06021752953529358, 0.013734161853790283, 0.08768582344055176, 0.161637544631958, 0.23558923602104187, 0.30954092741012573, 0.3834926187992096, 0.45744431018829346, 0.5313960313796997, 0.6053476929664612, 0.6792993545532227, 0.7532510757446289, 0.8272027969360352, 0.9011544585227966, 0.9751061201095581, 1.0490578413009644, 1.1230095624923706, 1.1969611644744873, 1.2709128856658936, 1.3448646068572998, 1.418816328048706, 1.4927680492401123, 1.566719651222229, 1.6406713724136353, 1.7146230936050415, 1.7885746955871582, 1.8625264167785645, 1.9364781379699707]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 13.0, 19.0, 26.0, 48.0, 79.0, 106.0, 240.0, 426.0, 899.0, 2224.0, 7812.0, 45435.0, 374305.0, 527171.0, 73629.0, 11037.0, 2863.0, 1103.0, 520.0, 246.0, 114.0, 98.0, 54.0, 29.0, 17.0, 11.0, 7.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.21484375, -3.125823974609375, -3.03680419921875, -2.947784423828125, -2.8587646484375, -2.769744873046875, -2.68072509765625, -2.591705322265625, -2.502685546875, -2.413665771484375, -2.32464599609375, -2.235626220703125, -2.1466064453125, -2.057586669921875, -1.96856689453125, -1.879547119140625, -1.79052734375, -1.701507568359375, -1.61248779296875, -1.523468017578125, -1.4344482421875, -1.345428466796875, -1.25640869140625, -1.167388916015625, -1.078369140625, -0.989349365234375, -0.90032958984375, -0.811309814453125, -0.7222900390625, -0.633270263671875, -0.54425048828125, -0.455230712890625, -0.3662109375, -0.277191162109375, -0.18817138671875, -0.099151611328125, -0.0101318359375, 0.078887939453125, 0.16790771484375, 0.256927490234375, 0.345947265625, 0.434967041015625, 0.52398681640625, 0.613006591796875, 0.7020263671875, 0.791046142578125, 0.88006591796875, 0.969085693359375, 1.05810546875, 1.147125244140625, 1.23614501953125, 1.325164794921875, 1.4141845703125, 1.503204345703125, 1.59222412109375, 1.681243896484375, 1.770263671875, 1.859283447265625, 1.94830322265625, 2.037322998046875, 2.1263427734375, 2.215362548828125, 2.30438232421875, 2.393402099609375, 2.482421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 10.0, 8.0, 20.0, 27.0, 37.0, 61.0, 65.0, 56.0, 115.0, 92.0, 112.0, 98.0, 83.0, 63.0, 52.0, 32.0, 16.0, 23.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1455078125, -1.1083984375, -1.0712890625, -1.0341796875, -0.9970703125, -0.9599609375, -0.9228515625, -0.8857421875, -0.8486328125, -0.8115234375, -0.7744140625, -0.7373046875, -0.7001953125, -0.6630859375, -0.6259765625, -0.5888671875, -0.5517578125, -0.5146484375, -0.4775390625, -0.4404296875, -0.4033203125, -0.3662109375, -0.3291015625, -0.2919921875, -0.2548828125, -0.2177734375, -0.1806640625, -0.1435546875, -0.1064453125, -0.0693359375, -0.0322265625, 0.0048828125, 0.0419921875, 0.0791015625, 0.1162109375, 0.1533203125, 0.1904296875, 0.2275390625, 0.2646484375, 0.3017578125, 0.3388671875, 0.3759765625, 0.4130859375, 0.4501953125, 0.4873046875, 0.5244140625, 0.5615234375, 0.5986328125, 0.6357421875, 0.6728515625, 0.7099609375, 0.7470703125, 0.7841796875, 0.8212890625, 0.8583984375, 0.8955078125, 0.9326171875, 0.9697265625, 1.0068359375, 1.0439453125, 1.0810546875, 1.1181640625, 1.1552734375, 1.1923828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 10.0, 11.0, 9.0, 15.0, 24.0, 39.0, 32.0, 40.0, 70.0, 89.0, 122.0, 169.0, 284.0, 478.0, 1257.0, 4693.0, 25043.0, 183206.0, 638629.0, 164845.0, 22557.0, 4302.0, 1241.0, 478.0, 271.0, 176.0, 104.0, 84.0, 66.0, 47.0, 41.0, 31.0, 17.0, 22.0, 10.0, 4.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.256683349609375, -2.17742919921875, -2.098175048828125, -2.0189208984375, -1.939666748046875, -1.86041259765625, -1.781158447265625, -1.701904296875, -1.622650146484375, -1.54339599609375, -1.464141845703125, -1.3848876953125, -1.305633544921875, -1.22637939453125, -1.147125244140625, -1.06787109375, -0.988616943359375, -0.90936279296875, -0.830108642578125, -0.7508544921875, -0.671600341796875, -0.59234619140625, -0.513092041015625, -0.433837890625, -0.354583740234375, -0.27532958984375, -0.196075439453125, -0.1168212890625, -0.037567138671875, 0.04168701171875, 0.120941162109375, 0.2001953125, 0.279449462890625, 0.35870361328125, 0.437957763671875, 0.5172119140625, 0.596466064453125, 0.67572021484375, 0.754974365234375, 0.834228515625, 0.913482666015625, 0.99273681640625, 1.071990966796875, 1.1512451171875, 1.230499267578125, 1.30975341796875, 1.389007568359375, 1.46826171875, 1.547515869140625, 1.62677001953125, 1.706024169921875, 1.7852783203125, 1.864532470703125, 1.94378662109375, 2.023040771484375, 2.102294921875, 2.181549072265625, 2.26080322265625, 2.340057373046875, 2.4193115234375, 2.498565673828125, 2.57781982421875, 2.657073974609375, 2.736328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 5.0, 15.0, 9.0, 7.0, 20.0, 20.0, 20.0, 18.0, 24.0, 31.0, 27.0, 35.0, 33.0, 40.0, 35.0, 53.0, 53.0, 56.0, 39.0, 45.0, 41.0, 39.0, 41.0, 31.0, 33.0, 18.0, 33.0, 31.0, 25.0, 13.0, 17.0, 12.0, 17.0, 11.0, 6.0, 7.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2578125, -2.18255615234375, -2.1072998046875, -2.03204345703125, -1.956787109375, -1.88153076171875, -1.8062744140625, -1.73101806640625, -1.65576171875, -1.58050537109375, -1.5052490234375, -1.42999267578125, -1.354736328125, -1.27947998046875, -1.2042236328125, -1.12896728515625, -1.0537109375, -0.97845458984375, -0.9031982421875, -0.82794189453125, -0.752685546875, -0.67742919921875, -0.6021728515625, -0.52691650390625, -0.45166015625, -0.37640380859375, -0.3011474609375, -0.22589111328125, -0.150634765625, -0.07537841796875, -0.0001220703125, 0.07513427734375, 0.150390625, 0.22564697265625, 0.3009033203125, 0.37615966796875, 0.451416015625, 0.52667236328125, 0.6019287109375, 0.67718505859375, 0.75244140625, 0.82769775390625, 0.9029541015625, 0.97821044921875, 1.053466796875, 1.12872314453125, 1.2039794921875, 1.27923583984375, 1.3544921875, 1.42974853515625, 1.5050048828125, 1.58026123046875, 1.655517578125, 1.73077392578125, 1.8060302734375, 1.88128662109375, 1.95654296875, 2.03179931640625, 2.1070556640625, 2.18231201171875, 2.257568359375, 2.33282470703125, 2.4080810546875, 2.48333740234375, 2.55859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 14.0, 23.0, 33.0, 30.0, 79.0, 89.0, 178.0, 271.0, 571.0, 1769.0, 7594.0, 71875.0, 858809.0, 94715.0, 9081.0, 1944.0, 633.0, 299.0, 176.0, 113.0, 69.0, 58.0, 38.0, 18.0, 21.0, 12.0, 10.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19140625, -1.1548004150390625, -1.118194580078125, -1.0815887451171875, -1.04498291015625, -1.0083770751953125, -0.971771240234375, -0.9351654052734375, -0.8985595703125, -0.8619537353515625, -0.825347900390625, -0.7887420654296875, -0.75213623046875, -0.7155303955078125, -0.678924560546875, -0.6423187255859375, -0.605712890625, -0.5691070556640625, -0.532501220703125, -0.4958953857421875, -0.45928955078125, -0.4226837158203125, -0.386077880859375, -0.3494720458984375, -0.3128662109375, -0.2762603759765625, -0.239654541015625, -0.2030487060546875, -0.16644287109375, -0.1298370361328125, -0.093231201171875, -0.0566253662109375, -0.02001953125, 0.0165863037109375, 0.053192138671875, 0.0897979736328125, 0.12640380859375, 0.1630096435546875, 0.199615478515625, 0.2362213134765625, 0.2728271484375, 0.3094329833984375, 0.346038818359375, 0.3826446533203125, 0.41925048828125, 0.4558563232421875, 0.492462158203125, 0.5290679931640625, 0.565673828125, 0.6022796630859375, 0.638885498046875, 0.6754913330078125, 0.71209716796875, 0.7487030029296875, 0.785308837890625, 0.8219146728515625, 0.8585205078125, 0.8951263427734375, 0.931732177734375, 0.9683380126953125, 1.00494384765625, 1.0415496826171875, 1.078155517578125, 1.1147613525390625, 1.1513671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 3.0, 5.0, 5.0, 7.0, 13.0, 18.0, 23.0, 28.0, 46.0, 71.0, 155.0, 201.0, 150.0, 107.0, 39.0, 32.0, 20.0, 13.0, 16.0, 9.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019168853759765625, -0.00018670596182346344, -0.00018172338604927063, -0.00017674081027507782, -0.000171758234500885, -0.0001667756587266922, -0.0001617930829524994, -0.00015681050717830658, -0.00015182793140411377, -0.00014684535562992096, -0.00014186277985572815, -0.00013688020408153534, -0.00013189762830734253, -0.00012691505253314972, -0.00012193247675895691, -0.0001169499009847641, -0.00011196732521057129, -0.00010698474943637848, -0.00010200217366218567, -9.701959788799286e-05, -9.203702211380005e-05, -8.705444633960724e-05, -8.207187056541443e-05, -7.708929479122162e-05, -7.210671901702881e-05, -6.7124143242836e-05, -6.214156746864319e-05, -5.715899169445038e-05, -5.217641592025757e-05, -4.719384014606476e-05, -4.221126437187195e-05, -3.722868859767914e-05, -3.224611282348633e-05, -2.7263537049293518e-05, -2.2280961275100708e-05, -1.7298385500907898e-05, -1.2315809726715088e-05, -7.333233952522278e-06, -2.3506581783294678e-06, 2.6319175958633423e-06, 7.614493370056152e-06, 1.2597069144248962e-05, 1.7579644918441772e-05, 2.2562220692634583e-05, 2.7544796466827393e-05, 3.25273722410202e-05, 3.750994801521301e-05, 4.249252378940582e-05, 4.747509956359863e-05, 5.245767533779144e-05, 5.744025111198425e-05, 6.242282688617706e-05, 6.740540266036987e-05, 7.238797843456268e-05, 7.737055420875549e-05, 8.23531299829483e-05, 8.733570575714111e-05, 9.231828153133392e-05, 9.730085730552673e-05, 0.00010228343307971954, 0.00010726600885391235, 0.00011224858462810516, 0.00011723116040229797, 0.00012221373617649078, 0.0001271963119506836]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 12.0, 11.0, 20.0, 66.0, 178.0, 972.0, 822104.0, 224211.0, 736.0, 152.0, 57.0, 21.0, 13.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.70428466796875, -2.5687255859375, -2.43316650390625, -2.297607421875, -2.16204833984375, -2.0264892578125, -1.89093017578125, -1.75537109375, -1.61981201171875, -1.4842529296875, -1.34869384765625, -1.213134765625, -1.07757568359375, -0.9420166015625, -0.80645751953125, -0.6708984375, -0.53533935546875, -0.3997802734375, -0.26422119140625, -0.128662109375, 0.00689697265625, 0.1424560546875, 0.27801513671875, 0.41357421875, 0.54913330078125, 0.6846923828125, 0.82025146484375, 0.955810546875, 1.09136962890625, 1.2269287109375, 1.36248779296875, 1.498046875, 1.63360595703125, 1.7691650390625, 1.90472412109375, 2.040283203125, 2.17584228515625, 2.3114013671875, 2.44696044921875, 2.58251953125, 2.71807861328125, 2.8536376953125, 2.98919677734375, 3.124755859375, 3.26031494140625, 3.3958740234375, 3.53143310546875, 3.6669921875, 3.80255126953125, 3.9381103515625, 4.07366943359375, 4.209228515625, 4.34478759765625, 4.4803466796875, 4.61590576171875, 4.75146484375, 4.88702392578125, 5.0225830078125, 5.15814208984375, 5.293701171875, 5.42926025390625, 5.5648193359375, 5.70037841796875, 5.8359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 10.0, 6.0, 16.0, 25.0, 52.0, 119.0, 279.0, 278.0, 106.0, 47.0, 32.0, 14.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5401840209960938, -0.4861297607421875, -0.43207550048828125, -0.378021240234375, -0.32396697998046875, -0.2699127197265625, -0.21585845947265625, -0.16180419921875, -0.10774993896484375, -0.0536956787109375, 0.00035858154296875, 0.054412841796875, 0.10846710205078125, 0.1625213623046875, 0.21657562255859375, 0.2706298828125, 0.32468414306640625, 0.3787384033203125, 0.43279266357421875, 0.486846923828125, 0.5409011840820312, 0.5949554443359375, 0.6490097045898438, 0.70306396484375, 0.7571182250976562, 0.8111724853515625, 0.8652267456054688, 0.919281005859375, 0.9733352661132812, 1.0273895263671875, 1.0814437866210938, 1.135498046875, 1.1895523071289062, 1.2436065673828125, 1.2976608276367188, 1.351715087890625, 1.4057693481445312, 1.4598236083984375, 1.5138778686523438, 1.56793212890625, 1.6219863891601562, 1.6760406494140625, 1.7300949096679688, 1.784149169921875, 1.8382034301757812, 1.8922576904296875, 1.9463119506835938, 2.0003662109375, 2.0544204711914062, 2.1084747314453125, 2.1625289916992188, 2.216583251953125, 2.2706375122070312, 2.3246917724609375, 2.3787460327148438, 2.43280029296875, 2.4868545532226562, 2.5409088134765625, 2.5949630737304688, 2.649017333984375, 2.7030715942382812, 2.7571258544921875, 2.8111801147460938, 2.865234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 16.0, 67.0, 168.0, 302.0, 253.0, 119.0, 50.0, 12.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.849552154541016, -16.07211685180664, -15.294679641723633, -14.517243385314941, -13.73980712890625, -12.962370872497559, -12.184934616088867, -11.407499313354492, -10.630062103271484, -9.852625846862793, -9.075189590454102, -8.29775333404541, -7.520317077636719, -6.742880821228027, -5.965445041656494, -5.188008785247803, -4.4105730056762695, -3.633136749267578, -2.8557004928588867, -2.0782644748687744, -1.300828218460083, -0.5233919620513916, 0.2540440559387207, 1.031480312347412, 1.8089165687561035, 2.586352825164795, 3.3637890815734863, 4.1412248611450195, 4.918661117553711, 5.696097373962402, 6.473533630371094, 7.250969886779785, 8.028406143188477, 8.805842399597168, 9.58327865600586, 10.36071491241455, 11.138151168823242, 11.915587425231934, 12.693023681640625, 13.470458984375, 14.247896194458008, 15.0253324508667, 15.80276870727539, 16.580204010009766, 17.357641220092773, 18.13507652282715, 18.912513732910156, 19.68994903564453, 20.467384338378906, 21.24481964111328, 22.02225685119629, 22.799692153930664, 23.577129364013672, 24.354564666748047, 25.132001876831055, 25.90943717956543, 26.686874389648438, 27.464309692382812, 28.24174690246582, 29.019182205200195, 29.796619415283203, 30.574054718017578, 31.351491928100586, 32.128929138183594, 32.90636444091797]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 6.0, 10.0, 14.0, 15.0, 11.0, 14.0, 20.0, 24.0, 20.0, 27.0, 25.0, 28.0, 34.0, 24.0, 41.0, 37.0, 47.0, 35.0, 42.0, 39.0, 54.0, 40.0, 31.0, 31.0, 31.0, 37.0, 33.0, 31.0, 23.0, 29.0, 24.0, 17.0, 10.0, 16.0, 18.0, 14.0, 7.0, 6.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.650754928588867, -11.311110496520996, -10.971466064453125, -10.63182258605957, -10.2921781539917, -9.952533721923828, -9.612890243530273, -9.273245811462402, -8.933601379394531, -8.59395694732666, -8.254312515258789, -7.914669036865234, -7.575024604797363, -7.235380172729492, -6.895736217498779, -6.556092262268066, -6.216447830200195, -5.876803398132324, -5.537159442901611, -5.197515487670898, -4.857871055603027, -4.518226623535156, -4.178582668304443, -3.8389384746551514, -3.4992942810058594, -3.1596500873565674, -2.8200058937072754, -2.4803617000579834, -2.1407175064086914, -1.8010733127593994, -1.4614291191101074, -1.1217849254608154, -0.7821407318115234, -0.44249653816223145, -0.10285234451293945, 0.23679184913635254, 0.5764360427856445, 0.9160802364349365, 1.2557244300842285, 1.5953686237335205, 1.9350128173828125, 2.2746570110321045, 2.6143012046813965, 2.9539453983306885, 3.2935895919799805, 3.6332337856292725, 3.9728779792785645, 4.312521934509277, 4.652166366577148, 4.9918107986450195, 5.331454753875732, 5.671098709106445, 6.010743141174316, 6.3503875732421875, 6.6900315284729, 7.029675483703613, 7.369319915771484, 7.7089643478393555, 8.048608779907227, 8.388252258300781, 8.727896690368652, 9.067541122436523, 9.407184600830078, 9.74682903289795, 10.08647346496582]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 9.0, 10.0, 17.0, 39.0, 43.0, 78.0, 132.0, 222.0, 457.0, 1044.0, 2780.0, 9787.0, 65638.0, 3984631.0, 111098.0, 12674.0, 3330.0, 1141.0, 486.0, 262.0, 144.0, 90.0, 52.0, 40.0, 22.0, 9.0, 10.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71484375, -4.574462890625, -4.43408203125, -4.293701171875, -4.1533203125, -4.012939453125, -3.87255859375, -3.732177734375, -3.591796875, -3.451416015625, -3.31103515625, -3.170654296875, -3.0302734375, -2.889892578125, -2.74951171875, -2.609130859375, -2.46875, -2.328369140625, -2.18798828125, -2.047607421875, -1.9072265625, -1.766845703125, -1.62646484375, -1.486083984375, -1.345703125, -1.205322265625, -1.06494140625, -0.924560546875, -0.7841796875, -0.643798828125, -0.50341796875, -0.363037109375, -0.22265625, -0.082275390625, 0.05810546875, 0.198486328125, 0.3388671875, 0.479248046875, 0.61962890625, 0.760009765625, 0.900390625, 1.040771484375, 1.18115234375, 1.321533203125, 1.4619140625, 1.602294921875, 1.74267578125, 1.883056640625, 2.0234375, 2.163818359375, 2.30419921875, 2.444580078125, 2.5849609375, 2.725341796875, 2.86572265625, 3.006103515625, 3.146484375, 3.286865234375, 3.42724609375, 3.567626953125, 3.7080078125, 3.848388671875, 3.98876953125, 4.129150390625, 4.26953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 20.0, 15.0, 18.0, 35.0, 43.0, 52.0, 69.0, 84.0, 80.0, 91.0, 86.0, 88.0, 73.0, 58.0, 53.0, 39.0, 29.0, 18.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2041015625, -1.16839599609375, -1.1326904296875, -1.09698486328125, -1.061279296875, -1.02557373046875, -0.9898681640625, -0.95416259765625, -0.91845703125, -0.88275146484375, -0.8470458984375, -0.81134033203125, -0.775634765625, -0.73992919921875, -0.7042236328125, -0.66851806640625, -0.6328125, -0.59710693359375, -0.5614013671875, -0.52569580078125, -0.489990234375, -0.45428466796875, -0.4185791015625, -0.38287353515625, -0.34716796875, -0.31146240234375, -0.2757568359375, -0.24005126953125, -0.204345703125, -0.16864013671875, -0.1329345703125, -0.09722900390625, -0.0615234375, -0.02581787109375, 0.0098876953125, 0.04559326171875, 0.081298828125, 0.11700439453125, 0.1527099609375, 0.18841552734375, 0.22412109375, 0.25982666015625, 0.2955322265625, 0.33123779296875, 0.366943359375, 0.40264892578125, 0.4383544921875, 0.47406005859375, 0.509765625, 0.54547119140625, 0.5811767578125, 0.61688232421875, 0.652587890625, 0.68829345703125, 0.7239990234375, 0.75970458984375, 0.79541015625, 0.83111572265625, 0.8668212890625, 0.90252685546875, 0.938232421875, 0.97393798828125, 1.0096435546875, 1.04534912109375, 1.0810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 16.0, 27.0, 52.0, 98.0, 223.0, 543.0, 1723.0, 6160.0, 32162.0, 788395.0, 3308474.0, 45331.0, 7844.0, 2077.0, 684.0, 245.0, 98.0, 58.0, 20.0, 15.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.75, -3.654052734375, -3.55810546875, -3.462158203125, -3.3662109375, -3.270263671875, -3.17431640625, -3.078369140625, -2.982421875, -2.886474609375, -2.79052734375, -2.694580078125, -2.5986328125, -2.502685546875, -2.40673828125, -2.310791015625, -2.21484375, -2.118896484375, -2.02294921875, -1.927001953125, -1.8310546875, -1.735107421875, -1.63916015625, -1.543212890625, -1.447265625, -1.351318359375, -1.25537109375, -1.159423828125, -1.0634765625, -0.967529296875, -0.87158203125, -0.775634765625, -0.6796875, -0.583740234375, -0.48779296875, -0.391845703125, -0.2958984375, -0.199951171875, -0.10400390625, -0.008056640625, 0.087890625, 0.183837890625, 0.27978515625, 0.375732421875, 0.4716796875, 0.567626953125, 0.66357421875, 0.759521484375, 0.85546875, 0.951416015625, 1.04736328125, 1.143310546875, 1.2392578125, 1.335205078125, 1.43115234375, 1.527099609375, 1.623046875, 1.718994140625, 1.81494140625, 1.910888671875, 2.0068359375, 2.102783203125, 2.19873046875, 2.294677734375, 2.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 7.0, 10.0, 23.0, 38.0, 48.0, 67.0, 134.0, 348.0, 2124.0, 790.0, 196.0, 76.0, 50.0, 37.0, 18.0, 15.0, 19.0, 8.0, 11.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0712890625, -1.04046630859375, -1.0096435546875, -0.97882080078125, -0.947998046875, -0.91717529296875, -0.8863525390625, -0.85552978515625, -0.82470703125, -0.79388427734375, -0.7630615234375, -0.73223876953125, -0.701416015625, -0.67059326171875, -0.6397705078125, -0.60894775390625, -0.578125, -0.54730224609375, -0.5164794921875, -0.48565673828125, -0.454833984375, -0.42401123046875, -0.3931884765625, -0.36236572265625, -0.33154296875, -0.30072021484375, -0.2698974609375, -0.23907470703125, -0.208251953125, -0.17742919921875, -0.1466064453125, -0.11578369140625, -0.0849609375, -0.05413818359375, -0.0233154296875, 0.00750732421875, 0.038330078125, 0.06915283203125, 0.0999755859375, 0.13079833984375, 0.16162109375, 0.19244384765625, 0.2232666015625, 0.25408935546875, 0.284912109375, 0.31573486328125, 0.3465576171875, 0.37738037109375, 0.408203125, 0.43902587890625, 0.4698486328125, 0.50067138671875, 0.531494140625, 0.56231689453125, 0.5931396484375, 0.62396240234375, 0.65478515625, 0.68560791015625, 0.7164306640625, 0.74725341796875, 0.778076171875, 0.80889892578125, 0.8397216796875, 0.87054443359375, 0.9013671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 7.0, 19.0, 59.0, 291.0, 431.0, 166.0, 25.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.842453956604004, -14.46622085571289, -14.089987754821777, -13.713754653930664, -13.33752155303955, -12.961288452148438, -12.585055351257324, -12.208822250366211, -11.832589149475098, -11.456356048583984, -11.080122947692871, -10.703889846801758, -10.327656745910645, -9.951423645019531, -9.575190544128418, -9.198957443237305, -8.822724342346191, -8.446491241455078, -8.070258140563965, -7.694025039672852, -7.317791938781738, -6.941558837890625, -6.565325736999512, -6.189092636108398, -5.812859535217285, -5.436626434326172, -5.060393333435059, -4.684160232543945, -4.307927131652832, -3.9316940307617188, -3.5554609298706055, -3.179227828979492, -2.8029937744140625, -2.426760673522949, -2.050527572631836, -1.6742944717407227, -1.2980613708496094, -0.9218282699584961, -0.5455951690673828, -0.16936206817626953, 0.20687103271484375, 0.583104133605957, 0.9593372344970703, 1.3355703353881836, 1.7118034362792969, 2.08803653717041, 2.4642696380615234, 2.8405027389526367, 3.21673583984375, 3.5929689407348633, 3.9692020416259766, 4.34543514251709, 4.721668243408203, 5.097901344299316, 5.47413444519043, 5.850367546081543, 6.226600646972656, 6.6028337478637695, 6.979066848754883, 7.355299949645996, 7.731533050537109, 8.107766151428223, 8.483999252319336, 8.86023235321045, 9.236465454101562]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 10.0, 8.0, 14.0, 14.0, 19.0, 22.0, 25.0, 32.0, 35.0, 47.0, 37.0, 49.0, 45.0, 55.0, 53.0, 52.0, 46.0, 49.0, 43.0, 36.0, 51.0, 48.0, 32.0, 30.0, 26.0, 18.0, 28.0, 16.0, 6.0, 14.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0137557983398438, -2.9173333644866943, -2.820911169052124, -2.7244887351989746, -2.6280665397644043, -2.531644105911255, -2.4352216720581055, -2.338799476623535, -2.2423770427703857, -2.1459546089172363, -2.049532413482666, -1.9531099796295166, -1.8566876649856567, -1.7602653503417969, -1.6638429164886475, -1.5674206018447876, -1.4709982872009277, -1.3745759725570679, -1.278153657913208, -1.1817312240600586, -1.0853089094161987, -0.9888865947723389, -0.8924642205238342, -0.7960418462753296, -0.6996195316314697, -0.6031972169876099, -0.5067748427391052, -0.410352498292923, -0.3139301538467407, -0.21750780940055847, -0.12108546495437622, -0.024663090705871582, 0.07175898551940918, 0.16818132996559143, 0.2646036744117737, 0.36102601885795593, 0.4574483633041382, 0.553870677947998, 0.6502930521965027, 0.7467154264450073, 0.8431377410888672, 0.939560055732727, 1.035982370376587, 1.1324048042297363, 1.2288271188735962, 1.325249433517456, 1.4216718673706055, 1.5180941820144653, 1.6145164966583252, 1.710938811302185, 1.807361125946045, 1.9037835597991943, 2.0002059936523438, 2.096628189086914, 2.1930506229400635, 2.289473056793213, 2.385895252227783, 2.4823176860809326, 2.578739881515503, 2.6751623153686523, 2.7715845108032227, 2.868006944656372, 2.9644293785095215, 3.060851573944092, 3.157274007797241]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 14.0, 21.0, 26.0, 38.0, 51.0, 79.0, 125.0, 187.0, 344.0, 636.0, 1123.0, 2411.0, 5664.0, 15747.0, 54255.0, 218866.0, 476503.0, 198023.0, 49665.0, 14621.0, 5249.0, 2304.0, 1119.0, 566.0, 345.0, 195.0, 116.0, 72.0, 46.0, 31.0, 24.0, 19.0, 19.0, 3.0, 5.0, 4.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.421875, -2.342376708984375, -2.26287841796875, -2.183380126953125, -2.1038818359375, -2.024383544921875, -1.94488525390625, -1.865386962890625, -1.785888671875, -1.706390380859375, -1.62689208984375, -1.547393798828125, -1.4678955078125, -1.388397216796875, -1.30889892578125, -1.229400634765625, -1.14990234375, -1.070404052734375, -0.99090576171875, -0.911407470703125, -0.8319091796875, -0.752410888671875, -0.67291259765625, -0.593414306640625, -0.513916015625, -0.434417724609375, -0.35491943359375, -0.275421142578125, -0.1959228515625, -0.116424560546875, -0.03692626953125, 0.042572021484375, 0.1220703125, 0.201568603515625, 0.28106689453125, 0.360565185546875, 0.4400634765625, 0.519561767578125, 0.59906005859375, 0.678558349609375, 0.758056640625, 0.837554931640625, 0.91705322265625, 0.996551513671875, 1.0760498046875, 1.155548095703125, 1.23504638671875, 1.314544677734375, 1.39404296875, 1.473541259765625, 1.55303955078125, 1.632537841796875, 1.7120361328125, 1.791534423828125, 1.87103271484375, 1.950531005859375, 2.030029296875, 2.109527587890625, 2.18902587890625, 2.268524169921875, 2.3480224609375, 2.427520751953125, 2.50701904296875, 2.586517333984375, 2.666015625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 13.0, 23.0, 20.0, 27.0, 53.0, 73.0, 56.0, 90.0, 79.0, 99.0, 99.0, 83.0, 66.0, 60.0, 51.0, 31.0, 24.0, 13.0, 13.0, 9.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.251953125, -1.21453857421875, -1.1771240234375, -1.13970947265625, -1.102294921875, -1.06488037109375, -1.0274658203125, -0.99005126953125, -0.95263671875, -0.91522216796875, -0.8778076171875, -0.84039306640625, -0.802978515625, -0.76556396484375, -0.7281494140625, -0.69073486328125, -0.6533203125, -0.61590576171875, -0.5784912109375, -0.54107666015625, -0.503662109375, -0.46624755859375, -0.4288330078125, -0.39141845703125, -0.35400390625, -0.31658935546875, -0.2791748046875, -0.24176025390625, -0.204345703125, -0.16693115234375, -0.1295166015625, -0.09210205078125, -0.0546875, -0.01727294921875, 0.0201416015625, 0.05755615234375, 0.094970703125, 0.13238525390625, 0.1697998046875, 0.20721435546875, 0.24462890625, 0.28204345703125, 0.3194580078125, 0.35687255859375, 0.394287109375, 0.43170166015625, 0.4691162109375, 0.50653076171875, 0.5439453125, 0.58135986328125, 0.6187744140625, 0.65618896484375, 0.693603515625, 0.73101806640625, 0.7684326171875, 0.80584716796875, 0.84326171875, 0.88067626953125, 0.9180908203125, 0.95550537109375, 0.992919921875, 1.03033447265625, 1.0677490234375, 1.10516357421875, 1.142578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 16.0, 29.0, 43.0, 71.0, 89.0, 174.0, 279.0, 578.0, 1398.0, 4538.0, 26623.0, 407822.0, 561867.0, 36426.0, 5544.0, 1567.0, 610.0, 326.0, 186.0, 128.0, 60.0, 53.0, 42.0, 19.0, 14.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.9818115234375, -3.834716796875, -3.6876220703125, -3.54052734375, -3.3934326171875, -3.246337890625, -3.0992431640625, -2.9521484375, -2.8050537109375, -2.657958984375, -2.5108642578125, -2.36376953125, -2.2166748046875, -2.069580078125, -1.9224853515625, -1.775390625, -1.6282958984375, -1.481201171875, -1.3341064453125, -1.18701171875, -1.0399169921875, -0.892822265625, -0.7457275390625, -0.5986328125, -0.4515380859375, -0.304443359375, -0.1573486328125, -0.01025390625, 0.1368408203125, 0.283935546875, 0.4310302734375, 0.578125, 0.7252197265625, 0.872314453125, 1.0194091796875, 1.16650390625, 1.3135986328125, 1.460693359375, 1.6077880859375, 1.7548828125, 1.9019775390625, 2.049072265625, 2.1961669921875, 2.34326171875, 2.4903564453125, 2.637451171875, 2.7845458984375, 2.931640625, 3.0787353515625, 3.225830078125, 3.3729248046875, 3.52001953125, 3.6671142578125, 3.814208984375, 3.9613037109375, 4.1083984375, 4.2554931640625, 4.402587890625, 4.5496826171875, 4.69677734375, 4.8438720703125, 4.990966796875, 5.1380615234375, 5.28515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 12.0, 18.0, 18.0, 21.0, 36.0, 56.0, 66.0, 71.0, 86.0, 62.0, 84.0, 77.0, 82.0, 83.0, 47.0, 44.0, 35.0, 28.0, 14.0, 11.0, 14.0, 4.0, 6.0, 1.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.12890625, -6.9537353515625, -6.778564453125, -6.6033935546875, -6.42822265625, -6.2530517578125, -6.077880859375, -5.9027099609375, -5.7275390625, -5.5523681640625, -5.377197265625, -5.2020263671875, -5.02685546875, -4.8516845703125, -4.676513671875, -4.5013427734375, -4.326171875, -4.1510009765625, -3.975830078125, -3.8006591796875, -3.62548828125, -3.4503173828125, -3.275146484375, -3.0999755859375, -2.9248046875, -2.7496337890625, -2.574462890625, -2.3992919921875, -2.22412109375, -2.0489501953125, -1.873779296875, -1.6986083984375, -1.5234375, -1.3482666015625, -1.173095703125, -0.9979248046875, -0.82275390625, -0.6475830078125, -0.472412109375, -0.2972412109375, -0.1220703125, 0.0531005859375, 0.228271484375, 0.4034423828125, 0.57861328125, 0.7537841796875, 0.928955078125, 1.1041259765625, 1.279296875, 1.4544677734375, 1.629638671875, 1.8048095703125, 1.97998046875, 2.1551513671875, 2.330322265625, 2.5054931640625, 2.6806640625, 2.8558349609375, 3.031005859375, 3.2061767578125, 3.38134765625, 3.5565185546875, 3.731689453125, 3.9068603515625, 4.08203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 12.0, 14.0, 23.0, 26.0, 53.0, 84.0, 124.0, 229.0, 508.0, 1086.0, 2678.0, 9521.0, 55850.0, 896756.0, 65947.0, 10371.0, 2882.0, 1146.0, 567.0, 245.0, 170.0, 109.0, 47.0, 27.0, 17.0, 22.0, 3.0, 8.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.99609375, -2.911773681640625, -2.82745361328125, -2.743133544921875, -2.6588134765625, -2.574493408203125, -2.49017333984375, -2.405853271484375, -2.321533203125, -2.237213134765625, -2.15289306640625, -2.068572998046875, -1.9842529296875, -1.899932861328125, -1.81561279296875, -1.731292724609375, -1.64697265625, -1.562652587890625, -1.47833251953125, -1.394012451171875, -1.3096923828125, -1.225372314453125, -1.14105224609375, -1.056732177734375, -0.972412109375, -0.888092041015625, -0.80377197265625, -0.719451904296875, -0.6351318359375, -0.550811767578125, -0.46649169921875, -0.382171630859375, -0.2978515625, -0.213531494140625, -0.12921142578125, -0.044891357421875, 0.0394287109375, 0.123748779296875, 0.20806884765625, 0.292388916015625, 0.376708984375, 0.461029052734375, 0.54534912109375, 0.629669189453125, 0.7139892578125, 0.798309326171875, 0.88262939453125, 0.966949462890625, 1.05126953125, 1.135589599609375, 1.21990966796875, 1.304229736328125, 1.3885498046875, 1.472869873046875, 1.55718994140625, 1.641510009765625, 1.725830078125, 1.810150146484375, 1.89447021484375, 1.978790283203125, 2.0631103515625, 2.147430419921875, 2.23175048828125, 2.316070556640625, 2.400390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 3.0, 3.0, 6.0, 12.0, 12.0, 12.0, 19.0, 25.0, 40.0, 50.0, 64.0, 105.0, 190.0, 146.0, 85.0, 50.0, 40.0, 36.0, 23.0, 17.0, 14.0, 8.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.00026969239115715027, -0.0002623423933982849, -0.00025499239563941956, -0.0002476423978805542, -0.00024029240012168884, -0.00023294240236282349, -0.00022559240460395813, -0.00021824240684509277, -0.00021089240908622742, -0.00020354241132736206, -0.0001961924135684967, -0.00018884241580963135, -0.000181492418050766, -0.00017414242029190063, -0.00016679242253303528, -0.00015944242477416992, -0.00015209242701530457, -0.0001447424292564392, -0.00013739243149757385, -0.0001300424337387085, -0.00012269243597984314, -0.00011534243822097778, -0.00010799244046211243, -0.00010064244270324707, -9.329244494438171e-05, -8.594244718551636e-05, -7.8592449426651e-05, -7.124245166778564e-05, -6.389245390892029e-05, -5.654245615005493e-05, -4.9192458391189575e-05, -4.184246063232422e-05, -3.449246287345886e-05, -2.7142465114593506e-05, -1.979246735572815e-05, -1.2442469596862793e-05, -5.0924718379974365e-06, 2.25752592086792e-06, 9.607523679733276e-06, 1.6957521438598633e-05, 2.430751919746399e-05, 3.1657516956329346e-05, 3.90075147151947e-05, 4.635751247406006e-05, 5.3707510232925415e-05, 6.105750799179077e-05, 6.840750575065613e-05, 7.575750350952148e-05, 8.310750126838684e-05, 9.04574990272522e-05, 9.780749678611755e-05, 0.00010515749454498291, 0.00011250749230384827, 0.00011985749006271362, 0.00012720748782157898, 0.00013455748558044434, 0.0001419074833393097, 0.00014925748109817505, 0.0001566074788570404, 0.00016395747661590576, 0.00017130747437477112, 0.00017865747213363647, 0.00018600746989250183, 0.0001933574676513672]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 6.0, 12.0, 13.0, 23.0, 38.0, 64.0, 128.0, 325.0, 1050.0, 7110.0, 707507.0, 325704.0, 5193.0, 836.0, 289.0, 100.0, 61.0, 31.0, 17.0, 12.0, 8.0, 5.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.348480224609375, -4.21649169921875, -4.084503173828125, -3.9525146484375, -3.820526123046875, -3.68853759765625, -3.556549072265625, -3.424560546875, -3.292572021484375, -3.16058349609375, -3.028594970703125, -2.8966064453125, -2.764617919921875, -2.63262939453125, -2.500640869140625, -2.36865234375, -2.236663818359375, -2.10467529296875, -1.972686767578125, -1.8406982421875, -1.708709716796875, -1.57672119140625, -1.444732666015625, -1.312744140625, -1.180755615234375, -1.04876708984375, -0.916778564453125, -0.7847900390625, -0.652801513671875, -0.52081298828125, -0.388824462890625, -0.2568359375, -0.124847412109375, 0.00714111328125, 0.139129638671875, 0.2711181640625, 0.403106689453125, 0.53509521484375, 0.667083740234375, 0.799072265625, 0.931060791015625, 1.06304931640625, 1.195037841796875, 1.3270263671875, 1.459014892578125, 1.59100341796875, 1.722991943359375, 1.85498046875, 1.986968994140625, 2.11895751953125, 2.250946044921875, 2.3829345703125, 2.514923095703125, 2.64691162109375, 2.778900146484375, 2.910888671875, 3.042877197265625, 3.17486572265625, 3.306854248046875, 3.4388427734375, 3.570831298828125, 3.70281982421875, 3.834808349609375, 3.966796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 8.0, 12.0, 25.0, 37.0, 98.0, 282.0, 312.0, 113.0, 41.0, 26.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.97265625, -5.8533782958984375, -5.734100341796875, -5.6148223876953125, -5.49554443359375, -5.3762664794921875, -5.256988525390625, -5.1377105712890625, -5.0184326171875, -4.8991546630859375, -4.779876708984375, -4.6605987548828125, -4.54132080078125, -4.4220428466796875, -4.302764892578125, -4.1834869384765625, -4.064208984375, -3.9449310302734375, -3.825653076171875, -3.7063751220703125, -3.58709716796875, -3.4678192138671875, -3.348541259765625, -3.2292633056640625, -3.1099853515625, -2.9907073974609375, -2.871429443359375, -2.7521514892578125, -2.63287353515625, -2.5135955810546875, -2.394317626953125, -2.2750396728515625, -2.15576171875, -2.0364837646484375, -1.917205810546875, -1.7979278564453125, -1.67864990234375, -1.5593719482421875, -1.440093994140625, -1.3208160400390625, -1.2015380859375, -1.0822601318359375, -0.962982177734375, -0.8437042236328125, -0.72442626953125, -0.6051483154296875, -0.485870361328125, -0.3665924072265625, -0.247314453125, -0.1280364990234375, -0.008758544921875, 0.1105194091796875, 0.22979736328125, 0.3490753173828125, 0.468353271484375, 0.5876312255859375, 0.7069091796875, 0.8261871337890625, 0.945465087890625, 1.0647430419921875, 1.18402099609375, 1.3032989501953125, 1.422576904296875, 1.5418548583984375, 1.6611328125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 12.0, 22.0, 31.0, 54.0, 77.0, 117.0, 122.0, 109.0, 143.0, 90.0, 79.0, 49.0, 39.0, 19.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.470020294189453, -20.790857315063477, -20.1116943359375, -19.43252944946289, -18.753366470336914, -18.074203491210938, -17.395038604736328, -16.71587562561035, -16.036712646484375, -15.357549667358398, -14.678385734558105, -13.999221801757812, -13.320058822631836, -12.64089584350586, -11.961731910705566, -11.282567977905273, -10.603404998779297, -9.92424201965332, -9.245078086853027, -8.565914154052734, -7.886751174926758, -7.207587718963623, -6.528424263000488, -5.8492608070373535, -5.170097351074219, -4.490933895111084, -3.811770439147949, -3.1326069831848145, -2.4534435272216797, -1.774280071258545, -1.0951166152954102, -0.4159531593322754, 0.2632102966308594, 0.9423737525939941, 1.621537208557129, 2.3007006645202637, 2.9798641204833984, 3.659027576446533, 4.338191032409668, 5.017354488372803, 5.6965179443359375, 6.375681400299072, 7.054844856262207, 7.734008312225342, 8.413171768188477, 9.092334747314453, 9.771498680114746, 10.450662612915039, 11.129825592041016, 11.808988571166992, 12.488152503967285, 13.167316436767578, 13.846479415893555, 14.525642395019531, 15.204806327819824, 15.883970260620117, 16.563133239746094, 17.24229621887207, 17.921459197998047, 18.600624084472656, 19.279787063598633, 19.95895004272461, 20.63811492919922, 21.317277908325195, 21.996440887451172]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 6.0, 13.0, 15.0, 11.0, 17.0, 17.0, 21.0, 17.0, 24.0, 23.0, 25.0, 33.0, 50.0, 42.0, 42.0, 43.0, 38.0, 56.0, 51.0, 46.0, 48.0, 29.0, 46.0, 36.0, 26.0, 35.0, 30.0, 28.0, 10.0, 19.0, 14.0, 17.0, 11.0, 11.0, 8.0, 13.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.925865173339844, -22.208505630493164, -21.491146087646484, -20.773786544799805, -20.056427001953125, -19.339067459106445, -18.621707916259766, -17.904348373413086, -17.186988830566406, -16.469629287719727, -15.752269744873047, -15.034910202026367, -14.317550659179688, -13.600191116333008, -12.882831573486328, -12.165472030639648, -11.448111534118652, -10.730751991271973, -10.013392448425293, -9.296032905578613, -8.578673362731934, -7.861313819885254, -7.143953800201416, -6.426594257354736, -5.709234714508057, -4.991875171661377, -4.274515628814697, -3.5571558475494385, -2.839796304702759, -2.122436761856079, -1.4050769805908203, -0.6877174377441406, 0.029642105102539062, 0.7470017075538635, 1.464361310005188, 2.1817209720611572, 2.899080514907837, 3.6164400577545166, 4.333799839019775, 5.051159381866455, 5.768518924713135, 6.4858784675598145, 7.203238010406494, 7.920598030090332, 8.637957572937012, 9.355317115783691, 10.072676658630371, 10.79003620147705, 11.50739574432373, 12.22475528717041, 12.94211483001709, 13.65947437286377, 14.37683391571045, 15.094193458557129, 15.811553955078125, 16.528913497924805, 17.246273040771484, 17.963632583618164, 18.680992126464844, 19.398351669311523, 20.115711212158203, 20.833070755004883, 21.550430297851562, 22.267789840698242, 22.985149383544922]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 10.0, 12.0, 30.0, 46.0, 72.0, 113.0, 231.0, 449.0, 896.0, 2131.0, 5565.0, 21250.0, 185597.0, 3849141.0, 104352.0, 16165.0, 4524.0, 1868.0, 808.0, 476.0, 221.0, 121.0, 76.0, 51.0, 26.0, 11.0, 9.0, 11.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.34844970703125, -3.2418212890625, -3.13519287109375, -3.028564453125, -2.92193603515625, -2.8153076171875, -2.70867919921875, -2.60205078125, -2.49542236328125, -2.3887939453125, -2.28216552734375, -2.175537109375, -2.06890869140625, -1.9622802734375, -1.85565185546875, -1.7490234375, -1.64239501953125, -1.5357666015625, -1.42913818359375, -1.322509765625, -1.21588134765625, -1.1092529296875, -1.00262451171875, -0.89599609375, -0.78936767578125, -0.6827392578125, -0.57611083984375, -0.469482421875, -0.36285400390625, -0.2562255859375, -0.14959716796875, -0.04296875, 0.06365966796875, 0.1702880859375, 0.27691650390625, 0.383544921875, 0.49017333984375, 0.5968017578125, 0.70343017578125, 0.81005859375, 0.91668701171875, 1.0233154296875, 1.12994384765625, 1.236572265625, 1.34320068359375, 1.4498291015625, 1.55645751953125, 1.6630859375, 1.76971435546875, 1.8763427734375, 1.98297119140625, 2.089599609375, 2.19622802734375, 2.3028564453125, 2.40948486328125, 2.51611328125, 2.62274169921875, 2.7293701171875, 2.83599853515625, 2.942626953125, 3.04925537109375, 3.1558837890625, 3.26251220703125, 3.369140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 12.0, 16.0, 36.0, 33.0, 51.0, 50.0, 56.0, 58.0, 72.0, 88.0, 60.0, 72.0, 71.0, 66.0, 52.0, 37.0, 44.0, 19.0, 21.0, 17.0, 10.0, 10.0, 7.0, 12.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3291015625, -1.29022216796875, -1.2513427734375, -1.21246337890625, -1.173583984375, -1.13470458984375, -1.0958251953125, -1.05694580078125, -1.01806640625, -0.97918701171875, -0.9403076171875, -0.90142822265625, -0.862548828125, -0.82366943359375, -0.7847900390625, -0.74591064453125, -0.70703125, -0.66815185546875, -0.6292724609375, -0.59039306640625, -0.551513671875, -0.51263427734375, -0.4737548828125, -0.43487548828125, -0.39599609375, -0.35711669921875, -0.3182373046875, -0.27935791015625, -0.240478515625, -0.20159912109375, -0.1627197265625, -0.12384033203125, -0.0849609375, -0.04608154296875, -0.0072021484375, 0.03167724609375, 0.070556640625, 0.10943603515625, 0.1483154296875, 0.18719482421875, 0.22607421875, 0.26495361328125, 0.3038330078125, 0.34271240234375, 0.381591796875, 0.42047119140625, 0.4593505859375, 0.49822998046875, 0.537109375, 0.57598876953125, 0.6148681640625, 0.65374755859375, 0.692626953125, 0.73150634765625, 0.7703857421875, 0.80926513671875, 0.84814453125, 0.88702392578125, 0.9259033203125, 0.96478271484375, 1.003662109375, 1.04254150390625, 1.0814208984375, 1.12030029296875, 1.1591796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 13.0, 13.0, 13.0, 23.0, 43.0, 70.0, 88.0, 144.0, 229.0, 351.0, 555.0, 1039.0, 1882.0, 3702.0, 9249.0, 28335.0, 134732.0, 3279886.0, 639233.0, 65124.0, 17178.0, 6139.0, 2710.0, 1423.0, 784.0, 420.0, 285.0, 224.0, 124.0, 72.0, 59.0, 39.0, 25.0, 18.0, 10.0, 10.0, 8.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.673828125, -1.611358642578125, -1.54888916015625, -1.486419677734375, -1.4239501953125, -1.361480712890625, -1.29901123046875, -1.236541748046875, -1.174072265625, -1.111602783203125, -1.04913330078125, -0.986663818359375, -0.9241943359375, -0.861724853515625, -0.79925537109375, -0.736785888671875, -0.67431640625, -0.611846923828125, -0.54937744140625, -0.486907958984375, -0.4244384765625, -0.361968994140625, -0.29949951171875, -0.237030029296875, -0.174560546875, -0.112091064453125, -0.04962158203125, 0.012847900390625, 0.0753173828125, 0.137786865234375, 0.20025634765625, 0.262725830078125, 0.3251953125, 0.387664794921875, 0.45013427734375, 0.512603759765625, 0.5750732421875, 0.637542724609375, 0.70001220703125, 0.762481689453125, 0.824951171875, 0.887420654296875, 0.94989013671875, 1.012359619140625, 1.0748291015625, 1.137298583984375, 1.19976806640625, 1.262237548828125, 1.32470703125, 1.387176513671875, 1.44964599609375, 1.512115478515625, 1.5745849609375, 1.637054443359375, 1.69952392578125, 1.761993408203125, 1.824462890625, 1.886932373046875, 1.94940185546875, 2.011871337890625, 2.0743408203125, 2.136810302734375, 2.19927978515625, 2.261749267578125, 2.32421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 8.0, 7.0, 13.0, 32.0, 40.0, 69.0, 101.0, 255.0, 1055.0, 1832.0, 316.0, 138.0, 71.0, 36.0, 24.0, 13.0, 12.0, 12.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.73046875, -1.68255615234375, -1.6346435546875, -1.58673095703125, -1.538818359375, -1.49090576171875, -1.4429931640625, -1.39508056640625, -1.34716796875, -1.29925537109375, -1.2513427734375, -1.20343017578125, -1.155517578125, -1.10760498046875, -1.0596923828125, -1.01177978515625, -0.9638671875, -0.91595458984375, -0.8680419921875, -0.82012939453125, -0.772216796875, -0.72430419921875, -0.6763916015625, -0.62847900390625, -0.58056640625, -0.53265380859375, -0.4847412109375, -0.43682861328125, -0.388916015625, -0.34100341796875, -0.2930908203125, -0.24517822265625, -0.197265625, -0.14935302734375, -0.1014404296875, -0.05352783203125, -0.005615234375, 0.04229736328125, 0.0902099609375, 0.13812255859375, 0.18603515625, 0.23394775390625, 0.2818603515625, 0.32977294921875, 0.377685546875, 0.42559814453125, 0.4735107421875, 0.52142333984375, 0.5693359375, 0.61724853515625, 0.6651611328125, 0.71307373046875, 0.760986328125, 0.80889892578125, 0.8568115234375, 0.90472412109375, 0.95263671875, 1.00054931640625, 1.0484619140625, 1.09637451171875, 1.144287109375, 1.19219970703125, 1.2401123046875, 1.28802490234375, 1.3359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 8.0, 13.0, 28.0, 67.0, 145.0, 197.0, 225.0, 154.0, 96.0, 28.0, 19.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.687761306762695, -4.416144371032715, -4.144527435302734, -3.872910261154175, -3.6012930870056152, -3.3296761512756348, -3.0580592155456543, -2.786442279815674, -2.5148251056671143, -2.243208169937134, -1.9715909957885742, -1.6999740600585938, -1.4283570051193237, -1.1567399501800537, -0.8851230144500732, -0.6135059595108032, -0.3418889045715332, -0.07027187943458557, 0.20134514570236206, 0.4729621410369873, 0.7445791959762573, 1.0161962509155273, 1.2878131866455078, 1.5594302415847778, 1.8310472965240479, 2.1026642322540283, 2.374281406402588, 2.6458983421325684, 2.917515277862549, 3.1891324520111084, 3.460749387741089, 3.7323665618896484, 4.003983497619629, 4.275600433349609, 4.54721736907959, 4.81883430480957, 5.090451717376709, 5.3620686531066895, 5.63368558883667, 5.90530252456665, 6.176919937133789, 6.4485368728637695, 6.72015380859375, 6.9917707443237305, 7.263388156890869, 7.53500509262085, 7.80662202835083, 8.078239440917969, 8.349855422973633, 8.621472358703613, 8.893089294433594, 9.164706230163574, 9.436323165893555, 9.707941055297852, 9.979557037353516, 10.251174926757812, 10.522791862487793, 10.794408798217773, 11.066025733947754, 11.337642669677734, 11.609259605407715, 11.880876541137695, 12.152494430541992, 12.424111366271973, 12.695728302001953]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 6.0, 12.0, 9.0, 17.0, 22.0, 22.0, 24.0, 26.0, 21.0, 28.0, 32.0, 44.0, 41.0, 44.0, 51.0, 39.0, 46.0, 50.0, 48.0, 32.0, 47.0, 48.0, 33.0, 47.0, 22.0, 29.0, 31.0, 26.0, 18.0, 20.0, 13.0, 10.0, 4.0, 7.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.408178806304932, -4.283382415771484, -4.158586025238037, -4.03378963470459, -3.9089930057525635, -3.784196615219116, -3.659400224685669, -3.5346035957336426, -3.4098072052001953, -3.285010814666748, -3.160214424133301, -3.0354177951812744, -2.910621404647827, -2.78582501411438, -2.6610286235809326, -2.5362319946289062, -2.411435604095459, -2.2866392135620117, -2.1618428230285645, -2.037046194076538, -1.9122498035430908, -1.7874534130096436, -1.6626570224761963, -1.5378605127334595, -1.4130642414093018, -1.2882678508758545, -1.1634713411331177, -1.0386749505996704, -0.9138784408569336, -0.7890820503234863, -0.6642856001853943, -0.5394891500473022, -0.41469264030456543, -0.2898961901664734, -0.16509975492954254, -0.040303319692611694, 0.08449313044548035, 0.20928955078125, 0.33408600091934204, 0.4588824510574341, 0.5836789011955261, 0.7084753513336182, 0.8332718014717102, 0.9580682516098022, 1.0828646421432495, 1.2076611518859863, 1.3324575424194336, 1.4572539329528809, 1.5820504426956177, 1.706846833229065, 1.8316433429718018, 1.956439733505249, 2.0812361240386963, 2.2060327529907227, 2.33082914352417, 2.455625534057617, 2.5804219245910645, 2.7052183151245117, 2.830014705657959, 2.9548113346099854, 3.0796077251434326, 3.20440411567688, 3.329200506210327, 3.4539971351623535, 3.578793525695801]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 6.0, 16.0, 27.0, 37.0, 56.0, 91.0, 175.0, 290.0, 534.0, 1039.0, 2398.0, 6177.0, 19549.0, 71327.0, 261043.0, 432019.0, 183580.0, 48125.0, 13675.0, 4635.0, 1824.0, 853.0, 443.0, 233.0, 145.0, 84.0, 49.0, 44.0, 22.0, 16.0, 9.0, 3.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.86328125, -2.7747802734375, -2.686279296875, -2.5977783203125, -2.50927734375, -2.4207763671875, -2.332275390625, -2.2437744140625, -2.1552734375, -2.0667724609375, -1.978271484375, -1.8897705078125, -1.80126953125, -1.7127685546875, -1.624267578125, -1.5357666015625, -1.447265625, -1.3587646484375, -1.270263671875, -1.1817626953125, -1.09326171875, -1.0047607421875, -0.916259765625, -0.8277587890625, -0.7392578125, -0.6507568359375, -0.562255859375, -0.4737548828125, -0.38525390625, -0.2967529296875, -0.208251953125, -0.1197509765625, -0.03125, 0.0572509765625, 0.145751953125, 0.2342529296875, 0.32275390625, 0.4112548828125, 0.499755859375, 0.5882568359375, 0.6767578125, 0.7652587890625, 0.853759765625, 0.9422607421875, 1.03076171875, 1.1192626953125, 1.207763671875, 1.2962646484375, 1.384765625, 1.4732666015625, 1.561767578125, 1.6502685546875, 1.73876953125, 1.8272705078125, 1.915771484375, 2.0042724609375, 2.0927734375, 2.1812744140625, 2.269775390625, 2.3582763671875, 2.44677734375, 2.5352783203125, 2.623779296875, 2.7122802734375, 2.80078125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 8.0, 14.0, 15.0, 29.0, 33.0, 45.0, 59.0, 55.0, 71.0, 71.0, 64.0, 85.0, 66.0, 80.0, 60.0, 52.0, 49.0, 30.0, 33.0, 18.0, 16.0, 11.0, 7.0, 9.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.328125, -1.2882080078125, -1.248291015625, -1.2083740234375, -1.16845703125, -1.1285400390625, -1.088623046875, -1.0487060546875, -1.0087890625, -0.9688720703125, -0.928955078125, -0.8890380859375, -0.84912109375, -0.8092041015625, -0.769287109375, -0.7293701171875, -0.689453125, -0.6495361328125, -0.609619140625, -0.5697021484375, -0.52978515625, -0.4898681640625, -0.449951171875, -0.4100341796875, -0.3701171875, -0.3302001953125, -0.290283203125, -0.2503662109375, -0.21044921875, -0.1705322265625, -0.130615234375, -0.0906982421875, -0.05078125, -0.0108642578125, 0.029052734375, 0.0689697265625, 0.10888671875, 0.1488037109375, 0.188720703125, 0.2286376953125, 0.2685546875, 0.3084716796875, 0.348388671875, 0.3883056640625, 0.42822265625, 0.4681396484375, 0.508056640625, 0.5479736328125, 0.587890625, 0.6278076171875, 0.667724609375, 0.7076416015625, 0.74755859375, 0.7874755859375, 0.827392578125, 0.8673095703125, 0.9072265625, 0.9471435546875, 0.987060546875, 1.0269775390625, 1.06689453125, 1.1068115234375, 1.146728515625, 1.1866455078125, 1.2265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 12.0, 15.0, 7.0, 21.0, 27.0, 49.0, 87.0, 121.0, 199.0, 388.0, 907.0, 2279.0, 9755.0, 102537.0, 777665.0, 138114.0, 11706.0, 2730.0, 949.0, 408.0, 233.0, 119.0, 85.0, 35.0, 26.0, 21.0, 9.0, 15.0, 5.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -7.01129150390625, -6.8194580078125, -6.62762451171875, -6.435791015625, -6.24395751953125, -6.0521240234375, -5.86029052734375, -5.66845703125, -5.47662353515625, -5.2847900390625, -5.09295654296875, -4.901123046875, -4.70928955078125, -4.5174560546875, -4.32562255859375, -4.1337890625, -3.94195556640625, -3.7501220703125, -3.55828857421875, -3.366455078125, -3.17462158203125, -2.9827880859375, -2.79095458984375, -2.59912109375, -2.40728759765625, -2.2154541015625, -2.02362060546875, -1.831787109375, -1.63995361328125, -1.4481201171875, -1.25628662109375, -1.064453125, -0.87261962890625, -0.6807861328125, -0.48895263671875, -0.297119140625, -0.10528564453125, 0.0865478515625, 0.27838134765625, 0.47021484375, 0.66204833984375, 0.8538818359375, 1.04571533203125, 1.237548828125, 1.42938232421875, 1.6212158203125, 1.81304931640625, 2.0048828125, 2.19671630859375, 2.3885498046875, 2.58038330078125, 2.772216796875, 2.96405029296875, 3.1558837890625, 3.34771728515625, 3.53955078125, 3.73138427734375, 3.9232177734375, 4.11505126953125, 4.306884765625, 4.49871826171875, 4.6905517578125, 4.88238525390625, 5.07421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 5.0, 9.0, 14.0, 30.0, 38.0, 43.0, 65.0, 60.0, 85.0, 89.0, 84.0, 72.0, 80.0, 70.0, 72.0, 37.0, 33.0, 35.0, 11.0, 13.0, 9.0, 6.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.44512939453125, -7.1832275390625, -6.92132568359375, -6.659423828125, -6.39752197265625, -6.1356201171875, -5.87371826171875, -5.61181640625, -5.34991455078125, -5.0880126953125, -4.82611083984375, -4.564208984375, -4.30230712890625, -4.0404052734375, -3.77850341796875, -3.5166015625, -3.25469970703125, -2.9927978515625, -2.73089599609375, -2.468994140625, -2.20709228515625, -1.9451904296875, -1.68328857421875, -1.42138671875, -1.15948486328125, -0.8975830078125, -0.63568115234375, -0.373779296875, -0.11187744140625, 0.1500244140625, 0.41192626953125, 0.673828125, 0.93572998046875, 1.1976318359375, 1.45953369140625, 1.721435546875, 1.98333740234375, 2.2452392578125, 2.50714111328125, 2.76904296875, 3.03094482421875, 3.2928466796875, 3.55474853515625, 3.816650390625, 4.07855224609375, 4.3404541015625, 4.60235595703125, 4.8642578125, 5.12615966796875, 5.3880615234375, 5.64996337890625, 5.911865234375, 6.17376708984375, 6.4356689453125, 6.69757080078125, 6.95947265625, 7.22137451171875, 7.4832763671875, 7.74517822265625, 8.007080078125, 8.26898193359375, 8.5308837890625, 8.79278564453125, 9.0546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 6.0, 23.0, 20.0, 38.0, 43.0, 73.0, 75.0, 153.0, 233.0, 422.0, 912.0, 2793.0, 11569.0, 128945.0, 825853.0, 65393.0, 8000.0, 2115.0, 884.0, 366.0, 188.0, 131.0, 90.0, 51.0, 41.0, 31.0, 23.0, 26.0, 12.0, 7.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.06640625, -2.97174072265625, -2.8770751953125, -2.78240966796875, -2.687744140625, -2.59307861328125, -2.4984130859375, -2.40374755859375, -2.30908203125, -2.21441650390625, -2.1197509765625, -2.02508544921875, -1.930419921875, -1.83575439453125, -1.7410888671875, -1.64642333984375, -1.5517578125, -1.45709228515625, -1.3624267578125, -1.26776123046875, -1.173095703125, -1.07843017578125, -0.9837646484375, -0.88909912109375, -0.79443359375, -0.69976806640625, -0.6051025390625, -0.51043701171875, -0.415771484375, -0.32110595703125, -0.2264404296875, -0.13177490234375, -0.037109375, 0.05755615234375, 0.1522216796875, 0.24688720703125, 0.341552734375, 0.43621826171875, 0.5308837890625, 0.62554931640625, 0.72021484375, 0.81488037109375, 0.9095458984375, 1.00421142578125, 1.098876953125, 1.19354248046875, 1.2882080078125, 1.38287353515625, 1.4775390625, 1.57220458984375, 1.6668701171875, 1.76153564453125, 1.856201171875, 1.95086669921875, 2.0455322265625, 2.14019775390625, 2.23486328125, 2.32952880859375, 2.4241943359375, 2.51885986328125, 2.613525390625, 2.70819091796875, 2.8028564453125, 2.89752197265625, 2.9921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 15.0, 13.0, 20.0, 35.0, 57.0, 95.0, 124.0, 137.0, 149.0, 127.0, 101.0, 36.0, 33.0, 14.0, 15.0, 12.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002875328063964844, -0.0002743825316429138, -0.00026123225688934326, -0.0002480819821357727, -0.00023493170738220215, -0.0002217814326286316, -0.00020863115787506104, -0.00019548088312149048, -0.00018233060836791992, -0.00016918033361434937, -0.0001560300588607788, -0.00014287978410720825, -0.0001297295093536377, -0.00011657923460006714, -0.00010342895984649658, -9.027868509292603e-05, -7.712841033935547e-05, -6.397813558578491e-05, -5.0827860832214355e-05, -3.76775860786438e-05, -2.4527311325073242e-05, -1.1377036571502686e-05, 1.773238182067871e-06, 1.4923512935638428e-05, 2.8073787689208984e-05, 4.122406244277954e-05, 5.43743371963501e-05, 6.752461194992065e-05, 8.067488670349121e-05, 9.382516145706177e-05, 0.00010697543621063232, 0.00012012571096420288, 0.00013327598571777344, 0.000146426260471344, 0.00015957653522491455, 0.0001727268099784851, 0.00018587708473205566, 0.00019902735948562622, 0.00021217763423919678, 0.00022532790899276733, 0.0002384781837463379, 0.00025162845849990845, 0.000264778733253479, 0.00027792900800704956, 0.0002910792827606201, 0.0003042295575141907, 0.00031737983226776123, 0.0003305301070213318, 0.00034368038177490234, 0.0003568306565284729, 0.00036998093128204346, 0.000383131206035614, 0.00039628148078918457, 0.0004094317555427551, 0.0004225820302963257, 0.00043573230504989624, 0.0004488825798034668, 0.00046203285455703735, 0.0004751831293106079, 0.0004883334040641785, 0.000501483678817749, 0.0005146339535713196, 0.0005277842283248901, 0.0005409345030784607, 0.0005540847778320312]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 8.0, 11.0, 16.0, 34.0, 48.0, 102.0, 231.0, 541.0, 1742.0, 9786.0, 260038.0, 748833.0, 22835.0, 2924.0, 788.0, 286.0, 157.0, 75.0, 35.0, 23.0, 10.0, 8.0, 7.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.77734375, -3.67291259765625, -3.5684814453125, -3.46405029296875, -3.359619140625, -3.25518798828125, -3.1507568359375, -3.04632568359375, -2.94189453125, -2.83746337890625, -2.7330322265625, -2.62860107421875, -2.524169921875, -2.41973876953125, -2.3153076171875, -2.21087646484375, -2.1064453125, -2.00201416015625, -1.8975830078125, -1.79315185546875, -1.688720703125, -1.58428955078125, -1.4798583984375, -1.37542724609375, -1.27099609375, -1.16656494140625, -1.0621337890625, -0.95770263671875, -0.853271484375, -0.74884033203125, -0.6444091796875, -0.53997802734375, -0.435546875, -0.33111572265625, -0.2266845703125, -0.12225341796875, -0.017822265625, 0.08660888671875, 0.1910400390625, 0.29547119140625, 0.39990234375, 0.50433349609375, 0.6087646484375, 0.71319580078125, 0.817626953125, 0.92205810546875, 1.0264892578125, 1.13092041015625, 1.2353515625, 1.33978271484375, 1.4442138671875, 1.54864501953125, 1.653076171875, 1.75750732421875, 1.8619384765625, 1.96636962890625, 2.07080078125, 2.17523193359375, 2.2796630859375, 2.38409423828125, 2.488525390625, 2.59295654296875, 2.6973876953125, 2.80181884765625, 2.90625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 4.0, 9.0, 16.0, 39.0, 49.0, 95.0, 155.0, 234.0, 149.0, 127.0, 39.0, 28.0, 21.0, 9.0, 6.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.098358154296875, -2.97210693359375, -2.845855712890625, -2.7196044921875, -2.593353271484375, -2.46710205078125, -2.340850830078125, -2.214599609375, -2.088348388671875, -1.96209716796875, -1.835845947265625, -1.7095947265625, -1.583343505859375, -1.45709228515625, -1.330841064453125, -1.20458984375, -1.078338623046875, -0.95208740234375, -0.825836181640625, -0.6995849609375, -0.573333740234375, -0.44708251953125, -0.320831298828125, -0.194580078125, -0.068328857421875, 0.05792236328125, 0.184173583984375, 0.3104248046875, 0.436676025390625, 0.56292724609375, 0.689178466796875, 0.8154296875, 0.941680908203125, 1.06793212890625, 1.194183349609375, 1.3204345703125, 1.446685791015625, 1.57293701171875, 1.699188232421875, 1.825439453125, 1.951690673828125, 2.07794189453125, 2.204193115234375, 2.3304443359375, 2.456695556640625, 2.58294677734375, 2.709197998046875, 2.83544921875, 2.961700439453125, 3.08795166015625, 3.214202880859375, 3.3404541015625, 3.466705322265625, 3.59295654296875, 3.719207763671875, 3.845458984375, 3.971710205078125, 4.09796142578125, 4.224212646484375, 4.3504638671875, 4.476715087890625, 4.60296630859375, 4.729217529296875, 4.85546875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 20.0, 63.0, 161.0, 253.0, 249.0, 148.0, 64.0, 28.0, 12.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-96.59833526611328, -94.80694580078125, -93.01554870605469, -91.22415924072266, -89.43276977539062, -87.64137268066406, -85.84998321533203, -84.05859375, -82.26719665527344, -80.4758071899414, -78.68441009521484, -76.89302062988281, -75.10163116455078, -73.31023406982422, -71.51884460449219, -69.72745513916016, -67.93606567382812, -66.1446762084961, -64.35327911376953, -62.5618896484375, -60.7704963684082, -58.979103088378906, -57.187713623046875, -55.39632034301758, -53.60492706298828, -51.813533782958984, -50.02214431762695, -48.230751037597656, -46.43935775756836, -44.64796447753906, -42.85657501220703, -41.065181732177734, -39.27378463745117, -37.482391357421875, -35.691001892089844, -33.89960861206055, -32.10821533203125, -30.316823959350586, -28.525432586669922, -26.734039306640625, -24.94264793395996, -23.151256561279297, -21.35986328125, -19.568471908569336, -17.777080535888672, -15.985687255859375, -14.194295883178711, -12.40290355682373, -10.61151123046875, -8.82011890411377, -7.028727054595947, -5.237335205078125, -3.4459428787231445, -1.654550552368164, 0.1368408203125, 1.9282331466674805, 3.719625473022461, 5.511017799377441, 7.302409648895264, 9.093801498413086, 10.885193824768066, 12.676586151123047, 14.467977523803711, 16.259368896484375, 18.050762176513672]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 9.0, 2.0, 8.0, 5.0, 18.0, 16.0, 21.0, 22.0, 20.0, 17.0, 30.0, 38.0, 41.0, 45.0, 51.0, 59.0, 66.0, 42.0, 41.0, 51.0, 56.0, 50.0, 36.0, 46.0, 25.0, 23.0, 17.0, 30.0, 17.0, 17.0, 12.0, 15.0, 10.0, 3.0, 11.0, 6.0, 6.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.830528259277344, -29.80434226989746, -28.778156280517578, -27.751970291137695, -26.725784301757812, -25.69959831237793, -24.673412322998047, -23.647226333618164, -22.62104034423828, -21.5948543548584, -20.568668365478516, -19.542482376098633, -18.51629638671875, -17.490110397338867, -16.463924407958984, -15.437738418579102, -14.411552429199219, -13.385366439819336, -12.359180450439453, -11.33299446105957, -10.306808471679688, -9.280622482299805, -8.254436492919922, -7.228250503540039, -6.202064514160156, -5.175878524780273, -4.149692535400391, -3.123506546020508, -2.097320556640625, -1.0711345672607422, -0.044948577880859375, 0.9812374114990234, 2.0074234008789062, 3.033609390258789, 4.059795379638672, 5.085981369018555, 6.1121673583984375, 7.13835334777832, 8.164539337158203, 9.190725326538086, 10.216911315917969, 11.243097305297852, 12.269283294677734, 13.295469284057617, 14.3216552734375, 15.347841262817383, 16.374027252197266, 17.40021324157715, 18.42639923095703, 19.452585220336914, 20.478771209716797, 21.50495719909668, 22.531143188476562, 23.557329177856445, 24.583515167236328, 25.60970115661621, 26.635887145996094, 27.662073135375977, 28.68825912475586, 29.714445114135742, 30.740631103515625, 31.766817092895508, 32.79300308227539, 33.819190979003906, 34.845375061035156]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 16.0, 13.0, 32.0, 48.0, 48.0, 94.0, 124.0, 203.0, 334.0, 532.0, 869.0, 1675.0, 3084.0, 6647.0, 16821.0, 57977.0, 3309463.0, 712840.0, 53439.0, 16277.0, 6494.0, 3057.0, 1638.0, 938.0, 558.0, 372.0, 227.0, 149.0, 92.0, 67.0, 32.0, 28.0, 26.0, 14.0, 9.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9384765625, -1.8666229248046875, -1.794769287109375, -1.7229156494140625, -1.65106201171875, -1.5792083740234375, -1.507354736328125, -1.4355010986328125, -1.3636474609375, -1.2917938232421875, -1.219940185546875, -1.1480865478515625, -1.07623291015625, -1.0043792724609375, -0.932525634765625, -0.8606719970703125, -0.788818359375, -0.7169647216796875, -0.645111083984375, -0.5732574462890625, -0.50140380859375, -0.4295501708984375, -0.357696533203125, -0.2858428955078125, -0.2139892578125, -0.1421356201171875, -0.070281982421875, 0.0015716552734375, 0.07342529296875, 0.1452789306640625, 0.217132568359375, 0.2889862060546875, 0.36083984375, 0.4326934814453125, 0.504547119140625, 0.5764007568359375, 0.64825439453125, 0.7201080322265625, 0.791961669921875, 0.8638153076171875, 0.9356689453125, 1.0075225830078125, 1.079376220703125, 1.1512298583984375, 1.22308349609375, 1.2949371337890625, 1.366790771484375, 1.4386444091796875, 1.510498046875, 1.5823516845703125, 1.654205322265625, 1.7260589599609375, 1.79791259765625, 1.8697662353515625, 1.941619873046875, 2.0134735107421875, 2.0853271484375, 2.1571807861328125, 2.229034423828125, 2.3008880615234375, 2.37274169921875, 2.4445953369140625, 2.516448974609375, 2.5883026123046875, 2.66015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 2.0, 9.0, 15.0, 17.0, 22.0, 23.0, 23.0, 49.0, 42.0, 44.0, 47.0, 58.0, 75.0, 47.0, 57.0, 70.0, 52.0, 63.0, 45.0, 33.0, 38.0, 27.0, 25.0, 22.0, 14.0, 12.0, 12.0, 15.0, 4.0, 4.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4990234375, -1.4566802978515625, -1.414337158203125, -1.3719940185546875, -1.32965087890625, -1.2873077392578125, -1.244964599609375, -1.2026214599609375, -1.1602783203125, -1.1179351806640625, -1.075592041015625, -1.0332489013671875, -0.99090576171875, -0.9485626220703125, -0.906219482421875, -0.8638763427734375, -0.821533203125, -0.7791900634765625, -0.736846923828125, -0.6945037841796875, -0.65216064453125, -0.6098175048828125, -0.567474365234375, -0.5251312255859375, -0.4827880859375, -0.4404449462890625, -0.398101806640625, -0.3557586669921875, -0.31341552734375, -0.2710723876953125, -0.228729248046875, -0.1863861083984375, -0.14404296875, -0.1016998291015625, -0.059356689453125, -0.0170135498046875, 0.02532958984375, 0.0676727294921875, 0.110015869140625, 0.1523590087890625, 0.1947021484375, 0.2370452880859375, 0.279388427734375, 0.3217315673828125, 0.36407470703125, 0.4064178466796875, 0.448760986328125, 0.4911041259765625, 0.533447265625, 0.5757904052734375, 0.618133544921875, 0.6604766845703125, 0.70281982421875, 0.7451629638671875, 0.787506103515625, 0.8298492431640625, 0.8721923828125, 0.9145355224609375, 0.956878662109375, 0.9992218017578125, 1.04156494140625, 1.0839080810546875, 1.126251220703125, 1.1685943603515625, 1.2109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 12.0, 14.0, 8.0, 25.0, 26.0, 35.0, 58.0, 77.0, 110.0, 146.0, 213.0, 296.0, 471.0, 788.0, 1149.0, 2136.0, 3852.0, 8700.0, 22959.0, 99332.0, 3721222.0, 267553.0, 40531.0, 12534.0, 5396.0, 2683.0, 1433.0, 823.0, 562.0, 336.0, 269.0, 140.0, 121.0, 67.0, 71.0, 35.0, 33.0, 24.0, 12.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.232421875, -2.16619873046875, -2.0999755859375, -2.03375244140625, -1.967529296875, -1.90130615234375, -1.8350830078125, -1.76885986328125, -1.70263671875, -1.63641357421875, -1.5701904296875, -1.50396728515625, -1.437744140625, -1.37152099609375, -1.3052978515625, -1.23907470703125, -1.1728515625, -1.10662841796875, -1.0404052734375, -0.97418212890625, -0.907958984375, -0.84173583984375, -0.7755126953125, -0.70928955078125, -0.64306640625, -0.57684326171875, -0.5106201171875, -0.44439697265625, -0.378173828125, -0.31195068359375, -0.2457275390625, -0.17950439453125, -0.11328125, -0.04705810546875, 0.0191650390625, 0.08538818359375, 0.151611328125, 0.21783447265625, 0.2840576171875, 0.35028076171875, 0.41650390625, 0.48272705078125, 0.5489501953125, 0.61517333984375, 0.681396484375, 0.74761962890625, 0.8138427734375, 0.88006591796875, 0.9462890625, 1.01251220703125, 1.0787353515625, 1.14495849609375, 1.211181640625, 1.27740478515625, 1.3436279296875, 1.40985107421875, 1.47607421875, 1.54229736328125, 1.6085205078125, 1.67474365234375, 1.740966796875, 1.80718994140625, 1.8734130859375, 1.93963623046875, 2.005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 9.0, 5.0, 20.0, 16.0, 40.0, 51.0, 116.0, 764.0, 2632.0, 194.0, 72.0, 54.0, 31.0, 15.0, 9.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.83544921875, -0.8140640258789062, -0.7926788330078125, -0.7712936401367188, -0.749908447265625, -0.7285232543945312, -0.7071380615234375, -0.6857528686523438, -0.66436767578125, -0.6429824829101562, -0.6215972900390625, -0.6002120971679688, -0.578826904296875, -0.5574417114257812, -0.5360565185546875, -0.5146713256835938, -0.4932861328125, -0.47190093994140625, -0.4505157470703125, -0.42913055419921875, -0.407745361328125, -0.38636016845703125, -0.3649749755859375, -0.34358978271484375, -0.32220458984375, -0.30081939697265625, -0.2794342041015625, -0.25804901123046875, -0.236663818359375, -0.21527862548828125, -0.1938934326171875, -0.17250823974609375, -0.151123046875, -0.12973785400390625, -0.1083526611328125, -0.08696746826171875, -0.065582275390625, -0.04419708251953125, -0.0228118896484375, -0.00142669677734375, 0.01995849609375, 0.04134368896484375, 0.0627288818359375, 0.08411407470703125, 0.105499267578125, 0.12688446044921875, 0.1482696533203125, 0.16965484619140625, 0.1910400390625, 0.21242523193359375, 0.2338104248046875, 0.25519561767578125, 0.276580810546875, 0.29796600341796875, 0.3193511962890625, 0.34073638916015625, 0.36212158203125, 0.38350677490234375, 0.4048919677734375, 0.42627716064453125, 0.447662353515625, 0.46904754638671875, 0.4904327392578125, 0.5118179321289062, 0.533203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 11.0, 72.0, 179.0, 292.0, 268.0, 122.0, 35.0, 12.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6621408462524414, -3.482419490814209, -3.3026981353759766, -3.122976779937744, -2.9432554244995117, -2.7635340690612793, -2.583812713623047, -2.4040913581848145, -2.224370002746582, -2.0446486473083496, -1.8649272918701172, -1.6852059364318848, -1.5054845809936523, -1.32576322555542, -1.146041750907898, -0.9663203954696655, -0.7865989208221436, -0.6068775653839111, -0.4271561801433563, -0.2474347949028015, -0.06771343946456909, 0.11200791597366333, 0.2917293310165405, 0.47145068645477295, 0.6511720418930054, 0.8308933973312378, 1.0106147527694702, 1.1903362274169922, 1.3700575828552246, 1.549778938293457, 1.7295002937316895, 1.9092216491699219, 2.0889430046081543, 2.2686643600463867, 2.448385715484619, 2.6281070709228516, 2.807828426361084, 2.9875497817993164, 3.167271137237549, 3.3469924926757812, 3.5267138481140137, 3.706435203552246, 3.8861565589904785, 4.065877914428711, 4.245599269866943, 4.425320625305176, 4.605041980743408, 4.784763336181641, 4.964485168457031, 5.144206523895264, 5.323927879333496, 5.5036492347717285, 5.683370590209961, 5.863091945648193, 6.042813301086426, 6.222534656524658, 6.402256011962891, 6.581977367401123, 6.7616987228393555, 6.941420078277588, 7.12114143371582, 7.300862789154053, 7.480584144592285, 7.660305500030518, 7.84002685546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 13.0, 2.0, 12.0, 9.0, 11.0, 19.0, 25.0, 24.0, 18.0, 23.0, 36.0, 26.0, 27.0, 25.0, 32.0, 36.0, 44.0, 33.0, 35.0, 49.0, 27.0, 37.0, 36.0, 41.0, 41.0, 39.0, 35.0, 30.0, 23.0, 24.0, 29.0, 19.0, 21.0, 16.0, 20.0, 9.0, 10.0, 8.0, 7.0, 9.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3430497646331787, -1.2991077899932861, -1.255165934562683, -1.21122407913208, -1.1672821044921875, -1.123340129852295, -1.079398274421692, -1.0354564189910889, -0.9915144443511963, -0.9475725293159485, -0.9036306142807007, -0.8596886992454529, -0.8157467842102051, -0.7718048691749573, -0.7278629541397095, -0.6839210391044617, -0.6399791240692139, -0.5960372090339661, -0.5520952939987183, -0.5081533789634705, -0.46421146392822266, -0.42026954889297485, -0.37632763385772705, -0.33238571882247925, -0.28844380378723145, -0.24450188875198364, -0.20055997371673584, -0.15661805868148804, -0.11267614364624023, -0.06873422861099243, -0.02479231357574463, 0.019149601459503174, 0.06309151649475098, 0.10703343152999878, 0.15097534656524658, 0.19491726160049438, 0.2388591766357422, 0.28280109167099, 0.3267430067062378, 0.3706849217414856, 0.4146268367767334, 0.4585687518119812, 0.502510666847229, 0.5464525818824768, 0.5903944969177246, 0.6343364119529724, 0.6782783269882202, 0.722220242023468, 0.7661621570587158, 0.8101040720939636, 0.8540459871292114, 0.8979879021644592, 0.941929817199707, 0.9858717322349548, 1.0298136472702026, 1.0737555027008057, 1.1176974773406982, 1.1616394519805908, 1.2055813074111938, 1.2495231628417969, 1.2934651374816895, 1.337407112121582, 1.381348967552185, 1.425290822982788, 1.4692327976226807]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 18.0, 18.0, 27.0, 33.0, 76.0, 127.0, 256.0, 611.0, 1440.0, 4414.0, 16749.0, 78335.0, 350520.0, 443777.0, 117738.0, 24391.0, 6490.0, 2075.0, 715.0, 327.0, 153.0, 88.0, 53.0, 32.0, 22.0, 13.0, 11.0, 10.0, 8.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.05078125, -3.93865966796875, -3.8265380859375, -3.71441650390625, -3.602294921875, -3.49017333984375, -3.3780517578125, -3.26593017578125, -3.15380859375, -3.04168701171875, -2.9295654296875, -2.81744384765625, -2.705322265625, -2.59320068359375, -2.4810791015625, -2.36895751953125, -2.2568359375, -2.14471435546875, -2.0325927734375, -1.92047119140625, -1.808349609375, -1.69622802734375, -1.5841064453125, -1.47198486328125, -1.35986328125, -1.24774169921875, -1.1356201171875, -1.02349853515625, -0.911376953125, -0.79925537109375, -0.6871337890625, -0.57501220703125, -0.462890625, -0.35076904296875, -0.2386474609375, -0.12652587890625, -0.014404296875, 0.09771728515625, 0.2098388671875, 0.32196044921875, 0.43408203125, 0.54620361328125, 0.6583251953125, 0.77044677734375, 0.882568359375, 0.99468994140625, 1.1068115234375, 1.21893310546875, 1.3310546875, 1.44317626953125, 1.5552978515625, 1.66741943359375, 1.779541015625, 1.89166259765625, 2.0037841796875, 2.11590576171875, 2.22802734375, 2.34014892578125, 2.4522705078125, 2.56439208984375, 2.676513671875, 2.78863525390625, 2.9007568359375, 3.01287841796875, 3.125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 8.0, 6.0, 6.0, 9.0, 14.0, 22.0, 21.0, 23.0, 36.0, 44.0, 45.0, 47.0, 51.0, 74.0, 44.0, 60.0, 71.0, 63.0, 50.0, 55.0, 48.0, 31.0, 24.0, 26.0, 28.0, 20.0, 15.0, 11.0, 12.0, 11.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5556640625, -1.512298583984375, -1.46893310546875, -1.425567626953125, -1.3822021484375, -1.338836669921875, -1.29547119140625, -1.252105712890625, -1.208740234375, -1.165374755859375, -1.12200927734375, -1.078643798828125, -1.0352783203125, -0.991912841796875, -0.94854736328125, -0.905181884765625, -0.86181640625, -0.818450927734375, -0.77508544921875, -0.731719970703125, -0.6883544921875, -0.644989013671875, -0.60162353515625, -0.558258056640625, -0.514892578125, -0.471527099609375, -0.42816162109375, -0.384796142578125, -0.3414306640625, -0.298065185546875, -0.25469970703125, -0.211334228515625, -0.16796875, -0.124603271484375, -0.08123779296875, -0.037872314453125, 0.0054931640625, 0.048858642578125, 0.09222412109375, 0.135589599609375, 0.178955078125, 0.222320556640625, 0.26568603515625, 0.309051513671875, 0.3524169921875, 0.395782470703125, 0.43914794921875, 0.482513427734375, 0.52587890625, 0.569244384765625, 0.61260986328125, 0.655975341796875, 0.6993408203125, 0.742706298828125, 0.78607177734375, 0.829437255859375, 0.872802734375, 0.916168212890625, 0.95953369140625, 1.002899169921875, 1.0462646484375, 1.089630126953125, 1.13299560546875, 1.176361083984375, 1.2197265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 12.0, 16.0, 31.0, 46.0, 93.0, 183.0, 398.0, 1061.0, 5011.0, 92015.0, 902275.0, 42403.0, 3448.0, 877.0, 339.0, 142.0, 90.0, 46.0, 23.0, 13.0, 4.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.9375, -12.61724853515625, -12.2969970703125, -11.97674560546875, -11.656494140625, -11.33624267578125, -11.0159912109375, -10.69573974609375, -10.37548828125, -10.05523681640625, -9.7349853515625, -9.41473388671875, -9.094482421875, -8.77423095703125, -8.4539794921875, -8.13372802734375, -7.8134765625, -7.49322509765625, -7.1729736328125, -6.85272216796875, -6.532470703125, -6.21221923828125, -5.8919677734375, -5.57171630859375, -5.25146484375, -4.93121337890625, -4.6109619140625, -4.29071044921875, -3.970458984375, -3.65020751953125, -3.3299560546875, -3.00970458984375, -2.689453125, -2.36920166015625, -2.0489501953125, -1.72869873046875, -1.408447265625, -1.08819580078125, -0.7679443359375, -0.44769287109375, -0.12744140625, 0.19281005859375, 0.5130615234375, 0.83331298828125, 1.153564453125, 1.47381591796875, 1.7940673828125, 2.11431884765625, 2.4345703125, 2.75482177734375, 3.0750732421875, 3.39532470703125, 3.715576171875, 4.03582763671875, 4.3560791015625, 4.67633056640625, 4.99658203125, 5.31683349609375, 5.6370849609375, 5.95733642578125, 6.277587890625, 6.59783935546875, 6.9180908203125, 7.23834228515625, 7.55859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 7.0, 7.0, 13.0, 15.0, 19.0, 24.0, 38.0, 56.0, 55.0, 80.0, 89.0, 92.0, 81.0, 95.0, 85.0, 66.0, 49.0, 43.0, 25.0, 23.0, 17.0, 9.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.946533203125, -15.54931640625, -15.152099609375, -14.7548828125, -14.357666015625, -13.96044921875, -13.563232421875, -13.166015625, -12.768798828125, -12.37158203125, -11.974365234375, -11.5771484375, -11.179931640625, -10.78271484375, -10.385498046875, -9.98828125, -9.591064453125, -9.19384765625, -8.796630859375, -8.3994140625, -8.002197265625, -7.60498046875, -7.207763671875, -6.810546875, -6.413330078125, -6.01611328125, -5.618896484375, -5.2216796875, -4.824462890625, -4.42724609375, -4.030029296875, -3.6328125, -3.235595703125, -2.83837890625, -2.441162109375, -2.0439453125, -1.646728515625, -1.24951171875, -0.852294921875, -0.455078125, -0.057861328125, 0.33935546875, 0.736572265625, 1.1337890625, 1.531005859375, 1.92822265625, 2.325439453125, 2.72265625, 3.119873046875, 3.51708984375, 3.914306640625, 4.3115234375, 4.708740234375, 5.10595703125, 5.503173828125, 5.900390625, 6.297607421875, 6.69482421875, 7.092041015625, 7.4892578125, 7.886474609375, 8.28369140625, 8.680908203125, 9.078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 26.0, 39.0, 56.0, 151.0, 904.0, 87116.0, 958156.0, 1699.0, 233.0, 85.0, 46.0, 18.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -16.068359375, -15.66796875, -15.267578125, -14.8671875, -14.466796875, -14.06640625, -13.666015625, -13.265625, -12.865234375, -12.46484375, -12.064453125, -11.6640625, -11.263671875, -10.86328125, -10.462890625, -10.0625, -9.662109375, -9.26171875, -8.861328125, -8.4609375, -8.060546875, -7.66015625, -7.259765625, -6.859375, -6.458984375, -6.05859375, -5.658203125, -5.2578125, -4.857421875, -4.45703125, -4.056640625, -3.65625, -3.255859375, -2.85546875, -2.455078125, -2.0546875, -1.654296875, -1.25390625, -0.853515625, -0.453125, -0.052734375, 0.34765625, 0.748046875, 1.1484375, 1.548828125, 1.94921875, 2.349609375, 2.75, 3.150390625, 3.55078125, 3.951171875, 4.3515625, 4.751953125, 5.15234375, 5.552734375, 5.953125, 6.353515625, 6.75390625, 7.154296875, 7.5546875, 7.955078125, 8.35546875, 8.755859375, 9.15625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 12.0, 15.0, 37.0, 57.0, 95.0, 107.0, 149.0, 146.0, 142.0, 93.0, 51.0, 32.0, 29.0, 12.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004754066467285156, -0.0004635229706764221, -0.0004516392946243286, -0.0004397556185722351, -0.0004278719425201416, -0.0004159882664680481, -0.0004041045904159546, -0.0003922209143638611, -0.0003803372383117676, -0.00036845356225967407, -0.00035656988620758057, -0.00034468621015548706, -0.00033280253410339355, -0.00032091885805130005, -0.00030903518199920654, -0.00029715150594711304, -0.00028526782989501953, -0.000273384153842926, -0.0002615004777908325, -0.000249616801738739, -0.0002377331256866455, -0.000225849449634552, -0.0002139657735824585, -0.000202082097530365, -0.00019019842147827148, -0.00017831474542617798, -0.00016643106937408447, -0.00015454739332199097, -0.00014266371726989746, -0.00013078004121780396, -0.00011889636516571045, -0.00010701268911361694, -9.512901306152344e-05, -8.324533700942993e-05, -7.136166095733643e-05, -5.947798490524292e-05, -4.7594308853149414e-05, -3.571063280105591e-05, -2.3826956748962402e-05, -1.1943280696868896e-05, -5.960464477539063e-08, 1.1824071407318115e-05, 2.370774745941162e-05, 3.559142351150513e-05, 4.747509956359863e-05, 5.935877561569214e-05, 7.124245166778564e-05, 8.312612771987915e-05, 9.500980377197266e-05, 0.00010689347982406616, 0.00011877715587615967, 0.00013066083192825317, 0.00014254450798034668, 0.00015442818403244019, 0.0001663118600845337, 0.0001781955361366272, 0.0001900792121887207, 0.0002019628882408142, 0.00021384656429290771, 0.00022573024034500122, 0.00023761391639709473, 0.00024949759244918823, 0.00026138126850128174, 0.00027326494455337524, 0.00028514862060546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 7.0, 16.0, 25.0, 63.0, 90.0, 263.0, 813.0, 3527.0, 42441.0, 959483.0, 37417.0, 3116.0, 777.0, 275.0, 93.0, 47.0, 35.0, 19.0, 4.0, 8.0, 8.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.666015625, -3.532623291015625, -3.39923095703125, -3.265838623046875, -3.1324462890625, -2.999053955078125, -2.86566162109375, -2.732269287109375, -2.598876953125, -2.465484619140625, -2.33209228515625, -2.198699951171875, -2.0653076171875, -1.931915283203125, -1.79852294921875, -1.665130615234375, -1.53173828125, -1.398345947265625, -1.26495361328125, -1.131561279296875, -0.9981689453125, -0.864776611328125, -0.73138427734375, -0.597991943359375, -0.464599609375, -0.331207275390625, -0.19781494140625, -0.064422607421875, 0.0689697265625, 0.202362060546875, 0.33575439453125, 0.469146728515625, 0.6025390625, 0.735931396484375, 0.86932373046875, 1.002716064453125, 1.1361083984375, 1.269500732421875, 1.40289306640625, 1.536285400390625, 1.669677734375, 1.803070068359375, 1.93646240234375, 2.069854736328125, 2.2032470703125, 2.336639404296875, 2.47003173828125, 2.603424072265625, 2.73681640625, 2.870208740234375, 3.00360107421875, 3.136993408203125, 3.2703857421875, 3.403778076171875, 3.53717041015625, 3.670562744140625, 3.803955078125, 3.937347412109375, 4.07073974609375, 4.204132080078125, 4.3375244140625, 4.470916748046875, 4.60430908203125, 4.737701416015625, 4.87109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 7.0, 4.0, 23.0, 25.0, 64.0, 135.0, 263.0, 258.0, 120.0, 38.0, 20.0, 19.0, 1.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.390625, -7.20086669921875, -7.0111083984375, -6.82135009765625, -6.631591796875, -6.44183349609375, -6.2520751953125, -6.06231689453125, -5.87255859375, -5.68280029296875, -5.4930419921875, -5.30328369140625, -5.113525390625, -4.92376708984375, -4.7340087890625, -4.54425048828125, -4.3544921875, -4.16473388671875, -3.9749755859375, -3.78521728515625, -3.595458984375, -3.40570068359375, -3.2159423828125, -3.02618408203125, -2.83642578125, -2.64666748046875, -2.4569091796875, -2.26715087890625, -2.077392578125, -1.88763427734375, -1.6978759765625, -1.50811767578125, -1.318359375, -1.12860107421875, -0.9388427734375, -0.74908447265625, -0.559326171875, -0.36956787109375, -0.1798095703125, 0.00994873046875, 0.19970703125, 0.38946533203125, 0.5792236328125, 0.76898193359375, 0.958740234375, 1.14849853515625, 1.3382568359375, 1.52801513671875, 1.7177734375, 1.90753173828125, 2.0972900390625, 2.28704833984375, 2.476806640625, 2.66656494140625, 2.8563232421875, 3.04608154296875, 3.23583984375, 3.42559814453125, 3.6153564453125, 3.80511474609375, 3.994873046875, 4.18463134765625, 4.3743896484375, 4.56414794921875, 4.75390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 18.0, 23.0, 51.0, 75.0, 117.0, 155.0, 181.0, 142.0, 94.0, 64.0, 32.0, 16.0, 14.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.954381942749023, -27.606109619140625, -26.25783920288086, -24.90956687927246, -23.561294555664062, -22.213024139404297, -20.8647518157959, -19.5164794921875, -18.168209075927734, -16.819936752319336, -15.471665382385254, -14.123394012451172, -12.775121688842773, -11.426850318908691, -10.07857894897461, -8.730306625366211, -7.3820343017578125, -6.033762454986572, -4.685490608215332, -3.33721923828125, -1.9889473915100098, -0.6406755447387695, 0.7075958251953125, 2.055868148803711, 3.404139518737793, 4.752411365509033, 6.100683212280273, 7.4489545822143555, 8.797225952148438, 10.145498275756836, 11.493769645690918, 12.842041969299316, 14.190311431884766, 15.538582801818848, 16.88685417175293, 18.235126495361328, 19.583398818969727, 20.931671142578125, 22.27994155883789, 23.62821388244629, 24.976486206054688, 26.324758529663086, 27.67302894592285, 29.02130126953125, 30.36957359313965, 31.717845916748047, 33.06611633300781, 34.414390563964844, 35.762657165527344, 37.11092758178711, 38.45920181274414, 39.807472229003906, 41.15574264526367, 42.5040168762207, 43.85228729248047, 45.2005615234375, 46.548831939697266, 47.89710235595703, 49.24537658691406, 50.59364700317383, 51.941917419433594, 53.290191650390625, 54.63846206665039, 55.986732482910156, 57.33500671386719]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 10.0, 16.0, 16.0, 21.0, 17.0, 33.0, 28.0, 22.0, 52.0, 47.0, 45.0, 44.0, 56.0, 71.0, 66.0, 59.0, 42.0, 47.0, 43.0, 46.0, 35.0, 32.0, 31.0, 25.0, 17.0, 12.0, 15.0, 9.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.43495178222656, -38.23347091674805, -37.0319938659668, -35.83051300048828, -34.629032135009766, -33.427555084228516, -32.22607421875, -31.024595260620117, -29.823116302490234, -28.62163734436035, -27.420156478881836, -26.218677520751953, -25.01719856262207, -23.815719604492188, -22.614238739013672, -21.41275978088379, -20.211278915405273, -19.00979995727539, -17.808319091796875, -16.606840133666992, -15.40536117553711, -14.20388126373291, -13.002401351928711, -11.800922393798828, -10.599442481994629, -9.39796257019043, -8.196483612060547, -6.995003700256348, -5.793524265289307, -4.592044830322266, -3.3905649185180664, -2.1890859603881836, -0.9876060485839844, 0.2138735055923462, 1.4153530597686768, 2.616832733154297, 3.818312168121338, 5.019791603088379, 6.221271514892578, 7.422750473022461, 8.62423038482666, 9.82571029663086, 11.027189254760742, 12.228669166564941, 13.43014907836914, 14.631628036499023, 15.833107948303223, 17.034587860107422, 18.236066818237305, 19.437545776367188, 20.639026641845703, 21.840505599975586, 23.04198455810547, 24.243465423583984, 25.444944381713867, 26.64642333984375, 27.847904205322266, 29.04938316345215, 30.250864028930664, 31.452342987060547, 32.65382385253906, 33.85530090332031, 35.05678176879883, 36.258262634277344, 37.459739685058594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 12.0, 8.0, 14.0, 8.0, 17.0, 33.0, 46.0, 60.0, 97.0, 160.0, 285.0, 484.0, 961.0, 1928.0, 4784.0, 14538.0, 77981.0, 3898472.0, 160568.0, 22184.0, 6507.0, 2603.0, 1114.0, 555.0, 314.0, 196.0, 122.0, 75.0, 40.0, 33.0, 26.0, 15.0, 11.0, 11.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.279296875, -3.156219482421875, -3.03314208984375, -2.910064697265625, -2.7869873046875, -2.663909912109375, -2.54083251953125, -2.417755126953125, -2.294677734375, -2.171600341796875, -2.04852294921875, -1.925445556640625, -1.8023681640625, -1.679290771484375, -1.55621337890625, -1.433135986328125, -1.31005859375, -1.186981201171875, -1.06390380859375, -0.940826416015625, -0.8177490234375, -0.694671630859375, -0.57159423828125, -0.448516845703125, -0.325439453125, -0.202362060546875, -0.07928466796875, 0.043792724609375, 0.1668701171875, 0.289947509765625, 0.41302490234375, 0.536102294921875, 0.6591796875, 0.782257080078125, 0.90533447265625, 1.028411865234375, 1.1514892578125, 1.274566650390625, 1.39764404296875, 1.520721435546875, 1.643798828125, 1.766876220703125, 1.88995361328125, 2.013031005859375, 2.1361083984375, 2.259185791015625, 2.38226318359375, 2.505340576171875, 2.62841796875, 2.751495361328125, 2.87457275390625, 2.997650146484375, 3.1207275390625, 3.243804931640625, 3.36688232421875, 3.489959716796875, 3.613037109375, 3.736114501953125, 3.85919189453125, 3.982269287109375, 4.1053466796875, 4.228424072265625, 4.35150146484375, 4.474578857421875, 4.59765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 14.0, 9.0, 23.0, 19.0, 32.0, 43.0, 39.0, 55.0, 87.0, 66.0, 99.0, 101.0, 65.0, 70.0, 44.0, 47.0, 39.0, 21.0, 30.0, 19.0, 10.0, 10.0, 9.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.693359375, -1.630615234375, -1.56787109375, -1.505126953125, -1.4423828125, -1.379638671875, -1.31689453125, -1.254150390625, -1.19140625, -1.128662109375, -1.06591796875, -1.003173828125, -0.9404296875, -0.877685546875, -0.81494140625, -0.752197265625, -0.689453125, -0.626708984375, -0.56396484375, -0.501220703125, -0.4384765625, -0.375732421875, -0.31298828125, -0.250244140625, -0.1875, -0.124755859375, -0.06201171875, 0.000732421875, 0.0634765625, 0.126220703125, 0.18896484375, 0.251708984375, 0.314453125, 0.377197265625, 0.43994140625, 0.502685546875, 0.5654296875, 0.628173828125, 0.69091796875, 0.753662109375, 0.81640625, 0.879150390625, 0.94189453125, 1.004638671875, 1.0673828125, 1.130126953125, 1.19287109375, 1.255615234375, 1.318359375, 1.381103515625, 1.44384765625, 1.506591796875, 1.5693359375, 1.632080078125, 1.69482421875, 1.757568359375, 1.8203125, 1.883056640625, 1.94580078125, 2.008544921875, 2.0712890625, 2.134033203125, 2.19677734375, 2.259521484375, 2.322265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 12.0, 17.0, 22.0, 26.0, 58.0, 94.0, 112.0, 162.0, 273.0, 446.0, 795.0, 1426.0, 2935.0, 6127.0, 14400.0, 42287.0, 194073.0, 3607810.0, 244808.0, 48559.0, 16042.0, 6865.0, 3186.0, 1615.0, 812.0, 461.0, 304.0, 183.0, 105.0, 83.0, 65.0, 26.0, 25.0, 26.0, 19.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.267578125, -2.18817138671875, -2.1087646484375, -2.02935791015625, -1.949951171875, -1.87054443359375, -1.7911376953125, -1.71173095703125, -1.63232421875, -1.55291748046875, -1.4735107421875, -1.39410400390625, -1.314697265625, -1.23529052734375, -1.1558837890625, -1.07647705078125, -0.9970703125, -0.91766357421875, -0.8382568359375, -0.75885009765625, -0.679443359375, -0.60003662109375, -0.5206298828125, -0.44122314453125, -0.36181640625, -0.28240966796875, -0.2030029296875, -0.12359619140625, -0.044189453125, 0.03521728515625, 0.1146240234375, 0.19403076171875, 0.2734375, 0.35284423828125, 0.4322509765625, 0.51165771484375, 0.591064453125, 0.67047119140625, 0.7498779296875, 0.82928466796875, 0.90869140625, 0.98809814453125, 1.0675048828125, 1.14691162109375, 1.226318359375, 1.30572509765625, 1.3851318359375, 1.46453857421875, 1.5439453125, 1.62335205078125, 1.7027587890625, 1.78216552734375, 1.861572265625, 1.94097900390625, 2.0203857421875, 2.09979248046875, 2.17919921875, 2.25860595703125, 2.3380126953125, 2.41741943359375, 2.496826171875, 2.57623291015625, 2.6556396484375, 2.73504638671875, 2.814453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 13.0, 15.0, 14.0, 25.0, 29.0, 63.0, 141.0, 269.0, 2719.0, 431.0, 138.0, 71.0, 47.0, 31.0, 18.0, 10.0, 6.0, 6.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5090255737304688, -0.4765472412109375, -0.44406890869140625, -0.411590576171875, -0.37911224365234375, -0.3466339111328125, -0.31415557861328125, -0.28167724609375, -0.24919891357421875, -0.2167205810546875, -0.18424224853515625, -0.151763916015625, -0.11928558349609375, -0.0868072509765625, -0.05432891845703125, -0.0218505859375, 0.01062774658203125, 0.0431060791015625, 0.07558441162109375, 0.108062744140625, 0.14054107666015625, 0.1730194091796875, 0.20549774169921875, 0.23797607421875, 0.27045440673828125, 0.3029327392578125, 0.33541107177734375, 0.367889404296875, 0.40036773681640625, 0.4328460693359375, 0.46532440185546875, 0.497802734375, 0.5302810668945312, 0.5627593994140625, 0.5952377319335938, 0.627716064453125, 0.6601943969726562, 0.6926727294921875, 0.7251510620117188, 0.75762939453125, 0.7901077270507812, 0.8225860595703125, 0.8550643920898438, 0.887542724609375, 0.9200210571289062, 0.9524993896484375, 0.9849777221679688, 1.0174560546875, 1.0499343872070312, 1.0824127197265625, 1.1148910522460938, 1.147369384765625, 1.1798477172851562, 1.2123260498046875, 1.2448043823242188, 1.27728271484375, 1.3097610473632812, 1.3422393798828125, 1.3747177124023438, 1.407196044921875, 1.4396743774414062, 1.4721527099609375, 1.5046310424804688, 1.537109375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 10.0, 14.0, 11.0, 31.0, 42.0, 53.0, 104.0, 113.0, 121.0, 126.0, 109.0, 62.0, 80.0, 52.0, 30.0, 18.0, 12.0, 2.0, 1.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.582845687866211, -3.4714548587799072, -3.3600640296936035, -3.2486732006073, -3.137282371520996, -3.0258915424346924, -2.9145007133483887, -2.803109884262085, -2.6917190551757812, -2.5803282260894775, -2.468937397003174, -2.35754656791687, -2.2461557388305664, -2.1347649097442627, -2.023374080657959, -1.9119832515716553, -1.8005925416946411, -1.6892017126083374, -1.5778108835220337, -1.46642005443573, -1.3550292253494263, -1.243638515472412, -1.1322476863861084, -1.0208568572998047, -0.9094659686088562, -0.7980751395225525, -0.6866843104362488, -0.5752935409545898, -0.46390268206596375, -0.3525118827819824, -0.2411210536956787, -0.129730224609375, -0.01833939552307129, 0.09305142611265182, 0.20444224774837494, 0.31583306193351746, 0.42722389101982117, 0.5386146903038025, 0.6500055193901062, 0.7613963484764099, 0.8727871775627136, 0.9841780066490173, 1.0955687761306763, 1.20695960521698, 1.3183504343032837, 1.4297412633895874, 1.5411320924758911, 1.6525229215621948, 1.7639137506484985, 1.8753045797348022, 1.986695408821106, 2.09808611869812, 2.209476947784424, 2.3208677768707275, 2.4322586059570312, 2.543649435043335, 2.6550402641296387, 2.7664310932159424, 2.877821922302246, 2.98921275138855, 3.1006035804748535, 3.2119944095611572, 3.323385238647461, 3.4347760677337646, 3.5461668968200684]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 11.0, 11.0, 10.0, 30.0, 34.0, 22.0, 15.0, 31.0, 39.0, 26.0, 42.0, 47.0, 45.0, 45.0, 35.0, 45.0, 48.0, 51.0, 45.0, 40.0, 40.0, 24.0, 31.0, 26.0, 27.0, 31.0, 19.0, 16.0, 11.0, 16.0, 8.0, 15.0, 8.0, 5.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.2001447677612305, -2.1328296661376953, -2.0655148029327393, -1.998199701309204, -1.9308847188949585, -1.863569736480713, -1.7962547540664673, -1.7289397716522217, -1.6616246700286865, -1.594309687614441, -1.5269947052001953, -1.4596796035766602, -1.3923646211624146, -1.325049638748169, -1.2577346563339233, -1.1904196739196777, -1.1231046915054321, -1.0557897090911865, -0.9884746670722961, -0.9211596846580505, -0.8538446426391602, -0.7865296602249146, -0.719214677810669, -0.6518996953964233, -0.584584653377533, -0.5172696709632874, -0.449954628944397, -0.38263964653015137, -0.3153246343135834, -0.24800962209701538, -0.18069463968276978, -0.11337962746620178, -0.04606461524963379, 0.021250389516353607, 0.088565394282341, 0.1558803915977478, 0.2231954038143158, 0.2905104160308838, 0.3578253984451294, 0.4251404106616974, 0.4924554228782654, 0.559770405292511, 0.6270854473114014, 0.694400429725647, 0.7617154121398926, 0.829030454158783, 0.8963454365730286, 0.963660478591919, 1.0309754610061646, 1.0982904434204102, 1.1656054258346558, 1.2329204082489014, 1.3002355098724365, 1.3675504922866821, 1.4348654747009277, 1.5021804571151733, 1.569495439529419, 1.6368104219436646, 1.7041254043579102, 1.7714405059814453, 1.838755488395691, 1.9060704708099365, 1.9733854532241821, 2.0407004356384277, 2.108015537261963]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 9.0, 15.0, 30.0, 37.0, 65.0, 88.0, 161.0, 396.0, 988.0, 2940.0, 13000.0, 85044.0, 560428.0, 334392.0, 40249.0, 7405.0, 1986.0, 676.0, 278.0, 151.0, 80.0, 36.0, 33.0, 11.0, 13.0, 10.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.609375, -5.464874267578125, -5.32037353515625, -5.175872802734375, -5.0313720703125, -4.886871337890625, -4.74237060546875, -4.597869873046875, -4.453369140625, -4.308868408203125, -4.16436767578125, -4.019866943359375, -3.8753662109375, -3.730865478515625, -3.58636474609375, -3.441864013671875, -3.29736328125, -3.152862548828125, -3.00836181640625, -2.863861083984375, -2.7193603515625, -2.574859619140625, -2.43035888671875, -2.285858154296875, -2.141357421875, -1.996856689453125, -1.85235595703125, -1.707855224609375, -1.5633544921875, -1.418853759765625, -1.27435302734375, -1.129852294921875, -0.9853515625, -0.840850830078125, -0.69635009765625, -0.551849365234375, -0.4073486328125, -0.262847900390625, -0.11834716796875, 0.026153564453125, 0.170654296875, 0.315155029296875, 0.45965576171875, 0.604156494140625, 0.7486572265625, 0.893157958984375, 1.03765869140625, 1.182159423828125, 1.32666015625, 1.471160888671875, 1.61566162109375, 1.760162353515625, 1.9046630859375, 2.049163818359375, 2.19366455078125, 2.338165283203125, 2.482666015625, 2.627166748046875, 2.77166748046875, 2.916168212890625, 3.0606689453125, 3.205169677734375, 3.34967041015625, 3.494171142578125, 3.638671875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 10.0, 12.0, 17.0, 13.0, 27.0, 43.0, 32.0, 52.0, 71.0, 65.0, 73.0, 80.0, 85.0, 77.0, 51.0, 48.0, 44.0, 38.0, 29.0, 26.0, 18.0, 13.0, 15.0, 11.0, 13.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.617828369140625, -1.55987548828125, -1.501922607421875, -1.4439697265625, -1.386016845703125, -1.32806396484375, -1.270111083984375, -1.212158203125, -1.154205322265625, -1.09625244140625, -1.038299560546875, -0.9803466796875, -0.922393798828125, -0.86444091796875, -0.806488037109375, -0.74853515625, -0.690582275390625, -0.63262939453125, -0.574676513671875, -0.5167236328125, -0.458770751953125, -0.40081787109375, -0.342864990234375, -0.284912109375, -0.226959228515625, -0.16900634765625, -0.111053466796875, -0.0531005859375, 0.004852294921875, 0.06280517578125, 0.120758056640625, 0.1787109375, 0.236663818359375, 0.29461669921875, 0.352569580078125, 0.4105224609375, 0.468475341796875, 0.52642822265625, 0.584381103515625, 0.642333984375, 0.700286865234375, 0.75823974609375, 0.816192626953125, 0.8741455078125, 0.932098388671875, 0.99005126953125, 1.048004150390625, 1.10595703125, 1.163909912109375, 1.22186279296875, 1.279815673828125, 1.3377685546875, 1.395721435546875, 1.45367431640625, 1.511627197265625, 1.569580078125, 1.627532958984375, 1.68548583984375, 1.743438720703125, 1.8013916015625, 1.859344482421875, 1.91729736328125, 1.975250244140625, 2.033203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 19.0, 23.0, 47.0, 69.0, 130.0, 316.0, 877.0, 3967.0, 92608.0, 927678.0, 19592.0, 2136.0, 585.0, 234.0, 102.0, 53.0, 36.0, 12.0, 22.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.2625732421875, -7.892333984375, -7.5220947265625, -7.15185546875, -6.7816162109375, -6.411376953125, -6.0411376953125, -5.6708984375, -5.3006591796875, -4.930419921875, -4.5601806640625, -4.18994140625, -3.8197021484375, -3.449462890625, -3.0792236328125, -2.708984375, -2.3387451171875, -1.968505859375, -1.5982666015625, -1.22802734375, -0.8577880859375, -0.487548828125, -0.1173095703125, 0.2529296875, 0.6231689453125, 0.993408203125, 1.3636474609375, 1.73388671875, 2.1041259765625, 2.474365234375, 2.8446044921875, 3.21484375, 3.5850830078125, 3.955322265625, 4.3255615234375, 4.69580078125, 5.0660400390625, 5.436279296875, 5.8065185546875, 6.1767578125, 6.5469970703125, 6.917236328125, 7.2874755859375, 7.65771484375, 8.0279541015625, 8.398193359375, 8.7684326171875, 9.138671875, 9.5089111328125, 9.879150390625, 10.2493896484375, 10.61962890625, 10.9898681640625, 11.360107421875, 11.7303466796875, 12.1005859375, 12.4708251953125, 12.841064453125, 13.2113037109375, 13.58154296875, 13.9517822265625, 14.322021484375, 14.6922607421875, 15.0625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 6.0, 9.0, 19.0, 15.0, 21.0, 31.0, 36.0, 47.0, 49.0, 50.0, 49.0, 72.0, 66.0, 59.0, 59.0, 64.0, 54.0, 45.0, 46.0, 41.0, 28.0, 23.0, 19.0, 19.0, 12.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.47515869140625, -7.1885986328125, -6.90203857421875, -6.615478515625, -6.32891845703125, -6.0423583984375, -5.75579833984375, -5.46923828125, -5.18267822265625, -4.8961181640625, -4.60955810546875, -4.322998046875, -4.03643798828125, -3.7498779296875, -3.46331787109375, -3.1767578125, -2.89019775390625, -2.6036376953125, -2.31707763671875, -2.030517578125, -1.74395751953125, -1.4573974609375, -1.17083740234375, -0.88427734375, -0.59771728515625, -0.3111572265625, -0.02459716796875, 0.261962890625, 0.54852294921875, 0.8350830078125, 1.12164306640625, 1.408203125, 1.69476318359375, 1.9813232421875, 2.26788330078125, 2.554443359375, 2.84100341796875, 3.1275634765625, 3.41412353515625, 3.70068359375, 3.98724365234375, 4.2738037109375, 4.56036376953125, 4.846923828125, 5.13348388671875, 5.4200439453125, 5.70660400390625, 5.9931640625, 6.27972412109375, 6.5662841796875, 6.85284423828125, 7.139404296875, 7.42596435546875, 7.7125244140625, 7.99908447265625, 8.28564453125, 8.57220458984375, 8.8587646484375, 9.14532470703125, 9.431884765625, 9.71844482421875, 10.0050048828125, 10.29156494140625, 10.578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 22.0, 17.0, 40.0, 82.0, 121.0, 287.0, 898.0, 4652.0, 652479.0, 384743.0, 3880.0, 749.0, 257.0, 94.0, 70.0, 39.0, 28.0, 13.0, 17.0, 10.0, 8.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.09912109375, -7.8857421875, -7.67236328125, -7.458984375, -7.24560546875, -7.0322265625, -6.81884765625, -6.60546875, -6.39208984375, -6.1787109375, -5.96533203125, -5.751953125, -5.53857421875, -5.3251953125, -5.11181640625, -4.8984375, -4.68505859375, -4.4716796875, -4.25830078125, -4.044921875, -3.83154296875, -3.6181640625, -3.40478515625, -3.19140625, -2.97802734375, -2.7646484375, -2.55126953125, -2.337890625, -2.12451171875, -1.9111328125, -1.69775390625, -1.484375, -1.27099609375, -1.0576171875, -0.84423828125, -0.630859375, -0.41748046875, -0.2041015625, 0.00927734375, 0.22265625, 0.43603515625, 0.6494140625, 0.86279296875, 1.076171875, 1.28955078125, 1.5029296875, 1.71630859375, 1.9296875, 2.14306640625, 2.3564453125, 2.56982421875, 2.783203125, 2.99658203125, 3.2099609375, 3.42333984375, 3.63671875, 3.85009765625, 4.0634765625, 4.27685546875, 4.490234375, 4.70361328125, 4.9169921875, 5.13037109375, 5.34375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 15.0, 30.0, 63.0, 103.0, 175.0, 202.0, 178.0, 116.0, 49.0, 30.0, 16.0, 11.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002694129943847656, -0.0002508088946342468, -0.00023220479488372803, -0.00021360069513320923, -0.00019499659538269043, -0.00017639249563217163, -0.00015778839588165283, -0.00013918429613113403, -0.00012058019638061523, -0.00010197609663009644, -8.337199687957764e-05, -6.476789712905884e-05, -4.616379737854004e-05, -2.755969762802124e-05, -8.955597877502441e-06, 9.648501873016357e-06, 2.8252601623535156e-05, 4.6856701374053955e-05, 6.546080112457275e-05, 8.406490087509155e-05, 0.00010266900062561035, 0.00012127310037612915, 0.00013987720012664795, 0.00015848129987716675, 0.00017708539962768555, 0.00019568949937820435, 0.00021429359912872314, 0.00023289769887924194, 0.00025150179862976074, 0.00027010589838027954, 0.00028870999813079834, 0.00030731409788131714, 0.00032591819763183594, 0.00034452229738235474, 0.00036312639713287354, 0.00038173049688339233, 0.00040033459663391113, 0.00041893869638442993, 0.00043754279613494873, 0.00045614689588546753, 0.00047475099563598633, 0.0004933550953865051, 0.0005119591951370239, 0.0005305632948875427, 0.0005491673946380615, 0.0005677714943885803, 0.0005863755941390991, 0.0006049796938896179, 0.0006235837936401367, 0.0006421878933906555, 0.0006607919931411743, 0.0006793960928916931, 0.0006980001926422119, 0.0007166042923927307, 0.0007352083921432495, 0.0007538124918937683, 0.0007724165916442871, 0.0007910206913948059, 0.0008096247911453247, 0.0008282288908958435, 0.0008468329906463623, 0.0008654370903968811, 0.0008840411901473999, 0.0009026452898979187, 0.0009212493896484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 10.0, 12.0, 22.0, 28.0, 66.0, 163.0, 438.0, 1641.0, 13122.0, 894398.0, 133081.0, 4216.0, 848.0, 274.0, 100.0, 47.0, 32.0, 14.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.03125, -4.87286376953125, -4.7144775390625, -4.55609130859375, -4.397705078125, -4.23931884765625, -4.0809326171875, -3.92254638671875, -3.76416015625, -3.60577392578125, -3.4473876953125, -3.28900146484375, -3.130615234375, -2.97222900390625, -2.8138427734375, -2.65545654296875, -2.4970703125, -2.33868408203125, -2.1802978515625, -2.02191162109375, -1.863525390625, -1.70513916015625, -1.5467529296875, -1.38836669921875, -1.22998046875, -1.07159423828125, -0.9132080078125, -0.75482177734375, -0.596435546875, -0.43804931640625, -0.2796630859375, -0.12127685546875, 0.037109375, 0.19549560546875, 0.3538818359375, 0.51226806640625, 0.670654296875, 0.82904052734375, 0.9874267578125, 1.14581298828125, 1.30419921875, 1.46258544921875, 1.6209716796875, 1.77935791015625, 1.937744140625, 2.09613037109375, 2.2545166015625, 2.41290283203125, 2.5712890625, 2.72967529296875, 2.8880615234375, 3.04644775390625, 3.204833984375, 3.36322021484375, 3.5216064453125, 3.67999267578125, 3.83837890625, 3.99676513671875, 4.1551513671875, 4.31353759765625, 4.471923828125, 4.63031005859375, 4.7886962890625, 4.94708251953125, 5.10546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 17.0, 31.0, 88.0, 190.0, 263.0, 209.0, 100.0, 38.0, 22.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.6695556640625, -6.487548828125, -6.3055419921875, -6.12353515625, -5.9415283203125, -5.759521484375, -5.5775146484375, -5.3955078125, -5.2135009765625, -5.031494140625, -4.8494873046875, -4.66748046875, -4.4854736328125, -4.303466796875, -4.1214599609375, -3.939453125, -3.7574462890625, -3.575439453125, -3.3934326171875, -3.21142578125, -3.0294189453125, -2.847412109375, -2.6654052734375, -2.4833984375, -2.3013916015625, -2.119384765625, -1.9373779296875, -1.75537109375, -1.5733642578125, -1.391357421875, -1.2093505859375, -1.02734375, -0.8453369140625, -0.663330078125, -0.4813232421875, -0.29931640625, -0.1173095703125, 0.064697265625, 0.2467041015625, 0.4287109375, 0.6107177734375, 0.792724609375, 0.9747314453125, 1.15673828125, 1.3387451171875, 1.520751953125, 1.7027587890625, 1.884765625, 2.0667724609375, 2.248779296875, 2.4307861328125, 2.61279296875, 2.7947998046875, 2.976806640625, 3.1588134765625, 3.3408203125, 3.5228271484375, 3.704833984375, 3.8868408203125, 4.06884765625, 4.2508544921875, 4.432861328125, 4.6148681640625, 4.796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 12.0, 36.0, 59.0, 97.0, 177.0, 243.0, 186.0, 84.0, 51.0, 25.0, 13.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.23371887207031, -74.42720794677734, -72.6207046508789, -70.81419372558594, -69.00768280029297, -67.201171875, -65.39466857910156, -63.588157653808594, -61.78165054321289, -59.97514343261719, -58.16863250732422, -56.362125396728516, -54.55561828613281, -52.749107360839844, -50.94260025024414, -49.13609313964844, -47.32958221435547, -45.523075103759766, -43.7165641784668, -41.910057067871094, -40.103546142578125, -38.29703903198242, -36.49053192138672, -34.68402099609375, -32.87751388549805, -31.07100486755371, -29.264495849609375, -27.457988739013672, -25.651479721069336, -23.844970703125, -22.038463592529297, -20.23195457458496, -18.42544937133789, -16.618940353393555, -14.812432289123535, -13.005924224853516, -11.19941520690918, -9.392906188964844, -7.586398124694824, -5.779890060424805, -3.9733810424804688, -2.166872501373291, -0.3603639602661133, 1.4461445808410645, 3.252653121948242, 5.059162139892578, 6.865670204162598, 8.672178268432617, 10.478687286376953, 12.285196304321289, 14.091704368591309, 15.898212432861328, 17.704721450805664, 19.51123046875, 21.317737579345703, 23.12424659729004, 24.930755615234375, 26.73726463317871, 28.543773651123047, 30.35028076171875, 32.15679168701172, 33.96329879760742, 35.769805908203125, 37.576316833496094, 39.3828239440918]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 12.0, 9.0, 11.0, 9.0, 17.0, 26.0, 27.0, 30.0, 45.0, 29.0, 38.0, 49.0, 63.0, 49.0, 51.0, 61.0, 60.0, 61.0, 52.0, 36.0, 58.0, 42.0, 34.0, 30.0, 23.0, 13.0, 11.0, 9.0, 7.0, 8.0, 9.0, 7.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4068603515625, -33.26789474487305, -32.12893295288086, -30.98996925354004, -29.85100555419922, -28.7120418548584, -27.573078155517578, -26.434112548828125, -25.295150756835938, -24.156187057495117, -23.017223358154297, -21.878259658813477, -20.739295959472656, -19.600332260131836, -18.461368560791016, -17.322402954101562, -16.183439254760742, -15.044475555419922, -13.905511856079102, -12.766548156738281, -11.627584457397461, -10.48862075805664, -9.349656105041504, -8.210692405700684, -7.071728706359863, -5.932765007019043, -4.793801307678223, -3.654837131500244, -2.515873432159424, -1.3769097328186035, -0.237945556640625, 0.9010181427001953, 2.0399818420410156, 3.178945541381836, 4.317909240722656, 5.456873416900635, 6.595837116241455, 7.734800815582275, 8.873764991760254, 10.012728691101074, 11.151692390441895, 12.290656089782715, 13.429619789123535, 14.568584442138672, 15.707548141479492, 16.846511840820312, 17.985475540161133, 19.124439239501953, 20.263402938842773, 21.402366638183594, 22.541330337524414, 23.680294036865234, 24.819257736206055, 25.958221435546875, 27.097187042236328, 28.236148834228516, 29.37511444091797, 30.51407814025879, 31.65304183959961, 32.79200744628906, 33.93096923828125, 35.0699348449707, 36.20889663696289, 37.347862243652344, 38.48682403564453]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 16.0, 14.0, 28.0, 33.0, 61.0, 110.0, 199.0, 306.0, 721.0, 1795.0, 6032.0, 40089.0, 4079566.0, 54272.0, 7287.0, 2053.0, 824.0, 362.0, 214.0, 108.0, 67.0, 51.0, 22.0, 13.0, 8.0, 9.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.13116455078125, -5.8912353515625, -5.65130615234375, -5.411376953125, -5.17144775390625, -4.9315185546875, -4.69158935546875, -4.45166015625, -4.21173095703125, -3.9718017578125, -3.73187255859375, -3.491943359375, -3.25201416015625, -3.0120849609375, -2.77215576171875, -2.5322265625, -2.29229736328125, -2.0523681640625, -1.81243896484375, -1.572509765625, -1.33258056640625, -1.0926513671875, -0.85272216796875, -0.61279296875, -0.37286376953125, -0.1329345703125, 0.10699462890625, 0.346923828125, 0.58685302734375, 0.8267822265625, 1.06671142578125, 1.306640625, 1.54656982421875, 1.7864990234375, 2.02642822265625, 2.266357421875, 2.50628662109375, 2.7462158203125, 2.98614501953125, 3.22607421875, 3.46600341796875, 3.7059326171875, 3.94586181640625, 4.185791015625, 4.42572021484375, 4.6656494140625, 4.90557861328125, 5.1455078125, 5.38543701171875, 5.6253662109375, 5.86529541015625, 6.105224609375, 6.34515380859375, 6.5850830078125, 6.82501220703125, 7.06494140625, 7.30487060546875, 7.5447998046875, 7.78472900390625, 8.024658203125, 8.26458740234375, 8.5045166015625, 8.74444580078125, 8.984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 8.0, 8.0, 22.0, 27.0, 24.0, 33.0, 53.0, 87.0, 73.0, 92.0, 93.0, 86.0, 76.0, 66.0, 49.0, 47.0, 33.0, 32.0, 16.0, 13.0, 9.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.548828125, -2.47540283203125, -2.4019775390625, -2.32855224609375, -2.255126953125, -2.18170166015625, -2.1082763671875, -2.03485107421875, -1.96142578125, -1.88800048828125, -1.8145751953125, -1.74114990234375, -1.667724609375, -1.59429931640625, -1.5208740234375, -1.44744873046875, -1.3740234375, -1.30059814453125, -1.2271728515625, -1.15374755859375, -1.080322265625, -1.00689697265625, -0.9334716796875, -0.86004638671875, -0.78662109375, -0.71319580078125, -0.6397705078125, -0.56634521484375, -0.492919921875, -0.41949462890625, -0.3460693359375, -0.27264404296875, -0.19921875, -0.12579345703125, -0.0523681640625, 0.02105712890625, 0.094482421875, 0.16790771484375, 0.2413330078125, 0.31475830078125, 0.38818359375, 0.46160888671875, 0.5350341796875, 0.60845947265625, 0.681884765625, 0.75531005859375, 0.8287353515625, 0.90216064453125, 0.9755859375, 1.04901123046875, 1.1224365234375, 1.19586181640625, 1.269287109375, 1.34271240234375, 1.4161376953125, 1.48956298828125, 1.56298828125, 1.63641357421875, 1.7098388671875, 1.78326416015625, 1.856689453125, 1.93011474609375, 2.0035400390625, 2.07696533203125, 2.150390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 7.0, 2.0, 6.0, 9.0, 20.0, 27.0, 43.0, 66.0, 88.0, 139.0, 256.0, 476.0, 884.0, 2070.0, 5240.0, 17880.0, 109281.0, 3922819.0, 108001.0, 17780.0, 5268.0, 1965.0, 875.0, 435.0, 241.0, 116.0, 108.0, 58.0, 54.0, 23.0, 23.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.233245849609375, -3.08953857421875, -2.945831298828125, -2.8021240234375, -2.658416748046875, -2.51470947265625, -2.371002197265625, -2.227294921875, -2.083587646484375, -1.93988037109375, -1.796173095703125, -1.6524658203125, -1.508758544921875, -1.36505126953125, -1.221343994140625, -1.07763671875, -0.933929443359375, -0.79022216796875, -0.646514892578125, -0.5028076171875, -0.359100341796875, -0.21539306640625, -0.071685791015625, 0.072021484375, 0.215728759765625, 0.35943603515625, 0.503143310546875, 0.6468505859375, 0.790557861328125, 0.93426513671875, 1.077972412109375, 1.2216796875, 1.365386962890625, 1.50909423828125, 1.652801513671875, 1.7965087890625, 1.940216064453125, 2.08392333984375, 2.227630615234375, 2.371337890625, 2.515045166015625, 2.65875244140625, 2.802459716796875, 2.9461669921875, 3.089874267578125, 3.23358154296875, 3.377288818359375, 3.52099609375, 3.664703369140625, 3.80841064453125, 3.952117919921875, 4.0958251953125, 4.239532470703125, 4.38323974609375, 4.526947021484375, 4.670654296875, 4.814361572265625, 4.95806884765625, 5.101776123046875, 5.2454833984375, 5.389190673828125, 5.53289794921875, 5.676605224609375, 5.8203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 10.0, 14.0, 10.0, 30.0, 64.0, 151.0, 3050.0, 544.0, 109.0, 43.0, 17.0, 18.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23828125, -1.184173583984375, -1.13006591796875, -1.075958251953125, -1.0218505859375, -0.967742919921875, -0.91363525390625, -0.859527587890625, -0.805419921875, -0.751312255859375, -0.69720458984375, -0.643096923828125, -0.5889892578125, -0.534881591796875, -0.48077392578125, -0.426666259765625, -0.37255859375, -0.318450927734375, -0.26434326171875, -0.210235595703125, -0.1561279296875, -0.102020263671875, -0.04791259765625, 0.006195068359375, 0.060302734375, 0.114410400390625, 0.16851806640625, 0.222625732421875, 0.2767333984375, 0.330841064453125, 0.38494873046875, 0.439056396484375, 0.4931640625, 0.547271728515625, 0.60137939453125, 0.655487060546875, 0.7095947265625, 0.763702392578125, 0.81781005859375, 0.871917724609375, 0.926025390625, 0.980133056640625, 1.03424072265625, 1.088348388671875, 1.1424560546875, 1.196563720703125, 1.25067138671875, 1.304779052734375, 1.35888671875, 1.412994384765625, 1.46710205078125, 1.521209716796875, 1.5753173828125, 1.629425048828125, 1.68353271484375, 1.737640380859375, 1.791748046875, 1.845855712890625, 1.89996337890625, 1.954071044921875, 2.0081787109375, 2.062286376953125, 2.11639404296875, 2.170501708984375, 2.224609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 14.0, 18.0, 68.0, 198.0, 275.0, 262.0, 115.0, 37.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0846452713012695, -3.776580810546875, -3.4685165882110596, -3.160452365875244, -2.8523879051208496, -2.544323444366455, -2.2362592220306396, -1.9281949996948242, -1.6201305389404297, -1.3120661973953247, -1.0040018558502197, -0.6959375143051147, -0.38787317276000977, -0.07980883121490479, 0.2282555103302002, 0.5363197326660156, 0.8443841934204102, 1.1524485349655151, 1.4605128765106201, 1.768577218055725, 2.07664155960083, 2.3847060203552246, 2.69277024269104, 3.0008344650268555, 3.30889892578125, 3.6169633865356445, 3.92502760887146, 4.233091831207275, 4.54115629196167, 4.8492207527160645, 5.157284736633301, 5.465349197387695, 5.77341365814209, 6.081478118896484, 6.389542579650879, 6.697606563568115, 7.00567102432251, 7.313735485076904, 7.621799468994141, 7.929863929748535, 8.23792839050293, 8.545992851257324, 8.854057312011719, 9.162121772766113, 9.470186233520508, 9.778249740600586, 10.08631420135498, 10.394378662109375, 10.70244312286377, 11.010507583618164, 11.318572044372559, 11.626636505126953, 11.934700012207031, 12.242764472961426, 12.55082893371582, 12.858893394470215, 13.16695785522461, 13.475022315979004, 13.783086776733398, 14.091151237487793, 14.399215698242188, 14.707279205322266, 15.01534366607666, 15.323408126831055, 15.63147258758545]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 9.0, 11.0, 10.0, 25.0, 16.0, 18.0, 27.0, 28.0, 36.0, 42.0, 37.0, 47.0, 44.0, 47.0, 51.0, 44.0, 48.0, 46.0, 51.0, 49.0, 45.0, 42.0, 41.0, 32.0, 34.0, 28.0, 19.0, 18.0, 13.0, 12.0, 4.0, 5.0, 11.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.261713743209839, -3.1487832069396973, -3.0358526706695557, -2.922922134399414, -2.8099918365478516, -2.697061061859131, -2.5841307640075684, -2.4712002277374268, -2.358269691467285, -2.2453391551971436, -2.132408618927002, -2.0194780826568604, -1.9065476655960083, -1.7936171293258667, -1.6806867122650146, -1.567756175994873, -1.4548256397247314, -1.3418951034545898, -1.2289645671844482, -1.1160341501235962, -1.0031036138534546, -0.890173077583313, -0.7772426009178162, -0.6643121242523193, -0.5513815879821777, -0.4384510815143585, -0.3255205750465393, -0.2125900685787201, -0.09965956211090088, 0.013270974159240723, 0.12620145082473755, 0.23913192749023438, 0.3520627021789551, 0.4649932086467743, 0.5779237151145935, 0.6908541917800903, 0.8037847280502319, 0.9167152643203735, 1.0296456813812256, 1.1425762176513672, 1.2555067539215088, 1.3684372901916504, 1.481367826461792, 1.594298243522644, 1.7072287797927856, 1.8201593160629272, 1.9330897331237793, 2.046020269393921, 2.1589508056640625, 2.271881341934204, 2.3848118782043457, 2.4977424144744873, 2.610672950744629, 2.7236032485961914, 2.836533784866333, 2.9494643211364746, 3.062394857406616, 3.175325393676758, 3.2882559299468994, 3.401186466217041, 3.5141167640686035, 3.627047538757324, 3.7399778366088867, 3.8529083728790283, 3.96583890914917]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 13.0, 16.0, 23.0, 31.0, 52.0, 79.0, 108.0, 172.0, 309.0, 485.0, 942.0, 1885.0, 4112.0, 10213.0, 34057.0, 158143.0, 525334.0, 240357.0, 48698.0, 13765.0, 5011.0, 2135.0, 1101.0, 622.0, 347.0, 186.0, 113.0, 74.0, 40.0, 28.0, 19.0, 18.0, 21.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.96856689453125, -2.8648681640625, -2.76116943359375, -2.657470703125, -2.55377197265625, -2.4500732421875, -2.34637451171875, -2.24267578125, -2.13897705078125, -2.0352783203125, -1.93157958984375, -1.827880859375, -1.72418212890625, -1.6204833984375, -1.51678466796875, -1.4130859375, -1.30938720703125, -1.2056884765625, -1.10198974609375, -0.998291015625, -0.89459228515625, -0.7908935546875, -0.68719482421875, -0.58349609375, -0.47979736328125, -0.3760986328125, -0.27239990234375, -0.168701171875, -0.06500244140625, 0.0386962890625, 0.14239501953125, 0.24609375, 0.34979248046875, 0.4534912109375, 0.55718994140625, 0.660888671875, 0.76458740234375, 0.8682861328125, 0.97198486328125, 1.07568359375, 1.17938232421875, 1.2830810546875, 1.38677978515625, 1.490478515625, 1.59417724609375, 1.6978759765625, 1.80157470703125, 1.9052734375, 2.00897216796875, 2.1126708984375, 2.21636962890625, 2.320068359375, 2.42376708984375, 2.5274658203125, 2.63116455078125, 2.73486328125, 2.83856201171875, 2.9422607421875, 3.04595947265625, 3.149658203125, 3.25335693359375, 3.3570556640625, 3.46075439453125, 3.564453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 18.0, 24.0, 20.0, 60.0, 53.0, 60.0, 92.0, 87.0, 78.0, 81.0, 90.0, 64.0, 49.0, 48.0, 29.0, 29.0, 27.0, 13.0, 15.0, 4.0, 6.0, 4.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.845703125, -2.7723388671875, -2.698974609375, -2.6256103515625, -2.55224609375, -2.4788818359375, -2.405517578125, -2.3321533203125, -2.2587890625, -2.1854248046875, -2.112060546875, -2.0386962890625, -1.96533203125, -1.8919677734375, -1.818603515625, -1.7452392578125, -1.671875, -1.5985107421875, -1.525146484375, -1.4517822265625, -1.37841796875, -1.3050537109375, -1.231689453125, -1.1583251953125, -1.0849609375, -1.0115966796875, -0.938232421875, -0.8648681640625, -0.79150390625, -0.7181396484375, -0.644775390625, -0.5714111328125, -0.498046875, -0.4246826171875, -0.351318359375, -0.2779541015625, -0.20458984375, -0.1312255859375, -0.057861328125, 0.0155029296875, 0.0888671875, 0.1622314453125, 0.235595703125, 0.3089599609375, 0.38232421875, 0.4556884765625, 0.529052734375, 0.6024169921875, 0.67578125, 0.7491455078125, 0.822509765625, 0.8958740234375, 0.96923828125, 1.0426025390625, 1.115966796875, 1.1893310546875, 1.2626953125, 1.3360595703125, 1.409423828125, 1.4827880859375, 1.55615234375, 1.6295166015625, 1.702880859375, 1.7762451171875, 1.849609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 8.0, 7.0, 11.0, 8.0, 25.0, 31.0, 38.0, 60.0, 108.0, 179.0, 421.0, 790.0, 2068.0, 8922.0, 231880.0, 774910.0, 23562.0, 3199.0, 1143.0, 525.0, 284.0, 142.0, 92.0, 39.0, 37.0, 17.0, 12.0, 8.0, 7.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.35504150390625, -6.1124267578125, -5.86981201171875, -5.627197265625, -5.38458251953125, -5.1419677734375, -4.89935302734375, -4.65673828125, -4.41412353515625, -4.1715087890625, -3.92889404296875, -3.686279296875, -3.44366455078125, -3.2010498046875, -2.95843505859375, -2.7158203125, -2.47320556640625, -2.2305908203125, -1.98797607421875, -1.745361328125, -1.50274658203125, -1.2601318359375, -1.01751708984375, -0.77490234375, -0.53228759765625, -0.2896728515625, -0.04705810546875, 0.195556640625, 0.43817138671875, 0.6807861328125, 0.92340087890625, 1.166015625, 1.40863037109375, 1.6512451171875, 1.89385986328125, 2.136474609375, 2.37908935546875, 2.6217041015625, 2.86431884765625, 3.10693359375, 3.34954833984375, 3.5921630859375, 3.83477783203125, 4.077392578125, 4.32000732421875, 4.5626220703125, 4.80523681640625, 5.0478515625, 5.29046630859375, 5.5330810546875, 5.77569580078125, 6.018310546875, 6.26092529296875, 6.5035400390625, 6.74615478515625, 6.98876953125, 7.23138427734375, 7.4739990234375, 7.71661376953125, 7.959228515625, 8.20184326171875, 8.4444580078125, 8.68707275390625, 8.9296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 10.0, 12.0, 16.0, 10.0, 24.0, 31.0, 30.0, 23.0, 44.0, 50.0, 48.0, 43.0, 46.0, 44.0, 58.0, 54.0, 52.0, 49.0, 53.0, 43.0, 47.0, 32.0, 33.0, 27.0, 20.0, 17.0, 16.0, 15.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.28228759765625, -6.0372314453125, -5.79217529296875, -5.547119140625, -5.30206298828125, -5.0570068359375, -4.81195068359375, -4.56689453125, -4.32183837890625, -4.0767822265625, -3.83172607421875, -3.586669921875, -3.34161376953125, -3.0965576171875, -2.85150146484375, -2.6064453125, -2.36138916015625, -2.1163330078125, -1.87127685546875, -1.626220703125, -1.38116455078125, -1.1361083984375, -0.89105224609375, -0.64599609375, -0.40093994140625, -0.1558837890625, 0.08917236328125, 0.334228515625, 0.57928466796875, 0.8243408203125, 1.06939697265625, 1.314453125, 1.55950927734375, 1.8045654296875, 2.04962158203125, 2.294677734375, 2.53973388671875, 2.7847900390625, 3.02984619140625, 3.27490234375, 3.51995849609375, 3.7650146484375, 4.01007080078125, 4.255126953125, 4.50018310546875, 4.7452392578125, 4.99029541015625, 5.2353515625, 5.48040771484375, 5.7254638671875, 5.97052001953125, 6.215576171875, 6.46063232421875, 6.7056884765625, 6.95074462890625, 7.19580078125, 7.44085693359375, 7.6859130859375, 7.93096923828125, 8.176025390625, 8.42108154296875, 8.6661376953125, 8.91119384765625, 9.15625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 17.0, 13.0, 15.0, 40.0, 51.0, 96.0, 154.0, 367.0, 913.0, 3843.0, 94127.0, 927382.0, 18261.0, 2056.0, 593.0, 284.0, 126.0, 66.0, 49.0, 35.0, 11.0, 9.0, 7.0, 12.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.59619140625, -3.4541015625, -3.31201171875, -3.169921875, -3.02783203125, -2.8857421875, -2.74365234375, -2.6015625, -2.45947265625, -2.3173828125, -2.17529296875, -2.033203125, -1.89111328125, -1.7490234375, -1.60693359375, -1.46484375, -1.32275390625, -1.1806640625, -1.03857421875, -0.896484375, -0.75439453125, -0.6123046875, -0.47021484375, -0.328125, -0.18603515625, -0.0439453125, 0.09814453125, 0.240234375, 0.38232421875, 0.5244140625, 0.66650390625, 0.80859375, 0.95068359375, 1.0927734375, 1.23486328125, 1.376953125, 1.51904296875, 1.6611328125, 1.80322265625, 1.9453125, 2.08740234375, 2.2294921875, 2.37158203125, 2.513671875, 2.65576171875, 2.7978515625, 2.93994140625, 3.08203125, 3.22412109375, 3.3662109375, 3.50830078125, 3.650390625, 3.79248046875, 3.9345703125, 4.07666015625, 4.21875, 4.36083984375, 4.5029296875, 4.64501953125, 4.787109375, 4.92919921875, 5.0712890625, 5.21337890625, 5.35546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 5.0, 6.0, 10.0, 18.0, 34.0, 43.0, 55.0, 71.0, 98.0, 131.0, 124.0, 109.0, 100.0, 68.0, 39.0, 35.0, 19.0, 14.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003714561462402344, -0.0003603249788284302, -0.000349193811416626, -0.0003380626440048218, -0.0003269314765930176, -0.0003158003091812134, -0.0003046691417694092, -0.000293537974357605, -0.0002824068069458008, -0.0002712756395339966, -0.0002601444721221924, -0.0002490133047103882, -0.00023788213729858398, -0.00022675096988677979, -0.00021561980247497559, -0.0002044886350631714, -0.0001933574676513672, -0.000182226300239563, -0.0001710951328277588, -0.0001599639654159546, -0.0001488327980041504, -0.0001377016305923462, -0.000126570463180542, -0.00011543929576873779, -0.0001043081283569336, -9.31769609451294e-05, -8.20457935333252e-05, -7.0914626121521e-05, -5.97834587097168e-05, -4.86522912979126e-05, -3.75211238861084e-05, -2.63899564743042e-05, -1.52587890625e-05, -4.127621650695801e-06, 7.0035457611083984e-06, 1.8134713172912598e-05, 2.9265880584716797e-05, 4.0397047996520996e-05, 5.1528215408325195e-05, 6.26593828201294e-05, 7.37905502319336e-05, 8.492171764373779e-05, 9.605288505554199e-05, 0.00010718405246734619, 0.00011831521987915039, 0.0001294463872909546, 0.0001405775547027588, 0.000151708722114563, 0.0001628398895263672, 0.0001739710569381714, 0.00018510222434997559, 0.00019623339176177979, 0.00020736455917358398, 0.00021849572658538818, 0.00022962689399719238, 0.00024075806140899658, 0.0002518892288208008, 0.000263020396232605, 0.0002741515636444092, 0.0002852827310562134, 0.0002964138984680176, 0.0003075450658798218, 0.000318676233291626, 0.0003298074007034302, 0.0003409385681152344]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 6.0, 10.0, 9.0, 16.0, 37.0, 82.0, 123.0, 283.0, 760.0, 3164.0, 28410.0, 878062.0, 129031.0, 6349.0, 1384.0, 419.0, 172.0, 90.0, 47.0, 25.0, 18.0, 15.0, 8.0, 3.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.869140625, -3.750823974609375, -3.63250732421875, -3.514190673828125, -3.3958740234375, -3.277557373046875, -3.15924072265625, -3.040924072265625, -2.922607421875, -2.804290771484375, -2.68597412109375, -2.567657470703125, -2.4493408203125, -2.331024169921875, -2.21270751953125, -2.094390869140625, -1.97607421875, -1.857757568359375, -1.73944091796875, -1.621124267578125, -1.5028076171875, -1.384490966796875, -1.26617431640625, -1.147857666015625, -1.029541015625, -0.911224365234375, -0.79290771484375, -0.674591064453125, -0.5562744140625, -0.437957763671875, -0.31964111328125, -0.201324462890625, -0.0830078125, 0.035308837890625, 0.15362548828125, 0.271942138671875, 0.3902587890625, 0.508575439453125, 0.62689208984375, 0.745208740234375, 0.863525390625, 0.981842041015625, 1.10015869140625, 1.218475341796875, 1.3367919921875, 1.455108642578125, 1.57342529296875, 1.691741943359375, 1.81005859375, 1.928375244140625, 2.04669189453125, 2.165008544921875, 2.2833251953125, 2.401641845703125, 2.51995849609375, 2.638275146484375, 2.756591796875, 2.874908447265625, 2.99322509765625, 3.111541748046875, 3.2298583984375, 3.348175048828125, 3.46649169921875, 3.584808349609375, 3.703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 15.0, 19.0, 34.0, 57.0, 80.0, 111.0, 121.0, 121.0, 108.0, 89.0, 74.0, 49.0, 35.0, 22.0, 19.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.029296875, -2.9462890625, -2.86328125, -2.7802734375, -2.697265625, -2.6142578125, -2.53125, -2.4482421875, -2.365234375, -2.2822265625, -2.19921875, -2.1162109375, -2.033203125, -1.9501953125, -1.8671875, -1.7841796875, -1.701171875, -1.6181640625, -1.53515625, -1.4521484375, -1.369140625, -1.2861328125, -1.203125, -1.1201171875, -1.037109375, -0.9541015625, -0.87109375, -0.7880859375, -0.705078125, -0.6220703125, -0.5390625, -0.4560546875, -0.373046875, -0.2900390625, -0.20703125, -0.1240234375, -0.041015625, 0.0419921875, 0.125, 0.2080078125, 0.291015625, 0.3740234375, 0.45703125, 0.5400390625, 0.623046875, 0.7060546875, 0.7890625, 0.8720703125, 0.955078125, 1.0380859375, 1.12109375, 1.2041015625, 1.287109375, 1.3701171875, 1.453125, 1.5361328125, 1.619140625, 1.7021484375, 1.78515625, 1.8681640625, 1.951171875, 2.0341796875, 2.1171875, 2.2001953125, 2.283203125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 30.0, 65.0, 170.0, 297.0, 231.0, 124.0, 50.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.95179748535156, -67.0815658569336, -65.21134185791016, -63.34111404418945, -61.47088623046875, -59.60065460205078, -57.73042678833008, -55.860198974609375, -53.98997116088867, -52.11974334716797, -50.249515533447266, -48.37928771972656, -46.509056091308594, -44.638832092285156, -42.76860046386719, -40.898372650146484, -39.02814483642578, -37.15791702270508, -35.287689208984375, -33.41746139526367, -31.547231674194336, -29.677003860473633, -27.806774139404297, -25.936546325683594, -24.06631851196289, -22.196090698242188, -20.325862884521484, -18.45563316345215, -16.585405349731445, -14.715177536010742, -12.844948768615723, -10.974720001220703, -9.104488372802734, -7.234260082244873, -5.364031791687012, -3.4938035011291504, -1.623575210571289, 0.24665260314941406, 2.1168813705444336, 3.987110137939453, 5.857337951660156, 7.727566242218018, 9.597794532775879, 11.468023300170898, 13.338251113891602, 15.208478927612305, 17.07870864868164, 18.948936462402344, 20.819164276123047, 22.68939208984375, 24.559619903564453, 26.42984962463379, 28.300077438354492, 30.170305252075195, 32.04053497314453, 33.910762786865234, 35.78099060058594, 37.65121841430664, 39.521446228027344, 41.39167404174805, 43.26190185546875, 45.13213348388672, 47.00236129760742, 48.872589111328125, 50.74281692504883]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 8.0, 4.0, 7.0, 12.0, 14.0, 26.0, 26.0, 38.0, 34.0, 39.0, 39.0, 44.0, 59.0, 46.0, 54.0, 68.0, 42.0, 43.0, 50.0, 44.0, 42.0, 30.0, 27.0, 30.0, 29.0, 20.0, 19.0, 17.0, 16.0, 13.0, 11.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.26447296142578, -31.31891441345215, -30.373355865478516, -29.427797317504883, -28.48223876953125, -27.53668212890625, -26.591123580932617, -25.645565032958984, -24.70000648498535, -23.75444793701172, -22.808889389038086, -21.863330841064453, -20.917774200439453, -19.972213745117188, -19.026657104492188, -18.081098556518555, -17.135540008544922, -16.18998146057129, -15.244422912597656, -14.29886531829834, -13.353306770324707, -12.407748222351074, -11.462190628051758, -10.516632080078125, -9.571073532104492, -8.62551498413086, -7.679956912994385, -6.73439884185791, -5.788840293884277, -4.8432817459106445, -3.89772367477417, -2.9521656036376953, -2.0066089630126953, -1.0610506534576416, -0.11549234390258789, 0.8300659656524658, 1.7756242752075195, 2.7211828231811523, 3.666740894317627, 4.612298965454102, 5.557857513427734, 6.503416061401367, 7.448974132537842, 8.394532203674316, 9.34009075164795, 10.285649299621582, 11.231206893920898, 12.176765441894531, 13.122323989868164, 14.067882537841797, 15.01344108581543, 15.958998680114746, 16.904556274414062, 17.850116729736328, 18.795673370361328, 19.74123191833496, 20.686790466308594, 21.632349014282227, 22.57790756225586, 23.523466110229492, 24.469024658203125, 25.414581298828125, 26.360139846801758, 27.30569839477539, 28.251256942749023]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 15.0, 19.0, 32.0, 43.0, 79.0, 191.0, 393.0, 1026.0, 3582.0, 23353.0, 3721031.0, 424199.0, 15973.0, 2882.0, 806.0, 304.0, 156.0, 66.0, 45.0, 22.0, 22.0, 18.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.1751708984375, -7.975341796875, -7.7755126953125, -7.57568359375, -7.3758544921875, -7.176025390625, -6.9761962890625, -6.7763671875, -6.5765380859375, -6.376708984375, -6.1768798828125, -5.97705078125, -5.7772216796875, -5.577392578125, -5.3775634765625, -5.177734375, -4.9779052734375, -4.778076171875, -4.5782470703125, -4.37841796875, -4.1785888671875, -3.978759765625, -3.7789306640625, -3.5791015625, -3.3792724609375, -3.179443359375, -2.9796142578125, -2.77978515625, -2.5799560546875, -2.380126953125, -2.1802978515625, -1.98046875, -1.7806396484375, -1.580810546875, -1.3809814453125, -1.18115234375, -0.9813232421875, -0.781494140625, -0.5816650390625, -0.3818359375, -0.1820068359375, 0.017822265625, 0.2176513671875, 0.41748046875, 0.6173095703125, 0.817138671875, 1.0169677734375, 1.216796875, 1.4166259765625, 1.616455078125, 1.8162841796875, 2.01611328125, 2.2159423828125, 2.415771484375, 2.6156005859375, 2.8154296875, 3.0152587890625, 3.215087890625, 3.4149169921875, 3.61474609375, 3.8145751953125, 4.014404296875, 4.2142333984375, 4.4140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 10.0, 8.0, 12.0, 25.0, 31.0, 58.0, 81.0, 136.0, 114.0, 140.0, 119.0, 86.0, 56.0, 43.0, 33.0, 16.0, 10.0, 10.0, 10.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.51953125, -4.417083740234375, -4.31463623046875, -4.212188720703125, -4.1097412109375, -4.007293701171875, -3.90484619140625, -3.802398681640625, -3.699951171875, -3.597503662109375, -3.49505615234375, -3.392608642578125, -3.2901611328125, -3.187713623046875, -3.08526611328125, -2.982818603515625, -2.88037109375, -2.777923583984375, -2.67547607421875, -2.573028564453125, -2.4705810546875, -2.368133544921875, -2.26568603515625, -2.163238525390625, -2.060791015625, -1.958343505859375, -1.85589599609375, -1.753448486328125, -1.6510009765625, -1.548553466796875, -1.44610595703125, -1.343658447265625, -1.2412109375, -1.138763427734375, -1.03631591796875, -0.933868408203125, -0.8314208984375, -0.728973388671875, -0.62652587890625, -0.524078369140625, -0.421630859375, -0.319183349609375, -0.21673583984375, -0.114288330078125, -0.0118408203125, 0.090606689453125, 0.19305419921875, 0.295501708984375, 0.39794921875, 0.500396728515625, 0.60284423828125, 0.705291748046875, 0.8077392578125, 0.910186767578125, 1.01263427734375, 1.115081787109375, 1.217529296875, 1.319976806640625, 1.42242431640625, 1.524871826171875, 1.6273193359375, 1.729766845703125, 1.83221435546875, 1.934661865234375, 2.037109375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 13.0, 11.0, 18.0, 20.0, 28.0, 36.0, 61.0, 71.0, 107.0, 144.0, 213.0, 312.0, 543.0, 868.0, 1618.0, 3484.0, 8492.0, 25932.0, 117199.0, 3296498.0, 639740.0, 68500.0, 17850.0, 6313.0, 2649.0, 1376.0, 743.0, 442.0, 321.0, 178.0, 151.0, 100.0, 74.0, 45.0, 35.0, 31.0, 13.0, 11.0, 9.0, 11.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.310546875, -2.230438232421875, -2.15032958984375, -2.070220947265625, -1.9901123046875, -1.910003662109375, -1.82989501953125, -1.749786376953125, -1.669677734375, -1.589569091796875, -1.50946044921875, -1.429351806640625, -1.3492431640625, -1.269134521484375, -1.18902587890625, -1.108917236328125, -1.02880859375, -0.948699951171875, -0.86859130859375, -0.788482666015625, -0.7083740234375, -0.628265380859375, -0.54815673828125, -0.468048095703125, -0.387939453125, -0.307830810546875, -0.22772216796875, -0.147613525390625, -0.0675048828125, 0.012603759765625, 0.09271240234375, 0.172821044921875, 0.2529296875, 0.333038330078125, 0.41314697265625, 0.493255615234375, 0.5733642578125, 0.653472900390625, 0.73358154296875, 0.813690185546875, 0.893798828125, 0.973907470703125, 1.05401611328125, 1.134124755859375, 1.2142333984375, 1.294342041015625, 1.37445068359375, 1.454559326171875, 1.53466796875, 1.614776611328125, 1.69488525390625, 1.774993896484375, 1.8551025390625, 1.935211181640625, 2.01531982421875, 2.095428466796875, 2.175537109375, 2.255645751953125, 2.33575439453125, 2.415863037109375, 2.4959716796875, 2.576080322265625, 2.65618896484375, 2.736297607421875, 2.81640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 19.0, 21.0, 42.0, 70.0, 176.0, 941.0, 2317.0, 275.0, 103.0, 50.0, 24.0, 16.0, 6.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.765625, -2.68902587890625, -2.6124267578125, -2.53582763671875, -2.459228515625, -2.38262939453125, -2.3060302734375, -2.22943115234375, -2.15283203125, -2.07623291015625, -1.9996337890625, -1.92303466796875, -1.846435546875, -1.76983642578125, -1.6932373046875, -1.61663818359375, -1.5400390625, -1.46343994140625, -1.3868408203125, -1.31024169921875, -1.233642578125, -1.15704345703125, -1.0804443359375, -1.00384521484375, -0.92724609375, -0.85064697265625, -0.7740478515625, -0.69744873046875, -0.620849609375, -0.54425048828125, -0.4676513671875, -0.39105224609375, -0.314453125, -0.23785400390625, -0.1612548828125, -0.08465576171875, -0.008056640625, 0.06854248046875, 0.1451416015625, 0.22174072265625, 0.29833984375, 0.37493896484375, 0.4515380859375, 0.52813720703125, 0.604736328125, 0.68133544921875, 0.7579345703125, 0.83453369140625, 0.9111328125, 0.98773193359375, 1.0643310546875, 1.14093017578125, 1.217529296875, 1.29412841796875, 1.3707275390625, 1.44732666015625, 1.52392578125, 1.60052490234375, 1.6771240234375, 1.75372314453125, 1.830322265625, 1.90692138671875, 1.9835205078125, 2.06011962890625, 2.13671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 8.0, 19.0, 26.0, 43.0, 58.0, 84.0, 126.0, 101.0, 109.0, 100.0, 87.0, 82.0, 44.0, 33.0, 20.0, 14.0, 7.0, 6.0, 6.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.335238456726074, -5.158055305480957, -4.98087215423584, -4.803689002990723, -4.6265058517456055, -4.4493231773376465, -4.272140026092529, -4.094956874847412, -3.917773723602295, -3.7405905723571777, -3.5634074211120605, -3.3862245082855225, -3.2090413570404053, -3.031858205795288, -2.85467529296875, -2.677492141723633, -2.5003089904785156, -2.3231258392333984, -2.1459426879882812, -1.9687597751617432, -1.791576623916626, -1.6143934726715088, -1.4372104406356812, -1.2600274085998535, -1.0828442573547363, -0.9056611657142639, -0.7284780740737915, -0.5512949824333191, -0.3741118907928467, -0.19692879915237427, -0.019745707511901855, 0.15743732452392578, 0.33462047576904297, 0.5118035674095154, 0.6889866590499878, 0.8661697506904602, 1.0433528423309326, 1.2205359935760498, 1.3977190256118774, 1.574902057647705, 1.7520852088928223, 1.9292683601379395, 2.1064515113830566, 2.2836344242095947, 2.460817575454712, 2.638000726699829, 2.815183639526367, 2.9923667907714844, 3.1695499420166016, 3.3467330932617188, 3.523916244506836, 3.701099157333374, 3.878282308578491, 4.055465221405029, 4.2326483726501465, 4.409831523895264, 4.587014675140381, 4.764197826385498, 4.941380977630615, 5.118564128875732, 5.295746803283691, 5.472929954528809, 5.650113105773926, 5.827296257019043, 6.00447940826416]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 19.0, 20.0, 14.0, 16.0, 22.0, 30.0, 30.0, 33.0, 39.0, 50.0, 55.0, 49.0, 74.0, 53.0, 59.0, 45.0, 50.0, 43.0, 56.0, 33.0, 43.0, 31.0, 26.0, 24.0, 18.0, 17.0, 14.0, 10.0, 12.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.105953216552734, -4.934338569641113, -4.76272439956665, -4.591109752655029, -4.419495582580566, -4.247880935668945, -4.076266288757324, -3.9046521186828613, -3.7330377101898193, -3.5614233016967773, -3.3898088932037354, -3.2181944847106934, -3.0465798377990723, -2.8749656677246094, -2.7033510208129883, -2.5317366123199463, -2.3601222038269043, -2.1885077953338623, -2.0168933868408203, -1.8452788591384888, -1.6736644506454468, -1.5020500421524048, -1.3304355144500732, -1.1588211059570312, -0.9872066974639893, -0.8155922889709473, -0.6439778208732605, -0.47236335277557373, -0.30074894428253174, -0.12913453578948975, 0.0424799919128418, 0.2140944004058838, 0.3857088088989258, 0.5573232173919678, 0.7289376854896545, 0.9005521535873413, 1.0721665620803833, 1.2437809705734253, 1.4153954982757568, 1.5870099067687988, 1.7586243152618408, 1.9302387237548828, 2.101853132247925, 2.273467540740967, 2.445082187652588, 2.616696357727051, 2.788311004638672, 2.959925413131714, 3.131539821624756, 3.303154230117798, 3.47476863861084, 3.646383285522461, 3.817997455596924, 3.989612102508545, 4.161226272583008, 4.332840919494629, 4.50445556640625, 4.676070213317871, 4.847684383392334, 5.019299030303955, 5.190913200378418, 5.362527847290039, 5.53414249420166, 5.705756664276123, 5.877370834350586]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 1.0, 5.0, 11.0, 18.0, 24.0, 35.0, 58.0, 91.0, 232.0, 648.0, 2751.0, 29628.0, 826152.0, 179631.0, 7304.0, 1243.0, 354.0, 162.0, 74.0, 46.0, 24.0, 19.0, 16.0, 6.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.5086669921875, -8.212646484375, -7.9166259765625, -7.62060546875, -7.3245849609375, -7.028564453125, -6.7325439453125, -6.4365234375, -6.1405029296875, -5.844482421875, -5.5484619140625, -5.25244140625, -4.9564208984375, -4.660400390625, -4.3643798828125, -4.068359375, -3.7723388671875, -3.476318359375, -3.1802978515625, -2.88427734375, -2.5882568359375, -2.292236328125, -1.9962158203125, -1.7001953125, -1.4041748046875, -1.108154296875, -0.8121337890625, -0.51611328125, -0.2200927734375, 0.075927734375, 0.3719482421875, 0.66796875, 0.9639892578125, 1.260009765625, 1.5560302734375, 1.85205078125, 2.1480712890625, 2.444091796875, 2.7401123046875, 3.0361328125, 3.3321533203125, 3.628173828125, 3.9241943359375, 4.22021484375, 4.5162353515625, 4.812255859375, 5.1082763671875, 5.404296875, 5.7003173828125, 5.996337890625, 6.2923583984375, 6.58837890625, 6.8843994140625, 7.180419921875, 7.4764404296875, 7.7724609375, 8.0684814453125, 8.364501953125, 8.6605224609375, 8.95654296875, 9.2525634765625, 9.548583984375, 9.8446044921875, 10.140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 9.0, 3.0, 4.0, 7.0, 16.0, 15.0, 31.0, 43.0, 51.0, 87.0, 92.0, 103.0, 108.0, 93.0, 77.0, 63.0, 55.0, 42.0, 27.0, 27.0, 26.0, 10.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.140625, -3.063140869140625, -2.98565673828125, -2.908172607421875, -2.8306884765625, -2.753204345703125, -2.67572021484375, -2.598236083984375, -2.520751953125, -2.443267822265625, -2.36578369140625, -2.288299560546875, -2.2108154296875, -2.133331298828125, -2.05584716796875, -1.978363037109375, -1.90087890625, -1.823394775390625, -1.74591064453125, -1.668426513671875, -1.5909423828125, -1.513458251953125, -1.43597412109375, -1.358489990234375, -1.281005859375, -1.203521728515625, -1.12603759765625, -1.048553466796875, -0.9710693359375, -0.893585205078125, -0.81610107421875, -0.738616943359375, -0.6611328125, -0.583648681640625, -0.50616455078125, -0.428680419921875, -0.3511962890625, -0.273712158203125, -0.19622802734375, -0.118743896484375, -0.041259765625, 0.036224365234375, 0.11370849609375, 0.191192626953125, 0.2686767578125, 0.346160888671875, 0.42364501953125, 0.501129150390625, 0.57861328125, 0.656097412109375, 0.73358154296875, 0.811065673828125, 0.8885498046875, 0.966033935546875, 1.04351806640625, 1.121002197265625, 1.198486328125, 1.275970458984375, 1.35345458984375, 1.430938720703125, 1.5084228515625, 1.585906982421875, 1.66339111328125, 1.740875244140625, 1.818359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 8.0, 12.0, 23.0, 19.0, 52.0, 129.0, 284.0, 601.0, 1863.0, 9930.0, 370160.0, 647995.0, 13825.0, 2363.0, 674.0, 286.0, 138.0, 58.0, 32.0, 27.0, 18.0, 14.0, 9.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.0703125, -9.7911376953125, -9.511962890625, -9.2327880859375, -8.95361328125, -8.6744384765625, -8.395263671875, -8.1160888671875, -7.8369140625, -7.5577392578125, -7.278564453125, -6.9993896484375, -6.72021484375, -6.4410400390625, -6.161865234375, -5.8826904296875, -5.603515625, -5.3243408203125, -5.045166015625, -4.7659912109375, -4.48681640625, -4.2076416015625, -3.928466796875, -3.6492919921875, -3.3701171875, -3.0909423828125, -2.811767578125, -2.5325927734375, -2.25341796875, -1.9742431640625, -1.695068359375, -1.4158935546875, -1.13671875, -0.8575439453125, -0.578369140625, -0.2991943359375, -0.02001953125, 0.2591552734375, 0.538330078125, 0.8175048828125, 1.0966796875, 1.3758544921875, 1.655029296875, 1.9342041015625, 2.21337890625, 2.4925537109375, 2.771728515625, 3.0509033203125, 3.330078125, 3.6092529296875, 3.888427734375, 4.1676025390625, 4.44677734375, 4.7259521484375, 5.005126953125, 5.2843017578125, 5.5634765625, 5.8426513671875, 6.121826171875, 6.4010009765625, 6.68017578125, 6.9593505859375, 7.238525390625, 7.5177001953125, 7.796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 2.0, 10.0, 6.0, 5.0, 5.0, 12.0, 19.0, 18.0, 28.0, 39.0, 28.0, 30.0, 32.0, 31.0, 41.0, 64.0, 66.0, 48.0, 47.0, 46.0, 47.0, 55.0, 47.0, 40.0, 35.0, 33.0, 30.0, 20.0, 27.0, 22.0, 12.0, 13.0, 10.0, 6.0, 3.0, 9.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.64453125, -6.46246337890625, -6.2803955078125, -6.09832763671875, -5.916259765625, -5.73419189453125, -5.5521240234375, -5.37005615234375, -5.18798828125, -5.00592041015625, -4.8238525390625, -4.64178466796875, -4.459716796875, -4.27764892578125, -4.0955810546875, -3.91351318359375, -3.7314453125, -3.54937744140625, -3.3673095703125, -3.18524169921875, -3.003173828125, -2.82110595703125, -2.6390380859375, -2.45697021484375, -2.27490234375, -2.09283447265625, -1.9107666015625, -1.72869873046875, -1.546630859375, -1.36456298828125, -1.1824951171875, -1.00042724609375, -0.818359375, -0.63629150390625, -0.4542236328125, -0.27215576171875, -0.090087890625, 0.09197998046875, 0.2740478515625, 0.45611572265625, 0.63818359375, 0.82025146484375, 1.0023193359375, 1.18438720703125, 1.366455078125, 1.54852294921875, 1.7305908203125, 1.91265869140625, 2.0947265625, 2.27679443359375, 2.4588623046875, 2.64093017578125, 2.822998046875, 3.00506591796875, 3.1871337890625, 3.36920166015625, 3.55126953125, 3.73333740234375, 3.9154052734375, 4.09747314453125, 4.279541015625, 4.46160888671875, 4.6436767578125, 4.82574462890625, 5.0078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 10.0, 11.0, 12.0, 26.0, 29.0, 48.0, 64.0, 165.0, 380.0, 907.0, 3485.0, 37253.0, 865573.0, 131777.0, 6508.0, 1395.0, 446.0, 205.0, 107.0, 55.0, 28.0, 27.0, 16.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.486328125, -3.400604248046875, -3.31488037109375, -3.229156494140625, -3.1434326171875, -3.057708740234375, -2.97198486328125, -2.886260986328125, -2.800537109375, -2.714813232421875, -2.62908935546875, -2.543365478515625, -2.4576416015625, -2.371917724609375, -2.28619384765625, -2.200469970703125, -2.11474609375, -2.029022216796875, -1.94329833984375, -1.857574462890625, -1.7718505859375, -1.686126708984375, -1.60040283203125, -1.514678955078125, -1.428955078125, -1.343231201171875, -1.25750732421875, -1.171783447265625, -1.0860595703125, -1.000335693359375, -0.91461181640625, -0.828887939453125, -0.7431640625, -0.657440185546875, -0.57171630859375, -0.485992431640625, -0.4002685546875, -0.314544677734375, -0.22882080078125, -0.143096923828125, -0.057373046875, 0.028350830078125, 0.11407470703125, 0.199798583984375, 0.2855224609375, 0.371246337890625, 0.45697021484375, 0.542694091796875, 0.62841796875, 0.714141845703125, 0.79986572265625, 0.885589599609375, 0.9713134765625, 1.057037353515625, 1.14276123046875, 1.228485107421875, 1.314208984375, 1.399932861328125, 1.48565673828125, 1.571380615234375, 1.6571044921875, 1.742828369140625, 1.82855224609375, 1.914276123046875, 2.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 10.0, 12.0, 17.0, 18.0, 26.0, 39.0, 44.0, 45.0, 47.0, 68.0, 95.0, 103.0, 81.0, 64.0, 41.0, 36.0, 45.0, 30.0, 27.0, 14.0, 23.0, 15.0, 11.0, 15.0, 5.0, 8.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002579689025878906, -0.00025023147463798523, -0.00024249404668807983, -0.00023475661873817444, -0.00022701919078826904, -0.00021928176283836365, -0.00021154433488845825, -0.00020380690693855286, -0.00019606947898864746, -0.00018833205103874207, -0.00018059462308883667, -0.00017285719513893127, -0.00016511976718902588, -0.00015738233923912048, -0.0001496449112892151, -0.0001419074833393097, -0.0001341700553894043, -0.0001264326274394989, -0.0001186951994895935, -0.00011095777153968811, -0.00010322034358978271, -9.548291563987732e-05, -8.774548768997192e-05, -8.000805974006653e-05, -7.227063179016113e-05, -6.453320384025574e-05, -5.679577589035034e-05, -4.9058347940444946e-05, -4.132091999053955e-05, -3.3583492040634155e-05, -2.584606409072876e-05, -1.8108636140823364e-05, -1.0371208190917969e-05, -2.6337802410125732e-06, 5.103647708892822e-06, 1.2841075658798218e-05, 2.0578503608703613e-05, 2.831593155860901e-05, 3.6053359508514404e-05, 4.37907874584198e-05, 5.1528215408325195e-05, 5.926564335823059e-05, 6.700307130813599e-05, 7.474049925804138e-05, 8.247792720794678e-05, 9.021535515785217e-05, 9.795278310775757e-05, 0.00010569021105766296, 0.00011342763900756836, 0.00012116506695747375, 0.00012890249490737915, 0.00013663992285728455, 0.00014437735080718994, 0.00015211477875709534, 0.00015985220670700073, 0.00016758963465690613, 0.00017532706260681152, 0.00018306449055671692, 0.00019080191850662231, 0.0001985393464565277, 0.0002062767744064331, 0.0002140142023563385, 0.0002217516303062439, 0.0002294890582561493, 0.0002372264862060547]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 16.0, 21.0, 31.0, 40.0, 74.0, 134.0, 300.0, 585.0, 1473.0, 4224.0, 18104.0, 487155.0, 511092.0, 18256.0, 4354.0, 1472.0, 538.0, 251.0, 160.0, 90.0, 49.0, 34.0, 20.0, 23.0, 12.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.732421875, -2.652069091796875, -2.57171630859375, -2.491363525390625, -2.4110107421875, -2.330657958984375, -2.25030517578125, -2.169952392578125, -2.089599609375, -2.009246826171875, -1.92889404296875, -1.848541259765625, -1.7681884765625, -1.687835693359375, -1.60748291015625, -1.527130126953125, -1.44677734375, -1.366424560546875, -1.28607177734375, -1.205718994140625, -1.1253662109375, -1.045013427734375, -0.96466064453125, -0.884307861328125, -0.803955078125, -0.723602294921875, -0.64324951171875, -0.562896728515625, -0.4825439453125, -0.402191162109375, -0.32183837890625, -0.241485595703125, -0.1611328125, -0.080780029296875, -0.00042724609375, 0.079925537109375, 0.1602783203125, 0.240631103515625, 0.32098388671875, 0.401336669921875, 0.481689453125, 0.562042236328125, 0.64239501953125, 0.722747802734375, 0.8031005859375, 0.883453369140625, 0.96380615234375, 1.044158935546875, 1.12451171875, 1.204864501953125, 1.28521728515625, 1.365570068359375, 1.4459228515625, 1.526275634765625, 1.60662841796875, 1.686981201171875, 1.767333984375, 1.847686767578125, 1.92803955078125, 2.008392333984375, 2.0887451171875, 2.169097900390625, 2.24945068359375, 2.329803466796875, 2.41015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 5.0, 1.0, 12.0, 14.0, 17.0, 20.0, 37.0, 37.0, 72.0, 89.0, 91.0, 100.0, 110.0, 83.0, 81.0, 64.0, 45.0, 30.0, 25.0, 19.0, 8.0, 11.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8154296875, -1.7589569091796875, -1.702484130859375, -1.6460113525390625, -1.58953857421875, -1.5330657958984375, -1.476593017578125, -1.4201202392578125, -1.3636474609375, -1.3071746826171875, -1.250701904296875, -1.1942291259765625, -1.13775634765625, -1.0812835693359375, -1.024810791015625, -0.9683380126953125, -0.911865234375, -0.8553924560546875, -0.798919677734375, -0.7424468994140625, -0.68597412109375, -0.6295013427734375, -0.573028564453125, -0.5165557861328125, -0.4600830078125, -0.4036102294921875, -0.347137451171875, -0.2906646728515625, -0.23419189453125, -0.1777191162109375, -0.121246337890625, -0.0647735595703125, -0.00830078125, 0.0481719970703125, 0.104644775390625, 0.1611175537109375, 0.21759033203125, 0.2740631103515625, 0.330535888671875, 0.3870086669921875, 0.4434814453125, 0.4999542236328125, 0.556427001953125, 0.6128997802734375, 0.66937255859375, 0.7258453369140625, 0.782318115234375, 0.8387908935546875, 0.895263671875, 0.9517364501953125, 1.008209228515625, 1.0646820068359375, 1.12115478515625, 1.1776275634765625, 1.234100341796875, 1.2905731201171875, 1.3470458984375, 1.4035186767578125, 1.459991455078125, 1.5164642333984375, 1.57293701171875, 1.6294097900390625, 1.685882568359375, 1.7423553466796875, 1.798828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 33.0, 58.0, 116.0, 161.0, 175.0, 163.0, 131.0, 58.0, 28.0, 21.0, 11.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.944555282592773, -30.780574798583984, -29.616592407226562, -28.45261001586914, -27.28862953186035, -26.124649047851562, -24.96066665649414, -23.79668426513672, -22.63270378112793, -21.46872329711914, -20.30474090576172, -19.140758514404297, -17.976778030395508, -16.81279754638672, -15.648815155029297, -14.484833717346191, -13.320852279663086, -12.15687084197998, -10.992889404296875, -9.82890796661377, -8.664926528930664, -7.500945091247559, -6.336963653564453, -5.172982215881348, -4.009000778198242, -2.8450193405151367, -1.6810379028320312, -0.5170564651489258, 0.6469249725341797, 1.8109064102172852, 2.9748878479003906, 4.138869285583496, 5.302852630615234, 6.46683406829834, 7.630815505981445, 8.79479694366455, 9.958778381347656, 11.122759819030762, 12.286741256713867, 13.450722694396973, 14.614704132080078, 15.778685569763184, 16.94266700744629, 18.106647491455078, 19.2706298828125, 20.434612274169922, 21.59859275817871, 22.7625732421875, 23.926555633544922, 25.090538024902344, 26.254518508911133, 27.418498992919922, 28.582481384277344, 29.746463775634766, 30.910444259643555, 32.074424743652344, 33.238407135009766, 34.40238952636719, 35.566368103027344, 36.730350494384766, 37.89433288574219, 39.05831527709961, 40.22229766845703, 41.38627624511719, 42.55025863647461]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 13.0, 11.0, 7.0, 15.0, 8.0, 15.0, 20.0, 18.0, 27.0, 42.0, 26.0, 45.0, 42.0, 44.0, 47.0, 51.0, 51.0, 55.0, 43.0, 46.0, 51.0, 44.0, 33.0, 33.0, 32.0, 27.0, 25.0, 24.0, 23.0, 8.0, 11.0, 6.0, 9.0, 13.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.931686401367188, -22.114774703979492, -21.297863006591797, -20.4809513092041, -19.664039611816406, -18.84712791442871, -18.030216217041016, -17.213302612304688, -16.396392822265625, -15.57948112487793, -14.762569427490234, -13.945657730102539, -13.128746032714844, -12.311834335327148, -11.494921684265137, -10.678009986877441, -9.86109733581543, -9.044185638427734, -8.227273941040039, -7.4103617668151855, -6.59345006942749, -5.776538372039795, -4.959626197814941, -4.142714500427246, -3.325802803039551, -2.5088911056518555, -1.691979169845581, -0.8750672340393066, -0.05815553665161133, 0.758756160736084, 1.5756683349609375, 2.392580032348633, 3.209491729736328, 4.026403427124023, 4.843315124511719, 5.660227298736572, 6.477138996124268, 7.294050693511963, 8.110962867736816, 8.927874565124512, 9.744786262512207, 10.561697959899902, 11.378609657287598, 12.19552230834961, 13.012434005737305, 13.829345703125, 14.646257400512695, 15.46316909790039, 16.280080795288086, 17.09699249267578, 17.913904190063477, 18.730815887451172, 19.547727584838867, 20.364639282226562, 21.18155288696289, 21.998462677001953, 22.81537628173828, 23.632287979125977, 24.449199676513672, 25.266111373901367, 26.083023071289062, 26.899934768676758, 27.716846466064453, 28.53376007080078, 29.350669860839844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 5.0, 3.0, 10.0, 10.0, 22.0, 25.0, 32.0, 50.0, 55.0, 108.0, 183.0, 367.0, 839.0, 2533.0, 13150.0, 219318.0, 3841812.0, 103148.0, 9189.0, 2062.0, 719.0, 248.0, 136.0, 76.0, 43.0, 35.0, 25.0, 23.0, 9.0, 14.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.57421875, -4.43304443359375, -4.2918701171875, -4.15069580078125, -4.009521484375, -3.86834716796875, -3.7271728515625, -3.58599853515625, -3.44482421875, -3.30364990234375, -3.1624755859375, -3.02130126953125, -2.880126953125, -2.73895263671875, -2.5977783203125, -2.45660400390625, -2.3154296875, -2.17425537109375, -2.0330810546875, -1.89190673828125, -1.750732421875, -1.60955810546875, -1.4683837890625, -1.32720947265625, -1.18603515625, -1.04486083984375, -0.9036865234375, -0.76251220703125, -0.621337890625, -0.48016357421875, -0.3389892578125, -0.19781494140625, -0.056640625, 0.08453369140625, 0.2257080078125, 0.36688232421875, 0.508056640625, 0.64923095703125, 0.7904052734375, 0.93157958984375, 1.07275390625, 1.21392822265625, 1.3551025390625, 1.49627685546875, 1.637451171875, 1.77862548828125, 1.9197998046875, 2.06097412109375, 2.2021484375, 2.34332275390625, 2.4844970703125, 2.62567138671875, 2.766845703125, 2.90802001953125, 3.0491943359375, 3.19036865234375, 3.33154296875, 3.47271728515625, 3.6138916015625, 3.75506591796875, 3.896240234375, 4.03741455078125, 4.1785888671875, 4.31976318359375, 4.4609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 12.0, 9.0, 20.0, 19.0, 29.0, 41.0, 50.0, 44.0, 55.0, 56.0, 46.0, 56.0, 61.0, 60.0, 53.0, 49.0, 47.0, 44.0, 38.0, 29.0, 24.0, 20.0, 24.0, 18.0, 12.0, 22.0, 5.0, 6.0, 3.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.330078125, -1.2928924560546875, -1.255706787109375, -1.2185211181640625, -1.18133544921875, -1.1441497802734375, -1.106964111328125, -1.0697784423828125, -1.0325927734375, -0.9954071044921875, -0.958221435546875, -0.9210357666015625, -0.88385009765625, -0.8466644287109375, -0.809478759765625, -0.7722930908203125, -0.735107421875, -0.6979217529296875, -0.660736083984375, -0.6235504150390625, -0.58636474609375, -0.5491790771484375, -0.511993408203125, -0.4748077392578125, -0.4376220703125, -0.4004364013671875, -0.363250732421875, -0.3260650634765625, -0.28887939453125, -0.2516937255859375, -0.214508056640625, -0.1773223876953125, -0.14013671875, -0.1029510498046875, -0.065765380859375, -0.0285797119140625, 0.00860595703125, 0.0457916259765625, 0.082977294921875, 0.1201629638671875, 0.1573486328125, 0.1945343017578125, 0.231719970703125, 0.2689056396484375, 0.30609130859375, 0.3432769775390625, 0.380462646484375, 0.4176483154296875, 0.454833984375, 0.4920196533203125, 0.529205322265625, 0.5663909912109375, 0.60357666015625, 0.6407623291015625, 0.677947998046875, 0.7151336669921875, 0.7523193359375, 0.7895050048828125, 0.826690673828125, 0.8638763427734375, 0.90106201171875, 0.9382476806640625, 0.975433349609375, 1.0126190185546875, 1.0498046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 24.0, 20.0, 23.0, 30.0, 61.0, 124.0, 260.0, 597.0, 2332.0, 14064.0, 251411.0, 3802186.0, 112025.0, 8716.0, 1538.0, 462.0, 164.0, 82.0, 38.0, 28.0, 27.0, 8.0, 11.0, 3.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.036224365234375, -2.90643310546875, -2.776641845703125, -2.6468505859375, -2.517059326171875, -2.38726806640625, -2.257476806640625, -2.127685546875, -1.997894287109375, -1.86810302734375, -1.738311767578125, -1.6085205078125, -1.478729248046875, -1.34893798828125, -1.219146728515625, -1.08935546875, -0.959564208984375, -0.82977294921875, -0.699981689453125, -0.5701904296875, -0.440399169921875, -0.31060791015625, -0.180816650390625, -0.051025390625, 0.078765869140625, 0.20855712890625, 0.338348388671875, 0.4681396484375, 0.597930908203125, 0.72772216796875, 0.857513427734375, 0.9873046875, 1.117095947265625, 1.24688720703125, 1.376678466796875, 1.5064697265625, 1.636260986328125, 1.76605224609375, 1.895843505859375, 2.025634765625, 2.155426025390625, 2.28521728515625, 2.415008544921875, 2.5447998046875, 2.674591064453125, 2.80438232421875, 2.934173583984375, 3.06396484375, 3.193756103515625, 3.32354736328125, 3.453338623046875, 3.5831298828125, 3.712921142578125, 3.84271240234375, 3.972503662109375, 4.102294921875, 4.232086181640625, 4.36187744140625, 4.491668701171875, 4.6214599609375, 4.751251220703125, 4.88104248046875, 5.010833740234375, 5.140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 15.0, 15.0, 26.0, 46.0, 56.0, 104.0, 130.0, 240.0, 382.0, 675.0, 847.0, 591.0, 351.0, 188.0, 125.0, 56.0, 51.0, 40.0, 27.0, 22.0, 12.0, 8.0, 11.0, 3.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.384765625, -3.3008880615234375, -3.217010498046875, -3.1331329345703125, -3.04925537109375, -2.9653778076171875, -2.881500244140625, -2.7976226806640625, -2.7137451171875, -2.6298675537109375, -2.545989990234375, -2.4621124267578125, -2.37823486328125, -2.2943572998046875, -2.210479736328125, -2.1266021728515625, -2.042724609375, -1.9588470458984375, -1.874969482421875, -1.7910919189453125, -1.70721435546875, -1.6233367919921875, -1.539459228515625, -1.4555816650390625, -1.3717041015625, -1.2878265380859375, -1.203948974609375, -1.1200714111328125, -1.03619384765625, -0.9523162841796875, -0.868438720703125, -0.7845611572265625, -0.70068359375, -0.6168060302734375, -0.532928466796875, -0.4490509033203125, -0.36517333984375, -0.2812957763671875, -0.197418212890625, -0.1135406494140625, -0.0296630859375, 0.0542144775390625, 0.138092041015625, 0.2219696044921875, 0.30584716796875, 0.3897247314453125, 0.473602294921875, 0.5574798583984375, 0.641357421875, 0.7252349853515625, 0.809112548828125, 0.8929901123046875, 0.97686767578125, 1.0607452392578125, 1.144622802734375, 1.2285003662109375, 1.3123779296875, 1.3962554931640625, 1.480133056640625, 1.5640106201171875, 1.64788818359375, 1.7317657470703125, 1.815643310546875, 1.8995208740234375, 1.9833984375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 34.0, 65.0, 184.0, 299.0, 253.0, 86.0, 42.0, 14.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.51862716674805, -34.3272590637207, -33.13589096069336, -31.944522857666016, -30.753154754638672, -29.561786651611328, -28.370420455932617, -27.179052352905273, -25.98768424987793, -24.796316146850586, -23.604948043823242, -22.4135799407959, -21.222213745117188, -20.030845642089844, -18.8394775390625, -17.648109436035156, -16.456741333007812, -15.265373229980469, -14.074005126953125, -12.882637977600098, -11.691269874572754, -10.49990177154541, -9.308534622192383, -8.117166519165039, -6.925798416137695, -5.734430313110352, -4.543062686920166, -3.3516948223114014, -2.1603269577026367, -0.968958854675293, 0.22240877151489258, 1.4137763977050781, 2.6051406860351562, 3.796508550643921, 4.9878764152526855, 6.179244041442871, 7.370612144470215, 8.561980247497559, 9.753347396850586, 10.94471549987793, 12.136083602905273, 13.327451705932617, 14.518819808959961, 15.710186958312988, 16.901554107666016, 18.09292221069336, 19.284290313720703, 20.475658416748047, 21.66702651977539, 22.858394622802734, 24.049762725830078, 25.241130828857422, 26.432498931884766, 27.62386703491211, 28.81523323059082, 30.006601333618164, 31.197969436645508, 32.38933563232422, 33.58070373535156, 34.772071838378906, 35.96343994140625, 37.154808044433594, 38.34617614746094, 39.53754425048828, 40.728912353515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 7.0, 18.0, 12.0, 17.0, 19.0, 29.0, 15.0, 26.0, 32.0, 33.0, 37.0, 32.0, 41.0, 31.0, 39.0, 41.0, 41.0, 34.0, 45.0, 54.0, 46.0, 39.0, 41.0, 25.0, 29.0, 30.0, 25.0, 24.0, 17.0, 20.0, 9.0, 16.0, 20.0, 7.0, 8.0, 6.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0], "bins": [-14.137614250183105, -13.76831340789795, -13.39901351928711, -13.029712677001953, -12.660411834716797, -12.291111946105957, -11.9218111038208, -11.552511215209961, -11.183210372924805, -10.813909530639648, -10.444609642028809, -10.075308799743652, -9.706008911132812, -9.336708068847656, -8.9674072265625, -8.598106384277344, -8.228806495666504, -7.859506130218506, -7.490205764770508, -7.120904922485352, -6.7516045570373535, -6.3823041915893555, -6.013003349304199, -5.643702983856201, -5.274402618408203, -4.905102252960205, -4.535801887512207, -4.166501045227051, -3.7972006797790527, -3.4279003143310547, -3.0585997104644775, -2.6892991065979004, -2.319997787475586, -1.9506973028182983, -1.5813968181610107, -1.2120963335037231, -0.8427958488464355, -0.47349536418914795, -0.10419487953186035, 0.2651057243347168, 0.6344060897827148, 1.0037065744400024, 1.37300705909729, 1.7423075437545776, 2.1116080284118652, 2.4809083938598633, 2.8502089977264404, 3.2195096015930176, 3.5888099670410156, 3.9581103324890137, 4.327410697937012, 4.696711540222168, 5.066011905670166, 5.435312271118164, 5.80461311340332, 6.173913478851318, 6.543213844299316, 6.9125142097473145, 7.2818145751953125, 7.651115417480469, 8.020416259765625, 8.389716148376465, 8.759016990661621, 9.128316879272461, 9.497617721557617]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 10.0, 16.0, 17.0, 31.0, 40.0, 90.0, 155.0, 242.0, 494.0, 959.0, 2062.0, 4915.0, 13856.0, 46740.0, 200040.0, 547056.0, 170656.0, 40439.0, 12449.0, 4468.0, 1901.0, 841.0, 448.0, 249.0, 136.0, 91.0, 52.0, 35.0, 20.0, 13.0, 10.0, 4.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.0833740234375, -2.998779296875, -2.9141845703125, -2.82958984375, -2.7449951171875, -2.660400390625, -2.5758056640625, -2.4912109375, -2.4066162109375, -2.322021484375, -2.2374267578125, -2.15283203125, -2.0682373046875, -1.983642578125, -1.8990478515625, -1.814453125, -1.7298583984375, -1.645263671875, -1.5606689453125, -1.47607421875, -1.3914794921875, -1.306884765625, -1.2222900390625, -1.1376953125, -1.0531005859375, -0.968505859375, -0.8839111328125, -0.79931640625, -0.7147216796875, -0.630126953125, -0.5455322265625, -0.4609375, -0.3763427734375, -0.291748046875, -0.2071533203125, -0.12255859375, -0.0379638671875, 0.046630859375, 0.1312255859375, 0.2158203125, 0.3004150390625, 0.385009765625, 0.4696044921875, 0.55419921875, 0.6387939453125, 0.723388671875, 0.8079833984375, 0.892578125, 0.9771728515625, 1.061767578125, 1.1463623046875, 1.23095703125, 1.3155517578125, 1.400146484375, 1.4847412109375, 1.5693359375, 1.6539306640625, 1.738525390625, 1.8231201171875, 1.90771484375, 1.9923095703125, 2.076904296875, 2.1614990234375, 2.24609375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 11.0, 16.0, 20.0, 21.0, 26.0, 35.0, 34.0, 49.0, 59.0, 44.0, 46.0, 45.0, 64.0, 60.0, 63.0, 52.0, 47.0, 48.0, 35.0, 46.0, 33.0, 19.0, 22.0, 23.0, 14.0, 15.0, 11.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.408203125, -1.37042236328125, -1.3326416015625, -1.29486083984375, -1.257080078125, -1.21929931640625, -1.1815185546875, -1.14373779296875, -1.10595703125, -1.06817626953125, -1.0303955078125, -0.99261474609375, -0.954833984375, -0.91705322265625, -0.8792724609375, -0.84149169921875, -0.8037109375, -0.76593017578125, -0.7281494140625, -0.69036865234375, -0.652587890625, -0.61480712890625, -0.5770263671875, -0.53924560546875, -0.50146484375, -0.46368408203125, -0.4259033203125, -0.38812255859375, -0.350341796875, -0.31256103515625, -0.2747802734375, -0.23699951171875, -0.19921875, -0.16143798828125, -0.1236572265625, -0.08587646484375, -0.048095703125, -0.01031494140625, 0.0274658203125, 0.06524658203125, 0.10302734375, 0.14080810546875, 0.1785888671875, 0.21636962890625, 0.254150390625, 0.29193115234375, 0.3297119140625, 0.36749267578125, 0.4052734375, 0.44305419921875, 0.4808349609375, 0.51861572265625, 0.556396484375, 0.59417724609375, 0.6319580078125, 0.66973876953125, 0.70751953125, 0.74530029296875, 0.7830810546875, 0.82086181640625, 0.858642578125, 0.89642333984375, 0.9342041015625, 0.97198486328125, 1.009765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 4.0, 9.0, 13.0, 15.0, 26.0, 31.0, 55.0, 62.0, 109.0, 131.0, 262.0, 396.0, 760.0, 1452.0, 3870.0, 19547.0, 283559.0, 689505.0, 38846.0, 5705.0, 1887.0, 929.0, 523.0, 313.0, 178.0, 113.0, 76.0, 39.0, 36.0, 26.0, 27.0, 16.0, 5.0, 12.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.54296875, -4.40167236328125, -4.2603759765625, -4.11907958984375, -3.977783203125, -3.83648681640625, -3.6951904296875, -3.55389404296875, -3.41259765625, -3.27130126953125, -3.1300048828125, -2.98870849609375, -2.847412109375, -2.70611572265625, -2.5648193359375, -2.42352294921875, -2.2822265625, -2.14093017578125, -1.9996337890625, -1.85833740234375, -1.717041015625, -1.57574462890625, -1.4344482421875, -1.29315185546875, -1.15185546875, -1.01055908203125, -0.8692626953125, -0.72796630859375, -0.586669921875, -0.44537353515625, -0.3040771484375, -0.16278076171875, -0.021484375, 0.11981201171875, 0.2611083984375, 0.40240478515625, 0.543701171875, 0.68499755859375, 0.8262939453125, 0.96759033203125, 1.10888671875, 1.25018310546875, 1.3914794921875, 1.53277587890625, 1.674072265625, 1.81536865234375, 1.9566650390625, 2.09796142578125, 2.2392578125, 2.38055419921875, 2.5218505859375, 2.66314697265625, 2.804443359375, 2.94573974609375, 3.0870361328125, 3.22833251953125, 3.36962890625, 3.51092529296875, 3.6522216796875, 3.79351806640625, 3.934814453125, 4.07611083984375, 4.2174072265625, 4.35870361328125, 4.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 11.0, 7.0, 12.0, 12.0, 22.0, 24.0, 27.0, 24.0, 33.0, 49.0, 47.0, 49.0, 47.0, 50.0, 65.0, 45.0, 56.0, 56.0, 48.0, 44.0, 49.0, 25.0, 34.0, 28.0, 22.0, 20.0, 16.0, 14.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.046875, -4.8984375, -4.75, -4.6015625, -4.453125, -4.3046875, -4.15625, -4.0078125, -3.859375, -3.7109375, -3.5625, -3.4140625, -3.265625, -3.1171875, -2.96875, -2.8203125, -2.671875, -2.5234375, -2.375, -2.2265625, -2.078125, -1.9296875, -1.78125, -1.6328125, -1.484375, -1.3359375, -1.1875, -1.0390625, -0.890625, -0.7421875, -0.59375, -0.4453125, -0.296875, -0.1484375, 0.0, 0.1484375, 0.296875, 0.4453125, 0.59375, 0.7421875, 0.890625, 1.0390625, 1.1875, 1.3359375, 1.484375, 1.6328125, 1.78125, 1.9296875, 2.078125, 2.2265625, 2.375, 2.5234375, 2.671875, 2.8203125, 2.96875, 3.1171875, 3.265625, 3.4140625, 3.5625, 3.7109375, 3.859375, 4.0078125, 4.15625, 4.3046875, 4.453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 12.0, 17.0, 24.0, 35.0, 85.0, 193.0, 508.0, 2443.0, 47507.0, 984592.0, 11251.0, 1277.0, 319.0, 137.0, 52.0, 26.0, 19.0, 14.0, 10.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.5028076171875, -5.337646484375, -5.1724853515625, -5.00732421875, -4.8421630859375, -4.677001953125, -4.5118408203125, -4.3466796875, -4.1815185546875, -4.016357421875, -3.8511962890625, -3.68603515625, -3.5208740234375, -3.355712890625, -3.1905517578125, -3.025390625, -2.8602294921875, -2.695068359375, -2.5299072265625, -2.36474609375, -2.1995849609375, -2.034423828125, -1.8692626953125, -1.7041015625, -1.5389404296875, -1.373779296875, -1.2086181640625, -1.04345703125, -0.8782958984375, -0.713134765625, -0.5479736328125, -0.3828125, -0.2176513671875, -0.052490234375, 0.1126708984375, 0.27783203125, 0.4429931640625, 0.608154296875, 0.7733154296875, 0.9384765625, 1.1036376953125, 1.268798828125, 1.4339599609375, 1.59912109375, 1.7642822265625, 1.929443359375, 2.0946044921875, 2.259765625, 2.4249267578125, 2.590087890625, 2.7552490234375, 2.92041015625, 3.0855712890625, 3.250732421875, 3.4158935546875, 3.5810546875, 3.7462158203125, 3.911376953125, 4.0765380859375, 4.24169921875, 4.4068603515625, 4.572021484375, 4.7371826171875, 4.90234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 16.0, 12.0, 26.0, 42.0, 83.0, 266.0, 280.0, 122.0, 53.0, 25.0, 24.0, 10.0, 7.0, 4.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007967948913574219, -0.0007758811116218567, -0.0007549673318862915, -0.0007340535521507263, -0.0007131397724151611, -0.000692225992679596, -0.0006713122129440308, -0.0006503984332084656, -0.0006294846534729004, -0.0006085708737373352, -0.00058765709400177, -0.0005667433142662048, -0.0005458295345306396, -0.0005249157547950745, -0.0005040019750595093, -0.0004830881953239441, -0.0004621744155883789, -0.0004412606358528137, -0.00042034685611724854, -0.00039943307638168335, -0.00037851929664611816, -0.000357605516910553, -0.0003366917371749878, -0.0003157779574394226, -0.0002948641777038574, -0.00027395039796829224, -0.00025303661823272705, -0.00023212283849716187, -0.00021120905876159668, -0.0001902952790260315, -0.0001693814992904663, -0.00014846771955490112, -0.00012755393981933594, -0.00010664016008377075, -8.572638034820557e-05, -6.481260061264038e-05, -4.3898820877075195e-05, -2.298504114151001e-05, -2.0712614059448242e-06, 1.884251832962036e-05, 3.975629806518555e-05, 6.067007780075073e-05, 8.158385753631592e-05, 0.0001024976372718811, 0.0001234114170074463, 0.00014432519674301147, 0.00016523897647857666, 0.00018615275621414185, 0.00020706653594970703, 0.00022798031568527222, 0.0002488940954208374, 0.0002698078751564026, 0.0002907216548919678, 0.00031163543462753296, 0.00033254921436309814, 0.00035346299409866333, 0.0003743767738342285, 0.0003952905535697937, 0.0004162043333053589, 0.00043711811304092407, 0.00045803189277648926, 0.00047894567251205444, 0.0004998594522476196, 0.0005207732319831848, 0.00054168701171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 1.0, 9.0, 4.0, 6.0, 8.0, 19.0, 22.0, 41.0, 54.0, 88.0, 179.0, 316.0, 620.0, 1400.0, 3557.0, 14647.0, 965757.0, 52406.0, 5701.0, 1905.0, 836.0, 433.0, 228.0, 127.0, 54.0, 45.0, 15.0, 11.0, 16.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.39776611328125, -4.2330322265625, -4.06829833984375, -3.903564453125, -3.73883056640625, -3.5740966796875, -3.40936279296875, -3.24462890625, -3.07989501953125, -2.9151611328125, -2.75042724609375, -2.585693359375, -2.42095947265625, -2.2562255859375, -2.09149169921875, -1.9267578125, -1.76202392578125, -1.5972900390625, -1.43255615234375, -1.267822265625, -1.10308837890625, -0.9383544921875, -0.77362060546875, -0.60888671875, -0.44415283203125, -0.2794189453125, -0.11468505859375, 0.050048828125, 0.21478271484375, 0.3795166015625, 0.54425048828125, 0.708984375, 0.87371826171875, 1.0384521484375, 1.20318603515625, 1.367919921875, 1.53265380859375, 1.6973876953125, 1.86212158203125, 2.02685546875, 2.19158935546875, 2.3563232421875, 2.52105712890625, 2.685791015625, 2.85052490234375, 3.0152587890625, 3.17999267578125, 3.3447265625, 3.50946044921875, 3.6741943359375, 3.83892822265625, 4.003662109375, 4.16839599609375, 4.3331298828125, 4.49786376953125, 4.66259765625, 4.82733154296875, 4.9920654296875, 5.15679931640625, 5.321533203125, 5.48626708984375, 5.6510009765625, 5.81573486328125, 5.98046875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 14.0, 13.0, 25.0, 59.0, 103.0, 188.0, 224.0, 147.0, 89.0, 48.0, 28.0, 8.0, 9.0, 6.0, 8.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.125, -3.01055908203125, -2.8961181640625, -2.78167724609375, -2.667236328125, -2.55279541015625, -2.4383544921875, -2.32391357421875, -2.20947265625, -2.09503173828125, -1.9805908203125, -1.86614990234375, -1.751708984375, -1.63726806640625, -1.5228271484375, -1.40838623046875, -1.2939453125, -1.17950439453125, -1.0650634765625, -0.95062255859375, -0.836181640625, -0.72174072265625, -0.6072998046875, -0.49285888671875, -0.37841796875, -0.26397705078125, -0.1495361328125, -0.03509521484375, 0.079345703125, 0.19378662109375, 0.3082275390625, 0.42266845703125, 0.537109375, 0.65155029296875, 0.7659912109375, 0.88043212890625, 0.994873046875, 1.10931396484375, 1.2237548828125, 1.33819580078125, 1.45263671875, 1.56707763671875, 1.6815185546875, 1.79595947265625, 1.910400390625, 2.02484130859375, 2.1392822265625, 2.25372314453125, 2.3681640625, 2.48260498046875, 2.5970458984375, 2.71148681640625, 2.825927734375, 2.94036865234375, 3.0548095703125, 3.16925048828125, 3.28369140625, 3.39813232421875, 3.5125732421875, 3.62701416015625, 3.741455078125, 3.85589599609375, 3.9703369140625, 4.08477783203125, 4.19921875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 14.0, 48.0, 258.0, 456.0, 153.0, 44.0, 14.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.081878662109375, -60.8508186340332, -58.619754791259766, -56.388694763183594, -54.157630920410156, -51.926570892333984, -49.69551086425781, -47.464447021484375, -45.2333869934082, -43.00232696533203, -40.771263122558594, -38.54020309448242, -36.30914306640625, -34.07807922363281, -31.84701919555664, -29.615957260131836, -27.38489532470703, -25.153833389282227, -22.922771453857422, -20.69171142578125, -18.460649490356445, -16.22958755493164, -13.998526573181152, -11.767465591430664, -9.53640365600586, -7.305342197418213, -5.074280738830566, -2.84321928024292, -0.6121578216552734, 1.6189041137695312, 3.8499650955200195, 6.081026077270508, 8.312080383300781, 10.543142318725586, 12.774203300476074, 15.005264282226562, 17.236326217651367, 19.467388153076172, 21.698448181152344, 23.92951011657715, 26.160572052001953, 28.391633987426758, 30.622695922851562, 32.853755950927734, 35.084815979003906, 37.315879821777344, 39.546939849853516, 41.77799987792969, 44.009063720703125, 46.2401237487793, 48.471187591552734, 50.702247619628906, 52.933311462402344, 55.164371490478516, 57.39543151855469, 59.626495361328125, 61.8575553894043, 64.08861541748047, 66.3196792602539, 68.55074310302734, 70.78179931640625, 73.01286315917969, 75.24392700195312, 77.47498321533203, 79.70604705810547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 11.0, 10.0, 16.0, 27.0, 30.0, 33.0, 53.0, 59.0, 52.0, 72.0, 82.0, 99.0, 75.0, 77.0, 54.0, 40.0, 58.0, 39.0, 33.0, 23.0, 17.0, 9.0, 13.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.815162658691406, -25.937559127807617, -25.059955596923828, -24.182350158691406, -23.304746627807617, -22.427143096923828, -21.54953956604004, -20.67193603515625, -19.794330596923828, -18.91672706604004, -18.03912353515625, -17.161518096923828, -16.28391456604004, -15.40631103515625, -14.528707504272461, -13.651103973388672, -12.773500442504883, -11.895896911621094, -11.018292427062988, -10.1406888961792, -9.263084411621094, -8.385480880737305, -7.507877349853516, -6.630273342132568, -5.752669334411621, -4.875065326690674, -3.9974615573883057, -3.1198577880859375, -2.2422537803649902, -1.364649772644043, -0.4870462417602539, 0.39055776596069336, 1.2681636810302734, 2.1457676887512207, 3.023371458053589, 3.900975227355957, 4.778579235076904, 5.656183242797852, 6.533786773681641, 7.411390781402588, 8.288994789123535, 9.166598320007324, 10.04420280456543, 10.921806335449219, 11.799409866333008, 12.677014350891113, 13.554617881774902, 14.432222366333008, 15.309825897216797, 16.187429428100586, 17.065032958984375, 17.942638397216797, 18.820241928100586, 19.697845458984375, 20.575448989868164, 21.453052520751953, 22.330657958984375, 23.208261489868164, 24.085865020751953, 24.963470458984375, 25.841073989868164, 26.718677520751953, 27.596281051635742, 28.47388458251953, 29.35148811340332]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 8.0, 4.0, 1.0, 9.0, 12.0, 5.0, 12.0, 24.0, 38.0, 88.0, 178.0, 847.0, 8231.0, 3400509.0, 777861.0, 5396.0, 758.0, 169.0, 67.0, 25.0, 14.0, 13.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.453125, -10.239410400390625, -10.02569580078125, -9.811981201171875, -9.5982666015625, -9.384552001953125, -9.17083740234375, -8.957122802734375, -8.743408203125, -8.529693603515625, -8.31597900390625, -8.102264404296875, -7.8885498046875, -7.674835205078125, -7.46112060546875, -7.247406005859375, -7.03369140625, -6.819976806640625, -6.60626220703125, -6.392547607421875, -6.1788330078125, -5.965118408203125, -5.75140380859375, -5.537689208984375, -5.323974609375, -5.110260009765625, -4.89654541015625, -4.682830810546875, -4.4691162109375, -4.255401611328125, -4.04168701171875, -3.827972412109375, -3.6142578125, -3.400543212890625, -3.18682861328125, -2.973114013671875, -2.7593994140625, -2.545684814453125, -2.33197021484375, -2.118255615234375, -1.904541015625, -1.690826416015625, -1.47711181640625, -1.263397216796875, -1.0496826171875, -0.835968017578125, -0.62225341796875, -0.408538818359375, -0.19482421875, 0.018890380859375, 0.23260498046875, 0.446319580078125, 0.6600341796875, 0.873748779296875, 1.08746337890625, 1.301177978515625, 1.514892578125, 1.728607177734375, 1.94232177734375, 2.156036376953125, 2.3697509765625, 2.583465576171875, 2.79718017578125, 3.010894775390625, 3.224609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 25.0, 34.0, 35.0, 79.0, 76.0, 91.0, 117.0, 109.0, 98.0, 103.0, 62.0, 53.0, 36.0, 26.0, 16.0, 13.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.968048095703125, -1.90289306640625, -1.837738037109375, -1.7725830078125, -1.707427978515625, -1.64227294921875, -1.577117919921875, -1.511962890625, -1.446807861328125, -1.38165283203125, -1.316497802734375, -1.2513427734375, -1.186187744140625, -1.12103271484375, -1.055877685546875, -0.99072265625, -0.925567626953125, -0.86041259765625, -0.795257568359375, -0.7301025390625, -0.664947509765625, -0.59979248046875, -0.534637451171875, -0.469482421875, -0.404327392578125, -0.33917236328125, -0.274017333984375, -0.2088623046875, -0.143707275390625, -0.07855224609375, -0.013397216796875, 0.0517578125, 0.116912841796875, 0.18206787109375, 0.247222900390625, 0.3123779296875, 0.377532958984375, 0.44268798828125, 0.507843017578125, 0.572998046875, 0.638153076171875, 0.70330810546875, 0.768463134765625, 0.8336181640625, 0.898773193359375, 0.96392822265625, 1.029083251953125, 1.09423828125, 1.159393310546875, 1.22454833984375, 1.289703369140625, 1.3548583984375, 1.420013427734375, 1.48516845703125, 1.550323486328125, 1.615478515625, 1.680633544921875, 1.74578857421875, 1.810943603515625, 1.8760986328125, 1.941253662109375, 2.00640869140625, 2.071563720703125, 2.13671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 24.0, 53.0, 84.0, 193.0, 438.0, 1277.0, 4782.0, 29371.0, 801387.0, 3265023.0, 80535.0, 8554.0, 1731.0, 472.0, 163.0, 75.0, 43.0, 16.0, 12.0, 8.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.26885986328125, -2.1666259765625, -2.06439208984375, -1.962158203125, -1.85992431640625, -1.7576904296875, -1.65545654296875, -1.55322265625, -1.45098876953125, -1.3487548828125, -1.24652099609375, -1.144287109375, -1.04205322265625, -0.9398193359375, -0.83758544921875, -0.7353515625, -0.63311767578125, -0.5308837890625, -0.42864990234375, -0.326416015625, -0.22418212890625, -0.1219482421875, -0.01971435546875, 0.08251953125, 0.18475341796875, 0.2869873046875, 0.38922119140625, 0.491455078125, 0.59368896484375, 0.6959228515625, 0.79815673828125, 0.900390625, 1.00262451171875, 1.1048583984375, 1.20709228515625, 1.309326171875, 1.41156005859375, 1.5137939453125, 1.61602783203125, 1.71826171875, 1.82049560546875, 1.9227294921875, 2.02496337890625, 2.127197265625, 2.22943115234375, 2.3316650390625, 2.43389892578125, 2.5361328125, 2.63836669921875, 2.7406005859375, 2.84283447265625, 2.945068359375, 3.04730224609375, 3.1495361328125, 3.25177001953125, 3.35400390625, 3.45623779296875, 3.5584716796875, 3.66070556640625, 3.762939453125, 3.86517333984375, 3.9674072265625, 4.06964111328125, 4.171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 9.0, 25.0, 43.0, 55.0, 96.0, 147.0, 290.0, 540.0, 859.0, 793.0, 479.0, 296.0, 169.0, 91.0, 52.0, 23.0, 32.0, 14.0, 8.0, 12.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.427734375, -3.349639892578125, -3.27154541015625, -3.193450927734375, -3.1153564453125, -3.037261962890625, -2.95916748046875, -2.881072998046875, -2.802978515625, -2.724884033203125, -2.64678955078125, -2.568695068359375, -2.4906005859375, -2.412506103515625, -2.33441162109375, -2.256317138671875, -2.17822265625, -2.100128173828125, -2.02203369140625, -1.943939208984375, -1.8658447265625, -1.787750244140625, -1.70965576171875, -1.631561279296875, -1.553466796875, -1.475372314453125, -1.39727783203125, -1.319183349609375, -1.2410888671875, -1.162994384765625, -1.08489990234375, -1.006805419921875, -0.9287109375, -0.850616455078125, -0.77252197265625, -0.694427490234375, -0.6163330078125, -0.538238525390625, -0.46014404296875, -0.382049560546875, -0.303955078125, -0.225860595703125, -0.14776611328125, -0.069671630859375, 0.0084228515625, 0.086517333984375, 0.16461181640625, 0.242706298828125, 0.32080078125, 0.398895263671875, 0.47698974609375, 0.555084228515625, 0.6331787109375, 0.711273193359375, 0.78936767578125, 0.867462158203125, 0.945556640625, 1.023651123046875, 1.10174560546875, 1.179840087890625, 1.2579345703125, 1.336029052734375, 1.41412353515625, 1.492218017578125, 1.5703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 16.0, 20.0, 58.0, 91.0, 182.0, 193.0, 186.0, 116.0, 44.0, 35.0, 10.0, 5.0, 6.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.719686508178711, -15.100394248962402, -14.481101989746094, -13.861809730529785, -13.242517471313477, -12.623225212097168, -12.00393295288086, -11.38464069366455, -10.765348434448242, -10.146056175231934, -9.526763916015625, -8.907471656799316, -8.288179397583008, -7.668887138366699, -7.049594879150391, -6.430302619934082, -5.811010360717773, -5.191718101501465, -4.572425842285156, -3.9531335830688477, -3.333841323852539, -2.7145490646362305, -2.095256805419922, -1.4759645462036133, -0.8566722869873047, -0.2373800277709961, 0.3819122314453125, 1.001204490661621, 1.6204967498779297, 2.2397890090942383, 2.859081268310547, 3.4783735275268555, 4.097663879394531, 4.71695613861084, 5.336248397827148, 5.955540657043457, 6.574832916259766, 7.194125175476074, 7.813417434692383, 8.432709693908691, 9.052001953125, 9.671294212341309, 10.290586471557617, 10.909878730773926, 11.529170989990234, 12.148463249206543, 12.767755508422852, 13.38704776763916, 14.006340026855469, 14.625632286071777, 15.244924545288086, 15.864216804504395, 16.483509063720703, 17.102802276611328, 17.72209358215332, 18.341384887695312, 18.960678100585938, 19.579971313476562, 20.199262619018555, 20.818553924560547, 21.437847137451172, 22.057140350341797, 22.67643165588379, 23.29572296142578, 23.915016174316406]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 3.0, 9.0, 14.0, 21.0, 24.0, 23.0, 25.0, 36.0, 51.0, 60.0, 47.0, 51.0, 60.0, 73.0, 56.0, 64.0, 63.0, 52.0, 55.0, 41.0, 39.0, 24.0, 31.0, 16.0, 14.0, 9.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.317985534667969, -11.934821128845215, -11.551656723022461, -11.168492317199707, -10.785327911376953, -10.402162551879883, -10.018998146057129, -9.635833740234375, -9.252669334411621, -8.869504928588867, -8.486340522766113, -8.10317611694336, -7.720011234283447, -7.336846828460693, -6.953681945800781, -6.570517539978027, -6.187353134155273, -5.8041887283325195, -5.421024322509766, -5.0378594398498535, -4.6546950340271, -4.271530628204346, -3.8883659839630127, -3.5052013397216797, -3.122036933898926, -2.738872528076172, -2.355707883834839, -1.9725433588027954, -1.589378833770752, -1.2062143087387085, -0.823049783706665, -0.43988513946533203, -0.056720733642578125, 0.32644379138946533, 0.7096083164215088, 1.0927728414535522, 1.4759373664855957, 1.8591018915176392, 2.2422664165496826, 2.6254310607910156, 3.0085954666137695, 3.3917598724365234, 3.7749245166778564, 4.1580891609191895, 4.541253566741943, 4.924417972564697, 5.307582855224609, 5.690747261047363, 6.073911666870117, 6.457076072692871, 6.840240478515625, 7.223405361175537, 7.606569766998291, 7.989734172821045, 8.372899055480957, 8.756063461303711, 9.139227867126465, 9.522392272949219, 9.905556678771973, 10.288721084594727, 10.671886444091797, 11.05505084991455, 11.438215255737305, 11.821379661560059, 12.204544067382812]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 2.0, 6.0, 13.0, 9.0, 30.0, 39.0, 66.0, 118.0, 435.0, 2391.0, 28292.0, 821437.0, 186474.0, 7727.0, 1050.0, 259.0, 79.0, 46.0, 22.0, 13.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.39605712890625, -5.1866455078125, -4.97723388671875, -4.767822265625, -4.55841064453125, -4.3489990234375, -4.13958740234375, -3.93017578125, -3.72076416015625, -3.5113525390625, -3.30194091796875, -3.092529296875, -2.88311767578125, -2.6737060546875, -2.46429443359375, -2.2548828125, -2.04547119140625, -1.8360595703125, -1.62664794921875, -1.417236328125, -1.20782470703125, -0.9984130859375, -0.78900146484375, -0.57958984375, -0.37017822265625, -0.1607666015625, 0.04864501953125, 0.258056640625, 0.46746826171875, 0.6768798828125, 0.88629150390625, 1.095703125, 1.30511474609375, 1.5145263671875, 1.72393798828125, 1.933349609375, 2.14276123046875, 2.3521728515625, 2.56158447265625, 2.77099609375, 2.98040771484375, 3.1898193359375, 3.39923095703125, 3.608642578125, 3.81805419921875, 4.0274658203125, 4.23687744140625, 4.4462890625, 4.65570068359375, 4.8651123046875, 5.07452392578125, 5.283935546875, 5.49334716796875, 5.7027587890625, 5.91217041015625, 6.12158203125, 6.33099365234375, 6.5404052734375, 6.74981689453125, 6.959228515625, 7.16864013671875, 7.3780517578125, 7.58746337890625, 7.796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 6.0, 14.0, 18.0, 14.0, 24.0, 29.0, 31.0, 45.0, 68.0, 63.0, 79.0, 58.0, 73.0, 82.0, 62.0, 61.0, 49.0, 44.0, 37.0, 44.0, 28.0, 12.0, 11.0, 14.0, 10.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7353515625, -1.6913299560546875, -1.647308349609375, -1.6032867431640625, -1.55926513671875, -1.5152435302734375, -1.471221923828125, -1.4272003173828125, -1.3831787109375, -1.3391571044921875, -1.295135498046875, -1.2511138916015625, -1.20709228515625, -1.1630706787109375, -1.119049072265625, -1.0750274658203125, -1.031005859375, -0.9869842529296875, -0.942962646484375, -0.8989410400390625, -0.85491943359375, -0.8108978271484375, -0.766876220703125, -0.7228546142578125, -0.6788330078125, -0.6348114013671875, -0.590789794921875, -0.5467681884765625, -0.50274658203125, -0.4587249755859375, -0.414703369140625, -0.3706817626953125, -0.32666015625, -0.2826385498046875, -0.238616943359375, -0.1945953369140625, -0.15057373046875, -0.1065521240234375, -0.062530517578125, -0.0185089111328125, 0.0255126953125, 0.0695343017578125, 0.113555908203125, 0.1575775146484375, 0.20159912109375, 0.2456207275390625, 0.289642333984375, 0.3336639404296875, 0.377685546875, 0.4217071533203125, 0.465728759765625, 0.5097503662109375, 0.55377197265625, 0.5977935791015625, 0.641815185546875, 0.6858367919921875, 0.7298583984375, 0.7738800048828125, 0.817901611328125, 0.8619232177734375, 0.90594482421875, 0.9499664306640625, 0.993988037109375, 1.0380096435546875, 1.08203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 4.0, 14.0, 20.0, 34.0, 51.0, 92.0, 185.0, 304.0, 693.0, 1999.0, 10258.0, 135228.0, 839750.0, 51924.0, 5473.0, 1386.0, 477.0, 262.0, 137.0, 77.0, 46.0, 26.0, 21.0, 12.0, 9.0, 9.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.390625, -6.22393798828125, -6.0572509765625, -5.89056396484375, -5.723876953125, -5.55718994140625, -5.3905029296875, -5.22381591796875, -5.05712890625, -4.89044189453125, -4.7237548828125, -4.55706787109375, -4.390380859375, -4.22369384765625, -4.0570068359375, -3.89031982421875, -3.7236328125, -3.55694580078125, -3.3902587890625, -3.22357177734375, -3.056884765625, -2.89019775390625, -2.7235107421875, -2.55682373046875, -2.39013671875, -2.22344970703125, -2.0567626953125, -1.89007568359375, -1.723388671875, -1.55670166015625, -1.3900146484375, -1.22332763671875, -1.056640625, -0.88995361328125, -0.7232666015625, -0.55657958984375, -0.389892578125, -0.22320556640625, -0.0565185546875, 0.11016845703125, 0.27685546875, 0.44354248046875, 0.6102294921875, 0.77691650390625, 0.943603515625, 1.11029052734375, 1.2769775390625, 1.44366455078125, 1.6103515625, 1.77703857421875, 1.9437255859375, 2.11041259765625, 2.277099609375, 2.44378662109375, 2.6104736328125, 2.77716064453125, 2.94384765625, 3.11053466796875, 3.2772216796875, 3.44390869140625, 3.610595703125, 3.77728271484375, 3.9439697265625, 4.11065673828125, 4.27734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 6.0, 4.0, 1.0, 19.0, 24.0, 14.0, 29.0, 31.0, 37.0, 46.0, 42.0, 54.0, 62.0, 58.0, 53.0, 65.0, 61.0, 62.0, 52.0, 52.0, 31.0, 47.0, 32.0, 27.0, 19.0, 10.0, 13.0, 10.0, 3.0, 10.0, 3.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.88671875, -4.73272705078125, -4.5787353515625, -4.42474365234375, -4.270751953125, -4.11676025390625, -3.9627685546875, -3.80877685546875, -3.65478515625, -3.50079345703125, -3.3468017578125, -3.19281005859375, -3.038818359375, -2.88482666015625, -2.7308349609375, -2.57684326171875, -2.4228515625, -2.26885986328125, -2.1148681640625, -1.96087646484375, -1.806884765625, -1.65289306640625, -1.4989013671875, -1.34490966796875, -1.19091796875, -1.03692626953125, -0.8829345703125, -0.72894287109375, -0.574951171875, -0.42095947265625, -0.2669677734375, -0.11297607421875, 0.041015625, 0.19500732421875, 0.3489990234375, 0.50299072265625, 0.656982421875, 0.81097412109375, 0.9649658203125, 1.11895751953125, 1.27294921875, 1.42694091796875, 1.5809326171875, 1.73492431640625, 1.888916015625, 2.04290771484375, 2.1968994140625, 2.35089111328125, 2.5048828125, 2.65887451171875, 2.8128662109375, 2.96685791015625, 3.120849609375, 3.27484130859375, 3.4288330078125, 3.58282470703125, 3.73681640625, 3.89080810546875, 4.0447998046875, 4.19879150390625, 4.352783203125, 4.50677490234375, 4.6607666015625, 4.81475830078125, 4.96875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 10.0, 19.0, 24.0, 46.0, 96.0, 202.0, 580.0, 2460.0, 22754.0, 852991.0, 160354.0, 7236.0, 1187.0, 309.0, 140.0, 61.0, 18.0, 19.0, 11.0, 4.0, 7.0, 11.0, 0.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.296875, -2.211090087890625, -2.12530517578125, -2.039520263671875, -1.9537353515625, -1.867950439453125, -1.78216552734375, -1.696380615234375, -1.610595703125, -1.524810791015625, -1.43902587890625, -1.353240966796875, -1.2674560546875, -1.181671142578125, -1.09588623046875, -1.010101318359375, -0.92431640625, -0.838531494140625, -0.75274658203125, -0.666961669921875, -0.5811767578125, -0.495391845703125, -0.40960693359375, -0.323822021484375, -0.238037109375, -0.152252197265625, -0.06646728515625, 0.019317626953125, 0.1051025390625, 0.190887451171875, 0.27667236328125, 0.362457275390625, 0.4482421875, 0.534027099609375, 0.61981201171875, 0.705596923828125, 0.7913818359375, 0.877166748046875, 0.96295166015625, 1.048736572265625, 1.134521484375, 1.220306396484375, 1.30609130859375, 1.391876220703125, 1.4776611328125, 1.563446044921875, 1.64923095703125, 1.735015869140625, 1.82080078125, 1.906585693359375, 1.99237060546875, 2.078155517578125, 2.1639404296875, 2.249725341796875, 2.33551025390625, 2.421295166015625, 2.507080078125, 2.592864990234375, 2.67864990234375, 2.764434814453125, 2.8502197265625, 2.936004638671875, 3.02178955078125, 3.107574462890625, 3.193359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 18.0, 22.0, 42.0, 74.0, 111.0, 221.0, 190.0, 90.0, 49.0, 46.0, 27.0, 26.0, 19.0, 10.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005249977111816406, -0.0005117915570735931, -0.0004985854029655457, -0.00048537924885749817, -0.0004721730947494507, -0.0004589669406414032, -0.0004457607865333557, -0.00043255463242530823, -0.00041934847831726074, -0.00040614232420921326, -0.00039293617010116577, -0.0003797300159931183, -0.0003665238618850708, -0.0003533177077770233, -0.00034011155366897583, -0.00032690539956092834, -0.00031369924545288086, -0.0003004930913448334, -0.0002872869372367859, -0.0002740807831287384, -0.0002608746290206909, -0.00024766847491264343, -0.00023446232080459595, -0.00022125616669654846, -0.00020805001258850098, -0.0001948438584804535, -0.000181637704372406, -0.00016843155026435852, -0.00015522539615631104, -0.00014201924204826355, -0.00012881308794021606, -0.00011560693383216858, -0.0001024007797241211, -8.919462561607361e-05, -7.598847150802612e-05, -6.278231739997864e-05, -4.957616329193115e-05, -3.637000918388367e-05, -2.316385507583618e-05, -9.957700967788696e-06, 3.248453140258789e-06, 1.6454607248306274e-05, 2.966076135635376e-05, 4.2866915464401245e-05, 5.607306957244873e-05, 6.927922368049622e-05, 8.24853777885437e-05, 9.569153189659119e-05, 0.00010889768600463867, 0.00012210384011268616, 0.00013530999422073364, 0.00014851614832878113, 0.0001617223024368286, 0.0001749284565448761, 0.00018813461065292358, 0.00020134076476097107, 0.00021454691886901855, 0.00022775307297706604, 0.00024095922708511353, 0.000254165381193161, 0.0002673715353012085, 0.000280577689409256, 0.00029378384351730347, 0.00030698999762535095, 0.00032019615173339844]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 8.0, 10.0, 8.0, 15.0, 14.0, 19.0, 29.0, 42.0, 70.0, 130.0, 225.0, 371.0, 781.0, 1759.0, 4782.0, 18414.0, 124201.0, 754798.0, 116854.0, 17966.0, 4699.0, 1720.0, 753.0, 355.0, 187.0, 114.0, 82.0, 35.0, 31.0, 26.0, 13.0, 13.0, 8.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.482421875, -1.4394378662109375, -1.396453857421875, -1.3534698486328125, -1.31048583984375, -1.2675018310546875, -1.224517822265625, -1.1815338134765625, -1.1385498046875, -1.0955657958984375, -1.052581787109375, -1.0095977783203125, -0.96661376953125, -0.9236297607421875, -0.880645751953125, -0.8376617431640625, -0.794677734375, -0.7516937255859375, -0.708709716796875, -0.6657257080078125, -0.62274169921875, -0.5797576904296875, -0.536773681640625, -0.4937896728515625, -0.4508056640625, -0.4078216552734375, -0.364837646484375, -0.3218536376953125, -0.27886962890625, -0.2358856201171875, -0.192901611328125, -0.1499176025390625, -0.10693359375, -0.0639495849609375, -0.020965576171875, 0.0220184326171875, 0.06500244140625, 0.1079864501953125, 0.150970458984375, 0.1939544677734375, 0.2369384765625, 0.2799224853515625, 0.322906494140625, 0.3658905029296875, 0.40887451171875, 0.4518585205078125, 0.494842529296875, 0.5378265380859375, 0.580810546875, 0.6237945556640625, 0.666778564453125, 0.7097625732421875, 0.75274658203125, 0.7957305908203125, 0.838714599609375, 0.8816986083984375, 0.9246826171875, 0.9676666259765625, 1.010650634765625, 1.0536346435546875, 1.09661865234375, 1.1396026611328125, 1.182586669921875, 1.2255706787109375, 1.2685546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 3.0, 9.0, 17.0, 24.0, 42.0, 64.0, 73.0, 124.0, 144.0, 147.0, 95.0, 65.0, 55.0, 28.0, 30.0, 15.0, 9.0, 11.0, 12.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.1813812255859375, -1.127410888671875, -1.0734405517578125, -1.01947021484375, -0.9654998779296875, -0.911529541015625, -0.8575592041015625, -0.8035888671875, -0.7496185302734375, -0.695648193359375, -0.6416778564453125, -0.58770751953125, -0.5337371826171875, -0.479766845703125, -0.4257965087890625, -0.371826171875, -0.3178558349609375, -0.263885498046875, -0.2099151611328125, -0.15594482421875, -0.1019744873046875, -0.048004150390625, 0.0059661865234375, 0.0599365234375, 0.1139068603515625, 0.167877197265625, 0.2218475341796875, 0.27581787109375, 0.3297882080078125, 0.383758544921875, 0.4377288818359375, 0.49169921875, 0.5456695556640625, 0.599639892578125, 0.6536102294921875, 0.70758056640625, 0.7615509033203125, 0.815521240234375, 0.8694915771484375, 0.9234619140625, 0.9774322509765625, 1.031402587890625, 1.0853729248046875, 1.13934326171875, 1.1933135986328125, 1.247283935546875, 1.3012542724609375, 1.355224609375, 1.4091949462890625, 1.463165283203125, 1.5171356201171875, 1.57110595703125, 1.6250762939453125, 1.679046630859375, 1.7330169677734375, 1.7869873046875, 1.8409576416015625, 1.894927978515625, 1.9488983154296875, 2.00286865234375, 2.0568389892578125, 2.110809326171875, 2.1647796630859375, 2.21875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 14.0, 88.0, 226.0, 381.0, 168.0, 76.0, 18.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.920076370239258, -28.51514434814453, -27.110210418701172, -25.705276489257812, -24.300344467163086, -22.89541244506836, -21.490478515625, -20.08554458618164, -18.680612564086914, -17.275680541992188, -15.870746612548828, -14.465813636779785, -13.060880661010742, -11.6559476852417, -10.251014709472656, -8.846081733703613, -7.44114875793457, -6.036215782165527, -4.631282806396484, -3.2263498306274414, -1.8214168548583984, -0.41648387908935547, 0.9884490966796875, 2.3933820724487305, 3.7983150482177734, 5.203248023986816, 6.608180999755859, 8.013113975524902, 9.418046951293945, 10.822979927062988, 12.227912902832031, 13.632845878601074, 15.03778076171875, 16.44271469116211, 17.847646713256836, 19.252578735351562, 20.657512664794922, 22.06244659423828, 23.467378616333008, 24.872310638427734, 26.277244567871094, 27.682178497314453, 29.08711051940918, 30.492042541503906, 31.896976470947266, 33.301910400390625, 34.70684051513672, 36.11177444458008, 37.51670837402344, 38.9216423034668, 40.326576232910156, 41.73150634765625, 43.13644027709961, 44.54137420654297, 45.94630432128906, 47.35123825073242, 48.75617218017578, 50.16110610961914, 51.5660400390625, 52.970970153808594, 54.37590408325195, 55.78083801269531, 57.185768127441406, 58.590702056884766, 59.995635986328125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 9.0, 6.0, 9.0, 18.0, 13.0, 28.0, 16.0, 27.0, 31.0, 34.0, 40.0, 45.0, 52.0, 59.0, 59.0, 81.0, 67.0, 58.0, 54.0, 51.0, 44.0, 30.0, 32.0, 22.0, 18.0, 14.0, 12.0, 15.0, 18.0, 8.0, 3.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.2938175201416, -16.683446884155273, -16.073078155517578, -15.46270751953125, -14.852337837219238, -14.241968154907227, -13.631597518920898, -13.021227836608887, -12.410858154296875, -11.800488471984863, -11.190118789672852, -10.579748153686523, -9.969378471374512, -9.3590087890625, -8.748638153076172, -8.13826847076416, -7.527898788452148, -6.917529106140137, -6.307158946990967, -5.696788787841797, -5.086419105529785, -4.476049423217773, -3.8656792640686035, -3.2553091049194336, -2.644939422607422, -2.034569501876831, -1.4241995811462402, -0.8138296604156494, -0.2034597396850586, 0.4069101810455322, 1.017280101776123, 1.627650260925293, 2.2380218505859375, 2.8483917713165283, 3.458761692047119, 4.069131851196289, 4.679501533508301, 5.2898712158203125, 5.900241374969482, 6.510611534118652, 7.120981216430664, 7.731350898742676, 8.341720581054688, 8.952091217041016, 9.562460899353027, 10.172830581665039, 10.783201217651367, 11.393570899963379, 12.00394058227539, 12.614310264587402, 13.224679946899414, 13.835050582885742, 14.445420265197754, 15.055789947509766, 15.666160583496094, 16.276531219482422, 16.886899948120117, 17.497270584106445, 18.10763931274414, 18.71800994873047, 19.328380584716797, 19.938749313354492, 20.54911994934082, 21.159488677978516, 21.769859313964844]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 5.0, 5.0, 5.0, 6.0, 4.0, 5.0, 10.0, 11.0, 25.0, 38.0, 69.0, 111.0, 428.0, 3308.0, 213196.0, 3949524.0, 25038.0, 1718.0, 463.0, 143.0, 66.0, 31.0, 21.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.86328125, -7.697021484375, -7.53076171875, -7.364501953125, -7.1982421875, -7.031982421875, -6.86572265625, -6.699462890625, -6.533203125, -6.366943359375, -6.20068359375, -6.034423828125, -5.8681640625, -5.701904296875, -5.53564453125, -5.369384765625, -5.203125, -5.036865234375, -4.87060546875, -4.704345703125, -4.5380859375, -4.371826171875, -4.20556640625, -4.039306640625, -3.873046875, -3.706787109375, -3.54052734375, -3.374267578125, -3.2080078125, -3.041748046875, -2.87548828125, -2.709228515625, -2.54296875, -2.376708984375, -2.21044921875, -2.044189453125, -1.8779296875, -1.711669921875, -1.54541015625, -1.379150390625, -1.212890625, -1.046630859375, -0.88037109375, -0.714111328125, -0.5478515625, -0.381591796875, -0.21533203125, -0.049072265625, 0.1171875, 0.283447265625, 0.44970703125, 0.615966796875, 0.7822265625, 0.948486328125, 1.11474609375, 1.281005859375, 1.447265625, 1.613525390625, 1.77978515625, 1.946044921875, 2.1123046875, 2.278564453125, 2.44482421875, 2.611083984375, 2.77734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 8.0, 14.0, 17.0, 44.0, 69.0, 102.0, 124.0, 126.0, 133.0, 117.0, 83.0, 67.0, 51.0, 23.0, 17.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.775390625, -1.701263427734375, -1.62713623046875, -1.553009033203125, -1.4788818359375, -1.404754638671875, -1.33062744140625, -1.256500244140625, -1.182373046875, -1.108245849609375, -1.03411865234375, -0.959991455078125, -0.8858642578125, -0.811737060546875, -0.73760986328125, -0.663482666015625, -0.58935546875, -0.515228271484375, -0.44110107421875, -0.366973876953125, -0.2928466796875, -0.218719482421875, -0.14459228515625, -0.070465087890625, 0.003662109375, 0.077789306640625, 0.15191650390625, 0.226043701171875, 0.3001708984375, 0.374298095703125, 0.44842529296875, 0.522552490234375, 0.5966796875, 0.670806884765625, 0.74493408203125, 0.819061279296875, 0.8931884765625, 0.967315673828125, 1.04144287109375, 1.115570068359375, 1.189697265625, 1.263824462890625, 1.33795166015625, 1.412078857421875, 1.4862060546875, 1.560333251953125, 1.63446044921875, 1.708587646484375, 1.78271484375, 1.856842041015625, 1.93096923828125, 2.005096435546875, 2.0792236328125, 2.153350830078125, 2.22747802734375, 2.301605224609375, 2.375732421875, 2.449859619140625, 2.52398681640625, 2.598114013671875, 2.6722412109375, 2.746368408203125, 2.82049560546875, 2.894622802734375, 2.96875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 7.0, 2.0, 4.0, 7.0, 22.0, 22.0, 42.0, 49.0, 79.0, 134.0, 217.0, 427.0, 959.0, 2772.0, 11038.0, 57888.0, 649289.0, 3183597.0, 248447.0, 29060.0, 6552.0, 2101.0, 788.0, 323.0, 152.0, 105.0, 59.0, 41.0, 20.0, 21.0, 10.0, 9.0, 7.0, 9.0, 5.0, 0.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.189453125, -2.119598388671875, -2.04974365234375, -1.979888916015625, -1.9100341796875, -1.840179443359375, -1.77032470703125, -1.700469970703125, -1.630615234375, -1.560760498046875, -1.49090576171875, -1.421051025390625, -1.3511962890625, -1.281341552734375, -1.21148681640625, -1.141632080078125, -1.07177734375, -1.001922607421875, -0.93206787109375, -0.862213134765625, -0.7923583984375, -0.722503662109375, -0.65264892578125, -0.582794189453125, -0.512939453125, -0.443084716796875, -0.37322998046875, -0.303375244140625, -0.2335205078125, -0.163665771484375, -0.09381103515625, -0.023956298828125, 0.0458984375, 0.115753173828125, 0.18560791015625, 0.255462646484375, 0.3253173828125, 0.395172119140625, 0.46502685546875, 0.534881591796875, 0.604736328125, 0.674591064453125, 0.74444580078125, 0.814300537109375, 0.8841552734375, 0.954010009765625, 1.02386474609375, 1.093719482421875, 1.16357421875, 1.233428955078125, 1.30328369140625, 1.373138427734375, 1.4429931640625, 1.512847900390625, 1.58270263671875, 1.652557373046875, 1.722412109375, 1.792266845703125, 1.86212158203125, 1.931976318359375, 2.0018310546875, 2.071685791015625, 2.14154052734375, 2.211395263671875, 2.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 8.0, 10.0, 9.0, 17.0, 22.0, 32.0, 26.0, 39.0, 66.0, 94.0, 160.0, 222.0, 306.0, 486.0, 626.0, 606.0, 451.0, 318.0, 180.0, 125.0, 65.0, 59.0, 51.0, 25.0, 17.0, 17.0, 9.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.361328125, -2.291656494140625, -2.22198486328125, -2.152313232421875, -2.0826416015625, -2.012969970703125, -1.94329833984375, -1.873626708984375, -1.803955078125, -1.734283447265625, -1.66461181640625, -1.594940185546875, -1.5252685546875, -1.455596923828125, -1.38592529296875, -1.316253662109375, -1.24658203125, -1.176910400390625, -1.10723876953125, -1.037567138671875, -0.9678955078125, -0.898223876953125, -0.82855224609375, -0.758880615234375, -0.689208984375, -0.619537353515625, -0.54986572265625, -0.480194091796875, -0.4105224609375, -0.340850830078125, -0.27117919921875, -0.201507568359375, -0.1318359375, -0.062164306640625, 0.00750732421875, 0.077178955078125, 0.1468505859375, 0.216522216796875, 0.28619384765625, 0.355865478515625, 0.425537109375, 0.495208740234375, 0.56488037109375, 0.634552001953125, 0.7042236328125, 0.773895263671875, 0.84356689453125, 0.913238525390625, 0.98291015625, 1.052581787109375, 1.12225341796875, 1.191925048828125, 1.2615966796875, 1.331268310546875, 1.40093994140625, 1.470611572265625, 1.540283203125, 1.609954833984375, 1.67962646484375, 1.749298095703125, 1.8189697265625, 1.888641357421875, 1.95831298828125, 2.027984619140625, 2.09765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 16.0, 35.0, 115.0, 318.0, 337.0, 121.0, 34.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.05979537963867, -55.604862213134766, -54.14992904663086, -52.69499969482422, -51.24006652832031, -49.785133361816406, -48.3302001953125, -46.875267028808594, -45.42033386230469, -43.96540069580078, -42.510467529296875, -41.05553436279297, -39.60060501098633, -38.14567184448242, -36.690738677978516, -35.23580551147461, -33.78087615966797, -32.32594299316406, -30.87101173400879, -29.416078567504883, -27.96114730834961, -26.506214141845703, -25.051280975341797, -23.59634780883789, -22.141416549682617, -20.68648338317871, -19.231552124023438, -17.77661895751953, -16.321685791015625, -14.866754531860352, -13.411821365356445, -11.956889152526855, -10.501956939697266, -9.047024726867676, -7.592092037200928, -6.13715934753418, -4.68222713470459, -3.227294921875, -1.7723617553710938, -0.3174295425415039, 1.137502670288086, 2.592435121536255, 4.047367572784424, 5.502300262451172, 6.957232475280762, 8.412164688110352, 9.867097854614258, 11.322030067443848, 12.776962280273438, 14.231894493103027, 15.686826705932617, 17.141759872436523, 18.596691131591797, 20.051624298095703, 21.50655746459961, 22.961490631103516, 24.41642189025879, 25.871355056762695, 27.32628631591797, 28.781219482421875, 30.23615264892578, 31.691083908081055, 33.146018981933594, 34.600948333740234, 36.05588150024414]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 8.0, 13.0, 16.0, 25.0, 27.0, 43.0, 40.0, 48.0, 61.0, 63.0, 57.0, 64.0, 62.0, 61.0, 65.0, 60.0, 60.0, 46.0, 32.0, 36.0, 20.0, 20.0, 13.0, 8.0, 15.0, 9.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-20.59213638305664, -20.09067153930664, -19.589208602905273, -19.087743759155273, -18.586280822753906, -18.084815979003906, -17.583351135253906, -17.08188819885254, -16.58042335510254, -16.07895851135254, -15.577495574951172, -15.076030731201172, -14.574566841125488, -14.073102951049805, -13.571638107299805, -13.070174217224121, -12.568710327148438, -12.067246437072754, -11.56578254699707, -11.06431770324707, -10.562853813171387, -10.061389923095703, -9.559925079345703, -9.05846118927002, -8.556997299194336, -8.055533409118652, -7.5540690422058105, -7.052604675292969, -6.551140785217285, -6.049676895141602, -5.54821252822876, -5.046748161315918, -4.545284271240234, -4.043820381164551, -3.542356014251709, -3.0408918857574463, -2.5394277572631836, -2.037963628768921, -1.5364995002746582, -1.0350353717803955, -0.5335712432861328, -0.03210711479187012, 0.4693570137023926, 0.9708211421966553, 1.472285270690918, 1.9737493991851807, 2.4752135276794434, 2.976677656173706, 3.4781417846679688, 3.9796059131622314, 4.481070041656494, 4.982534408569336, 5.4839982986450195, 5.985462188720703, 6.486926555633545, 6.988390922546387, 7.48985481262207, 7.991318702697754, 8.492782592773438, 8.994247436523438, 9.495711326599121, 9.997175216674805, 10.498640060424805, 11.000103950500488, 11.501567840576172]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 11.0, 12.0, 18.0, 30.0, 37.0, 89.0, 202.0, 819.0, 5754.0, 82177.0, 822973.0, 126931.0, 7918.0, 1060.0, 279.0, 96.0, 39.0, 27.0, 19.0, 19.0, 8.0, 5.0, 3.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.66290283203125, -4.4937744140625, -4.32464599609375, -4.155517578125, -3.98638916015625, -3.8172607421875, -3.64813232421875, -3.47900390625, -3.30987548828125, -3.1407470703125, -2.97161865234375, -2.802490234375, -2.63336181640625, -2.4642333984375, -2.29510498046875, -2.1259765625, -1.95684814453125, -1.7877197265625, -1.61859130859375, -1.449462890625, -1.28033447265625, -1.1112060546875, -0.94207763671875, -0.77294921875, -0.60382080078125, -0.4346923828125, -0.26556396484375, -0.096435546875, 0.07269287109375, 0.2418212890625, 0.41094970703125, 0.580078125, 0.74920654296875, 0.9183349609375, 1.08746337890625, 1.256591796875, 1.42572021484375, 1.5948486328125, 1.76397705078125, 1.93310546875, 2.10223388671875, 2.2713623046875, 2.44049072265625, 2.609619140625, 2.77874755859375, 2.9478759765625, 3.11700439453125, 3.2861328125, 3.45526123046875, 3.6243896484375, 3.79351806640625, 3.962646484375, 4.13177490234375, 4.3009033203125, 4.47003173828125, 4.63916015625, 4.80828857421875, 4.9774169921875, 5.14654541015625, 5.315673828125, 5.48480224609375, 5.6539306640625, 5.82305908203125, 5.9921875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 12.0, 27.0, 32.0, 33.0, 60.0, 68.0, 71.0, 83.0, 93.0, 78.0, 78.0, 76.0, 69.0, 52.0, 49.0, 37.0, 20.0, 24.0, 9.0, 5.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6385650634765625, -1.590606689453125, -1.5426483154296875, -1.49468994140625, -1.4467315673828125, -1.398773193359375, -1.3508148193359375, -1.3028564453125, -1.2548980712890625, -1.206939697265625, -1.1589813232421875, -1.11102294921875, -1.0630645751953125, -1.015106201171875, -0.9671478271484375, -0.919189453125, -0.8712310791015625, -0.823272705078125, -0.7753143310546875, -0.72735595703125, -0.6793975830078125, -0.631439208984375, -0.5834808349609375, -0.5355224609375, -0.4875640869140625, -0.439605712890625, -0.3916473388671875, -0.34368896484375, -0.2957305908203125, -0.247772216796875, -0.1998138427734375, -0.15185546875, -0.1038970947265625, -0.055938720703125, -0.0079803466796875, 0.03997802734375, 0.0879364013671875, 0.135894775390625, 0.1838531494140625, 0.2318115234375, 0.2797698974609375, 0.327728271484375, 0.3756866455078125, 0.42364501953125, 0.4716033935546875, 0.519561767578125, 0.5675201416015625, 0.615478515625, 0.6634368896484375, 0.711395263671875, 0.7593536376953125, 0.80731201171875, 0.8552703857421875, 0.903228759765625, 0.9511871337890625, 0.9991455078125, 1.0471038818359375, 1.095062255859375, 1.1430206298828125, 1.19097900390625, 1.2389373779296875, 1.286895751953125, 1.3348541259765625, 1.3828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 4.0, 13.0, 26.0, 35.0, 40.0, 91.0, 146.0, 236.0, 384.0, 791.0, 1651.0, 4734.0, 29154.0, 771028.0, 221497.0, 12909.0, 3212.0, 1206.0, 617.0, 322.0, 177.0, 94.0, 68.0, 27.0, 26.0, 18.0, 11.0, 5.0, 9.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.33984375, -6.15777587890625, -5.9757080078125, -5.79364013671875, -5.611572265625, -5.42950439453125, -5.2474365234375, -5.06536865234375, -4.88330078125, -4.70123291015625, -4.5191650390625, -4.33709716796875, -4.155029296875, -3.97296142578125, -3.7908935546875, -3.60882568359375, -3.4267578125, -3.24468994140625, -3.0626220703125, -2.88055419921875, -2.698486328125, -2.51641845703125, -2.3343505859375, -2.15228271484375, -1.97021484375, -1.78814697265625, -1.6060791015625, -1.42401123046875, -1.241943359375, -1.05987548828125, -0.8778076171875, -0.69573974609375, -0.513671875, -0.33160400390625, -0.1495361328125, 0.03253173828125, 0.214599609375, 0.39666748046875, 0.5787353515625, 0.76080322265625, 0.94287109375, 1.12493896484375, 1.3070068359375, 1.48907470703125, 1.671142578125, 1.85321044921875, 2.0352783203125, 2.21734619140625, 2.3994140625, 2.58148193359375, 2.7635498046875, 2.94561767578125, 3.127685546875, 3.30975341796875, 3.4918212890625, 3.67388916015625, 3.85595703125, 4.03802490234375, 4.2200927734375, 4.40216064453125, 4.584228515625, 4.76629638671875, 4.9483642578125, 5.13043212890625, 5.3125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 7.0, 9.0, 8.0, 8.0, 7.0, 11.0, 16.0, 18.0, 21.0, 28.0, 25.0, 28.0, 37.0, 29.0, 32.0, 40.0, 32.0, 51.0, 47.0, 47.0, 51.0, 48.0, 45.0, 30.0, 40.0, 40.0, 27.0, 23.0, 37.0, 24.0, 21.0, 17.0, 16.0, 15.0, 12.0, 9.0, 6.0, 4.0, 8.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.947265625, -3.83111572265625, -3.7149658203125, -3.59881591796875, -3.482666015625, -3.36651611328125, -3.2503662109375, -3.13421630859375, -3.01806640625, -2.90191650390625, -2.7857666015625, -2.66961669921875, -2.553466796875, -2.43731689453125, -2.3211669921875, -2.20501708984375, -2.0888671875, -1.97271728515625, -1.8565673828125, -1.74041748046875, -1.624267578125, -1.50811767578125, -1.3919677734375, -1.27581787109375, -1.15966796875, -1.04351806640625, -0.9273681640625, -0.81121826171875, -0.695068359375, -0.57891845703125, -0.4627685546875, -0.34661865234375, -0.23046875, -0.11431884765625, 0.0018310546875, 0.11798095703125, 0.234130859375, 0.35028076171875, 0.4664306640625, 0.58258056640625, 0.69873046875, 0.81488037109375, 0.9310302734375, 1.04718017578125, 1.163330078125, 1.27947998046875, 1.3956298828125, 1.51177978515625, 1.6279296875, 1.74407958984375, 1.8602294921875, 1.97637939453125, 2.092529296875, 2.20867919921875, 2.3248291015625, 2.44097900390625, 2.55712890625, 2.67327880859375, 2.7894287109375, 2.90557861328125, 3.021728515625, 3.13787841796875, 3.2540283203125, 3.37017822265625, 3.486328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 9.0, 5.0, 10.0, 10.0, 17.0, 15.0, 38.0, 78.0, 225.0, 851.0, 7660.0, 996169.0, 41257.0, 1668.0, 332.0, 114.0, 38.0, 26.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.7193603515625, -7.509033203125, -7.2987060546875, -7.08837890625, -6.8780517578125, -6.667724609375, -6.4573974609375, -6.2470703125, -6.0367431640625, -5.826416015625, -5.6160888671875, -5.40576171875, -5.1954345703125, -4.985107421875, -4.7747802734375, -4.564453125, -4.3541259765625, -4.143798828125, -3.9334716796875, -3.72314453125, -3.5128173828125, -3.302490234375, -3.0921630859375, -2.8818359375, -2.6715087890625, -2.461181640625, -2.2508544921875, -2.04052734375, -1.8302001953125, -1.619873046875, -1.4095458984375, -1.19921875, -0.9888916015625, -0.778564453125, -0.5682373046875, -0.35791015625, -0.1475830078125, 0.062744140625, 0.2730712890625, 0.4833984375, 0.6937255859375, 0.904052734375, 1.1143798828125, 1.32470703125, 1.5350341796875, 1.745361328125, 1.9556884765625, 2.166015625, 2.3763427734375, 2.586669921875, 2.7969970703125, 3.00732421875, 3.2176513671875, 3.427978515625, 3.6383056640625, 3.8486328125, 4.0589599609375, 4.269287109375, 4.4796142578125, 4.68994140625, 4.9002685546875, 5.110595703125, 5.3209228515625, 5.53125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 6.0, 7.0, 13.0, 22.0, 25.0, 43.0, 73.0, 134.0, 289.0, 146.0, 72.0, 72.0, 39.0, 20.0, 17.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004684925079345703, -0.0004458390176296234, -0.0004231855273246765, -0.0004005320370197296, -0.0003778785467147827, -0.0003552250564098358, -0.0003325715661048889, -0.000309918075799942, -0.0002872645854949951, -0.0002646110951900482, -0.00024195760488510132, -0.00021930411458015442, -0.00019665062427520752, -0.00017399713397026062, -0.00015134364366531372, -0.00012869015336036682, -0.00010603666305541992, -8.338317275047302e-05, -6.072968244552612e-05, -3.8076192140579224e-05, -1.5422701835632324e-05, 7.230788469314575e-06, 2.9884278774261475e-05, 5.2537769079208374e-05, 7.519125938415527e-05, 9.784474968910217e-05, 0.00012049823999404907, 0.00014315173029899597, 0.00016580522060394287, 0.00018845871090888977, 0.00021111220121383667, 0.00023376569151878357, 0.00025641918182373047, 0.00027907267212867737, 0.00030172616243362427, 0.00032437965273857117, 0.00034703314304351807, 0.00036968663334846497, 0.00039234012365341187, 0.00041499361395835876, 0.00043764710426330566, 0.00046030059456825256, 0.00048295408487319946, 0.0005056075751781464, 0.0005282610654830933, 0.0005509145557880402, 0.0005735680460929871, 0.000596221536397934, 0.0006188750267028809, 0.0006415285170078278, 0.0006641820073127747, 0.0006868354976177216, 0.0007094889879226685, 0.0007321424782276154, 0.0007547959685325623, 0.0007774494588375092, 0.0008001029491424561, 0.000822756439447403, 0.0008454099297523499, 0.0008680634200572968, 0.0008907169103622437, 0.0009133704006671906, 0.0009360238909721375, 0.0009586773812770844, 0.0009813308715820312]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 11.0, 6.0, 12.0, 23.0, 19.0, 27.0, 40.0, 75.0, 100.0, 163.0, 314.0, 638.0, 1445.0, 3646.0, 13877.0, 778521.0, 233233.0, 10773.0, 3076.0, 1192.0, 606.0, 279.0, 163.0, 97.0, 52.0, 42.0, 31.0, 15.0, 9.0, 9.0, 8.0, 6.0, 7.0, 8.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.5860595703125, -4.437744140625, -4.2894287109375, -4.14111328125, -3.9927978515625, -3.844482421875, -3.6961669921875, -3.5478515625, -3.3995361328125, -3.251220703125, -3.1029052734375, -2.95458984375, -2.8062744140625, -2.657958984375, -2.5096435546875, -2.361328125, -2.2130126953125, -2.064697265625, -1.9163818359375, -1.76806640625, -1.6197509765625, -1.471435546875, -1.3231201171875, -1.1748046875, -1.0264892578125, -0.878173828125, -0.7298583984375, -0.58154296875, -0.4332275390625, -0.284912109375, -0.1365966796875, 0.01171875, 0.1600341796875, 0.308349609375, 0.4566650390625, 0.60498046875, 0.7532958984375, 0.901611328125, 1.0499267578125, 1.1982421875, 1.3465576171875, 1.494873046875, 1.6431884765625, 1.79150390625, 1.9398193359375, 2.088134765625, 2.2364501953125, 2.384765625, 2.5330810546875, 2.681396484375, 2.8297119140625, 2.97802734375, 3.1263427734375, 3.274658203125, 3.4229736328125, 3.5712890625, 3.7196044921875, 3.867919921875, 4.0162353515625, 4.16455078125, 4.3128662109375, 4.461181640625, 4.6094970703125, 4.7578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 19.0, 24.0, 54.0, 101.0, 143.0, 255.0, 143.0, 78.0, 50.0, 34.0, 10.0, 13.0, 11.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.979217529296875, -2.87445068359375, -2.769683837890625, -2.6649169921875, -2.560150146484375, -2.45538330078125, -2.350616455078125, -2.245849609375, -2.141082763671875, -2.03631591796875, -1.931549072265625, -1.8267822265625, -1.722015380859375, -1.61724853515625, -1.512481689453125, -1.40771484375, -1.302947998046875, -1.19818115234375, -1.093414306640625, -0.9886474609375, -0.883880615234375, -0.77911376953125, -0.674346923828125, -0.569580078125, -0.464813232421875, -0.36004638671875, -0.255279541015625, -0.1505126953125, -0.045745849609375, 0.05902099609375, 0.163787841796875, 0.2685546875, 0.373321533203125, 0.47808837890625, 0.582855224609375, 0.6876220703125, 0.792388916015625, 0.89715576171875, 1.001922607421875, 1.106689453125, 1.211456298828125, 1.31622314453125, 1.420989990234375, 1.5257568359375, 1.630523681640625, 1.73529052734375, 1.840057373046875, 1.94482421875, 2.049591064453125, 2.15435791015625, 2.259124755859375, 2.3638916015625, 2.468658447265625, 2.57342529296875, 2.678192138671875, 2.782958984375, 2.887725830078125, 2.99249267578125, 3.097259521484375, 3.2020263671875, 3.306793212890625, 3.41156005859375, 3.516326904296875, 3.62109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 8.0, 17.0, 61.0, 164.0, 424.0, 218.0, 71.0, 20.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.67119598388672, -42.775901794433594, -40.880611419677734, -38.98531723022461, -37.090023040771484, -35.194732666015625, -33.2994384765625, -31.404146194458008, -29.508853912353516, -27.613561630249023, -25.7182674407959, -23.822975158691406, -21.927682876586914, -20.032390594482422, -18.137096405029297, -16.241804122924805, -14.34650993347168, -12.451216697692871, -10.555924415588379, -8.66063117980957, -6.76533842086792, -4.8700456619262695, -2.974752426147461, -1.0794601440429688, 0.8158330917358398, 2.7111258506774902, 4.606418609619141, 6.501711845397949, 8.397005081176758, 10.29229736328125, 12.187590599060059, 14.08288288116455, 15.97817611694336, 17.87346839904785, 19.768762588500977, 21.66405487060547, 23.55934715270996, 25.454639434814453, 27.349933624267578, 29.24522590637207, 31.140518188476562, 33.03581237792969, 34.93110275268555, 36.82639694213867, 38.7216911315918, 40.616981506347656, 42.51227569580078, 44.407569885253906, 46.30286407470703, 48.198158264160156, 50.093448638916016, 51.98874282836914, 53.884037017822266, 55.779327392578125, 57.67462158203125, 59.569915771484375, 61.465206146240234, 63.36050033569336, 65.25579071044922, 67.15108489990234, 69.04637908935547, 70.9416732788086, 72.83695983886719, 74.73225402832031, 76.62754821777344]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 1.0, 11.0, 9.0, 13.0, 11.0, 16.0, 16.0, 21.0, 23.0, 28.0, 26.0, 25.0, 23.0, 25.0, 40.0, 54.0, 71.0, 68.0, 77.0, 54.0, 50.0, 49.0, 36.0, 37.0, 38.0, 18.0, 17.0, 18.0, 27.0, 13.0, 15.0, 7.0, 15.0, 7.0, 8.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.888042449951172, -17.329771041870117, -16.771499633789062, -16.213228225708008, -15.654956817626953, -15.096685409545898, -14.538414001464844, -13.980142593383789, -13.421871185302734, -12.86359977722168, -12.305328369140625, -11.74705696105957, -11.188785552978516, -10.630514144897461, -10.072242736816406, -9.513971328735352, -8.95569896697998, -8.397427558898926, -7.839156150817871, -7.280884742736816, -6.722613334655762, -6.164341926574707, -5.606070041656494, -5.0477986335754395, -4.489527225494385, -3.93125581741333, -3.3729844093322754, -2.8147127628326416, -2.256441354751587, -1.6981699466705322, -1.1398983001708984, -0.5816268920898438, -0.023355484008789062, 0.5349159836769104, 1.0931874513626099, 1.651458978652954, 2.209730386734009, 2.7680017948150635, 3.3262734413146973, 3.884544849395752, 4.442816257476807, 5.001087665557861, 5.559359073638916, 6.117630958557129, 6.675902366638184, 7.234173774719238, 7.792445182800293, 8.350716590881348, 8.908987998962402, 9.467259407043457, 10.025530815124512, 10.583802223205566, 11.142073631286621, 11.700345039367676, 12.258617401123047, 12.816888809204102, 13.375160217285156, 13.933431625366211, 14.491703033447266, 15.04997444152832, 15.608245849609375, 16.16651725769043, 16.724788665771484, 17.28306007385254, 17.841331481933594]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 9.0, 12.0, 4.0, 12.0, 17.0, 20.0, 38.0, 53.0, 106.0, 258.0, 1053.0, 19494.0, 4081787.0, 87288.0, 2586.0, 940.0, 328.0, 113.0, 52.0, 28.0, 8.0, 12.0, 12.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.2890625, -9.085540771484375, -8.88201904296875, -8.678497314453125, -8.4749755859375, -8.271453857421875, -8.06793212890625, -7.864410400390625, -7.660888671875, -7.457366943359375, -7.25384521484375, -7.050323486328125, -6.8468017578125, -6.643280029296875, -6.43975830078125, -6.236236572265625, -6.03271484375, -5.829193115234375, -5.62567138671875, -5.422149658203125, -5.2186279296875, -5.015106201171875, -4.81158447265625, -4.608062744140625, -4.404541015625, -4.201019287109375, -3.99749755859375, -3.793975830078125, -3.5904541015625, -3.386932373046875, -3.18341064453125, -2.979888916015625, -2.7763671875, -2.572845458984375, -2.36932373046875, -2.165802001953125, -1.9622802734375, -1.758758544921875, -1.55523681640625, -1.351715087890625, -1.148193359375, -0.944671630859375, -0.74114990234375, -0.537628173828125, -0.3341064453125, -0.130584716796875, 0.07293701171875, 0.276458740234375, 0.47998046875, 0.683502197265625, 0.88702392578125, 1.090545654296875, 1.2940673828125, 1.497589111328125, 1.70111083984375, 1.904632568359375, 2.108154296875, 2.311676025390625, 2.51519775390625, 2.718719482421875, 2.9222412109375, 3.125762939453125, 3.32928466796875, 3.532806396484375, 3.736328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 12.0, 18.0, 28.0, 51.0, 78.0, 115.0, 123.0, 127.0, 123.0, 108.0, 73.0, 61.0, 37.0, 22.0, 14.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.710968017578125, -2.63677978515625, -2.562591552734375, -2.4884033203125, -2.414215087890625, -2.34002685546875, -2.265838623046875, -2.191650390625, -2.117462158203125, -2.04327392578125, -1.969085693359375, -1.8948974609375, -1.820709228515625, -1.74652099609375, -1.672332763671875, -1.59814453125, -1.523956298828125, -1.44976806640625, -1.375579833984375, -1.3013916015625, -1.227203369140625, -1.15301513671875, -1.078826904296875, -1.004638671875, -0.930450439453125, -0.85626220703125, -0.782073974609375, -0.7078857421875, -0.633697509765625, -0.55950927734375, -0.485321044921875, -0.4111328125, -0.336944580078125, -0.26275634765625, -0.188568115234375, -0.1143798828125, -0.040191650390625, 0.03399658203125, 0.108184814453125, 0.182373046875, 0.256561279296875, 0.33074951171875, 0.404937744140625, 0.4791259765625, 0.553314208984375, 0.62750244140625, 0.701690673828125, 0.77587890625, 0.850067138671875, 0.92425537109375, 0.998443603515625, 1.0726318359375, 1.146820068359375, 1.22100830078125, 1.295196533203125, 1.369384765625, 1.443572998046875, 1.51776123046875, 1.591949462890625, 1.6661376953125, 1.740325927734375, 1.81451416015625, 1.888702392578125, 1.962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 10.0, 22.0, 32.0, 55.0, 83.0, 186.0, 350.0, 877.0, 2914.0, 16692.0, 352169.0, 3700970.0, 107519.0, 8834.0, 2040.0, 798.0, 340.0, 167.0, 92.0, 44.0, 25.0, 18.0, 13.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.271484375, -3.160003662109375, -3.04852294921875, -2.937042236328125, -2.8255615234375, -2.714080810546875, -2.60260009765625, -2.491119384765625, -2.379638671875, -2.268157958984375, -2.15667724609375, -2.045196533203125, -1.9337158203125, -1.822235107421875, -1.71075439453125, -1.599273681640625, -1.48779296875, -1.376312255859375, -1.26483154296875, -1.153350830078125, -1.0418701171875, -0.930389404296875, -0.81890869140625, -0.707427978515625, -0.595947265625, -0.484466552734375, -0.37298583984375, -0.261505126953125, -0.1500244140625, -0.038543701171875, 0.07293701171875, 0.184417724609375, 0.2958984375, 0.407379150390625, 0.51885986328125, 0.630340576171875, 0.7418212890625, 0.853302001953125, 0.96478271484375, 1.076263427734375, 1.187744140625, 1.299224853515625, 1.41070556640625, 1.522186279296875, 1.6336669921875, 1.745147705078125, 1.85662841796875, 1.968109130859375, 2.07958984375, 2.191070556640625, 2.30255126953125, 2.414031982421875, 2.5255126953125, 2.636993408203125, 2.74847412109375, 2.859954833984375, 2.971435546875, 3.082916259765625, 3.19439697265625, 3.305877685546875, 3.4173583984375, 3.528839111328125, 3.64031982421875, 3.751800537109375, 3.86328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 8.0, 10.0, 13.0, 14.0, 13.0, 28.0, 34.0, 56.0, 69.0, 114.0, 182.0, 327.0, 439.0, 599.0, 666.0, 529.0, 352.0, 217.0, 139.0, 89.0, 49.0, 32.0, 23.0, 17.0, 13.0, 9.0, 9.0, 9.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.912109375, -1.84405517578125, -1.7760009765625, -1.70794677734375, -1.639892578125, -1.57183837890625, -1.5037841796875, -1.43572998046875, -1.36767578125, -1.29962158203125, -1.2315673828125, -1.16351318359375, -1.095458984375, -1.02740478515625, -0.9593505859375, -0.89129638671875, -0.8232421875, -0.75518798828125, -0.6871337890625, -0.61907958984375, -0.551025390625, -0.48297119140625, -0.4149169921875, -0.34686279296875, -0.27880859375, -0.21075439453125, -0.1427001953125, -0.07464599609375, -0.006591796875, 0.06146240234375, 0.1295166015625, 0.19757080078125, 0.265625, 0.33367919921875, 0.4017333984375, 0.46978759765625, 0.537841796875, 0.60589599609375, 0.6739501953125, 0.74200439453125, 0.81005859375, 0.87811279296875, 0.9461669921875, 1.01422119140625, 1.082275390625, 1.15032958984375, 1.2183837890625, 1.28643798828125, 1.3544921875, 1.42254638671875, 1.4906005859375, 1.55865478515625, 1.626708984375, 1.69476318359375, 1.7628173828125, 1.83087158203125, 1.89892578125, 1.96697998046875, 2.0350341796875, 2.10308837890625, 2.171142578125, 2.23919677734375, 2.3072509765625, 2.37530517578125, 2.443359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 42.0, 89.0, 155.0, 236.0, 225.0, 125.0, 55.0, 22.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-31.735456466674805, -30.874797821044922, -30.01413917541504, -29.153480529785156, -28.292821884155273, -27.43216323852539, -26.571504592895508, -25.710845947265625, -24.850187301635742, -23.98952865600586, -23.128870010375977, -22.268211364746094, -21.40755271911621, -20.546894073486328, -19.686235427856445, -18.825576782226562, -17.96491813659668, -17.104259490966797, -16.243600845336914, -15.382942199707031, -14.522283554077148, -13.661624908447266, -12.800966262817383, -11.9403076171875, -11.079648971557617, -10.218990325927734, -9.358331680297852, -8.497673034667969, -7.637014389038086, -6.776355743408203, -5.91569709777832, -5.0550384521484375, -4.194377899169922, -3.333719253540039, -2.4730606079101562, -1.6124019622802734, -0.7517433166503906, 0.10891532897949219, 0.969573974609375, 1.8302326202392578, 2.6908912658691406, 3.5515499114990234, 4.412208557128906, 5.272867202758789, 6.133525848388672, 6.994184494018555, 7.8548431396484375, 8.71550178527832, 9.576160430908203, 10.436819076538086, 11.297477722167969, 12.158136367797852, 13.018795013427734, 13.879453659057617, 14.7401123046875, 15.600770950317383, 16.461429595947266, 17.32208824157715, 18.18274688720703, 19.043405532836914, 19.904064178466797, 20.76472282409668, 21.625381469726562, 22.486040115356445, 23.346698760986328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 15.0, 17.0, 17.0, 42.0, 39.0, 55.0, 53.0, 63.0, 71.0, 83.0, 85.0, 78.0, 75.0, 74.0, 55.0, 41.0, 31.0, 29.0, 19.0, 16.0, 8.0, 6.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.731535911560059, -14.249303817749023, -13.767070770263672, -13.28483772277832, -12.802605628967285, -12.32037353515625, -11.838140487670898, -11.355907440185547, -10.873675346374512, -10.391443252563477, -9.909210205078125, -9.426977157592773, -8.944745063781738, -8.462512969970703, -7.980279922485352, -7.498047351837158, -7.015814781188965, -6.5335822105407715, -6.051349639892578, -5.569117069244385, -5.086884498596191, -4.604651927947998, -4.122419357299805, -3.6401867866516113, -3.157954216003418, -2.6757216453552246, -2.1934890747070312, -1.711256504058838, -1.2290239334106445, -0.7467913627624512, -0.2645587921142578, 0.21767377853393555, 0.6999053955078125, 1.1821379661560059, 1.6643705368041992, 2.1466031074523926, 2.628835678100586, 3.1110682487487793, 3.5933008193969727, 4.075533390045166, 4.557765960693359, 5.039998531341553, 5.522231101989746, 6.0044636726379395, 6.486696243286133, 6.968928813934326, 7.4511613845825195, 7.933393955230713, 8.415626525878906, 8.897859573364258, 9.380091667175293, 9.862323760986328, 10.34455680847168, 10.826789855957031, 11.309021949768066, 11.791254043579102, 12.273487091064453, 12.755720138549805, 13.23795223236084, 13.720184326171875, 14.202417373657227, 14.684650421142578, 15.166882514953613, 15.649114608764648, 16.13134765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 9.0, 14.0, 16.0, 38.0, 64.0, 125.0, 341.0, 1661.0, 23890.0, 939485.0, 79226.0, 2889.0, 455.0, 118.0, 60.0, 37.0, 25.0, 24.0, 20.0, 10.0, 3.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.546875, -10.26666259765625, -9.9864501953125, -9.70623779296875, -9.426025390625, -9.14581298828125, -8.8656005859375, -8.58538818359375, -8.30517578125, -8.02496337890625, -7.7447509765625, -7.46453857421875, -7.184326171875, -6.90411376953125, -6.6239013671875, -6.34368896484375, -6.0634765625, -5.78326416015625, -5.5030517578125, -5.22283935546875, -4.942626953125, -4.66241455078125, -4.3822021484375, -4.10198974609375, -3.82177734375, -3.54156494140625, -3.2613525390625, -2.98114013671875, -2.700927734375, -2.42071533203125, -2.1405029296875, -1.86029052734375, -1.580078125, -1.29986572265625, -1.0196533203125, -0.73944091796875, -0.459228515625, -0.17901611328125, 0.1011962890625, 0.38140869140625, 0.66162109375, 0.94183349609375, 1.2220458984375, 1.50225830078125, 1.782470703125, 2.06268310546875, 2.3428955078125, 2.62310791015625, 2.9033203125, 3.18353271484375, 3.4637451171875, 3.74395751953125, 4.024169921875, 4.30438232421875, 4.5845947265625, 4.86480712890625, 5.14501953125, 5.42523193359375, 5.7054443359375, 5.98565673828125, 6.265869140625, 6.54608154296875, 6.8262939453125, 7.10650634765625, 7.38671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 21.0, 21.0, 37.0, 55.0, 68.0, 76.0, 94.0, 97.0, 124.0, 105.0, 78.0, 68.0, 50.0, 45.0, 24.0, 10.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.732421875, -2.6714630126953125, -2.610504150390625, -2.5495452880859375, -2.48858642578125, -2.4276275634765625, -2.366668701171875, -2.3057098388671875, -2.2447509765625, -2.1837921142578125, -2.122833251953125, -2.0618743896484375, -2.00091552734375, -1.9399566650390625, -1.878997802734375, -1.8180389404296875, -1.757080078125, -1.6961212158203125, -1.635162353515625, -1.5742034912109375, -1.51324462890625, -1.4522857666015625, -1.391326904296875, -1.3303680419921875, -1.2694091796875, -1.2084503173828125, -1.147491455078125, -1.0865325927734375, -1.02557373046875, -0.9646148681640625, -0.903656005859375, -0.8426971435546875, -0.78173828125, -0.7207794189453125, -0.659820556640625, -0.5988616943359375, -0.53790283203125, -0.4769439697265625, -0.415985107421875, -0.3550262451171875, -0.2940673828125, -0.2331085205078125, -0.172149658203125, -0.1111907958984375, -0.05023193359375, 0.0107269287109375, 0.071685791015625, 0.1326446533203125, 0.193603515625, 0.2545623779296875, 0.315521240234375, 0.3764801025390625, 0.43743896484375, 0.4983978271484375, 0.559356689453125, 0.6203155517578125, 0.6812744140625, 0.7422332763671875, 0.803192138671875, 0.8641510009765625, 0.92510986328125, 0.9860687255859375, 1.047027587890625, 1.1079864501953125, 1.1689453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 16.0, 16.0, 33.0, 45.0, 73.0, 151.0, 375.0, 969.0, 4057.0, 77796.0, 946697.0, 15077.0, 2114.0, 620.0, 231.0, 110.0, 62.0, 22.0, 19.0, 11.0, 5.0, 11.0, 5.0, 7.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.8670654296875, -12.531005859375, -12.1949462890625, -11.85888671875, -11.5228271484375, -11.186767578125, -10.8507080078125, -10.5146484375, -10.1785888671875, -9.842529296875, -9.5064697265625, -9.17041015625, -8.8343505859375, -8.498291015625, -8.1622314453125, -7.826171875, -7.4901123046875, -7.154052734375, -6.8179931640625, -6.48193359375, -6.1458740234375, -5.809814453125, -5.4737548828125, -5.1376953125, -4.8016357421875, -4.465576171875, -4.1295166015625, -3.79345703125, -3.4573974609375, -3.121337890625, -2.7852783203125, -2.44921875, -2.1131591796875, -1.777099609375, -1.4410400390625, -1.10498046875, -0.7689208984375, -0.432861328125, -0.0968017578125, 0.2392578125, 0.5753173828125, 0.911376953125, 1.2474365234375, 1.58349609375, 1.9195556640625, 2.255615234375, 2.5916748046875, 2.927734375, 3.2637939453125, 3.599853515625, 3.9359130859375, 4.27197265625, 4.6080322265625, 4.944091796875, 5.2801513671875, 5.6162109375, 5.9522705078125, 6.288330078125, 6.6243896484375, 6.96044921875, 7.2965087890625, 7.632568359375, 7.9686279296875, 8.3046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 26.0, 24.0, 29.0, 36.0, 44.0, 42.0, 65.0, 65.0, 80.0, 77.0, 83.0, 51.0, 49.0, 52.0, 39.0, 43.0, 43.0, 25.0, 20.0, 13.0, 11.0, 9.0, 6.0, 5.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03515625, -5.8660888671875, -5.697021484375, -5.5279541015625, -5.35888671875, -5.1898193359375, -5.020751953125, -4.8516845703125, -4.6826171875, -4.5135498046875, -4.344482421875, -4.1754150390625, -4.00634765625, -3.8372802734375, -3.668212890625, -3.4991455078125, -3.330078125, -3.1610107421875, -2.991943359375, -2.8228759765625, -2.65380859375, -2.4847412109375, -2.315673828125, -2.1466064453125, -1.9775390625, -1.8084716796875, -1.639404296875, -1.4703369140625, -1.30126953125, -1.1322021484375, -0.963134765625, -0.7940673828125, -0.625, -0.4559326171875, -0.286865234375, -0.1177978515625, 0.05126953125, 0.2203369140625, 0.389404296875, 0.5584716796875, 0.7275390625, 0.8966064453125, 1.065673828125, 1.2347412109375, 1.40380859375, 1.5728759765625, 1.741943359375, 1.9110107421875, 2.080078125, 2.2491455078125, 2.418212890625, 2.5872802734375, 2.75634765625, 2.9254150390625, 3.094482421875, 3.2635498046875, 3.4326171875, 3.6016845703125, 3.770751953125, 3.9398193359375, 4.10888671875, 4.2779541015625, 4.447021484375, 4.6160888671875, 4.78515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 10.0, 4.0, 9.0, 15.0, 17.0, 23.0, 27.0, 37.0, 64.0, 75.0, 112.0, 231.0, 352.0, 784.0, 1691.0, 4919.0, 19412.0, 146336.0, 800034.0, 57942.0, 10627.0, 3298.0, 1173.0, 547.0, 287.0, 163.0, 106.0, 68.0, 55.0, 29.0, 27.0, 18.0, 17.0, 10.0, 7.0, 8.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.392578125, -2.32073974609375, -2.2489013671875, -2.17706298828125, -2.105224609375, -2.03338623046875, -1.9615478515625, -1.88970947265625, -1.81787109375, -1.74603271484375, -1.6741943359375, -1.60235595703125, -1.530517578125, -1.45867919921875, -1.3868408203125, -1.31500244140625, -1.2431640625, -1.17132568359375, -1.0994873046875, -1.02764892578125, -0.955810546875, -0.88397216796875, -0.8121337890625, -0.74029541015625, -0.66845703125, -0.59661865234375, -0.5247802734375, -0.45294189453125, -0.381103515625, -0.30926513671875, -0.2374267578125, -0.16558837890625, -0.09375, -0.02191162109375, 0.0499267578125, 0.12176513671875, 0.193603515625, 0.26544189453125, 0.3372802734375, 0.40911865234375, 0.48095703125, 0.55279541015625, 0.6246337890625, 0.69647216796875, 0.768310546875, 0.84014892578125, 0.9119873046875, 0.98382568359375, 1.0556640625, 1.12750244140625, 1.1993408203125, 1.27117919921875, 1.343017578125, 1.41485595703125, 1.4866943359375, 1.55853271484375, 1.63037109375, 1.70220947265625, 1.7740478515625, 1.84588623046875, 1.917724609375, 1.98956298828125, 2.0614013671875, 2.13323974609375, 2.205078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 15.0, 14.0, 21.0, 31.0, 46.0, 87.0, 154.0, 259.0, 135.0, 76.0, 41.0, 26.0, 17.0, 15.0, 13.0, 7.0, 10.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007104873657226562, -0.0006871521472930908, -0.0006638169288635254, -0.00064048171043396, -0.0006171464920043945, -0.0005938112735748291, -0.0005704760551452637, -0.0005471408367156982, -0.0005238056182861328, -0.0005004703998565674, -0.00047713518142700195, -0.0004537999629974365, -0.0004304647445678711, -0.00040712952613830566, -0.00038379430770874023, -0.0003604590892791748, -0.0003371238708496094, -0.00031378865242004395, -0.0002904534339904785, -0.0002671182155609131, -0.00024378299713134766, -0.00022044777870178223, -0.0001971125602722168, -0.00017377734184265137, -0.00015044212341308594, -0.0001271069049835205, -0.00010377168655395508, -8.043646812438965e-05, -5.710124969482422e-05, -3.376603126525879e-05, -1.043081283569336e-05, 1.290440559387207e-05, 3.62396240234375e-05, 5.957484245300293e-05, 8.291006088256836e-05, 0.00010624527931213379, 0.00012958049774169922, 0.00015291571617126465, 0.00017625093460083008, 0.0001995861530303955, 0.00022292137145996094, 0.00024625658988952637, 0.0002695918083190918, 0.0002929270267486572, 0.00031626224517822266, 0.0003395974636077881, 0.0003629326820373535, 0.00038626790046691895, 0.0004096031188964844, 0.0004329383373260498, 0.00045627355575561523, 0.00047960877418518066, 0.0005029439926147461, 0.0005262792110443115, 0.000549614429473877, 0.0005729496479034424, 0.0005962848663330078, 0.0006196200847625732, 0.0006429553031921387, 0.0006662905216217041, 0.0006896257400512695, 0.000712960958480835, 0.0007362961769104004, 0.0007596313953399658, 0.0007829666137695312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 14.0, 14.0, 15.0, 12.0, 22.0, 21.0, 36.0, 44.0, 54.0, 90.0, 101.0, 183.0, 312.0, 577.0, 1022.0, 2083.0, 4585.0, 12595.0, 50335.0, 663717.0, 262507.0, 33359.0, 9318.0, 3676.0, 1705.0, 857.0, 470.0, 285.0, 152.0, 111.0, 69.0, 52.0, 30.0, 31.0, 20.0, 12.0, 12.0, 10.0, 9.0, 7.0, 5.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.74609375, -1.6876373291015625, -1.629180908203125, -1.5707244873046875, -1.51226806640625, -1.4538116455078125, -1.395355224609375, -1.3368988037109375, -1.2784423828125, -1.2199859619140625, -1.161529541015625, -1.1030731201171875, -1.04461669921875, -0.9861602783203125, -0.927703857421875, -0.8692474365234375, -0.810791015625, -0.7523345947265625, -0.693878173828125, -0.6354217529296875, -0.57696533203125, -0.5185089111328125, -0.460052490234375, -0.4015960693359375, -0.3431396484375, -0.2846832275390625, -0.226226806640625, -0.1677703857421875, -0.10931396484375, -0.0508575439453125, 0.007598876953125, 0.0660552978515625, 0.12451171875, 0.1829681396484375, 0.241424560546875, 0.2998809814453125, 0.35833740234375, 0.4167938232421875, 0.475250244140625, 0.5337066650390625, 0.5921630859375, 0.6506195068359375, 0.709075927734375, 0.7675323486328125, 0.82598876953125, 0.8844451904296875, 0.942901611328125, 1.0013580322265625, 1.059814453125, 1.1182708740234375, 1.176727294921875, 1.2351837158203125, 1.29364013671875, 1.3520965576171875, 1.410552978515625, 1.4690093994140625, 1.5274658203125, 1.5859222412109375, 1.644378662109375, 1.7028350830078125, 1.76129150390625, 1.8197479248046875, 1.878204345703125, 1.9366607666015625, 1.9951171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 5.0, 9.0, 7.0, 13.0, 9.0, 14.0, 25.0, 44.0, 59.0, 97.0, 136.0, 151.0, 144.0, 91.0, 45.0, 30.0, 22.0, 16.0, 12.0, 5.0, 8.0, 7.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.732421875, -1.673248291015625, -1.61407470703125, -1.554901123046875, -1.4957275390625, -1.436553955078125, -1.37738037109375, -1.318206787109375, -1.259033203125, -1.199859619140625, -1.14068603515625, -1.081512451171875, -1.0223388671875, -0.963165283203125, -0.90399169921875, -0.844818115234375, -0.78564453125, -0.726470947265625, -0.66729736328125, -0.608123779296875, -0.5489501953125, -0.489776611328125, -0.43060302734375, -0.371429443359375, -0.312255859375, -0.253082275390625, -0.19390869140625, -0.134735107421875, -0.0755615234375, -0.016387939453125, 0.04278564453125, 0.101959228515625, 0.1611328125, 0.220306396484375, 0.27947998046875, 0.338653564453125, 0.3978271484375, 0.457000732421875, 0.51617431640625, 0.575347900390625, 0.634521484375, 0.693695068359375, 0.75286865234375, 0.812042236328125, 0.8712158203125, 0.930389404296875, 0.98956298828125, 1.048736572265625, 1.10791015625, 1.167083740234375, 1.22625732421875, 1.285430908203125, 1.3446044921875, 1.403778076171875, 1.46295166015625, 1.522125244140625, 1.581298828125, 1.640472412109375, 1.69964599609375, 1.758819580078125, 1.8179931640625, 1.877166748046875, 1.93634033203125, 1.995513916015625, 2.0546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 12.0, 57.0, 149.0, 421.0, 225.0, 77.0, 20.0, 7.0, 6.0, 4.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.21904754638672, -58.52818298339844, -56.83732223510742, -55.14645767211914, -53.45559310913086, -51.764732360839844, -50.07386779785156, -48.38300323486328, -46.692138671875, -45.00127410888672, -43.3104133605957, -41.61954879760742, -39.92868423461914, -38.237823486328125, -36.546958923339844, -34.85609436035156, -33.16522979736328, -31.474367141723633, -29.78350257873535, -28.092639923095703, -26.401775360107422, -24.710912704467773, -23.020050048828125, -21.329185485839844, -19.638324737548828, -17.94746208190918, -16.2565975189209, -14.56573486328125, -12.874870300292969, -11.18400764465332, -9.493144035339355, -7.802280426025391, -6.111415863037109, -4.4205522537231445, -2.729688882827759, -1.038825511932373, 0.6520380973815918, 2.3429012298583984, 4.033764839172363, 5.724628448486328, 7.415492057800293, 9.106355667114258, 10.797219276428223, 12.488082885742188, 14.178945541381836, 15.8698091506958, 17.560672760009766, 19.251537322998047, 20.942399978637695, 22.633262634277344, 24.324127197265625, 26.014989852905273, 27.705854415893555, 29.396717071533203, 31.087581634521484, 32.7784423828125, 34.46930694580078, 36.16017150878906, 37.85103225708008, 39.54189682006836, 41.23276138305664, 42.923622131347656, 44.61448669433594, 46.30535125732422, 47.9962158203125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 12.0, 6.0, 5.0, 15.0, 18.0, 19.0, 21.0, 23.0, 19.0, 25.0, 26.0, 32.0, 23.0, 23.0, 32.0, 35.0, 43.0, 50.0, 60.0, 67.0, 54.0, 50.0, 38.0, 39.0, 27.0, 18.0, 23.0, 29.0, 21.0, 23.0, 10.0, 15.0, 14.0, 5.0, 10.0, 9.0, 16.0, 10.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-14.028838157653809, -13.60805606842041, -13.187273979187012, -12.766490936279297, -12.345708847045898, -11.9249267578125, -11.504144668579102, -11.083362579345703, -10.662579536437988, -10.24179744720459, -9.821015357971191, -9.400232315063477, -8.979450225830078, -8.55866813659668, -8.137886047363281, -7.717103481292725, -7.296321392059326, -6.875539302825928, -6.454756736755371, -6.033974647521973, -5.613192081451416, -5.192409992218018, -4.771627426147461, -4.3508453369140625, -3.930063009262085, -3.5092806816101074, -3.08849835395813, -2.6677160263061523, -2.246933937072754, -1.8261516094207764, -1.4053692817687988, -0.9845869541168213, -0.5638046264648438, -0.1430223286151886, 0.27775996923446655, 0.6985422372817993, 1.1193245649337769, 1.5401067733764648, 1.9608891010284424, 2.38167142868042, 2.8024537563323975, 3.223236083984375, 3.6440184116363525, 4.06480073928833, 4.4855828285217285, 4.906365394592285, 5.327147483825684, 5.747929573059082, 6.168712139129639, 6.589494228363037, 7.010276794433594, 7.431058883666992, 7.851841449737549, 8.272623062133789, 8.693406105041504, 9.114188194274902, 9.5349702835083, 9.9557523727417, 10.376534461975098, 10.797317504882812, 11.218099594116211, 11.63888168334961, 12.059663772583008, 12.480445861816406, 12.901228904724121]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 10.0, 17.0, 30.0, 30.0, 58.0, 98.0, 190.0, 610.0, 2945.0, 55608.0, 4090954.0, 39764.0, 2716.0, 740.0, 209.0, 122.0, 49.0, 29.0, 21.0, 13.0, 11.0, 7.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.5859375, -7.4029541015625, -7.219970703125, -7.0369873046875, -6.85400390625, -6.6710205078125, -6.488037109375, -6.3050537109375, -6.1220703125, -5.9390869140625, -5.756103515625, -5.5731201171875, -5.39013671875, -5.2071533203125, -5.024169921875, -4.8411865234375, -4.658203125, -4.4752197265625, -4.292236328125, -4.1092529296875, -3.92626953125, -3.7432861328125, -3.560302734375, -3.3773193359375, -3.1943359375, -3.0113525390625, -2.828369140625, -2.6453857421875, -2.46240234375, -2.2794189453125, -2.096435546875, -1.9134521484375, -1.73046875, -1.5474853515625, -1.364501953125, -1.1815185546875, -0.99853515625, -0.8155517578125, -0.632568359375, -0.4495849609375, -0.2666015625, -0.0836181640625, 0.099365234375, 0.2823486328125, 0.46533203125, 0.6483154296875, 0.831298828125, 1.0142822265625, 1.197265625, 1.3802490234375, 1.563232421875, 1.7462158203125, 1.92919921875, 2.1121826171875, 2.295166015625, 2.4781494140625, 2.6611328125, 2.8441162109375, 3.027099609375, 3.2100830078125, 3.39306640625, 3.5760498046875, 3.759033203125, 3.9420166015625, 4.125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 14.0, 12.0, 13.0, 22.0, 31.0, 38.0, 67.0, 59.0, 85.0, 78.0, 86.0, 86.0, 87.0, 76.0, 60.0, 56.0, 38.0, 29.0, 20.0, 14.0, 8.0, 10.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.6247406005859375, -1.573699951171875, -1.5226593017578125, -1.47161865234375, -1.4205780029296875, -1.369537353515625, -1.3184967041015625, -1.2674560546875, -1.2164154052734375, -1.165374755859375, -1.1143341064453125, -1.06329345703125, -1.0122528076171875, -0.961212158203125, -0.9101715087890625, -0.859130859375, -0.8080902099609375, -0.757049560546875, -0.7060089111328125, -0.65496826171875, -0.6039276123046875, -0.552886962890625, -0.5018463134765625, -0.4508056640625, -0.3997650146484375, -0.348724365234375, -0.2976837158203125, -0.24664306640625, -0.1956024169921875, -0.144561767578125, -0.0935211181640625, -0.04248046875, 0.0085601806640625, 0.059600830078125, 0.1106414794921875, 0.16168212890625, 0.2127227783203125, 0.263763427734375, 0.3148040771484375, 0.3658447265625, 0.4168853759765625, 0.467926025390625, 0.5189666748046875, 0.57000732421875, 0.6210479736328125, 0.672088623046875, 0.7231292724609375, 0.774169921875, 0.8252105712890625, 0.876251220703125, 0.9272918701171875, 0.97833251953125, 1.0293731689453125, 1.080413818359375, 1.1314544677734375, 1.1824951171875, 1.2335357666015625, 1.284576416015625, 1.3356170654296875, 1.38665771484375, 1.4376983642578125, 1.488739013671875, 1.5397796630859375, 1.5908203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 18.0, 32.0, 161.0, 468.0, 1670.0, 19636.0, 4154421.0, 16087.0, 1258.0, 324.0, 120.0, 50.0, 18.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6484375, -13.293701171875, -12.93896484375, -12.584228515625, -12.2294921875, -11.874755859375, -11.52001953125, -11.165283203125, -10.810546875, -10.455810546875, -10.10107421875, -9.746337890625, -9.3916015625, -9.036865234375, -8.68212890625, -8.327392578125, -7.97265625, -7.617919921875, -7.26318359375, -6.908447265625, -6.5537109375, -6.198974609375, -5.84423828125, -5.489501953125, -5.134765625, -4.780029296875, -4.42529296875, -4.070556640625, -3.7158203125, -3.361083984375, -3.00634765625, -2.651611328125, -2.296875, -1.942138671875, -1.58740234375, -1.232666015625, -0.8779296875, -0.523193359375, -0.16845703125, 0.186279296875, 0.541015625, 0.895751953125, 1.25048828125, 1.605224609375, 1.9599609375, 2.314697265625, 2.66943359375, 3.024169921875, 3.37890625, 3.733642578125, 4.08837890625, 4.443115234375, 4.7978515625, 5.152587890625, 5.50732421875, 5.862060546875, 6.216796875, 6.571533203125, 6.92626953125, 7.281005859375, 7.6357421875, 7.990478515625, 8.34521484375, 8.699951171875, 9.0546875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 10.0, 14.0, 39.0, 112.0, 339.0, 1347.0, 1576.0, 438.0, 99.0, 42.0, 28.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.13360595703125, -4.9508056640625, -4.76800537109375, -4.585205078125, -4.40240478515625, -4.2196044921875, -4.03680419921875, -3.85400390625, -3.67120361328125, -3.4884033203125, -3.30560302734375, -3.122802734375, -2.94000244140625, -2.7572021484375, -2.57440185546875, -2.3916015625, -2.20880126953125, -2.0260009765625, -1.84320068359375, -1.660400390625, -1.47760009765625, -1.2947998046875, -1.11199951171875, -0.92919921875, -0.74639892578125, -0.5635986328125, -0.38079833984375, -0.197998046875, -0.01519775390625, 0.1676025390625, 0.35040283203125, 0.533203125, 0.71600341796875, 0.8988037109375, 1.08160400390625, 1.264404296875, 1.44720458984375, 1.6300048828125, 1.81280517578125, 1.99560546875, 2.17840576171875, 2.3612060546875, 2.54400634765625, 2.726806640625, 2.90960693359375, 3.0924072265625, 3.27520751953125, 3.4580078125, 3.64080810546875, 3.8236083984375, 4.00640869140625, 4.189208984375, 4.37200927734375, 4.5548095703125, 4.73760986328125, 4.92041015625, 5.10321044921875, 5.2860107421875, 5.46881103515625, 5.651611328125, 5.83441162109375, 6.0172119140625, 6.20001220703125, 6.3828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 6.0, 7.0, 15.0, 34.0, 94.0, 236.0, 275.0, 199.0, 81.0, 29.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-54.58929443359375, -53.48629379272461, -52.38329315185547, -51.28029251098633, -50.17729187011719, -49.07429122924805, -47.971290588378906, -46.86829376220703, -45.765289306640625, -44.662288665771484, -43.559288024902344, -42.4562873840332, -41.35328674316406, -40.25028610229492, -39.14728546142578, -38.044288635253906, -36.941287994384766, -35.838287353515625, -34.735286712646484, -33.632286071777344, -32.5292854309082, -31.426284790039062, -30.323286056518555, -29.220285415649414, -28.117284774780273, -27.014284133911133, -25.911283493041992, -24.80828285217285, -23.705284118652344, -22.602283477783203, -21.499282836914062, -20.396282196044922, -19.293277740478516, -18.190277099609375, -17.087276458740234, -15.98427677154541, -14.88127613067627, -13.778275489807129, -12.675275802612305, -11.572275161743164, -10.469274520874023, -9.366273880004883, -8.263273239135742, -7.160273551940918, -6.057272911071777, -4.954272270202637, -3.8512721061706543, -2.748271942138672, -1.6452713012695312, -0.5422708988189697, 0.5607295036315918, 1.6637299060821533, 2.766730308532715, 3.8697309494018555, 4.972731113433838, 6.07573127746582, 7.178731918334961, 8.281732559204102, 9.384733200073242, 10.487732887268066, 11.590733528137207, 12.693734169006348, 13.796733856201172, 14.899734497070312, 16.002735137939453]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 17.0, 17.0, 31.0, 47.0, 84.0, 122.0, 147.0, 143.0, 128.0, 118.0, 84.0, 31.0, 17.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.470855712890625, -15.603269577026367, -14.73568344116211, -13.868098258972168, -13.00051212310791, -12.132925987243652, -11.265340805053711, -10.397754669189453, -9.530168533325195, -8.662582397460938, -7.794996738433838, -6.927411079406738, -6.0598249435424805, -5.192238807678223, -4.324653148651123, -3.4570674896240234, -2.5894813537597656, -1.721895456314087, -0.8543095588684082, 0.013276338577270508, 0.8808622360229492, 1.748448371887207, 2.6160340309143066, 3.4836196899414062, 4.351205825805664, 5.218791961669922, 6.0863776206970215, 6.953963279724121, 7.821549415588379, 8.689135551452637, 9.556720733642578, 10.424306869506836, 11.291893005371094, 12.159479141235352, 13.02706527709961, 13.89465045928955, 14.762236595153809, 15.629822731018066, 16.497407913208008, 17.364994049072266, 18.232580184936523, 19.10016632080078, 19.96775245666504, 20.835338592529297, 21.702922821044922, 22.570510864257812, 23.438095092773438, 24.305681228637695, 25.173267364501953, 26.04085350036621, 26.90843963623047, 27.776025772094727, 28.643611907958984, 29.51119613647461, 30.378782272338867, 31.246368408203125, 32.11395263671875, 32.981536865234375, 33.849124908447266, 34.71670913696289, 35.58429718017578, 36.451881408691406, 37.3194694519043, 38.18705368041992, 39.05464172363281]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 9.0, 17.0, 36.0, 65.0, 129.0, 305.0, 1101.0, 5916.0, 95968.0, 864566.0, 73843.0, 5133.0, 936.0, 281.0, 99.0, 54.0, 30.0, 19.0, 13.0, 10.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.517242431640625, -3.36065673828125, -3.204071044921875, -3.0474853515625, -2.890899658203125, -2.73431396484375, -2.577728271484375, -2.421142578125, -2.264556884765625, -2.10797119140625, -1.951385498046875, -1.7947998046875, -1.638214111328125, -1.48162841796875, -1.325042724609375, -1.16845703125, -1.011871337890625, -0.85528564453125, -0.698699951171875, -0.5421142578125, -0.385528564453125, -0.22894287109375, -0.072357177734375, 0.084228515625, 0.240814208984375, 0.39739990234375, 0.553985595703125, 0.7105712890625, 0.867156982421875, 1.02374267578125, 1.180328369140625, 1.3369140625, 1.493499755859375, 1.65008544921875, 1.806671142578125, 1.9632568359375, 2.119842529296875, 2.27642822265625, 2.433013916015625, 2.589599609375, 2.746185302734375, 2.90277099609375, 3.059356689453125, 3.2159423828125, 3.372528076171875, 3.52911376953125, 3.685699462890625, 3.84228515625, 3.998870849609375, 4.15545654296875, 4.312042236328125, 4.4686279296875, 4.625213623046875, 4.78179931640625, 4.938385009765625, 5.094970703125, 5.251556396484375, 5.40814208984375, 5.564727783203125, 5.7213134765625, 5.877899169921875, 6.03448486328125, 6.191070556640625, 6.34765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 13.0, 11.0, 13.0, 11.0, 16.0, 27.0, 27.0, 52.0, 44.0, 62.0, 66.0, 60.0, 57.0, 71.0, 79.0, 44.0, 66.0, 47.0, 46.0, 48.0, 36.0, 27.0, 14.0, 12.0, 15.0, 9.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.3634033203125, -1.322509765625, -1.2816162109375, -1.24072265625, -1.1998291015625, -1.158935546875, -1.1180419921875, -1.0771484375, -1.0362548828125, -0.995361328125, -0.9544677734375, -0.91357421875, -0.8726806640625, -0.831787109375, -0.7908935546875, -0.75, -0.7091064453125, -0.668212890625, -0.6273193359375, -0.58642578125, -0.5455322265625, -0.504638671875, -0.4637451171875, -0.4228515625, -0.3819580078125, -0.341064453125, -0.3001708984375, -0.25927734375, -0.2183837890625, -0.177490234375, -0.1365966796875, -0.095703125, -0.0548095703125, -0.013916015625, 0.0269775390625, 0.06787109375, 0.1087646484375, 0.149658203125, 0.1905517578125, 0.2314453125, 0.2723388671875, 0.313232421875, 0.3541259765625, 0.39501953125, 0.4359130859375, 0.476806640625, 0.5177001953125, 0.55859375, 0.5994873046875, 0.640380859375, 0.6812744140625, 0.72216796875, 0.7630615234375, 0.803955078125, 0.8448486328125, 0.8857421875, 0.9266357421875, 0.967529296875, 1.0084228515625, 1.04931640625, 1.0902099609375, 1.131103515625, 1.1719970703125, 1.212890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 5.0, 3.0, 5.0, 9.0, 11.0, 19.0, 19.0, 34.0, 52.0, 67.0, 125.0, 183.0, 355.0, 843.0, 1955.0, 6446.0, 27510.0, 176202.0, 694042.0, 113512.0, 19368.0, 4803.0, 1543.0, 641.0, 329.0, 139.0, 92.0, 66.0, 64.0, 29.0, 15.0, 16.0, 10.0, 8.0, 4.0, 9.0, 2.0, 2.0, 9.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.661956787109375, -2.57977294921875, -2.497589111328125, -2.4154052734375, -2.333221435546875, -2.25103759765625, -2.168853759765625, -2.086669921875, -2.004486083984375, -1.92230224609375, -1.840118408203125, -1.7579345703125, -1.675750732421875, -1.59356689453125, -1.511383056640625, -1.42919921875, -1.347015380859375, -1.26483154296875, -1.182647705078125, -1.1004638671875, -1.018280029296875, -0.93609619140625, -0.853912353515625, -0.771728515625, -0.689544677734375, -0.60736083984375, -0.525177001953125, -0.4429931640625, -0.360809326171875, -0.27862548828125, -0.196441650390625, -0.1142578125, -0.032073974609375, 0.05010986328125, 0.132293701171875, 0.2144775390625, 0.296661376953125, 0.37884521484375, 0.461029052734375, 0.543212890625, 0.625396728515625, 0.70758056640625, 0.789764404296875, 0.8719482421875, 0.954132080078125, 1.03631591796875, 1.118499755859375, 1.20068359375, 1.282867431640625, 1.36505126953125, 1.447235107421875, 1.5294189453125, 1.611602783203125, 1.69378662109375, 1.775970458984375, 1.858154296875, 1.940338134765625, 2.02252197265625, 2.104705810546875, 2.1868896484375, 2.269073486328125, 2.35125732421875, 2.433441162109375, 2.515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 7.0, 5.0, 11.0, 15.0, 19.0, 22.0, 27.0, 27.0, 33.0, 42.0, 43.0, 58.0, 46.0, 66.0, 60.0, 50.0, 66.0, 54.0, 48.0, 53.0, 33.0, 38.0, 32.0, 31.0, 13.0, 20.0, 18.0, 21.0, 8.0, 3.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.27734375, -3.14697265625, -3.0166015625, -2.88623046875, -2.755859375, -2.62548828125, -2.4951171875, -2.36474609375, -2.234375, -2.10400390625, -1.9736328125, -1.84326171875, -1.712890625, -1.58251953125, -1.4521484375, -1.32177734375, -1.19140625, -1.06103515625, -0.9306640625, -0.80029296875, -0.669921875, -0.53955078125, -0.4091796875, -0.27880859375, -0.1484375, -0.01806640625, 0.1123046875, 0.24267578125, 0.373046875, 0.50341796875, 0.6337890625, 0.76416015625, 0.89453125, 1.02490234375, 1.1552734375, 1.28564453125, 1.416015625, 1.54638671875, 1.6767578125, 1.80712890625, 1.9375, 2.06787109375, 2.1982421875, 2.32861328125, 2.458984375, 2.58935546875, 2.7197265625, 2.85009765625, 2.98046875, 3.11083984375, 3.2412109375, 3.37158203125, 3.501953125, 3.63232421875, 3.7626953125, 3.89306640625, 4.0234375, 4.15380859375, 4.2841796875, 4.41455078125, 4.544921875, 4.67529296875, 4.8056640625, 4.93603515625, 5.06640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 9.0, 7.0, 8.0, 12.0, 26.0, 26.0, 58.0, 98.0, 168.0, 321.0, 655.0, 1226.0, 2654.0, 6031.0, 15783.0, 51632.0, 271385.0, 585943.0, 77658.0, 20909.0, 7635.0, 3226.0, 1485.0, 771.0, 350.0, 196.0, 109.0, 55.0, 44.0, 27.0, 11.0, 15.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8468246459960938, -0.8196258544921875, -0.7924270629882812, -0.765228271484375, -0.7380294799804688, -0.7108306884765625, -0.6836318969726562, -0.65643310546875, -0.6292343139648438, -0.6020355224609375, -0.5748367309570312, -0.547637939453125, -0.5204391479492188, -0.4932403564453125, -0.46604156494140625, -0.4388427734375, -0.41164398193359375, -0.3844451904296875, -0.35724639892578125, -0.330047607421875, -0.30284881591796875, -0.2756500244140625, -0.24845123291015625, -0.22125244140625, -0.19405364990234375, -0.1668548583984375, -0.13965606689453125, -0.112457275390625, -0.08525848388671875, -0.0580596923828125, -0.03086090087890625, -0.003662109375, 0.02353668212890625, 0.0507354736328125, 0.07793426513671875, 0.105133056640625, 0.13233184814453125, 0.1595306396484375, 0.18672943115234375, 0.21392822265625, 0.24112701416015625, 0.2683258056640625, 0.29552459716796875, 0.322723388671875, 0.34992218017578125, 0.3771209716796875, 0.40431976318359375, 0.4315185546875, 0.45871734619140625, 0.4859161376953125, 0.5131149291992188, 0.540313720703125, 0.5675125122070312, 0.5947113037109375, 0.6219100952148438, 0.64910888671875, 0.6763076782226562, 0.7035064697265625, 0.7307052612304688, 0.757904052734375, 0.7851028442382812, 0.8123016357421875, 0.8395004272460938, 0.86669921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 7.0, 3.0, 9.0, 12.0, 20.0, 40.0, 65.0, 105.0, 152.0, 211.0, 127.0, 93.0, 43.0, 32.0, 17.0, 18.0, 14.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003895759582519531, -0.000378243625164032, -0.00036691129207611084, -0.0003555789589881897, -0.00034424662590026855, -0.0003329142928123474, -0.00032158195972442627, -0.0003102496266365051, -0.000298917293548584, -0.00028758496046066284, -0.0002762526273727417, -0.00026492029428482056, -0.0002535879611968994, -0.00024225562810897827, -0.00023092329502105713, -0.00021959096193313599, -0.00020825862884521484, -0.0001969262957572937, -0.00018559396266937256, -0.00017426162958145142, -0.00016292929649353027, -0.00015159696340560913, -0.000140264630317688, -0.00012893229722976685, -0.0001175999641418457, -0.00010626763105392456, -9.493529796600342e-05, -8.360296487808228e-05, -7.227063179016113e-05, -6.093829870223999e-05, -4.960596561431885e-05, -3.8273632526397705e-05, -2.6941299438476562e-05, -1.560896635055542e-05, -4.276633262634277e-06, 7.055699825286865e-06, 1.8388032913208008e-05, 2.972036600112915e-05, 4.105269908905029e-05, 5.2385032176971436e-05, 6.371736526489258e-05, 7.504969835281372e-05, 8.638203144073486e-05, 9.7714364528656e-05, 0.00010904669761657715, 0.00012037903070449829, 0.00013171136379241943, 0.00014304369688034058, 0.00015437602996826172, 0.00016570836305618286, 0.000177040696144104, 0.00018837302923202515, 0.0001997053623199463, 0.00021103769540786743, 0.00022237002849578857, 0.00023370236158370972, 0.00024503469467163086, 0.000256367027759552, 0.00026769936084747314, 0.0002790316939353943, 0.00029036402702331543, 0.00030169636011123657, 0.0003130286931991577, 0.00032436102628707886, 0.000335693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 13.0, 12.0, 17.0, 35.0, 80.0, 149.0, 313.0, 715.0, 1950.0, 5774.0, 22278.0, 130750.0, 735681.0, 120846.0, 21092.0, 5653.0, 1867.0, 711.0, 300.0, 139.0, 61.0, 52.0, 23.0, 13.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.967376708984375, -0.93084716796875, -0.894317626953125, -0.8577880859375, -0.821258544921875, -0.78472900390625, -0.748199462890625, -0.711669921875, -0.675140380859375, -0.63861083984375, -0.602081298828125, -0.5655517578125, -0.529022216796875, -0.49249267578125, -0.455963134765625, -0.41943359375, -0.382904052734375, -0.34637451171875, -0.309844970703125, -0.2733154296875, -0.236785888671875, -0.20025634765625, -0.163726806640625, -0.127197265625, -0.090667724609375, -0.05413818359375, -0.017608642578125, 0.0189208984375, 0.055450439453125, 0.09197998046875, 0.128509521484375, 0.1650390625, 0.201568603515625, 0.23809814453125, 0.274627685546875, 0.3111572265625, 0.347686767578125, 0.38421630859375, 0.420745849609375, 0.457275390625, 0.493804931640625, 0.53033447265625, 0.566864013671875, 0.6033935546875, 0.639923095703125, 0.67645263671875, 0.712982177734375, 0.74951171875, 0.786041259765625, 0.82257080078125, 0.859100341796875, 0.8956298828125, 0.932159423828125, 0.96868896484375, 1.005218505859375, 1.041748046875, 1.078277587890625, 1.11480712890625, 1.151336669921875, 1.1878662109375, 1.224395751953125, 1.26092529296875, 1.297454833984375, 1.333984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 14.0, 12.0, 19.0, 23.0, 30.0, 44.0, 43.0, 62.0, 75.0, 71.0, 78.0, 80.0, 71.0, 78.0, 51.0, 57.0, 33.0, 31.0, 24.0, 15.0, 10.0, 2.0, 8.0, 8.0, 11.0, 4.0, 5.0, 1.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7910308837890625, -0.766143798828125, -0.7412567138671875, -0.71636962890625, -0.6914825439453125, -0.666595458984375, -0.6417083740234375, -0.6168212890625, -0.5919342041015625, -0.567047119140625, -0.5421600341796875, -0.51727294921875, -0.4923858642578125, -0.467498779296875, -0.4426116943359375, -0.417724609375, -0.3928375244140625, -0.367950439453125, -0.3430633544921875, -0.31817626953125, -0.2932891845703125, -0.268402099609375, -0.2435150146484375, -0.2186279296875, -0.1937408447265625, -0.168853759765625, -0.1439666748046875, -0.11907958984375, -0.0941925048828125, -0.069305419921875, -0.0444183349609375, -0.01953125, 0.0053558349609375, 0.030242919921875, 0.0551300048828125, 0.08001708984375, 0.1049041748046875, 0.129791259765625, 0.1546783447265625, 0.1795654296875, 0.2044525146484375, 0.229339599609375, 0.2542266845703125, 0.27911376953125, 0.3040008544921875, 0.328887939453125, 0.3537750244140625, 0.378662109375, 0.4035491943359375, 0.428436279296875, 0.4533233642578125, 0.47821044921875, 0.5030975341796875, 0.527984619140625, 0.5528717041015625, 0.5777587890625, 0.6026458740234375, 0.627532958984375, 0.6524200439453125, 0.67730712890625, 0.7021942138671875, 0.727081298828125, 0.7519683837890625, 0.77685546875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 15.0, 34.0, 95.0, 217.0, 370.0, 152.0, 60.0, 25.0, 10.0, 6.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.86220932006836, -22.836746215820312, -21.811283111572266, -20.785818099975586, -19.76035499572754, -18.734891891479492, -17.709426879882812, -16.683963775634766, -15.658500671386719, -14.633037567138672, -13.607573509216309, -12.582109451293945, -11.556646347045898, -10.531183242797852, -9.505719184875488, -8.480255126953125, -7.454792022705078, -6.429328441619873, -5.403864860534668, -4.378401279449463, -3.352937698364258, -2.3274741172790527, -1.3020105361938477, -0.2765469551086426, 0.7489166259765625, 1.7743802070617676, 2.7998437881469727, 3.8253073692321777, 4.850770950317383, 5.876234531402588, 6.901698112487793, 7.927161693572998, 8.952621459960938, 9.978084564208984, 11.003548622131348, 12.029012680053711, 13.054475784301758, 14.079938888549805, 15.105402946472168, 16.13086700439453, 17.156330108642578, 18.181793212890625, 19.207256317138672, 20.23272132873535, 21.2581844329834, 22.283647537231445, 23.309112548828125, 24.334575653076172, 25.36003875732422, 26.385501861572266, 27.410964965820312, 28.436429977416992, 29.46189308166504, 30.487356185913086, 31.512821197509766, 32.53828430175781, 33.56374740600586, 34.589210510253906, 35.61467361450195, 36.64013671875, 37.66560363769531, 38.69106674194336, 39.716529846191406, 40.74199295043945, 41.7674560546875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 7.0, 6.0, 12.0, 14.0, 15.0, 20.0, 14.0, 34.0, 34.0, 34.0, 52.0, 43.0, 54.0, 80.0, 91.0, 101.0, 69.0, 56.0, 37.0, 36.0, 30.0, 27.0, 29.0, 23.0, 10.0, 14.0, 8.0, 15.0, 8.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.43801498413086, -17.904478073120117, -17.370943069458008, -16.837406158447266, -16.303871154785156, -15.77033519744873, -15.236799240112305, -14.703262329101562, -14.169727325439453, -13.636191368103027, -13.102655410766602, -12.569119453430176, -12.03558349609375, -11.502047538757324, -10.968511581420898, -10.434974670410156, -9.90143871307373, -9.367902755737305, -8.834366798400879, -8.300830841064453, -7.767294883728027, -7.233758926391602, -6.700222492218018, -6.166686534881592, -5.633150577545166, -5.09961462020874, -4.5660786628723145, -4.0325422286987305, -3.499006509780884, -2.965470552444458, -2.431934356689453, -1.8983983993530273, -1.3648624420166016, -0.831326425075531, -0.29779040813446045, 0.23574566841125488, 0.7692816257476807, 1.3028175830841064, 1.8363537788391113, 2.369889736175537, 2.903425693511963, 3.4369616508483887, 3.9704976081848145, 4.504034042358398, 5.037569999694824, 5.57110595703125, 6.104641914367676, 6.638177871704102, 7.171713829040527, 7.705249786376953, 8.238785743713379, 8.772321701049805, 9.30585765838623, 9.839393615722656, 10.372930526733398, 10.906465530395508, 11.44000244140625, 11.973538398742676, 12.507074356079102, 13.040610313415527, 13.574146270751953, 14.107682228088379, 14.641218185424805, 15.174755096435547, 15.708290100097656]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 24.0, 47.0, 152.0, 526.0, 3904.0, 195221.0, 3979135.0, 13214.0, 1398.0, 354.0, 128.0, 52.0, 35.0, 15.0, 12.0, 10.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -7.01324462890625, -6.8389892578125, -6.66473388671875, -6.490478515625, -6.31622314453125, -6.1419677734375, -5.96771240234375, -5.79345703125, -5.61920166015625, -5.4449462890625, -5.27069091796875, -5.096435546875, -4.92218017578125, -4.7479248046875, -4.57366943359375, -4.3994140625, -4.22515869140625, -4.0509033203125, -3.87664794921875, -3.702392578125, -3.52813720703125, -3.3538818359375, -3.17962646484375, -3.00537109375, -2.83111572265625, -2.6568603515625, -2.48260498046875, -2.308349609375, -2.13409423828125, -1.9598388671875, -1.78558349609375, -1.611328125, -1.43707275390625, -1.2628173828125, -1.08856201171875, -0.914306640625, -0.74005126953125, -0.5657958984375, -0.39154052734375, -0.21728515625, -0.04302978515625, 0.1312255859375, 0.30548095703125, 0.479736328125, 0.65399169921875, 0.8282470703125, 1.00250244140625, 1.1767578125, 1.35101318359375, 1.5252685546875, 1.69952392578125, 1.873779296875, 2.04803466796875, 2.2222900390625, 2.39654541015625, 2.57080078125, 2.74505615234375, 2.9193115234375, 3.09356689453125, 3.267822265625, 3.44207763671875, 3.6163330078125, 3.79058837890625, 3.96484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 8.0, 11.0, 17.0, 17.0, 24.0, 28.0, 42.0, 45.0, 55.0, 46.0, 66.0, 53.0, 67.0, 84.0, 62.0, 54.0, 54.0, 41.0, 38.0, 27.0, 36.0, 26.0, 28.0, 10.0, 8.0, 7.0, 8.0, 9.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2265625, -1.1894073486328125, -1.152252197265625, -1.1150970458984375, -1.07794189453125, -1.0407867431640625, -1.003631591796875, -0.9664764404296875, -0.9293212890625, -0.8921661376953125, -0.855010986328125, -0.8178558349609375, -0.78070068359375, -0.7435455322265625, -0.706390380859375, -0.6692352294921875, -0.632080078125, -0.5949249267578125, -0.557769775390625, -0.5206146240234375, -0.48345947265625, -0.4463043212890625, -0.409149169921875, -0.3719940185546875, -0.3348388671875, -0.2976837158203125, -0.260528564453125, -0.2233734130859375, -0.18621826171875, -0.1490631103515625, -0.111907958984375, -0.0747528076171875, -0.03759765625, -0.0004425048828125, 0.036712646484375, 0.0738677978515625, 0.11102294921875, 0.1481781005859375, 0.185333251953125, 0.2224884033203125, 0.2596435546875, 0.2967987060546875, 0.333953857421875, 0.3711090087890625, 0.40826416015625, 0.4454193115234375, 0.482574462890625, 0.5197296142578125, 0.556884765625, 0.5940399169921875, 0.631195068359375, 0.6683502197265625, 0.70550537109375, 0.7426605224609375, 0.779815673828125, 0.8169708251953125, 0.8541259765625, 0.8912811279296875, 0.928436279296875, 0.9655914306640625, 1.00274658203125, 1.0399017333984375, 1.077056884765625, 1.1142120361328125, 1.1513671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 10.0, 19.0, 40.0, 68.0, 122.0, 231.0, 610.0, 2926.0, 35783.0, 3829400.0, 315256.0, 7947.0, 1157.0, 382.0, 153.0, 60.0, 39.0, 22.0, 14.0, 12.0, 1.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.195068359375, -3.06591796875, -2.936767578125, -2.8076171875, -2.678466796875, -2.54931640625, -2.420166015625, -2.291015625, -2.161865234375, -2.03271484375, -1.903564453125, -1.7744140625, -1.645263671875, -1.51611328125, -1.386962890625, -1.2578125, -1.128662109375, -0.99951171875, -0.870361328125, -0.7412109375, -0.612060546875, -0.48291015625, -0.353759765625, -0.224609375, -0.095458984375, 0.03369140625, 0.162841796875, 0.2919921875, 0.421142578125, 0.55029296875, 0.679443359375, 0.80859375, 0.937744140625, 1.06689453125, 1.196044921875, 1.3251953125, 1.454345703125, 1.58349609375, 1.712646484375, 1.841796875, 1.970947265625, 2.10009765625, 2.229248046875, 2.3583984375, 2.487548828125, 2.61669921875, 2.745849609375, 2.875, 3.004150390625, 3.13330078125, 3.262451171875, 3.3916015625, 3.520751953125, 3.64990234375, 3.779052734375, 3.908203125, 4.037353515625, 4.16650390625, 4.295654296875, 4.4248046875, 4.553955078125, 4.68310546875, 4.812255859375, 4.94140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 7.0, 16.0, 18.0, 22.0, 37.0, 83.0, 120.0, 199.0, 393.0, 658.0, 895.0, 697.0, 368.0, 238.0, 123.0, 68.0, 38.0, 20.0, 25.0, 16.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.4751434326171875, -2.407318115234375, -2.3394927978515625, -2.27166748046875, -2.2038421630859375, -2.136016845703125, -2.0681915283203125, -2.0003662109375, -1.9325408935546875, -1.864715576171875, -1.7968902587890625, -1.72906494140625, -1.6612396240234375, -1.593414306640625, -1.5255889892578125, -1.457763671875, -1.3899383544921875, -1.322113037109375, -1.2542877197265625, -1.18646240234375, -1.1186370849609375, -1.050811767578125, -0.9829864501953125, -0.9151611328125, -0.8473358154296875, -0.779510498046875, -0.7116851806640625, -0.64385986328125, -0.5760345458984375, -0.508209228515625, -0.4403839111328125, -0.37255859375, -0.3047332763671875, -0.236907958984375, -0.1690826416015625, -0.10125732421875, -0.0334320068359375, 0.034393310546875, 0.1022186279296875, 0.1700439453125, 0.2378692626953125, 0.305694580078125, 0.3735198974609375, 0.44134521484375, 0.5091705322265625, 0.576995849609375, 0.6448211669921875, 0.712646484375, 0.7804718017578125, 0.848297119140625, 0.9161224365234375, 0.98394775390625, 1.0517730712890625, 1.119598388671875, 1.1874237060546875, 1.2552490234375, 1.3230743408203125, 1.390899658203125, 1.4587249755859375, 1.52655029296875, 1.5943756103515625, 1.662200927734375, 1.7300262451171875, 1.7978515625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 11.0, 33.0, 73.0, 204.0, 276.0, 220.0, 114.0, 38.0, 16.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-43.545555114746094, -42.720123291015625, -41.894691467285156, -41.06925582885742, -40.24382400512695, -39.418392181396484, -38.592960357666016, -37.76752853393555, -36.94209289550781, -36.116661071777344, -35.291229248046875, -34.46579360961914, -33.64036178588867, -32.8149299621582, -31.989498138427734, -31.164066314697266, -30.338634490966797, -29.513202667236328, -28.687768936157227, -27.862337112426758, -27.036903381347656, -26.211471557617188, -25.38603973388672, -24.56060791015625, -23.73517417907715, -22.90974235534668, -22.084308624267578, -21.25887680053711, -20.43344497680664, -19.60801124572754, -18.78257942199707, -17.95714569091797, -17.1317138671875, -16.30628204345703, -15.48084831237793, -14.655416488647461, -13.829983711242676, -13.00455093383789, -12.179119110107422, -11.353686332702637, -10.528254508972168, -9.702821731567383, -8.877389907836914, -8.051957130432129, -7.226524353027344, -6.401091575622559, -5.575659275054932, -4.750226974487305, -3.9247941970825195, -3.0993616580963135, -2.2739291191101074, -1.4484965801239014, -0.6230640411376953, 0.20236873626708984, 1.0278010368347168, 1.8532333374023438, 2.678666114807129, 3.504098653793335, 4.329531192779541, 5.154963493347168, 5.980396270751953, 6.805829048156738, 7.631261348724365, 8.456693649291992, 9.282126426696777]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 7.0, 9.0, 10.0, 11.0, 11.0, 15.0, 19.0, 18.0, 26.0, 28.0, 30.0, 41.0, 40.0, 50.0, 50.0, 37.0, 48.0, 63.0, 52.0, 50.0, 60.0, 59.0, 44.0, 33.0, 24.0, 20.0, 21.0, 17.0, 20.0, 10.0, 13.0, 14.0, 9.0, 7.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.044180870056152, -7.785304069519043, -7.526427268981934, -7.267550468444824, -7.008673667907715, -6.7497968673706055, -6.490919589996338, -6.2320427894592285, -5.973165988922119, -5.71428918838501, -5.4554123878479, -5.196535587310791, -4.937658309936523, -4.678781509399414, -4.419904708862305, -4.161027908325195, -3.902151107788086, -3.6432743072509766, -3.384397506713867, -3.1255204677581787, -2.8666436672210693, -2.60776686668396, -2.3488898277282715, -2.090013027191162, -1.8311362266540527, -1.5722594261169434, -1.3133825063705444, -1.0545055866241455, -0.7956287860870361, -0.5367519855499268, -0.27787506580352783, -0.018998146057128906, 0.23987865447998047, 0.4987555146217346, 0.7576323747634888, 1.0165092945098877, 1.275386095046997, 1.5342628955841064, 1.7931398153305054, 2.0520167350769043, 2.3108935356140137, 2.569770336151123, 2.8286471366882324, 3.087524175643921, 3.3464009761810303, 3.6052777767181396, 3.864154815673828, 4.1230316162109375, 4.381908416748047, 4.640785217285156, 4.899662017822266, 5.158538818359375, 5.417415618896484, 5.676292419433594, 5.935169696807861, 6.194046497344971, 6.45292329788208, 6.7118000984191895, 6.970676898956299, 7.229553699493408, 7.488430976867676, 7.747307777404785, 8.006184577941895, 8.265061378479004, 8.523938179016113]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 5.0, 11.0, 8.0, 11.0, 12.0, 29.0, 44.0, 89.0, 130.0, 276.0, 772.0, 2926.0, 20608.0, 477416.0, 519470.0, 22248.0, 3080.0, 801.0, 288.0, 114.0, 57.0, 52.0, 37.0, 21.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3359375, -4.20050048828125, -4.0650634765625, -3.92962646484375, -3.794189453125, -3.65875244140625, -3.5233154296875, -3.38787841796875, -3.25244140625, -3.11700439453125, -2.9815673828125, -2.84613037109375, -2.710693359375, -2.57525634765625, -2.4398193359375, -2.30438232421875, -2.1689453125, -2.03350830078125, -1.8980712890625, -1.76263427734375, -1.627197265625, -1.49176025390625, -1.3563232421875, -1.22088623046875, -1.08544921875, -0.95001220703125, -0.8145751953125, -0.67913818359375, -0.543701171875, -0.40826416015625, -0.2728271484375, -0.13739013671875, -0.001953125, 0.13348388671875, 0.2689208984375, 0.40435791015625, 0.539794921875, 0.67523193359375, 0.8106689453125, 0.94610595703125, 1.08154296875, 1.21697998046875, 1.3524169921875, 1.48785400390625, 1.623291015625, 1.75872802734375, 1.8941650390625, 2.02960205078125, 2.1650390625, 2.30047607421875, 2.4359130859375, 2.57135009765625, 2.706787109375, 2.84222412109375, 2.9776611328125, 3.11309814453125, 3.24853515625, 3.38397216796875, 3.5194091796875, 3.65484619140625, 3.790283203125, 3.92572021484375, 4.0611572265625, 4.19659423828125, 4.33203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 8.0, 17.0, 31.0, 39.0, 50.0, 55.0, 75.0, 87.0, 86.0, 90.0, 83.0, 82.0, 75.0, 63.0, 42.0, 27.0, 25.0, 24.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.631072998046875, -1.57562255859375, -1.520172119140625, -1.4647216796875, -1.409271240234375, -1.35382080078125, -1.298370361328125, -1.242919921875, -1.187469482421875, -1.13201904296875, -1.076568603515625, -1.0211181640625, -0.965667724609375, -0.91021728515625, -0.854766845703125, -0.79931640625, -0.743865966796875, -0.68841552734375, -0.632965087890625, -0.5775146484375, -0.522064208984375, -0.46661376953125, -0.411163330078125, -0.355712890625, -0.300262451171875, -0.24481201171875, -0.189361572265625, -0.1339111328125, -0.078460693359375, -0.02301025390625, 0.032440185546875, 0.087890625, 0.143341064453125, 0.19879150390625, 0.254241943359375, 0.3096923828125, 0.365142822265625, 0.42059326171875, 0.476043701171875, 0.531494140625, 0.586944580078125, 0.64239501953125, 0.697845458984375, 0.7532958984375, 0.808746337890625, 0.86419677734375, 0.919647216796875, 0.97509765625, 1.030548095703125, 1.08599853515625, 1.141448974609375, 1.1968994140625, 1.252349853515625, 1.30780029296875, 1.363250732421875, 1.418701171875, 1.474151611328125, 1.52960205078125, 1.585052490234375, 1.6405029296875, 1.695953369140625, 1.75140380859375, 1.806854248046875, 1.8623046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 9.0, 11.0, 18.0, 44.0, 42.0, 89.0, 126.0, 201.0, 389.0, 994.0, 2871.0, 14264.0, 167190.0, 809339.0, 43639.0, 6325.0, 1643.0, 611.0, 262.0, 147.0, 101.0, 73.0, 44.0, 32.0, 13.0, 18.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.674774169921875, -2.55462646484375, -2.434478759765625, -2.3143310546875, -2.194183349609375, -2.07403564453125, -1.953887939453125, -1.833740234375, -1.713592529296875, -1.59344482421875, -1.473297119140625, -1.3531494140625, -1.233001708984375, -1.11285400390625, -0.992706298828125, -0.87255859375, -0.752410888671875, -0.63226318359375, -0.512115478515625, -0.3919677734375, -0.271820068359375, -0.15167236328125, -0.031524658203125, 0.088623046875, 0.208770751953125, 0.32891845703125, 0.449066162109375, 0.5692138671875, 0.689361572265625, 0.80950927734375, 0.929656982421875, 1.0498046875, 1.169952392578125, 1.29010009765625, 1.410247802734375, 1.5303955078125, 1.650543212890625, 1.77069091796875, 1.890838623046875, 2.010986328125, 2.131134033203125, 2.25128173828125, 2.371429443359375, 2.4915771484375, 2.611724853515625, 2.73187255859375, 2.852020263671875, 2.97216796875, 3.092315673828125, 3.21246337890625, 3.332611083984375, 3.4527587890625, 3.572906494140625, 3.69305419921875, 3.813201904296875, 3.933349609375, 4.053497314453125, 4.17364501953125, 4.293792724609375, 4.4139404296875, 4.534088134765625, 4.65423583984375, 4.774383544921875, 4.89453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 18.0, 17.0, 19.0, 35.0, 31.0, 41.0, 54.0, 79.0, 75.0, 80.0, 65.0, 66.0, 76.0, 63.0, 44.0, 41.0, 38.0, 20.0, 20.0, 16.0, 10.0, 12.0, 9.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.694580078125, -4.53369140625, -4.372802734375, -4.2119140625, -4.051025390625, -3.89013671875, -3.729248046875, -3.568359375, -3.407470703125, -3.24658203125, -3.085693359375, -2.9248046875, -2.763916015625, -2.60302734375, -2.442138671875, -2.28125, -2.120361328125, -1.95947265625, -1.798583984375, -1.6376953125, -1.476806640625, -1.31591796875, -1.155029296875, -0.994140625, -0.833251953125, -0.67236328125, -0.511474609375, -0.3505859375, -0.189697265625, -0.02880859375, 0.132080078125, 0.29296875, 0.453857421875, 0.61474609375, 0.775634765625, 0.9365234375, 1.097412109375, 1.25830078125, 1.419189453125, 1.580078125, 1.740966796875, 1.90185546875, 2.062744140625, 2.2236328125, 2.384521484375, 2.54541015625, 2.706298828125, 2.8671875, 3.028076171875, 3.18896484375, 3.349853515625, 3.5107421875, 3.671630859375, 3.83251953125, 3.993408203125, 4.154296875, 4.315185546875, 4.47607421875, 4.636962890625, 4.7978515625, 4.958740234375, 5.11962890625, 5.280517578125, 5.44140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 6.0, 11.0, 11.0, 11.0, 14.0, 34.0, 48.0, 64.0, 110.0, 156.0, 279.0, 545.0, 1024.0, 2449.0, 6701.0, 23310.0, 148327.0, 778714.0, 64569.0, 13998.0, 4510.0, 1800.0, 777.0, 426.0, 226.0, 147.0, 84.0, 61.0, 33.0, 20.0, 15.0, 13.0, 10.0, 4.0, 10.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.154296875, -1.1216049194335938, -1.0889129638671875, -1.0562210083007812, -1.023529052734375, -0.9908370971679688, -0.9581451416015625, -0.9254531860351562, -0.89276123046875, -0.8600692749023438, -0.8273773193359375, -0.7946853637695312, -0.761993408203125, -0.7293014526367188, -0.6966094970703125, -0.6639175415039062, -0.6312255859375, -0.5985336303710938, -0.5658416748046875, -0.5331497192382812, -0.500457763671875, -0.46776580810546875, -0.4350738525390625, -0.40238189697265625, -0.36968994140625, -0.33699798583984375, -0.3043060302734375, -0.27161407470703125, -0.238922119140625, -0.20623016357421875, -0.1735382080078125, -0.14084625244140625, -0.108154296875, -0.07546234130859375, -0.0427703857421875, -0.01007843017578125, 0.022613525390625, 0.05530548095703125, 0.0879974365234375, 0.12068939208984375, 0.15338134765625, 0.18607330322265625, 0.2187652587890625, 0.25145721435546875, 0.284149169921875, 0.31684112548828125, 0.3495330810546875, 0.38222503662109375, 0.4149169921875, 0.44760894775390625, 0.4803009033203125, 0.5129928588867188, 0.545684814453125, 0.5783767700195312, 0.6110687255859375, 0.6437606811523438, 0.67645263671875, 0.7091445922851562, 0.7418365478515625, 0.7745285034179688, 0.807220458984375, 0.8399124145507812, 0.8726043701171875, 0.9052963256835938, 0.93798828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 9.0, 18.0, 16.0, 25.0, 40.0, 63.0, 84.0, 98.0, 174.0, 164.0, 74.0, 56.0, 43.0, 33.0, 15.0, 7.0, 14.0, 4.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002396106719970703, -0.00023225322365760803, -0.00022489577531814575, -0.00021753832697868347, -0.0002101808786392212, -0.0002028234302997589, -0.00019546598196029663, -0.00018810853362083435, -0.00018075108528137207, -0.0001733936369419098, -0.0001660361886024475, -0.00015867874026298523, -0.00015132129192352295, -0.00014396384358406067, -0.0001366063952445984, -0.0001292489469051361, -0.00012189149856567383, -0.00011453405022621155, -0.00010717660188674927, -9.981915354728699e-05, -9.246170520782471e-05, -8.510425686836243e-05, -7.774680852890015e-05, -7.038936018943787e-05, -6.303191184997559e-05, -5.5674463510513306e-05, -4.8317015171051025e-05, -4.0959566831588745e-05, -3.3602118492126465e-05, -2.6244670152664185e-05, -1.8887221813201904e-05, -1.1529773473739624e-05, -4.172325134277344e-06, 3.1851232051849365e-06, 1.0542571544647217e-05, 1.7900019884109497e-05, 2.5257468223571777e-05, 3.261491656303406e-05, 3.997236490249634e-05, 4.732981324195862e-05, 5.46872615814209e-05, 6.204470992088318e-05, 6.940215826034546e-05, 7.675960659980774e-05, 8.411705493927002e-05, 9.14745032787323e-05, 9.883195161819458e-05, 0.00010618939995765686, 0.00011354684829711914, 0.00012090429663658142, 0.0001282617449760437, 0.00013561919331550598, 0.00014297664165496826, 0.00015033408999443054, 0.00015769153833389282, 0.0001650489866733551, 0.00017240643501281738, 0.00017976388335227966, 0.00018712133169174194, 0.00019447878003120422, 0.0002018362283706665, 0.00020919367671012878, 0.00021655112504959106, 0.00022390857338905334, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 21.0, 10.0, 39.0, 50.0, 75.0, 114.0, 181.0, 284.0, 572.0, 1104.0, 2320.0, 5826.0, 15667.0, 53904.0, 578123.0, 318236.0, 47856.0, 14111.0, 5315.0, 2324.0, 1029.0, 558.0, 297.0, 171.0, 110.0, 75.0, 31.0, 41.0, 22.0, 15.0, 8.0, 15.0, 15.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8271484375, -0.7995376586914062, -0.7719268798828125, -0.7443161010742188, -0.716705322265625, -0.6890945434570312, -0.6614837646484375, -0.6338729858398438, -0.60626220703125, -0.5786514282226562, -0.5510406494140625, -0.5234298706054688, -0.495819091796875, -0.46820831298828125, -0.4405975341796875, -0.41298675537109375, -0.3853759765625, -0.35776519775390625, -0.3301544189453125, -0.30254364013671875, -0.274932861328125, -0.24732208251953125, -0.2197113037109375, -0.19210052490234375, -0.16448974609375, -0.13687896728515625, -0.1092681884765625, -0.08165740966796875, -0.054046630859375, -0.02643585205078125, 0.0011749267578125, 0.02878570556640625, 0.056396484375, 0.08400726318359375, 0.1116180419921875, 0.13922882080078125, 0.166839599609375, 0.19445037841796875, 0.2220611572265625, 0.24967193603515625, 0.27728271484375, 0.30489349365234375, 0.3325042724609375, 0.36011505126953125, 0.387725830078125, 0.41533660888671875, 0.4429473876953125, 0.47055816650390625, 0.4981689453125, 0.5257797241210938, 0.5533905029296875, 0.5810012817382812, 0.608612060546875, 0.6362228393554688, 0.6638336181640625, 0.6914443969726562, 0.71905517578125, 0.7466659545898438, 0.7742767333984375, 0.8018875122070312, 0.829498291015625, 0.8571090698242188, 0.8847198486328125, 0.9123306274414062, 0.93994140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 9.0, 5.0, 5.0, 4.0, 9.0, 26.0, 9.0, 14.0, 30.0, 33.0, 46.0, 69.0, 106.0, 134.0, 114.0, 101.0, 81.0, 54.0, 26.0, 32.0, 22.0, 16.0, 13.0, 11.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0047836303710938, -0.9744110107421875, -0.9440383911132812, -0.913665771484375, -0.8832931518554688, -0.8529205322265625, -0.8225479125976562, -0.79217529296875, -0.7618026733398438, -0.7314300537109375, -0.7010574340820312, -0.670684814453125, -0.6403121948242188, -0.6099395751953125, -0.5795669555664062, -0.5491943359375, -0.5188217163085938, -0.4884490966796875, -0.45807647705078125, -0.427703857421875, -0.39733123779296875, -0.3669586181640625, -0.33658599853515625, -0.30621337890625, -0.27584075927734375, -0.2454681396484375, -0.21509552001953125, -0.184722900390625, -0.15435028076171875, -0.1239776611328125, -0.09360504150390625, -0.063232421875, -0.03285980224609375, -0.0024871826171875, 0.02788543701171875, 0.058258056640625, 0.08863067626953125, 0.1190032958984375, 0.14937591552734375, 0.17974853515625, 0.21012115478515625, 0.2404937744140625, 0.27086639404296875, 0.301239013671875, 0.33161163330078125, 0.3619842529296875, 0.39235687255859375, 0.4227294921875, 0.45310211181640625, 0.4834747314453125, 0.5138473510742188, 0.544219970703125, 0.5745925903320312, 0.6049652099609375, 0.6353378295898438, 0.66571044921875, 0.6960830688476562, 0.7264556884765625, 0.7568283081054688, 0.787200927734375, 0.8175735473632812, 0.8479461669921875, 0.8783187866210938, 0.90869140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 5.0, 9.0, 16.0, 29.0, 69.0, 162.0, 338.0, 143.0, 106.0, 49.0, 27.0, 12.0, 10.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.242923736572266, -21.51378631591797, -20.784648895263672, -20.055511474609375, -19.326372146606445, -18.59723472595215, -17.86809730529785, -17.138959884643555, -16.409820556640625, -15.680683135986328, -14.951544761657715, -14.222407341003418, -13.493268966674805, -12.764131546020508, -12.034994125366211, -11.305856704711914, -10.576719284057617, -9.84758186340332, -9.118443489074707, -8.38930606842041, -7.660168170928955, -6.9310302734375, -6.201892852783203, -5.472754955291748, -4.743617057800293, -4.014479160308838, -3.285341501235962, -2.556203842163086, -1.8270659446716309, -1.0979280471801758, -0.3687906265258789, 0.36034727096557617, 1.089487075805664, 1.8186248540878296, 2.547762632369995, 3.276900291442871, 4.006038188934326, 4.735176086425781, 5.464313507080078, 6.193451404571533, 6.922589302062988, 7.651727199554443, 8.380865097045898, 9.110002517700195, 9.839139938354492, 10.568278312683105, 11.297415733337402, 12.026554107666016, 12.755691528320312, 13.48482894897461, 14.213967323303223, 14.94310474395752, 15.672243118286133, 16.40138053894043, 17.130517959594727, 17.859655380249023, 18.588794708251953, 19.31793212890625, 20.047069549560547, 20.776206970214844, 21.505346298217773, 22.23448371887207, 22.963621139526367, 23.692758560180664, 24.42189598083496]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 1.0, 7.0, 7.0, 8.0, 16.0, 17.0, 19.0, 21.0, 23.0, 27.0, 25.0, 37.0, 38.0, 40.0, 56.0, 86.0, 101.0, 96.0, 57.0, 49.0, 37.0, 30.0, 25.0, 15.0, 39.0, 22.0, 16.0, 13.0, 17.0, 8.0, 9.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.328241348266602, -14.824905395507812, -14.321569442749023, -13.81823444366455, -13.314898490905762, -12.811562538146973, -12.3082275390625, -11.804891586303711, -11.301555633544922, -10.798219680786133, -10.294883728027344, -9.791548728942871, -9.288212776184082, -8.784876823425293, -8.28154182434082, -7.778205871582031, -7.274869918823242, -6.771533966064453, -6.268198490142822, -5.764863014221191, -5.261527061462402, -4.758191108703613, -4.254855632781982, -3.7515199184417725, -3.2481842041015625, -2.7448484897613525, -2.2415127754211426, -1.7381770610809326, -1.2348413467407227, -0.7315056324005127, -0.22816991806030273, 0.2751657962799072, 0.77850341796875, 1.28183913230896, 1.78517484664917, 2.28851056098938, 2.79184627532959, 3.2951819896698, 3.7985177040100098, 4.301853179931641, 4.80518913269043, 5.308525085449219, 5.81186056137085, 6.3151960372924805, 6.8185319900512695, 7.321867942810059, 7.8252034187316895, 8.32853889465332, 8.83187484741211, 9.335210800170898, 9.838546752929688, 10.34188175201416, 10.84521770477295, 11.348553657531738, 11.851888656616211, 12.355224609375, 12.858560562133789, 13.361896514892578, 13.865232467651367, 14.36856746673584, 14.871903419494629, 15.375239372253418, 15.87857437133789, 16.38191032409668, 16.88524627685547]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 11.0, 13.0, 20.0, 40.0, 74.0, 176.0, 670.0, 5215.0, 524565.0, 3649411.0, 12114.0, 1425.0, 318.0, 109.0, 43.0, 18.0, 13.0, 6.0, 1.0, 11.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.24609375, -7.07421875, -6.90234375, -6.73046875, -6.55859375, -6.38671875, -6.21484375, -6.04296875, -5.87109375, -5.69921875, -5.52734375, -5.35546875, -5.18359375, -5.01171875, -4.83984375, -4.66796875, -4.49609375, -4.32421875, -4.15234375, -3.98046875, -3.80859375, -3.63671875, -3.46484375, -3.29296875, -3.12109375, -2.94921875, -2.77734375, -2.60546875, -2.43359375, -2.26171875, -2.08984375, -1.91796875, -1.74609375, -1.57421875, -1.40234375, -1.23046875, -1.05859375, -0.88671875, -0.71484375, -0.54296875, -0.37109375, -0.19921875, -0.02734375, 0.14453125, 0.31640625, 0.48828125, 0.66015625, 0.83203125, 1.00390625, 1.17578125, 1.34765625, 1.51953125, 1.69140625, 1.86328125, 2.03515625, 2.20703125, 2.37890625, 2.55078125, 2.72265625, 2.89453125, 3.06640625, 3.23828125, 3.41015625, 3.58203125, 3.75390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 8.0, 12.0, 10.0, 15.0, 32.0, 36.0, 50.0, 40.0, 56.0, 56.0, 68.0, 77.0, 76.0, 78.0, 81.0, 58.0, 60.0, 53.0, 35.0, 26.0, 16.0, 15.0, 9.0, 10.0, 4.0, 6.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4970703125, -1.44927978515625, -1.4014892578125, -1.35369873046875, -1.305908203125, -1.25811767578125, -1.2103271484375, -1.16253662109375, -1.11474609375, -1.06695556640625, -1.0191650390625, -0.97137451171875, -0.923583984375, -0.87579345703125, -0.8280029296875, -0.78021240234375, -0.732421875, -0.68463134765625, -0.6368408203125, -0.58905029296875, -0.541259765625, -0.49346923828125, -0.4456787109375, -0.39788818359375, -0.35009765625, -0.30230712890625, -0.2545166015625, -0.20672607421875, -0.158935546875, -0.11114501953125, -0.0633544921875, -0.01556396484375, 0.0322265625, 0.08001708984375, 0.1278076171875, 0.17559814453125, 0.223388671875, 0.27117919921875, 0.3189697265625, 0.36676025390625, 0.41455078125, 0.46234130859375, 0.5101318359375, 0.55792236328125, 0.605712890625, 0.65350341796875, 0.7012939453125, 0.74908447265625, 0.796875, 0.84466552734375, 0.8924560546875, 0.94024658203125, 0.988037109375, 1.03582763671875, 1.0836181640625, 1.13140869140625, 1.17919921875, 1.22698974609375, 1.2747802734375, 1.32257080078125, 1.370361328125, 1.41815185546875, 1.4659423828125, 1.51373291015625, 1.5615234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 9.0, 16.0, 19.0, 20.0, 51.0, 88.0, 170.0, 430.0, 2036.0, 21113.0, 3709769.0, 451320.0, 7604.0, 1057.0, 261.0, 109.0, 80.0, 40.0, 29.0, 20.0, 8.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.696746826171875, -3.54779052734375, -3.398834228515625, -3.2498779296875, -3.100921630859375, -2.95196533203125, -2.803009033203125, -2.654052734375, -2.505096435546875, -2.35614013671875, -2.207183837890625, -2.0582275390625, -1.909271240234375, -1.76031494140625, -1.611358642578125, -1.46240234375, -1.313446044921875, -1.16448974609375, -1.015533447265625, -0.8665771484375, -0.717620849609375, -0.56866455078125, -0.419708251953125, -0.270751953125, -0.121795654296875, 0.02716064453125, 0.176116943359375, 0.3250732421875, 0.474029541015625, 0.62298583984375, 0.771942138671875, 0.9208984375, 1.069854736328125, 1.21881103515625, 1.367767333984375, 1.5167236328125, 1.665679931640625, 1.81463623046875, 1.963592529296875, 2.112548828125, 2.261505126953125, 2.41046142578125, 2.559417724609375, 2.7083740234375, 2.857330322265625, 3.00628662109375, 3.155242919921875, 3.30419921875, 3.453155517578125, 3.60211181640625, 3.751068115234375, 3.9000244140625, 4.048980712890625, 4.19793701171875, 4.346893310546875, 4.495849609375, 4.644805908203125, 4.79376220703125, 4.942718505859375, 5.0916748046875, 5.240631103515625, 5.38958740234375, 5.538543701171875, 5.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 14.0, 23.0, 18.0, 37.0, 34.0, 64.0, 104.0, 146.0, 270.0, 356.0, 527.0, 638.0, 562.0, 431.0, 282.0, 174.0, 103.0, 74.0, 54.0, 34.0, 27.0, 19.0, 14.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.94140625, -1.886871337890625, -1.83233642578125, -1.777801513671875, -1.7232666015625, -1.668731689453125, -1.61419677734375, -1.559661865234375, -1.505126953125, -1.450592041015625, -1.39605712890625, -1.341522216796875, -1.2869873046875, -1.232452392578125, -1.17791748046875, -1.123382568359375, -1.06884765625, -1.014312744140625, -0.95977783203125, -0.905242919921875, -0.8507080078125, -0.796173095703125, -0.74163818359375, -0.687103271484375, -0.632568359375, -0.578033447265625, -0.52349853515625, -0.468963623046875, -0.4144287109375, -0.359893798828125, -0.30535888671875, -0.250823974609375, -0.1962890625, -0.141754150390625, -0.08721923828125, -0.032684326171875, 0.0218505859375, 0.076385498046875, 0.13092041015625, 0.185455322265625, 0.239990234375, 0.294525146484375, 0.34906005859375, 0.403594970703125, 0.4581298828125, 0.512664794921875, 0.56719970703125, 0.621734619140625, 0.67626953125, 0.730804443359375, 0.78533935546875, 0.839874267578125, 0.8944091796875, 0.948944091796875, 1.00347900390625, 1.058013916015625, 1.112548828125, 1.167083740234375, 1.22161865234375, 1.276153564453125, 1.3306884765625, 1.385223388671875, 1.43975830078125, 1.494293212890625, 1.548828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 24.0, 30.0, 58.0, 76.0, 135.0, 162.0, 159.0, 112.0, 90.0, 55.0, 18.0, 14.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.80241584777832, -20.313108444213867, -19.82379913330078, -19.334491729736328, -18.845184326171875, -18.355876922607422, -17.866567611694336, -17.377260208129883, -16.88795280456543, -16.398645401000977, -15.909337043762207, -15.420028686523438, -14.930721282958984, -14.441412925720215, -13.952104568481445, -13.462797164916992, -12.973487854003906, -12.484179496765137, -11.994872093200684, -11.505563735961914, -11.016256332397461, -10.526947975158691, -10.037639617919922, -9.548332214355469, -9.059024810791016, -8.569716453552246, -8.080409049987793, -7.591100692749023, -7.101792812347412, -6.612484931945801, -6.1231770515441895, -5.633869171142578, -5.144560813903809, -4.655252933502197, -4.165945053100586, -3.6766369342803955, -3.187328815460205, -2.6980209350585938, -2.2087130546569824, -1.719404935836792, -1.2300970554351807, -0.7407890558242798, -0.2514811158180237, 0.23782682418823242, 0.7271348237991333, 1.2164428234100342, 1.7057507038116455, 2.195058822631836, 2.6843667030334473, 3.1736745834350586, 3.662982702255249, 4.152290344238281, 4.641598701477051, 5.130906581878662, 5.620214462280273, 6.109522819519043, 6.598830223083496, 7.088138103485107, 7.577445983886719, 8.066754341125488, 8.556061744689941, 9.045370101928711, 9.534677505493164, 10.023985862731934, 10.513294219970703]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 5.0, 8.0, 11.0, 12.0, 9.0, 18.0, 16.0, 27.0, 23.0, 28.0, 29.0, 33.0, 41.0, 53.0, 39.0, 48.0, 37.0, 30.0, 51.0, 42.0, 47.0, 52.0, 36.0, 39.0, 31.0, 33.0, 29.0, 31.0, 24.0, 14.0, 20.0, 10.0, 10.0, 7.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.916905403137207, -7.673770427703857, -7.430635929107666, -7.187500953674316, -6.944366455078125, -6.701231479644775, -6.458096504211426, -6.214962005615234, -5.971827507019043, -5.728692531585693, -5.485558032989502, -5.242423057556152, -4.999288558959961, -4.756153583526611, -4.513018608093262, -4.26988410949707, -4.026749134063721, -3.78361439704895, -3.5404796600341797, -3.29734468460083, -3.0542101860046387, -2.811075210571289, -2.5679404735565186, -2.324805736541748, -2.0816709995269775, -1.838536262512207, -1.5954015254974365, -1.3522666692733765, -1.109131932258606, -0.8659971952438354, -0.6228623390197754, -0.3797276020050049, -0.13659238815307617, 0.10654237866401672, 0.3496771454811096, 0.5928119421005249, 0.8359466791152954, 1.079081416130066, 1.322216272354126, 1.5653510093688965, 1.808485746383667, 2.0516204833984375, 2.294755220413208, 2.5378899574279785, 2.781024932861328, 3.0241594314575195, 3.267294406890869, 3.5104291439056396, 3.75356388092041, 3.9966986179351807, 4.239833354949951, 4.482968330383301, 4.726102828979492, 4.969237804412842, 5.212372779846191, 5.455507278442383, 5.698641777038574, 5.941776752471924, 6.184911251068115, 6.428046226501465, 6.671180725097656, 6.914315700531006, 7.1574506759643555, 7.400585174560547, 7.6437201499938965]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 13.0, 4.0, 13.0, 16.0, 32.0, 40.0, 45.0, 78.0, 119.0, 166.0, 386.0, 752.0, 1893.0, 5270.0, 19503.0, 96576.0, 540556.0, 313269.0, 51857.0, 11839.0, 3495.0, 1276.0, 576.0, 280.0, 175.0, 95.0, 58.0, 45.0, 25.0, 29.0, 20.0, 12.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.185546875, -2.1146240234375, -2.043701171875, -1.9727783203125, -1.90185546875, -1.8309326171875, -1.760009765625, -1.6890869140625, -1.6181640625, -1.5472412109375, -1.476318359375, -1.4053955078125, -1.33447265625, -1.2635498046875, -1.192626953125, -1.1217041015625, -1.05078125, -0.9798583984375, -0.908935546875, -0.8380126953125, -0.76708984375, -0.6961669921875, -0.625244140625, -0.5543212890625, -0.4833984375, -0.4124755859375, -0.341552734375, -0.2706298828125, -0.19970703125, -0.1287841796875, -0.057861328125, 0.0130615234375, 0.083984375, 0.1549072265625, 0.225830078125, 0.2967529296875, 0.36767578125, 0.4385986328125, 0.509521484375, 0.5804443359375, 0.6513671875, 0.7222900390625, 0.793212890625, 0.8641357421875, 0.93505859375, 1.0059814453125, 1.076904296875, 1.1478271484375, 1.21875, 1.2896728515625, 1.360595703125, 1.4315185546875, 1.50244140625, 1.5733642578125, 1.644287109375, 1.7152099609375, 1.7861328125, 1.8570556640625, 1.927978515625, 1.9989013671875, 2.06982421875, 2.1407470703125, 2.211669921875, 2.2825927734375, 2.353515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 8.0, 6.0, 7.0, 18.0, 14.0, 23.0, 36.0, 45.0, 53.0, 47.0, 66.0, 61.0, 57.0, 55.0, 79.0, 83.0, 63.0, 57.0, 42.0, 36.0, 33.0, 33.0, 26.0, 18.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6790771484375, -1.634521484375, -1.5899658203125, -1.54541015625, -1.5008544921875, -1.456298828125, -1.4117431640625, -1.3671875, -1.3226318359375, -1.278076171875, -1.2335205078125, -1.18896484375, -1.1444091796875, -1.099853515625, -1.0552978515625, -1.0107421875, -0.9661865234375, -0.921630859375, -0.8770751953125, -0.83251953125, -0.7879638671875, -0.743408203125, -0.6988525390625, -0.654296875, -0.6097412109375, -0.565185546875, -0.5206298828125, -0.47607421875, -0.4315185546875, -0.386962890625, -0.3424072265625, -0.2978515625, -0.2532958984375, -0.208740234375, -0.1641845703125, -0.11962890625, -0.0750732421875, -0.030517578125, 0.0140380859375, 0.05859375, 0.1031494140625, 0.147705078125, 0.1922607421875, 0.23681640625, 0.2813720703125, 0.325927734375, 0.3704833984375, 0.4150390625, 0.4595947265625, 0.504150390625, 0.5487060546875, 0.59326171875, 0.6378173828125, 0.682373046875, 0.7269287109375, 0.771484375, 0.8160400390625, 0.860595703125, 0.9051513671875, 0.94970703125, 0.9942626953125, 1.038818359375, 1.0833740234375, 1.1279296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 8.0, 9.0, 17.0, 28.0, 40.0, 51.0, 109.0, 185.0, 382.0, 819.0, 2326.0, 10527.0, 173486.0, 828753.0, 25655.0, 3810.0, 1191.0, 522.0, 246.0, 121.0, 80.0, 55.0, 34.0, 21.0, 20.0, 5.0, 7.0, 9.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.30859375, -5.16961669921875, -5.0306396484375, -4.89166259765625, -4.752685546875, -4.61370849609375, -4.4747314453125, -4.33575439453125, -4.19677734375, -4.05780029296875, -3.9188232421875, -3.77984619140625, -3.640869140625, -3.50189208984375, -3.3629150390625, -3.22393798828125, -3.0849609375, -2.94598388671875, -2.8070068359375, -2.66802978515625, -2.529052734375, -2.39007568359375, -2.2510986328125, -2.11212158203125, -1.97314453125, -1.83416748046875, -1.6951904296875, -1.55621337890625, -1.417236328125, -1.27825927734375, -1.1392822265625, -1.00030517578125, -0.861328125, -0.72235107421875, -0.5833740234375, -0.44439697265625, -0.305419921875, -0.16644287109375, -0.0274658203125, 0.11151123046875, 0.25048828125, 0.38946533203125, 0.5284423828125, 0.66741943359375, 0.806396484375, 0.94537353515625, 1.0843505859375, 1.22332763671875, 1.3623046875, 1.50128173828125, 1.6402587890625, 1.77923583984375, 1.918212890625, 2.05718994140625, 2.1961669921875, 2.33514404296875, 2.47412109375, 2.61309814453125, 2.7520751953125, 2.89105224609375, 3.030029296875, 3.16900634765625, 3.3079833984375, 3.44696044921875, 3.5859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 13.0, 15.0, 16.0, 35.0, 44.0, 54.0, 73.0, 94.0, 97.0, 91.0, 86.0, 94.0, 77.0, 58.0, 48.0, 28.0, 25.0, 17.0, 10.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.3046875, -7.08013916015625, -6.8555908203125, -6.63104248046875, -6.406494140625, -6.18194580078125, -5.9573974609375, -5.73284912109375, -5.50830078125, -5.28375244140625, -5.0592041015625, -4.83465576171875, -4.610107421875, -4.38555908203125, -4.1610107421875, -3.93646240234375, -3.7119140625, -3.48736572265625, -3.2628173828125, -3.03826904296875, -2.813720703125, -2.58917236328125, -2.3646240234375, -2.14007568359375, -1.91552734375, -1.69097900390625, -1.4664306640625, -1.24188232421875, -1.017333984375, -0.79278564453125, -0.5682373046875, -0.34368896484375, -0.119140625, 0.10540771484375, 0.3299560546875, 0.55450439453125, 0.779052734375, 1.00360107421875, 1.2281494140625, 1.45269775390625, 1.67724609375, 1.90179443359375, 2.1263427734375, 2.35089111328125, 2.575439453125, 2.79998779296875, 3.0245361328125, 3.24908447265625, 3.4736328125, 3.69818115234375, 3.9227294921875, 4.14727783203125, 4.371826171875, 4.59637451171875, 4.8209228515625, 5.04547119140625, 5.27001953125, 5.49456787109375, 5.7191162109375, 5.94366455078125, 6.168212890625, 6.39276123046875, 6.6173095703125, 6.84185791015625, 7.06640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 16.0, 22.0, 16.0, 35.0, 52.0, 100.0, 244.0, 504.0, 1557.0, 7739.0, 136076.0, 879617.0, 18611.0, 2596.0, 768.0, 282.0, 127.0, 67.0, 46.0, 14.0, 15.0, 10.0, 8.0, 3.0, 8.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9169921875, -1.8592376708984375, -1.801483154296875, -1.7437286376953125, -1.68597412109375, -1.6282196044921875, -1.570465087890625, -1.5127105712890625, -1.4549560546875, -1.3972015380859375, -1.339447021484375, -1.2816925048828125, -1.22393798828125, -1.1661834716796875, -1.108428955078125, -1.0506744384765625, -0.992919921875, -0.9351654052734375, -0.877410888671875, -0.8196563720703125, -0.76190185546875, -0.7041473388671875, -0.646392822265625, -0.5886383056640625, -0.5308837890625, -0.4731292724609375, -0.415374755859375, -0.3576202392578125, -0.29986572265625, -0.2421112060546875, -0.184356689453125, -0.1266021728515625, -0.06884765625, -0.0110931396484375, 0.046661376953125, 0.1044158935546875, 0.16217041015625, 0.2199249267578125, 0.277679443359375, 0.3354339599609375, 0.3931884765625, 0.4509429931640625, 0.508697509765625, 0.5664520263671875, 0.62420654296875, 0.6819610595703125, 0.739715576171875, 0.7974700927734375, 0.855224609375, 0.9129791259765625, 0.970733642578125, 1.0284881591796875, 1.08624267578125, 1.1439971923828125, 1.201751708984375, 1.2595062255859375, 1.3172607421875, 1.3750152587890625, 1.432769775390625, 1.4905242919921875, 1.54827880859375, 1.6060333251953125, 1.663787841796875, 1.7215423583984375, 1.779296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 5.0, 6.0, 4.0, 8.0, 10.0, 7.0, 20.0, 22.0, 28.0, 56.0, 90.0, 149.0, 187.0, 138.0, 85.0, 62.0, 33.0, 29.0, 12.0, 4.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0002636909484863281, -0.0002553500235080719, -0.0002470090985298157, -0.00023866817355155945, -0.00023032724857330322, -0.000221986323595047, -0.00021364539861679077, -0.00020530447363853455, -0.00019696354866027832, -0.0001886226236820221, -0.00018028169870376587, -0.00017194077372550964, -0.00016359984874725342, -0.0001552589237689972, -0.00014691799879074097, -0.00013857707381248474, -0.00013023614883422852, -0.00012189522385597229, -0.00011355429887771606, -0.00010521337389945984, -9.687244892120361e-05, -8.853152394294739e-05, -8.019059896469116e-05, -7.184967398643494e-05, -6.350874900817871e-05, -5.5167824029922485e-05, -4.682689905166626e-05, -3.8485974073410034e-05, -3.014504909515381e-05, -2.1804124116897583e-05, -1.3463199138641357e-05, -5.122274160385132e-06, 3.2186508178710938e-06, 1.155957579612732e-05, 1.9900500774383545e-05, 2.824142575263977e-05, 3.6582350730895996e-05, 4.492327570915222e-05, 5.326420068740845e-05, 6.160512566566467e-05, 6.99460506439209e-05, 7.828697562217712e-05, 8.662790060043335e-05, 9.496882557868958e-05, 0.0001033097505569458, 0.00011165067553520203, 0.00011999160051345825, 0.00012833252549171448, 0.0001366734504699707, 0.00014501437544822693, 0.00015335530042648315, 0.00016169622540473938, 0.0001700371503829956, 0.00017837807536125183, 0.00018671900033950806, 0.00019505992531776428, 0.0002034008502960205, 0.00021174177527427673, 0.00022008270025253296, 0.00022842362523078918, 0.0002367645502090454, 0.00024510547518730164, 0.00025344640016555786, 0.0002617873251438141, 0.0002701282501220703]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 7.0, 22.0, 11.0, 21.0, 27.0, 48.0, 92.0, 153.0, 275.0, 685.0, 1633.0, 4815.0, 22233.0, 315398.0, 667981.0, 26276.0, 5549.0, 1858.0, 734.0, 336.0, 144.0, 89.0, 49.0, 31.0, 25.0, 9.0, 14.0, 7.0, 4.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4921875, -1.451904296875, -1.41162109375, -1.371337890625, -1.3310546875, -1.290771484375, -1.25048828125, -1.210205078125, -1.169921875, -1.129638671875, -1.08935546875, -1.049072265625, -1.0087890625, -0.968505859375, -0.92822265625, -0.887939453125, -0.84765625, -0.807373046875, -0.76708984375, -0.726806640625, -0.6865234375, -0.646240234375, -0.60595703125, -0.565673828125, -0.525390625, -0.485107421875, -0.44482421875, -0.404541015625, -0.3642578125, -0.323974609375, -0.28369140625, -0.243408203125, -0.203125, -0.162841796875, -0.12255859375, -0.082275390625, -0.0419921875, -0.001708984375, 0.03857421875, 0.078857421875, 0.119140625, 0.159423828125, 0.19970703125, 0.239990234375, 0.2802734375, 0.320556640625, 0.36083984375, 0.401123046875, 0.44140625, 0.481689453125, 0.52197265625, 0.562255859375, 0.6025390625, 0.642822265625, 0.68310546875, 0.723388671875, 0.763671875, 0.803955078125, 0.84423828125, 0.884521484375, 0.9248046875, 0.965087890625, 1.00537109375, 1.045654296875, 1.0859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 11.0, 15.0, 9.0, 34.0, 42.0, 50.0, 100.0, 154.0, 171.0, 148.0, 90.0, 61.0, 30.0, 17.0, 14.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5311431884765625, -1.489044189453125, -1.4469451904296875, -1.40484619140625, -1.3627471923828125, -1.320648193359375, -1.2785491943359375, -1.2364501953125, -1.1943511962890625, -1.152252197265625, -1.1101531982421875, -1.06805419921875, -1.0259552001953125, -0.983856201171875, -0.9417572021484375, -0.899658203125, -0.8575592041015625, -0.815460205078125, -0.7733612060546875, -0.73126220703125, -0.6891632080078125, -0.647064208984375, -0.6049652099609375, -0.5628662109375, -0.5207672119140625, -0.478668212890625, -0.4365692138671875, -0.39447021484375, -0.3523712158203125, -0.310272216796875, -0.2681732177734375, -0.22607421875, -0.1839752197265625, -0.141876220703125, -0.0997772216796875, -0.05767822265625, -0.0155792236328125, 0.026519775390625, 0.0686187744140625, 0.1107177734375, 0.1528167724609375, 0.194915771484375, 0.2370147705078125, 0.27911376953125, 0.3212127685546875, 0.363311767578125, 0.4054107666015625, 0.447509765625, 0.4896087646484375, 0.531707763671875, 0.5738067626953125, 0.61590576171875, 0.6580047607421875, 0.700103759765625, 0.7422027587890625, 0.7843017578125, 0.8264007568359375, 0.868499755859375, 0.9105987548828125, 0.95269775390625, 0.9947967529296875, 1.036895751953125, 1.0789947509765625, 1.12109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 7.0, 8.0, 14.0, 19.0, 76.0, 215.0, 435.0, 136.0, 45.0, 13.0, 15.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.24333190917969, -47.12641906738281, -46.00950241088867, -44.8925895690918, -43.775672912597656, -42.65876007080078, -41.54184341430664, -40.424930572509766, -39.308013916015625, -38.19110107421875, -37.07418441772461, -35.957271575927734, -34.840354919433594, -33.72344207763672, -32.60652542114258, -31.489612579345703, -30.372699737548828, -29.25578498840332, -28.138870239257812, -27.021955490112305, -25.905040740966797, -24.788127899169922, -23.671213150024414, -22.554298400878906, -21.4373836517334, -20.32046890258789, -19.203554153442383, -18.086639404296875, -16.9697265625, -15.852810859680176, -14.735897064208984, -13.618982315063477, -12.502071380615234, -11.385156631469727, -10.268241882324219, -9.151328086853027, -8.03441333770752, -6.917498588562012, -5.800584316253662, -4.6836700439453125, -3.5667552947998047, -2.449840784072876, -1.3329262733459473, -0.21601176261901855, 0.9009027481079102, 2.017817497253418, 3.1347317695617676, 4.251646041870117, 5.368560791015625, 6.485475540161133, 7.602389812469482, 8.719304084777832, 9.83621883392334, 10.953133583068848, 12.070047378540039, 13.186962127685547, 14.303876876831055, 15.420791625976562, 16.53770637512207, 17.654621124267578, 18.771533966064453, 19.888450622558594, 21.00536346435547, 22.122278213500977, 23.239192962646484]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 12.0, 7.0, 9.0, 14.0, 14.0, 11.0, 18.0, 29.0, 37.0, 35.0, 34.0, 50.0, 64.0, 134.0, 148.0, 83.0, 44.0, 40.0, 44.0, 30.0, 29.0, 18.0, 26.0, 15.0, 9.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.70281219482422, -18.060890197753906, -17.418970108032227, -16.777048110961914, -16.135128021240234, -15.493206024169922, -14.85128402709961, -14.209362983703613, -13.567441940307617, -12.925520896911621, -12.283599853515625, -11.641677856445312, -10.999756813049316, -10.35783576965332, -9.715913772583008, -9.073992729187012, -8.432071685791016, -7.7901506423950195, -7.148229122161865, -6.506307601928711, -5.864386558532715, -5.222465515136719, -4.5805439949035645, -3.93862247467041, -3.296701431274414, -2.654780149459839, -2.0128588676452637, -1.3709375858306885, -0.7290163040161133, -0.08709502220153809, 0.5548262596130371, 1.1967477798461914, 1.8386707305908203, 2.4805920124053955, 3.1225132942199707, 3.764434576034546, 4.406355857849121, 5.048276901245117, 5.6901984214782715, 6.332119941711426, 6.974040985107422, 7.615962028503418, 8.257883071899414, 8.899805068969727, 9.541726112365723, 10.183647155761719, 10.825569152832031, 11.467490196228027, 12.109411239624023, 12.75133228302002, 13.393253326416016, 14.035175323486328, 14.677096366882324, 15.31901741027832, 15.960939407348633, 16.602859497070312, 17.244781494140625, 17.886703491210938, 18.528623580932617, 19.17054557800293, 19.81246566772461, 20.454387664794922, 21.096309661865234, 21.738231658935547, 22.380151748657227]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 4.0, 5.0, 4.0, 17.0, 18.0, 17.0, 22.0, 42.0, 54.0, 106.0, 194.0, 452.0, 1390.0, 5784.0, 58263.0, 2904045.0, 1192840.0, 25150.0, 3893.0, 1114.0, 397.0, 193.0, 95.0, 51.0, 39.0, 22.0, 13.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.546875, -6.390472412109375, -6.23406982421875, -6.077667236328125, -5.9212646484375, -5.764862060546875, -5.60845947265625, -5.452056884765625, -5.295654296875, -5.139251708984375, -4.98284912109375, -4.826446533203125, -4.6700439453125, -4.513641357421875, -4.35723876953125, -4.200836181640625, -4.04443359375, -3.888031005859375, -3.73162841796875, -3.575225830078125, -3.4188232421875, -3.262420654296875, -3.10601806640625, -2.949615478515625, -2.793212890625, -2.636810302734375, -2.48040771484375, -2.324005126953125, -2.1676025390625, -2.011199951171875, -1.85479736328125, -1.698394775390625, -1.5419921875, -1.385589599609375, -1.22918701171875, -1.072784423828125, -0.9163818359375, -0.759979248046875, -0.60357666015625, -0.447174072265625, -0.290771484375, -0.134368896484375, 0.02203369140625, 0.178436279296875, 0.3348388671875, 0.491241455078125, 0.64764404296875, 0.804046630859375, 0.96044921875, 1.116851806640625, 1.27325439453125, 1.429656982421875, 1.5860595703125, 1.742462158203125, 1.89886474609375, 2.055267333984375, 2.211669921875, 2.368072509765625, 2.52447509765625, 2.680877685546875, 2.8372802734375, 2.993682861328125, 3.15008544921875, 3.306488037109375, 3.462890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 6.0, 9.0, 15.0, 17.0, 25.0, 39.0, 47.0, 56.0, 54.0, 63.0, 64.0, 66.0, 74.0, 75.0, 65.0, 68.0, 59.0, 51.0, 33.0, 35.0, 19.0, 15.0, 14.0, 5.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5263519287109375, -1.477508544921875, -1.4286651611328125, -1.37982177734375, -1.3309783935546875, -1.282135009765625, -1.2332916259765625, -1.1844482421875, -1.1356048583984375, -1.086761474609375, -1.0379180908203125, -0.98907470703125, -0.9402313232421875, -0.891387939453125, -0.8425445556640625, -0.793701171875, -0.7448577880859375, -0.696014404296875, -0.6471710205078125, -0.59832763671875, -0.5494842529296875, -0.500640869140625, -0.4517974853515625, -0.4029541015625, -0.3541107177734375, -0.305267333984375, -0.2564239501953125, -0.20758056640625, -0.1587371826171875, -0.109893798828125, -0.0610504150390625, -0.01220703125, 0.0366363525390625, 0.085479736328125, 0.1343231201171875, 0.18316650390625, 0.2320098876953125, 0.280853271484375, 0.3296966552734375, 0.3785400390625, 0.4273834228515625, 0.476226806640625, 0.5250701904296875, 0.57391357421875, 0.6227569580078125, 0.671600341796875, 0.7204437255859375, 0.769287109375, 0.8181304931640625, 0.866973876953125, 0.9158172607421875, 0.96466064453125, 1.0135040283203125, 1.062347412109375, 1.1111907958984375, 1.1600341796875, 1.2088775634765625, 1.257720947265625, 1.3065643310546875, 1.35540771484375, 1.4042510986328125, 1.453094482421875, 1.5019378662109375, 1.55078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 12.0, 24.0, 36.0, 77.0, 209.0, 617.0, 2262.0, 60822.0, 4121977.0, 6725.0, 1033.0, 281.0, 105.0, 51.0, 18.0, 12.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.8082275390625, -20.303955078125, -19.7996826171875, -19.29541015625, -18.7911376953125, -18.286865234375, -17.7825927734375, -17.2783203125, -16.7740478515625, -16.269775390625, -15.7655029296875, -15.26123046875, -14.7569580078125, -14.252685546875, -13.7484130859375, -13.244140625, -12.7398681640625, -12.235595703125, -11.7313232421875, -11.22705078125, -10.7227783203125, -10.218505859375, -9.7142333984375, -9.2099609375, -8.7056884765625, -8.201416015625, -7.6971435546875, -7.19287109375, -6.6885986328125, -6.184326171875, -5.6800537109375, -5.17578125, -4.6715087890625, -4.167236328125, -3.6629638671875, -3.15869140625, -2.6544189453125, -2.150146484375, -1.6458740234375, -1.1416015625, -0.6373291015625, -0.133056640625, 0.3712158203125, 0.87548828125, 1.3797607421875, 1.884033203125, 2.3883056640625, 2.892578125, 3.3968505859375, 3.901123046875, 4.4053955078125, 4.90966796875, 5.4139404296875, 5.918212890625, 6.4224853515625, 6.9267578125, 7.4310302734375, 7.935302734375, 8.4395751953125, 8.94384765625, 9.4481201171875, 9.952392578125, 10.4566650390625, 10.9609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 9.0, 10.0, 12.0, 21.0, 38.0, 74.0, 95.0, 182.0, 337.0, 628.0, 878.0, 766.0, 459.0, 231.0, 146.0, 74.0, 41.0, 27.0, 18.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.9609375, -7.782623291015625, -7.60430908203125, -7.425994873046875, -7.2476806640625, -7.069366455078125, -6.89105224609375, -6.712738037109375, -6.534423828125, -6.356109619140625, -6.17779541015625, -5.999481201171875, -5.8211669921875, -5.642852783203125, -5.46453857421875, -5.286224365234375, -5.10791015625, -4.929595947265625, -4.75128173828125, -4.572967529296875, -4.3946533203125, -4.216339111328125, -4.03802490234375, -3.859710693359375, -3.681396484375, -3.503082275390625, -3.32476806640625, -3.146453857421875, -2.9681396484375, -2.789825439453125, -2.61151123046875, -2.433197021484375, -2.2548828125, -2.076568603515625, -1.89825439453125, -1.719940185546875, -1.5416259765625, -1.363311767578125, -1.18499755859375, -1.006683349609375, -0.828369140625, -0.650054931640625, -0.47174072265625, -0.293426513671875, -0.1151123046875, 0.063201904296875, 0.24151611328125, 0.419830322265625, 0.59814453125, 0.776458740234375, 0.95477294921875, 1.133087158203125, 1.3114013671875, 1.489715576171875, 1.66802978515625, 1.846343994140625, 2.024658203125, 2.202972412109375, 2.38128662109375, 2.559600830078125, 2.7379150390625, 2.916229248046875, 3.09454345703125, 3.272857666015625, 3.451171875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 15.0, 14.0, 42.0, 71.0, 117.0, 169.0, 186.0, 155.0, 74.0, 65.0, 26.0, 13.0, 6.0, 8.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.243656158447266, -52.8559684753418, -51.46828079223633, -50.08059310913086, -48.69290542602539, -47.305213928222656, -45.91752624511719, -44.52983856201172, -43.14215087890625, -41.75446319580078, -40.36677551269531, -38.979087829589844, -37.591400146484375, -36.203712463378906, -34.81602478027344, -33.4283332824707, -32.0406494140625, -30.65296173095703, -29.265274047851562, -27.877586364746094, -26.489896774291992, -25.102209091186523, -23.714521408081055, -22.326831817626953, -20.939144134521484, -19.551456451416016, -18.163768768310547, -16.776081085205078, -15.388391494750977, -14.000703811645508, -12.613016128540039, -11.225327491760254, -9.837638854980469, -8.449951171875, -7.062262535095215, -5.674574851989746, -4.286886692047119, -2.899198532104492, -1.5115108489990234, -0.12382221221923828, 1.2638654708862305, 2.6515536308288574, 4.039241790771484, 5.426929473876953, 6.81461763381958, 8.202305793762207, 9.589993476867676, 10.977682113647461, 12.36536979675293, 13.753057479858398, 15.140746116638184, 16.52843475341797, 17.916122436523438, 19.303810119628906, 20.691497802734375, 22.079185485839844, 23.466873168945312, 24.85456085205078, 26.24224853515625, 27.62993621826172, 29.01762580871582, 30.40531349182129, 31.793001174926758, 33.18069076538086, 34.56837844848633]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 14.0, 32.0, 25.0, 42.0, 43.0, 48.0, 68.0, 79.0, 70.0, 68.0, 82.0, 62.0, 70.0, 48.0, 51.0, 44.0, 21.0, 32.0, 20.0, 8.0, 10.0, 8.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.871252059936523, -29.007728576660156, -28.144203186035156, -27.28067970275879, -26.417156219482422, -25.553630828857422, -24.690107345581055, -23.826583862304688, -22.963058471679688, -22.09953498840332, -21.23600959777832, -20.372486114501953, -19.508960723876953, -18.645437240600586, -17.78191375732422, -16.91838836669922, -16.05486488342285, -15.191340446472168, -14.327816009521484, -13.464292526245117, -12.600768089294434, -11.73724365234375, -10.873720169067383, -10.0101957321167, -9.146671295166016, -8.283146858215332, -7.419622898101807, -6.556098937988281, -5.692574501037598, -4.829050064086914, -3.9655261039733887, -3.1020021438598633, -2.2384796142578125, -1.374955415725708, -0.5114312171936035, 0.352092981338501, 1.2156171798706055, 2.079141616821289, 2.9426655769348145, 3.80618953704834, 4.669713973999023, 5.533238410949707, 6.396762371063232, 7.260286331176758, 8.123810768127441, 8.987335205078125, 9.850858688354492, 10.714383125305176, 11.57790756225586, 12.441431999206543, 13.304956436157227, 14.168479919433594, 15.032004356384277, 15.895528793334961, 16.759052276611328, 17.622577667236328, 18.486101150512695, 19.349624633789062, 20.213150024414062, 21.07667350769043, 21.940196990966797, 22.803722381591797, 23.667245864868164, 24.53076934814453, 25.39429473876953]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 12.0, 22.0, 23.0, 41.0, 78.0, 100.0, 167.0, 314.0, 652.0, 1540.0, 3905.0, 13753.0, 70212.0, 659237.0, 252258.0, 33581.0, 7874.0, 2547.0, 1059.0, 510.0, 234.0, 146.0, 88.0, 55.0, 40.0, 24.0, 15.0, 11.0, 8.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.219879150390625, -2.13702392578125, -2.054168701171875, -1.9713134765625, -1.888458251953125, -1.80560302734375, -1.722747802734375, -1.639892578125, -1.557037353515625, -1.47418212890625, -1.391326904296875, -1.3084716796875, -1.225616455078125, -1.14276123046875, -1.059906005859375, -0.97705078125, -0.894195556640625, -0.81134033203125, -0.728485107421875, -0.6456298828125, -0.562774658203125, -0.47991943359375, -0.397064208984375, -0.314208984375, -0.231353759765625, -0.14849853515625, -0.065643310546875, 0.0172119140625, 0.100067138671875, 0.18292236328125, 0.265777587890625, 0.3486328125, 0.431488037109375, 0.51434326171875, 0.597198486328125, 0.6800537109375, 0.762908935546875, 0.84576416015625, 0.928619384765625, 1.011474609375, 1.094329833984375, 1.17718505859375, 1.260040283203125, 1.3428955078125, 1.425750732421875, 1.50860595703125, 1.591461181640625, 1.67431640625, 1.757171630859375, 1.84002685546875, 1.922882080078125, 2.0057373046875, 2.088592529296875, 2.17144775390625, 2.254302978515625, 2.337158203125, 2.420013427734375, 2.50286865234375, 2.585723876953125, 2.6685791015625, 2.751434326171875, 2.83428955078125, 2.917144775390625, 3.0]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 13.0, 10.0, 26.0, 28.0, 46.0, 47.0, 68.0, 75.0, 85.0, 86.0, 88.0, 70.0, 77.0, 52.0, 52.0, 45.0, 32.0, 25.0, 16.0, 13.0, 5.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.512054443359375, -2.44012451171875, -2.368194580078125, -2.2962646484375, -2.224334716796875, -2.15240478515625, -2.080474853515625, -2.008544921875, -1.936614990234375, -1.86468505859375, -1.792755126953125, -1.7208251953125, -1.648895263671875, -1.57696533203125, -1.505035400390625, -1.43310546875, -1.361175537109375, -1.28924560546875, -1.217315673828125, -1.1453857421875, -1.073455810546875, -1.00152587890625, -0.929595947265625, -0.857666015625, -0.785736083984375, -0.71380615234375, -0.641876220703125, -0.5699462890625, -0.498016357421875, -0.42608642578125, -0.354156494140625, -0.2822265625, -0.210296630859375, -0.13836669921875, -0.066436767578125, 0.0054931640625, 0.077423095703125, 0.14935302734375, 0.221282958984375, 0.293212890625, 0.365142822265625, 0.43707275390625, 0.509002685546875, 0.5809326171875, 0.652862548828125, 0.72479248046875, 0.796722412109375, 0.86865234375, 0.940582275390625, 1.01251220703125, 1.084442138671875, 1.1563720703125, 1.228302001953125, 1.30023193359375, 1.372161865234375, 1.444091796875, 1.516021728515625, 1.58795166015625, 1.659881591796875, 1.7318115234375, 1.803741455078125, 1.87567138671875, 1.947601318359375, 2.01953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 13.0, 10.0, 18.0, 24.0, 44.0, 48.0, 98.0, 163.0, 260.0, 520.0, 1543.0, 9030.0, 647450.0, 378031.0, 8684.0, 1523.0, 481.0, 255.0, 145.0, 76.0, 50.0, 37.0, 20.0, 15.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.697662353515625, -2.56915283203125, -2.440643310546875, -2.3121337890625, -2.183624267578125, -2.05511474609375, -1.926605224609375, -1.798095703125, -1.669586181640625, -1.54107666015625, -1.412567138671875, -1.2840576171875, -1.155548095703125, -1.02703857421875, -0.898529052734375, -0.77001953125, -0.641510009765625, -0.51300048828125, -0.384490966796875, -0.2559814453125, -0.127471923828125, 0.00103759765625, 0.129547119140625, 0.258056640625, 0.386566162109375, 0.51507568359375, 0.643585205078125, 0.7720947265625, 0.900604248046875, 1.02911376953125, 1.157623291015625, 1.2861328125, 1.414642333984375, 1.54315185546875, 1.671661376953125, 1.8001708984375, 1.928680419921875, 2.05718994140625, 2.185699462890625, 2.314208984375, 2.442718505859375, 2.57122802734375, 2.699737548828125, 2.8282470703125, 2.956756591796875, 3.08526611328125, 3.213775634765625, 3.34228515625, 3.470794677734375, 3.59930419921875, 3.727813720703125, 3.8563232421875, 3.984832763671875, 4.11334228515625, 4.241851806640625, 4.370361328125, 4.498870849609375, 4.62738037109375, 4.755889892578125, 4.8843994140625, 5.012908935546875, 5.14141845703125, 5.269927978515625, 5.3984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 11.0, 11.0, 9.0, 10.0, 11.0, 10.0, 16.0, 28.0, 28.0, 27.0, 27.0, 32.0, 57.0, 61.0, 69.0, 75.0, 80.0, 79.0, 55.0, 54.0, 47.0, 36.0, 27.0, 23.0, 25.0, 16.0, 9.0, 16.0, 12.0, 14.0, 2.0, 8.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.09375, -4.91943359375, -4.7451171875, -4.57080078125, -4.396484375, -4.22216796875, -4.0478515625, -3.87353515625, -3.69921875, -3.52490234375, -3.3505859375, -3.17626953125, -3.001953125, -2.82763671875, -2.6533203125, -2.47900390625, -2.3046875, -2.13037109375, -1.9560546875, -1.78173828125, -1.607421875, -1.43310546875, -1.2587890625, -1.08447265625, -0.91015625, -0.73583984375, -0.5615234375, -0.38720703125, -0.212890625, -0.03857421875, 0.1357421875, 0.31005859375, 0.484375, 0.65869140625, 0.8330078125, 1.00732421875, 1.181640625, 1.35595703125, 1.5302734375, 1.70458984375, 1.87890625, 2.05322265625, 2.2275390625, 2.40185546875, 2.576171875, 2.75048828125, 2.9248046875, 3.09912109375, 3.2734375, 3.44775390625, 3.6220703125, 3.79638671875, 3.970703125, 4.14501953125, 4.3193359375, 4.49365234375, 4.66796875, 4.84228515625, 5.0166015625, 5.19091796875, 5.365234375, 5.53955078125, 5.7138671875, 5.88818359375, 6.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 13.0, 19.0, 36.0, 58.0, 94.0, 153.0, 359.0, 992.0, 3289.0, 17314.0, 640506.0, 363682.0, 17113.0, 3242.0, 978.0, 306.0, 156.0, 98.0, 49.0, 27.0, 22.0, 11.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53955078125, -0.5202789306640625, -0.501007080078125, -0.4817352294921875, -0.46246337890625, -0.4431915283203125, -0.423919677734375, -0.4046478271484375, -0.3853759765625, -0.3661041259765625, -0.346832275390625, -0.3275604248046875, -0.30828857421875, -0.2890167236328125, -0.269744873046875, -0.2504730224609375, -0.231201171875, -0.2119293212890625, -0.192657470703125, -0.1733856201171875, -0.15411376953125, -0.1348419189453125, -0.115570068359375, -0.0962982177734375, -0.0770263671875, -0.0577545166015625, -0.038482666015625, -0.0192108154296875, 6.103515625e-05, 0.0193328857421875, 0.038604736328125, 0.0578765869140625, 0.0771484375, 0.0964202880859375, 0.115692138671875, 0.1349639892578125, 0.15423583984375, 0.1735076904296875, 0.192779541015625, 0.2120513916015625, 0.2313232421875, 0.2505950927734375, 0.269866943359375, 0.2891387939453125, 0.30841064453125, 0.3276824951171875, 0.346954345703125, 0.3662261962890625, 0.385498046875, 0.4047698974609375, 0.424041748046875, 0.4433135986328125, 0.46258544921875, 0.4818572998046875, 0.501129150390625, 0.5204010009765625, 0.5396728515625, 0.5589447021484375, 0.578216552734375, 0.5974884033203125, 0.61676025390625, 0.6360321044921875, 0.655303955078125, 0.6745758056640625, 0.69384765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 6.0, 14.0, 16.0, 18.0, 30.0, 55.0, 65.0, 104.0, 116.0, 107.0, 108.0, 80.0, 58.0, 35.0, 24.0, 25.0, 13.0, 17.0, 16.0, 6.0, 5.0, 11.0, 6.0, 7.0, 5.0, 2.0, 1.0, 6.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011563301086425781, -0.00011194590479135513, -0.00010825879871845245, -0.00010457169264554977, -0.0001008845865726471, -9.719748049974442e-05, -9.351037442684174e-05, -8.982326835393906e-05, -8.613616228103638e-05, -8.24490562081337e-05, -7.876195013523102e-05, -7.507484406232834e-05, -7.138773798942566e-05, -6.770063191652298e-05, -6.40135258436203e-05, -6.032641977071762e-05, -5.663931369781494e-05, -5.295220762491226e-05, -4.926510155200958e-05, -4.55779954791069e-05, -4.1890889406204224e-05, -3.8203783333301544e-05, -3.4516677260398865e-05, -3.0829571187496185e-05, -2.7142465114593506e-05, -2.3455359041690826e-05, -1.9768252968788147e-05, -1.6081146895885468e-05, -1.2394040822982788e-05, -8.706934750080109e-06, -5.019828677177429e-06, -1.3327226042747498e-06, 2.3543834686279297e-06, 6.041489541530609e-06, 9.728595614433289e-06, 1.3415701687335968e-05, 1.7102807760238647e-05, 2.0789913833141327e-05, 2.4477019906044006e-05, 2.8164125978946686e-05, 3.1851232051849365e-05, 3.5538338124752045e-05, 3.9225444197654724e-05, 4.2912550270557404e-05, 4.659965634346008e-05, 5.028676241636276e-05, 5.397386848926544e-05, 5.766097456216812e-05, 6.13480806350708e-05, 6.503518670797348e-05, 6.872229278087616e-05, 7.240939885377884e-05, 7.609650492668152e-05, 7.97836109995842e-05, 8.347071707248688e-05, 8.715782314538956e-05, 9.084492921829224e-05, 9.453203529119492e-05, 9.82191413640976e-05, 0.00010190624743700027, 0.00010559335350990295, 0.00010928045958280563, 0.00011296756565570831, 0.00011665467172861099, 0.00012034177780151367]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 8.0, 8.0, 14.0, 18.0, 34.0, 42.0, 81.0, 132.0, 253.0, 455.0, 1113.0, 2938.0, 9130.0, 41843.0, 836211.0, 129662.0, 18429.0, 4998.0, 1707.0, 704.0, 344.0, 161.0, 96.0, 62.0, 38.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.6044921875, -0.5884819030761719, -0.5724716186523438, -0.5564613342285156, -0.5404510498046875, -0.5244407653808594, -0.5084304809570312, -0.4924201965332031, -0.476409912109375, -0.4603996276855469, -0.44438934326171875, -0.4283790588378906, -0.4123687744140625, -0.3963584899902344, -0.38034820556640625, -0.3643379211425781, -0.34832763671875, -0.3323173522949219, -0.31630706787109375, -0.3002967834472656, -0.2842864990234375, -0.2682762145996094, -0.25226593017578125, -0.23625564575195312, -0.220245361328125, -0.20423507690429688, -0.18822479248046875, -0.17221450805664062, -0.1562042236328125, -0.14019393920898438, -0.12418365478515625, -0.10817337036132812, -0.0921630859375, -0.07615280151367188, -0.06014251708984375, -0.044132232666015625, -0.0281219482421875, -0.012111663818359375, 0.00389862060546875, 0.019908905029296875, 0.035919189453125, 0.051929473876953125, 0.06793975830078125, 0.08395004272460938, 0.0999603271484375, 0.11597061157226562, 0.13198089599609375, 0.14799118041992188, 0.16400146484375, 0.18001174926757812, 0.19602203369140625, 0.21203231811523438, 0.2280426025390625, 0.24405288696289062, 0.26006317138671875, 0.2760734558105469, 0.292083740234375, 0.3080940246582031, 0.32410430908203125, 0.3401145935058594, 0.3561248779296875, 0.3721351623535156, 0.38814544677734375, 0.4041557312011719, 0.420166015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 5.0, 9.0, 6.0, 9.0, 14.0, 18.0, 10.0, 20.0, 22.0, 38.0, 58.0, 81.0, 153.0, 138.0, 132.0, 76.0, 55.0, 38.0, 29.0, 14.0, 15.0, 14.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5802230834960938, -0.5618133544921875, -0.5434036254882812, -0.524993896484375, -0.5065841674804688, -0.4881744384765625, -0.46976470947265625, -0.45135498046875, -0.43294525146484375, -0.4145355224609375, -0.39612579345703125, -0.377716064453125, -0.35930633544921875, -0.3408966064453125, -0.32248687744140625, -0.3040771484375, -0.28566741943359375, -0.2672576904296875, -0.24884796142578125, -0.230438232421875, -0.21202850341796875, -0.1936187744140625, -0.17520904541015625, -0.15679931640625, -0.13838958740234375, -0.1199798583984375, -0.10157012939453125, -0.083160400390625, -0.06475067138671875, -0.0463409423828125, -0.02793121337890625, -0.009521484375, 0.00888824462890625, 0.0272979736328125, 0.04570770263671875, 0.064117431640625, 0.08252716064453125, 0.1009368896484375, 0.11934661865234375, 0.13775634765625, 0.15616607666015625, 0.1745758056640625, 0.19298553466796875, 0.211395263671875, 0.22980499267578125, 0.2482147216796875, 0.26662445068359375, 0.2850341796875, 0.30344390869140625, 0.3218536376953125, 0.34026336669921875, 0.358673095703125, 0.37708282470703125, 0.3954925537109375, 0.41390228271484375, 0.43231201171875, 0.45072174072265625, 0.4691314697265625, 0.48754119873046875, 0.505950927734375, 0.5243606567382812, 0.5427703857421875, 0.5611801147460938, 0.57958984375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 21.0, 26.0, 75.0, 176.0, 469.0, 106.0, 47.0, 27.0, 14.0, 9.0, 7.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.616363525390625, -20.924623489379883, -20.23288345336914, -19.541141510009766, -18.849401473999023, -18.15766143798828, -17.46592140197754, -16.774181365966797, -16.082439422607422, -15.39069938659668, -14.698958396911621, -14.007218360900879, -13.31547737121582, -12.623737335205078, -11.931997299194336, -11.240256309509277, -10.548516273498535, -9.856776237487793, -9.165035247802734, -8.473295211791992, -7.781554222106934, -7.089814186096191, -6.398073673248291, -5.706333160400391, -5.01459264755249, -4.32285213470459, -3.6311116218566895, -2.939371347427368, -2.2476308345794678, -1.5558903217315674, -0.8641500473022461, -0.1724095344543457, 0.5193309783935547, 1.211071491241455, 1.902811884880066, 2.5945522785186768, 3.286292791366577, 3.9780333042144775, 4.669773578643799, 5.361514091491699, 6.0532546043396, 6.7449951171875, 7.4367356300354, 8.1284761428833, 8.820216178894043, 9.511957168579102, 10.203697204589844, 10.895437240600586, 11.587178230285645, 12.278918266296387, 12.970659255981445, 13.662399291992188, 14.354140281677246, 15.045880317687988, 15.737621307373047, 16.42936134338379, 17.12110137939453, 17.812841415405273, 18.504581451416016, 19.19632339477539, 19.888063430786133, 20.579803466796875, 21.271543502807617, 21.96328353881836, 22.655025482177734]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 16.0, 6.0, 21.0, 14.0, 16.0, 12.0, 26.0, 26.0, 30.0, 44.0, 47.0, 169.0, 240.0, 107.0, 41.0, 34.0, 30.0, 24.0, 23.0, 14.0, 10.0, 11.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.212543487548828, -19.622610092163086, -19.032678604125977, -18.442745208740234, -17.852813720703125, -17.262880325317383, -16.672948837280273, -16.08301544189453, -15.493083000183105, -14.90315055847168, -14.313218116760254, -13.723285675048828, -13.133352279663086, -12.543420791625977, -11.953487396240234, -11.363554954528809, -10.773622512817383, -10.183690071105957, -9.593757629394531, -9.003825187683105, -8.41389274597168, -7.823959827423096, -7.234026908874512, -6.644094467163086, -6.05416202545166, -5.464229583740234, -4.874297142028809, -4.284364223480225, -3.694431781768799, -3.104499340057373, -2.514566659927368, -1.9246339797973633, -1.3346996307373047, -0.7447670698165894, -0.15483450889587402, 0.4350980520248413, 1.0250306129455566, 1.6149630546569824, 2.2048957347869873, 2.794828414916992, 3.384760856628418, 3.9746932983398438, 4.5646257400512695, 5.1545586585998535, 5.744491100311279, 6.334423542022705, 6.924356460571289, 7.514288902282715, 8.10422134399414, 8.694153785705566, 9.284086227416992, 9.874018669128418, 10.463951110839844, 11.053884506225586, 11.643816947937012, 12.233749389648438, 12.823681831359863, 13.413614273071289, 14.003546714782715, 14.59347915649414, 15.183412551879883, 15.773344039916992, 16.363277435302734, 16.953208923339844, 17.543142318725586]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 9.0, 12.0, 11.0, 13.0, 20.0, 33.0, 40.0, 33.0, 45.0, 57.0, 173.0, 222.0, 73.0, 47.0, 47.0, 39.0, 28.0, 19.0, 22.0, 16.0, 9.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25, -2.182098388671875, -2.11419677734375, -2.046295166015625, -1.9783935546875, -1.910491943359375, -1.84259033203125, -1.774688720703125, -1.706787109375, -1.638885498046875, -1.57098388671875, -1.503082275390625, -1.4351806640625, -1.367279052734375, -1.29937744140625, -1.231475830078125, -1.16357421875, -1.095672607421875, -1.02777099609375, -0.959869384765625, -0.8919677734375, -0.824066162109375, -0.75616455078125, -0.688262939453125, -0.620361328125, -0.552459716796875, -0.48455810546875, -0.416656494140625, -0.3487548828125, -0.280853271484375, -0.21295166015625, -0.145050048828125, -0.0771484375, -0.009246826171875, 0.05865478515625, 0.126556396484375, 0.1944580078125, 0.262359619140625, 0.33026123046875, 0.398162841796875, 0.466064453125, 0.533966064453125, 0.60186767578125, 0.669769287109375, 0.7376708984375, 0.805572509765625, 0.87347412109375, 0.941375732421875, 1.00927734375, 1.077178955078125, 1.14508056640625, 1.212982177734375, 1.2808837890625, 1.348785400390625, 1.41668701171875, 1.484588623046875, 1.552490234375, 1.620391845703125, 1.68829345703125, 1.756195068359375, 1.8240966796875, 1.891998291015625, 1.95989990234375, 2.027801513671875, 2.095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 14.0, 13.0, 22.0, 30.0, 56.0, 104.0, 215.0, 553.0, 3300.0, 8071451.0, 308893.0, 2881.0, 573.0, 184.0, 99.0, 44.0, 24.0, 30.0, 10.0, 13.0, 8.0, 7.0, 5.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-19.148574829101562, -18.56783103942871, -17.98708724975586, -17.406341552734375, -16.825597763061523, -16.244853973388672, -15.664109230041504, -15.083364486694336, -14.502620697021484, -13.921876907348633, -13.341132164001465, -12.760387420654297, -12.179643630981445, -11.598899841308594, -11.018155097961426, -10.437410354614258, -9.856666564941406, -9.275922775268555, -8.695178031921387, -8.114433288574219, -7.533689498901367, -6.952945232391357, -6.372200965881348, -5.791456699371338, -5.210712432861328, -4.629968166351318, -4.049223899841309, -3.468479633331299, -2.887735366821289, -2.3069911003112793, -1.7262468338012695, -1.1455025672912598, -0.5647602081298828, 0.015984058380126953, 0.5967283248901367, 1.1774725914001465, 1.7582168579101562, 2.338961124420166, 2.919705390930176, 3.5004496574401855, 4.081193923950195, 4.661938190460205, 5.242682456970215, 5.823426723480225, 6.404170989990234, 6.984915256500244, 7.565659523010254, 8.146404266357422, 8.727148056030273, 9.307891845703125, 9.888636589050293, 10.469381332397461, 11.050125122070312, 11.630868911743164, 12.211613655090332, 12.7923583984375, 13.373102188110352, 13.953845977783203, 14.534590721130371, 15.115335464477539, 15.69607925415039, 16.276823043823242, 16.857566833496094, 17.438312530517578, 18.01905632019043]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.392813682556152, -11.846787452697754, -11.300761222839355, -10.754734992980957, -10.208708763122559, -9.66268253326416, -9.116656303405762, -8.570630073547363, -8.024603843688965, -7.478577613830566, -6.932551383972168, -6.3865251541137695, -5.840498924255371, -5.294472694396973, -4.748446464538574, -4.202420234680176, -3.6563940048217773, -3.110367774963379, -2.5643415451049805, -2.018315315246582, -1.4722890853881836, -0.9262628555297852, -0.3802366256713867, 0.16578960418701172, 0.7118158340454102, 1.2578420639038086, 1.803868293762207, 2.3498945236206055, 2.895920753479004, 3.4419469833374023, 3.987973213195801, 4.533999443054199, 5.080024719238281, 5.62605094909668, 6.172077178955078, 6.718103408813477, 7.264129638671875, 7.810155868530273, 8.356182098388672, 8.90220832824707, 9.448234558105469, 9.994260787963867, 10.540287017822266, 11.086313247680664, 11.632339477539062, 12.178365707397461, 12.72439193725586, 13.270418167114258, 13.816444396972656, 14.362470626831055, 14.908496856689453, 15.454523086547852, 16.00054931640625, 16.54657554626465, 17.092601776123047, 17.638628005981445, 18.184654235839844, 18.730680465698242, 19.27670669555664, 19.82273292541504, 20.368759155273438, 20.914785385131836, 21.460811614990234, 22.006837844848633, 22.55286407470703]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 9.0, 15.0, 15.0, 23.0, 22.0, 34.0, 41.0, 71.0, 82.0, 103.0, 86.0, 92.0, 93.0, 75.0, 64.0, 48.0, 35.0, 26.0, 21.0, 18.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44891357421875, -1.4075927734375, -1.36627197265625, -1.324951171875, -1.28363037109375, -1.2423095703125, -1.20098876953125, -1.15966796875, -1.11834716796875, -1.0770263671875, -1.03570556640625, -0.994384765625, -0.95306396484375, -0.9117431640625, -0.87042236328125, -0.8291015625, -0.78778076171875, -0.7464599609375, -0.70513916015625, -0.663818359375, -0.62249755859375, -0.5811767578125, -0.53985595703125, -0.49853515625, -0.45721435546875, -0.4158935546875, -0.37457275390625, -0.333251953125, -0.29193115234375, -0.2506103515625, -0.20928955078125, -0.16796875, -0.12664794921875, -0.0853271484375, -0.04400634765625, -0.002685546875, 0.03863525390625, 0.0799560546875, 0.12127685546875, 0.16259765625, 0.20391845703125, 0.2452392578125, 0.28656005859375, 0.327880859375, 0.36920166015625, 0.4105224609375, 0.45184326171875, 0.4931640625, 0.53448486328125, 0.5758056640625, 0.61712646484375, 0.658447265625, 0.69976806640625, 0.7410888671875, 0.78240966796875, 0.82373046875, 0.86505126953125, 0.9063720703125, 0.94769287109375, 0.989013671875, 1.03033447265625, 1.0716552734375, 1.11297607421875, 1.154296875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 11.0, 12.0, 31.0, 40.0, 58.0, 112.0, 224.0, 538.0, 1763.0, 7536.0, 42884.0, 256526.0, 181016.0, 26725.0, 4648.0, 1203.0, 423.0, 205.0, 110.0, 68.0, 31.0, 29.0, 8.0, 14.0, 9.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-20.8125, -20.3487548828125, -19.885009765625, -19.4212646484375, -18.95751953125, -18.4937744140625, -18.030029296875, -17.5662841796875, -17.1025390625, -16.6387939453125, -16.175048828125, -15.7113037109375, -15.24755859375, -14.7838134765625, -14.320068359375, -13.8563232421875, -13.392578125, -12.9288330078125, -12.465087890625, -12.0013427734375, -11.53759765625, -11.0738525390625, -10.610107421875, -10.1463623046875, -9.6826171875, -9.2188720703125, -8.755126953125, -8.2913818359375, -7.82763671875, -7.3638916015625, -6.900146484375, -6.4364013671875, -5.97265625, -5.5089111328125, -5.045166015625, -4.5814208984375, -4.11767578125, -3.6539306640625, -3.190185546875, -2.7264404296875, -2.2626953125, -1.7989501953125, -1.335205078125, -0.8714599609375, -0.40771484375, 0.0560302734375, 0.519775390625, 0.9835205078125, 1.447265625, 1.9110107421875, 2.374755859375, 2.8385009765625, 3.30224609375, 3.7659912109375, 4.229736328125, 4.6934814453125, 5.1572265625, 5.6209716796875, 6.084716796875, 6.5484619140625, 7.01220703125, 7.4759521484375, 7.939697265625, 8.4034423828125, 8.8671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 13.0, 11.0, 12.0, 26.0, 17.0, 33.0, 45.0, 63.0, 69.0, 56.0, 77.0, 99.0, 91.0, 82.0, 82.0, 48.0, 40.0, 37.0, 20.0, 24.0, 17.0, 8.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9189453125, -1.8602142333984375, -1.801483154296875, -1.7427520751953125, -1.68402099609375, -1.6252899169921875, -1.566558837890625, -1.5078277587890625, -1.4490966796875, -1.3903656005859375, -1.331634521484375, -1.2729034423828125, -1.21417236328125, -1.1554412841796875, -1.096710205078125, -1.0379791259765625, -0.979248046875, -0.9205169677734375, -0.861785888671875, -0.8030548095703125, -0.74432373046875, -0.6855926513671875, -0.626861572265625, -0.5681304931640625, -0.5093994140625, -0.4506683349609375, -0.391937255859375, -0.3332061767578125, -0.27447509765625, -0.2157440185546875, -0.157012939453125, -0.0982818603515625, -0.03955078125, 0.0191802978515625, 0.077911376953125, 0.1366424560546875, 0.19537353515625, 0.2541046142578125, 0.312835693359375, 0.3715667724609375, 0.4302978515625, 0.4890289306640625, 0.547760009765625, 0.6064910888671875, 0.66522216796875, 0.7239532470703125, 0.782684326171875, 0.8414154052734375, 0.900146484375, 0.9588775634765625, 1.017608642578125, 1.0763397216796875, 1.13507080078125, 1.1938018798828125, 1.252532958984375, 1.3112640380859375, 1.3699951171875, 1.4287261962890625, 1.487457275390625, 1.5461883544921875, 1.60491943359375, 1.6636505126953125, 1.722381591796875, 1.7811126708984375, 1.83984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 7.0, 1.0, 12.0, 10.0, 22.0, 29.0, 75.0, 84.0, 73.0, 61.0, 33.0, 20.0, 11.0, 9.0, 7.0, 5.0, 2.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.542501926422119, -7.254260540008545, -6.966019630432129, -6.677778244018555, -6.3895368576049805, -6.101295471191406, -5.813054084777832, -5.524813175201416, -5.236571788787842, -4.948330402374268, -4.660089492797852, -4.371848106384277, -4.083606719970703, -3.795365333557129, -3.507124185562134, -3.2188830375671387, -2.9306416511535645, -2.6424002647399902, -2.354159116744995, -2.06591796875, -1.7776765823364258, -1.4894353151321411, -1.2011940479278564, -0.9129528999328613, -0.6247115135192871, -0.33647024631500244, -0.04822897911071777, 0.2400122880935669, 0.5282535552978516, 0.8164948225021362, 1.104736089706421, 1.392977237701416, 1.6812191009521484, 1.969460368156433, 2.2577016353607178, 2.545942783355713, 2.834184169769287, 3.1224255561828613, 3.4106667041778564, 3.6989078521728516, 3.987149238586426, 4.275390625, 4.563632011413574, 4.85187292098999, 5.1401143074035645, 5.428355693817139, 5.716596603393555, 6.004837989807129, 6.293079376220703, 6.581320762634277, 6.869562149047852, 7.157803058624268, 7.446044445037842, 7.734285831451416, 8.022526741027832, 8.310768127441406, 8.59900951385498, 8.887250900268555, 9.175492286682129, 9.463733673095703, 9.751974105834961, 10.040215492248535, 10.32845687866211, 10.616698265075684, 10.904939651489258]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 6.0, 2.0, 4.0, 3.0, 6.0, 10.0, 12.0, 27.0, 36.0, 60.0, 78.0, 77.0, 47.0, 42.0, 19.0, 10.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.591365814208984, -8.322317123413086, -8.053268432617188, -7.784219741821289, -7.515171051025391, -7.246122360229492, -6.977073669433594, -6.708024978637695, -6.438976287841797, -6.169927597045898, -5.90087890625, -5.631830215454102, -5.362781524658203, -5.093732833862305, -4.824684143066406, -4.555635452270508, -4.286587238311768, -4.017538547515869, -3.7484898567199707, -3.4794411659240723, -3.210392475128174, -2.9413437843322754, -2.672295331954956, -2.4032466411590576, -2.134197950363159, -1.8651492595672607, -1.5961005687713623, -1.3270519971847534, -1.058003306388855, -0.7889546155929565, -0.5199060440063477, -0.2508573532104492, 0.01819133758544922, 0.28723999857902527, 0.5562886595726013, 0.825337290763855, 1.0943859815597534, 1.3634346723556519, 1.6324832439422607, 1.9015319347381592, 2.1705806255340576, 2.439629316329956, 2.7086780071258545, 2.977726459503174, 3.2467751502990723, 3.5158238410949707, 3.784872531890869, 4.053921222686768, 4.322969913482666, 4.5920186042785645, 4.861067295074463, 5.130115985870361, 5.39916467666626, 5.668213367462158, 5.937261581420898, 6.206310272216797, 6.475358963012695, 6.744407653808594, 7.013456344604492, 7.282505035400391, 7.551553726196289, 7.8206024169921875, 8.089651107788086, 8.358699798583984, 8.627748489379883]}, "eval/loss": 4.328446388244629, "eval/wer": 1.8473819912733043, "eval/runtime": 935.4027, "eval/samples_per_second": 2.824, "eval/steps_per_second": 0.354} \ No newline at end of file