diff --git "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" --- "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" +++ "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0608, "train/learning_rate": 4.156769596199525e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 114529, "_timestamp": 1647708406, "_step": 17847, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 6.0, 15.0, 19.0, 22.0, 48.0, 65.0, 61.0, 84.0, 114.0, 110.0, 103.0, 76.0, 77.0, 49.0, 35.0, 19.0, 15.0, 16.0, 9.0, 7.0, 10.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.100801467895508, -26.244380950927734, -25.38796043395996, -24.531539916992188, -23.675119400024414, -22.81869888305664, -21.9622802734375, -21.105859756469727, -20.249439239501953, -19.39301872253418, -18.536598205566406, -17.680177688598633, -16.82375717163086, -15.967337608337402, -15.110917091369629, -14.254497528076172, -13.398076057434082, -12.541655540466309, -11.685235023498535, -10.828815460205078, -9.972394943237305, -9.115974426269531, -8.259553909301758, -7.403133869171143, -6.546713352203369, -5.690292835235596, -4.8338727951049805, -3.977452278137207, -3.1210319995880127, -2.2646117210388184, -1.408191204071045, -0.5517711639404297, 0.30464935302734375, 1.161069631576538, 2.0174899101257324, 2.873910427093506, 3.7303307056427, 4.5867509841918945, 5.443171501159668, 6.299591541290283, 7.156012058258057, 8.012432098388672, 8.868852615356445, 9.725273132324219, 10.581693649291992, 11.438114166259766, 12.294534683227539, 13.150954246520996, 14.00737476348877, 14.863795280456543, 15.720215797424316, 16.576635360717773, 17.433055877685547, 18.28947639465332, 19.145896911621094, 20.002317428588867, 20.85873794555664, 21.715158462524414, 22.571578979492188, 23.42799949645996, 24.284420013427734, 25.140838623046875, 25.99726104736328, 26.853679656982422, 27.710100173950195]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 13.0, 14.0, 18.0, 24.0, 29.0, 38.0, 54.0, 58.0, 64.0, 54.0, 61.0, 62.0, 63.0, 63.0, 54.0, 68.0, 43.0, 42.0, 37.0, 36.0, 24.0, 15.0, 15.0, 10.0, 5.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.098886489868164, -20.288461685180664, -19.478036880493164, -18.66761016845703, -17.85718536376953, -17.04676055908203, -16.23633575439453, -15.425910949707031, -14.615485191345215, -13.805060386657715, -12.994634628295898, -12.184209823608398, -11.373785018920898, -10.563359260559082, -9.752934455871582, -8.942508697509766, -8.132083892822266, -7.321658611297607, -6.511233329772949, -5.700808525085449, -4.890383243560791, -4.079957962036133, -3.269533157348633, -2.4591078758239746, -1.6486825942993164, -0.8382574319839478, -0.0278322696685791, 0.7825927734375, 1.5930180549621582, 2.4034433364868164, 3.2138681411743164, 4.024293422698975, 4.834716796875, 5.645142078399658, 6.455567359924316, 7.265992164611816, 8.076417922973633, 8.886842727661133, 9.697267532348633, 10.507692337036133, 11.31811809539795, 12.12854290008545, 12.938968658447266, 13.749393463134766, 14.559818267822266, 15.370244026184082, 16.180667877197266, 16.9910945892334, 17.8015193939209, 18.6119441986084, 19.4223690032959, 20.23279571533203, 21.04322052001953, 21.85364532470703, 22.66407012939453, 23.47449493408203, 24.28491973876953, 25.09534454345703, 25.90576934814453, 26.71619415283203, 27.526620864868164, 28.337045669555664, 29.147470474243164, 29.957895278930664, 30.768321990966797]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 8.0, 9.0, 16.0, 16.0, 30.0, 23.0, 38.0, 41.0, 47.0, 67.0, 64.0, 59.0, 52.0, 64.0, 59.0, 64.0, 69.0, 52.0, 27.0, 43.0, 26.0, 33.0, 21.0, 15.0, 14.0, 3.0, 8.0, 8.0, 5.0, 4.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.3742828369140625, -1.317901611328125, -1.2615203857421875, -1.20513916015625, -1.1487579345703125, -1.092376708984375, -1.0359954833984375, -0.9796142578125, -0.9232330322265625, -0.866851806640625, -0.8104705810546875, -0.75408935546875, -0.6977081298828125, -0.641326904296875, -0.5849456787109375, -0.528564453125, -0.4721832275390625, -0.415802001953125, -0.3594207763671875, -0.30303955078125, -0.2466583251953125, -0.190277099609375, -0.1338958740234375, -0.0775146484375, -0.0211334228515625, 0.035247802734375, 0.0916290283203125, 0.14801025390625, 0.2043914794921875, 0.260772705078125, 0.3171539306640625, 0.37353515625, 0.4299163818359375, 0.486297607421875, 0.5426788330078125, 0.59906005859375, 0.6554412841796875, 0.711822509765625, 0.7682037353515625, 0.8245849609375, 0.8809661865234375, 0.937347412109375, 0.9937286376953125, 1.05010986328125, 1.1064910888671875, 1.162872314453125, 1.2192535400390625, 1.275634765625, 1.3320159912109375, 1.388397216796875, 1.4447784423828125, 1.50115966796875, 1.5575408935546875, 1.613922119140625, 1.6703033447265625, 1.7266845703125, 1.7830657958984375, 1.839447021484375, 1.8958282470703125, 1.95220947265625, 2.0085906982421875, 2.064971923828125, 2.1213531494140625, 2.177734375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 15.0, 16.0, 30.0, 34.0, 41.0, 80.0, 131.0, 151.0, 344.0, 714.0, 1926.0, 6215.0, 26205.0, 199978.0, 3804105.0, 125763.0, 19798.0, 5179.0, 1791.0, 763.0, 362.0, 202.0, 134.0, 92.0, 56.0, 38.0, 24.0, 22.0, 17.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.3924560546875, -11.839599609375, -11.2867431640625, -10.73388671875, -10.1810302734375, -9.628173828125, -9.0753173828125, -8.5224609375, -7.9696044921875, -7.416748046875, -6.8638916015625, -6.31103515625, -5.7581787109375, -5.205322265625, -4.6524658203125, -4.099609375, -3.5467529296875, -2.993896484375, -2.4410400390625, -1.88818359375, -1.3353271484375, -0.782470703125, -0.2296142578125, 0.3232421875, 0.8760986328125, 1.428955078125, 1.9818115234375, 2.53466796875, 3.0875244140625, 3.640380859375, 4.1932373046875, 4.74609375, 5.2989501953125, 5.851806640625, 6.4046630859375, 6.95751953125, 7.5103759765625, 8.063232421875, 8.6160888671875, 9.1689453125, 9.7218017578125, 10.274658203125, 10.8275146484375, 11.38037109375, 11.9332275390625, 12.486083984375, 13.0389404296875, 13.591796875, 14.1446533203125, 14.697509765625, 15.2503662109375, 15.80322265625, 16.3560791015625, 16.908935546875, 17.4617919921875, 18.0146484375, 18.5675048828125, 19.120361328125, 19.6732177734375, 20.22607421875, 20.7789306640625, 21.331787109375, 21.8846435546875, 22.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 6.0, 15.0, 35.0, 68.0, 88.0, 197.0, 534.0, 1911.0, 663.0, 258.0, 125.0, 63.0, 40.0, 25.0, 19.0, 8.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9921875, -13.5498046875, -13.107421875, -12.6650390625, -12.22265625, -11.7802734375, -11.337890625, -10.8955078125, -10.453125, -10.0107421875, -9.568359375, -9.1259765625, -8.68359375, -8.2412109375, -7.798828125, -7.3564453125, -6.9140625, -6.4716796875, -6.029296875, -5.5869140625, -5.14453125, -4.7021484375, -4.259765625, -3.8173828125, -3.375, -2.9326171875, -2.490234375, -2.0478515625, -1.60546875, -1.1630859375, -0.720703125, -0.2783203125, 0.1640625, 0.6064453125, 1.048828125, 1.4912109375, 1.93359375, 2.3759765625, 2.818359375, 3.2607421875, 3.703125, 4.1455078125, 4.587890625, 5.0302734375, 5.47265625, 5.9150390625, 6.357421875, 6.7998046875, 7.2421875, 7.6845703125, 8.126953125, 8.5693359375, 9.01171875, 9.4541015625, 9.896484375, 10.3388671875, 10.78125, 11.2236328125, 11.666015625, 12.1083984375, 12.55078125, 12.9931640625, 13.435546875, 13.8779296875, 14.3203125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 17.0, 38.0, 40.0, 66.0, 94.0, 142.0, 256.0, 571.0, 1528.0, 5103.0, 24760.0, 246907.0, 3771734.0, 120822.0, 16099.0, 3772.0, 1178.0, 476.0, 235.0, 141.0, 101.0, 70.0, 39.0, 30.0, 21.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.58349609375, -36.3857421875, -35.18798828125, -33.990234375, -32.79248046875, -31.5947265625, -30.39697265625, -29.19921875, -28.00146484375, -26.8037109375, -25.60595703125, -24.408203125, -23.21044921875, -22.0126953125, -20.81494140625, -19.6171875, -18.41943359375, -17.2216796875, -16.02392578125, -14.826171875, -13.62841796875, -12.4306640625, -11.23291015625, -10.03515625, -8.83740234375, -7.6396484375, -6.44189453125, -5.244140625, -4.04638671875, -2.8486328125, -1.65087890625, -0.453125, 0.74462890625, 1.9423828125, 3.14013671875, 4.337890625, 5.53564453125, 6.7333984375, 7.93115234375, 9.12890625, 10.32666015625, 11.5244140625, 12.72216796875, 13.919921875, 15.11767578125, 16.3154296875, 17.51318359375, 18.7109375, 19.90869140625, 21.1064453125, 22.30419921875, 23.501953125, 24.69970703125, 25.8974609375, 27.09521484375, 28.29296875, 29.49072265625, 30.6884765625, 31.88623046875, 33.083984375, 34.28173828125, 35.4794921875, 36.67724609375, 37.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 15.0, 11.0, 16.0, 36.0, 54.0, 90.0, 97.0, 144.0, 154.0, 118.0, 78.0, 61.0, 31.0, 30.0, 27.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.96833801269531, -54.66822052001953, -53.36810302734375, -52.06798553466797, -50.76786804199219, -49.467750549316406, -48.167633056640625, -46.867515563964844, -45.56739807128906, -44.26728057861328, -42.9671630859375, -41.66704559326172, -40.36692810058594, -39.066810607910156, -37.766693115234375, -36.466575622558594, -35.16645431518555, -33.866336822509766, -32.566219329833984, -31.266101837158203, -29.965984344482422, -28.66586685180664, -27.365747451782227, -26.065629959106445, -24.765512466430664, -23.465394973754883, -22.1652774810791, -20.86515998840332, -19.565040588378906, -18.264923095703125, -16.964805603027344, -15.664688110351562, -14.364574432373047, -13.064456939697266, -11.764339447021484, -10.464221000671387, -9.164103507995605, -7.863986015319824, -6.563868045806885, -5.263750076293945, -3.963632583618164, -2.6635148525238037, -1.3633971214294434, -0.06327939033508301, 1.2368383407592773, 2.5369558334350586, 3.837073802947998, 5.1371917724609375, 6.437309265136719, 7.7374267578125, 9.037544250488281, 10.337662696838379, 11.63778018951416, 12.937897682189941, 14.238016128540039, 15.53813362121582, 16.8382511138916, 18.138368606567383, 19.438486099243164, 20.738603591918945, 22.03872299194336, 23.33884048461914, 24.638957977294922, 25.939075469970703, 27.239192962646484]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 16.0, 9.0, 18.0, 16.0, 14.0, 33.0, 21.0, 28.0, 30.0, 41.0, 50.0, 37.0, 39.0, 39.0, 40.0, 51.0, 35.0, 51.0, 41.0, 38.0, 31.0, 33.0, 35.0, 30.0, 27.0, 10.0, 18.0, 19.0, 26.0, 15.0, 12.0, 16.0, 10.0, 8.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.482481002807617, -20.81058120727539, -20.13867950439453, -19.466779708862305, -18.794879913330078, -18.12297821044922, -17.451078414916992, -16.779178619384766, -16.107276916503906, -15.435376167297363, -14.76347541809082, -14.091575622558594, -13.41967487335205, -12.747774124145508, -12.075874328613281, -11.403973579406738, -10.732072830200195, -10.060172080993652, -9.38827133178711, -8.716371536254883, -8.04447078704834, -7.372570037841797, -6.700669765472412, -6.028769493103027, -5.356868743896484, -4.684967994689941, -4.013067722320557, -3.3411672115325928, -2.669266700744629, -1.997366189956665, -1.3254656791687012, -0.6535654067993164, 0.018337249755859375, 0.6902377605438232, 1.362138271331787, 2.034038782119751, 2.705939292907715, 3.3778398036956787, 4.049740314483643, 4.721640586853027, 5.39354133605957, 6.065442085266113, 6.737342357635498, 7.409242630004883, 8.081143379211426, 8.753044128417969, 9.424943923950195, 10.096844673156738, 10.768745422363281, 11.440646171569824, 12.112546920776367, 12.784446716308594, 13.456347465515137, 14.12824821472168, 14.800148010253906, 15.47204875946045, 16.143949508666992, 16.81584930419922, 17.487751007080078, 18.159650802612305, 18.83155059814453, 19.50345230102539, 20.175352096557617, 20.847251892089844, 21.519153594970703]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 4.0, 8.0, 10.0, 14.0, 12.0, 22.0, 25.0, 30.0, 35.0, 35.0, 35.0, 40.0, 47.0, 60.0, 54.0, 61.0, 59.0, 52.0, 54.0, 56.0, 44.0, 32.0, 34.0, 38.0, 28.0, 29.0, 17.0, 14.0, 13.0, 7.0, 15.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7455596923828125, -1.691314697265625, -1.6370697021484375, -1.58282470703125, -1.5285797119140625, -1.474334716796875, -1.4200897216796875, -1.3658447265625, -1.3115997314453125, -1.257354736328125, -1.2031097412109375, -1.14886474609375, -1.0946197509765625, -1.040374755859375, -0.9861297607421875, -0.931884765625, -0.8776397705078125, -0.823394775390625, -0.7691497802734375, -0.71490478515625, -0.6606597900390625, -0.606414794921875, -0.5521697998046875, -0.4979248046875, -0.4436798095703125, -0.389434814453125, -0.3351898193359375, -0.28094482421875, -0.2266998291015625, -0.172454833984375, -0.1182098388671875, -0.06396484375, -0.0097198486328125, 0.044525146484375, 0.0987701416015625, 0.15301513671875, 0.2072601318359375, 0.261505126953125, 0.3157501220703125, 0.3699951171875, 0.4242401123046875, 0.478485107421875, 0.5327301025390625, 0.58697509765625, 0.6412200927734375, 0.695465087890625, 0.7497100830078125, 0.803955078125, 0.8582000732421875, 0.912445068359375, 0.9666900634765625, 1.02093505859375, 1.0751800537109375, 1.129425048828125, 1.1836700439453125, 1.2379150390625, 1.2921600341796875, 1.346405029296875, 1.4006500244140625, 1.45489501953125, 1.5091400146484375, 1.563385009765625, 1.6176300048828125, 1.671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 16.0, 13.0, 20.0, 20.0, 48.0, 60.0, 103.0, 149.0, 240.0, 362.0, 684.0, 1206.0, 2251.0, 4407.0, 9451.0, 22248.0, 66329.0, 679915.0, 191254.0, 40420.0, 15206.0, 6726.0, 3343.0, 1734.0, 923.0, 526.0, 301.0, 201.0, 140.0, 80.0, 45.0, 44.0, 26.0, 18.0, 15.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.43798828125, -8.1806640625, -7.92333984375, -7.666015625, -7.40869140625, -7.1513671875, -6.89404296875, -6.63671875, -6.37939453125, -6.1220703125, -5.86474609375, -5.607421875, -5.35009765625, -5.0927734375, -4.83544921875, -4.578125, -4.32080078125, -4.0634765625, -3.80615234375, -3.548828125, -3.29150390625, -3.0341796875, -2.77685546875, -2.51953125, -2.26220703125, -2.0048828125, -1.74755859375, -1.490234375, -1.23291015625, -0.9755859375, -0.71826171875, -0.4609375, -0.20361328125, 0.0537109375, 0.31103515625, 0.568359375, 0.82568359375, 1.0830078125, 1.34033203125, 1.59765625, 1.85498046875, 2.1123046875, 2.36962890625, 2.626953125, 2.88427734375, 3.1416015625, 3.39892578125, 3.65625, 3.91357421875, 4.1708984375, 4.42822265625, 4.685546875, 4.94287109375, 5.2001953125, 5.45751953125, 5.71484375, 5.97216796875, 6.2294921875, 6.48681640625, 6.744140625, 7.00146484375, 7.2587890625, 7.51611328125, 7.7734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 2.0, 10.0, 12.0, 13.0, 13.0, 18.0, 20.0, 25.0, 26.0, 36.0, 35.0, 39.0, 32.0, 45.0, 31.0, 43.0, 38.0, 39.0, 1057.0, 46.0, 44.0, 45.0, 42.0, 35.0, 32.0, 31.0, 26.0, 22.0, 19.0, 22.0, 17.0, 17.0, 9.0, 17.0, 14.0, 7.0, 10.0, 7.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.058868408203125, -1.02105712890625, -0.983245849609375, -0.9454345703125, -0.907623291015625, -0.86981201171875, -0.832000732421875, -0.794189453125, -0.756378173828125, -0.71856689453125, -0.680755615234375, -0.6429443359375, -0.605133056640625, -0.56732177734375, -0.529510498046875, -0.49169921875, -0.453887939453125, -0.41607666015625, -0.378265380859375, -0.3404541015625, -0.302642822265625, -0.26483154296875, -0.227020263671875, -0.189208984375, -0.151397705078125, -0.11358642578125, -0.075775146484375, -0.0379638671875, -0.000152587890625, 0.03765869140625, 0.075469970703125, 0.11328125, 0.151092529296875, 0.18890380859375, 0.226715087890625, 0.2645263671875, 0.302337646484375, 0.34014892578125, 0.377960205078125, 0.415771484375, 0.453582763671875, 0.49139404296875, 0.529205322265625, 0.5670166015625, 0.604827880859375, 0.64263916015625, 0.680450439453125, 0.71826171875, 0.756072998046875, 0.79388427734375, 0.831695556640625, 0.8695068359375, 0.907318115234375, 0.94512939453125, 0.982940673828125, 1.020751953125, 1.058563232421875, 1.09637451171875, 1.134185791015625, 1.1719970703125, 1.209808349609375, 1.24761962890625, 1.285430908203125, 1.3232421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 13.0, 12.0, 15.0, 22.0, 25.0, 34.0, 57.0, 75.0, 89.0, 131.0, 197.0, 290.0, 402.0, 590.0, 972.0, 1543.0, 2527.0, 4484.0, 8431.0, 19502.0, 60751.0, 1383133.0, 529715.0, 49483.0, 16652.0, 7581.0, 3949.0, 2268.0, 1377.0, 895.0, 585.0, 405.0, 263.0, 199.0, 109.0, 93.0, 60.0, 48.0, 40.0, 27.0, 19.0, 16.0, 15.0, 3.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.810546875, -2.71966552734375, -2.6287841796875, -2.53790283203125, -2.447021484375, -2.35614013671875, -2.2652587890625, -2.17437744140625, -2.08349609375, -1.99261474609375, -1.9017333984375, -1.81085205078125, -1.719970703125, -1.62908935546875, -1.5382080078125, -1.44732666015625, -1.3564453125, -1.26556396484375, -1.1746826171875, -1.08380126953125, -0.992919921875, -0.90203857421875, -0.8111572265625, -0.72027587890625, -0.62939453125, -0.53851318359375, -0.4476318359375, -0.35675048828125, -0.265869140625, -0.17498779296875, -0.0841064453125, 0.00677490234375, 0.09765625, 0.18853759765625, 0.2794189453125, 0.37030029296875, 0.461181640625, 0.55206298828125, 0.6429443359375, 0.73382568359375, 0.82470703125, 0.91558837890625, 1.0064697265625, 1.09735107421875, 1.188232421875, 1.27911376953125, 1.3699951171875, 1.46087646484375, 1.5517578125, 1.64263916015625, 1.7335205078125, 1.82440185546875, 1.915283203125, 2.00616455078125, 2.0970458984375, 2.18792724609375, 2.27880859375, 2.36968994140625, 2.4605712890625, 2.55145263671875, 2.642333984375, 2.73321533203125, 2.8240966796875, 2.91497802734375, 3.005859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 8.0, 19.0, 149.0, 709.0, 73.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.934814453125, -2.85400390625, -2.773193359375, -2.6923828125, -2.611572265625, -2.53076171875, -2.449951171875, -2.369140625, -2.288330078125, -2.20751953125, -2.126708984375, -2.0458984375, -1.965087890625, -1.88427734375, -1.803466796875, -1.72265625, -1.641845703125, -1.56103515625, -1.480224609375, -1.3994140625, -1.318603515625, -1.23779296875, -1.156982421875, -1.076171875, -0.995361328125, -0.91455078125, -0.833740234375, -0.7529296875, -0.672119140625, -0.59130859375, -0.510498046875, -0.4296875, -0.348876953125, -0.26806640625, -0.187255859375, -0.1064453125, -0.025634765625, 0.05517578125, 0.135986328125, 0.216796875, 0.297607421875, 0.37841796875, 0.459228515625, 0.5400390625, 0.620849609375, 0.70166015625, 0.782470703125, 0.86328125, 0.944091796875, 1.02490234375, 1.105712890625, 1.1865234375, 1.267333984375, 1.34814453125, 1.428955078125, 1.509765625, 1.590576171875, 1.67138671875, 1.752197265625, 1.8330078125, 1.913818359375, 1.99462890625, 2.075439453125, 2.15625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 3.0, 9.0, 12.0, 11.0, 17.0, 28.0, 87.0, 377.0, 3379.0, 1025580.0, 17285.0, 1361.0, 210.0, 74.0, 25.0, 17.0, 9.0, 9.0, 3.0, 4.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.7587890625, -36.673828125, -35.5888671875, -34.50390625, -33.4189453125, -32.333984375, -31.2490234375, -30.1640625, -29.0791015625, -27.994140625, -26.9091796875, -25.82421875, -24.7392578125, -23.654296875, -22.5693359375, -21.484375, -20.3994140625, -19.314453125, -18.2294921875, -17.14453125, -16.0595703125, -14.974609375, -13.8896484375, -12.8046875, -11.7197265625, -10.634765625, -9.5498046875, -8.46484375, -7.3798828125, -6.294921875, -5.2099609375, -4.125, -3.0400390625, -1.955078125, -0.8701171875, 0.21484375, 1.2998046875, 2.384765625, 3.4697265625, 4.5546875, 5.6396484375, 6.724609375, 7.8095703125, 8.89453125, 9.9794921875, 11.064453125, 12.1494140625, 13.234375, 14.3193359375, 15.404296875, 16.4892578125, 17.57421875, 18.6591796875, 19.744140625, 20.8291015625, 21.9140625, 22.9990234375, 24.083984375, 25.1689453125, 26.25390625, 27.3388671875, 28.423828125, 29.5087890625, 30.59375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 12.0, 65.0, 204.0, 488.0, 172.0, 41.0, 19.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.455366611480713, -7.2503156661987305, -7.045264720916748, -6.840213775634766, -6.635162830352783, -6.430111885070801, -6.225060939788818, -6.020009994506836, -5.8149590492248535, -5.609908103942871, -5.404857158660889, -5.199806213378906, -4.994755268096924, -4.789704322814941, -4.584653377532959, -4.379602432250977, -4.174551486968994, -3.9695005416870117, -3.7644495964050293, -3.559398651123047, -3.3543477058410645, -3.149296760559082, -2.9442458152770996, -2.739194869995117, -2.5341439247131348, -2.3290929794311523, -2.12404203414917, -1.9189910888671875, -1.713940143585205, -1.5088891983032227, -1.3038382530212402, -1.0987873077392578, -0.8937363624572754, -0.688685417175293, -0.48363447189331055, -0.2785835266113281, -0.0735325813293457, 0.13151836395263672, 0.33656930923461914, 0.5416202545166016, 0.746671199798584, 0.9517221450805664, 1.1567730903625488, 1.3618240356445312, 1.5668749809265137, 1.771925926208496, 1.9769768714904785, 2.182027816772461, 2.3870787620544434, 2.592129707336426, 2.797180652618408, 3.0022315979003906, 3.207282543182373, 3.4123334884643555, 3.617384433746338, 3.8224353790283203, 4.027486324310303, 4.232537269592285, 4.437588214874268, 4.64263916015625, 4.847690105438232, 5.052741050720215, 5.257791996002197, 5.46284294128418, 5.667893886566162]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 9.0, 5.0, 6.0, 15.0, 16.0, 23.0, 12.0, 25.0, 37.0, 25.0, 33.0, 27.0, 36.0, 37.0, 45.0, 40.0, 34.0, 35.0, 35.0, 34.0, 45.0, 33.0, 42.0, 38.0, 24.0, 30.0, 31.0, 23.0, 32.0, 30.0, 27.0, 16.0, 10.0, 16.0, 12.0, 12.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4209628105163574, -1.3770132064819336, -1.3330636024475098, -1.289113998413086, -1.245164394378662, -1.2012147903442383, -1.1572651863098145, -1.1133155822753906, -1.0693659782409668, -1.025416374206543, -0.9814667701721191, -0.9375171661376953, -0.8935675621032715, -0.8496179580688477, -0.8056683540344238, -0.76171875, -0.7177691459655762, -0.6738195419311523, -0.6298699378967285, -0.5859203338623047, -0.5419707298278809, -0.49802112579345703, -0.4540715217590332, -0.4101219177246094, -0.36617231369018555, -0.3222227096557617, -0.2782731056213379, -0.23432350158691406, -0.19037389755249023, -0.1464242935180664, -0.10247468948364258, -0.05852508544921875, -0.014575481414794922, 0.029374122619628906, 0.07332372665405273, 0.11727333068847656, 0.1612229347229004, 0.20517253875732422, 0.24912214279174805, 0.2930717468261719, 0.3370213508605957, 0.38097095489501953, 0.42492055892944336, 0.4688701629638672, 0.512819766998291, 0.5567693710327148, 0.6007189750671387, 0.6446685791015625, 0.6886181831359863, 0.7325677871704102, 0.776517391204834, 0.8204669952392578, 0.8644165992736816, 0.9083662033081055, 0.9523158073425293, 0.9962654113769531, 1.040215015411377, 1.0841646194458008, 1.1281142234802246, 1.1720638275146484, 1.2160134315490723, 1.259963035583496, 1.30391263961792, 1.3478622436523438, 1.3918118476867676]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 10.0, 19.0, 20.0, 17.0, 32.0, 41.0, 37.0, 45.0, 55.0, 62.0, 64.0, 74.0, 69.0, 61.0, 46.0, 50.0, 49.0, 40.0, 44.0, 34.0, 25.0, 24.0, 15.0, 12.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9296417236328125, -1.868072509765625, -1.8065032958984375, -1.74493408203125, -1.6833648681640625, -1.621795654296875, -1.5602264404296875, -1.4986572265625, -1.4370880126953125, -1.375518798828125, -1.3139495849609375, -1.25238037109375, -1.1908111572265625, -1.129241943359375, -1.0676727294921875, -1.006103515625, -0.9445343017578125, -0.882965087890625, -0.8213958740234375, -0.75982666015625, -0.6982574462890625, -0.636688232421875, -0.5751190185546875, -0.5135498046875, -0.4519805908203125, -0.390411376953125, -0.3288421630859375, -0.26727294921875, -0.2057037353515625, -0.144134521484375, -0.0825653076171875, -0.02099609375, 0.0405731201171875, 0.102142333984375, 0.1637115478515625, 0.22528076171875, 0.2868499755859375, 0.348419189453125, 0.4099884033203125, 0.4715576171875, 0.5331268310546875, 0.594696044921875, 0.6562652587890625, 0.71783447265625, 0.7794036865234375, 0.840972900390625, 0.9025421142578125, 0.964111328125, 1.0256805419921875, 1.087249755859375, 1.1488189697265625, 1.21038818359375, 1.2719573974609375, 1.333526611328125, 1.3950958251953125, 1.4566650390625, 1.5182342529296875, 1.579803466796875, 1.6413726806640625, 1.70294189453125, 1.7645111083984375, 1.826080322265625, 1.8876495361328125, 1.94921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 13.0, 26.0, 43.0, 71.0, 101.0, 159.0, 323.0, 636.0, 1258.0, 2356.0, 4870.0, 11814.0, 31549.0, 109248.0, 485832.0, 295952.0, 66730.0, 21353.0, 8443.0, 3852.0, 1804.0, 969.0, 512.0, 255.0, 156.0, 87.0, 42.0, 28.0, 17.0, 12.0, 6.0, 8.0, 6.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.55206298828125, -5.3775634765625, -5.20306396484375, -5.028564453125, -4.85406494140625, -4.6795654296875, -4.50506591796875, -4.33056640625, -4.15606689453125, -3.9815673828125, -3.80706787109375, -3.632568359375, -3.45806884765625, -3.2835693359375, -3.10906982421875, -2.9345703125, -2.76007080078125, -2.5855712890625, -2.41107177734375, -2.236572265625, -2.06207275390625, -1.8875732421875, -1.71307373046875, -1.53857421875, -1.36407470703125, -1.1895751953125, -1.01507568359375, -0.840576171875, -0.66607666015625, -0.4915771484375, -0.31707763671875, -0.142578125, 0.03192138671875, 0.2064208984375, 0.38092041015625, 0.555419921875, 0.72991943359375, 0.9044189453125, 1.07891845703125, 1.25341796875, 1.42791748046875, 1.6024169921875, 1.77691650390625, 1.951416015625, 2.12591552734375, 2.3004150390625, 2.47491455078125, 2.6494140625, 2.82391357421875, 2.9984130859375, 3.17291259765625, 3.347412109375, 3.52191162109375, 3.6964111328125, 3.87091064453125, 4.04541015625, 4.21990966796875, 4.3944091796875, 4.56890869140625, 4.743408203125, 4.91790771484375, 5.0924072265625, 5.26690673828125, 5.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 11.0, 12.0, 12.0, 16.0, 27.0, 29.0, 41.0, 51.0, 69.0, 104.0, 117.0, 249.0, 1515.0, 264.0, 134.0, 79.0, 66.0, 60.0, 43.0, 27.0, 16.0, 18.0, 19.0, 21.0, 5.0, 5.0, 8.0, 3.0, 9.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.78125, -8.547119140625, -8.31298828125, -8.078857421875, -7.8447265625, -7.610595703125, -7.37646484375, -7.142333984375, -6.908203125, -6.674072265625, -6.43994140625, -6.205810546875, -5.9716796875, -5.737548828125, -5.50341796875, -5.269287109375, -5.03515625, -4.801025390625, -4.56689453125, -4.332763671875, -4.0986328125, -3.864501953125, -3.63037109375, -3.396240234375, -3.162109375, -2.927978515625, -2.69384765625, -2.459716796875, -2.2255859375, -1.991455078125, -1.75732421875, -1.523193359375, -1.2890625, -1.054931640625, -0.82080078125, -0.586669921875, -0.3525390625, -0.118408203125, 0.11572265625, 0.349853515625, 0.583984375, 0.818115234375, 1.05224609375, 1.286376953125, 1.5205078125, 1.754638671875, 1.98876953125, 2.222900390625, 2.45703125, 2.691162109375, 2.92529296875, 3.159423828125, 3.3935546875, 3.627685546875, 3.86181640625, 4.095947265625, 4.330078125, 4.564208984375, 4.79833984375, 5.032470703125, 5.2666015625, 5.500732421875, 5.73486328125, 5.968994140625, 6.203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 12.0, 15.0, 11.0, 16.0, 24.0, 30.0, 37.0, 42.0, 86.0, 247.0, 3052.0, 528091.0, 2606748.0, 6641.0, 334.0, 81.0, 60.0, 35.0, 36.0, 21.0, 18.0, 11.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.21875, -27.177734375, -26.13671875, -25.095703125, -24.0546875, -23.013671875, -21.97265625, -20.931640625, -19.890625, -18.849609375, -17.80859375, -16.767578125, -15.7265625, -14.685546875, -13.64453125, -12.603515625, -11.5625, -10.521484375, -9.48046875, -8.439453125, -7.3984375, -6.357421875, -5.31640625, -4.275390625, -3.234375, -2.193359375, -1.15234375, -0.111328125, 0.9296875, 1.970703125, 3.01171875, 4.052734375, 5.09375, 6.134765625, 7.17578125, 8.216796875, 9.2578125, 10.298828125, 11.33984375, 12.380859375, 13.421875, 14.462890625, 15.50390625, 16.544921875, 17.5859375, 18.626953125, 19.66796875, 20.708984375, 21.75, 22.791015625, 23.83203125, 24.873046875, 25.9140625, 26.955078125, 27.99609375, 29.037109375, 30.078125, 31.119140625, 32.16015625, 33.201171875, 34.2421875, 35.283203125, 36.32421875, 37.365234375, 38.40625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 105.0, 311.0, 411.0, 143.0, 33.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.548988342285156, -15.81141471862793, -14.07384204864502, -12.33626937866211, -10.598695755004883, -8.861122131347656, -7.123549461364746, -5.385976791381836, -3.6484031677246094, -1.910830020904541, -0.17325687408447266, 1.5643162727355957, 3.301889419555664, 5.039463043212891, 6.777035713195801, 8.514608383178711, 10.252182006835938, 11.989755630493164, 13.727328300476074, 15.464900970458984, 17.20247459411621, 18.940048217773438, 20.67761993408203, 22.415193557739258, 24.152767181396484, 25.89034080505371, 27.627914428710938, 29.36548614501953, 31.103059768676758, 32.840633392333984, 34.57820510864258, 36.31578063964844, 38.05335235595703, 39.790924072265625, 41.528499603271484, 43.26607131958008, 45.00364685058594, 46.74121856689453, 48.478790283203125, 50.21636199951172, 51.95393753051758, 53.69150924682617, 55.42908477783203, 57.166656494140625, 58.90422821044922, 60.64180374145508, 62.37937545776367, 64.11695098876953, 65.85452270507812, 67.59209442138672, 69.32966613769531, 71.06724548339844, 72.80481719970703, 74.54238891601562, 76.27996063232422, 78.01753234863281, 79.75511169433594, 81.49268341064453, 83.23025512695312, 84.96783447265625, 86.70540618896484, 88.44297790527344, 90.18054962158203, 91.91812133789062, 93.65569305419922]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 2.0, 6.0, 10.0, 8.0, 17.0, 15.0, 25.0, 17.0, 22.0, 29.0, 28.0, 44.0, 30.0, 45.0, 46.0, 44.0, 45.0, 48.0, 57.0, 40.0, 38.0, 40.0, 42.0, 34.0, 29.0, 36.0, 31.0, 23.0, 19.0, 21.0, 21.0, 18.0, 16.0, 9.0, 11.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-18.908187866210938, -18.34250259399414, -17.776817321777344, -17.211132049560547, -16.64544677734375, -16.079761505126953, -15.514076232910156, -14.94839096069336, -14.382705688476562, -13.817020416259766, -13.251335144042969, -12.685649871826172, -12.119964599609375, -11.554279327392578, -10.988594055175781, -10.422908782958984, -9.857222557067871, -9.291537284851074, -8.725852012634277, -8.16016674041748, -7.594481468200684, -7.028796195983887, -6.463110446929932, -5.897425174713135, -5.331739902496338, -4.766054630279541, -4.200369358062744, -3.634683847427368, -3.0689985752105713, -2.5033133029937744, -1.9376277923583984, -1.3719425201416016, -0.8062572479248047, -0.24057191610336304, 0.3251134157180786, 0.890798807144165, 1.456484079360962, 2.022169351577759, 2.5878548622131348, 3.1535401344299316, 3.7192254066467285, 4.284910678863525, 4.850595951080322, 5.416281700134277, 5.981966972351074, 6.547652244567871, 7.113337516784668, 7.679022789001465, 8.244708061218262, 8.810393333435059, 9.376078605651855, 9.941763877868652, 10.50744915008545, 11.073134422302246, 11.63882064819336, 12.204505920410156, 12.770191192626953, 13.33587646484375, 13.901561737060547, 14.467247009277344, 15.03293228149414, 15.598617553710938, 16.164302825927734, 16.72998809814453, 17.295673370361328]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 9.0, 12.0, 16.0, 20.0, 31.0, 30.0, 36.0, 36.0, 43.0, 50.0, 51.0, 53.0, 55.0, 56.0, 49.0, 46.0, 53.0, 53.0, 36.0, 48.0, 34.0, 36.0, 23.0, 20.0, 16.0, 16.0, 17.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6923980712890625, -1.635772705078125, -1.5791473388671875, -1.52252197265625, -1.4658966064453125, -1.409271240234375, -1.3526458740234375, -1.2960205078125, -1.2393951416015625, -1.182769775390625, -1.1261444091796875, -1.06951904296875, -1.0128936767578125, -0.956268310546875, -0.8996429443359375, -0.843017578125, -0.7863922119140625, -0.729766845703125, -0.6731414794921875, -0.61651611328125, -0.5598907470703125, -0.503265380859375, -0.4466400146484375, -0.3900146484375, -0.3333892822265625, -0.276763916015625, -0.2201385498046875, -0.16351318359375, -0.1068878173828125, -0.050262451171875, 0.0063629150390625, 0.06298828125, 0.1196136474609375, 0.176239013671875, 0.2328643798828125, 0.28948974609375, 0.3461151123046875, 0.402740478515625, 0.4593658447265625, 0.5159912109375, 0.5726165771484375, 0.629241943359375, 0.6858673095703125, 0.74249267578125, 0.7991180419921875, 0.855743408203125, 0.9123687744140625, 0.968994140625, 1.0256195068359375, 1.082244873046875, 1.1388702392578125, 1.19549560546875, 1.2521209716796875, 1.308746337890625, 1.3653717041015625, 1.4219970703125, 1.4786224365234375, 1.535247802734375, 1.5918731689453125, 1.64849853515625, 1.7051239013671875, 1.761749267578125, 1.8183746337890625, 1.875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 16.0, 19.0, 23.0, 39.0, 63.0, 99.0, 161.0, 247.0, 440.0, 763.0, 1389.0, 2432.0, 4509.0, 9173.0, 19044.0, 45304.0, 142590.0, 2512468.0, 1276869.0, 108832.0, 37382.0, 16242.0, 7622.0, 3742.0, 2093.0, 1023.0, 634.0, 368.0, 247.0, 133.0, 93.0, 72.0, 32.0, 27.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.2421875, -7.98388671875, -7.7255859375, -7.46728515625, -7.208984375, -6.95068359375, -6.6923828125, -6.43408203125, -6.17578125, -5.91748046875, -5.6591796875, -5.40087890625, -5.142578125, -4.88427734375, -4.6259765625, -4.36767578125, -4.109375, -3.85107421875, -3.5927734375, -3.33447265625, -3.076171875, -2.81787109375, -2.5595703125, -2.30126953125, -2.04296875, -1.78466796875, -1.5263671875, -1.26806640625, -1.009765625, -0.75146484375, -0.4931640625, -0.23486328125, 0.0234375, 0.28173828125, 0.5400390625, 0.79833984375, 1.056640625, 1.31494140625, 1.5732421875, 1.83154296875, 2.08984375, 2.34814453125, 2.6064453125, 2.86474609375, 3.123046875, 3.38134765625, 3.6396484375, 3.89794921875, 4.15625, 4.41455078125, 4.6728515625, 4.93115234375, 5.189453125, 5.44775390625, 5.7060546875, 5.96435546875, 6.22265625, 6.48095703125, 6.7392578125, 6.99755859375, 7.255859375, 7.51416015625, 7.7724609375, 8.03076171875, 8.2890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 11.0, 17.0, 23.0, 35.0, 54.0, 47.0, 78.0, 110.0, 160.0, 243.0, 453.0, 862.0, 817.0, 435.0, 243.0, 136.0, 97.0, 68.0, 38.0, 39.0, 22.0, 15.0, 13.0, 10.0, 10.0, 8.0, 5.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.63653564453125, -8.3824462890625, -8.12835693359375, -7.874267578125, -7.62017822265625, -7.3660888671875, -7.11199951171875, -6.85791015625, -6.60382080078125, -6.3497314453125, -6.09564208984375, -5.841552734375, -5.58746337890625, -5.3333740234375, -5.07928466796875, -4.8251953125, -4.57110595703125, -4.3170166015625, -4.06292724609375, -3.808837890625, -3.55474853515625, -3.3006591796875, -3.04656982421875, -2.79248046875, -2.53839111328125, -2.2843017578125, -2.03021240234375, -1.776123046875, -1.52203369140625, -1.2679443359375, -1.01385498046875, -0.759765625, -0.50567626953125, -0.2515869140625, 0.00250244140625, 0.256591796875, 0.51068115234375, 0.7647705078125, 1.01885986328125, 1.27294921875, 1.52703857421875, 1.7811279296875, 2.03521728515625, 2.289306640625, 2.54339599609375, 2.7974853515625, 3.05157470703125, 3.3056640625, 3.55975341796875, 3.8138427734375, 4.06793212890625, 4.322021484375, 4.57611083984375, 4.8302001953125, 5.08428955078125, 5.33837890625, 5.59246826171875, 5.8465576171875, 6.10064697265625, 6.354736328125, 6.60882568359375, 6.8629150390625, 7.11700439453125, 7.37109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 6.0, 16.0, 33.0, 45.0, 83.0, 133.0, 211.0, 333.0, 617.0, 1089.0, 2109.0, 4169.0, 8404.0, 18610.0, 47134.0, 151846.0, 1340661.0, 2332577.0, 189572.0, 56206.0, 21460.0, 9447.0, 4509.0, 2160.0, 1175.0, 659.0, 404.0, 192.0, 148.0, 90.0, 45.0, 40.0, 23.0, 18.0, 18.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.39208984375, -14.9404296875, -14.48876953125, -14.037109375, -13.58544921875, -13.1337890625, -12.68212890625, -12.23046875, -11.77880859375, -11.3271484375, -10.87548828125, -10.423828125, -9.97216796875, -9.5205078125, -9.06884765625, -8.6171875, -8.16552734375, -7.7138671875, -7.26220703125, -6.810546875, -6.35888671875, -5.9072265625, -5.45556640625, -5.00390625, -4.55224609375, -4.1005859375, -3.64892578125, -3.197265625, -2.74560546875, -2.2939453125, -1.84228515625, -1.390625, -0.93896484375, -0.4873046875, -0.03564453125, 0.416015625, 0.86767578125, 1.3193359375, 1.77099609375, 2.22265625, 2.67431640625, 3.1259765625, 3.57763671875, 4.029296875, 4.48095703125, 4.9326171875, 5.38427734375, 5.8359375, 6.28759765625, 6.7392578125, 7.19091796875, 7.642578125, 8.09423828125, 8.5458984375, 8.99755859375, 9.44921875, 9.90087890625, 10.3525390625, 10.80419921875, 11.255859375, 11.70751953125, 12.1591796875, 12.61083984375, 13.0625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 17.0, 30.0, 35.0, 72.0, 139.0, 220.0, 203.0, 116.0, 72.0, 30.0, 33.0, 14.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.809171676635742, -23.043285369873047, -21.27739906311035, -19.511512756347656, -17.745624542236328, -15.97973918914795, -14.213851928710938, -12.447965621948242, -10.682079315185547, -8.916193008422852, -7.150306224822998, -5.3844194412231445, -3.618533134460449, -1.852646827697754, -0.08675956726074219, 1.6791267395019531, 3.4450130462646484, 5.210899353027344, 6.976786136627197, 8.74267292022705, 10.508559226989746, 12.274445533752441, 14.040332794189453, 15.806219100952148, 17.572105407714844, 19.33799171447754, 21.103878021240234, 22.869766235351562, 24.635650634765625, 26.401538848876953, 28.16742515563965, 29.933311462402344, 31.699195861816406, 33.465084075927734, 35.2309684753418, 36.996856689453125, 38.76274108886719, 40.528629302978516, 42.294517517089844, 44.060401916503906, 45.82628631591797, 47.5921745300293, 49.35805892944336, 51.12394714355469, 52.88983154296875, 54.65571975708008, 56.421607971191406, 58.18749237060547, 59.9533805847168, 61.719268798828125, 63.48515319824219, 65.25103759765625, 67.01692962646484, 68.7828140258789, 70.54869842529297, 72.31459045410156, 74.08047485351562, 75.84635925292969, 77.61225128173828, 79.37813568115234, 81.1440200805664, 82.90990447998047, 84.67579650878906, 86.44168090820312, 88.20756530761719]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 8.0, 13.0, 17.0, 15.0, 21.0, 16.0, 21.0, 25.0, 23.0, 26.0, 26.0, 28.0, 35.0, 42.0, 34.0, 34.0, 30.0, 32.0, 43.0, 42.0, 37.0, 24.0, 32.0, 27.0, 30.0, 22.0, 26.0, 21.0, 39.0, 20.0, 20.0, 23.0, 23.0, 20.0, 14.0, 14.0, 8.0, 10.0, 11.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.984928131103516, -18.428075790405273, -17.87122344970703, -17.31437110900879, -16.757518768310547, -16.200666427612305, -15.643814086914062, -15.08696174621582, -14.530109405517578, -13.973257064819336, -13.416404724121094, -12.859552383422852, -12.30270004272461, -11.745847702026367, -11.188995361328125, -10.632143020629883, -10.075289726257324, -9.518437385559082, -8.96158504486084, -8.404732704162598, -7.8478803634643555, -7.291028022766113, -6.734175205230713, -6.177322864532471, -5.6204705238342285, -5.063618183135986, -4.506765842437744, -3.949913263320923, -3.3930609226226807, -2.8362085819244385, -2.279356002807617, -1.722503662109375, -1.1656513214111328, -0.6087989211082458, -0.05194652080535889, 0.5049059391021729, 1.061758279800415, 1.6186106204986572, 2.1754631996154785, 2.7323155403137207, 3.289167881011963, 3.846020221710205, 4.402872562408447, 4.959725379943848, 5.51657772064209, 6.073430061340332, 6.630282402038574, 7.187134742736816, 7.743987083435059, 8.3008394241333, 8.857691764831543, 9.414544105529785, 9.971396446228027, 10.52824878692627, 11.085102081298828, 11.64195442199707, 12.198806762695312, 12.755659103393555, 13.312511444091797, 13.869363784790039, 14.426216125488281, 14.983068466186523, 15.539920806884766, 16.096773147583008, 16.65362548828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 7.0, 7.0, 9.0, 13.0, 13.0, 18.0, 20.0, 25.0, 23.0, 36.0, 28.0, 28.0, 30.0, 47.0, 49.0, 49.0, 50.0, 48.0, 59.0, 60.0, 54.0, 36.0, 38.0, 44.0, 25.0, 21.0, 25.0, 24.0, 27.0, 13.0, 15.0, 12.0, 9.0, 12.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6366424560546875, -1.584808349609375, -1.5329742431640625, -1.48114013671875, -1.4293060302734375, -1.377471923828125, -1.3256378173828125, -1.2738037109375, -1.2219696044921875, -1.170135498046875, -1.1183013916015625, -1.06646728515625, -1.0146331787109375, -0.962799072265625, -0.9109649658203125, -0.859130859375, -0.8072967529296875, -0.755462646484375, -0.7036285400390625, -0.65179443359375, -0.5999603271484375, -0.548126220703125, -0.4962921142578125, -0.4444580078125, -0.3926239013671875, -0.340789794921875, -0.2889556884765625, -0.23712158203125, -0.1852874755859375, -0.133453369140625, -0.0816192626953125, -0.02978515625, 0.0220489501953125, 0.073883056640625, 0.1257171630859375, 0.17755126953125, 0.2293853759765625, 0.281219482421875, 0.3330535888671875, 0.3848876953125, 0.4367218017578125, 0.488555908203125, 0.5403900146484375, 0.59222412109375, 0.6440582275390625, 0.695892333984375, 0.7477264404296875, 0.799560546875, 0.8513946533203125, 0.903228759765625, 0.9550628662109375, 1.00689697265625, 1.0587310791015625, 1.110565185546875, 1.1623992919921875, 1.2142333984375, 1.2660675048828125, 1.317901611328125, 1.3697357177734375, 1.42156982421875, 1.4734039306640625, 1.525238037109375, 1.5770721435546875, 1.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 7.0, 6.0, 9.0, 20.0, 22.0, 45.0, 59.0, 82.0, 120.0, 191.0, 326.0, 494.0, 722.0, 1188.0, 1899.0, 3161.0, 5391.0, 9684.0, 18303.0, 39062.0, 104645.0, 453598.0, 271888.0, 73123.0, 30123.0, 14815.0, 7935.0, 4505.0, 2621.0, 1626.0, 1074.0, 609.0, 421.0, 263.0, 157.0, 95.0, 90.0, 43.0, 29.0, 25.0, 17.0, 13.0, 15.0, 9.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-8.6640625, -8.41534423828125, -8.1666259765625, -7.91790771484375, -7.669189453125, -7.42047119140625, -7.1717529296875, -6.92303466796875, -6.67431640625, -6.42559814453125, -6.1768798828125, -5.92816162109375, -5.679443359375, -5.43072509765625, -5.1820068359375, -4.93328857421875, -4.6845703125, -4.43585205078125, -4.1871337890625, -3.93841552734375, -3.689697265625, -3.44097900390625, -3.1922607421875, -2.94354248046875, -2.69482421875, -2.44610595703125, -2.1973876953125, -1.94866943359375, -1.699951171875, -1.45123291015625, -1.2025146484375, -0.95379638671875, -0.705078125, -0.45635986328125, -0.2076416015625, 0.04107666015625, 0.289794921875, 0.53851318359375, 0.7872314453125, 1.03594970703125, 1.28466796875, 1.53338623046875, 1.7821044921875, 2.03082275390625, 2.279541015625, 2.52825927734375, 2.7769775390625, 3.02569580078125, 3.2744140625, 3.52313232421875, 3.7718505859375, 4.02056884765625, 4.269287109375, 4.51800537109375, 4.7667236328125, 5.01544189453125, 5.26416015625, 5.51287841796875, 5.7615966796875, 6.01031494140625, 6.259033203125, 6.50775146484375, 6.7564697265625, 7.00518798828125, 7.25390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 2.0, 10.0, 12.0, 8.0, 10.0, 16.0, 9.0, 20.0, 33.0, 41.0, 40.0, 41.0, 35.0, 30.0, 51.0, 50.0, 35.0, 1065.0, 46.0, 40.0, 38.0, 48.0, 47.0, 42.0, 34.0, 33.0, 29.0, 35.0, 20.0, 16.0, 21.0, 7.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2813262939453125, -1.239410400390625, -1.1974945068359375, -1.15557861328125, -1.1136627197265625, -1.071746826171875, -1.0298309326171875, -0.9879150390625, -0.9459991455078125, -0.904083251953125, -0.8621673583984375, -0.82025146484375, -0.7783355712890625, -0.736419677734375, -0.6945037841796875, -0.652587890625, -0.6106719970703125, -0.568756103515625, -0.5268402099609375, -0.48492431640625, -0.4430084228515625, -0.401092529296875, -0.3591766357421875, -0.3172607421875, -0.2753448486328125, -0.233428955078125, -0.1915130615234375, -0.14959716796875, -0.1076812744140625, -0.065765380859375, -0.0238494873046875, 0.01806640625, 0.0599822998046875, 0.101898193359375, 0.1438140869140625, 0.18572998046875, 0.2276458740234375, 0.269561767578125, 0.3114776611328125, 0.3533935546875, 0.3953094482421875, 0.437225341796875, 0.4791412353515625, 0.52105712890625, 0.5629730224609375, 0.604888916015625, 0.6468048095703125, 0.688720703125, 0.7306365966796875, 0.772552490234375, 0.8144683837890625, 0.85638427734375, 0.8983001708984375, 0.940216064453125, 0.9821319580078125, 1.0240478515625, 1.0659637451171875, 1.107879638671875, 1.1497955322265625, 1.19171142578125, 1.2336273193359375, 1.275543212890625, 1.3174591064453125, 1.359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 8.0, 16.0, 19.0, 24.0, 43.0, 49.0, 70.0, 83.0, 142.0, 213.0, 274.0, 400.0, 624.0, 880.0, 1410.0, 2124.0, 3360.0, 5928.0, 11335.0, 26321.0, 84356.0, 1206892.0, 629569.0, 73494.0, 24076.0, 10481.0, 5511.0, 3260.0, 2039.0, 1249.0, 861.0, 576.0, 403.0, 279.0, 217.0, 131.0, 98.0, 64.0, 64.0, 43.0, 34.0, 19.0, 17.0, 9.0, 17.0, 3.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.83203125, -5.64361572265625, -5.4552001953125, -5.26678466796875, -5.078369140625, -4.88995361328125, -4.7015380859375, -4.51312255859375, -4.32470703125, -4.13629150390625, -3.9478759765625, -3.75946044921875, -3.571044921875, -3.38262939453125, -3.1942138671875, -3.00579833984375, -2.8173828125, -2.62896728515625, -2.4405517578125, -2.25213623046875, -2.063720703125, -1.87530517578125, -1.6868896484375, -1.49847412109375, -1.31005859375, -1.12164306640625, -0.9332275390625, -0.74481201171875, -0.556396484375, -0.36798095703125, -0.1795654296875, 0.00885009765625, 0.197265625, 0.38568115234375, 0.5740966796875, 0.76251220703125, 0.950927734375, 1.13934326171875, 1.3277587890625, 1.51617431640625, 1.70458984375, 1.89300537109375, 2.0814208984375, 2.26983642578125, 2.458251953125, 2.64666748046875, 2.8350830078125, 3.02349853515625, 3.2119140625, 3.40032958984375, 3.5887451171875, 3.77716064453125, 3.965576171875, 4.15399169921875, 4.3424072265625, 4.53082275390625, 4.71923828125, 4.90765380859375, 5.0960693359375, 5.28448486328125, 5.472900390625, 5.66131591796875, 5.8497314453125, 6.03814697265625, 6.2265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 14.0, 49.0, 182.0, 521.0, 80.0, 27.0, 14.0, 11.0, 10.0, 7.0, 5.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.212493896484375, -3.09881591796875, -2.985137939453125, -2.8714599609375, -2.757781982421875, -2.64410400390625, -2.530426025390625, -2.416748046875, -2.303070068359375, -2.18939208984375, -2.075714111328125, -1.9620361328125, -1.848358154296875, -1.73468017578125, -1.621002197265625, -1.50732421875, -1.393646240234375, -1.27996826171875, -1.166290283203125, -1.0526123046875, -0.938934326171875, -0.82525634765625, -0.711578369140625, -0.597900390625, -0.484222412109375, -0.37054443359375, -0.256866455078125, -0.1431884765625, -0.029510498046875, 0.08416748046875, 0.197845458984375, 0.3115234375, 0.425201416015625, 0.53887939453125, 0.652557373046875, 0.7662353515625, 0.879913330078125, 0.99359130859375, 1.107269287109375, 1.220947265625, 1.334625244140625, 1.44830322265625, 1.561981201171875, 1.6756591796875, 1.789337158203125, 1.90301513671875, 2.016693115234375, 2.13037109375, 2.244049072265625, 2.35772705078125, 2.471405029296875, 2.5850830078125, 2.698760986328125, 2.81243896484375, 2.926116943359375, 3.039794921875, 3.153472900390625, 3.26715087890625, 3.380828857421875, 3.4945068359375, 3.608184814453125, 3.72186279296875, 3.835540771484375, 3.94921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 11.0, 19.0, 22.0, 37.0, 48.0, 103.0, 309.0, 1315.0, 9255.0, 1002341.0, 31241.0, 2921.0, 543.0, 171.0, 65.0, 46.0, 26.0, 20.0, 8.0, 4.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.8125, -53.23388671875, -51.6552734375, -50.07666015625, -48.498046875, -46.91943359375, -45.3408203125, -43.76220703125, -42.18359375, -40.60498046875, -39.0263671875, -37.44775390625, -35.869140625, -34.29052734375, -32.7119140625, -31.13330078125, -29.5546875, -27.97607421875, -26.3974609375, -24.81884765625, -23.240234375, -21.66162109375, -20.0830078125, -18.50439453125, -16.92578125, -15.34716796875, -13.7685546875, -12.18994140625, -10.611328125, -9.03271484375, -7.4541015625, -5.87548828125, -4.296875, -2.71826171875, -1.1396484375, 0.43896484375, 2.017578125, 3.59619140625, 5.1748046875, 6.75341796875, 8.33203125, 9.91064453125, 11.4892578125, 13.06787109375, 14.646484375, 16.22509765625, 17.8037109375, 19.38232421875, 20.9609375, 22.53955078125, 24.1181640625, 25.69677734375, 27.275390625, 28.85400390625, 30.4326171875, 32.01123046875, 33.58984375, 35.16845703125, 36.7470703125, 38.32568359375, 39.904296875, 41.48291015625, 43.0615234375, 44.64013671875, 46.21875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 8.0, 5.0, 17.0, 27.0, 16.0, 46.0, 66.0, 71.0, 139.0, 140.0, 114.0, 94.0, 57.0, 36.0, 29.0, 25.0, 14.0, 17.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6988325119018555, -2.601017475128174, -2.503202438354492, -2.4053874015808105, -2.307572364807129, -2.2097573280334473, -2.1119422912597656, -2.014127492904663, -1.9163124561309814, -1.8184974193572998, -1.7206823825836182, -1.6228673458099365, -1.5250524282455444, -1.4272373914718628, -1.3294223546981812, -1.231607437133789, -1.1337922811508179, -1.0359772443771362, -0.9381622672080994, -0.8403472304344177, -0.7425322532653809, -0.6447172164916992, -0.5469021797180176, -0.4490872025489807, -0.3512721657752991, -0.2534571588039398, -0.15564213693141937, -0.057827115058898926, 0.03998789191246033, 0.13780289888381958, 0.23561793565750122, 0.3334329128265381, 0.4312479496002197, 0.5290629863739014, 0.6268779635429382, 0.7246930003166199, 0.8225079774856567, 0.9203230142593384, 1.01813805103302, 1.115952968597412, 1.2137680053710938, 1.3115830421447754, 1.409398078918457, 1.5072131156921387, 1.6050280332565308, 1.7028430700302124, 1.800658106803894, 1.8984730243682861, 1.9962881803512573, 2.0941030979156494, 2.191918134689331, 2.2897331714630127, 2.3875482082366943, 2.485363245010376, 2.5831782817840576, 2.6809933185577393, 2.778808355331421, 2.8766233921051025, 2.974438428878784, 3.072253465652466, 3.1700685024261475, 3.26788330078125, 3.3656983375549316, 3.4635133743286133, 3.561328411102295]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 10.0, 14.0, 11.0, 13.0, 7.0, 22.0, 28.0, 21.0, 29.0, 31.0, 29.0, 45.0, 46.0, 30.0, 48.0, 40.0, 59.0, 50.0, 44.0, 45.0, 47.0, 36.0, 37.0, 36.0, 25.0, 29.0, 31.0, 28.0, 21.0, 11.0, 14.0, 12.0, 14.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5662386417388916, -2.489405632019043, -2.4125723838806152, -2.3357393741607666, -2.258906364440918, -2.1820731163024902, -2.1052401065826416, -2.028407096862793, -1.9515738487243652, -1.874740719795227, -1.7979077100753784, -1.7210745811462402, -1.644241452217102, -1.5674083232879639, -1.4905753135681152, -1.413742184638977, -1.3369091749191284, -1.2600760459899902, -1.1832430362701416, -1.1064099073410034, -1.0295767784118652, -0.9527437090873718, -0.8759106397628784, -0.7990775108337402, -0.7222444415092468, -0.6454113721847534, -0.5685782432556152, -0.4917451739311218, -0.41491207480430603, -0.33807897567749023, -0.2612459063529968, -0.18441277742385864, -0.10757970809936523, -0.030746616423130035, 0.046086475253105164, 0.12291955947875977, 0.19975265860557556, 0.27658575773239136, 0.35341882705688477, 0.43025195598602295, 0.5070850253105164, 0.5839180946350098, 0.660751223564148, 0.7375842928886414, 0.8144173622131348, 0.891250491142273, 0.9680835604667664, 1.0449166297912598, 1.121749758720398, 1.1985828876495361, 1.2754158973693848, 1.352249026298523, 1.4290821552276611, 1.5059151649475098, 1.582748293876648, 1.6595814228057861, 1.7364144325256348, 1.813247561454773, 1.8900805711746216, 1.9669137001037598, 2.0437467098236084, 2.120579957962036, 2.1974129676818848, 2.2742462158203125, 2.351079225540161]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 10.0, 4.0, 10.0, 15.0, 17.0, 13.0, 19.0, 24.0, 22.0, 27.0, 36.0, 30.0, 35.0, 46.0, 52.0, 38.0, 50.0, 58.0, 52.0, 53.0, 50.0, 42.0, 48.0, 40.0, 29.0, 23.0, 25.0, 22.0, 21.0, 12.0, 16.0, 9.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4736785888671875, -1.421966552734375, -1.3702545166015625, -1.31854248046875, -1.2668304443359375, -1.215118408203125, -1.1634063720703125, -1.1116943359375, -1.0599822998046875, -1.008270263671875, -0.9565582275390625, -0.90484619140625, -0.8531341552734375, -0.801422119140625, -0.7497100830078125, -0.697998046875, -0.6462860107421875, -0.594573974609375, -0.5428619384765625, -0.49114990234375, -0.4394378662109375, -0.387725830078125, -0.3360137939453125, -0.2843017578125, -0.2325897216796875, -0.180877685546875, -0.1291656494140625, -0.07745361328125, -0.0257415771484375, 0.025970458984375, 0.0776824951171875, 0.12939453125, 0.1811065673828125, 0.232818603515625, 0.2845306396484375, 0.33624267578125, 0.3879547119140625, 0.439666748046875, 0.4913787841796875, 0.5430908203125, 0.5948028564453125, 0.646514892578125, 0.6982269287109375, 0.74993896484375, 0.8016510009765625, 0.853363037109375, 0.9050750732421875, 0.956787109375, 1.0084991455078125, 1.060211181640625, 1.1119232177734375, 1.16363525390625, 1.2153472900390625, 1.267059326171875, 1.3187713623046875, 1.3704833984375, 1.4221954345703125, 1.473907470703125, 1.5256195068359375, 1.57733154296875, 1.6290435791015625, 1.680755615234375, 1.7324676513671875, 1.7841796875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 20.0, 21.0, 48.0, 63.0, 101.0, 146.0, 252.0, 426.0, 799.0, 1555.0, 3268.0, 7324.0, 19001.0, 64964.0, 405593.0, 440507.0, 69748.0, 20190.0, 7629.0, 3264.0, 1549.0, 864.0, 469.0, 267.0, 165.0, 108.0, 61.0, 40.0, 32.0, 11.0, 9.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9349365234375, -5.760498046875, -5.5860595703125, -5.41162109375, -5.2371826171875, -5.062744140625, -4.8883056640625, -4.7138671875, -4.5394287109375, -4.364990234375, -4.1905517578125, -4.01611328125, -3.8416748046875, -3.667236328125, -3.4927978515625, -3.318359375, -3.1439208984375, -2.969482421875, -2.7950439453125, -2.62060546875, -2.4461669921875, -2.271728515625, -2.0972900390625, -1.9228515625, -1.7484130859375, -1.573974609375, -1.3995361328125, -1.22509765625, -1.0506591796875, -0.876220703125, -0.7017822265625, -0.52734375, -0.3529052734375, -0.178466796875, -0.0040283203125, 0.17041015625, 0.3448486328125, 0.519287109375, 0.6937255859375, 0.8681640625, 1.0426025390625, 1.217041015625, 1.3914794921875, 1.56591796875, 1.7403564453125, 1.914794921875, 2.0892333984375, 2.263671875, 2.4381103515625, 2.612548828125, 2.7869873046875, 2.96142578125, 3.1358642578125, 3.310302734375, 3.4847412109375, 3.6591796875, 3.8336181640625, 4.008056640625, 4.1824951171875, 4.35693359375, 4.5313720703125, 4.705810546875, 4.8802490234375, 5.0546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 13.0, 10.0, 7.0, 14.0, 14.0, 18.0, 19.0, 23.0, 32.0, 28.0, 31.0, 32.0, 38.0, 57.0, 67.0, 78.0, 131.0, 293.0, 1410.0, 158.0, 88.0, 80.0, 60.0, 39.0, 40.0, 37.0, 37.0, 28.0, 22.0, 22.0, 21.0, 15.0, 14.0, 10.0, 12.0, 7.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.64453125, -6.45556640625, -6.2666015625, -6.07763671875, -5.888671875, -5.69970703125, -5.5107421875, -5.32177734375, -5.1328125, -4.94384765625, -4.7548828125, -4.56591796875, -4.376953125, -4.18798828125, -3.9990234375, -3.81005859375, -3.62109375, -3.43212890625, -3.2431640625, -3.05419921875, -2.865234375, -2.67626953125, -2.4873046875, -2.29833984375, -2.109375, -1.92041015625, -1.7314453125, -1.54248046875, -1.353515625, -1.16455078125, -0.9755859375, -0.78662109375, -0.59765625, -0.40869140625, -0.2197265625, -0.03076171875, 0.158203125, 0.34716796875, 0.5361328125, 0.72509765625, 0.9140625, 1.10302734375, 1.2919921875, 1.48095703125, 1.669921875, 1.85888671875, 2.0478515625, 2.23681640625, 2.42578125, 2.61474609375, 2.8037109375, 2.99267578125, 3.181640625, 3.37060546875, 3.5595703125, 3.74853515625, 3.9375, 4.12646484375, 4.3154296875, 4.50439453125, 4.693359375, 4.88232421875, 5.0712890625, 5.26025390625, 5.44921875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 5.0, 11.0, 19.0, 17.0, 23.0, 31.0, 47.0, 76.0, 105.0, 203.0, 369.0, 755.0, 1600.0, 3776.0, 9398.0, 26711.0, 104771.0, 938916.0, 1853056.0, 150674.0, 35031.0, 11654.0, 4638.0, 1823.0, 874.0, 468.0, 226.0, 148.0, 85.0, 51.0, 29.0, 26.0, 20.0, 9.0, 11.0, 9.0, 8.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.521484375, -7.25390625, -6.986328125, -6.71875, -6.451171875, -6.18359375, -5.916015625, -5.6484375, -5.380859375, -5.11328125, -4.845703125, -4.578125, -4.310546875, -4.04296875, -3.775390625, -3.5078125, -3.240234375, -2.97265625, -2.705078125, -2.4375, -2.169921875, -1.90234375, -1.634765625, -1.3671875, -1.099609375, -0.83203125, -0.564453125, -0.296875, -0.029296875, 0.23828125, 0.505859375, 0.7734375, 1.041015625, 1.30859375, 1.576171875, 1.84375, 2.111328125, 2.37890625, 2.646484375, 2.9140625, 3.181640625, 3.44921875, 3.716796875, 3.984375, 4.251953125, 4.51953125, 4.787109375, 5.0546875, 5.322265625, 5.58984375, 5.857421875, 6.125, 6.392578125, 6.66015625, 6.927734375, 7.1953125, 7.462890625, 7.73046875, 7.998046875, 8.265625, 8.533203125, 8.80078125, 9.068359375, 9.3359375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 10.0, 78.0, 349.0, 436.0, 121.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.652995109558105, -13.462892532348633, -11.272789001464844, -9.082686424255371, -6.892583847045898, -4.702481269836426, -2.5123777389526367, -0.32227516174316406, 1.8678274154663086, 4.057929992675781, 6.248033046722412, 8.438136100769043, 10.628238677978516, 12.818341255187988, 15.008444786071777, 17.19854736328125, 19.388648986816406, 21.578752517700195, 23.76885414123535, 25.95895767211914, 28.149059295654297, 30.339162826538086, 32.529266357421875, 34.71936798095703, 36.90947341918945, 39.09957504272461, 41.28968048095703, 43.47978210449219, 45.669883728027344, 47.8599853515625, 50.05009078979492, 52.24019241333008, 54.43029022216797, 56.620391845703125, 58.81049728393555, 61.0005989074707, 63.19070053100586, 65.38080596923828, 67.57090759277344, 69.7610092163086, 71.95111083984375, 74.1412124633789, 76.33131408691406, 78.52142333984375, 80.7115249633789, 82.90162658691406, 85.09172821044922, 87.28182983398438, 89.47193908691406, 91.66204071044922, 93.85214233398438, 96.04225158691406, 98.23235321044922, 100.42245483398438, 102.61255645751953, 104.80265808105469, 106.99275970458984, 109.182861328125, 111.37296295166016, 113.56306457519531, 115.753173828125, 117.94327545166016, 120.13337707519531, 122.32347869873047, 124.51358032226562]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 15.0, 11.0, 21.0, 12.0, 14.0, 19.0, 24.0, 24.0, 36.0, 36.0, 36.0, 29.0, 35.0, 46.0, 69.0, 31.0, 39.0, 43.0, 43.0, 46.0, 40.0, 45.0, 47.0, 26.0, 17.0, 32.0, 20.0, 25.0, 21.0, 9.0, 11.0, 13.0, 4.0, 10.0, 4.0, 2.0, 6.0, 7.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.92365074157715, -21.245601654052734, -20.56755256652832, -19.889503479003906, -19.21145248413086, -18.533403396606445, -17.85535430908203, -17.177305221557617, -16.499256134033203, -15.821207046508789, -15.143157005310059, -14.465107917785645, -13.787057876586914, -13.1090087890625, -12.430959701538086, -11.752910614013672, -11.074859619140625, -10.396810531616211, -9.71876049041748, -9.040711402893066, -8.362661361694336, -7.684612274169922, -7.006563186645508, -6.3285136222839355, -5.650464057922363, -4.972414493560791, -4.294364929199219, -3.6163158416748047, -2.9382662773132324, -2.26021671295166, -1.582167625427246, -0.9041180610656738, -0.22606849670410156, 0.45198094844818115, 1.1300303936004639, 1.808079719543457, 2.4861292839050293, 3.1641788482666016, 3.8422279357910156, 4.520277500152588, 5.19832706451416, 5.876376628875732, 6.554426193237305, 7.232475280761719, 7.910524845123291, 8.588574409484863, 9.266623497009277, 9.944673538208008, 10.622722625732422, 11.300771713256836, 11.978821754455566, 12.65687084197998, 13.334920883178711, 14.012969970703125, 14.691019058227539, 15.369068145751953, 16.047119140625, 16.725168228149414, 17.403217315673828, 18.081268310546875, 18.75931739807129, 19.437366485595703, 20.115415573120117, 20.79346466064453, 21.471513748168945]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 12.0, 20.0, 18.0, 24.0, 24.0, 27.0, 29.0, 38.0, 28.0, 38.0, 46.0, 52.0, 55.0, 49.0, 55.0, 60.0, 42.0, 41.0, 50.0, 47.0, 49.0, 37.0, 24.0, 18.0, 21.0, 21.0, 9.0, 14.0, 8.0, 5.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.798919677734375, -1.73944091796875, -1.679962158203125, -1.6204833984375, -1.561004638671875, -1.50152587890625, -1.442047119140625, -1.382568359375, -1.323089599609375, -1.26361083984375, -1.204132080078125, -1.1446533203125, -1.085174560546875, -1.02569580078125, -0.966217041015625, -0.90673828125, -0.847259521484375, -0.78778076171875, -0.728302001953125, -0.6688232421875, -0.609344482421875, -0.54986572265625, -0.490386962890625, -0.430908203125, -0.371429443359375, -0.31195068359375, -0.252471923828125, -0.1929931640625, -0.133514404296875, -0.07403564453125, -0.014556884765625, 0.044921875, 0.104400634765625, 0.16387939453125, 0.223358154296875, 0.2828369140625, 0.342315673828125, 0.40179443359375, 0.461273193359375, 0.520751953125, 0.580230712890625, 0.63970947265625, 0.699188232421875, 0.7586669921875, 0.818145751953125, 0.87762451171875, 0.937103271484375, 0.99658203125, 1.056060791015625, 1.11553955078125, 1.175018310546875, 1.2344970703125, 1.293975830078125, 1.35345458984375, 1.412933349609375, 1.472412109375, 1.531890869140625, 1.59136962890625, 1.650848388671875, 1.7103271484375, 1.769805908203125, 1.82928466796875, 1.888763427734375, 1.9482421875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 16.0, 23.0, 23.0, 36.0, 63.0, 129.0, 198.0, 399.0, 863.0, 2439.0, 8102.0, 31760.0, 256106.0, 3760769.0, 106491.0, 18688.0, 5237.0, 1573.0, 620.0, 285.0, 175.0, 103.0, 56.0, 40.0, 17.0, 17.0, 17.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.17431640625, -12.6923828125, -12.21044921875, -11.728515625, -11.24658203125, -10.7646484375, -10.28271484375, -9.80078125, -9.31884765625, -8.8369140625, -8.35498046875, -7.873046875, -7.39111328125, -6.9091796875, -6.42724609375, -5.9453125, -5.46337890625, -4.9814453125, -4.49951171875, -4.017578125, -3.53564453125, -3.0537109375, -2.57177734375, -2.08984375, -1.60791015625, -1.1259765625, -0.64404296875, -0.162109375, 0.31982421875, 0.8017578125, 1.28369140625, 1.765625, 2.24755859375, 2.7294921875, 3.21142578125, 3.693359375, 4.17529296875, 4.6572265625, 5.13916015625, 5.62109375, 6.10302734375, 6.5849609375, 7.06689453125, 7.548828125, 8.03076171875, 8.5126953125, 8.99462890625, 9.4765625, 9.95849609375, 10.4404296875, 10.92236328125, 11.404296875, 11.88623046875, 12.3681640625, 12.85009765625, 13.33203125, 13.81396484375, 14.2958984375, 14.77783203125, 15.259765625, 15.74169921875, 16.2236328125, 16.70556640625, 17.1875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 2.0, 14.0, 16.0, 27.0, 37.0, 43.0, 69.0, 94.0, 142.0, 290.0, 600.0, 1024.0, 822.0, 329.0, 198.0, 104.0, 75.0, 63.0, 28.0, 29.0, 18.0, 11.0, 5.0, 9.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.364013671875, -10.05615234375, -9.748291015625, -9.4404296875, -9.132568359375, -8.82470703125, -8.516845703125, -8.208984375, -7.901123046875, -7.59326171875, -7.285400390625, -6.9775390625, -6.669677734375, -6.36181640625, -6.053955078125, -5.74609375, -5.438232421875, -5.13037109375, -4.822509765625, -4.5146484375, -4.206787109375, -3.89892578125, -3.591064453125, -3.283203125, -2.975341796875, -2.66748046875, -2.359619140625, -2.0517578125, -1.743896484375, -1.43603515625, -1.128173828125, -0.8203125, -0.512451171875, -0.20458984375, 0.103271484375, 0.4111328125, 0.718994140625, 1.02685546875, 1.334716796875, 1.642578125, 1.950439453125, 2.25830078125, 2.566162109375, 2.8740234375, 3.181884765625, 3.48974609375, 3.797607421875, 4.10546875, 4.413330078125, 4.72119140625, 5.029052734375, 5.3369140625, 5.644775390625, 5.95263671875, 6.260498046875, 6.568359375, 6.876220703125, 7.18408203125, 7.491943359375, 7.7998046875, 8.107666015625, 8.41552734375, 8.723388671875, 9.03125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 4.0, 13.0, 12.0, 18.0, 18.0, 32.0, 61.0, 68.0, 129.0, 203.0, 343.0, 579.0, 1065.0, 2054.0, 4148.0, 8872.0, 21268.0, 57608.0, 197488.0, 2362900.0, 1305131.0, 151496.0, 47402.0, 18012.0, 7658.0, 3720.0, 1752.0, 931.0, 496.0, 291.0, 188.0, 105.0, 75.0, 32.0, 25.0, 15.0, 22.0, 10.0, 10.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.2838134765625, -12.880126953125, -12.4764404296875, -12.07275390625, -11.6690673828125, -11.265380859375, -10.8616943359375, -10.4580078125, -10.0543212890625, -9.650634765625, -9.2469482421875, -8.84326171875, -8.4395751953125, -8.035888671875, -7.6322021484375, -7.228515625, -6.8248291015625, -6.421142578125, -6.0174560546875, -5.61376953125, -5.2100830078125, -4.806396484375, -4.4027099609375, -3.9990234375, -3.5953369140625, -3.191650390625, -2.7879638671875, -2.38427734375, -1.9805908203125, -1.576904296875, -1.1732177734375, -0.76953125, -0.3658447265625, 0.037841796875, 0.4415283203125, 0.84521484375, 1.2489013671875, 1.652587890625, 2.0562744140625, 2.4599609375, 2.8636474609375, 3.267333984375, 3.6710205078125, 4.07470703125, 4.4783935546875, 4.882080078125, 5.2857666015625, 5.689453125, 6.0931396484375, 6.496826171875, 6.9005126953125, 7.30419921875, 7.7078857421875, 8.111572265625, 8.5152587890625, 8.9189453125, 9.3226318359375, 9.726318359375, 10.1300048828125, 10.53369140625, 10.9373779296875, 11.341064453125, 11.7447509765625, 12.1484375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 14.0, 32.0, 46.0, 63.0, 100.0, 134.0, 131.0, 141.0, 84.0, 66.0, 52.0, 36.0, 19.0, 14.0, 12.0, 10.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.166698455810547, -28.94232749938965, -27.71795654296875, -26.493587493896484, -25.269216537475586, -24.044845581054688, -22.820476531982422, -21.596105575561523, -20.371734619140625, -19.147363662719727, -17.922992706298828, -16.698623657226562, -15.474252700805664, -14.249881744384766, -13.025511741638184, -11.801141738891602, -10.576770782470703, -9.352399826049805, -8.128029823303223, -6.903659343719482, -5.679288864135742, -4.454918384552002, -3.2305479049682617, -2.0061779022216797, -0.7818069458007812, 0.442563533782959, 1.6669340133666992, 2.8913044929504395, 4.11567497253418, 5.34004545211792, 6.56441593170166, 7.788785934448242, 9.01315689086914, 10.237527847290039, 11.461897850036621, 12.686267852783203, 13.910638809204102, 15.135009765625, 16.359378814697266, 17.583749771118164, 18.808120727539062, 20.03249168395996, 21.25686264038086, 22.481231689453125, 23.705602645874023, 24.929973602294922, 26.154342651367188, 27.378713607788086, 28.603084564208984, 29.827455520629883, 31.05182647705078, 32.27619552612305, 33.50056457519531, 34.724937438964844, 35.94930648803711, 37.173675537109375, 38.398048400878906, 39.62241744995117, 40.8467903137207, 42.07115936279297, 43.2955322265625, 44.519901275634766, 45.74427032470703, 46.96864318847656, 48.19301223754883]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 6.0, 4.0, 17.0, 11.0, 19.0, 19.0, 22.0, 28.0, 21.0, 32.0, 35.0, 35.0, 38.0, 35.0, 51.0, 51.0, 46.0, 49.0, 42.0, 43.0, 43.0, 35.0, 49.0, 30.0, 37.0, 46.0, 34.0, 20.0, 22.0, 10.0, 10.0, 11.0, 11.0, 2.0, 7.0, 4.0, 5.0, 0.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.810224533081055, -19.05238151550293, -18.294538497924805, -17.536697387695312, -16.778854370117188, -16.021011352539062, -15.263168334960938, -14.505325317382812, -13.747483253479004, -12.989640235900879, -12.23179817199707, -11.473955154418945, -10.71611213684082, -9.958270072937012, -9.200427055358887, -8.442584991455078, -7.684741973876953, -6.926899433135986, -6.1690568923950195, -5.4112138748168945, -4.653371334075928, -3.895528793334961, -3.137685775756836, -2.379843235015869, -1.6220006942749023, -0.864158034324646, -0.10631537437438965, 0.6515274047851562, 1.409369945526123, 2.16721248626709, 2.925055503845215, 3.6828980445861816, 4.440740585327148, 5.198583126068115, 5.956425666809082, 6.714268684387207, 7.472111225128174, 8.22995376586914, 8.987796783447266, 9.74563980102539, 10.5034818649292, 11.261324882507324, 12.019166946411133, 12.777009963989258, 13.534852981567383, 14.292695045471191, 15.050538063049316, 15.808380126953125, 16.56622314453125, 17.324066162109375, 18.0819091796875, 18.839752197265625, 19.597593307495117, 20.355436325073242, 21.113279342651367, 21.871122360229492, 22.628963470458984, 23.38680648803711, 24.144649505615234, 24.90249252319336, 25.66033363342285, 26.418176651000977, 27.1760196685791, 27.933862686157227, 28.69170570373535]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 13.0, 6.0, 8.0, 18.0, 17.0, 24.0, 26.0, 26.0, 22.0, 30.0, 30.0, 31.0, 39.0, 43.0, 46.0, 30.0, 58.0, 49.0, 44.0, 41.0, 55.0, 41.0, 44.0, 34.0, 28.0, 28.0, 32.0, 16.0, 21.0, 17.0, 15.0, 12.0, 12.0, 9.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8505859375, -1.7976531982421875, -1.744720458984375, -1.6917877197265625, -1.63885498046875, -1.5859222412109375, -1.532989501953125, -1.4800567626953125, -1.4271240234375, -1.3741912841796875, -1.321258544921875, -1.2683258056640625, -1.21539306640625, -1.1624603271484375, -1.109527587890625, -1.0565948486328125, -1.003662109375, -0.9507293701171875, -0.897796630859375, -0.8448638916015625, -0.79193115234375, -0.7389984130859375, -0.686065673828125, -0.6331329345703125, -0.5802001953125, -0.5272674560546875, -0.474334716796875, -0.4214019775390625, -0.36846923828125, -0.3155364990234375, -0.262603759765625, -0.2096710205078125, -0.15673828125, -0.1038055419921875, -0.050872802734375, 0.0020599365234375, 0.05499267578125, 0.1079254150390625, 0.160858154296875, 0.2137908935546875, 0.2667236328125, 0.3196563720703125, 0.372589111328125, 0.4255218505859375, 0.47845458984375, 0.5313873291015625, 0.584320068359375, 0.6372528076171875, 0.690185546875, 0.7431182861328125, 0.796051025390625, 0.8489837646484375, 0.90191650390625, 0.9548492431640625, 1.007781982421875, 1.0607147216796875, 1.1136474609375, 1.1665802001953125, 1.219512939453125, 1.2724456787109375, 1.32537841796875, 1.3783111572265625, 1.431243896484375, 1.4841766357421875, 1.537109375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 3.0, 6.0, 11.0, 15.0, 29.0, 44.0, 71.0, 88.0, 150.0, 221.0, 446.0, 738.0, 1334.0, 2427.0, 4721.0, 9796.0, 21573.0, 48253.0, 117982.0, 291562.0, 318361.0, 131426.0, 53521.0, 23522.0, 11069.0, 5136.0, 2687.0, 1446.0, 809.0, 416.0, 249.0, 151.0, 87.0, 63.0, 45.0, 39.0, 17.0, 11.0, 10.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.1915283203125, -8.875244140625, -8.5589599609375, -8.24267578125, -7.9263916015625, -7.610107421875, -7.2938232421875, -6.9775390625, -6.6612548828125, -6.344970703125, -6.0286865234375, -5.71240234375, -5.3961181640625, -5.079833984375, -4.7635498046875, -4.447265625, -4.1309814453125, -3.814697265625, -3.4984130859375, -3.18212890625, -2.8658447265625, -2.549560546875, -2.2332763671875, -1.9169921875, -1.6007080078125, -1.284423828125, -0.9681396484375, -0.65185546875, -0.3355712890625, -0.019287109375, 0.2969970703125, 0.61328125, 0.9295654296875, 1.245849609375, 1.5621337890625, 1.87841796875, 2.1947021484375, 2.510986328125, 2.8272705078125, 3.1435546875, 3.4598388671875, 3.776123046875, 4.0924072265625, 4.40869140625, 4.7249755859375, 5.041259765625, 5.3575439453125, 5.673828125, 5.9901123046875, 6.306396484375, 6.6226806640625, 6.93896484375, 7.2552490234375, 7.571533203125, 7.8878173828125, 8.2041015625, 8.5203857421875, 8.836669921875, 9.1529541015625, 9.46923828125, 9.7855224609375, 10.101806640625, 10.4180908203125, 10.734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 7.0, 13.0, 15.0, 13.0, 18.0, 16.0, 17.0, 16.0, 26.0, 32.0, 29.0, 39.0, 43.0, 35.0, 34.0, 48.0, 1063.0, 47.0, 44.0, 38.0, 53.0, 46.0, 29.0, 42.0, 36.0, 33.0, 26.0, 20.0, 33.0, 13.0, 17.0, 9.0, 10.0, 6.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4404296875, -1.3959197998046875, -1.351409912109375, -1.3069000244140625, -1.26239013671875, -1.2178802490234375, -1.173370361328125, -1.1288604736328125, -1.0843505859375, -1.0398406982421875, -0.995330810546875, -0.9508209228515625, -0.90631103515625, -0.8618011474609375, -0.817291259765625, -0.7727813720703125, -0.728271484375, -0.6837615966796875, -0.639251708984375, -0.5947418212890625, -0.55023193359375, -0.5057220458984375, -0.461212158203125, -0.4167022705078125, -0.3721923828125, -0.3276824951171875, -0.283172607421875, -0.2386627197265625, -0.19415283203125, -0.1496429443359375, -0.105133056640625, -0.0606231689453125, -0.01611328125, 0.0283966064453125, 0.072906494140625, 0.1174163818359375, 0.16192626953125, 0.2064361572265625, 0.250946044921875, 0.2954559326171875, 0.3399658203125, 0.3844757080078125, 0.428985595703125, 0.4734954833984375, 0.51800537109375, 0.5625152587890625, 0.607025146484375, 0.6515350341796875, 0.696044921875, 0.7405548095703125, 0.785064697265625, 0.8295745849609375, 0.87408447265625, 0.9185943603515625, 0.963104248046875, 1.0076141357421875, 1.0521240234375, 1.0966339111328125, 1.141143798828125, 1.1856536865234375, 1.23016357421875, 1.2746734619140625, 1.319183349609375, 1.3636932373046875, 1.408203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 7.0, 35.0, 34.0, 44.0, 89.0, 114.0, 227.0, 374.0, 550.0, 1078.0, 1815.0, 3912.0, 9233.0, 30366.0, 170941.0, 1609085.0, 214818.0, 35321.0, 10293.0, 4083.0, 2018.0, 1013.0, 605.0, 398.0, 216.0, 144.0, 82.0, 74.0, 45.0, 20.0, 16.0, 12.0, 19.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.6009521484375, -12.225341796875, -11.8497314453125, -11.47412109375, -11.0985107421875, -10.722900390625, -10.3472900390625, -9.9716796875, -9.5960693359375, -9.220458984375, -8.8448486328125, -8.46923828125, -8.0936279296875, -7.718017578125, -7.3424072265625, -6.966796875, -6.5911865234375, -6.215576171875, -5.8399658203125, -5.46435546875, -5.0887451171875, -4.713134765625, -4.3375244140625, -3.9619140625, -3.5863037109375, -3.210693359375, -2.8350830078125, -2.45947265625, -2.0838623046875, -1.708251953125, -1.3326416015625, -0.95703125, -0.5814208984375, -0.205810546875, 0.1697998046875, 0.54541015625, 0.9210205078125, 1.296630859375, 1.6722412109375, 2.0478515625, 2.4234619140625, 2.799072265625, 3.1746826171875, 3.55029296875, 3.9259033203125, 4.301513671875, 4.6771240234375, 5.052734375, 5.4283447265625, 5.803955078125, 6.1795654296875, 6.55517578125, 6.9307861328125, 7.306396484375, 7.6820068359375, 8.0576171875, 8.4332275390625, 8.808837890625, 9.1844482421875, 9.56005859375, 9.9356689453125, 10.311279296875, 10.6868896484375, 11.0625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 6.0, 3.0, 8.0, 3.0, 10.0, 8.0, 9.0, 23.0, 34.0, 74.0, 94.0, 163.0, 175.0, 155.0, 77.0, 36.0, 27.0, 26.0, 13.0, 9.0, 10.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.265625, -3.16156005859375, -3.0574951171875, -2.95343017578125, -2.849365234375, -2.74530029296875, -2.6412353515625, -2.53717041015625, -2.43310546875, -2.32904052734375, -2.2249755859375, -2.12091064453125, -2.016845703125, -1.91278076171875, -1.8087158203125, -1.70465087890625, -1.6005859375, -1.49652099609375, -1.3924560546875, -1.28839111328125, -1.184326171875, -1.08026123046875, -0.9761962890625, -0.87213134765625, -0.76806640625, -0.66400146484375, -0.5599365234375, -0.45587158203125, -0.351806640625, -0.24774169921875, -0.1436767578125, -0.03961181640625, 0.064453125, 0.16851806640625, 0.2725830078125, 0.37664794921875, 0.480712890625, 0.58477783203125, 0.6888427734375, 0.79290771484375, 0.89697265625, 1.00103759765625, 1.1051025390625, 1.20916748046875, 1.313232421875, 1.41729736328125, 1.5213623046875, 1.62542724609375, 1.7294921875, 1.83355712890625, 1.9376220703125, 2.04168701171875, 2.145751953125, 2.24981689453125, 2.3538818359375, 2.45794677734375, 2.56201171875, 2.66607666015625, 2.7701416015625, 2.87420654296875, 2.978271484375, 3.08233642578125, 3.1864013671875, 3.29046630859375, 3.39453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 4.0, 8.0, 9.0, 12.0, 22.0, 18.0, 45.0, 42.0, 79.0, 154.0, 454.0, 2122.0, 19717.0, 1004554.0, 18438.0, 1969.0, 470.0, 172.0, 77.0, 44.0, 36.0, 28.0, 15.0, 7.0, 9.0, 10.0, 1.0, 4.0, 7.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -49.09716796875, -47.5380859375, -45.97900390625, -44.419921875, -42.86083984375, -41.3017578125, -39.74267578125, -38.18359375, -36.62451171875, -35.0654296875, -33.50634765625, -31.947265625, -30.38818359375, -28.8291015625, -27.27001953125, -25.7109375, -24.15185546875, -22.5927734375, -21.03369140625, -19.474609375, -17.91552734375, -16.3564453125, -14.79736328125, -13.23828125, -11.67919921875, -10.1201171875, -8.56103515625, -7.001953125, -5.44287109375, -3.8837890625, -2.32470703125, -0.765625, 0.79345703125, 2.3525390625, 3.91162109375, 5.470703125, 7.02978515625, 8.5888671875, 10.14794921875, 11.70703125, 13.26611328125, 14.8251953125, 16.38427734375, 17.943359375, 19.50244140625, 21.0615234375, 22.62060546875, 24.1796875, 25.73876953125, 27.2978515625, 28.85693359375, 30.416015625, 31.97509765625, 33.5341796875, 35.09326171875, 36.65234375, 38.21142578125, 39.7705078125, 41.32958984375, 42.888671875, 44.44775390625, 46.0068359375, 47.56591796875, 49.125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 10.0, 44.0, 99.0, 249.0, 350.0, 150.0, 63.0, 25.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.100538730621338, -6.691324710845947, -6.282110691070557, -5.872896194458008, -5.463682174682617, -5.054468154907227, -4.645254135131836, -4.236040115356445, -3.8268260955810547, -3.417612075805664, -3.0083980560302734, -2.5991837978363037, -2.189969778060913, -1.7807557582855225, -1.3715415000915527, -0.9623274803161621, -0.5531134605407715, -0.14389938116073608, 0.2653146982192993, 0.6745288372039795, 1.0837428569793701, 1.4929568767547607, 1.9021711349487305, 2.311385154724121, 2.7205991744995117, 3.1298131942749023, 3.539027214050293, 3.9482414722442627, 4.357455253601074, 4.766669273376465, 5.175883769989014, 5.585097789764404, 5.994312286376953, 6.403526306152344, 6.812740325927734, 7.221954345703125, 7.631168365478516, 8.040382385253906, 8.449596405029297, 8.858810424804688, 9.268024444580078, 9.677238464355469, 10.08645248413086, 10.49566650390625, 10.90488052368164, 11.314094543457031, 11.723308563232422, 12.132522583007812, 12.54173755645752, 12.95095157623291, 13.3601655960083, 13.769379615783691, 14.178593635559082, 14.587807655334473, 14.99702262878418, 15.40623664855957, 15.815450668334961, 16.22466468811035, 16.633878707885742, 17.043092727661133, 17.452306747436523, 17.861520767211914, 18.270734786987305, 18.679948806762695, 19.089162826538086]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 7.0, 3.0, 11.0, 10.0, 9.0, 21.0, 23.0, 23.0, 24.0, 29.0, 25.0, 35.0, 34.0, 48.0, 46.0, 46.0, 43.0, 51.0, 39.0, 53.0, 56.0, 38.0, 43.0, 41.0, 42.0, 22.0, 27.0, 26.0, 18.0, 27.0, 19.0, 15.0, 6.0, 11.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.884923934936523, -4.75705099105835, -4.629178524017334, -4.50130558013916, -4.373432636260986, -4.2455596923828125, -4.117687225341797, -3.989814281463623, -3.8619415760040283, -3.7340688705444336, -3.6061959266662598, -3.478323221206665, -3.3504505157470703, -3.2225775718688965, -3.0947048664093018, -2.966832160949707, -2.838959217071533, -2.7110865116119385, -2.5832135677337646, -2.45534086227417, -2.327467918395996, -2.1995952129364014, -2.0717225074768066, -1.9438496828079224, -1.815976858139038, -1.6881040334701538, -1.5602312088012695, -1.4323585033416748, -1.3044856786727905, -1.1766128540039062, -1.0487401485443115, -0.9208673238754272, -0.7929940223693848, -0.6651211977005005, -0.537248432636261, -0.4093756377696991, -0.2815028429031372, -0.15363001823425293, -0.025757253170013428, 0.10211551189422607, 0.22998833656311035, 0.35786113142967224, 0.48573392629623413, 0.6136066913604736, 0.7414795160293579, 0.8693523406982422, 0.9972251057624817, 1.1250978708267212, 1.2529706954956055, 1.3808435201644897, 1.508716344833374, 1.6365890502929688, 1.764461874961853, 1.8923346996307373, 2.020207405090332, 2.148080348968506, 2.2759530544281006, 2.4038257598876953, 2.531698703765869, 2.659571409225464, 2.7874441146850586, 2.9153170585632324, 3.043189764022827, 3.171062469482422, 3.2989354133605957]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 15.0, 9.0, 9.0, 8.0, 13.0, 9.0, 20.0, 24.0, 25.0, 31.0, 33.0, 31.0, 33.0, 35.0, 40.0, 34.0, 45.0, 45.0, 46.0, 40.0, 46.0, 46.0, 43.0, 37.0, 42.0, 26.0, 39.0, 23.0, 20.0, 26.0, 30.0, 17.0, 19.0, 11.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7112274169921875, -1.657806396484375, -1.6043853759765625, -1.55096435546875, -1.4975433349609375, -1.444122314453125, -1.3907012939453125, -1.3372802734375, -1.2838592529296875, -1.230438232421875, -1.1770172119140625, -1.12359619140625, -1.0701751708984375, -1.016754150390625, -0.9633331298828125, -0.909912109375, -0.8564910888671875, -0.803070068359375, -0.7496490478515625, -0.69622802734375, -0.6428070068359375, -0.589385986328125, -0.5359649658203125, -0.4825439453125, -0.4291229248046875, -0.375701904296875, -0.3222808837890625, -0.26885986328125, -0.2154388427734375, -0.162017822265625, -0.1085968017578125, -0.05517578125, -0.0017547607421875, 0.051666259765625, 0.1050872802734375, 0.15850830078125, 0.2119293212890625, 0.265350341796875, 0.3187713623046875, 0.3721923828125, 0.4256134033203125, 0.479034423828125, 0.5324554443359375, 0.58587646484375, 0.6392974853515625, 0.692718505859375, 0.7461395263671875, 0.799560546875, 0.8529815673828125, 0.906402587890625, 0.9598236083984375, 1.01324462890625, 1.0666656494140625, 1.120086669921875, 1.1735076904296875, 1.2269287109375, 1.2803497314453125, 1.333770751953125, 1.3871917724609375, 1.44061279296875, 1.4940338134765625, 1.547454833984375, 1.6008758544921875, 1.654296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 16.0, 21.0, 27.0, 51.0, 82.0, 111.0, 148.0, 195.0, 341.0, 549.0, 800.0, 1296.0, 2206.0, 4000.0, 8629.0, 32631.0, 586669.0, 369272.0, 24918.0, 7450.0, 3595.0, 2014.0, 1243.0, 735.0, 505.0, 352.0, 205.0, 138.0, 96.0, 62.0, 48.0, 36.0, 27.0, 14.0, 13.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.84765625, -6.64581298828125, -6.4439697265625, -6.24212646484375, -6.040283203125, -5.83843994140625, -5.6365966796875, -5.43475341796875, -5.23291015625, -5.03106689453125, -4.8292236328125, -4.62738037109375, -4.425537109375, -4.22369384765625, -4.0218505859375, -3.82000732421875, -3.6181640625, -3.41632080078125, -3.2144775390625, -3.01263427734375, -2.810791015625, -2.60894775390625, -2.4071044921875, -2.20526123046875, -2.00341796875, -1.80157470703125, -1.5997314453125, -1.39788818359375, -1.196044921875, -0.99420166015625, -0.7923583984375, -0.59051513671875, -0.388671875, -0.18682861328125, 0.0150146484375, 0.21685791015625, 0.418701171875, 0.62054443359375, 0.8223876953125, 1.02423095703125, 1.22607421875, 1.42791748046875, 1.6297607421875, 1.83160400390625, 2.033447265625, 2.23529052734375, 2.4371337890625, 2.63897705078125, 2.8408203125, 3.04266357421875, 3.2445068359375, 3.44635009765625, 3.648193359375, 3.85003662109375, 4.0518798828125, 4.25372314453125, 4.45556640625, 4.65740966796875, 4.8592529296875, 5.06109619140625, 5.262939453125, 5.46478271484375, 5.6666259765625, 5.86846923828125, 6.0703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 4.0, 6.0, 10.0, 15.0, 17.0, 21.0, 13.0, 19.0, 27.0, 29.0, 24.0, 47.0, 27.0, 46.0, 63.0, 73.0, 79.0, 179.0, 1620.0, 158.0, 93.0, 91.0, 62.0, 50.0, 53.0, 31.0, 29.0, 31.0, 24.0, 20.0, 15.0, 12.0, 10.0, 6.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.9140625, -7.6907958984375, -7.467529296875, -7.2442626953125, -7.02099609375, -6.7977294921875, -6.574462890625, -6.3511962890625, -6.1279296875, -5.9046630859375, -5.681396484375, -5.4581298828125, -5.23486328125, -5.0115966796875, -4.788330078125, -4.5650634765625, -4.341796875, -4.1185302734375, -3.895263671875, -3.6719970703125, -3.44873046875, -3.2254638671875, -3.002197265625, -2.7789306640625, -2.5556640625, -2.3323974609375, -2.109130859375, -1.8858642578125, -1.66259765625, -1.4393310546875, -1.216064453125, -0.9927978515625, -0.76953125, -0.5462646484375, -0.322998046875, -0.0997314453125, 0.12353515625, 0.3468017578125, 0.570068359375, 0.7933349609375, 1.0166015625, 1.2398681640625, 1.463134765625, 1.6864013671875, 1.90966796875, 2.1329345703125, 2.356201171875, 2.5794677734375, 2.802734375, 3.0260009765625, 3.249267578125, 3.4725341796875, 3.69580078125, 3.9190673828125, 4.142333984375, 4.3656005859375, 4.5888671875, 4.8121337890625, 5.035400390625, 5.2586669921875, 5.48193359375, 5.7052001953125, 5.928466796875, 6.1517333984375, 6.375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 4.0, 13.0, 24.0, 26.0, 38.0, 50.0, 109.0, 130.0, 293.0, 526.0, 1124.0, 2801.0, 8692.0, 34005.0, 351680.0, 2653148.0, 70702.0, 14561.0, 4482.0, 1711.0, 706.0, 366.0, 188.0, 103.0, 69.0, 50.0, 31.0, 24.0, 16.0, 15.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.0718994140625, -11.628173828125, -11.1844482421875, -10.74072265625, -10.2969970703125, -9.853271484375, -9.4095458984375, -8.9658203125, -8.5220947265625, -8.078369140625, -7.6346435546875, -7.19091796875, -6.7471923828125, -6.303466796875, -5.8597412109375, -5.416015625, -4.9722900390625, -4.528564453125, -4.0848388671875, -3.64111328125, -3.1973876953125, -2.753662109375, -2.3099365234375, -1.8662109375, -1.4224853515625, -0.978759765625, -0.5350341796875, -0.09130859375, 0.3524169921875, 0.796142578125, 1.2398681640625, 1.68359375, 2.1273193359375, 2.571044921875, 3.0147705078125, 3.45849609375, 3.9022216796875, 4.345947265625, 4.7896728515625, 5.2333984375, 5.6771240234375, 6.120849609375, 6.5645751953125, 7.00830078125, 7.4520263671875, 7.895751953125, 8.3394775390625, 8.783203125, 9.2269287109375, 9.670654296875, 10.1143798828125, 10.55810546875, 11.0018310546875, 11.445556640625, 11.8892822265625, 12.3330078125, 12.7767333984375, 13.220458984375, 13.6641845703125, 14.10791015625, 14.5516357421875, 14.995361328125, 15.4390869140625, 15.8828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 76.0, 378.0, 425.0, 101.0, 18.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90983581542969, -50.507896423339844, -48.10595703125, -45.704017639160156, -43.30207824707031, -40.90013885498047, -38.49819564819336, -36.096256256103516, -33.69431686401367, -31.292377471923828, -28.890438079833984, -26.488496780395508, -24.086557388305664, -21.68461799621582, -19.282676696777344, -16.8807373046875, -14.478797912597656, -12.076858520507812, -9.674918174743652, -7.27297830581665, -4.871038436889648, -2.4690990447998047, -0.06715869903564453, 2.3347816467285156, 4.736721038818359, 7.138660907745361, 9.540600776672363, 11.942541122436523, 14.344480514526367, 16.74641990661621, 19.148361206054688, 21.55030059814453, 23.952232360839844, 26.354171752929688, 28.75611114501953, 31.158052444458008, 33.55998992919922, 35.96192932128906, 38.36387252807617, 40.765811920166016, 43.16775131225586, 45.5696907043457, 47.97163009643555, 50.37356948852539, 52.7755126953125, 55.177452087402344, 57.57939147949219, 59.98133087158203, 62.383270263671875, 64.78520965576172, 67.18714904785156, 69.5890884399414, 71.99102783203125, 74.3929672241211, 76.79490661621094, 79.19685363769531, 81.59878540039062, 84.00072479248047, 86.40266418457031, 88.80460357666016, 91.20654296875, 93.60848236083984, 96.01042175292969, 98.41236877441406, 100.8143081665039]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 2.0, 5.0, 13.0, 8.0, 9.0, 22.0, 14.0, 23.0, 17.0, 29.0, 25.0, 31.0, 32.0, 41.0, 38.0, 51.0, 46.0, 41.0, 32.0, 43.0, 51.0, 41.0, 43.0, 37.0, 41.0, 29.0, 30.0, 26.0, 15.0, 26.0, 23.0, 22.0, 17.0, 18.0, 10.0, 13.0, 7.0, 10.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.594375610351562, -19.866798400878906, -19.139219284057617, -18.41164207458496, -17.684064865112305, -16.956485748291016, -16.22890853881836, -15.501331329345703, -14.77375316619873, -14.046175003051758, -13.318597793579102, -12.591019630432129, -11.863441467285156, -11.1358642578125, -10.408286094665527, -9.680707931518555, -8.953130722045898, -8.225552558898926, -7.4979753494262695, -6.770397186279297, -6.042819499969482, -5.315241813659668, -4.587663650512695, -3.860085964202881, -3.1325082778930664, -2.404930591583252, -1.6773526668548584, -0.9497747421264648, -0.2221970558166504, 0.5053806304931641, 1.2329587936401367, 1.9605364799499512, 2.688112258911133, 3.4156899452209473, 4.143267631530762, 4.870845794677734, 5.598423480987549, 6.326001167297363, 7.053579330444336, 7.78115701675415, 8.508734703063965, 9.236312866210938, 9.963890075683594, 10.691468238830566, 11.419046401977539, 12.146623611450195, 12.874201774597168, 13.60177993774414, 14.329357147216797, 15.05693531036377, 15.784512519836426, 16.5120906829834, 17.239667892456055, 17.967247009277344, 18.69482421875, 19.422401428222656, 20.149978637695312, 20.87755584716797, 21.605134963989258, 22.332712173461914, 23.06028938293457, 23.78786849975586, 24.515445709228516, 25.243022918701172, 25.97060203552246]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 6.0, 11.0, 10.0, 11.0, 9.0, 21.0, 15.0, 21.0, 34.0, 20.0, 24.0, 25.0, 34.0, 48.0, 36.0, 34.0, 43.0, 54.0, 39.0, 47.0, 43.0, 49.0, 35.0, 41.0, 29.0, 35.0, 33.0, 21.0, 24.0, 23.0, 21.0, 15.0, 14.0, 8.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.794921875, -1.7416534423828125, -1.688385009765625, -1.6351165771484375, -1.58184814453125, -1.5285797119140625, -1.475311279296875, -1.4220428466796875, -1.3687744140625, -1.3155059814453125, -1.262237548828125, -1.2089691162109375, -1.15570068359375, -1.1024322509765625, -1.049163818359375, -0.9958953857421875, -0.942626953125, -0.8893585205078125, -0.836090087890625, -0.7828216552734375, -0.72955322265625, -0.6762847900390625, -0.623016357421875, -0.5697479248046875, -0.5164794921875, -0.4632110595703125, -0.409942626953125, -0.3566741943359375, -0.30340576171875, -0.2501373291015625, -0.196868896484375, -0.1436004638671875, -0.09033203125, -0.0370635986328125, 0.016204833984375, 0.0694732666015625, 0.12274169921875, 0.1760101318359375, 0.229278564453125, 0.2825469970703125, 0.3358154296875, 0.3890838623046875, 0.442352294921875, 0.4956207275390625, 0.54888916015625, 0.6021575927734375, 0.655426025390625, 0.7086944580078125, 0.761962890625, 0.8152313232421875, 0.868499755859375, 0.9217681884765625, 0.97503662109375, 1.0283050537109375, 1.081573486328125, 1.1348419189453125, 1.1881103515625, 1.2413787841796875, 1.294647216796875, 1.3479156494140625, 1.40118408203125, 1.4544525146484375, 1.507720947265625, 1.5609893798828125, 1.6142578125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 13.0, 11.0, 21.0, 19.0, 18.0, 37.0, 43.0, 84.0, 124.0, 215.0, 304.0, 509.0, 870.0, 1611.0, 2886.0, 5368.0, 11372.0, 25495.0, 68031.0, 295125.0, 3256945.0, 400281.0, 75026.0, 27016.0, 11402.0, 5284.0, 2779.0, 1451.0, 766.0, 437.0, 250.0, 165.0, 103.0, 74.0, 30.0, 37.0, 28.0, 15.0, 14.0, 9.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.27337646484375, -7.0428466796875, -6.81231689453125, -6.581787109375, -6.35125732421875, -6.1207275390625, -5.89019775390625, -5.65966796875, -5.42913818359375, -5.1986083984375, -4.96807861328125, -4.737548828125, -4.50701904296875, -4.2764892578125, -4.04595947265625, -3.8154296875, -3.58489990234375, -3.3543701171875, -3.12384033203125, -2.893310546875, -2.66278076171875, -2.4322509765625, -2.20172119140625, -1.97119140625, -1.74066162109375, -1.5101318359375, -1.27960205078125, -1.049072265625, -0.81854248046875, -0.5880126953125, -0.35748291015625, -0.126953125, 0.10357666015625, 0.3341064453125, 0.56463623046875, 0.795166015625, 1.02569580078125, 1.2562255859375, 1.48675537109375, 1.71728515625, 1.94781494140625, 2.1783447265625, 2.40887451171875, 2.639404296875, 2.86993408203125, 3.1004638671875, 3.33099365234375, 3.5615234375, 3.79205322265625, 4.0225830078125, 4.25311279296875, 4.483642578125, 4.71417236328125, 4.9447021484375, 5.17523193359375, 5.40576171875, 5.63629150390625, 5.8668212890625, 6.09735107421875, 6.327880859375, 6.55841064453125, 6.7889404296875, 7.01947021484375, 7.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 12.0, 16.0, 18.0, 30.0, 41.0, 64.0, 60.0, 95.0, 125.0, 253.0, 458.0, 1021.0, 838.0, 362.0, 207.0, 157.0, 76.0, 69.0, 48.0, 38.0, 23.0, 18.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.78179931640625, -6.4971923828125, -6.21258544921875, -5.927978515625, -5.64337158203125, -5.3587646484375, -5.07415771484375, -4.78955078125, -4.50494384765625, -4.2203369140625, -3.93572998046875, -3.651123046875, -3.36651611328125, -3.0819091796875, -2.79730224609375, -2.5126953125, -2.22808837890625, -1.9434814453125, -1.65887451171875, -1.374267578125, -1.08966064453125, -0.8050537109375, -0.52044677734375, -0.23583984375, 0.04876708984375, 0.3333740234375, 0.61798095703125, 0.902587890625, 1.18719482421875, 1.4718017578125, 1.75640869140625, 2.041015625, 2.32562255859375, 2.6102294921875, 2.89483642578125, 3.179443359375, 3.46405029296875, 3.7486572265625, 4.03326416015625, 4.31787109375, 4.60247802734375, 4.8870849609375, 5.17169189453125, 5.456298828125, 5.74090576171875, 6.0255126953125, 6.31011962890625, 6.5947265625, 6.87933349609375, 7.1639404296875, 7.44854736328125, 7.733154296875, 8.01776123046875, 8.3023681640625, 8.58697509765625, 8.87158203125, 9.15618896484375, 9.4407958984375, 9.72540283203125, 10.010009765625, 10.29461669921875, 10.5792236328125, 10.86383056640625, 11.1484375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 11.0, 12.0, 23.0, 21.0, 26.0, 44.0, 66.0, 122.0, 193.0, 340.0, 598.0, 1199.0, 2514.0, 6167.0, 16359.0, 50694.0, 200574.0, 2786965.0, 950454.0, 123257.0, 34204.0, 11727.0, 4599.0, 1914.0, 929.0, 530.0, 257.0, 156.0, 98.0, 61.0, 51.0, 33.0, 17.0, 13.0, 10.0, 10.0, 7.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.4921875, -15.0474853515625, -14.602783203125, -14.1580810546875, -13.71337890625, -13.2686767578125, -12.823974609375, -12.3792724609375, -11.9345703125, -11.4898681640625, -11.045166015625, -10.6004638671875, -10.15576171875, -9.7110595703125, -9.266357421875, -8.8216552734375, -8.376953125, -7.9322509765625, -7.487548828125, -7.0428466796875, -6.59814453125, -6.1534423828125, -5.708740234375, -5.2640380859375, -4.8193359375, -4.3746337890625, -3.929931640625, -3.4852294921875, -3.04052734375, -2.5958251953125, -2.151123046875, -1.7064208984375, -1.26171875, -0.8170166015625, -0.372314453125, 0.0723876953125, 0.51708984375, 0.9617919921875, 1.406494140625, 1.8511962890625, 2.2958984375, 2.7406005859375, 3.185302734375, 3.6300048828125, 4.07470703125, 4.5194091796875, 4.964111328125, 5.4088134765625, 5.853515625, 6.2982177734375, 6.742919921875, 7.1876220703125, 7.63232421875, 8.0770263671875, 8.521728515625, 8.9664306640625, 9.4111328125, 9.8558349609375, 10.300537109375, 10.7452392578125, 11.18994140625, 11.6346435546875, 12.079345703125, 12.5240478515625, 12.96875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 10.0, 15.0, 19.0, 22.0, 27.0, 38.0, 70.0, 71.0, 103.0, 105.0, 102.0, 96.0, 72.0, 70.0, 36.0, 33.0, 19.0, 25.0, 14.0, 13.0, 6.0, 3.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.627105712890625, -40.634674072265625, -39.64223861694336, -38.649803161621094, -37.657371520996094, -36.664939880371094, -35.67250442504883, -34.68006896972656, -33.68763732910156, -32.69520568847656, -31.702770233154297, -30.710336685180664, -29.71790313720703, -28.7254695892334, -27.733036041259766, -26.740602493286133, -25.7481689453125, -24.755735397338867, -23.763301849365234, -22.7708683013916, -21.77843475341797, -20.786001205444336, -19.793567657470703, -18.80113410949707, -17.808700561523438, -16.816267013549805, -15.823833465576172, -14.831399917602539, -13.838966369628906, -12.846532821655273, -11.85409927368164, -10.861665725708008, -9.869230270385742, -8.87679672241211, -7.884363174438477, -6.891929626464844, -5.899496078491211, -4.907062530517578, -3.9146289825439453, -2.9221954345703125, -1.9297618865966797, -0.9373283386230469, 0.05510520935058594, 1.0475387573242188, 2.0399723052978516, 3.0324058532714844, 4.024839401245117, 5.01727294921875, 6.009706497192383, 7.002140045166016, 7.994573593139648, 8.987007141113281, 9.979440689086914, 10.971874237060547, 11.96430778503418, 12.956741333007812, 13.949174880981445, 14.941608428955078, 15.934041976928711, 16.926475524902344, 17.918909072875977, 18.91134262084961, 19.903776168823242, 20.896209716796875, 21.888643264770508]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 10.0, 10.0, 20.0, 12.0, 17.0, 28.0, 25.0, 21.0, 28.0, 28.0, 36.0, 40.0, 35.0, 36.0, 46.0, 38.0, 41.0, 49.0, 41.0, 41.0, 29.0, 41.0, 41.0, 27.0, 40.0, 15.0, 28.0, 27.0, 27.0, 15.0, 14.0, 14.0, 7.0, 10.0, 10.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.314502716064453, -21.644657135009766, -20.97481346130371, -20.304967880249023, -19.63512420654297, -18.96527862548828, -18.295434951782227, -17.62558937072754, -16.955745697021484, -16.285900115966797, -15.616056442260742, -14.946211814880371, -14.2763671875, -13.606522560119629, -12.936677932739258, -12.26683235168457, -11.5969877243042, -10.927143096923828, -10.257298469543457, -9.587453842163086, -8.917609214782715, -8.247764587402344, -7.5779194831848145, -6.908074855804443, -6.238230228424072, -5.568385601043701, -4.89854097366333, -4.228695869445801, -3.558851480484009, -2.8890068531036377, -2.2191619873046875, -1.5493173599243164, -0.8794727325439453, -0.20962804555892944, 0.4602166414260864, 1.130061388015747, 1.7999060153961182, 2.4697506427764893, 3.1395955085754395, 3.8094401359558105, 4.479284763336182, 5.149129390716553, 5.818974018096924, 6.488819122314453, 7.158663749694824, 7.828508377075195, 8.498353004455566, 9.168197631835938, 9.838042259216309, 10.50788688659668, 11.17773151397705, 11.847576141357422, 12.517420768737793, 13.187265396118164, 13.857110977172852, 14.526954650878906, 15.196800231933594, 15.866644859313965, 16.536489486694336, 17.206335067749023, 17.876178741455078, 18.546024322509766, 19.21586799621582, 19.885713577270508, 20.555557250976562]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 13.0, 19.0, 15.0, 20.0, 18.0, 27.0, 33.0, 30.0, 34.0, 35.0, 46.0, 38.0, 35.0, 60.0, 48.0, 33.0, 42.0, 51.0, 53.0, 40.0, 38.0, 26.0, 33.0, 32.0, 23.0, 24.0, 26.0, 24.0, 11.0, 12.0, 7.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.126953125, -2.0662384033203125, -2.005523681640625, -1.9448089599609375, -1.88409423828125, -1.8233795166015625, -1.762664794921875, -1.7019500732421875, -1.6412353515625, -1.5805206298828125, -1.519805908203125, -1.4590911865234375, -1.39837646484375, -1.3376617431640625, -1.276947021484375, -1.2162322998046875, -1.155517578125, -1.0948028564453125, -1.034088134765625, -0.9733734130859375, -0.91265869140625, -0.8519439697265625, -0.791229248046875, -0.7305145263671875, -0.6697998046875, -0.6090850830078125, -0.548370361328125, -0.4876556396484375, -0.42694091796875, -0.3662261962890625, -0.305511474609375, -0.2447967529296875, -0.18408203125, -0.1233673095703125, -0.062652587890625, -0.0019378662109375, 0.05877685546875, 0.1194915771484375, 0.180206298828125, 0.2409210205078125, 0.3016357421875, 0.3623504638671875, 0.423065185546875, 0.4837799072265625, 0.54449462890625, 0.6052093505859375, 0.665924072265625, 0.7266387939453125, 0.787353515625, 0.8480682373046875, 0.908782958984375, 0.9694976806640625, 1.03021240234375, 1.0909271240234375, 1.151641845703125, 1.2123565673828125, 1.2730712890625, 1.3337860107421875, 1.394500732421875, 1.4552154541015625, 1.51593017578125, 1.5766448974609375, 1.637359619140625, 1.6980743408203125, 1.7587890625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 5.0, 8.0, 14.0, 19.0, 26.0, 40.0, 75.0, 103.0, 164.0, 230.0, 325.0, 557.0, 890.0, 1386.0, 2401.0, 4185.0, 6981.0, 12640.0, 23114.0, 45474.0, 94733.0, 230778.0, 362975.0, 132082.0, 60989.0, 30189.0, 16326.0, 9055.0, 5108.0, 2979.0, 1714.0, 1074.0, 664.0, 399.0, 275.0, 196.0, 129.0, 79.0, 50.0, 36.0, 23.0, 21.0, 12.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3695068359375, -9.059326171875, -8.7491455078125, -8.43896484375, -8.1287841796875, -7.818603515625, -7.5084228515625, -7.1982421875, -6.8880615234375, -6.577880859375, -6.2677001953125, -5.95751953125, -5.6473388671875, -5.337158203125, -5.0269775390625, -4.716796875, -4.4066162109375, -4.096435546875, -3.7862548828125, -3.47607421875, -3.1658935546875, -2.855712890625, -2.5455322265625, -2.2353515625, -1.9251708984375, -1.614990234375, -1.3048095703125, -0.99462890625, -0.6844482421875, -0.374267578125, -0.0640869140625, 0.24609375, 0.5562744140625, 0.866455078125, 1.1766357421875, 1.48681640625, 1.7969970703125, 2.107177734375, 2.4173583984375, 2.7275390625, 3.0377197265625, 3.347900390625, 3.6580810546875, 3.96826171875, 4.2784423828125, 4.588623046875, 4.8988037109375, 5.208984375, 5.5191650390625, 5.829345703125, 6.1395263671875, 6.44970703125, 6.7598876953125, 7.070068359375, 7.3802490234375, 7.6904296875, 8.0006103515625, 8.310791015625, 8.6209716796875, 8.93115234375, 9.2413330078125, 9.551513671875, 9.8616943359375, 10.171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 10.0, 9.0, 11.0, 13.0, 19.0, 23.0, 30.0, 35.0, 28.0, 28.0, 31.0, 41.0, 46.0, 52.0, 51.0, 44.0, 1068.0, 46.0, 48.0, 27.0, 54.0, 29.0, 45.0, 45.0, 27.0, 26.0, 26.0, 19.0, 14.0, 10.0, 15.0, 13.0, 7.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9279937744140625, -1.865753173828125, -1.8035125732421875, -1.74127197265625, -1.6790313720703125, -1.616790771484375, -1.5545501708984375, -1.4923095703125, -1.4300689697265625, -1.367828369140625, -1.3055877685546875, -1.24334716796875, -1.1811065673828125, -1.118865966796875, -1.0566253662109375, -0.994384765625, -0.9321441650390625, -0.869903564453125, -0.8076629638671875, -0.74542236328125, -0.6831817626953125, -0.620941162109375, -0.5587005615234375, -0.4964599609375, -0.4342193603515625, -0.371978759765625, -0.3097381591796875, -0.24749755859375, -0.1852569580078125, -0.123016357421875, -0.0607757568359375, 0.00146484375, 0.0637054443359375, 0.125946044921875, 0.1881866455078125, 0.25042724609375, 0.3126678466796875, 0.374908447265625, 0.4371490478515625, 0.4993896484375, 0.5616302490234375, 0.623870849609375, 0.6861114501953125, 0.74835205078125, 0.8105926513671875, 0.872833251953125, 0.9350738525390625, 0.997314453125, 1.0595550537109375, 1.121795654296875, 1.1840362548828125, 1.24627685546875, 1.3085174560546875, 1.370758056640625, 1.4329986572265625, 1.4952392578125, 1.5574798583984375, 1.619720458984375, 1.6819610595703125, 1.74420166015625, 1.8064422607421875, 1.868682861328125, 1.9309234619140625, 1.9931640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 12.0, 9.0, 18.0, 33.0, 52.0, 83.0, 143.0, 251.0, 360.0, 687.0, 1285.0, 2331.0, 4612.0, 10008.0, 25140.0, 78515.0, 779240.0, 1062726.0, 85201.0, 25904.0, 10361.0, 4815.0, 2409.0, 1183.0, 734.0, 416.0, 251.0, 114.0, 94.0, 46.0, 31.0, 24.0, 12.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.953125, -12.5487060546875, -12.144287109375, -11.7398681640625, -11.33544921875, -10.9310302734375, -10.526611328125, -10.1221923828125, -9.7177734375, -9.3133544921875, -8.908935546875, -8.5045166015625, -8.10009765625, -7.6956787109375, -7.291259765625, -6.8868408203125, -6.482421875, -6.0780029296875, -5.673583984375, -5.2691650390625, -4.86474609375, -4.4603271484375, -4.055908203125, -3.6514892578125, -3.2470703125, -2.8426513671875, -2.438232421875, -2.0338134765625, -1.62939453125, -1.2249755859375, -0.820556640625, -0.4161376953125, -0.01171875, 0.3927001953125, 0.797119140625, 1.2015380859375, 1.60595703125, 2.0103759765625, 2.414794921875, 2.8192138671875, 3.2236328125, 3.6280517578125, 4.032470703125, 4.4368896484375, 4.84130859375, 5.2457275390625, 5.650146484375, 6.0545654296875, 6.458984375, 6.8634033203125, 7.267822265625, 7.6722412109375, 8.07666015625, 8.4810791015625, 8.885498046875, 9.2899169921875, 9.6943359375, 10.0987548828125, 10.503173828125, 10.9075927734375, 11.31201171875, 11.7164306640625, 12.120849609375, 12.5252685546875, 12.9296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 23.0, 27.0, 43.0, 65.0, 199.0, 302.0, 108.0, 65.0, 39.0, 23.0, 12.0, 11.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.54296875, -4.410369873046875, -4.27777099609375, -4.145172119140625, -4.0125732421875, -3.879974365234375, -3.74737548828125, -3.614776611328125, -3.482177734375, -3.349578857421875, -3.21697998046875, -3.084381103515625, -2.9517822265625, -2.819183349609375, -2.68658447265625, -2.553985595703125, -2.42138671875, -2.288787841796875, -2.15618896484375, -2.023590087890625, -1.8909912109375, -1.758392333984375, -1.62579345703125, -1.493194580078125, -1.360595703125, -1.227996826171875, -1.09539794921875, -0.962799072265625, -0.8302001953125, -0.697601318359375, -0.56500244140625, -0.432403564453125, -0.2998046875, -0.167205810546875, -0.03460693359375, 0.097991943359375, 0.2305908203125, 0.363189697265625, 0.49578857421875, 0.628387451171875, 0.760986328125, 0.893585205078125, 1.02618408203125, 1.158782958984375, 1.2913818359375, 1.423980712890625, 1.55657958984375, 1.689178466796875, 1.82177734375, 1.954376220703125, 2.08697509765625, 2.219573974609375, 2.3521728515625, 2.484771728515625, 2.61737060546875, 2.749969482421875, 2.882568359375, 3.015167236328125, 3.14776611328125, 3.280364990234375, 3.4129638671875, 3.545562744140625, 3.67816162109375, 3.810760498046875, 3.943359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 7.0, 16.0, 14.0, 29.0, 30.0, 42.0, 67.0, 133.0, 401.0, 1306.0, 6589.0, 203829.0, 825381.0, 8315.0, 1583.0, 409.0, 136.0, 77.0, 33.0, 31.0, 19.0, 16.0, 14.0, 9.0, 8.0, 6.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.97119140625, -47.2861328125, -45.60107421875, -43.916015625, -42.23095703125, -40.5458984375, -38.86083984375, -37.17578125, -35.49072265625, -33.8056640625, -32.12060546875, -30.435546875, -28.75048828125, -27.0654296875, -25.38037109375, -23.6953125, -22.01025390625, -20.3251953125, -18.64013671875, -16.955078125, -15.27001953125, -13.5849609375, -11.89990234375, -10.21484375, -8.52978515625, -6.8447265625, -5.15966796875, -3.474609375, -1.78955078125, -0.1044921875, 1.58056640625, 3.265625, 4.95068359375, 6.6357421875, 8.32080078125, 10.005859375, 11.69091796875, 13.3759765625, 15.06103515625, 16.74609375, 18.43115234375, 20.1162109375, 21.80126953125, 23.486328125, 25.17138671875, 26.8564453125, 28.54150390625, 30.2265625, 31.91162109375, 33.5966796875, 35.28173828125, 36.966796875, 38.65185546875, 40.3369140625, 42.02197265625, 43.70703125, 45.39208984375, 47.0771484375, 48.76220703125, 50.447265625, 52.13232421875, 53.8173828125, 55.50244140625, 57.1875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 18.0, 59.0, 165.0, 398.0, 257.0, 75.0, 19.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.732600212097168, -5.197275161743164, -4.661950588226318, -4.126626014709473, -3.5913009643554688, -3.055976152420044, -2.520651340484619, -1.9853265285491943, -1.4500017166137695, -0.9146769046783447, -0.3793520927429199, 0.15597271919250488, 0.6912975311279297, 1.2266223430633545, 1.7619471549987793, 2.297271966934204, 2.832596778869629, 3.3679215908050537, 3.9032464027404785, 4.438570976257324, 4.973896026611328, 5.509221076965332, 6.044545650482178, 6.579870223999023, 7.115195274353027, 7.650520324707031, 8.185844421386719, 8.721169471740723, 9.256494522094727, 9.79181957244873, 10.327144622802734, 10.862468719482422, 11.39779281616211, 11.933117866516113, 12.468442916870117, 13.003767013549805, 13.539092063903809, 14.074417114257812, 14.6097412109375, 15.145066261291504, 15.680391311645508, 16.215715408325195, 16.751041412353516, 17.286365509033203, 17.82168960571289, 18.35701560974121, 18.8923397064209, 19.42766571044922, 19.962989807128906, 20.498313903808594, 21.033639907836914, 21.5689640045166, 22.104290008544922, 22.63961410522461, 23.174938201904297, 23.710264205932617, 24.245588302612305, 24.780912399291992, 25.316238403320312, 25.8515625, 26.386886596679688, 26.922212600708008, 27.457536697387695, 27.992862701416016, 28.528186798095703]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 10.0, 4.0, 5.0, 9.0, 8.0, 18.0, 19.0, 22.0, 17.0, 24.0, 30.0, 32.0, 34.0, 44.0, 61.0, 46.0, 53.0, 50.0, 58.0, 49.0, 50.0, 49.0, 39.0, 36.0, 43.0, 48.0, 25.0, 20.0, 24.0, 25.0, 13.0, 14.0, 14.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4067554473876953, -2.2869205474853516, -2.167085886001587, -2.047250986099243, -1.927416205406189, -1.8075814247131348, -1.687746524810791, -1.5679117441177368, -1.4480769634246826, -1.3282421827316284, -1.2084074020385742, -1.0885725021362305, -0.9687377214431763, -0.8489029407501221, -0.7290681004524231, -0.6092332601547241, -0.4893984794616699, -0.36956366896629333, -0.24972885847091675, -0.12989404797554016, -0.010059237480163574, 0.10977554321289062, 0.2296103835105896, 0.3494452238082886, 0.4692800045013428, 0.589114785194397, 0.708949625492096, 0.8287844657897949, 0.9486192464828491, 1.0684540271759033, 1.188288927078247, 1.3081237077713013, 1.4279584884643555, 1.5477932691574097, 1.6676280498504639, 1.7874629497528076, 1.9072977304458618, 2.027132511138916, 2.1469674110412598, 2.2668023109436035, 2.386636972427368, 2.506471872329712, 2.6263065338134766, 2.7461414337158203, 2.865976333618164, 2.9858109951019287, 3.1056458950042725, 3.225480556488037, 3.345315456390381, 3.4651503562927246, 3.5849850177764893, 3.704819917678833, 3.8246545791625977, 3.9444894790649414, 4.064324378967285, 4.184159278869629, 4.303994178771973, 4.423829078674316, 4.54366397857666, 4.663498401641846, 4.7833333015441895, 4.903168201446533, 5.023003101348877, 5.142838001251221, 5.262672424316406]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 12.0, 10.0, 11.0, 17.0, 23.0, 24.0, 29.0, 25.0, 32.0, 30.0, 39.0, 57.0, 39.0, 58.0, 56.0, 46.0, 50.0, 45.0, 53.0, 41.0, 45.0, 33.0, 44.0, 27.0, 27.0, 29.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.17535400390625, -2.1085205078125, -2.04168701171875, -1.974853515625, -1.90802001953125, -1.8411865234375, -1.77435302734375, -1.70751953125, -1.64068603515625, -1.5738525390625, -1.50701904296875, -1.440185546875, -1.37335205078125, -1.3065185546875, -1.23968505859375, -1.1728515625, -1.10601806640625, -1.0391845703125, -0.97235107421875, -0.905517578125, -0.83868408203125, -0.7718505859375, -0.70501708984375, -0.63818359375, -0.57135009765625, -0.5045166015625, -0.43768310546875, -0.370849609375, -0.30401611328125, -0.2371826171875, -0.17034912109375, -0.103515625, -0.03668212890625, 0.0301513671875, 0.09698486328125, 0.163818359375, 0.23065185546875, 0.2974853515625, 0.36431884765625, 0.43115234375, 0.49798583984375, 0.5648193359375, 0.63165283203125, 0.698486328125, 0.76531982421875, 0.8321533203125, 0.89898681640625, 0.9658203125, 1.03265380859375, 1.0994873046875, 1.16632080078125, 1.233154296875, 1.29998779296875, 1.3668212890625, 1.43365478515625, 1.50048828125, 1.56732177734375, 1.6341552734375, 1.70098876953125, 1.767822265625, 1.83465576171875, 1.9014892578125, 1.96832275390625, 2.03515625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 16.0, 14.0, 20.0, 30.0, 33.0, 53.0, 89.0, 126.0, 224.0, 297.0, 479.0, 943.0, 1737.0, 3461.0, 7274.0, 18681.0, 61330.0, 308724.0, 493430.0, 104745.0, 27379.0, 10033.0, 4329.0, 2192.0, 1130.0, 657.0, 388.0, 238.0, 148.0, 96.0, 77.0, 47.0, 34.0, 21.0, 20.0, 16.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.135162353515625, -2.05938720703125, -1.983612060546875, -1.9078369140625, -1.832061767578125, -1.75628662109375, -1.680511474609375, -1.604736328125, -1.528961181640625, -1.45318603515625, -1.377410888671875, -1.3016357421875, -1.225860595703125, -1.15008544921875, -1.074310302734375, -0.99853515625, -0.922760009765625, -0.84698486328125, -0.771209716796875, -0.6954345703125, -0.619659423828125, -0.54388427734375, -0.468109130859375, -0.392333984375, -0.316558837890625, -0.24078369140625, -0.165008544921875, -0.0892333984375, -0.013458251953125, 0.06231689453125, 0.138092041015625, 0.2138671875, 0.289642333984375, 0.36541748046875, 0.441192626953125, 0.5169677734375, 0.592742919921875, 0.66851806640625, 0.744293212890625, 0.820068359375, 0.895843505859375, 0.97161865234375, 1.047393798828125, 1.1231689453125, 1.198944091796875, 1.27471923828125, 1.350494384765625, 1.42626953125, 1.502044677734375, 1.57781982421875, 1.653594970703125, 1.7293701171875, 1.805145263671875, 1.88092041015625, 1.956695556640625, 2.032470703125, 2.108245849609375, 2.18402099609375, 2.259796142578125, 2.3355712890625, 2.411346435546875, 2.48712158203125, 2.562896728515625, 2.638671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 17.0, 14.0, 11.0, 13.0, 22.0, 34.0, 35.0, 27.0, 30.0, 49.0, 37.0, 54.0, 104.0, 481.0, 1569.0, 102.0, 55.0, 53.0, 37.0, 42.0, 43.0, 29.0, 25.0, 25.0, 18.0, 21.0, 21.0, 13.0, 9.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.0390625, -7.79559326171875, -7.5521240234375, -7.30865478515625, -7.065185546875, -6.82171630859375, -6.5782470703125, -6.33477783203125, -6.09130859375, -5.84783935546875, -5.6043701171875, -5.36090087890625, -5.117431640625, -4.87396240234375, -4.6304931640625, -4.38702392578125, -4.1435546875, -3.90008544921875, -3.6566162109375, -3.41314697265625, -3.169677734375, -2.92620849609375, -2.6827392578125, -2.43927001953125, -2.19580078125, -1.95233154296875, -1.7088623046875, -1.46539306640625, -1.221923828125, -0.97845458984375, -0.7349853515625, -0.49151611328125, -0.248046875, -0.00457763671875, 0.2388916015625, 0.48236083984375, 0.725830078125, 0.96929931640625, 1.2127685546875, 1.45623779296875, 1.69970703125, 1.94317626953125, 2.1866455078125, 2.43011474609375, 2.673583984375, 2.91705322265625, 3.1605224609375, 3.40399169921875, 3.6474609375, 3.89093017578125, 4.1343994140625, 4.37786865234375, 4.621337890625, 4.86480712890625, 5.1082763671875, 5.35174560546875, 5.59521484375, 5.83868408203125, 6.0821533203125, 6.32562255859375, 6.569091796875, 6.81256103515625, 7.0560302734375, 7.29949951171875, 7.54296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 10.0, 7.0, 8.0, 19.0, 12.0, 28.0, 22.0, 41.0, 37.0, 67.0, 93.0, 169.0, 352.0, 963.0, 3785.0, 20974.0, 371483.0, 2680276.0, 56846.0, 7645.0, 1760.0, 505.0, 214.0, 96.0, 75.0, 56.0, 40.0, 28.0, 21.0, 10.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.16082763671875, -7.9075927734375, -7.65435791015625, -7.401123046875, -7.14788818359375, -6.8946533203125, -6.64141845703125, -6.38818359375, -6.13494873046875, -5.8817138671875, -5.62847900390625, -5.375244140625, -5.12200927734375, -4.8687744140625, -4.61553955078125, -4.3623046875, -4.10906982421875, -3.8558349609375, -3.60260009765625, -3.349365234375, -3.09613037109375, -2.8428955078125, -2.58966064453125, -2.33642578125, -2.08319091796875, -1.8299560546875, -1.57672119140625, -1.323486328125, -1.07025146484375, -0.8170166015625, -0.56378173828125, -0.310546875, -0.05731201171875, 0.1959228515625, 0.44915771484375, 0.702392578125, 0.95562744140625, 1.2088623046875, 1.46209716796875, 1.71533203125, 1.96856689453125, 2.2218017578125, 2.47503662109375, 2.728271484375, 2.98150634765625, 3.2347412109375, 3.48797607421875, 3.7412109375, 3.99444580078125, 4.2476806640625, 4.50091552734375, 4.754150390625, 5.00738525390625, 5.2606201171875, 5.51385498046875, 5.76708984375, 6.02032470703125, 6.2735595703125, 6.52679443359375, 6.780029296875, 7.03326416015625, 7.2864990234375, 7.53973388671875, 7.79296875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [25.0, 547.0, 427.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.352025032043457, -2.1149377822875977, 0.12214946746826172, 2.359236717224121, 4.5963239669799805, 6.83341121673584, 9.0704984664917, 11.307585716247559, 13.544672966003418, 15.781760215759277, 18.018848419189453, 20.255935668945312, 22.493022918701172, 24.73011016845703, 26.96719741821289, 29.20428466796875, 31.44137191772461, 33.67845916748047, 35.91554641723633, 38.15263366699219, 40.38972091674805, 42.626808166503906, 44.863895416259766, 47.100982666015625, 49.338069915771484, 51.575157165527344, 53.8122444152832, 56.04933166503906, 58.28641891479492, 60.52350616455078, 62.76059341430664, 64.9976806640625, 67.23477172851562, 69.47186279296875, 71.70894622802734, 73.94602966308594, 76.18312072753906, 78.42021179199219, 80.65729522705078, 82.89437866210938, 85.1314697265625, 87.36856079101562, 89.60564422607422, 91.84272766113281, 94.07981872558594, 96.31690979003906, 98.55399322509766, 100.79107666015625, 103.02816772460938, 105.2652587890625, 107.5023422241211, 109.73942565917969, 111.97651672363281, 114.21360778808594, 116.45069122314453, 118.68777465820312, 120.92486572265625, 123.16195678710938, 125.39904022216797, 127.63612365722656, 129.8732147216797, 132.1103057861328, 134.34738159179688, 136.58447265625, 138.82156372070312]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 13.0, 13.0, 18.0, 17.0, 24.0, 24.0, 34.0, 48.0, 36.0, 42.0, 48.0, 44.0, 37.0, 32.0, 34.0, 58.0, 39.0, 34.0, 23.0, 36.0, 38.0, 31.0, 34.0, 28.0, 27.0, 22.0, 17.0, 22.0, 19.0, 17.0, 9.0, 13.0, 8.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.37146759033203, -19.653667449951172, -18.935867309570312, -18.218067169189453, -17.500267028808594, -16.782468795776367, -16.064668655395508, -15.346868515014648, -14.629068374633789, -13.91126823425293, -13.19346809387207, -12.475668907165527, -11.757868766784668, -11.040068626403809, -10.322269439697266, -9.604469299316406, -8.886669158935547, -8.168869018554688, -7.451069355010986, -6.733269691467285, -6.015469551086426, -5.297669410705566, -4.579869747161865, -3.862070083618164, -3.1442699432373047, -2.4264700412750244, -1.7086701393127441, -0.9908702373504639, -0.2730703353881836, 0.4447295665740967, 1.162529468536377, 1.8803291320800781, 2.5981311798095703, 3.3159310817718506, 4.033730983734131, 4.751530647277832, 5.469330787658691, 6.187130928039551, 6.904930591583252, 7.622730255126953, 8.340530395507812, 9.058330535888672, 9.776130676269531, 10.493929862976074, 11.211730003356934, 11.929530143737793, 12.647329330444336, 13.365129470825195, 14.082929611206055, 14.800729751586914, 15.518529891967773, 16.236330032348633, 16.95412826538086, 17.67192840576172, 18.389728546142578, 19.107528686523438, 19.825328826904297, 20.543128967285156, 21.260929107666016, 21.978729248046875, 22.696529388427734, 23.41432762145996, 24.13212776184082, 24.84992790222168, 25.56772804260254]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 17.0, 11.0, 26.0, 32.0, 19.0, 30.0, 28.0, 38.0, 41.0, 32.0, 39.0, 58.0, 49.0, 34.0, 64.0, 56.0, 51.0, 43.0, 38.0, 40.0, 41.0, 32.0, 38.0, 19.0, 17.0, 13.0, 18.0, 7.0, 11.0, 9.0, 3.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.302734375, -2.2364501953125, -2.170166015625, -2.1038818359375, -2.03759765625, -1.9713134765625, -1.905029296875, -1.8387451171875, -1.7724609375, -1.7061767578125, -1.639892578125, -1.5736083984375, -1.50732421875, -1.4410400390625, -1.374755859375, -1.3084716796875, -1.2421875, -1.1759033203125, -1.109619140625, -1.0433349609375, -0.97705078125, -0.9107666015625, -0.844482421875, -0.7781982421875, -0.7119140625, -0.6456298828125, -0.579345703125, -0.5130615234375, -0.44677734375, -0.3804931640625, -0.314208984375, -0.2479248046875, -0.181640625, -0.1153564453125, -0.049072265625, 0.0172119140625, 0.08349609375, 0.1497802734375, 0.216064453125, 0.2823486328125, 0.3486328125, 0.4149169921875, 0.481201171875, 0.5474853515625, 0.61376953125, 0.6800537109375, 0.746337890625, 0.8126220703125, 0.87890625, 0.9451904296875, 1.011474609375, 1.0777587890625, 1.14404296875, 1.2103271484375, 1.276611328125, 1.3428955078125, 1.4091796875, 1.4754638671875, 1.541748046875, 1.6080322265625, 1.67431640625, 1.7406005859375, 1.806884765625, 1.8731689453125, 1.939453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 42.0, 66.0, 99.0, 115.0, 150.0, 218.0, 335.0, 504.0, 727.0, 1181.0, 1778.0, 2761.0, 4440.0, 7495.0, 12859.0, 22770.0, 44294.0, 103832.0, 626466.0, 2775035.0, 412048.0, 88648.0, 39105.0, 20446.0, 11462.0, 6531.0, 3892.0, 2381.0, 1542.0, 932.0, 605.0, 439.0, 277.0, 225.0, 148.0, 110.0, 89.0, 42.0, 38.0, 23.0, 11.0, 15.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.87890625, -4.72357177734375, -4.5682373046875, -4.41290283203125, -4.257568359375, -4.10223388671875, -3.9468994140625, -3.79156494140625, -3.63623046875, -3.48089599609375, -3.3255615234375, -3.17022705078125, -3.014892578125, -2.85955810546875, -2.7042236328125, -2.54888916015625, -2.3935546875, -2.23822021484375, -2.0828857421875, -1.92755126953125, -1.772216796875, -1.61688232421875, -1.4615478515625, -1.30621337890625, -1.15087890625, -0.99554443359375, -0.8402099609375, -0.68487548828125, -0.529541015625, -0.37420654296875, -0.2188720703125, -0.06353759765625, 0.091796875, 0.24713134765625, 0.4024658203125, 0.55780029296875, 0.713134765625, 0.86846923828125, 1.0238037109375, 1.17913818359375, 1.33447265625, 1.48980712890625, 1.6451416015625, 1.80047607421875, 1.955810546875, 2.11114501953125, 2.2664794921875, 2.42181396484375, 2.5771484375, 2.73248291015625, 2.8878173828125, 3.04315185546875, 3.198486328125, 3.35382080078125, 3.5091552734375, 3.66448974609375, 3.81982421875, 3.97515869140625, 4.1304931640625, 4.28582763671875, 4.441162109375, 4.59649658203125, 4.7518310546875, 4.90716552734375, 5.0625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 14.0, 17.0, 34.0, 45.0, 71.0, 117.0, 173.0, 297.0, 708.0, 1141.0, 655.0, 288.0, 174.0, 100.0, 75.0, 43.0, 32.0, 19.0, 12.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2578125, -10.9488525390625, -10.639892578125, -10.3309326171875, -10.02197265625, -9.7130126953125, -9.404052734375, -9.0950927734375, -8.7861328125, -8.4771728515625, -8.168212890625, -7.8592529296875, -7.55029296875, -7.2413330078125, -6.932373046875, -6.6234130859375, -6.314453125, -6.0054931640625, -5.696533203125, -5.3875732421875, -5.07861328125, -4.7696533203125, -4.460693359375, -4.1517333984375, -3.8427734375, -3.5338134765625, -3.224853515625, -2.9158935546875, -2.60693359375, -2.2979736328125, -1.989013671875, -1.6800537109375, -1.37109375, -1.0621337890625, -0.753173828125, -0.4442138671875, -0.13525390625, 0.1737060546875, 0.482666015625, 0.7916259765625, 1.1005859375, 1.4095458984375, 1.718505859375, 2.0274658203125, 2.33642578125, 2.6453857421875, 2.954345703125, 3.2633056640625, 3.572265625, 3.8812255859375, 4.190185546875, 4.4991455078125, 4.80810546875, 5.1170654296875, 5.426025390625, 5.7349853515625, 6.0439453125, 6.3529052734375, 6.661865234375, 6.9708251953125, 7.27978515625, 7.5887451171875, 7.897705078125, 8.2066650390625, 8.515625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 12.0, 14.0, 13.0, 24.0, 36.0, 23.0, 41.0, 46.0, 72.0, 103.0, 136.0, 175.0, 263.0, 428.0, 745.0, 1329.0, 2720.0, 5510.0, 12774.0, 31928.0, 96561.0, 472135.0, 3078413.0, 357934.0, 82316.0, 28538.0, 11259.0, 5018.0, 2443.0, 1182.0, 710.0, 469.0, 223.0, 179.0, 110.0, 98.0, 60.0, 55.0, 38.0, 29.0, 27.0, 16.0, 12.0, 13.0, 5.0, 8.0, 13.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5625, -10.2154541015625, -9.868408203125, -9.5213623046875, -9.17431640625, -8.8272705078125, -8.480224609375, -8.1331787109375, -7.7861328125, -7.4390869140625, -7.092041015625, -6.7449951171875, -6.39794921875, -6.0509033203125, -5.703857421875, -5.3568115234375, -5.009765625, -4.6627197265625, -4.315673828125, -3.9686279296875, -3.62158203125, -3.2745361328125, -2.927490234375, -2.5804443359375, -2.2333984375, -1.8863525390625, -1.539306640625, -1.1922607421875, -0.84521484375, -0.4981689453125, -0.151123046875, 0.1959228515625, 0.54296875, 0.8900146484375, 1.237060546875, 1.5841064453125, 1.93115234375, 2.2781982421875, 2.625244140625, 2.9722900390625, 3.3193359375, 3.6663818359375, 4.013427734375, 4.3604736328125, 4.70751953125, 5.0545654296875, 5.401611328125, 5.7486572265625, 6.095703125, 6.4427490234375, 6.789794921875, 7.1368408203125, 7.48388671875, 7.8309326171875, 8.177978515625, 8.5250244140625, 8.8720703125, 9.2191162109375, 9.566162109375, 9.9132080078125, 10.26025390625, 10.6072998046875, 10.954345703125, 11.3013916015625, 11.6484375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 10.0, 9.0, 15.0, 24.0, 30.0, 39.0, 44.0, 94.0, 118.0, 160.0, 138.0, 104.0, 72.0, 42.0, 43.0, 26.0, 16.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.158594131469727, -16.842029571533203, -15.525463104248047, -14.208897590637207, -12.892332077026367, -11.575766563415527, -10.259201049804688, -8.942635536193848, -7.626070022583008, -6.309504508972168, -4.992938995361328, -3.6763734817504883, -2.3598079681396484, -1.0432424545288086, 0.27332305908203125, 1.589888572692871, 2.906454086303711, 4.223019599914551, 5.539585113525391, 6.8561506271362305, 8.17271614074707, 9.48928165435791, 10.80584716796875, 12.12241268157959, 13.43897819519043, 14.75554370880127, 16.07210922241211, 17.388675689697266, 18.70524024963379, 20.021804809570312, 21.33837127685547, 22.654937744140625, 23.97150421142578, 25.288070678710938, 26.60463523864746, 27.921199798583984, 29.23776626586914, 30.554332733154297, 31.87089729309082, 33.187461853027344, 34.5040283203125, 35.820594787597656, 37.13716125488281, 38.4537239074707, 39.77029037475586, 41.086856842041016, 42.403419494628906, 43.71998596191406, 45.03655242919922, 46.353118896484375, 47.66968536376953, 48.98624801635742, 50.30281448364258, 51.619380950927734, 52.935943603515625, 54.25251007080078, 55.56907653808594, 56.885643005371094, 58.20220947265625, 59.51877212524414, 60.8353385925293, 62.15190505981445, 63.468467712402344, 64.7850341796875, 66.10160064697266]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 1.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 22.0, 28.0, 14.0, 22.0, 19.0, 31.0, 35.0, 39.0, 36.0, 38.0, 29.0, 29.0, 37.0, 36.0, 44.0, 49.0, 33.0, 44.0, 32.0, 37.0, 25.0, 34.0, 26.0, 29.0, 22.0, 30.0, 14.0, 12.0, 16.0, 17.0, 9.0, 10.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 6.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.290016174316406, -17.674758911132812, -17.059499740600586, -16.444242477416992, -15.828984260559082, -15.213726043701172, -14.598468780517578, -13.983210563659668, -13.367952346801758, -12.752694129943848, -12.137436866760254, -11.522178649902344, -10.906920433044434, -10.291662216186523, -9.67640495300293, -9.06114673614502, -8.445889472961426, -7.830631732940674, -7.215373516082764, -6.600115776062012, -5.984857559204102, -5.36959981918335, -4.754342079162598, -4.1390838623046875, -3.5238261222839355, -2.9085681438446045, -2.2933101654052734, -1.6780524253845215, -1.0627944469451904, -0.4475364685058594, 0.16772127151489258, 0.7829794883728027, 1.3982372283935547, 2.0134952068328857, 2.628753185272217, 3.2440109252929688, 3.8592689037323, 4.474526882171631, 5.089784622192383, 5.705042839050293, 6.320300579071045, 6.935558319091797, 7.550816535949707, 8.166074752807617, 8.781332015991211, 9.396590232849121, 10.011848449707031, 10.627105712890625, 11.242363929748535, 11.857622146606445, 12.472879409790039, 13.08813762664795, 13.70339584350586, 14.318653106689453, 14.933911323547363, 15.549169540405273, 16.164426803588867, 16.77968406677246, 17.394943237304688, 18.01020050048828, 18.625457763671875, 19.2407169342041, 19.855974197387695, 20.471233367919922, 21.086490631103516]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 19.0, 17.0, 19.0, 20.0, 23.0, 21.0, 33.0, 29.0, 43.0, 38.0, 39.0, 42.0, 47.0, 48.0, 44.0, 57.0, 49.0, 36.0, 46.0, 50.0, 34.0, 29.0, 29.0, 34.0, 28.0, 21.0, 17.0, 15.0, 18.0, 14.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.6990509033203125, -1.633453369140625, -1.5678558349609375, -1.50225830078125, -1.4366607666015625, -1.371063232421875, -1.3054656982421875, -1.2398681640625, -1.1742706298828125, -1.108673095703125, -1.0430755615234375, -0.97747802734375, -0.9118804931640625, -0.846282958984375, -0.7806854248046875, -0.715087890625, -0.6494903564453125, -0.583892822265625, -0.5182952880859375, -0.45269775390625, -0.3871002197265625, -0.321502685546875, -0.2559051513671875, -0.1903076171875, -0.1247100830078125, -0.059112548828125, 0.0064849853515625, 0.07208251953125, 0.1376800537109375, 0.203277587890625, 0.2688751220703125, 0.33447265625, 0.4000701904296875, 0.465667724609375, 0.5312652587890625, 0.59686279296875, 0.6624603271484375, 0.728057861328125, 0.7936553955078125, 0.8592529296875, 0.9248504638671875, 0.990447998046875, 1.0560455322265625, 1.12164306640625, 1.1872406005859375, 1.252838134765625, 1.3184356689453125, 1.384033203125, 1.4496307373046875, 1.515228271484375, 1.5808258056640625, 1.64642333984375, 1.7120208740234375, 1.777618408203125, 1.8432159423828125, 1.9088134765625, 1.9744110107421875, 2.040008544921875, 2.1056060791015625, 2.17120361328125, 2.2368011474609375, 2.302398681640625, 2.3679962158203125, 2.43359375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 9.0, 18.0, 22.0, 32.0, 32.0, 83.0, 110.0, 175.0, 240.0, 455.0, 601.0, 1092.0, 1709.0, 3130.0, 5302.0, 9713.0, 18598.0, 37554.0, 83641.0, 210482.0, 371410.0, 167647.0, 68728.0, 31721.0, 16166.0, 8395.0, 4635.0, 2703.0, 1528.0, 965.0, 588.0, 401.0, 201.0, 150.0, 99.0, 65.0, 57.0, 20.0, 24.0, 14.0, 15.0, 4.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6484375, -8.34375, -8.0390625, -7.734375, -7.4296875, -7.125, -6.8203125, -6.515625, -6.2109375, -5.90625, -5.6015625, -5.296875, -4.9921875, -4.6875, -4.3828125, -4.078125, -3.7734375, -3.46875, -3.1640625, -2.859375, -2.5546875, -2.25, -1.9453125, -1.640625, -1.3359375, -1.03125, -0.7265625, -0.421875, -0.1171875, 0.1875, 0.4921875, 0.796875, 1.1015625, 1.40625, 1.7109375, 2.015625, 2.3203125, 2.625, 2.9296875, 3.234375, 3.5390625, 3.84375, 4.1484375, 4.453125, 4.7578125, 5.0625, 5.3671875, 5.671875, 5.9765625, 6.28125, 6.5859375, 6.890625, 7.1953125, 7.5, 7.8046875, 8.109375, 8.4140625, 8.71875, 9.0234375, 9.328125, 9.6328125, 9.9375, 10.2421875, 10.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 7.0, 8.0, 12.0, 16.0, 19.0, 24.0, 21.0, 21.0, 30.0, 35.0, 37.0, 36.0, 49.0, 50.0, 42.0, 54.0, 1076.0, 46.0, 42.0, 52.0, 47.0, 49.0, 36.0, 37.0, 28.0, 22.0, 20.0, 17.0, 20.0, 13.0, 17.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08984375, -2.025390625, -1.9609375, -1.896484375, -1.83203125, -1.767578125, -1.703125, -1.638671875, -1.57421875, -1.509765625, -1.4453125, -1.380859375, -1.31640625, -1.251953125, -1.1875, -1.123046875, -1.05859375, -0.994140625, -0.9296875, -0.865234375, -0.80078125, -0.736328125, -0.671875, -0.607421875, -0.54296875, -0.478515625, -0.4140625, -0.349609375, -0.28515625, -0.220703125, -0.15625, -0.091796875, -0.02734375, 0.037109375, 0.1015625, 0.166015625, 0.23046875, 0.294921875, 0.359375, 0.423828125, 0.48828125, 0.552734375, 0.6171875, 0.681640625, 0.74609375, 0.810546875, 0.875, 0.939453125, 1.00390625, 1.068359375, 1.1328125, 1.197265625, 1.26171875, 1.326171875, 1.390625, 1.455078125, 1.51953125, 1.583984375, 1.6484375, 1.712890625, 1.77734375, 1.841796875, 1.90625, 1.970703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 15.0, 11.0, 39.0, 30.0, 52.0, 107.0, 154.0, 280.0, 399.0, 677.0, 1158.0, 2551.0, 5547.0, 14616.0, 52972.0, 1054775.0, 886692.0, 51394.0, 14457.0, 5503.0, 2576.0, 1287.0, 691.0, 423.0, 225.0, 169.0, 107.0, 73.0, 40.0, 27.0, 14.0, 14.0, 6.0, 9.0, 1.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.359619140625, -18.73486328125, -18.110107421875, -17.4853515625, -16.860595703125, -16.23583984375, -15.611083984375, -14.986328125, -14.361572265625, -13.73681640625, -13.112060546875, -12.4873046875, -11.862548828125, -11.23779296875, -10.613037109375, -9.98828125, -9.363525390625, -8.73876953125, -8.114013671875, -7.4892578125, -6.864501953125, -6.23974609375, -5.614990234375, -4.990234375, -4.365478515625, -3.74072265625, -3.115966796875, -2.4912109375, -1.866455078125, -1.24169921875, -0.616943359375, 0.0078125, 0.632568359375, 1.25732421875, 1.882080078125, 2.5068359375, 3.131591796875, 3.75634765625, 4.381103515625, 5.005859375, 5.630615234375, 6.25537109375, 6.880126953125, 7.5048828125, 8.129638671875, 8.75439453125, 9.379150390625, 10.00390625, 10.628662109375, 11.25341796875, 11.878173828125, 12.5029296875, 13.127685546875, 13.75244140625, 14.377197265625, 15.001953125, 15.626708984375, 16.25146484375, 16.876220703125, 17.5009765625, 18.125732421875, 18.75048828125, 19.375244140625, 20.0]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 27.0, 33.0, 66.0, 94.0, 208.0, 224.0, 114.0, 55.0, 41.0, 21.0, 15.0, 10.0, 11.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.415283203125, -4.25244140625, -4.089599609375, -3.9267578125, -3.763916015625, -3.60107421875, -3.438232421875, -3.275390625, -3.112548828125, -2.94970703125, -2.786865234375, -2.6240234375, -2.461181640625, -2.29833984375, -2.135498046875, -1.97265625, -1.809814453125, -1.64697265625, -1.484130859375, -1.3212890625, -1.158447265625, -0.99560546875, -0.832763671875, -0.669921875, -0.507080078125, -0.34423828125, -0.181396484375, -0.0185546875, 0.144287109375, 0.30712890625, 0.469970703125, 0.6328125, 0.795654296875, 0.95849609375, 1.121337890625, 1.2841796875, 1.447021484375, 1.60986328125, 1.772705078125, 1.935546875, 2.098388671875, 2.26123046875, 2.424072265625, 2.5869140625, 2.749755859375, 2.91259765625, 3.075439453125, 3.23828125, 3.401123046875, 3.56396484375, 3.726806640625, 3.8896484375, 4.052490234375, 4.21533203125, 4.378173828125, 4.541015625, 4.703857421875, 4.86669921875, 5.029541015625, 5.1923828125, 5.355224609375, 5.51806640625, 5.680908203125, 5.84375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 7.0, 8.0, 14.0, 9.0, 22.0, 37.0, 55.0, 89.0, 208.0, 703.0, 4402.0, 356710.0, 680264.0, 4748.0, 733.0, 240.0, 112.0, 57.0, 34.0, 29.0, 14.0, 14.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.8125, -84.40234375, -81.9921875, -79.58203125, -77.171875, -74.76171875, -72.3515625, -69.94140625, -67.53125, -65.12109375, -62.7109375, -60.30078125, -57.890625, -55.48046875, -53.0703125, -50.66015625, -48.25, -45.83984375, -43.4296875, -41.01953125, -38.609375, -36.19921875, -33.7890625, -31.37890625, -28.96875, -26.55859375, -24.1484375, -21.73828125, -19.328125, -16.91796875, -14.5078125, -12.09765625, -9.6875, -7.27734375, -4.8671875, -2.45703125, -0.046875, 2.36328125, 4.7734375, 7.18359375, 9.59375, 12.00390625, 14.4140625, 16.82421875, 19.234375, 21.64453125, 24.0546875, 26.46484375, 28.875, 31.28515625, 33.6953125, 36.10546875, 38.515625, 40.92578125, 43.3359375, 45.74609375, 48.15625, 50.56640625, 52.9765625, 55.38671875, 57.796875, 60.20703125, 62.6171875, 65.02734375, 67.4375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 17.0, 55.0, 133.0, 351.0, 290.0, 101.0, 35.0, 17.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.813743591308594, -8.370620727539062, -7.927497863769531, -7.484375, -7.041252613067627, -6.598129749298096, -6.1550068855285645, -5.711884498596191, -5.26876163482666, -4.825638771057129, -4.382515907287598, -3.9393932819366455, -3.4962706565856934, -3.053147792816162, -2.610024929046631, -2.1669023036956787, -1.7237792015075684, -1.2806564569473267, -0.8375336527824402, -0.3944108486175537, 0.04871189594268799, 0.4918346405029297, 0.9349575042724609, 1.378080129623413, 1.8212029933929443, 2.2643258571624756, 2.7074484825134277, 3.150571346282959, 3.5936942100524902, 4.036816596984863, 4.4799394607543945, 4.923062324523926, 5.366185188293457, 5.809308052062988, 6.2524309158325195, 6.695553779602051, 7.138676166534424, 7.581799030303955, 8.024921417236328, 8.46804428100586, 8.91116714477539, 9.354290008544922, 9.797412872314453, 10.240535736083984, 10.683658599853516, 11.126781463623047, 11.569904327392578, 12.013026237487793, 12.45615005493164, 12.899272918701172, 13.342395782470703, 13.785518646240234, 14.228641510009766, 14.671764373779297, 15.114887237548828, 15.558009147644043, 16.001131057739258, 16.44425392150879, 16.88737678527832, 17.33049964904785, 17.773622512817383, 18.216745376586914, 18.659868240356445, 19.102991104125977, 19.546113967895508]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 23.0, 21.0, 37.0, 42.0, 46.0, 58.0, 56.0, 62.0, 71.0, 71.0, 65.0, 60.0, 57.0, 61.0, 53.0, 40.0, 34.0, 23.0, 34.0, 20.0, 21.0, 15.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7889270782470703, -3.6258251667022705, -3.4627232551574707, -3.299621343612671, -3.136519432067871, -2.973417282104492, -2.8103153705596924, -2.6472134590148926, -2.4841115474700928, -2.321009635925293, -2.157907724380493, -1.9948056936264038, -1.831703782081604, -1.6686018705368042, -1.5054998397827148, -1.342397928237915, -1.1792960166931152, -1.0161941051483154, -0.8530921339988708, -0.6899901628494263, -0.5268882513046265, -0.36378633975982666, -0.20068436861038208, -0.0375823974609375, 0.1255195140838623, 0.2886214554309845, 0.4517233967781067, 0.6148253679275513, 0.7779272794723511, 0.9410291910171509, 1.1041312217712402, 1.26723313331604, 1.4303350448608398, 1.5934369564056396, 1.7565388679504395, 1.9196408987045288, 2.082742691040039, 2.245844841003418, 2.4089467525482178, 2.5720486640930176, 2.7351505756378174, 2.898252487182617, 3.061354398727417, 3.224456310272217, 3.3875584602355957, 3.5506601333618164, 3.7137622833251953, 3.876864194869995, 4.039966106414795, 4.203068256378174, 4.3661699295043945, 4.529272079467773, 4.692373752593994, 4.855475902557373, 5.018577575683594, 5.181679725646973, 5.344781875610352, 5.5078840255737305, 5.670985698699951, 5.83408784866333, 5.997189521789551, 6.16029167175293, 6.32339334487915, 6.486495494842529, 6.64959716796875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 15.0, 23.0, 33.0, 34.0, 26.0, 39.0, 43.0, 54.0, 61.0, 55.0, 54.0, 55.0, 73.0, 57.0, 49.0, 53.0, 44.0, 38.0, 35.0, 34.0, 26.0, 26.0, 15.0, 10.0, 11.0, 8.0, 5.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24273681640625, -2.1593017578125, -2.07586669921875, -1.992431640625, -1.90899658203125, -1.8255615234375, -1.74212646484375, -1.65869140625, -1.57525634765625, -1.4918212890625, -1.40838623046875, -1.324951171875, -1.24151611328125, -1.1580810546875, -1.07464599609375, -0.9912109375, -0.90777587890625, -0.8243408203125, -0.74090576171875, -0.657470703125, -0.57403564453125, -0.4906005859375, -0.40716552734375, -0.32373046875, -0.24029541015625, -0.1568603515625, -0.07342529296875, 0.010009765625, 0.09344482421875, 0.1768798828125, 0.26031494140625, 0.34375, 0.42718505859375, 0.5106201171875, 0.59405517578125, 0.677490234375, 0.76092529296875, 0.8443603515625, 0.92779541015625, 1.01123046875, 1.09466552734375, 1.1781005859375, 1.26153564453125, 1.344970703125, 1.42840576171875, 1.5118408203125, 1.59527587890625, 1.6787109375, 1.76214599609375, 1.8455810546875, 1.92901611328125, 2.012451171875, 2.09588623046875, 2.1793212890625, 2.26275634765625, 2.34619140625, 2.42962646484375, 2.5130615234375, 2.59649658203125, 2.679931640625, 2.76336669921875, 2.8468017578125, 2.93023681640625, 3.013671875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 9.0, 8.0, 13.0, 9.0, 18.0, 21.0, 43.0, 54.0, 82.0, 96.0, 154.0, 241.0, 305.0, 459.0, 737.0, 989.0, 1544.0, 2397.0, 4013.0, 6952.0, 14391.0, 58775.0, 695115.0, 214136.0, 24401.0, 9550.0, 5023.0, 3097.0, 1993.0, 1366.0, 790.0, 522.0, 348.0, 251.0, 200.0, 117.0, 87.0, 62.0, 48.0, 51.0, 22.0, 16.0, 14.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.29315185546875, -4.1488037109375, -4.00445556640625, -3.860107421875, -3.71575927734375, -3.5714111328125, -3.42706298828125, -3.28271484375, -3.13836669921875, -2.9940185546875, -2.84967041015625, -2.705322265625, -2.56097412109375, -2.4166259765625, -2.27227783203125, -2.1279296875, -1.98358154296875, -1.8392333984375, -1.69488525390625, -1.550537109375, -1.40618896484375, -1.2618408203125, -1.11749267578125, -0.97314453125, -0.82879638671875, -0.6844482421875, -0.54010009765625, -0.395751953125, -0.25140380859375, -0.1070556640625, 0.03729248046875, 0.181640625, 0.32598876953125, 0.4703369140625, 0.61468505859375, 0.759033203125, 0.90338134765625, 1.0477294921875, 1.19207763671875, 1.33642578125, 1.48077392578125, 1.6251220703125, 1.76947021484375, 1.913818359375, 2.05816650390625, 2.2025146484375, 2.34686279296875, 2.4912109375, 2.63555908203125, 2.7799072265625, 2.92425537109375, 3.068603515625, 3.21295166015625, 3.3572998046875, 3.50164794921875, 3.64599609375, 3.79034423828125, 3.9346923828125, 4.07904052734375, 4.223388671875, 4.36773681640625, 4.5120849609375, 4.65643310546875, 4.80078125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 9.0, 11.0, 11.0, 20.0, 16.0, 16.0, 33.0, 20.0, 34.0, 43.0, 30.0, 39.0, 35.0, 47.0, 46.0, 103.0, 249.0, 1549.0, 211.0, 91.0, 57.0, 43.0, 52.0, 44.0, 30.0, 28.0, 23.0, 26.0, 17.0, 10.0, 13.0, 13.0, 13.0, 12.0, 6.0, 4.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.84375, -5.6307373046875, -5.417724609375, -5.2047119140625, -4.99169921875, -4.7786865234375, -4.565673828125, -4.3526611328125, -4.1396484375, -3.9266357421875, -3.713623046875, -3.5006103515625, -3.28759765625, -3.0745849609375, -2.861572265625, -2.6485595703125, -2.435546875, -2.2225341796875, -2.009521484375, -1.7965087890625, -1.58349609375, -1.3704833984375, -1.157470703125, -0.9444580078125, -0.7314453125, -0.5184326171875, -0.305419921875, -0.0924072265625, 0.12060546875, 0.3336181640625, 0.546630859375, 0.7596435546875, 0.97265625, 1.1856689453125, 1.398681640625, 1.6116943359375, 1.82470703125, 2.0377197265625, 2.250732421875, 2.4637451171875, 2.6767578125, 2.8897705078125, 3.102783203125, 3.3157958984375, 3.52880859375, 3.7418212890625, 3.954833984375, 4.1678466796875, 4.380859375, 4.5938720703125, 4.806884765625, 5.0198974609375, 5.23291015625, 5.4459228515625, 5.658935546875, 5.8719482421875, 6.0849609375, 6.2979736328125, 6.510986328125, 6.7239990234375, 6.93701171875, 7.1500244140625, 7.363037109375, 7.5760498046875, 7.7890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 11.0, 4.0, 7.0, 10.0, 12.0, 20.0, 20.0, 26.0, 45.0, 72.0, 101.0, 159.0, 296.0, 543.0, 985.0, 1948.0, 4352.0, 12097.0, 53617.0, 2012978.0, 1000333.0, 40026.0, 10216.0, 4013.0, 1690.0, 898.0, 440.0, 264.0, 157.0, 89.0, 84.0, 46.0, 34.0, 26.0, 20.0, 14.0, 9.0, 14.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0], "bins": [-9.1953125, -8.9462890625, -8.697265625, -8.4482421875, -8.19921875, -7.9501953125, -7.701171875, -7.4521484375, -7.203125, -6.9541015625, -6.705078125, -6.4560546875, -6.20703125, -5.9580078125, -5.708984375, -5.4599609375, -5.2109375, -4.9619140625, -4.712890625, -4.4638671875, -4.21484375, -3.9658203125, -3.716796875, -3.4677734375, -3.21875, -2.9697265625, -2.720703125, -2.4716796875, -2.22265625, -1.9736328125, -1.724609375, -1.4755859375, -1.2265625, -0.9775390625, -0.728515625, -0.4794921875, -0.23046875, 0.0185546875, 0.267578125, 0.5166015625, 0.765625, 1.0146484375, 1.263671875, 1.5126953125, 1.76171875, 2.0107421875, 2.259765625, 2.5087890625, 2.7578125, 3.0068359375, 3.255859375, 3.5048828125, 3.75390625, 4.0029296875, 4.251953125, 4.5009765625, 4.75, 4.9990234375, 5.248046875, 5.4970703125, 5.74609375, 5.9951171875, 6.244140625, 6.4931640625, 6.7421875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 25.0, 156.0, 511.0, 269.0, 49.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640542030334473, -4.840981960296631, -3.041422128677368, -1.2418622970581055, 0.5576977729797363, 2.357257843017578, 4.156817436218262, 5.956377983093262, 7.755937576293945, 9.555497169494629, 11.355057716369629, 13.154617309570312, 14.954177856445312, 16.753738403320312, 18.55329704284668, 20.35285758972168, 22.152416229248047, 23.951976776123047, 25.751535415649414, 27.551095962524414, 29.350656509399414, 31.15021514892578, 32.94977569580078, 34.74933624267578, 36.54889678955078, 38.34845733642578, 40.14801788330078, 41.94757843017578, 43.747135162353516, 45.546695709228516, 47.346256256103516, 49.145816802978516, 50.945377349853516, 52.744937896728516, 54.544498443603516, 56.34405517578125, 58.14361572265625, 59.94317626953125, 61.74273681640625, 63.54229736328125, 65.34185791015625, 67.14141845703125, 68.94097900390625, 70.74053955078125, 72.54010009765625, 74.33966064453125, 76.13922119140625, 77.93878173828125, 79.73833465576172, 81.53789520263672, 83.33745574951172, 85.13701629638672, 86.93657684326172, 88.73613739013672, 90.53569030761719, 92.33525085449219, 94.13481903076172, 95.93437957763672, 97.73394012451172, 99.53350067138672, 101.33306121826172, 103.13262176513672, 104.93217468261719, 106.73173522949219, 108.53129577636719]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 9.0, 6.0, 13.0, 14.0, 19.0, 15.0, 15.0, 24.0, 42.0, 28.0, 38.0, 34.0, 35.0, 59.0, 37.0, 33.0, 38.0, 61.0, 44.0, 47.0, 48.0, 42.0, 41.0, 37.0, 28.0, 37.0, 18.0, 14.0, 17.0, 20.0, 14.0, 16.0, 10.0, 9.0, 12.0, 10.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.468992233276367, -24.713703155517578, -23.95841407775879, -23.203125, -22.447834014892578, -21.69254493713379, -20.937255859375, -20.18196678161621, -19.426677703857422, -18.671388626098633, -17.916099548339844, -17.160808563232422, -16.405519485473633, -15.650230407714844, -14.894941329956055, -14.139652252197266, -13.384361267089844, -12.629072189331055, -11.87378215789795, -11.11849308013916, -10.363203048706055, -9.607913970947266, -8.852624893188477, -8.097335815429688, -7.342045783996582, -6.586756229400635, -5.8314666748046875, -5.076177597045898, -4.320888042449951, -3.565598487854004, -2.810309410095215, -2.0550198554992676, -1.2997283935546875, -0.5444389581680298, 0.21085047721862793, 0.9661397933959961, 1.7214293479919434, 2.4767189025878906, 3.2320079803466797, 3.987297534942627, 4.742587089538574, 5.4978766441345215, 6.253166198730469, 7.008455276489258, 7.763744831085205, 8.519034385681152, 9.274323463439941, 10.029613494873047, 10.784902572631836, 11.540191650390625, 12.29548168182373, 13.05077075958252, 13.806060791015625, 14.561349868774414, 15.316638946533203, 16.071928024291992, 16.82721710205078, 17.58250617980957, 18.33779525756836, 19.09308624267578, 19.84837532043457, 20.60366439819336, 21.35895347595215, 22.114242553710938, 22.86953353881836]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 13.0, 13.0, 14.0, 19.0, 30.0, 24.0, 33.0, 40.0, 31.0, 43.0, 46.0, 59.0, 51.0, 54.0, 60.0, 42.0, 57.0, 51.0, 39.0, 35.0, 35.0, 26.0, 31.0, 39.0, 24.0, 21.0, 12.0, 10.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.016082763671875, -1.94232177734375, -1.868560791015625, -1.7947998046875, -1.721038818359375, -1.64727783203125, -1.573516845703125, -1.499755859375, -1.425994873046875, -1.35223388671875, -1.278472900390625, -1.2047119140625, -1.130950927734375, -1.05718994140625, -0.983428955078125, -0.90966796875, -0.835906982421875, -0.76214599609375, -0.688385009765625, -0.6146240234375, -0.540863037109375, -0.46710205078125, -0.393341064453125, -0.319580078125, -0.245819091796875, -0.17205810546875, -0.098297119140625, -0.0245361328125, 0.049224853515625, 0.12298583984375, 0.196746826171875, 0.2705078125, 0.344268798828125, 0.41802978515625, 0.491790771484375, 0.5655517578125, 0.639312744140625, 0.71307373046875, 0.786834716796875, 0.860595703125, 0.934356689453125, 1.00811767578125, 1.081878662109375, 1.1556396484375, 1.229400634765625, 1.30316162109375, 1.376922607421875, 1.45068359375, 1.524444580078125, 1.59820556640625, 1.671966552734375, 1.7457275390625, 1.819488525390625, 1.89324951171875, 1.967010498046875, 2.040771484375, 2.114532470703125, 2.18829345703125, 2.262054443359375, 2.3358154296875, 2.409576416015625, 2.48333740234375, 2.557098388671875, 2.630859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 4.0, 6.0, 6.0, 14.0, 13.0, 26.0, 28.0, 52.0, 56.0, 86.0, 143.0, 200.0, 298.0, 446.0, 651.0, 1080.0, 1685.0, 2792.0, 4601.0, 8269.0, 15021.0, 29550.0, 65355.0, 248620.0, 2837591.0, 795599.0, 99004.0, 39165.0, 19105.0, 10193.0, 5752.0, 3350.0, 1987.0, 1249.0, 784.0, 507.0, 301.0, 227.0, 133.0, 103.0, 72.0, 56.0, 23.0, 29.0, 16.0, 5.0, 8.0, 10.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.578125, -6.38299560546875, -6.1878662109375, -5.99273681640625, -5.797607421875, -5.60247802734375, -5.4073486328125, -5.21221923828125, -5.01708984375, -4.82196044921875, -4.6268310546875, -4.43170166015625, -4.236572265625, -4.04144287109375, -3.8463134765625, -3.65118408203125, -3.4560546875, -3.26092529296875, -3.0657958984375, -2.87066650390625, -2.675537109375, -2.48040771484375, -2.2852783203125, -2.09014892578125, -1.89501953125, -1.69989013671875, -1.5047607421875, -1.30963134765625, -1.114501953125, -0.91937255859375, -0.7242431640625, -0.52911376953125, -0.333984375, -0.13885498046875, 0.0562744140625, 0.25140380859375, 0.446533203125, 0.64166259765625, 0.8367919921875, 1.03192138671875, 1.22705078125, 1.42218017578125, 1.6173095703125, 1.81243896484375, 2.007568359375, 2.20269775390625, 2.3978271484375, 2.59295654296875, 2.7880859375, 2.98321533203125, 3.1783447265625, 3.37347412109375, 3.568603515625, 3.76373291015625, 3.9588623046875, 4.15399169921875, 4.34912109375, 4.54425048828125, 4.7393798828125, 4.93450927734375, 5.129638671875, 5.32476806640625, 5.5198974609375, 5.71502685546875, 5.91015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 6.0, 6.0, 16.0, 23.0, 23.0, 50.0, 45.0, 69.0, 74.0, 104.0, 140.0, 274.0, 533.0, 824.0, 749.0, 393.0, 226.0, 143.0, 90.0, 72.0, 47.0, 32.0, 27.0, 29.0, 18.0, 12.0, 7.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.70367431640625, -4.4659423828125, -4.22821044921875, -3.990478515625, -3.75274658203125, -3.5150146484375, -3.27728271484375, -3.03955078125, -2.80181884765625, -2.5640869140625, -2.32635498046875, -2.088623046875, -1.85089111328125, -1.6131591796875, -1.37542724609375, -1.1376953125, -0.89996337890625, -0.6622314453125, -0.42449951171875, -0.186767578125, 0.05096435546875, 0.2886962890625, 0.52642822265625, 0.76416015625, 1.00189208984375, 1.2396240234375, 1.47735595703125, 1.715087890625, 1.95281982421875, 2.1905517578125, 2.42828369140625, 2.666015625, 2.90374755859375, 3.1414794921875, 3.37921142578125, 3.616943359375, 3.85467529296875, 4.0924072265625, 4.33013916015625, 4.56787109375, 4.80560302734375, 5.0433349609375, 5.28106689453125, 5.518798828125, 5.75653076171875, 5.9942626953125, 6.23199462890625, 6.4697265625, 6.70745849609375, 6.9451904296875, 7.18292236328125, 7.420654296875, 7.65838623046875, 7.8961181640625, 8.13385009765625, 8.37158203125, 8.60931396484375, 8.8470458984375, 9.08477783203125, 9.322509765625, 9.56024169921875, 9.7979736328125, 10.03570556640625, 10.2734375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 11.0, 8.0, 16.0, 23.0, 44.0, 52.0, 115.0, 190.0, 350.0, 660.0, 1311.0, 2815.0, 6283.0, 14593.0, 37653.0, 109665.0, 537679.0, 2992207.0, 350106.0, 87024.0, 30834.0, 12482.0, 5334.0, 2438.0, 1147.0, 547.0, 295.0, 158.0, 82.0, 53.0, 37.0, 32.0, 16.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.234375, -11.915771484375, -11.59716796875, -11.278564453125, -10.9599609375, -10.641357421875, -10.32275390625, -10.004150390625, -9.685546875, -9.366943359375, -9.04833984375, -8.729736328125, -8.4111328125, -8.092529296875, -7.77392578125, -7.455322265625, -7.13671875, -6.818115234375, -6.49951171875, -6.180908203125, -5.8623046875, -5.543701171875, -5.22509765625, -4.906494140625, -4.587890625, -4.269287109375, -3.95068359375, -3.632080078125, -3.3134765625, -2.994873046875, -2.67626953125, -2.357666015625, -2.0390625, -1.720458984375, -1.40185546875, -1.083251953125, -0.7646484375, -0.446044921875, -0.12744140625, 0.191162109375, 0.509765625, 0.828369140625, 1.14697265625, 1.465576171875, 1.7841796875, 2.102783203125, 2.42138671875, 2.739990234375, 3.05859375, 3.377197265625, 3.69580078125, 4.014404296875, 4.3330078125, 4.651611328125, 4.97021484375, 5.288818359375, 5.607421875, 5.926025390625, 6.24462890625, 6.563232421875, 6.8818359375, 7.200439453125, 7.51904296875, 7.837646484375, 8.15625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 16.0, 26.0, 57.0, 93.0, 156.0, 184.0, 181.0, 126.0, 63.0, 36.0, 34.0, 15.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.126312255859375, -59.4169807434082, -57.70764923095703, -55.998313903808594, -54.28898239135742, -52.57965087890625, -50.87031936645508, -49.160987854003906, -47.45165252685547, -45.7423210144043, -44.032989501953125, -42.32365417480469, -40.614322662353516, -38.904991149902344, -37.19565963745117, -35.486328125, -33.77699661254883, -32.067665100097656, -30.35833168029785, -28.64900016784668, -26.939666748046875, -25.230335235595703, -23.52100372314453, -21.81167221069336, -20.102338790893555, -18.393007278442383, -16.683673858642578, -14.974342346191406, -13.265009880065918, -11.55567741394043, -9.846345901489258, -8.13701343536377, -6.427677154541016, -4.718344688415527, -3.0090126991271973, -1.2996807098388672, 0.4096517562866211, 2.1189842224121094, 3.8283157348632812, 5.5376482009887695, 7.246980667114258, 8.956313133239746, 10.665645599365234, 12.374977111816406, 14.084309577941895, 15.793642044067383, 17.502973556518555, 19.21230697631836, 20.92163848876953, 22.630970001220703, 24.340303421020508, 26.04963493347168, 27.758968353271484, 29.468299865722656, 31.177631378173828, 32.886962890625, 34.59629821777344, 36.30562973022461, 38.01496124267578, 39.72429656982422, 41.43362808227539, 43.14295959472656, 44.852291107177734, 46.561622619628906, 48.27095413208008]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 14.0, 11.0, 15.0, 13.0, 15.0, 20.0, 22.0, 25.0, 21.0, 34.0, 28.0, 36.0, 36.0, 42.0, 36.0, 29.0, 32.0, 44.0, 31.0, 33.0, 48.0, 43.0, 33.0, 37.0, 35.0, 34.0, 29.0, 32.0, 24.0, 27.0, 20.0, 16.0, 11.0, 17.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.841964721679688, -17.242277145385742, -16.642589569091797, -16.04290199279785, -15.44321346282959, -14.843525886535645, -14.2438383102417, -13.644149780273438, -13.044462203979492, -12.444774627685547, -11.845087051391602, -11.245399475097656, -10.645710945129395, -10.04602336883545, -9.446335792541504, -8.846647262573242, -8.246960639953613, -7.647273063659668, -7.0475850105285645, -6.447897434234619, -5.848209381103516, -5.24852180480957, -4.648834228515625, -4.0491461753845215, -3.449458599090576, -2.8497707843780518, -2.2500829696655273, -1.650395393371582, -1.0507075786590576, -0.4510197639465332, 0.1486678123474121, 0.7483558654785156, 1.348043441772461, 1.9477312564849854, 2.5474190711975098, 3.147106647491455, 3.7467944622039795, 4.346482276916504, 4.946169853210449, 5.545857906341553, 6.145545482635498, 6.745233058929443, 7.344921112060547, 7.944608688354492, 8.544296264648438, 9.143983840942383, 9.743671417236328, 10.34335994720459, 10.943047523498535, 11.54273509979248, 12.142422676086426, 12.742111206054688, 13.341798782348633, 13.941486358642578, 14.541173934936523, 15.140861511230469, 15.740549087524414, 16.34023666381836, 16.939924240112305, 17.53961181640625, 18.139299392700195, 18.73898696899414, 19.33867645263672, 19.938364028930664, 20.53805160522461]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 11.0, 9.0, 12.0, 13.0, 18.0, 22.0, 35.0, 32.0, 37.0, 39.0, 37.0, 52.0, 63.0, 63.0, 65.0, 53.0, 67.0, 51.0, 40.0, 29.0, 36.0, 35.0, 26.0, 34.0, 27.0, 15.0, 19.0, 11.0, 11.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4517822265625, -2.372314453125, -2.2928466796875, -2.21337890625, -2.1339111328125, -2.054443359375, -1.9749755859375, -1.8955078125, -1.8160400390625, -1.736572265625, -1.6571044921875, -1.57763671875, -1.4981689453125, -1.418701171875, -1.3392333984375, -1.259765625, -1.1802978515625, -1.100830078125, -1.0213623046875, -0.94189453125, -0.8624267578125, -0.782958984375, -0.7034912109375, -0.6240234375, -0.5445556640625, -0.465087890625, -0.3856201171875, -0.30615234375, -0.2266845703125, -0.147216796875, -0.0677490234375, 0.01171875, 0.0911865234375, 0.170654296875, 0.2501220703125, 0.32958984375, 0.4090576171875, 0.488525390625, 0.5679931640625, 0.6474609375, 0.7269287109375, 0.806396484375, 0.8858642578125, 0.96533203125, 1.0447998046875, 1.124267578125, 1.2037353515625, 1.283203125, 1.3626708984375, 1.442138671875, 1.5216064453125, 1.60107421875, 1.6805419921875, 1.760009765625, 1.8394775390625, 1.9189453125, 1.9984130859375, 2.077880859375, 2.1573486328125, 2.23681640625, 2.3162841796875, 2.395751953125, 2.4752197265625, 2.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 4.0, 14.0, 15.0, 31.0, 68.0, 69.0, 127.0, 213.0, 319.0, 507.0, 739.0, 1129.0, 1780.0, 2924.0, 4516.0, 7082.0, 11398.0, 18787.0, 34332.0, 68378.0, 162734.0, 415208.0, 164195.0, 69390.0, 34629.0, 19337.0, 11371.0, 6928.0, 4424.0, 2803.0, 1776.0, 1161.0, 754.0, 521.0, 326.0, 194.0, 136.0, 84.0, 56.0, 28.0, 16.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5762939453125, -10.269775390625, -9.9632568359375, -9.65673828125, -9.3502197265625, -9.043701171875, -8.7371826171875, -8.4306640625, -8.1241455078125, -7.817626953125, -7.5111083984375, -7.20458984375, -6.8980712890625, -6.591552734375, -6.2850341796875, -5.978515625, -5.6719970703125, -5.365478515625, -5.0589599609375, -4.75244140625, -4.4459228515625, -4.139404296875, -3.8328857421875, -3.5263671875, -3.2198486328125, -2.913330078125, -2.6068115234375, -2.30029296875, -1.9937744140625, -1.687255859375, -1.3807373046875, -1.07421875, -0.7677001953125, -0.461181640625, -0.1546630859375, 0.15185546875, 0.4583740234375, 0.764892578125, 1.0714111328125, 1.3779296875, 1.6844482421875, 1.990966796875, 2.2974853515625, 2.60400390625, 2.9105224609375, 3.217041015625, 3.5235595703125, 3.830078125, 4.1365966796875, 4.443115234375, 4.7496337890625, 5.05615234375, 5.3626708984375, 5.669189453125, 5.9757080078125, 6.2822265625, 6.5887451171875, 6.895263671875, 7.2017822265625, 7.50830078125, 7.8148193359375, 8.121337890625, 8.4278564453125, 8.734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 15.0, 20.0, 14.0, 15.0, 23.0, 21.0, 34.0, 37.0, 39.0, 39.0, 53.0, 46.0, 43.0, 59.0, 1061.0, 47.0, 43.0, 38.0, 34.0, 32.0, 33.0, 33.0, 27.0, 27.0, 27.0, 17.0, 22.0, 15.0, 14.0, 11.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.45703125, -2.3908233642578125, -2.324615478515625, -2.2584075927734375, -2.19219970703125, -2.1259918212890625, -2.059783935546875, -1.9935760498046875, -1.9273681640625, -1.8611602783203125, -1.794952392578125, -1.7287445068359375, -1.66253662109375, -1.5963287353515625, -1.530120849609375, -1.4639129638671875, -1.397705078125, -1.3314971923828125, -1.265289306640625, -1.1990814208984375, -1.13287353515625, -1.0666656494140625, -1.000457763671875, -0.9342498779296875, -0.8680419921875, -0.8018341064453125, -0.735626220703125, -0.6694183349609375, -0.60321044921875, -0.5370025634765625, -0.470794677734375, -0.4045867919921875, -0.33837890625, -0.2721710205078125, -0.205963134765625, -0.1397552490234375, -0.07354736328125, -0.0073394775390625, 0.058868408203125, 0.1250762939453125, 0.1912841796875, 0.2574920654296875, 0.323699951171875, 0.3899078369140625, 0.45611572265625, 0.5223236083984375, 0.588531494140625, 0.6547393798828125, 0.720947265625, 0.7871551513671875, 0.853363037109375, 0.9195709228515625, 0.98577880859375, 1.0519866943359375, 1.118194580078125, 1.1844024658203125, 1.2506103515625, 1.3168182373046875, 1.383026123046875, 1.4492340087890625, 1.51544189453125, 1.5816497802734375, 1.647857666015625, 1.7140655517578125, 1.7802734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 0.0, 10.0, 3.0, 6.0, 20.0, 30.0, 33.0, 57.0, 68.0, 103.0, 186.0, 275.0, 439.0, 763.0, 1424.0, 3173.0, 8534.0, 26684.0, 132851.0, 1727473.0, 150553.0, 28509.0, 8945.0, 3449.0, 1479.0, 801.0, 422.0, 271.0, 175.0, 127.0, 107.0, 54.0, 35.0, 13.0, 12.0, 13.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.5625, -18.921630859375, -18.28076171875, -17.639892578125, -16.9990234375, -16.358154296875, -15.71728515625, -15.076416015625, -14.435546875, -13.794677734375, -13.15380859375, -12.512939453125, -11.8720703125, -11.231201171875, -10.59033203125, -9.949462890625, -9.30859375, -8.667724609375, -8.02685546875, -7.385986328125, -6.7451171875, -6.104248046875, -5.46337890625, -4.822509765625, -4.181640625, -3.540771484375, -2.89990234375, -2.259033203125, -1.6181640625, -0.977294921875, -0.33642578125, 0.304443359375, 0.9453125, 1.586181640625, 2.22705078125, 2.867919921875, 3.5087890625, 4.149658203125, 4.79052734375, 5.431396484375, 6.072265625, 6.713134765625, 7.35400390625, 7.994873046875, 8.6357421875, 9.276611328125, 9.91748046875, 10.558349609375, 11.19921875, 11.840087890625, 12.48095703125, 13.121826171875, 13.7626953125, 14.403564453125, 15.04443359375, 15.685302734375, 16.326171875, 16.967041015625, 17.60791015625, 18.248779296875, 18.8896484375, 19.530517578125, 20.17138671875, 20.812255859375, 21.453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 19.0, 26.0, 71.0, 109.0, 287.0, 235.0, 103.0, 50.0, 26.0, 16.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.453125, -5.2578125, -5.0625, -4.8671875, -4.671875, -4.4765625, -4.28125, -4.0859375, -3.890625, -3.6953125, -3.5, -3.3046875, -3.109375, -2.9140625, -2.71875, -2.5234375, -2.328125, -2.1328125, -1.9375, -1.7421875, -1.546875, -1.3515625, -1.15625, -0.9609375, -0.765625, -0.5703125, -0.375, -0.1796875, 0.015625, 0.2109375, 0.40625, 0.6015625, 0.796875, 0.9921875, 1.1875, 1.3828125, 1.578125, 1.7734375, 1.96875, 2.1640625, 2.359375, 2.5546875, 2.75, 2.9453125, 3.140625, 3.3359375, 3.53125, 3.7265625, 3.921875, 4.1171875, 4.3125, 4.5078125, 4.703125, 4.8984375, 5.09375, 5.2890625, 5.484375, 5.6796875, 5.875, 6.0703125, 6.265625, 6.4609375, 6.65625, 6.8515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 32.0, 52.0, 113.0, 382.0, 1554.0, 20360.0, 1017587.0, 7015.0, 992.0, 237.0, 99.0, 41.0, 12.0, 10.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.625, -102.63671875, -99.6484375, -96.66015625, -93.671875, -90.68359375, -87.6953125, -84.70703125, -81.71875, -78.73046875, -75.7421875, -72.75390625, -69.765625, -66.77734375, -63.7890625, -60.80078125, -57.8125, -54.82421875, -51.8359375, -48.84765625, -45.859375, -42.87109375, -39.8828125, -36.89453125, -33.90625, -30.91796875, -27.9296875, -24.94140625, -21.953125, -18.96484375, -15.9765625, -12.98828125, -10.0, -7.01171875, -4.0234375, -1.03515625, 1.953125, 4.94140625, 7.9296875, 10.91796875, 13.90625, 16.89453125, 19.8828125, 22.87109375, 25.859375, 28.84765625, 31.8359375, 34.82421875, 37.8125, 40.80078125, 43.7890625, 46.77734375, 49.765625, 52.75390625, 55.7421875, 58.73046875, 61.71875, 64.70703125, 67.6953125, 70.68359375, 73.671875, 76.66015625, 79.6484375, 82.63671875, 85.625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 12.0, 11.0, 20.0, 45.0, 59.0, 143.0, 272.0, 235.0, 99.0, 58.0, 25.0, 15.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.849494934082031, -11.527217864990234, -11.204939842224121, -10.882662773132324, -10.560384750366211, -10.238107681274414, -9.9158296585083, -9.593552589416504, -9.27127456665039, -8.948997497558594, -8.62671947479248, -8.304442405700684, -7.98216438293457, -7.659886837005615, -7.33760929107666, -7.015332221984863, -6.693054676055908, -6.370777130126953, -6.048499584197998, -5.726222038269043, -5.403944492340088, -5.081666946411133, -4.759389877319336, -4.437111854553223, -4.114834785461426, -3.7925572395324707, -3.4702796936035156, -3.1480021476745605, -2.8257246017456055, -2.5034470558166504, -2.1811697483062744, -1.8588922023773193, -1.5366144180297852, -1.21433687210083, -0.8920593857765198, -0.5697818994522095, -0.2475043535232544, 0.07477319240570068, 0.3970506191253662, 0.7193281650543213, 1.0416057109832764, 1.3638832569122314, 1.6861608028411865, 2.0084381103515625, 2.3307156562805176, 2.6529932022094727, 2.9752707481384277, 3.297548294067383, 3.619825839996338, 3.942103385925293, 4.264380931854248, 4.586658477783203, 4.908936023712158, 5.231213569641113, 5.55349063873291, 5.875768661499023, 6.19804573059082, 6.520323276519775, 6.8426008224487305, 7.1648783683776855, 7.487155914306641, 7.809433460235596, 8.13171100616455, 8.453988075256348, 8.776266098022461]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 15.0, 11.0, 18.0, 17.0, 34.0, 31.0, 34.0, 44.0, 45.0, 38.0, 49.0, 38.0, 55.0, 58.0, 57.0, 47.0, 48.0, 57.0, 58.0, 32.0, 29.0, 36.0, 38.0, 20.0, 15.0, 12.0, 10.0, 6.0, 3.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3224947452545166, -3.1939871311187744, -3.0654797554016113, -2.936972141265869, -2.808464527130127, -2.6799569129943848, -2.5514495372772217, -2.4229419231414795, -2.2944345474243164, -2.165926933288574, -2.037419557571411, -1.908911943435669, -1.7804043292999268, -1.6518968343734741, -1.5233893394470215, -1.3948817253112793, -1.266374111175537, -1.1378666162490845, -1.0093590021133423, -0.8808515071868896, -0.7523439526557922, -0.6238363981246948, -0.4953289031982422, -0.3668213486671448, -0.23831379413604736, -0.10980625450611115, 0.018701285123825073, 0.1472088098526001, 0.2757163643836975, 0.4042239189147949, 0.5327314138412476, 0.661238968372345, 0.7897462844848633, 0.9182538390159607, 1.046761393547058, 1.1752688884735107, 1.303776502609253, 1.4322839975357056, 1.5607914924621582, 1.6892991065979004, 1.817806601524353, 1.9463140964508057, 2.074821710586548, 2.203329086303711, 2.331836700439453, 2.4603443145751953, 2.5888519287109375, 2.7173593044281006, 2.8458669185638428, 2.974374532699585, 3.102881908416748, 3.2313895225524902, 3.3598971366882324, 3.4884047508239746, 3.6169121265411377, 3.74541974067688, 3.873927116394043, 4.002434730529785, 4.130942344665527, 4.2594499588012695, 4.3879570960998535, 4.516464710235596, 4.644972324371338, 4.77347993850708, 4.901987552642822]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 13.0, 10.0, 12.0, 11.0, 17.0, 27.0, 30.0, 37.0, 46.0, 47.0, 48.0, 65.0, 67.0, 51.0, 64.0, 43.0, 66.0, 53.0, 45.0, 35.0, 32.0, 30.0, 32.0, 28.0, 18.0, 21.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.534454345703125, -2.44781494140625, -2.361175537109375, -2.2745361328125, -2.187896728515625, -2.10125732421875, -2.014617919921875, -1.927978515625, -1.841339111328125, -1.75469970703125, -1.668060302734375, -1.5814208984375, -1.494781494140625, -1.40814208984375, -1.321502685546875, -1.23486328125, -1.148223876953125, -1.06158447265625, -0.974945068359375, -0.8883056640625, -0.801666259765625, -0.71502685546875, -0.628387451171875, -0.541748046875, -0.455108642578125, -0.36846923828125, -0.281829833984375, -0.1951904296875, -0.108551025390625, -0.02191162109375, 0.064727783203125, 0.1513671875, 0.238006591796875, 0.32464599609375, 0.411285400390625, 0.4979248046875, 0.584564208984375, 0.67120361328125, 0.757843017578125, 0.844482421875, 0.931121826171875, 1.01776123046875, 1.104400634765625, 1.1910400390625, 1.277679443359375, 1.36431884765625, 1.450958251953125, 1.53759765625, 1.624237060546875, 1.71087646484375, 1.797515869140625, 1.8841552734375, 1.970794677734375, 2.05743408203125, 2.144073486328125, 2.230712890625, 2.317352294921875, 2.40399169921875, 2.490631103515625, 2.5772705078125, 2.663909912109375, 2.75054931640625, 2.837188720703125, 2.923828125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 16.0, 10.0, 31.0, 31.0, 59.0, 106.0, 153.0, 225.0, 343.0, 578.0, 930.0, 1463.0, 2509.0, 4232.0, 7539.0, 14357.0, 31507.0, 102764.0, 662201.0, 144565.0, 38060.0, 16737.0, 8533.0, 4773.0, 2604.0, 1580.0, 966.0, 596.0, 403.0, 245.0, 150.0, 91.0, 82.0, 35.0, 27.0, 20.0, 12.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.58154296875, -4.4365234375, -4.29150390625, -4.146484375, -4.00146484375, -3.8564453125, -3.71142578125, -3.56640625, -3.42138671875, -3.2763671875, -3.13134765625, -2.986328125, -2.84130859375, -2.6962890625, -2.55126953125, -2.40625, -2.26123046875, -2.1162109375, -1.97119140625, -1.826171875, -1.68115234375, -1.5361328125, -1.39111328125, -1.24609375, -1.10107421875, -0.9560546875, -0.81103515625, -0.666015625, -0.52099609375, -0.3759765625, -0.23095703125, -0.0859375, 0.05908203125, 0.2041015625, 0.34912109375, 0.494140625, 0.63916015625, 0.7841796875, 0.92919921875, 1.07421875, 1.21923828125, 1.3642578125, 1.50927734375, 1.654296875, 1.79931640625, 1.9443359375, 2.08935546875, 2.234375, 2.37939453125, 2.5244140625, 2.66943359375, 2.814453125, 2.95947265625, 3.1044921875, 3.24951171875, 3.39453125, 3.53955078125, 3.6845703125, 3.82958984375, 3.974609375, 4.11962890625, 4.2646484375, 4.40966796875, 4.5546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 6.0, 14.0, 13.0, 16.0, 26.0, 17.0, 27.0, 27.0, 36.0, 30.0, 39.0, 38.0, 63.0, 81.0, 124.0, 283.0, 1510.0, 157.0, 92.0, 82.0, 50.0, 34.0, 38.0, 39.0, 24.0, 27.0, 23.0, 14.0, 17.0, 12.0, 13.0, 7.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.37890625, -7.1424560546875, -6.906005859375, -6.6695556640625, -6.43310546875, -6.1966552734375, -5.960205078125, -5.7237548828125, -5.4873046875, -5.2508544921875, -5.014404296875, -4.7779541015625, -4.54150390625, -4.3050537109375, -4.068603515625, -3.8321533203125, -3.595703125, -3.3592529296875, -3.122802734375, -2.8863525390625, -2.64990234375, -2.4134521484375, -2.177001953125, -1.9405517578125, -1.7041015625, -1.4676513671875, -1.231201171875, -0.9947509765625, -0.75830078125, -0.5218505859375, -0.285400390625, -0.0489501953125, 0.1875, 0.4239501953125, 0.660400390625, 0.8968505859375, 1.13330078125, 1.3697509765625, 1.606201171875, 1.8426513671875, 2.0791015625, 2.3155517578125, 2.552001953125, 2.7884521484375, 3.02490234375, 3.2613525390625, 3.497802734375, 3.7342529296875, 3.970703125, 4.2071533203125, 4.443603515625, 4.6800537109375, 4.91650390625, 5.1529541015625, 5.389404296875, 5.6258544921875, 5.8623046875, 6.0987548828125, 6.335205078125, 6.5716552734375, 6.80810546875, 7.0445556640625, 7.281005859375, 7.5174560546875, 7.75390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 9.0, 15.0, 19.0, 24.0, 42.0, 50.0, 90.0, 186.0, 425.0, 1079.0, 3521.0, 17145.0, 231829.0, 2807588.0, 71138.0, 8981.0, 2133.0, 731.0, 310.0, 134.0, 68.0, 44.0, 38.0, 24.0, 20.0, 8.0, 8.0, 9.0, 6.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1787109375, -14.708984375, -14.2392578125, -13.76953125, -13.2998046875, -12.830078125, -12.3603515625, -11.890625, -11.4208984375, -10.951171875, -10.4814453125, -10.01171875, -9.5419921875, -9.072265625, -8.6025390625, -8.1328125, -7.6630859375, -7.193359375, -6.7236328125, -6.25390625, -5.7841796875, -5.314453125, -4.8447265625, -4.375, -3.9052734375, -3.435546875, -2.9658203125, -2.49609375, -2.0263671875, -1.556640625, -1.0869140625, -0.6171875, -0.1474609375, 0.322265625, 0.7919921875, 1.26171875, 1.7314453125, 2.201171875, 2.6708984375, 3.140625, 3.6103515625, 4.080078125, 4.5498046875, 5.01953125, 5.4892578125, 5.958984375, 6.4287109375, 6.8984375, 7.3681640625, 7.837890625, 8.3076171875, 8.77734375, 9.2470703125, 9.716796875, 10.1865234375, 10.65625, 11.1259765625, 11.595703125, 12.0654296875, 12.53515625, 13.0048828125, 13.474609375, 13.9443359375, 14.4140625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 28.0, 102.0, 205.0, 336.0, 230.0, 79.0, 19.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.266178131103516, -27.768829345703125, -26.271480560302734, -24.774133682250977, -23.276784896850586, -21.779436111450195, -20.282089233398438, -18.784740447998047, -17.287391662597656, -15.790042877197266, -14.292695045471191, -12.795347213745117, -11.297998428344727, -9.800649642944336, -8.303301811218262, -6.8059539794921875, -5.308605194091797, -3.8112568855285645, -2.313908576965332, -0.8165602684020996, 0.6807880401611328, 2.1781363487243652, 3.6754846572875977, 5.172832489013672, 6.6701812744140625, 8.167530059814453, 9.664877891540527, 11.162225723266602, 12.659574508666992, 14.156923294067383, 15.654271125793457, 17.15161895751953, 18.648971557617188, 20.146320343017578, 21.64366912841797, 23.141016006469727, 24.638364791870117, 26.135713577270508, 27.633060455322266, 29.130409240722656, 30.627758026123047, 32.12510681152344, 33.62245559692383, 35.11980438232422, 36.617149353027344, 38.114498138427734, 39.611846923828125, 41.109195709228516, 42.606544494628906, 44.1038932800293, 45.60124206542969, 47.09859085083008, 48.59593963623047, 50.093284606933594, 51.590633392333984, 53.087982177734375, 54.585330963134766, 56.082679748535156, 57.58002853393555, 59.07737731933594, 60.57472229003906, 62.07207107543945, 63.569419860839844, 65.0667724609375, 66.56411743164062]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 8.0, 4.0, 7.0, 12.0, 18.0, 17.0, 18.0, 22.0, 22.0, 36.0, 26.0, 38.0, 43.0, 42.0, 37.0, 41.0, 43.0, 56.0, 60.0, 47.0, 41.0, 35.0, 51.0, 49.0, 29.0, 34.0, 30.0, 25.0, 23.0, 21.0, 13.0, 18.0, 6.0, 4.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.179262161254883, -21.414167404174805, -20.649070739746094, -19.883975982666016, -19.118881225585938, -18.35378646850586, -17.58868980407715, -16.82359504699707, -16.05849838256836, -15.293402671813965, -14.528307914733887, -13.763212203979492, -12.998117446899414, -12.23302173614502, -11.467926025390625, -10.702831268310547, -9.937736511230469, -9.172640800476074, -8.407546043395996, -7.642450332641602, -6.877355098724365, -6.112259864807129, -5.347164154052734, -4.582068920135498, -3.8169736862182617, -3.0518784523010254, -2.28678297996521, -1.5216875076293945, -0.7565922737121582, 0.008502960205078125, 0.7735986709594727, 1.538693904876709, 2.3037891387939453, 3.0688843727111816, 3.833979845046997, 4.5990753173828125, 5.364170551300049, 6.129265785217285, 6.89436149597168, 7.659456729888916, 8.424551963806152, 9.189647674560547, 9.954742431640625, 10.71983814239502, 11.484933853149414, 12.250028610229492, 13.015124320983887, 13.780220031738281, 14.54531478881836, 15.310410499572754, 16.07550621032715, 16.840600967407227, 17.605695724487305, 18.370792388916016, 19.135887145996094, 19.900981903076172, 20.66607666015625, 21.431171417236328, 22.19626808166504, 22.961362838745117, 23.726457595825195, 24.491554260253906, 25.256649017333984, 26.021743774414062, 26.786840438842773]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 15.0, 12.0, 18.0, 27.0, 34.0, 35.0, 49.0, 53.0, 45.0, 64.0, 62.0, 51.0, 37.0, 76.0, 48.0, 44.0, 49.0, 37.0, 35.0, 27.0, 34.0, 20.0, 21.0, 24.0, 11.0, 11.0, 5.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.248016357421875, -2.16204833984375, -2.076080322265625, -1.9901123046875, -1.904144287109375, -1.81817626953125, -1.732208251953125, -1.646240234375, -1.560272216796875, -1.47430419921875, -1.388336181640625, -1.3023681640625, -1.216400146484375, -1.13043212890625, -1.044464111328125, -0.95849609375, -0.872528076171875, -0.78656005859375, -0.700592041015625, -0.6146240234375, -0.528656005859375, -0.44268798828125, -0.356719970703125, -0.270751953125, -0.184783935546875, -0.09881591796875, -0.012847900390625, 0.0731201171875, 0.159088134765625, 0.24505615234375, 0.331024169921875, 0.4169921875, 0.502960205078125, 0.58892822265625, 0.674896240234375, 0.7608642578125, 0.846832275390625, 0.93280029296875, 1.018768310546875, 1.104736328125, 1.190704345703125, 1.27667236328125, 1.362640380859375, 1.4486083984375, 1.534576416015625, 1.62054443359375, 1.706512451171875, 1.79248046875, 1.878448486328125, 1.96441650390625, 2.050384521484375, 2.1363525390625, 2.222320556640625, 2.30828857421875, 2.394256591796875, 2.480224609375, 2.566192626953125, 2.65216064453125, 2.738128662109375, 2.8240966796875, 2.910064697265625, 2.99603271484375, 3.082000732421875, 3.16796875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 11.0, 17.0, 17.0, 37.0, 53.0, 82.0, 124.0, 190.0, 289.0, 456.0, 689.0, 1075.0, 1680.0, 2800.0, 4438.0, 7328.0, 12669.0, 22339.0, 42740.0, 98970.0, 535661.0, 2602756.0, 648047.0, 108012.0, 44733.0, 23310.0, 13796.0, 8214.0, 4903.0, 3168.0, 2009.0, 1282.0, 776.0, 531.0, 351.0, 221.0, 158.0, 121.0, 58.0, 45.0, 32.0, 29.0, 13.0, 13.0, 13.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.27734375, -4.1220703125, -3.966796875, -3.8115234375, -3.65625, -3.5009765625, -3.345703125, -3.1904296875, -3.03515625, -2.8798828125, -2.724609375, -2.5693359375, -2.4140625, -2.2587890625, -2.103515625, -1.9482421875, -1.79296875, -1.6376953125, -1.482421875, -1.3271484375, -1.171875, -1.0166015625, -0.861328125, -0.7060546875, -0.55078125, -0.3955078125, -0.240234375, -0.0849609375, 0.0703125, 0.2255859375, 0.380859375, 0.5361328125, 0.69140625, 0.8466796875, 1.001953125, 1.1572265625, 1.3125, 1.4677734375, 1.623046875, 1.7783203125, 1.93359375, 2.0888671875, 2.244140625, 2.3994140625, 2.5546875, 2.7099609375, 2.865234375, 3.0205078125, 3.17578125, 3.3310546875, 3.486328125, 3.6416015625, 3.796875, 3.9521484375, 4.107421875, 4.2626953125, 4.41796875, 4.5732421875, 4.728515625, 4.8837890625, 5.0390625, 5.1943359375, 5.349609375, 5.5048828125, 5.66015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 16.0, 17.0, 14.0, 24.0, 35.0, 41.0, 48.0, 66.0, 78.0, 121.0, 173.0, 325.0, 501.0, 687.0, 589.0, 434.0, 211.0, 161.0, 104.0, 88.0, 71.0, 46.0, 46.0, 35.0, 25.0, 23.0, 10.0, 15.0, 11.0, 5.0, 6.0, 8.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.629150390625, -5.42626953125, -5.223388671875, -5.0205078125, -4.817626953125, -4.61474609375, -4.411865234375, -4.208984375, -4.006103515625, -3.80322265625, -3.600341796875, -3.3974609375, -3.194580078125, -2.99169921875, -2.788818359375, -2.5859375, -2.383056640625, -2.18017578125, -1.977294921875, -1.7744140625, -1.571533203125, -1.36865234375, -1.165771484375, -0.962890625, -0.760009765625, -0.55712890625, -0.354248046875, -0.1513671875, 0.051513671875, 0.25439453125, 0.457275390625, 0.66015625, 0.863037109375, 1.06591796875, 1.268798828125, 1.4716796875, 1.674560546875, 1.87744140625, 2.080322265625, 2.283203125, 2.486083984375, 2.68896484375, 2.891845703125, 3.0947265625, 3.297607421875, 3.50048828125, 3.703369140625, 3.90625, 4.109130859375, 4.31201171875, 4.514892578125, 4.7177734375, 4.920654296875, 5.12353515625, 5.326416015625, 5.529296875, 5.732177734375, 5.93505859375, 6.137939453125, 6.3408203125, 6.543701171875, 6.74658203125, 6.949462890625, 7.15234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 13.0, 11.0, 20.0, 46.0, 67.0, 77.0, 125.0, 224.0, 319.0, 571.0, 922.0, 1672.0, 2929.0, 5010.0, 9760.0, 18857.0, 40894.0, 96712.0, 311018.0, 2355993.0, 1037543.0, 182851.0, 67346.0, 29606.0, 14601.0, 7406.0, 4163.0, 2253.0, 1276.0, 784.0, 471.0, 287.0, 154.0, 109.0, 66.0, 41.0, 34.0, 18.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.453125, -7.21875, -6.984375, -6.75, -6.515625, -6.28125, -6.046875, -5.8125, -5.578125, -5.34375, -5.109375, -4.875, -4.640625, -4.40625, -4.171875, -3.9375, -3.703125, -3.46875, -3.234375, -3.0, -2.765625, -2.53125, -2.296875, -2.0625, -1.828125, -1.59375, -1.359375, -1.125, -0.890625, -0.65625, -0.421875, -0.1875, 0.046875, 0.28125, 0.515625, 0.75, 0.984375, 1.21875, 1.453125, 1.6875, 1.921875, 2.15625, 2.390625, 2.625, 2.859375, 3.09375, 3.328125, 3.5625, 3.796875, 4.03125, 4.265625, 4.5, 4.734375, 4.96875, 5.203125, 5.4375, 5.671875, 5.90625, 6.140625, 6.375, 6.609375, 6.84375, 7.078125, 7.3125, 7.546875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 10.0, 8.0, 32.0, 55.0, 127.0, 185.0, 248.0, 165.0, 102.0, 41.0, 19.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3114242553711, -92.07685089111328, -89.84226989746094, -87.60769653320312, -85.37312316894531, -83.1385498046875, -80.90396881103516, -78.66939544677734, -76.434814453125, -74.20024108886719, -71.96566009521484, -69.73108673095703, -67.49651336669922, -65.26193237304688, -63.02735900878906, -60.79278564453125, -58.55821228027344, -56.32363510131836, -54.08906173706055, -51.85448455810547, -49.619911193847656, -47.38533401489258, -45.1507568359375, -42.91618347167969, -40.68160629272461, -38.44702911376953, -36.21245574951172, -33.97787857055664, -31.743303298950195, -29.50872802734375, -27.274150848388672, -25.039575576782227, -22.804996490478516, -20.57042121887207, -18.335845947265625, -16.101268768310547, -13.866693496704102, -11.632118225097656, -9.397541999816895, -7.162965774536133, -4.9283905029296875, -2.693814754486084, -0.45923900604248047, 1.775336742401123, 4.009912490844727, 6.244487762451172, 8.479063987731934, 10.713640213012695, 12.94821548461914, 15.182790756225586, 17.41736602783203, 19.65194320678711, 21.886518478393555, 24.12109375, 26.355670928955078, 28.590246200561523, 30.82482147216797, 33.05939865112305, 35.29397201538086, 37.52854919433594, 39.76312255859375, 41.99769973754883, 44.232276916503906, 46.46685028076172, 48.7014274597168]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 7.0, 10.0, 21.0, 18.0, 23.0, 22.0, 26.0, 29.0, 30.0, 27.0, 28.0, 35.0, 36.0, 40.0, 28.0, 36.0, 39.0, 47.0, 50.0, 42.0, 40.0, 32.0, 35.0, 31.0, 35.0, 30.0, 38.0, 24.0, 18.0, 20.0, 26.0, 16.0, 8.0, 10.0, 10.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03443717956543, -20.38628578186035, -19.738136291503906, -19.089984893798828, -18.441835403442383, -17.793684005737305, -17.14553451538086, -16.49738311767578, -15.849231719970703, -15.201081275939941, -14.55293083190918, -13.904779434204102, -13.25662899017334, -12.608478546142578, -11.960328102111816, -11.312177658081055, -10.664027214050293, -10.015876770019531, -9.36772632598877, -8.719575881958008, -8.07142448425293, -7.423274040222168, -6.775123596191406, -6.126972675323486, -5.478822231292725, -4.830671787261963, -4.182520866394043, -3.5343704223632812, -2.8862197399139404, -2.2380690574645996, -1.589918613433838, -0.941767692565918, -0.29361724853515625, 0.3545333743095398, 1.0026839971542358, 1.650834560394287, 2.298985242843628, 2.9471359252929688, 3.5952863693237305, 4.24343729019165, 4.891587734222412, 5.539738178253174, 6.187889099121094, 6.8360395431518555, 7.484189987182617, 8.132341384887695, 8.78049087524414, 9.428642272949219, 10.07679271697998, 10.724943161010742, 11.373093605041504, 12.021244049072266, 12.669395446777344, 13.317545890808105, 13.965696334838867, 14.613847732543945, 15.26199722290039, 15.910147666931152, 16.558298110961914, 17.206449508666992, 17.854598999023438, 18.502750396728516, 19.150901794433594, 19.79905128479004, 20.447202682495117]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 13.0, 6.0, 13.0, 17.0, 13.0, 20.0, 20.0, 20.0, 40.0, 43.0, 36.0, 48.0, 58.0, 51.0, 55.0, 44.0, 53.0, 54.0, 47.0, 59.0, 39.0, 38.0, 23.0, 31.0, 22.0, 19.0, 21.0, 22.0, 23.0, 15.0, 10.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.123443603515625, -2.04180908203125, -1.960174560546875, -1.8785400390625, -1.796905517578125, -1.71527099609375, -1.633636474609375, -1.552001953125, -1.470367431640625, -1.38873291015625, -1.307098388671875, -1.2254638671875, -1.143829345703125, -1.06219482421875, -0.980560302734375, -0.89892578125, -0.817291259765625, -0.73565673828125, -0.654022216796875, -0.5723876953125, -0.490753173828125, -0.40911865234375, -0.327484130859375, -0.245849609375, -0.164215087890625, -0.08258056640625, -0.000946044921875, 0.0806884765625, 0.162322998046875, 0.24395751953125, 0.325592041015625, 0.4072265625, 0.488861083984375, 0.57049560546875, 0.652130126953125, 0.7337646484375, 0.815399169921875, 0.89703369140625, 0.978668212890625, 1.060302734375, 1.141937255859375, 1.22357177734375, 1.305206298828125, 1.3868408203125, 1.468475341796875, 1.55010986328125, 1.631744384765625, 1.71337890625, 1.795013427734375, 1.87664794921875, 1.958282470703125, 2.0399169921875, 2.121551513671875, 2.20318603515625, 2.284820556640625, 2.366455078125, 2.448089599609375, 2.52972412109375, 2.611358642578125, 2.6929931640625, 2.774627685546875, 2.85626220703125, 2.937896728515625, 3.01953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 9.0, 16.0, 37.0, 31.0, 55.0, 72.0, 129.0, 147.0, 192.0, 322.0, 492.0, 806.0, 1150.0, 1944.0, 3118.0, 5366.0, 9822.0, 20704.0, 55785.0, 376680.0, 463896.0, 60640.0, 22340.0, 10489.0, 5499.0, 3235.0, 1901.0, 1209.0, 747.0, 532.0, 342.0, 269.0, 175.0, 123.0, 73.0, 69.0, 29.0, 25.0, 21.0, 20.0, 13.0, 7.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.640625, -13.1865234375, -12.732421875, -12.2783203125, -11.82421875, -11.3701171875, -10.916015625, -10.4619140625, -10.0078125, -9.5537109375, -9.099609375, -8.6455078125, -8.19140625, -7.7373046875, -7.283203125, -6.8291015625, -6.375, -5.9208984375, -5.466796875, -5.0126953125, -4.55859375, -4.1044921875, -3.650390625, -3.1962890625, -2.7421875, -2.2880859375, -1.833984375, -1.3798828125, -0.92578125, -0.4716796875, -0.017578125, 0.4365234375, 0.890625, 1.3447265625, 1.798828125, 2.2529296875, 2.70703125, 3.1611328125, 3.615234375, 4.0693359375, 4.5234375, 4.9775390625, 5.431640625, 5.8857421875, 6.33984375, 6.7939453125, 7.248046875, 7.7021484375, 8.15625, 8.6103515625, 9.064453125, 9.5185546875, 9.97265625, 10.4267578125, 10.880859375, 11.3349609375, 11.7890625, 12.2431640625, 12.697265625, 13.1513671875, 13.60546875, 14.0595703125, 14.513671875, 14.9677734375, 15.421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 6.0, 15.0, 11.0, 19.0, 19.0, 25.0, 29.0, 23.0, 39.0, 41.0, 42.0, 44.0, 40.0, 63.0, 58.0, 1073.0, 45.0, 53.0, 59.0, 46.0, 41.0, 42.0, 29.0, 33.0, 24.0, 17.0, 17.0, 14.0, 8.0, 14.0, 7.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.380706787109375, -2.30633544921875, -2.231964111328125, -2.1575927734375, -2.083221435546875, -2.00885009765625, -1.934478759765625, -1.860107421875, -1.785736083984375, -1.71136474609375, -1.636993408203125, -1.5626220703125, -1.488250732421875, -1.41387939453125, -1.339508056640625, -1.26513671875, -1.190765380859375, -1.11639404296875, -1.042022705078125, -0.9676513671875, -0.893280029296875, -0.81890869140625, -0.744537353515625, -0.670166015625, -0.595794677734375, -0.52142333984375, -0.447052001953125, -0.3726806640625, -0.298309326171875, -0.22393798828125, -0.149566650390625, -0.0751953125, -0.000823974609375, 0.07354736328125, 0.147918701171875, 0.2222900390625, 0.296661376953125, 0.37103271484375, 0.445404052734375, 0.519775390625, 0.594146728515625, 0.66851806640625, 0.742889404296875, 0.8172607421875, 0.891632080078125, 0.96600341796875, 1.040374755859375, 1.11474609375, 1.189117431640625, 1.26348876953125, 1.337860107421875, 1.4122314453125, 1.486602783203125, 1.56097412109375, 1.635345458984375, 1.709716796875, 1.784088134765625, 1.85845947265625, 1.932830810546875, 2.0072021484375, 2.081573486328125, 2.15594482421875, 2.230316162109375, 2.3046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 10.0, 16.0, 24.0, 46.0, 74.0, 104.0, 148.0, 200.0, 316.0, 499.0, 739.0, 1225.0, 1936.0, 3985.0, 10746.0, 58438.0, 1918795.0, 77153.0, 12217.0, 4529.0, 2237.0, 1244.0, 731.0, 534.0, 392.0, 272.0, 149.0, 129.0, 64.0, 40.0, 25.0, 25.0, 11.0, 14.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.703125, -24.888427734375, -24.07373046875, -23.259033203125, -22.4443359375, -21.629638671875, -20.81494140625, -20.000244140625, -19.185546875, -18.370849609375, -17.55615234375, -16.741455078125, -15.9267578125, -15.112060546875, -14.29736328125, -13.482666015625, -12.66796875, -11.853271484375, -11.03857421875, -10.223876953125, -9.4091796875, -8.594482421875, -7.77978515625, -6.965087890625, -6.150390625, -5.335693359375, -4.52099609375, -3.706298828125, -2.8916015625, -2.076904296875, -1.26220703125, -0.447509765625, 0.3671875, 1.181884765625, 1.99658203125, 2.811279296875, 3.6259765625, 4.440673828125, 5.25537109375, 6.070068359375, 6.884765625, 7.699462890625, 8.51416015625, 9.328857421875, 10.1435546875, 10.958251953125, 11.77294921875, 12.587646484375, 13.40234375, 14.217041015625, 15.03173828125, 15.846435546875, 16.6611328125, 17.475830078125, 18.29052734375, 19.105224609375, 19.919921875, 20.734619140625, 21.54931640625, 22.364013671875, 23.1787109375, 23.993408203125, 24.80810546875, 25.622802734375, 26.4375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 42.0, 117.0, 425.0, 269.0, 67.0, 21.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.64306640625, -6.3955078125, -6.14794921875, -5.900390625, -5.65283203125, -5.4052734375, -5.15771484375, -4.91015625, -4.66259765625, -4.4150390625, -4.16748046875, -3.919921875, -3.67236328125, -3.4248046875, -3.17724609375, -2.9296875, -2.68212890625, -2.4345703125, -2.18701171875, -1.939453125, -1.69189453125, -1.4443359375, -1.19677734375, -0.94921875, -0.70166015625, -0.4541015625, -0.20654296875, 0.041015625, 0.28857421875, 0.5361328125, 0.78369140625, 1.03125, 1.27880859375, 1.5263671875, 1.77392578125, 2.021484375, 2.26904296875, 2.5166015625, 2.76416015625, 3.01171875, 3.25927734375, 3.5068359375, 3.75439453125, 4.001953125, 4.24951171875, 4.4970703125, 4.74462890625, 4.9921875, 5.23974609375, 5.4873046875, 5.73486328125, 5.982421875, 6.22998046875, 6.4775390625, 6.72509765625, 6.97265625, 7.22021484375, 7.4677734375, 7.71533203125, 7.962890625, 8.21044921875, 8.4580078125, 8.70556640625, 8.953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 17.0, 25.0, 33.0, 102.0, 496.0, 2862.0, 47850.0, 991885.0, 4212.0, 755.0, 152.0, 40.0, 23.0, 15.0, 11.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-140.625, -136.73046875, -132.8359375, -128.94140625, -125.046875, -121.15234375, -117.2578125, -113.36328125, -109.46875, -105.57421875, -101.6796875, -97.78515625, -93.890625, -89.99609375, -86.1015625, -82.20703125, -78.3125, -74.41796875, -70.5234375, -66.62890625, -62.734375, -58.83984375, -54.9453125, -51.05078125, -47.15625, -43.26171875, -39.3671875, -35.47265625, -31.578125, -27.68359375, -23.7890625, -19.89453125, -16.0, -12.10546875, -8.2109375, -4.31640625, -0.421875, 3.47265625, 7.3671875, 11.26171875, 15.15625, 19.05078125, 22.9453125, 26.83984375, 30.734375, 34.62890625, 38.5234375, 42.41796875, 46.3125, 50.20703125, 54.1015625, 57.99609375, 61.890625, 65.78515625, 69.6796875, 73.57421875, 77.46875, 81.36328125, 85.2578125, 89.15234375, 93.046875, 96.94140625, 100.8359375, 104.73046875, 108.625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 9.0, 13.0, 23.0, 26.0, 29.0, 54.0, 77.0, 162.0, 191.0, 126.0, 93.0, 59.0, 42.0, 15.0, 23.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.547995567321777, -8.305628776550293, -8.063262939453125, -7.820896625518799, -7.578530311584473, -7.3361639976501465, -7.09379768371582, -6.851430892944336, -6.609065055847168, -6.366698741912842, -6.124332427978516, -5.8819661140441895, -5.639599800109863, -5.397233486175537, -5.154867172241211, -4.912500381469727, -4.6701340675354, -4.427767753601074, -4.185401439666748, -3.943035125732422, -3.7006688117980957, -3.4583024978637695, -3.2159359455108643, -2.973569631576538, -2.731203317642212, -2.4888370037078857, -2.2464706897735596, -2.0041041374206543, -1.7617379426956177, -1.5193716287612915, -1.2770051956176758, -1.0346388816833496, -0.7922720909118652, -0.5499057769775391, -0.3075394034385681, -0.06517302989959717, 0.177193284034729, 0.4195595979690552, 0.6619260311126709, 0.9042923450469971, 1.1466586589813232, 1.3890249729156494, 1.6313912868499756, 1.8737577199935913, 2.116124153137207, 2.358490467071533, 2.6008567810058594, 2.8432230949401855, 3.0855894088745117, 3.327955722808838, 3.570322036743164, 3.8126883506774902, 4.055054664611816, 4.297420978546143, 4.539787292480469, 4.782154083251953, 5.024519920349121, 5.266886234283447, 5.509252548217773, 5.7516188621521, 5.993985176086426, 6.236351490020752, 6.478717803955078, 6.7210845947265625, 6.963450908660889]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 9.0, 7.0, 15.0, 10.0, 18.0, 25.0, 28.0, 25.0, 31.0, 28.0, 27.0, 27.0, 35.0, 46.0, 39.0, 39.0, 40.0, 44.0, 48.0, 43.0, 35.0, 38.0, 38.0, 33.0, 28.0, 28.0, 27.0, 17.0, 29.0, 19.0, 27.0, 17.0, 10.0, 14.0, 7.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8647117614746094, -3.7316665649414062, -3.598621368408203, -3.465576171875, -3.332530975341797, -3.1994857788085938, -3.0664408206939697, -2.9333956241607666, -2.8003504276275635, -2.6673052310943604, -2.5342600345611572, -2.401214838027954, -2.26816987991333, -2.135124683380127, -2.002079486846924, -1.8690342903137207, -1.7359890937805176, -1.6029438972473145, -1.4698987007141113, -1.3368536233901978, -1.2038084268569946, -1.0707632303237915, -0.9377180933952332, -0.8046729564666748, -0.6716277599334717, -0.5385825634002686, -0.4055374264717102, -0.27249225974082947, -0.13944709300994873, -0.0064018964767456055, 0.12664324045181274, 0.2596883773803711, 0.3927335739135742, 0.5257787704467773, 0.6588239073753357, 0.791869044303894, 0.9249142408370972, 1.0579594373703003, 1.1910045146942139, 1.324049711227417, 1.4570949077606201, 1.5901401042938232, 1.7231853008270264, 1.85623037815094, 1.989275574684143, 2.1223206520080566, 2.2553658485412598, 2.388411045074463, 2.521456241607666, 2.654501438140869, 2.7875466346740723, 2.9205918312072754, 3.0536370277404785, 3.1866822242736816, 3.3197271823883057, 3.452772378921509, 3.585817575454712, 3.718862771987915, 3.851907968521118, 3.9849531650543213, 4.117998123168945, 4.251043319702148, 4.384088516235352, 4.517133712768555, 4.650178909301758]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 10.0, 7.0, 12.0, 22.0, 19.0, 23.0, 28.0, 21.0, 33.0, 66.0, 47.0, 51.0, 53.0, 46.0, 69.0, 64.0, 55.0, 55.0, 56.0, 34.0, 39.0, 35.0, 27.0, 28.0, 22.0, 20.0, 18.0, 14.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.834686279296875, -2.73968505859375, -2.644683837890625, -2.5496826171875, -2.454681396484375, -2.35968017578125, -2.264678955078125, -2.169677734375, -2.074676513671875, -1.97967529296875, -1.884674072265625, -1.7896728515625, -1.694671630859375, -1.59967041015625, -1.504669189453125, -1.40966796875, -1.314666748046875, -1.21966552734375, -1.124664306640625, -1.0296630859375, -0.934661865234375, -0.83966064453125, -0.744659423828125, -0.649658203125, -0.554656982421875, -0.45965576171875, -0.364654541015625, -0.2696533203125, -0.174652099609375, -0.07965087890625, 0.015350341796875, 0.1103515625, 0.205352783203125, 0.30035400390625, 0.395355224609375, 0.4903564453125, 0.585357666015625, 0.68035888671875, 0.775360107421875, 0.870361328125, 0.965362548828125, 1.06036376953125, 1.155364990234375, 1.2503662109375, 1.345367431640625, 1.44036865234375, 1.535369873046875, 1.63037109375, 1.725372314453125, 1.82037353515625, 1.915374755859375, 2.0103759765625, 2.105377197265625, 2.20037841796875, 2.295379638671875, 2.390380859375, 2.485382080078125, 2.58038330078125, 2.675384521484375, 2.7703857421875, 2.865386962890625, 2.96038818359375, 3.055389404296875, 3.150390625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 25.0, 28.0, 47.0, 67.0, 115.0, 190.0, 260.0, 457.0, 706.0, 1206.0, 2049.0, 3518.0, 6397.0, 12337.0, 25738.0, 66906.0, 246401.0, 476009.0, 125749.0, 41750.0, 17990.0, 8979.0, 4929.0, 2607.0, 1598.0, 895.0, 601.0, 350.0, 235.0, 136.0, 97.0, 53.0, 42.0, 31.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.1973876953125, -3.088134765625, -2.9788818359375, -2.86962890625, -2.7603759765625, -2.651123046875, -2.5418701171875, -2.4326171875, -2.3233642578125, -2.214111328125, -2.1048583984375, -1.99560546875, -1.8863525390625, -1.777099609375, -1.6678466796875, -1.55859375, -1.4493408203125, -1.340087890625, -1.2308349609375, -1.12158203125, -1.0123291015625, -0.903076171875, -0.7938232421875, -0.6845703125, -0.5753173828125, -0.466064453125, -0.3568115234375, -0.24755859375, -0.1383056640625, -0.029052734375, 0.0802001953125, 0.189453125, 0.2987060546875, 0.407958984375, 0.5172119140625, 0.62646484375, 0.7357177734375, 0.844970703125, 0.9542236328125, 1.0634765625, 1.1727294921875, 1.281982421875, 1.3912353515625, 1.50048828125, 1.6097412109375, 1.718994140625, 1.8282470703125, 1.9375, 2.0467529296875, 2.156005859375, 2.2652587890625, 2.37451171875, 2.4837646484375, 2.593017578125, 2.7022705078125, 2.8115234375, 2.9207763671875, 3.030029296875, 3.1392822265625, 3.24853515625, 3.3577880859375, 3.467041015625, 3.5762939453125, 3.685546875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 10.0, 14.0, 7.0, 8.0, 9.0, 15.0, 19.0, 20.0, 13.0, 33.0, 24.0, 35.0, 32.0, 52.0, 56.0, 65.0, 94.0, 193.0, 1406.0, 330.0, 149.0, 81.0, 62.0, 51.0, 35.0, 35.0, 29.0, 29.0, 22.0, 23.0, 21.0, 11.0, 13.0, 11.0, 7.0, 3.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7589111328125, -6.486572265625, -6.2142333984375, -5.94189453125, -5.6695556640625, -5.397216796875, -5.1248779296875, -4.8525390625, -4.5802001953125, -4.307861328125, -4.0355224609375, -3.76318359375, -3.4908447265625, -3.218505859375, -2.9461669921875, -2.673828125, -2.4014892578125, -2.129150390625, -1.8568115234375, -1.58447265625, -1.3121337890625, -1.039794921875, -0.7674560546875, -0.4951171875, -0.2227783203125, 0.049560546875, 0.3218994140625, 0.59423828125, 0.8665771484375, 1.138916015625, 1.4112548828125, 1.68359375, 1.9559326171875, 2.228271484375, 2.5006103515625, 2.77294921875, 3.0452880859375, 3.317626953125, 3.5899658203125, 3.8623046875, 4.1346435546875, 4.406982421875, 4.6793212890625, 4.95166015625, 5.2239990234375, 5.496337890625, 5.7686767578125, 6.041015625, 6.3133544921875, 6.585693359375, 6.8580322265625, 7.13037109375, 7.4027099609375, 7.675048828125, 7.9473876953125, 8.2197265625, 8.4920654296875, 8.764404296875, 9.0367431640625, 9.30908203125, 9.5814208984375, 9.853759765625, 10.1260986328125, 10.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 14.0, 15.0, 14.0, 16.0, 18.0, 32.0, 44.0, 46.0, 61.0, 94.0, 137.0, 232.0, 461.0, 1187.0, 5278.0, 56616.0, 2670479.0, 391102.0, 15762.0, 2410.0, 680.0, 330.0, 179.0, 126.0, 91.0, 50.0, 50.0, 26.0, 25.0, 20.0, 19.0, 11.0, 15.0, 10.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-15.046875, -14.6260986328125, -14.205322265625, -13.7845458984375, -13.36376953125, -12.9429931640625, -12.522216796875, -12.1014404296875, -11.6806640625, -11.2598876953125, -10.839111328125, -10.4183349609375, -9.99755859375, -9.5767822265625, -9.156005859375, -8.7352294921875, -8.314453125, -7.8936767578125, -7.472900390625, -7.0521240234375, -6.63134765625, -6.2105712890625, -5.789794921875, -5.3690185546875, -4.9482421875, -4.5274658203125, -4.106689453125, -3.6859130859375, -3.26513671875, -2.8443603515625, -2.423583984375, -2.0028076171875, -1.58203125, -1.1612548828125, -0.740478515625, -0.3197021484375, 0.10107421875, 0.5218505859375, 0.942626953125, 1.3634033203125, 1.7841796875, 2.2049560546875, 2.625732421875, 3.0465087890625, 3.46728515625, 3.8880615234375, 4.308837890625, 4.7296142578125, 5.150390625, 5.5711669921875, 5.991943359375, 6.4127197265625, 6.83349609375, 7.2542724609375, 7.675048828125, 8.0958251953125, 8.5166015625, 8.9373779296875, 9.358154296875, 9.7789306640625, 10.19970703125, 10.6204833984375, 11.041259765625, 11.4620361328125, 11.8828125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [5.0, 445.0, 546.0, 19.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.746743202209473, -5.018730640411377, -0.29071807861328125, 4.437294960021973, 9.16530704498291, 13.893319129943848, 18.621334075927734, 23.349346160888672, 28.07735824584961, 32.80537033081055, 37.533382415771484, 42.26139831542969, 46.989410400390625, 51.71742248535156, 56.4454345703125, 61.17344665527344, 65.90145874023438, 70.62947082519531, 75.35748291015625, 80.08549499511719, 84.81350708007812, 89.54151916503906, 94.26953125, 98.99754333496094, 103.72555541992188, 108.45356750488281, 113.18157958984375, 117.90959167480469, 122.63760375976562, 127.36561584472656, 132.0936279296875, 136.82164001464844, 141.54966735839844, 146.27767944335938, 151.0056915283203, 155.73370361328125, 160.4617156982422, 165.18972778320312, 169.91773986816406, 174.645751953125, 179.37376403808594, 184.10177612304688, 188.8297882080078, 193.55780029296875, 198.2858123779297, 203.01382446289062, 207.74183654785156, 212.4698486328125, 217.1978759765625, 221.92588806152344, 226.65390014648438, 231.3819122314453, 236.10992431640625, 240.8379364013672, 245.56594848632812, 250.29396057128906, 255.02197265625, 259.75, 264.4779968261719, 269.2060241699219, 273.93402099609375, 278.66204833984375, 283.3900451660156, 288.1180725097656, 292.8460693359375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 10.0, 9.0, 14.0, 9.0, 11.0, 10.0, 13.0, 17.0, 26.0, 30.0, 29.0, 36.0, 31.0, 39.0, 41.0, 33.0, 50.0, 31.0, 32.0, 45.0, 51.0, 35.0, 49.0, 40.0, 29.0, 35.0, 25.0, 31.0, 24.0, 24.0, 31.0, 22.0, 17.0, 11.0, 13.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.77924156188965, -21.081886291503906, -20.384531021118164, -19.687175750732422, -18.989822387695312, -18.29246711730957, -17.595111846923828, -16.897756576538086, -16.200401306152344, -15.503046035766602, -14.805691719055176, -14.108336448669434, -13.410982131958008, -12.713626861572266, -12.016271591186523, -11.318916320800781, -10.621562957763672, -9.92420768737793, -9.226853370666504, -8.529498100280762, -7.832143306732178, -7.134788513183594, -6.437433242797852, -5.740078449249268, -5.042723655700684, -4.3453688621521, -3.6480138301849365, -2.9506587982177734, -2.2533040046691895, -1.5559492111206055, -0.8585939407348633, -0.1612391471862793, 0.5361175537109375, 1.233472466468811, 1.9308273792266846, 2.6281824111938477, 3.3255372047424316, 4.022891998291016, 4.720247268676758, 5.417602062225342, 6.114956855773926, 6.81231164932251, 7.509666442871094, 8.207021713256836, 8.904376983642578, 9.601731300354004, 10.299086570739746, 10.996440887451172, 11.693796157836914, 12.391151428222656, 13.088505744934082, 13.785861015319824, 14.48321533203125, 15.180570602416992, 15.877925872802734, 16.575281143188477, 17.27263641357422, 17.96999168395996, 18.667346954345703, 19.364700317382812, 20.062055587768555, 20.759410858154297, 21.45676612854004, 22.15412139892578, 22.85147476196289]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 15.0, 22.0, 15.0, 26.0, 28.0, 35.0, 30.0, 44.0, 54.0, 44.0, 45.0, 55.0, 49.0, 43.0, 58.0, 42.0, 55.0, 47.0, 41.0, 39.0, 31.0, 25.0, 28.0, 22.0, 16.0, 18.0, 19.0, 18.0, 9.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.45062255859375, -2.3621826171875, -2.27374267578125, -2.185302734375, -2.09686279296875, -2.0084228515625, -1.91998291015625, -1.83154296875, -1.74310302734375, -1.6546630859375, -1.56622314453125, -1.477783203125, -1.38934326171875, -1.3009033203125, -1.21246337890625, -1.1240234375, -1.03558349609375, -0.9471435546875, -0.85870361328125, -0.770263671875, -0.68182373046875, -0.5933837890625, -0.50494384765625, -0.41650390625, -0.32806396484375, -0.2396240234375, -0.15118408203125, -0.062744140625, 0.02569580078125, 0.1141357421875, 0.20257568359375, 0.291015625, 0.37945556640625, 0.4678955078125, 0.55633544921875, 0.644775390625, 0.73321533203125, 0.8216552734375, 0.91009521484375, 0.99853515625, 1.08697509765625, 1.1754150390625, 1.26385498046875, 1.352294921875, 1.44073486328125, 1.5291748046875, 1.61761474609375, 1.7060546875, 1.79449462890625, 1.8829345703125, 1.97137451171875, 2.059814453125, 2.14825439453125, 2.2366943359375, 2.32513427734375, 2.41357421875, 2.50201416015625, 2.5904541015625, 2.67889404296875, 2.767333984375, 2.85577392578125, 2.9442138671875, 3.03265380859375, 3.12109375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 10.0, 5.0, 7.0, 8.0, 14.0, 14.0, 33.0, 45.0, 62.0, 102.0, 172.0, 258.0, 393.0, 697.0, 1300.0, 2229.0, 4093.0, 7602.0, 14770.0, 29488.0, 68087.0, 313022.0, 2718772.0, 856636.0, 98117.0, 38020.0, 18534.0, 9578.0, 5301.0, 2836.0, 1590.0, 931.0, 547.0, 321.0, 244.0, 140.0, 94.0, 67.0, 38.0, 30.0, 16.0, 24.0, 14.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.2154541015625, -6.012939453125, -5.8104248046875, -5.60791015625, -5.4053955078125, -5.202880859375, -5.0003662109375, -4.7978515625, -4.5953369140625, -4.392822265625, -4.1903076171875, -3.98779296875, -3.7852783203125, -3.582763671875, -3.3802490234375, -3.177734375, -2.9752197265625, -2.772705078125, -2.5701904296875, -2.36767578125, -2.1651611328125, -1.962646484375, -1.7601318359375, -1.5576171875, -1.3551025390625, -1.152587890625, -0.9500732421875, -0.74755859375, -0.5450439453125, -0.342529296875, -0.1400146484375, 0.0625, 0.2650146484375, 0.467529296875, 0.6700439453125, 0.87255859375, 1.0750732421875, 1.277587890625, 1.4801025390625, 1.6826171875, 1.8851318359375, 2.087646484375, 2.2901611328125, 2.49267578125, 2.6951904296875, 2.897705078125, 3.1002197265625, 3.302734375, 3.5052490234375, 3.707763671875, 3.9102783203125, 4.11279296875, 4.3153076171875, 4.517822265625, 4.7203369140625, 4.9228515625, 5.1253662109375, 5.327880859375, 5.5303955078125, 5.73291015625, 5.9354248046875, 6.137939453125, 6.3404541015625, 6.54296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 16.0, 10.0, 21.0, 16.0, 49.0, 61.0, 74.0, 105.0, 148.0, 248.0, 491.0, 877.0, 816.0, 403.0, 208.0, 138.0, 91.0, 83.0, 58.0, 43.0, 32.0, 24.0, 16.0, 12.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.17938232421875, -5.9095458984375, -5.63970947265625, -5.369873046875, -5.10003662109375, -4.8302001953125, -4.56036376953125, -4.29052734375, -4.02069091796875, -3.7508544921875, -3.48101806640625, -3.211181640625, -2.94134521484375, -2.6715087890625, -2.40167236328125, -2.1318359375, -1.86199951171875, -1.5921630859375, -1.32232666015625, -1.052490234375, -0.78265380859375, -0.5128173828125, -0.24298095703125, 0.02685546875, 0.29669189453125, 0.5665283203125, 0.83636474609375, 1.106201171875, 1.37603759765625, 1.6458740234375, 1.91571044921875, 2.185546875, 2.45538330078125, 2.7252197265625, 2.99505615234375, 3.264892578125, 3.53472900390625, 3.8045654296875, 4.07440185546875, 4.34423828125, 4.61407470703125, 4.8839111328125, 5.15374755859375, 5.423583984375, 5.69342041015625, 5.9632568359375, 6.23309326171875, 6.5029296875, 6.77276611328125, 7.0426025390625, 7.31243896484375, 7.582275390625, 7.85211181640625, 8.1219482421875, 8.39178466796875, 8.66162109375, 8.93145751953125, 9.2012939453125, 9.47113037109375, 9.740966796875, 10.01080322265625, 10.2806396484375, 10.55047607421875, 10.8203125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 8.0, 25.0, 28.0, 56.0, 78.0, 108.0, 218.0, 492.0, 1378.0, 5216.0, 25015.0, 183040.0, 3617793.0, 315220.0, 35690.0, 6827.0, 1900.0, 572.0, 248.0, 139.0, 68.0, 49.0, 25.0, 20.0, 13.0, 12.0, 13.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.078125, -23.4700927734375, -22.862060546875, -22.2540283203125, -21.64599609375, -21.0379638671875, -20.429931640625, -19.8218994140625, -19.2138671875, -18.6058349609375, -17.997802734375, -17.3897705078125, -16.78173828125, -16.1737060546875, -15.565673828125, -14.9576416015625, -14.349609375, -13.7415771484375, -13.133544921875, -12.5255126953125, -11.91748046875, -11.3094482421875, -10.701416015625, -10.0933837890625, -9.4853515625, -8.8773193359375, -8.269287109375, -7.6612548828125, -7.05322265625, -6.4451904296875, -5.837158203125, -5.2291259765625, -4.62109375, -4.0130615234375, -3.405029296875, -2.7969970703125, -2.18896484375, -1.5809326171875, -0.972900390625, -0.3648681640625, 0.2431640625, 0.8511962890625, 1.459228515625, 2.0672607421875, 2.67529296875, 3.2833251953125, 3.891357421875, 4.4993896484375, 5.107421875, 5.7154541015625, 6.323486328125, 6.9315185546875, 7.53955078125, 8.1475830078125, 8.755615234375, 9.3636474609375, 9.9716796875, 10.5797119140625, 11.187744140625, 11.7957763671875, 12.40380859375, 13.0118408203125, 13.619873046875, 14.2279052734375, 14.8359375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 19.0, 25.0, 61.0, 87.0, 127.0, 152.0, 160.0, 102.0, 78.0, 58.0, 42.0, 31.0, 17.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-71.78440856933594, -70.34912872314453, -68.91385650634766, -67.47857666015625, -66.04330444335938, -64.60802459716797, -63.17274856567383, -61.73747253417969, -60.30219650268555, -58.866920471191406, -57.431644439697266, -55.996368408203125, -54.56108856201172, -53.12581253051758, -51.69053649902344, -50.2552604675293, -48.819984436035156, -47.384708404541016, -45.949432373046875, -44.514156341552734, -43.078880310058594, -41.64360046386719, -40.20832443237305, -38.773048400878906, -37.337772369384766, -35.902496337890625, -34.467220306396484, -33.031944274902344, -31.59666633605957, -30.16139030456543, -28.726112365722656, -27.290836334228516, -25.85555648803711, -24.42028045654297, -22.985004425048828, -21.549726486206055, -20.114450454711914, -18.679174423217773, -17.243896484375, -15.80862045288086, -14.373344421386719, -12.938068389892578, -11.502791404724121, -10.067514419555664, -8.632238388061523, -7.196961879730225, -5.761685371398926, -4.326408386230469, -2.891132354736328, -1.4558558464050293, -0.02057933807373047, 1.4146971702575684, 2.849973678588867, 4.285250186920166, 5.720526695251465, 7.155803680419922, 8.591079711914062, 10.026355743408203, 11.46163272857666, 12.896909713745117, 14.332185745239258, 15.767461776733398, 17.202739715576172, 18.638015747070312, 20.073291778564453]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 12.0, 6.0, 16.0, 14.0, 12.0, 16.0, 22.0, 25.0, 18.0, 24.0, 35.0, 35.0, 33.0, 45.0, 52.0, 38.0, 34.0, 42.0, 47.0, 46.0, 45.0, 34.0, 43.0, 38.0, 31.0, 30.0, 24.0, 20.0, 26.0, 18.0, 18.0, 15.0, 13.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.072383880615234, -20.38842010498047, -19.704458236694336, -19.02049446105957, -18.336532592773438, -17.652568817138672, -16.968605041503906, -16.284643173217773, -15.600679397583008, -14.916716575622559, -14.23275375366211, -13.548789978027344, -12.864827156066895, -12.180864334106445, -11.496901512145996, -10.812938690185547, -10.128975868225098, -9.445013046264648, -8.7610502243042, -8.07708740234375, -7.393123626708984, -6.709160804748535, -6.025197982788086, -5.3412346839904785, -4.657271862030029, -3.973308801651001, -3.2893457412719727, -2.6053829193115234, -1.9214198589324951, -1.2374567985534668, -0.5534939765930176, 0.13046932220458984, 0.8144321441650391, 1.4983952045440674, 2.1823582649230957, 2.866321086883545, 3.5502841472625732, 4.234247207641602, 4.918210029602051, 5.602173328399658, 6.286136150360107, 6.970098972320557, 7.654062271118164, 8.338025093078613, 9.021987915039062, 9.705951690673828, 10.389913558959961, 11.073877334594727, 11.757840156555176, 12.441802978515625, 13.125765800476074, 13.809728622436523, 14.493692398071289, 15.177655220031738, 15.861618041992188, 16.545581817626953, 17.229543685913086, 17.91350746154785, 18.597469329833984, 19.28143310546875, 19.965394973754883, 20.64935874938965, 21.33332061767578, 22.017284393310547, 22.701248168945312]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 9.0, 12.0, 21.0, 22.0, 33.0, 29.0, 31.0, 26.0, 41.0, 42.0, 46.0, 38.0, 50.0, 43.0, 49.0, 42.0, 36.0, 36.0, 43.0, 37.0, 39.0, 38.0, 41.0, 20.0, 20.0, 23.0, 10.0, 15.0, 13.0, 13.0, 19.0, 11.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.01641845703125, -1.9410400390625, -1.86566162109375, -1.790283203125, -1.71490478515625, -1.6395263671875, -1.56414794921875, -1.48876953125, -1.41339111328125, -1.3380126953125, -1.26263427734375, -1.187255859375, -1.11187744140625, -1.0364990234375, -0.96112060546875, -0.8857421875, -0.81036376953125, -0.7349853515625, -0.65960693359375, -0.584228515625, -0.50885009765625, -0.4334716796875, -0.35809326171875, -0.28271484375, -0.20733642578125, -0.1319580078125, -0.05657958984375, 0.018798828125, 0.09417724609375, 0.1695556640625, 0.24493408203125, 0.3203125, 0.39569091796875, 0.4710693359375, 0.54644775390625, 0.621826171875, 0.69720458984375, 0.7725830078125, 0.84796142578125, 0.92333984375, 0.99871826171875, 1.0740966796875, 1.14947509765625, 1.224853515625, 1.30023193359375, 1.3756103515625, 1.45098876953125, 1.5263671875, 1.60174560546875, 1.6771240234375, 1.75250244140625, 1.827880859375, 1.90325927734375, 1.9786376953125, 2.05401611328125, 2.12939453125, 2.20477294921875, 2.2801513671875, 2.35552978515625, 2.430908203125, 2.50628662109375, 2.5816650390625, 2.65704345703125, 2.732421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 9.0, 21.0, 34.0, 41.0, 70.0, 107.0, 125.0, 202.0, 280.0, 413.0, 605.0, 861.0, 1276.0, 1938.0, 2866.0, 4366.0, 6850.0, 10855.0, 18139.0, 31267.0, 61641.0, 279036.0, 471134.0, 70173.0, 34022.0, 19223.0, 11804.0, 7232.0, 4612.0, 3025.0, 1917.0, 1341.0, 889.0, 683.0, 427.0, 301.0, 215.0, 161.0, 105.0, 71.0, 63.0, 41.0, 29.0, 19.0, 13.0, 11.0, 7.0, 0.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.8828125, -9.5428466796875, -9.202880859375, -8.8629150390625, -8.52294921875, -8.1829833984375, -7.843017578125, -7.5030517578125, -7.1630859375, -6.8231201171875, -6.483154296875, -6.1431884765625, -5.80322265625, -5.4632568359375, -5.123291015625, -4.7833251953125, -4.443359375, -4.1033935546875, -3.763427734375, -3.4234619140625, -3.08349609375, -2.7435302734375, -2.403564453125, -2.0635986328125, -1.7236328125, -1.3836669921875, -1.043701171875, -0.7037353515625, -0.36376953125, -0.0238037109375, 0.316162109375, 0.6561279296875, 0.99609375, 1.3360595703125, 1.676025390625, 2.0159912109375, 2.35595703125, 2.6959228515625, 3.035888671875, 3.3758544921875, 3.7158203125, 4.0557861328125, 4.395751953125, 4.7357177734375, 5.07568359375, 5.4156494140625, 5.755615234375, 6.0955810546875, 6.435546875, 6.7755126953125, 7.115478515625, 7.4554443359375, 7.79541015625, 8.1353759765625, 8.475341796875, 8.8153076171875, 9.1552734375, 9.4952392578125, 9.835205078125, 10.1751708984375, 10.51513671875, 10.8551025390625, 11.195068359375, 11.5350341796875, 11.875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 13.0, 14.0, 11.0, 18.0, 11.0, 20.0, 19.0, 32.0, 41.0, 28.0, 41.0, 31.0, 48.0, 46.0, 45.0, 47.0, 1062.0, 48.0, 33.0, 30.0, 36.0, 41.0, 29.0, 33.0, 24.0, 30.0, 23.0, 19.0, 24.0, 18.0, 11.0, 8.0, 9.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.78515625, -1.7266693115234375, -1.668182373046875, -1.6096954345703125, -1.55120849609375, -1.4927215576171875, -1.434234619140625, -1.3757476806640625, -1.3172607421875, -1.2587738037109375, -1.200286865234375, -1.1417999267578125, -1.08331298828125, -1.0248260498046875, -0.966339111328125, -0.9078521728515625, -0.849365234375, -0.7908782958984375, -0.732391357421875, -0.6739044189453125, -0.61541748046875, -0.5569305419921875, -0.498443603515625, -0.4399566650390625, -0.3814697265625, -0.3229827880859375, -0.264495849609375, -0.2060089111328125, -0.14752197265625, -0.0890350341796875, -0.030548095703125, 0.0279388427734375, 0.08642578125, 0.1449127197265625, 0.203399658203125, 0.2618865966796875, 0.32037353515625, 0.3788604736328125, 0.437347412109375, 0.4958343505859375, 0.5543212890625, 0.6128082275390625, 0.671295166015625, 0.7297821044921875, 0.78826904296875, 0.8467559814453125, 0.905242919921875, 0.9637298583984375, 1.022216796875, 1.0807037353515625, 1.139190673828125, 1.1976776123046875, 1.25616455078125, 1.3146514892578125, 1.373138427734375, 1.4316253662109375, 1.4901123046875, 1.5485992431640625, 1.607086181640625, 1.6655731201171875, 1.72406005859375, 1.7825469970703125, 1.841033935546875, 1.8995208740234375, 1.9580078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 7.0, 4.0, 6.0, 14.0, 20.0, 30.0, 45.0, 54.0, 89.0, 128.0, 264.0, 375.0, 619.0, 937.0, 1589.0, 2993.0, 9093.0, 68365.0, 1954137.0, 44092.0, 7409.0, 2758.0, 1510.0, 929.0, 571.0, 346.0, 251.0, 162.0, 130.0, 67.0, 32.0, 36.0, 13.0, 15.0, 14.0, 7.0, 5.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.8359375, -37.515625, -36.1953125, -34.875, -33.5546875, -32.234375, -30.9140625, -29.59375, -28.2734375, -26.953125, -25.6328125, -24.3125, -22.9921875, -21.671875, -20.3515625, -19.03125, -17.7109375, -16.390625, -15.0703125, -13.75, -12.4296875, -11.109375, -9.7890625, -8.46875, -7.1484375, -5.828125, -4.5078125, -3.1875, -1.8671875, -0.546875, 0.7734375, 2.09375, 3.4140625, 4.734375, 6.0546875, 7.375, 8.6953125, 10.015625, 11.3359375, 12.65625, 13.9765625, 15.296875, 16.6171875, 17.9375, 19.2578125, 20.578125, 21.8984375, 23.21875, 24.5390625, 25.859375, 27.1796875, 28.5, 29.8203125, 31.140625, 32.4609375, 33.78125, 35.1015625, 36.421875, 37.7421875, 39.0625, 40.3828125, 41.703125, 43.0234375, 44.34375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 24.0, 47.0, 752.0, 76.0, 30.0, 19.0, 8.0, 10.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.828857421875, -10.42333984375, -10.017822265625, -9.6123046875, -9.206787109375, -8.80126953125, -8.395751953125, -7.990234375, -7.584716796875, -7.17919921875, -6.773681640625, -6.3681640625, -5.962646484375, -5.55712890625, -5.151611328125, -4.74609375, -4.340576171875, -3.93505859375, -3.529541015625, -3.1240234375, -2.718505859375, -2.31298828125, -1.907470703125, -1.501953125, -1.096435546875, -0.69091796875, -0.285400390625, 0.1201171875, 0.525634765625, 0.93115234375, 1.336669921875, 1.7421875, 2.147705078125, 2.55322265625, 2.958740234375, 3.3642578125, 3.769775390625, 4.17529296875, 4.580810546875, 4.986328125, 5.391845703125, 5.79736328125, 6.202880859375, 6.6083984375, 7.013916015625, 7.41943359375, 7.824951171875, 8.23046875, 8.635986328125, 9.04150390625, 9.447021484375, 9.8525390625, 10.258056640625, 10.66357421875, 11.069091796875, 11.474609375, 11.880126953125, 12.28564453125, 12.691162109375, 13.0966796875, 13.502197265625, 13.90771484375, 14.313232421875, 14.71875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 23.0, 64.0, 236.0, 1200.0, 14160.0, 1028432.0, 3671.0, 491.0, 125.0, 53.0, 22.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-244.375, -237.63671875, -230.8984375, -224.16015625, -217.421875, -210.68359375, -203.9453125, -197.20703125, -190.46875, -183.73046875, -176.9921875, -170.25390625, -163.515625, -156.77734375, -150.0390625, -143.30078125, -136.5625, -129.82421875, -123.0859375, -116.34765625, -109.609375, -102.87109375, -96.1328125, -89.39453125, -82.65625, -75.91796875, -69.1796875, -62.44140625, -55.703125, -48.96484375, -42.2265625, -35.48828125, -28.75, -22.01171875, -15.2734375, -8.53515625, -1.796875, 4.94140625, 11.6796875, 18.41796875, 25.15625, 31.89453125, 38.6328125, 45.37109375, 52.109375, 58.84765625, 65.5859375, 72.32421875, 79.0625, 85.80078125, 92.5390625, 99.27734375, 106.015625, 112.75390625, 119.4921875, 126.23046875, 132.96875, 139.70703125, 146.4453125, 153.18359375, 159.921875, 166.66015625, 173.3984375, 180.13671875, 186.875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 13.0, 16.0, 11.0, 9.0, 13.0, 16.0, 22.0, 38.0, 58.0, 63.0, 89.0, 135.0, 133.0, 78.0, 65.0, 43.0, 37.0, 40.0, 19.0, 21.0, 17.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.570699691772461, -6.352674961090088, -6.134650230407715, -5.916625499725342, -5.698600769042969, -5.480576038360596, -5.262551307678223, -5.044526100158691, -4.826501846313477, -4.6084771156311035, -4.3904523849487305, -4.172427654266357, -3.9544029235839844, -3.7363781929016113, -3.518353223800659, -3.300328493118286, -3.082303524017334, -2.864278793334961, -2.646254062652588, -2.428229331970215, -2.210204601287842, -1.9921797513961792, -1.7741549015045166, -1.5561301708221436, -1.3381054401397705, -1.1200807094573975, -0.9020559191703796, -0.6840311288833618, -0.46600639820098877, -0.24798166751861572, -0.029956817626953125, 0.18806791305541992, 0.40609264373779297, 0.624117374420166, 0.8421421647071838, 1.0601669549942017, 1.2781916856765747, 1.4962164163589478, 1.7142412662506104, 1.9322659969329834, 2.1502907276153564, 2.3683154582977295, 2.5863401889801025, 2.8043651580810547, 3.0223898887634277, 3.240414619445801, 3.458439350128174, 3.676464080810547, 3.89448881149292, 4.112513542175293, 4.330538272857666, 4.548563003540039, 4.766587734222412, 4.984612464904785, 5.202637672424316, 5.420661926269531, 5.6386871337890625, 5.8567118644714355, 6.074736595153809, 6.292761325836182, 6.510786056518555, 6.728810787200928, 6.946835517883301, 7.164860725402832, 7.382884979248047]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 6.0, 18.0, 11.0, 14.0, 18.0, 25.0, 23.0, 37.0, 28.0, 39.0, 42.0, 41.0, 40.0, 32.0, 51.0, 59.0, 50.0, 41.0, 48.0, 49.0, 39.0, 45.0, 40.0, 35.0, 26.0, 26.0, 23.0, 16.0, 18.0, 21.0, 7.0, 6.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.732614040374756, -6.518804550170898, -6.304995059967041, -6.091185569763184, -5.877376079559326, -5.663566589355469, -5.449756622314453, -5.235947132110596, -5.022137641906738, -4.808328151702881, -4.594518661499023, -4.380709171295166, -4.166899681091309, -3.953089952468872, -3.7392804622650146, -3.525470733642578, -3.3116614818573, -3.0978519916534424, -2.884042501449585, -2.6702327728271484, -2.456423282623291, -2.2426137924194336, -2.028804302215576, -1.8149946928024292, -1.6011852025985718, -1.3873757123947144, -1.1735661029815674, -0.95975661277771, -0.7459470629692078, -0.5321375131607056, -0.31832802295684814, -0.10451841354370117, 0.10929107666015625, 0.32310062646865845, 0.5369101762771606, 0.7507196664810181, 0.9645292162895203, 1.1783387660980225, 1.3921482563018799, 1.6059578657150269, 1.8197673559188843, 2.0335769653320312, 2.2473864555358887, 2.461195945739746, 2.6750054359436035, 2.888814926147461, 3.1026244163513184, 3.316434144973755, 3.5302436351776123, 3.7440531253814697, 3.957862615585327, 4.171672344207764, 4.385481834411621, 4.5992913246154785, 4.813100814819336, 5.026910305023193, 5.240719795227051, 5.454529285430908, 5.668338775634766, 5.882148265838623, 6.0959577560424805, 6.309767723083496, 6.523576736450195, 6.737386703491211, 6.951196193695068]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 13.0, 8.0, 19.0, 21.0, 22.0, 34.0, 38.0, 37.0, 32.0, 33.0, 38.0, 45.0, 59.0, 52.0, 46.0, 48.0, 51.0, 40.0, 52.0, 48.0, 36.0, 32.0, 26.0, 21.0, 23.0, 15.0, 24.0, 20.0, 14.0, 12.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.208892822265625, -2.11700439453125, -2.025115966796875, -1.9332275390625, -1.841339111328125, -1.74945068359375, -1.657562255859375, -1.565673828125, -1.473785400390625, -1.38189697265625, -1.290008544921875, -1.1981201171875, -1.106231689453125, -1.01434326171875, -0.922454833984375, -0.83056640625, -0.738677978515625, -0.64678955078125, -0.554901123046875, -0.4630126953125, -0.371124267578125, -0.27923583984375, -0.187347412109375, -0.095458984375, -0.003570556640625, 0.08831787109375, 0.180206298828125, 0.2720947265625, 0.363983154296875, 0.45587158203125, 0.547760009765625, 0.6396484375, 0.731536865234375, 0.82342529296875, 0.915313720703125, 1.0072021484375, 1.099090576171875, 1.19097900390625, 1.282867431640625, 1.374755859375, 1.466644287109375, 1.55853271484375, 1.650421142578125, 1.7423095703125, 1.834197998046875, 1.92608642578125, 2.017974853515625, 2.10986328125, 2.201751708984375, 2.29364013671875, 2.385528564453125, 2.4774169921875, 2.569305419921875, 2.66119384765625, 2.753082275390625, 2.844970703125, 2.936859130859375, 3.02874755859375, 3.120635986328125, 3.2125244140625, 3.304412841796875, 3.39630126953125, 3.488189697265625, 3.580078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 6.0, 18.0, 13.0, 32.0, 30.0, 56.0, 101.0, 132.0, 172.0, 252.0, 400.0, 597.0, 961.0, 1644.0, 2753.0, 4945.0, 9217.0, 18896.0, 42575.0, 133776.0, 597327.0, 147421.0, 45071.0, 19758.0, 9770.0, 5147.0, 2909.0, 1723.0, 1011.0, 675.0, 371.0, 258.0, 162.0, 100.0, 86.0, 59.0, 38.0, 14.0, 22.0, 10.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.05963134765625, -4.8614501953125, -4.66326904296875, -4.465087890625, -4.26690673828125, -4.0687255859375, -3.87054443359375, -3.67236328125, -3.47418212890625, -3.2760009765625, -3.07781982421875, -2.879638671875, -2.68145751953125, -2.4832763671875, -2.28509521484375, -2.0869140625, -1.88873291015625, -1.6905517578125, -1.49237060546875, -1.294189453125, -1.09600830078125, -0.8978271484375, -0.69964599609375, -0.50146484375, -0.30328369140625, -0.1051025390625, 0.09307861328125, 0.291259765625, 0.48944091796875, 0.6876220703125, 0.88580322265625, 1.083984375, 1.28216552734375, 1.4803466796875, 1.67852783203125, 1.876708984375, 2.07489013671875, 2.2730712890625, 2.47125244140625, 2.66943359375, 2.86761474609375, 3.0657958984375, 3.26397705078125, 3.462158203125, 3.66033935546875, 3.8585205078125, 4.05670166015625, 4.2548828125, 4.45306396484375, 4.6512451171875, 4.84942626953125, 5.047607421875, 5.24578857421875, 5.4439697265625, 5.64215087890625, 5.84033203125, 6.03851318359375, 6.2366943359375, 6.43487548828125, 6.633056640625, 6.83123779296875, 7.0294189453125, 7.22760009765625, 7.42578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 18.0, 33.0, 25.0, 26.0, 25.0, 31.0, 41.0, 41.0, 72.0, 71.0, 95.0, 146.0, 1424.0, 360.0, 131.0, 93.0, 70.0, 52.0, 45.0, 39.0, 35.0, 35.0, 21.0, 15.0, 16.0, 15.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.307373046875, -8.97412109375, -8.640869140625, -8.3076171875, -7.974365234375, -7.64111328125, -7.307861328125, -6.974609375, -6.641357421875, -6.30810546875, -5.974853515625, -5.6416015625, -5.308349609375, -4.97509765625, -4.641845703125, -4.30859375, -3.975341796875, -3.64208984375, -3.308837890625, -2.9755859375, -2.642333984375, -2.30908203125, -1.975830078125, -1.642578125, -1.309326171875, -0.97607421875, -0.642822265625, -0.3095703125, 0.023681640625, 0.35693359375, 0.690185546875, 1.0234375, 1.356689453125, 1.68994140625, 2.023193359375, 2.3564453125, 2.689697265625, 3.02294921875, 3.356201171875, 3.689453125, 4.022705078125, 4.35595703125, 4.689208984375, 5.0224609375, 5.355712890625, 5.68896484375, 6.022216796875, 6.35546875, 6.688720703125, 7.02197265625, 7.355224609375, 7.6884765625, 8.021728515625, 8.35498046875, 8.688232421875, 9.021484375, 9.354736328125, 9.68798828125, 10.021240234375, 10.3544921875, 10.687744140625, 11.02099609375, 11.354248046875, 11.6875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 17.0, 13.0, 11.0, 19.0, 22.0, 27.0, 32.0, 37.0, 55.0, 111.0, 156.0, 276.0, 766.0, 2423.0, 11071.0, 82469.0, 2693648.0, 322074.0, 25543.0, 4646.0, 1220.0, 427.0, 214.0, 118.0, 61.0, 41.0, 43.0, 32.0, 27.0, 20.0, 17.0, 9.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.797119140625, -16.25048828125, -15.703857421875, -15.1572265625, -14.610595703125, -14.06396484375, -13.517333984375, -12.970703125, -12.424072265625, -11.87744140625, -11.330810546875, -10.7841796875, -10.237548828125, -9.69091796875, -9.144287109375, -8.59765625, -8.051025390625, -7.50439453125, -6.957763671875, -6.4111328125, -5.864501953125, -5.31787109375, -4.771240234375, -4.224609375, -3.677978515625, -3.13134765625, -2.584716796875, -2.0380859375, -1.491455078125, -0.94482421875, -0.398193359375, 0.1484375, 0.695068359375, 1.24169921875, 1.788330078125, 2.3349609375, 2.881591796875, 3.42822265625, 3.974853515625, 4.521484375, 5.068115234375, 5.61474609375, 6.161376953125, 6.7080078125, 7.254638671875, 7.80126953125, 8.347900390625, 8.89453125, 9.441162109375, 9.98779296875, 10.534423828125, 11.0810546875, 11.627685546875, 12.17431640625, 12.720947265625, 13.267578125, 13.814208984375, 14.36083984375, 14.907470703125, 15.4541015625, 16.000732421875, 16.54736328125, 17.093994140625, 17.640625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 33.0, 93.0, 201.0, 300.0, 207.0, 122.0, 37.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96629524230957, -25.113798141479492, -23.261301040649414, -21.408803939819336, -19.556306838989258, -17.70380973815918, -15.851312637329102, -13.998815536499023, -12.146318435668945, -10.293821334838867, -8.441324234008789, -6.588827133178711, -4.736330032348633, -2.8838329315185547, -1.0313358306884766, 0.8211612701416016, 2.6736583709716797, 4.526155471801758, 6.378652572631836, 8.231149673461914, 10.083646774291992, 11.93614387512207, 13.788640975952148, 15.641138076782227, 17.493635177612305, 19.346132278442383, 21.19862937927246, 23.05112648010254, 24.903623580932617, 26.756120681762695, 28.608617782592773, 30.46111488342285, 32.31361389160156, 34.16611099243164, 36.01860809326172, 37.8711051940918, 39.723602294921875, 41.57609939575195, 43.42859649658203, 45.28109359741211, 47.13359069824219, 48.986087799072266, 50.838584899902344, 52.69108200073242, 54.5435791015625, 56.39607620239258, 58.248573303222656, 60.101070404052734, 61.95356750488281, 63.80606460571289, 65.65856170654297, 67.51106262207031, 69.36355590820312, 71.21604919433594, 73.06855010986328, 74.92105102539062, 76.77354431152344, 78.62603759765625, 80.4785385131836, 82.33103942871094, 84.18353271484375, 86.03602600097656, 87.8885269165039, 89.74102783203125, 91.59352111816406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 11.0, 16.0, 13.0, 31.0, 22.0, 18.0, 26.0, 26.0, 35.0, 36.0, 36.0, 40.0, 45.0, 37.0, 49.0, 56.0, 41.0, 31.0, 40.0, 36.0, 32.0, 35.0, 24.0, 27.0, 29.0, 20.0, 24.0, 19.0, 22.0, 13.0, 15.0, 20.0, 8.0, 7.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.59970474243164, -25.747615814208984, -24.89552879333496, -24.043439865112305, -23.19135284423828, -22.339263916015625, -21.48717498779297, -20.635087966918945, -19.78299903869629, -18.930910110473633, -18.07882308959961, -17.226734161376953, -16.37464714050293, -15.522558212280273, -14.670470237731934, -13.818382263183594, -12.966294288635254, -12.114206314086914, -11.262118339538574, -10.410030364990234, -9.557941436767578, -8.705853462219238, -7.853765487670898, -7.0016770362854, -6.1495890617370605, -5.297501087188721, -4.445412635803223, -3.593324661254883, -2.741236448287964, -1.889148235321045, -1.037060260772705, -0.18497180938720703, 0.6671161651611328, 1.5192043781280518, 2.3712925910949707, 3.2233805656433105, 4.075469017028809, 4.927556991577148, 5.779644966125488, 6.631733417510986, 7.483821392059326, 8.335909843444824, 9.187997817993164, 10.040085792541504, 10.892173767089844, 11.7442626953125, 12.596349716186523, 13.44843864440918, 14.30052661895752, 15.15261459350586, 16.004703521728516, 16.85679054260254, 17.708879470825195, 18.56096649169922, 19.413055419921875, 20.26514434814453, 21.117231369018555, 21.96932029724121, 22.821407318115234, 23.67349624633789, 24.525583267211914, 25.37767219543457, 26.229759216308594, 27.08184814453125, 27.933937072753906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 13.0, 13.0, 18.0, 28.0, 22.0, 33.0, 30.0, 23.0, 45.0, 43.0, 43.0, 45.0, 48.0, 65.0, 42.0, 37.0, 42.0, 46.0, 43.0, 47.0, 32.0, 27.0, 30.0, 25.0, 20.0, 19.0, 22.0, 17.0, 16.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.393798828125, -2.29736328125, -2.200927734375, -2.1044921875, -2.008056640625, -1.91162109375, -1.815185546875, -1.71875, -1.622314453125, -1.52587890625, -1.429443359375, -1.3330078125, -1.236572265625, -1.14013671875, -1.043701171875, -0.947265625, -0.850830078125, -0.75439453125, -0.657958984375, -0.5615234375, -0.465087890625, -0.36865234375, -0.272216796875, -0.17578125, -0.079345703125, 0.01708984375, 0.113525390625, 0.2099609375, 0.306396484375, 0.40283203125, 0.499267578125, 0.595703125, 0.692138671875, 0.78857421875, 0.885009765625, 0.9814453125, 1.077880859375, 1.17431640625, 1.270751953125, 1.3671875, 1.463623046875, 1.56005859375, 1.656494140625, 1.7529296875, 1.849365234375, 1.94580078125, 2.042236328125, 2.138671875, 2.235107421875, 2.33154296875, 2.427978515625, 2.5244140625, 2.620849609375, 2.71728515625, 2.813720703125, 2.91015625, 3.006591796875, 3.10302734375, 3.199462890625, 3.2958984375, 3.392333984375, 3.48876953125, 3.585205078125, 3.681640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 12.0, 14.0, 24.0, 18.0, 46.0, 62.0, 74.0, 154.0, 200.0, 335.0, 483.0, 776.0, 1200.0, 2117.0, 3588.0, 6547.0, 11816.0, 23213.0, 52388.0, 198159.0, 1589525.0, 1964535.0, 230896.0, 54733.0, 24184.0, 12369.0, 6673.0, 3784.0, 2243.0, 1365.0, 910.0, 570.0, 369.0, 271.0, 175.0, 126.0, 91.0, 68.0, 35.0, 36.0, 21.0, 20.0, 13.0, 9.0, 10.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.4140625, -5.2210693359375, -5.028076171875, -4.8350830078125, -4.64208984375, -4.4490966796875, -4.256103515625, -4.0631103515625, -3.8701171875, -3.6771240234375, -3.484130859375, -3.2911376953125, -3.09814453125, -2.9051513671875, -2.712158203125, -2.5191650390625, -2.326171875, -2.1331787109375, -1.940185546875, -1.7471923828125, -1.55419921875, -1.3612060546875, -1.168212890625, -0.9752197265625, -0.7822265625, -0.5892333984375, -0.396240234375, -0.2032470703125, -0.01025390625, 0.1827392578125, 0.375732421875, 0.5687255859375, 0.76171875, 0.9547119140625, 1.147705078125, 1.3406982421875, 1.53369140625, 1.7266845703125, 1.919677734375, 2.1126708984375, 2.3056640625, 2.4986572265625, 2.691650390625, 2.8846435546875, 3.07763671875, 3.2706298828125, 3.463623046875, 3.6566162109375, 3.849609375, 4.0426025390625, 4.235595703125, 4.4285888671875, 4.62158203125, 4.8145751953125, 5.007568359375, 5.2005615234375, 5.3935546875, 5.5865478515625, 5.779541015625, 5.9725341796875, 6.16552734375, 6.3585205078125, 6.551513671875, 6.7445068359375, 6.9375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 18.0, 19.0, 31.0, 39.0, 49.0, 84.0, 113.0, 172.0, 371.0, 713.0, 940.0, 643.0, 312.0, 153.0, 109.0, 82.0, 60.0, 38.0, 41.0, 12.0, 12.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3641357421875, -9.056396484375, -8.7486572265625, -8.44091796875, -8.1331787109375, -7.825439453125, -7.5177001953125, -7.2099609375, -6.9022216796875, -6.594482421875, -6.2867431640625, -5.97900390625, -5.6712646484375, -5.363525390625, -5.0557861328125, -4.748046875, -4.4403076171875, -4.132568359375, -3.8248291015625, -3.51708984375, -3.2093505859375, -2.901611328125, -2.5938720703125, -2.2861328125, -1.9783935546875, -1.670654296875, -1.3629150390625, -1.05517578125, -0.7474365234375, -0.439697265625, -0.1319580078125, 0.17578125, 0.4835205078125, 0.791259765625, 1.0989990234375, 1.40673828125, 1.7144775390625, 2.022216796875, 2.3299560546875, 2.6376953125, 2.9454345703125, 3.253173828125, 3.5609130859375, 3.86865234375, 4.1763916015625, 4.484130859375, 4.7918701171875, 5.099609375, 5.4073486328125, 5.715087890625, 6.0228271484375, 6.33056640625, 6.6383056640625, 6.946044921875, 7.2537841796875, 7.5615234375, 7.8692626953125, 8.177001953125, 8.4847412109375, 8.79248046875, 9.1002197265625, 9.407958984375, 9.7156982421875, 10.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 10.0, 32.0, 32.0, 50.0, 86.0, 174.0, 341.0, 681.0, 1664.0, 4676.0, 16562.0, 79864.0, 1387124.0, 2567562.0, 105722.0, 20632.0, 5629.0, 1860.0, 769.0, 370.0, 176.0, 104.0, 60.0, 29.0, 24.0, 8.0, 13.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.439697265625, -15.91064453125, -15.381591796875, -14.8525390625, -14.323486328125, -13.79443359375, -13.265380859375, -12.736328125, -12.207275390625, -11.67822265625, -11.149169921875, -10.6201171875, -10.091064453125, -9.56201171875, -9.032958984375, -8.50390625, -7.974853515625, -7.44580078125, -6.916748046875, -6.3876953125, -5.858642578125, -5.32958984375, -4.800537109375, -4.271484375, -3.742431640625, -3.21337890625, -2.684326171875, -2.1552734375, -1.626220703125, -1.09716796875, -0.568115234375, -0.0390625, 0.489990234375, 1.01904296875, 1.548095703125, 2.0771484375, 2.606201171875, 3.13525390625, 3.664306640625, 4.193359375, 4.722412109375, 5.25146484375, 5.780517578125, 6.3095703125, 6.838623046875, 7.36767578125, 7.896728515625, 8.42578125, 8.954833984375, 9.48388671875, 10.012939453125, 10.5419921875, 11.071044921875, 11.60009765625, 12.129150390625, 12.658203125, 13.187255859375, 13.71630859375, 14.245361328125, 14.7744140625, 15.303466796875, 15.83251953125, 16.361572265625, 16.890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 18.0, 24.0, 28.0, 41.0, 54.0, 73.0, 111.0, 142.0, 130.0, 103.0, 83.0, 70.0, 36.0, 25.0, 24.0, 18.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.594764709472656, -34.35810470581055, -33.12144088745117, -31.88477897644043, -30.648117065429688, -29.411457061767578, -28.174795150756836, -26.938133239746094, -25.70147132873535, -24.46480941772461, -23.228147506713867, -21.991485595703125, -20.754825592041016, -19.51816177368164, -18.28150177001953, -17.04483985900879, -15.808177947998047, -14.571516036987305, -13.334854125976562, -12.098193168640137, -10.861531257629395, -9.624869346618652, -8.388208389282227, -7.151546478271484, -5.914884567260742, -4.67822265625, -3.441561222076416, -2.204899549484253, -0.9682378768920898, 0.26842403411865234, 1.5050854682922363, 2.7417469024658203, 3.978412628173828, 5.21507453918457, 6.451735973358154, 7.688397407531738, 8.92505931854248, 10.161721229553223, 11.398382186889648, 12.63504409790039, 13.871706008911133, 15.108367919921875, 16.345029830932617, 17.58169174194336, 18.81835174560547, 20.055015563964844, 21.291675567626953, 22.528337478637695, 23.764999389648438, 25.00166130065918, 26.238323211669922, 27.474985122680664, 28.711647033691406, 29.948307037353516, 31.184968948364258, 32.421630859375, 33.658294677734375, 34.894954681396484, 36.13161849975586, 37.36827850341797, 38.604942321777344, 39.84160232543945, 41.07826614379883, 42.31492614746094, 43.55158615112305]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 3.0, 7.0, 13.0, 12.0, 11.0, 13.0, 19.0, 19.0, 22.0, 25.0, 31.0, 28.0, 37.0, 32.0, 25.0, 40.0, 42.0, 41.0, 42.0, 27.0, 40.0, 34.0, 41.0, 37.0, 37.0, 40.0, 35.0, 24.0, 24.0, 29.0, 12.0, 25.0, 18.0, 14.0, 16.0, 16.0, 10.0, 15.0, 8.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-22.668424606323242, -21.979143142700195, -21.28986167907715, -20.6005802154541, -19.911298751831055, -19.222017288208008, -18.532737731933594, -17.843456268310547, -17.1541748046875, -16.464893341064453, -15.775611877441406, -15.08633041381836, -14.397048950195312, -13.707767486572266, -13.018486976623535, -12.329205513000488, -11.639923095703125, -10.950641632080078, -10.261360168457031, -9.572078704833984, -8.882797241210938, -8.19351577758789, -7.50423526763916, -6.814953804016113, -6.125672340393066, -5.4363908767700195, -4.747109413146973, -4.057828426361084, -3.368546962738037, -2.6792654991149902, -1.9899845123291016, -1.3007030487060547, -0.6114234924316406, 0.0778578519821167, 0.767139196395874, 1.4564204216003418, 2.1457018852233887, 2.8349833488464355, 3.524264335632324, 4.213545799255371, 4.902827262878418, 5.592108726501465, 6.281390190124512, 6.9706711769104, 7.659952640533447, 8.349233627319336, 9.038515090942383, 9.72779655456543, 10.417078018188477, 11.106359481811523, 11.79564094543457, 12.484922409057617, 13.174203872680664, 13.863485336303711, 14.552765846252441, 15.242047309875488, 15.931328773498535, 16.620609283447266, 17.309890747070312, 17.99917221069336, 18.688453674316406, 19.377735137939453, 20.0670166015625, 20.756298065185547, 21.445579528808594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 14.0, 19.0, 21.0, 22.0, 15.0, 28.0, 26.0, 28.0, 34.0, 38.0, 29.0, 40.0, 30.0, 38.0, 40.0, 39.0, 41.0, 34.0, 35.0, 35.0, 37.0, 29.0, 35.0, 33.0, 14.0, 22.0, 20.0, 26.0, 16.0, 24.0, 19.0, 14.0, 5.0, 6.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.296875, -2.2203369140625, -2.143798828125, -2.0672607421875, -1.99072265625, -1.9141845703125, -1.837646484375, -1.7611083984375, -1.6845703125, -1.6080322265625, -1.531494140625, -1.4549560546875, -1.37841796875, -1.3018798828125, -1.225341796875, -1.1488037109375, -1.072265625, -0.9957275390625, -0.919189453125, -0.8426513671875, -0.76611328125, -0.6895751953125, -0.613037109375, -0.5364990234375, -0.4599609375, -0.3834228515625, -0.306884765625, -0.2303466796875, -0.15380859375, -0.0772705078125, -0.000732421875, 0.0758056640625, 0.15234375, 0.2288818359375, 0.305419921875, 0.3819580078125, 0.45849609375, 0.5350341796875, 0.611572265625, 0.6881103515625, 0.7646484375, 0.8411865234375, 0.917724609375, 0.9942626953125, 1.07080078125, 1.1473388671875, 1.223876953125, 1.3004150390625, 1.376953125, 1.4534912109375, 1.530029296875, 1.6065673828125, 1.68310546875, 1.7596435546875, 1.836181640625, 1.9127197265625, 1.9892578125, 2.0657958984375, 2.142333984375, 2.2188720703125, 2.29541015625, 2.3719482421875, 2.448486328125, 2.5250244140625, 2.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 12.0, 19.0, 31.0, 31.0, 40.0, 59.0, 109.0, 111.0, 171.0, 217.0, 282.0, 444.0, 591.0, 792.0, 1155.0, 1654.0, 2601.0, 4471.0, 9412.0, 25489.0, 117873.0, 722753.0, 113239.0, 24972.0, 9311.0, 4410.0, 2575.0, 1654.0, 1187.0, 764.0, 556.0, 441.0, 290.0, 235.0, 153.0, 109.0, 98.0, 76.0, 37.0, 40.0, 29.0, 18.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.19146728515625, -5.9884033203125, -5.78533935546875, -5.582275390625, -5.37921142578125, -5.1761474609375, -4.97308349609375, -4.77001953125, -4.56695556640625, -4.3638916015625, -4.16082763671875, -3.957763671875, -3.75469970703125, -3.5516357421875, -3.34857177734375, -3.1455078125, -2.94244384765625, -2.7393798828125, -2.53631591796875, -2.333251953125, -2.13018798828125, -1.9271240234375, -1.72406005859375, -1.52099609375, -1.31793212890625, -1.1148681640625, -0.91180419921875, -0.708740234375, -0.50567626953125, -0.3026123046875, -0.09954833984375, 0.103515625, 0.30657958984375, 0.5096435546875, 0.71270751953125, 0.915771484375, 1.11883544921875, 1.3218994140625, 1.52496337890625, 1.72802734375, 1.93109130859375, 2.1341552734375, 2.33721923828125, 2.540283203125, 2.74334716796875, 2.9464111328125, 3.14947509765625, 3.3525390625, 3.55560302734375, 3.7586669921875, 3.96173095703125, 4.164794921875, 4.36785888671875, 4.5709228515625, 4.77398681640625, 4.97705078125, 5.18011474609375, 5.3831787109375, 5.58624267578125, 5.789306640625, 5.99237060546875, 6.1954345703125, 6.39849853515625, 6.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 11.0, 7.0, 4.0, 12.0, 9.0, 9.0, 19.0, 25.0, 29.0, 26.0, 27.0, 32.0, 27.0, 39.0, 45.0, 35.0, 41.0, 40.0, 1078.0, 43.0, 38.0, 34.0, 38.0, 36.0, 43.0, 43.0, 32.0, 32.0, 21.0, 17.0, 20.0, 15.0, 19.0, 13.0, 12.0, 12.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.0850830078125, -2.011962890625, -1.9388427734375, -1.86572265625, -1.7926025390625, -1.719482421875, -1.6463623046875, -1.5732421875, -1.5001220703125, -1.427001953125, -1.3538818359375, -1.28076171875, -1.2076416015625, -1.134521484375, -1.0614013671875, -0.98828125, -0.9151611328125, -0.842041015625, -0.7689208984375, -0.69580078125, -0.6226806640625, -0.549560546875, -0.4764404296875, -0.4033203125, -0.3302001953125, -0.257080078125, -0.1839599609375, -0.11083984375, -0.0377197265625, 0.035400390625, 0.1085205078125, 0.181640625, 0.2547607421875, 0.327880859375, 0.4010009765625, 0.47412109375, 0.5472412109375, 0.620361328125, 0.6934814453125, 0.7666015625, 0.8397216796875, 0.912841796875, 0.9859619140625, 1.05908203125, 1.1322021484375, 1.205322265625, 1.2784423828125, 1.3515625, 1.4246826171875, 1.497802734375, 1.5709228515625, 1.64404296875, 1.7171630859375, 1.790283203125, 1.8634033203125, 1.9365234375, 2.0096435546875, 2.082763671875, 2.1558837890625, 2.22900390625, 2.3021240234375, 2.375244140625, 2.4483642578125, 2.521484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 9.0, 13.0, 10.0, 9.0, 19.0, 25.0, 22.0, 37.0, 31.0, 63.0, 66.0, 114.0, 120.0, 172.0, 276.0, 315.0, 457.0, 653.0, 1004.0, 1536.0, 2470.0, 4353.0, 9495.0, 32477.0, 1329657.0, 665232.0, 28540.0, 8662.0, 4153.0, 2322.0, 1489.0, 1017.0, 609.0, 444.0, 344.0, 211.0, 192.0, 120.0, 93.0, 68.0, 62.0, 34.0, 32.0, 28.0, 19.0, 18.0, 6.0, 9.0, 4.0, 4.0, 0.0, 3.0, 6.0, 5.0], "bins": [-8.3046875, -8.067138671875, -7.82958984375, -7.592041015625, -7.3544921875, -7.116943359375, -6.87939453125, -6.641845703125, -6.404296875, -6.166748046875, -5.92919921875, -5.691650390625, -5.4541015625, -5.216552734375, -4.97900390625, -4.741455078125, -4.50390625, -4.266357421875, -4.02880859375, -3.791259765625, -3.5537109375, -3.316162109375, -3.07861328125, -2.841064453125, -2.603515625, -2.365966796875, -2.12841796875, -1.890869140625, -1.6533203125, -1.415771484375, -1.17822265625, -0.940673828125, -0.703125, -0.465576171875, -0.22802734375, 0.009521484375, 0.2470703125, 0.484619140625, 0.72216796875, 0.959716796875, 1.197265625, 1.434814453125, 1.67236328125, 1.909912109375, 2.1474609375, 2.385009765625, 2.62255859375, 2.860107421875, 3.09765625, 3.335205078125, 3.57275390625, 3.810302734375, 4.0478515625, 4.285400390625, 4.52294921875, 4.760498046875, 4.998046875, 5.235595703125, 5.47314453125, 5.710693359375, 5.9482421875, 6.185791015625, 6.42333984375, 6.660888671875, 6.8984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 17.0, 19.0, 25.0, 28.0, 60.0, 184.0, 362.0, 97.0, 49.0, 30.0, 20.0, 15.0, 16.0, 13.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.38671875, -2.3244171142578125, -2.262115478515625, -2.1998138427734375, -2.13751220703125, -2.0752105712890625, -2.012908935546875, -1.9506072998046875, -1.8883056640625, -1.8260040283203125, -1.763702392578125, -1.7014007568359375, -1.63909912109375, -1.5767974853515625, -1.514495849609375, -1.4521942138671875, -1.389892578125, -1.3275909423828125, -1.265289306640625, -1.2029876708984375, -1.14068603515625, -1.0783843994140625, -1.016082763671875, -0.9537811279296875, -0.8914794921875, -0.8291778564453125, -0.766876220703125, -0.7045745849609375, -0.64227294921875, -0.5799713134765625, -0.517669677734375, -0.4553680419921875, -0.39306640625, -0.3307647705078125, -0.268463134765625, -0.2061614990234375, -0.14385986328125, -0.0815582275390625, -0.019256591796875, 0.0430450439453125, 0.1053466796875, 0.1676483154296875, 0.229949951171875, 0.2922515869140625, 0.35455322265625, 0.4168548583984375, 0.479156494140625, 0.5414581298828125, 0.603759765625, 0.6660614013671875, 0.728363037109375, 0.7906646728515625, 0.85296630859375, 0.9152679443359375, 0.977569580078125, 1.0398712158203125, 1.1021728515625, 1.1644744873046875, 1.226776123046875, 1.2890777587890625, 1.35137939453125, 1.4136810302734375, 1.475982666015625, 1.5382843017578125, 1.6005859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 3.0, 8.0, 5.0, 8.0, 18.0, 34.0, 55.0, 102.0, 292.0, 1296.0, 7571.0, 999347.0, 36042.0, 2828.0, 575.0, 153.0, 66.0, 33.0, 21.0, 17.0, 17.0, 15.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-28.71875, -27.60302734375, -26.4873046875, -25.37158203125, -24.255859375, -23.14013671875, -22.0244140625, -20.90869140625, -19.79296875, -18.67724609375, -17.5615234375, -16.44580078125, -15.330078125, -14.21435546875, -13.0986328125, -11.98291015625, -10.8671875, -9.75146484375, -8.6357421875, -7.52001953125, -6.404296875, -5.28857421875, -4.1728515625, -3.05712890625, -1.94140625, -0.82568359375, 0.2900390625, 1.40576171875, 2.521484375, 3.63720703125, 4.7529296875, 5.86865234375, 6.984375, 8.10009765625, 9.2158203125, 10.33154296875, 11.447265625, 12.56298828125, 13.6787109375, 14.79443359375, 15.91015625, 17.02587890625, 18.1416015625, 19.25732421875, 20.373046875, 21.48876953125, 22.6044921875, 23.72021484375, 24.8359375, 25.95166015625, 27.0673828125, 28.18310546875, 29.298828125, 30.41455078125, 31.5302734375, 32.64599609375, 33.76171875, 34.87744140625, 35.9931640625, 37.10888671875, 38.224609375, 39.34033203125, 40.4560546875, 41.57177734375, 42.6875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 17.0, 43.0, 228.0, 583.0, 107.0, 26.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082770347595215, -3.6443777084350586, -3.2059853076934814, -2.7675929069519043, -2.329200267791748, -1.8908076286315918, -1.4524152278900146, -1.0140228271484375, -0.5756301879882812, -0.13723766803741455, 0.30115485191345215, 0.7395473718643188, 1.1779398918151855, 1.6163325309753418, 2.054724931716919, 2.493117332458496, 2.9315099716186523, 3.3699026107788086, 3.8082950115203857, 4.246687412261963, 4.685080051422119, 5.123472690582275, 5.561864852905273, 6.00025749206543, 6.438650131225586, 6.877042770385742, 7.315435409545898, 7.7538275718688965, 8.192220687866211, 8.630613327026367, 9.069005012512207, 9.507397651672363, 9.945791244506836, 10.384183883666992, 10.822576522827148, 11.260969161987305, 11.699361801147461, 12.137754440307617, 12.576146125793457, 13.014538764953613, 13.45293140411377, 13.891324043273926, 14.329716682434082, 14.768109321594238, 15.206501007080078, 15.644893646240234, 16.08328628540039, 16.521678924560547, 16.960071563720703, 17.39846420288086, 17.836856842041016, 18.275249481201172, 18.713642120361328, 19.152034759521484, 19.59042739868164, 20.028820037841797, 20.467212677001953, 20.90560531616211, 21.343997955322266, 21.782390594482422, 22.220783233642578, 22.659175872802734, 23.09756851196289, 23.535961151123047, 23.97435188293457]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 10.0, 9.0, 10.0, 3.0, 13.0, 12.0, 21.0, 23.0, 25.0, 26.0, 25.0, 38.0, 43.0, 42.0, 43.0, 44.0, 55.0, 47.0, 55.0, 42.0, 42.0, 40.0, 44.0, 47.0, 38.0, 26.0, 25.0, 21.0, 23.0, 21.0, 19.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5552830696105957, -1.4940707683563232, -1.4328584671020508, -1.3716461658477783, -1.3104337453842163, -1.2492214441299438, -1.1880091428756714, -1.126796841621399, -1.065584421157837, -1.0043721199035645, -0.9431597590446472, -0.8819474577903748, -0.8207350969314575, -0.7595227956771851, -0.6983104944229126, -0.6370981931686401, -0.5758858919143677, -0.5146735906600952, -0.453461229801178, -0.3922489285469055, -0.33103659749031067, -0.2698242664337158, -0.20861196517944336, -0.1473996341228485, -0.08618730306625366, -0.02497497946023941, 0.03623734414577484, 0.0974496603012085, 0.15866199135780334, 0.2198743224143982, 0.28108662366867065, 0.3422989547252655, 0.40351128578186035, 0.4647236168384552, 0.52593594789505, 0.5871482491493225, 0.6483606100082397, 0.7095729112625122, 0.7707852125167847, 0.8319975137710571, 0.8932098746299744, 0.9544221758842468, 1.015634536743164, 1.0768468379974365, 1.138059139251709, 1.1992714405059814, 1.260483741760254, 1.321696162223816, 1.3829084634780884, 1.4441207647323608, 1.5053330659866333, 1.5665454864501953, 1.6277577877044678, 1.6889700889587402, 1.7501823902130127, 1.8113946914672852, 1.8726069927215576, 1.93381929397583, 1.9950315952301025, 2.056243896484375, 2.1174561977386475, 2.17866849899292, 2.2398810386657715, 2.301093339920044, 2.3623056411743164]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 9.0, 11.0, 11.0, 17.0, 14.0, 31.0, 26.0, 25.0, 39.0, 43.0, 32.0, 41.0, 42.0, 28.0, 39.0, 43.0, 48.0, 52.0, 41.0, 52.0, 37.0, 44.0, 35.0, 32.0, 24.0, 27.0, 29.0, 26.0, 14.0, 11.0, 11.0, 11.0, 9.0, 11.0, 6.0, 7.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.904296875, -2.815826416015625, -2.72735595703125, -2.638885498046875, -2.5504150390625, -2.461944580078125, -2.37347412109375, -2.285003662109375, -2.196533203125, -2.108062744140625, -2.01959228515625, -1.931121826171875, -1.8426513671875, -1.754180908203125, -1.66571044921875, -1.577239990234375, -1.48876953125, -1.400299072265625, -1.31182861328125, -1.223358154296875, -1.1348876953125, -1.046417236328125, -0.95794677734375, -0.869476318359375, -0.781005859375, -0.692535400390625, -0.60406494140625, -0.515594482421875, -0.4271240234375, -0.338653564453125, -0.25018310546875, -0.161712646484375, -0.0732421875, 0.015228271484375, 0.10369873046875, 0.192169189453125, 0.2806396484375, 0.369110107421875, 0.45758056640625, 0.546051025390625, 0.634521484375, 0.722991943359375, 0.81146240234375, 0.899932861328125, 0.9884033203125, 1.076873779296875, 1.16534423828125, 1.253814697265625, 1.34228515625, 1.430755615234375, 1.51922607421875, 1.607696533203125, 1.6961669921875, 1.784637451171875, 1.87310791015625, 1.961578369140625, 2.050048828125, 2.138519287109375, 2.22698974609375, 2.315460205078125, 2.4039306640625, 2.492401123046875, 2.58087158203125, 2.669342041015625, 2.7578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 6.0, 9.0, 7.0, 29.0, 31.0, 46.0, 65.0, 90.0, 160.0, 202.0, 320.0, 512.0, 814.0, 1188.0, 1812.0, 2901.0, 4678.0, 7652.0, 12303.0, 21298.0, 38886.0, 76964.0, 195786.0, 392694.0, 146780.0, 63315.0, 32729.0, 18351.0, 10852.0, 6478.0, 4121.0, 2569.0, 1669.0, 1129.0, 685.0, 485.0, 303.0, 213.0, 138.0, 98.0, 64.0, 46.0, 19.0, 17.0, 16.0, 11.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.47161865234375, -3.3572998046875, -3.24298095703125, -3.128662109375, -3.01434326171875, -2.9000244140625, -2.78570556640625, -2.67138671875, -2.55706787109375, -2.4427490234375, -2.32843017578125, -2.214111328125, -2.09979248046875, -1.9854736328125, -1.87115478515625, -1.7568359375, -1.64251708984375, -1.5281982421875, -1.41387939453125, -1.299560546875, -1.18524169921875, -1.0709228515625, -0.95660400390625, -0.84228515625, -0.72796630859375, -0.6136474609375, -0.49932861328125, -0.385009765625, -0.27069091796875, -0.1563720703125, -0.04205322265625, 0.072265625, 0.18658447265625, 0.3009033203125, 0.41522216796875, 0.529541015625, 0.64385986328125, 0.7581787109375, 0.87249755859375, 0.98681640625, 1.10113525390625, 1.2154541015625, 1.32977294921875, 1.444091796875, 1.55841064453125, 1.6727294921875, 1.78704833984375, 1.9013671875, 2.01568603515625, 2.1300048828125, 2.24432373046875, 2.358642578125, 2.47296142578125, 2.5872802734375, 2.70159912109375, 2.81591796875, 2.93023681640625, 3.0445556640625, 3.15887451171875, 3.273193359375, 3.38751220703125, 3.5018310546875, 3.61614990234375, 3.73046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 10.0, 16.0, 19.0, 15.0, 24.0, 27.0, 37.0, 34.0, 45.0, 49.0, 56.0, 83.0, 139.0, 251.0, 1420.0, 253.0, 136.0, 68.0, 54.0, 53.0, 50.0, 41.0, 27.0, 12.0, 24.0, 17.0, 8.0, 9.0, 6.0, 8.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-12.046875, -11.70703125, -11.3671875, -11.02734375, -10.6875, -10.34765625, -10.0078125, -9.66796875, -9.328125, -8.98828125, -8.6484375, -8.30859375, -7.96875, -7.62890625, -7.2890625, -6.94921875, -6.609375, -6.26953125, -5.9296875, -5.58984375, -5.25, -4.91015625, -4.5703125, -4.23046875, -3.890625, -3.55078125, -3.2109375, -2.87109375, -2.53125, -2.19140625, -1.8515625, -1.51171875, -1.171875, -0.83203125, -0.4921875, -0.15234375, 0.1875, 0.52734375, 0.8671875, 1.20703125, 1.546875, 1.88671875, 2.2265625, 2.56640625, 2.90625, 3.24609375, 3.5859375, 3.92578125, 4.265625, 4.60546875, 4.9453125, 5.28515625, 5.625, 5.96484375, 6.3046875, 6.64453125, 6.984375, 7.32421875, 7.6640625, 8.00390625, 8.34375, 8.68359375, 9.0234375, 9.36328125, 9.703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 22.0, 41.0, 49.0, 65.0, 89.0, 129.0, 215.0, 437.0, 1597.0, 10625.0, 221794.0, 2826820.0, 75691.0, 6014.0, 996.0, 358.0, 210.0, 120.0, 91.0, 71.0, 51.0, 32.0, 32.0, 20.0, 16.0, 13.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.189453125, -15.59765625, -15.005859375, -14.4140625, -13.822265625, -13.23046875, -12.638671875, -12.046875, -11.455078125, -10.86328125, -10.271484375, -9.6796875, -9.087890625, -8.49609375, -7.904296875, -7.3125, -6.720703125, -6.12890625, -5.537109375, -4.9453125, -4.353515625, -3.76171875, -3.169921875, -2.578125, -1.986328125, -1.39453125, -0.802734375, -0.2109375, 0.380859375, 0.97265625, 1.564453125, 2.15625, 2.748046875, 3.33984375, 3.931640625, 4.5234375, 5.115234375, 5.70703125, 6.298828125, 6.890625, 7.482421875, 8.07421875, 8.666015625, 9.2578125, 9.849609375, 10.44140625, 11.033203125, 11.625, 12.216796875, 12.80859375, 13.400390625, 13.9921875, 14.583984375, 15.17578125, 15.767578125, 16.359375, 16.951171875, 17.54296875, 18.134765625, 18.7265625, 19.318359375, 19.91015625, 20.501953125, 21.09375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [3.0, 20.0, 327.0, 597.0, 73.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.854573249816895, -9.474528312683105, -5.094483375549316, -0.7144384384155273, 3.6656064987182617, 8.04565143585205, 12.42569637298584, 16.805740356445312, 21.185787200927734, 25.565832138061523, 29.945877075195312, 34.32592010498047, 38.70596694946289, 43.08601379394531, 47.46605682373047, 51.846099853515625, 56.22614669799805, 60.60619354248047, 64.98623657226562, 69.36627960205078, 73.74632263183594, 78.12637329101562, 82.50641632080078, 86.88645935058594, 91.2665023803711, 95.64654541015625, 100.02659606933594, 104.4066390991211, 108.78668212890625, 113.1667251586914, 117.54676818847656, 121.92681884765625, 126.30685424804688, 130.68690490722656, 135.0669403076172, 139.44699096679688, 143.8270263671875, 148.2070770263672, 152.58712768554688, 156.9671630859375, 161.3472137451172, 165.72726440429688, 170.1072998046875, 174.4873504638672, 178.86740112304688, 183.2474365234375, 187.6274871826172, 192.0075225830078, 196.3875732421875, 200.7676239013672, 205.1476593017578, 209.5277099609375, 213.90774536132812, 218.2877960205078, 222.6678466796875, 227.04788208007812, 231.4279327392578, 235.8079833984375, 240.18801879882812, 244.5680694580078, 248.9481201171875, 253.32815551757812, 257.70819091796875, 262.0882568359375, 266.4682922363281]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 9.0, 12.0, 12.0, 14.0, 13.0, 12.0, 15.0, 24.0, 23.0, 34.0, 26.0, 23.0, 31.0, 32.0, 33.0, 19.0, 33.0, 37.0, 36.0, 27.0, 33.0, 24.0, 41.0, 39.0, 34.0, 36.0, 35.0, 39.0, 26.0, 24.0, 20.0, 22.0, 23.0, 18.0, 17.0, 14.0, 10.0, 13.0, 11.0, 10.0, 14.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.88700294494629, -21.217126846313477, -20.547252655029297, -19.877376556396484, -19.207500457763672, -18.53762435913086, -17.86775016784668, -17.197874069213867, -16.527999877929688, -15.858124732971191, -15.188248634338379, -14.518373489379883, -13.84849739074707, -13.178622245788574, -12.508747100830078, -11.838871002197266, -11.168994903564453, -10.499119758605957, -9.829243659973145, -9.159368515014648, -8.489492416381836, -7.81961727142334, -7.149742126464844, -6.4798665046691895, -5.809990882873535, -5.140115261077881, -4.470239639282227, -3.8003644943237305, -3.130488872528076, -2.460613250732422, -1.7907381057739258, -1.1208624839782715, -0.4509849548339844, 0.21889054775238037, 0.8887660503387451, 1.5586414337158203, 2.2285170555114746, 2.898392677307129, 3.568267822265625, 4.238143444061279, 4.908019065856934, 5.577894687652588, 6.247770309448242, 6.917645454406738, 7.587521076202393, 8.257396697998047, 8.927271842956543, 9.597146987915039, 10.267023086547852, 10.936898231506348, 11.60677433013916, 12.276649475097656, 12.946525573730469, 13.616400718688965, 14.286275863647461, 14.956151962280273, 15.62602710723877, 16.295902252197266, 16.965778350830078, 17.63565444946289, 18.30552864074707, 18.975404739379883, 19.645278930664062, 20.315155029296875, 20.985031127929688]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 16.0, 13.0, 13.0, 18.0, 24.0, 20.0, 25.0, 22.0, 33.0, 31.0, 34.0, 47.0, 37.0, 44.0, 43.0, 55.0, 53.0, 36.0, 42.0, 52.0, 39.0, 38.0, 28.0, 24.0, 36.0, 21.0, 21.0, 19.0, 18.0, 15.0, 11.0, 7.0, 10.0, 5.0, 8.0, 12.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.095703125, -3.002593994140625, -2.90948486328125, -2.816375732421875, -2.7232666015625, -2.630157470703125, -2.53704833984375, -2.443939208984375, -2.350830078125, -2.257720947265625, -2.16461181640625, -2.071502685546875, -1.9783935546875, -1.885284423828125, -1.79217529296875, -1.699066162109375, -1.60595703125, -1.512847900390625, -1.41973876953125, -1.326629638671875, -1.2335205078125, -1.140411376953125, -1.04730224609375, -0.954193115234375, -0.861083984375, -0.767974853515625, -0.67486572265625, -0.581756591796875, -0.4886474609375, -0.395538330078125, -0.30242919921875, -0.209320068359375, -0.1162109375, -0.023101806640625, 0.07000732421875, 0.163116455078125, 0.2562255859375, 0.349334716796875, 0.44244384765625, 0.535552978515625, 0.628662109375, 0.721771240234375, 0.81488037109375, 0.907989501953125, 1.0010986328125, 1.094207763671875, 1.18731689453125, 1.280426025390625, 1.37353515625, 1.466644287109375, 1.55975341796875, 1.652862548828125, 1.7459716796875, 1.839080810546875, 1.93218994140625, 2.025299072265625, 2.118408203125, 2.211517333984375, 2.30462646484375, 2.397735595703125, 2.4908447265625, 2.583953857421875, 2.67706298828125, 2.770172119140625, 2.86328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 11.0, 26.0, 32.0, 53.0, 81.0, 113.0, 147.0, 237.0, 332.0, 550.0, 867.0, 1486.0, 2600.0, 4608.0, 8473.0, 16960.0, 38347.0, 130966.0, 1106509.0, 2452063.0, 317416.0, 60328.0, 24414.0, 11817.0, 6306.0, 3623.0, 2091.0, 1292.0, 799.0, 523.0, 357.0, 234.0, 162.0, 103.0, 89.0, 65.0, 38.0, 37.0, 23.0, 17.0, 14.0, 12.0, 7.0, 9.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.4609375, -6.24725341796875, -6.0335693359375, -5.81988525390625, -5.606201171875, -5.39251708984375, -5.1788330078125, -4.96514892578125, -4.75146484375, -4.53778076171875, -4.3240966796875, -4.11041259765625, -3.896728515625, -3.68304443359375, -3.4693603515625, -3.25567626953125, -3.0419921875, -2.82830810546875, -2.6146240234375, -2.40093994140625, -2.187255859375, -1.97357177734375, -1.7598876953125, -1.54620361328125, -1.33251953125, -1.11883544921875, -0.9051513671875, -0.69146728515625, -0.477783203125, -0.26409912109375, -0.0504150390625, 0.16326904296875, 0.376953125, 0.59063720703125, 0.8043212890625, 1.01800537109375, 1.231689453125, 1.44537353515625, 1.6590576171875, 1.87274169921875, 2.08642578125, 2.30010986328125, 2.5137939453125, 2.72747802734375, 2.941162109375, 3.15484619140625, 3.3685302734375, 3.58221435546875, 3.7958984375, 4.00958251953125, 4.2232666015625, 4.43695068359375, 4.650634765625, 4.86431884765625, 5.0780029296875, 5.29168701171875, 5.50537109375, 5.71905517578125, 5.9327392578125, 6.14642333984375, 6.360107421875, 6.57379150390625, 6.7874755859375, 7.00115966796875, 7.21484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 16.0, 13.0, 14.0, 33.0, 37.0, 68.0, 73.0, 93.0, 155.0, 261.0, 467.0, 789.0, 801.0, 464.0, 225.0, 148.0, 115.0, 74.0, 55.0, 33.0, 27.0, 22.0, 12.0, 18.0, 8.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6953125, -9.41796875, -9.140625, -8.86328125, -8.5859375, -8.30859375, -8.03125, -7.75390625, -7.4765625, -7.19921875, -6.921875, -6.64453125, -6.3671875, -6.08984375, -5.8125, -5.53515625, -5.2578125, -4.98046875, -4.703125, -4.42578125, -4.1484375, -3.87109375, -3.59375, -3.31640625, -3.0390625, -2.76171875, -2.484375, -2.20703125, -1.9296875, -1.65234375, -1.375, -1.09765625, -0.8203125, -0.54296875, -0.265625, 0.01171875, 0.2890625, 0.56640625, 0.84375, 1.12109375, 1.3984375, 1.67578125, 1.953125, 2.23046875, 2.5078125, 2.78515625, 3.0625, 3.33984375, 3.6171875, 3.89453125, 4.171875, 4.44921875, 4.7265625, 5.00390625, 5.28125, 5.55859375, 5.8359375, 6.11328125, 6.390625, 6.66796875, 6.9453125, 7.22265625, 7.5, 7.77734375, 8.0546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 10.0, 24.0, 33.0, 45.0, 99.0, 129.0, 320.0, 751.0, 1812.0, 6095.0, 26018.0, 193031.0, 3549601.0, 365341.0, 38623.0, 8179.0, 2412.0, 876.0, 421.0, 184.0, 94.0, 54.0, 36.0, 20.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.01904296875, -16.4443359375, -15.86962890625, -15.294921875, -14.72021484375, -14.1455078125, -13.57080078125, -12.99609375, -12.42138671875, -11.8466796875, -11.27197265625, -10.697265625, -10.12255859375, -9.5478515625, -8.97314453125, -8.3984375, -7.82373046875, -7.2490234375, -6.67431640625, -6.099609375, -5.52490234375, -4.9501953125, -4.37548828125, -3.80078125, -3.22607421875, -2.6513671875, -2.07666015625, -1.501953125, -0.92724609375, -0.3525390625, 0.22216796875, 0.796875, 1.37158203125, 1.9462890625, 2.52099609375, 3.095703125, 3.67041015625, 4.2451171875, 4.81982421875, 5.39453125, 5.96923828125, 6.5439453125, 7.11865234375, 7.693359375, 8.26806640625, 8.8427734375, 9.41748046875, 9.9921875, 10.56689453125, 11.1416015625, 11.71630859375, 12.291015625, 12.86572265625, 13.4404296875, 14.01513671875, 14.58984375, 15.16455078125, 15.7392578125, 16.31396484375, 16.888671875, 17.46337890625, 18.0380859375, 18.61279296875, 19.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 23.0, 17.0, 35.0, 53.0, 93.0, 120.0, 140.0, 125.0, 131.0, 87.0, 48.0, 49.0, 20.0, 15.0, 11.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.46260070800781, -40.11937713623047, -38.776153564453125, -37.43292999267578, -36.08970642089844, -34.74648666381836, -33.403263092041016, -32.06003952026367, -30.716815948486328, -29.373592376708984, -28.03036880493164, -26.68714714050293, -25.343923568725586, -24.000699996948242, -22.65747833251953, -21.314254760742188, -19.971031188964844, -18.6278076171875, -17.284584045410156, -15.941362380981445, -14.598138809204102, -13.254915237426758, -11.91169261932373, -10.568470001220703, -9.22524642944336, -7.882023334503174, -6.538800239562988, -5.195577144622803, -3.852354049682617, -2.5091309547424316, -1.165907859802246, 0.17731475830078125, 1.520538330078125, 2.8637614250183105, 4.206984519958496, 5.550207614898682, 6.893430709838867, 8.236654281616211, 9.579876899719238, 10.923099517822266, 12.26632308959961, 13.609546661376953, 14.95276927947998, 16.295991897583008, 17.63921546936035, 18.982439041137695, 20.325660705566406, 21.66888427734375, 23.012107849121094, 24.355331420898438, 25.69855499267578, 27.041776657104492, 28.385000228881836, 29.72822380065918, 31.07144546508789, 32.414669036865234, 33.75789260864258, 35.10111618041992, 36.444339752197266, 37.78756332397461, 39.13078308105469, 40.47400665283203, 41.817230224609375, 43.16045379638672, 44.50367736816406]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 13.0, 9.0, 11.0, 17.0, 19.0, 23.0, 17.0, 34.0, 36.0, 35.0, 45.0, 35.0, 40.0, 39.0, 42.0, 54.0, 43.0, 42.0, 50.0, 40.0, 43.0, 38.0, 39.0, 32.0, 24.0, 18.0, 26.0, 22.0, 17.0, 21.0, 12.0, 13.0, 9.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.348052978515625, -27.520893096923828, -26.6937313079834, -25.8665714263916, -25.039409637451172, -24.212249755859375, -23.385089874267578, -22.55792808532715, -21.73076629638672, -20.903606414794922, -20.076444625854492, -19.249284744262695, -18.422122955322266, -17.59496307373047, -16.767803192138672, -15.940641403198242, -15.113481521606445, -14.286320686340332, -13.459159851074219, -12.631999969482422, -11.804838180541992, -10.977678298950195, -10.150517463684082, -9.323356628417969, -8.496195793151855, -7.669034957885742, -6.841874122619629, -6.014713764190674, -5.1875529289245605, -4.360392093658447, -3.533231735229492, -2.706070899963379, -1.8789100646972656, -1.051749348640442, -0.22458863258361816, 0.602571964263916, 1.4297327995300293, 2.2568936347961426, 3.0840539932250977, 3.911214828491211, 4.738375663757324, 5.5655364990234375, 6.392697334289551, 7.219857692718506, 8.047018051147461, 8.87417984008789, 9.701339721679688, 10.5285005569458, 11.355661392211914, 12.182822227478027, 13.00998306274414, 13.837142944335938, 14.664304733276367, 15.491464614868164, 16.318626403808594, 17.14578628540039, 17.972946166992188, 18.800106048583984, 19.627267837524414, 20.45442771911621, 21.28158950805664, 22.108749389648438, 22.935909271240234, 23.763071060180664, 24.590232849121094]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 11.0, 8.0, 20.0, 17.0, 24.0, 15.0, 21.0, 27.0, 33.0, 34.0, 38.0, 35.0, 36.0, 50.0, 41.0, 60.0, 55.0, 43.0, 41.0, 53.0, 38.0, 44.0, 39.0, 33.0, 30.0, 23.0, 18.0, 22.0, 14.0, 10.0, 16.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.79058837890625, -2.6925048828125, -2.59442138671875, -2.496337890625, -2.39825439453125, -2.3001708984375, -2.20208740234375, -2.10400390625, -2.00592041015625, -1.9078369140625, -1.80975341796875, -1.711669921875, -1.61358642578125, -1.5155029296875, -1.41741943359375, -1.3193359375, -1.22125244140625, -1.1231689453125, -1.02508544921875, -0.927001953125, -0.82891845703125, -0.7308349609375, -0.63275146484375, -0.53466796875, -0.43658447265625, -0.3385009765625, -0.24041748046875, -0.142333984375, -0.04425048828125, 0.0538330078125, 0.15191650390625, 0.25, 0.34808349609375, 0.4461669921875, 0.54425048828125, 0.642333984375, 0.74041748046875, 0.8385009765625, 0.93658447265625, 1.03466796875, 1.13275146484375, 1.2308349609375, 1.32891845703125, 1.427001953125, 1.52508544921875, 1.6231689453125, 1.72125244140625, 1.8193359375, 1.91741943359375, 2.0155029296875, 2.11358642578125, 2.211669921875, 2.30975341796875, 2.4078369140625, 2.50592041015625, 2.60400390625, 2.70208740234375, 2.8001708984375, 2.89825439453125, 2.996337890625, 3.09442138671875, 3.1925048828125, 3.29058837890625, 3.388671875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 9.0, 14.0, 13.0, 10.0, 20.0, 27.0, 43.0, 56.0, 81.0, 109.0, 120.0, 202.0, 281.0, 347.0, 509.0, 754.0, 1079.0, 1412.0, 2122.0, 3086.0, 4710.0, 7170.0, 11399.0, 19182.0, 33769.0, 70879.0, 296425.0, 417817.0, 82412.0, 37907.0, 20442.0, 12356.0, 7667.0, 5030.0, 3348.0, 2303.0, 1494.0, 1129.0, 802.0, 552.0, 403.0, 313.0, 205.0, 144.0, 107.0, 83.0, 51.0, 46.0, 35.0, 26.0, 19.0, 13.0, 11.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.203125, -4.06341552734375, -3.9237060546875, -3.78399658203125, -3.644287109375, -3.50457763671875, -3.3648681640625, -3.22515869140625, -3.08544921875, -2.94573974609375, -2.8060302734375, -2.66632080078125, -2.526611328125, -2.38690185546875, -2.2471923828125, -2.10748291015625, -1.9677734375, -1.82806396484375, -1.6883544921875, -1.54864501953125, -1.408935546875, -1.26922607421875, -1.1295166015625, -0.98980712890625, -0.85009765625, -0.71038818359375, -0.5706787109375, -0.43096923828125, -0.291259765625, -0.15155029296875, -0.0118408203125, 0.12786865234375, 0.267578125, 0.40728759765625, 0.5469970703125, 0.68670654296875, 0.826416015625, 0.96612548828125, 1.1058349609375, 1.24554443359375, 1.38525390625, 1.52496337890625, 1.6646728515625, 1.80438232421875, 1.944091796875, 2.08380126953125, 2.2235107421875, 2.36322021484375, 2.5029296875, 2.64263916015625, 2.7823486328125, 2.92205810546875, 3.061767578125, 3.20147705078125, 3.3411865234375, 3.48089599609375, 3.62060546875, 3.76031494140625, 3.9000244140625, 4.03973388671875, 4.179443359375, 4.31915283203125, 4.4588623046875, 4.59857177734375, 4.73828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 4.0, 3.0, 12.0, 19.0, 14.0, 17.0, 27.0, 23.0, 18.0, 17.0, 30.0, 44.0, 47.0, 37.0, 48.0, 52.0, 38.0, 56.0, 1067.0, 36.0, 53.0, 25.0, 42.0, 39.0, 31.0, 29.0, 24.0, 27.0, 30.0, 16.0, 14.0, 13.0, 10.0, 7.0, 13.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.333984375, -2.256988525390625, -2.17999267578125, -2.102996826171875, -2.0260009765625, -1.949005126953125, -1.87200927734375, -1.795013427734375, -1.718017578125, -1.641021728515625, -1.56402587890625, -1.487030029296875, -1.4100341796875, -1.333038330078125, -1.25604248046875, -1.179046630859375, -1.10205078125, -1.025054931640625, -0.94805908203125, -0.871063232421875, -0.7940673828125, -0.717071533203125, -0.64007568359375, -0.563079833984375, -0.486083984375, -0.409088134765625, -0.33209228515625, -0.255096435546875, -0.1781005859375, -0.101104736328125, -0.02410888671875, 0.052886962890625, 0.1298828125, 0.206878662109375, 0.28387451171875, 0.360870361328125, 0.4378662109375, 0.514862060546875, 0.59185791015625, 0.668853759765625, 0.745849609375, 0.822845458984375, 0.89984130859375, 0.976837158203125, 1.0538330078125, 1.130828857421875, 1.20782470703125, 1.284820556640625, 1.36181640625, 1.438812255859375, 1.51580810546875, 1.592803955078125, 1.6697998046875, 1.746795654296875, 1.82379150390625, 1.900787353515625, 1.977783203125, 2.054779052734375, 2.13177490234375, 2.208770751953125, 2.2857666015625, 2.362762451171875, 2.43975830078125, 2.516754150390625, 2.59375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 4.0, 5.0, 11.0, 22.0, 20.0, 38.0, 55.0, 70.0, 99.0, 161.0, 230.0, 337.0, 476.0, 754.0, 1192.0, 1908.0, 3155.0, 5493.0, 10518.0, 22086.0, 65521.0, 1396340.0, 496896.0, 50520.0, 18925.0, 9252.0, 5068.0, 2924.0, 1766.0, 1114.0, 706.0, 472.0, 283.0, 238.0, 152.0, 74.0, 81.0, 57.0, 31.0, 24.0, 20.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.546875, -5.39239501953125, -5.2379150390625, -5.08343505859375, -4.928955078125, -4.77447509765625, -4.6199951171875, -4.46551513671875, -4.31103515625, -4.15655517578125, -4.0020751953125, -3.84759521484375, -3.693115234375, -3.53863525390625, -3.3841552734375, -3.22967529296875, -3.0751953125, -2.92071533203125, -2.7662353515625, -2.61175537109375, -2.457275390625, -2.30279541015625, -2.1483154296875, -1.99383544921875, -1.83935546875, -1.68487548828125, -1.5303955078125, -1.37591552734375, -1.221435546875, -1.06695556640625, -0.9124755859375, -0.75799560546875, -0.603515625, -0.44903564453125, -0.2945556640625, -0.14007568359375, 0.014404296875, 0.16888427734375, 0.3233642578125, 0.47784423828125, 0.63232421875, 0.78680419921875, 0.9412841796875, 1.09576416015625, 1.250244140625, 1.40472412109375, 1.5592041015625, 1.71368408203125, 1.8681640625, 2.02264404296875, 2.1771240234375, 2.33160400390625, 2.486083984375, 2.64056396484375, 2.7950439453125, 2.94952392578125, 3.10400390625, 3.25848388671875, 3.4129638671875, 3.56744384765625, 3.721923828125, 3.87640380859375, 4.0308837890625, 4.18536376953125, 4.33984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 5.0, 11.0, 29.0, 93.0, 264.0, 382.0, 117.0, 41.0, 12.0, 7.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.923828125, -1.85784912109375, -1.7918701171875, -1.72589111328125, -1.659912109375, -1.59393310546875, -1.5279541015625, -1.46197509765625, -1.39599609375, -1.33001708984375, -1.2640380859375, -1.19805908203125, -1.132080078125, -1.06610107421875, -1.0001220703125, -0.93414306640625, -0.8681640625, -0.80218505859375, -0.7362060546875, -0.67022705078125, -0.604248046875, -0.53826904296875, -0.4722900390625, -0.40631103515625, -0.34033203125, -0.27435302734375, -0.2083740234375, -0.14239501953125, -0.076416015625, -0.01043701171875, 0.0555419921875, 0.12152099609375, 0.1875, 0.25347900390625, 0.3194580078125, 0.38543701171875, 0.451416015625, 0.51739501953125, 0.5833740234375, 0.64935302734375, 0.71533203125, 0.78131103515625, 0.8472900390625, 0.91326904296875, 0.979248046875, 1.04522705078125, 1.1112060546875, 1.17718505859375, 1.2431640625, 1.30914306640625, 1.3751220703125, 1.44110107421875, 1.507080078125, 1.57305908203125, 1.6390380859375, 1.70501708984375, 1.77099609375, 1.83697509765625, 1.9029541015625, 1.96893310546875, 2.034912109375, 2.10089111328125, 2.1668701171875, 2.23284912109375, 2.298828125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 11.0, 19.0, 22.0, 67.0, 288.0, 2357.0, 1013239.0, 31074.0, 1174.0, 188.0, 33.0, 18.0, 15.0, 13.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.375, -42.13037109375, -40.8857421875, -39.64111328125, -38.396484375, -37.15185546875, -35.9072265625, -34.66259765625, -33.41796875, -32.17333984375, -30.9287109375, -29.68408203125, -28.439453125, -27.19482421875, -25.9501953125, -24.70556640625, -23.4609375, -22.21630859375, -20.9716796875, -19.72705078125, -18.482421875, -17.23779296875, -15.9931640625, -14.74853515625, -13.50390625, -12.25927734375, -11.0146484375, -9.77001953125, -8.525390625, -7.28076171875, -6.0361328125, -4.79150390625, -3.546875, -2.30224609375, -1.0576171875, 0.18701171875, 1.431640625, 2.67626953125, 3.9208984375, 5.16552734375, 6.41015625, 7.65478515625, 8.8994140625, 10.14404296875, 11.388671875, 12.63330078125, 13.8779296875, 15.12255859375, 16.3671875, 17.61181640625, 18.8564453125, 20.10107421875, 21.345703125, 22.59033203125, 23.8349609375, 25.07958984375, 26.32421875, 27.56884765625, 28.8134765625, 30.05810546875, 31.302734375, 32.54736328125, 33.7919921875, 35.03662109375, 36.28125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 12.0, 20.0, 24.0, 39.0, 62.0, 140.0, 210.0, 216.0, 115.0, 52.0, 33.0, 28.0, 10.0, 7.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7362329959869385, -3.644993305206299, -3.55375337600708, -3.4625136852264404, -3.3712737560272217, -3.280034065246582, -3.1887941360473633, -3.0975544452667236, -3.006314754486084, -2.9150750637054443, -2.8238351345062256, -2.732595443725586, -2.641355514526367, -2.5501158237457275, -2.458876132965088, -2.367636203765869, -2.2763962745666504, -2.1851565837860107, -2.093916654586792, -2.0026769638061523, -1.9114370346069336, -1.820197343826294, -1.7289575338363647, -1.6377177238464355, -1.5464779138565063, -1.4552381038665771, -1.363998293876648, -1.2727584838867188, -1.181518793106079, -1.0902788639068604, -0.9990391731262207, -0.9077993631362915, -0.8165597915649414, -0.7253199815750122, -0.634080171585083, -0.5428404211997986, -0.4516006112098694, -0.3603608012199402, -0.26912105083465576, -0.17788124084472656, -0.08664143085479736, 0.004598364233970642, 0.09583815932273865, 0.18707793951034546, 0.27831774950027466, 0.36955755949020386, 0.4607973098754883, 0.5520371198654175, 0.6432769298553467, 0.7345167398452759, 0.8257565498352051, 0.9169963002204895, 1.0082361698150635, 1.0994758605957031, 1.1907156705856323, 1.2819554805755615, 1.3731952905654907, 1.46443510055542, 1.5556749105453491, 1.6469147205352783, 1.738154411315918, 1.8293943405151367, 1.9206340312957764, 2.011873722076416, 2.1031136512756348]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 12.0, 16.0, 18.0, 28.0, 13.0, 25.0, 31.0, 25.0, 38.0, 27.0, 39.0, 35.0, 41.0, 35.0, 37.0, 37.0, 37.0, 43.0, 34.0, 46.0, 45.0, 23.0, 36.0, 31.0, 20.0, 27.0, 20.0, 18.0, 18.0, 18.0, 17.0, 9.0, 3.0, 10.0, 8.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1061121225357056, -1.0673414468765259, -1.0285708904266357, -0.989800214767456, -0.9510295391082764, -0.9122588634490967, -0.8734882473945618, -0.8347176313400269, -0.7959469556808472, -0.7571762800216675, -0.7184056639671326, -0.6796350479125977, -0.640864372253418, -0.6020936965942383, -0.5633230805397034, -0.5245524644851685, -0.48578178882598877, -0.44701114296913147, -0.40824049711227417, -0.36946985125541687, -0.33069920539855957, -0.29192855954170227, -0.25315791368484497, -0.21438726782798767, -0.17561662197113037, -0.13684597611427307, -0.09807533025741577, -0.05930468440055847, -0.020534038543701172, 0.018236607313156128, 0.05700725317001343, 0.09577789902687073, 0.13454842567443848, 0.17331907153129578, 0.21208971738815308, 0.2508603632450104, 0.2896310091018677, 0.328401654958725, 0.3671723008155823, 0.4059429466724396, 0.4447135925292969, 0.4834842383861542, 0.5222548842430115, 0.5610255002975464, 0.5997961759567261, 0.6385668516159058, 0.6773374676704407, 0.7161080837249756, 0.7548787593841553, 0.793649435043335, 0.8324200510978699, 0.8711906671524048, 0.9099613428115845, 0.9487320184707642, 0.9875026345252991, 1.026273250579834, 1.0650439262390137, 1.1038146018981934, 1.142585277557373, 1.1813558340072632, 1.2201265096664429, 1.2588971853256226, 1.2976677417755127, 1.3364384174346924, 1.375209093093872]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 1.0, 6.0, 7.0, 11.0, 15.0, 21.0, 21.0, 19.0, 27.0, 27.0, 27.0, 41.0, 38.0, 34.0, 33.0, 46.0, 39.0, 36.0, 51.0, 43.0, 54.0, 48.0, 42.0, 34.0, 46.0, 30.0, 37.0, 32.0, 22.0, 15.0, 16.0, 18.0, 12.0, 5.0, 4.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -2.994903564453125, -2.89996337890625, -2.805023193359375, -2.7100830078125, -2.615142822265625, -2.52020263671875, -2.425262451171875, -2.330322265625, -2.235382080078125, -2.14044189453125, -2.045501708984375, -1.9505615234375, -1.855621337890625, -1.76068115234375, -1.665740966796875, -1.57080078125, -1.475860595703125, -1.38092041015625, -1.285980224609375, -1.1910400390625, -1.096099853515625, -1.00115966796875, -0.906219482421875, -0.811279296875, -0.716339111328125, -0.62139892578125, -0.526458740234375, -0.4315185546875, -0.336578369140625, -0.24163818359375, -0.146697998046875, -0.0517578125, 0.043182373046875, 0.13812255859375, 0.233062744140625, 0.3280029296875, 0.422943115234375, 0.51788330078125, 0.612823486328125, 0.707763671875, 0.802703857421875, 0.89764404296875, 0.992584228515625, 1.0875244140625, 1.182464599609375, 1.27740478515625, 1.372344970703125, 1.46728515625, 1.562225341796875, 1.65716552734375, 1.752105712890625, 1.8470458984375, 1.941986083984375, 2.03692626953125, 2.131866455078125, 2.226806640625, 2.321746826171875, 2.41668701171875, 2.511627197265625, 2.6065673828125, 2.701507568359375, 2.79644775390625, 2.891387939453125, 2.986328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 16.0, 13.0, 20.0, 31.0, 38.0, 56.0, 72.0, 88.0, 150.0, 195.0, 296.0, 450.0, 668.0, 1083.0, 1888.0, 3350.0, 6361.0, 13076.0, 30335.0, 88294.0, 455232.0, 324358.0, 71486.0, 25855.0, 11640.0, 5749.0, 3004.0, 1699.0, 1050.0, 615.0, 387.0, 286.0, 191.0, 147.0, 108.0, 83.0, 44.0, 32.0, 27.0, 16.0, 13.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-5.60546875, -5.440185546875, -5.27490234375, -5.109619140625, -4.9443359375, -4.779052734375, -4.61376953125, -4.448486328125, -4.283203125, -4.117919921875, -3.95263671875, -3.787353515625, -3.6220703125, -3.456787109375, -3.29150390625, -3.126220703125, -2.9609375, -2.795654296875, -2.63037109375, -2.465087890625, -2.2998046875, -2.134521484375, -1.96923828125, -1.803955078125, -1.638671875, -1.473388671875, -1.30810546875, -1.142822265625, -0.9775390625, -0.812255859375, -0.64697265625, -0.481689453125, -0.31640625, -0.151123046875, 0.01416015625, 0.179443359375, 0.3447265625, 0.510009765625, 0.67529296875, 0.840576171875, 1.005859375, 1.171142578125, 1.33642578125, 1.501708984375, 1.6669921875, 1.832275390625, 1.99755859375, 2.162841796875, 2.328125, 2.493408203125, 2.65869140625, 2.823974609375, 2.9892578125, 3.154541015625, 3.31982421875, 3.485107421875, 3.650390625, 3.815673828125, 3.98095703125, 4.146240234375, 4.3115234375, 4.476806640625, 4.64208984375, 4.807373046875, 4.97265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 3.0, 13.0, 8.0, 14.0, 13.0, 15.0, 17.0, 21.0, 22.0, 23.0, 23.0, 34.0, 42.0, 44.0, 43.0, 66.0, 77.0, 146.0, 336.0, 1393.0, 143.0, 76.0, 65.0, 43.0, 44.0, 44.0, 43.0, 40.0, 32.0, 27.0, 17.0, 15.0, 21.0, 11.0, 2.0, 10.0, 15.0, 7.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.28125, -8.98193359375, -8.6826171875, -8.38330078125, -8.083984375, -7.78466796875, -7.4853515625, -7.18603515625, -6.88671875, -6.58740234375, -6.2880859375, -5.98876953125, -5.689453125, -5.39013671875, -5.0908203125, -4.79150390625, -4.4921875, -4.19287109375, -3.8935546875, -3.59423828125, -3.294921875, -2.99560546875, -2.6962890625, -2.39697265625, -2.09765625, -1.79833984375, -1.4990234375, -1.19970703125, -0.900390625, -0.60107421875, -0.3017578125, -0.00244140625, 0.296875, 0.59619140625, 0.8955078125, 1.19482421875, 1.494140625, 1.79345703125, 2.0927734375, 2.39208984375, 2.69140625, 2.99072265625, 3.2900390625, 3.58935546875, 3.888671875, 4.18798828125, 4.4873046875, 4.78662109375, 5.0859375, 5.38525390625, 5.6845703125, 5.98388671875, 6.283203125, 6.58251953125, 6.8818359375, 7.18115234375, 7.48046875, 7.77978515625, 8.0791015625, 8.37841796875, 8.677734375, 8.97705078125, 9.2763671875, 9.57568359375, 9.875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 10.0, 16.0, 14.0, 21.0, 38.0, 30.0, 62.0, 88.0, 111.0, 185.0, 343.0, 746.0, 2014.0, 9220.0, 126202.0, 2919810.0, 76425.0, 7107.0, 1737.0, 659.0, 292.0, 175.0, 88.0, 70.0, 63.0, 42.0, 28.0, 24.0, 17.0, 13.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.15673828125, -17.4697265625, -16.78271484375, -16.095703125, -15.40869140625, -14.7216796875, -14.03466796875, -13.34765625, -12.66064453125, -11.9736328125, -11.28662109375, -10.599609375, -9.91259765625, -9.2255859375, -8.53857421875, -7.8515625, -7.16455078125, -6.4775390625, -5.79052734375, -5.103515625, -4.41650390625, -3.7294921875, -3.04248046875, -2.35546875, -1.66845703125, -0.9814453125, -0.29443359375, 0.392578125, 1.07958984375, 1.7666015625, 2.45361328125, 3.140625, 3.82763671875, 4.5146484375, 5.20166015625, 5.888671875, 6.57568359375, 7.2626953125, 7.94970703125, 8.63671875, 9.32373046875, 10.0107421875, 10.69775390625, 11.384765625, 12.07177734375, 12.7587890625, 13.44580078125, 14.1328125, 14.81982421875, 15.5068359375, 16.19384765625, 16.880859375, 17.56787109375, 18.2548828125, 18.94189453125, 19.62890625, 20.31591796875, 21.0029296875, 21.68994140625, 22.376953125, 23.06396484375, 23.7509765625, 24.43798828125, 25.125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 34.0, 769.0, 209.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.653095245361328, -17.30721664428711, -10.961339950561523, -4.6154632568359375, 1.7304153442382812, 8.0762939453125, 14.422168731689453, 20.768047332763672, 27.11392593383789, 33.45980453491211, 39.80567932128906, 46.15155792236328, 52.4974365234375, 58.84331512451172, 65.18919372558594, 71.53506469726562, 77.88095092773438, 84.2268295288086, 90.57270812988281, 96.9185791015625, 103.26446533203125, 109.61033630371094, 115.95621490478516, 122.30209350585938, 128.64796447753906, 134.99383544921875, 141.3397216796875, 147.6855926513672, 154.03147888183594, 160.37734985351562, 166.72323608398438, 173.06910705566406, 179.41497802734375, 185.76084899902344, 192.1067352294922, 198.45260620117188, 204.79849243164062, 211.1443634033203, 217.490234375, 223.83612060546875, 230.1820068359375, 236.5278778076172, 242.87376403808594, 249.21963500976562, 255.56552124023438, 261.9114074707031, 268.25726318359375, 274.6031494140625, 280.94903564453125, 287.294921875, 293.6407775878906, 299.9866638183594, 306.3325500488281, 312.6784362792969, 319.0242919921875, 325.37017822265625, 331.7160339355469, 338.0619201660156, 344.40777587890625, 350.753662109375, 357.09954833984375, 363.4454345703125, 369.7912902832031, 376.1371765136719, 382.4830627441406]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 9.0, 7.0, 12.0, 23.0, 21.0, 23.0, 25.0, 32.0, 35.0, 27.0, 35.0, 34.0, 35.0, 45.0, 50.0, 37.0, 47.0, 39.0, 40.0, 40.0, 39.0, 37.0, 27.0, 46.0, 23.0, 30.0, 30.0, 18.0, 25.0, 19.0, 16.0, 6.0, 7.0, 11.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.468902587890625, -31.489551544189453, -30.51020050048828, -29.53084945678711, -28.551498413085938, -27.572147369384766, -26.592798233032227, -25.613447189331055, -24.634096145629883, -23.65474510192871, -22.67539405822754, -21.696043014526367, -20.716693878173828, -19.737342834472656, -18.757991790771484, -17.778640747070312, -16.79928970336914, -15.819938659667969, -14.840587615966797, -13.861237525939941, -12.88188648223877, -11.902535438537598, -10.923185348510742, -9.94383430480957, -8.964483261108398, -7.985132217407227, -7.005781650543213, -6.026431083679199, -5.047080039978027, -4.0677289962768555, -3.088378429412842, -2.109027862548828, -1.129678726196289, -0.1503279209136963, 0.8290228843688965, 1.8083736896514893, 2.787724494934082, 3.767075538635254, 4.746426105499268, 5.725776672363281, 6.705127716064453, 7.684478759765625, 8.663829803466797, 9.643179893493652, 10.622530937194824, 11.601881980895996, 12.581232070922852, 13.560583114624023, 14.539934158325195, 15.519285202026367, 16.49863624572754, 17.47798728942871, 18.45733642578125, 19.436687469482422, 20.416038513183594, 21.395389556884766, 22.374740600585938, 23.35409164428711, 24.33344268798828, 25.312793731689453, 26.292144775390625, 27.271495819091797, 28.250844955444336, 29.230195999145508, 30.20954704284668]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 7.0, 10.0, 11.0, 14.0, 12.0, 21.0, 23.0, 19.0, 25.0, 21.0, 31.0, 27.0, 29.0, 35.0, 40.0, 31.0, 32.0, 38.0, 45.0, 53.0, 54.0, 39.0, 35.0, 46.0, 28.0, 36.0, 30.0, 28.0, 25.0, 26.0, 25.0, 12.0, 14.0, 14.0, 15.0, 8.0, 14.0, 12.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.91796875, -2.821807861328125, -2.72564697265625, -2.629486083984375, -2.5333251953125, -2.437164306640625, -2.34100341796875, -2.244842529296875, -2.148681640625, -2.052520751953125, -1.95635986328125, -1.860198974609375, -1.7640380859375, -1.667877197265625, -1.57171630859375, -1.475555419921875, -1.37939453125, -1.283233642578125, -1.18707275390625, -1.090911865234375, -0.9947509765625, -0.898590087890625, -0.80242919921875, -0.706268310546875, -0.610107421875, -0.513946533203125, -0.41778564453125, -0.321624755859375, -0.2254638671875, -0.129302978515625, -0.03314208984375, 0.063018798828125, 0.1591796875, 0.255340576171875, 0.35150146484375, 0.447662353515625, 0.5438232421875, 0.639984130859375, 0.73614501953125, 0.832305908203125, 0.928466796875, 1.024627685546875, 1.12078857421875, 1.216949462890625, 1.3131103515625, 1.409271240234375, 1.50543212890625, 1.601593017578125, 1.69775390625, 1.793914794921875, 1.89007568359375, 1.986236572265625, 2.0823974609375, 2.178558349609375, 2.27471923828125, 2.370880126953125, 2.467041015625, 2.563201904296875, 2.65936279296875, 2.755523681640625, 2.8516845703125, 2.947845458984375, 3.04400634765625, 3.140167236328125, 3.236328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 3.0, 7.0, 9.0, 19.0, 25.0, 50.0, 69.0, 88.0, 148.0, 236.0, 324.0, 512.0, 777.0, 1328.0, 2218.0, 3888.0, 7189.0, 13124.0, 26238.0, 61253.0, 262474.0, 1811125.0, 1664721.0, 229785.0, 55583.0, 24292.0, 12325.0, 6724.0, 3719.0, 2227.0, 1390.0, 889.0, 527.0, 331.0, 212.0, 122.0, 112.0, 74.0, 49.0, 35.0, 24.0, 17.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96484375, -5.76580810546875, -5.5667724609375, -5.36773681640625, -5.168701171875, -4.96966552734375, -4.7706298828125, -4.57159423828125, -4.37255859375, -4.17352294921875, -3.9744873046875, -3.77545166015625, -3.576416015625, -3.37738037109375, -3.1783447265625, -2.97930908203125, -2.7802734375, -2.58123779296875, -2.3822021484375, -2.18316650390625, -1.984130859375, -1.78509521484375, -1.5860595703125, -1.38702392578125, -1.18798828125, -0.98895263671875, -0.7899169921875, -0.59088134765625, -0.391845703125, -0.19281005859375, 0.0062255859375, 0.20526123046875, 0.404296875, 0.60333251953125, 0.8023681640625, 1.00140380859375, 1.200439453125, 1.39947509765625, 1.5985107421875, 1.79754638671875, 1.99658203125, 2.19561767578125, 2.3946533203125, 2.59368896484375, 2.792724609375, 2.99176025390625, 3.1907958984375, 3.38983154296875, 3.5888671875, 3.78790283203125, 3.9869384765625, 4.18597412109375, 4.385009765625, 4.58404541015625, 4.7830810546875, 4.98211669921875, 5.18115234375, 5.38018798828125, 5.5792236328125, 5.77825927734375, 5.977294921875, 6.17633056640625, 6.3753662109375, 6.57440185546875, 6.7734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 12.0, 18.0, 26.0, 24.0, 42.0, 38.0, 51.0, 57.0, 94.0, 106.0, 207.0, 360.0, 517.0, 685.0, 590.0, 375.0, 236.0, 155.0, 85.0, 86.0, 51.0, 43.0, 46.0, 31.0, 18.0, 15.0, 15.0, 16.0, 7.0, 6.0, 2.0, 10.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86138916015625, -5.6329345703125, -5.40447998046875, -5.176025390625, -4.94757080078125, -4.7191162109375, -4.49066162109375, -4.26220703125, -4.03375244140625, -3.8052978515625, -3.57684326171875, -3.348388671875, -3.11993408203125, -2.8914794921875, -2.66302490234375, -2.4345703125, -2.20611572265625, -1.9776611328125, -1.74920654296875, -1.520751953125, -1.29229736328125, -1.0638427734375, -0.83538818359375, -0.60693359375, -0.37847900390625, -0.1500244140625, 0.07843017578125, 0.306884765625, 0.53533935546875, 0.7637939453125, 0.99224853515625, 1.220703125, 1.44915771484375, 1.6776123046875, 1.90606689453125, 2.134521484375, 2.36297607421875, 2.5914306640625, 2.81988525390625, 3.04833984375, 3.27679443359375, 3.5052490234375, 3.73370361328125, 3.962158203125, 4.19061279296875, 4.4190673828125, 4.64752197265625, 4.8759765625, 5.10443115234375, 5.3328857421875, 5.56134033203125, 5.789794921875, 6.01824951171875, 6.2467041015625, 6.47515869140625, 6.70361328125, 6.93206787109375, 7.1605224609375, 7.38897705078125, 7.617431640625, 7.84588623046875, 8.0743408203125, 8.30279541015625, 8.53125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 5.0, 1.0, 11.0, 13.0, 15.0, 15.0, 21.0, 32.0, 38.0, 57.0, 73.0, 160.0, 306.0, 952.0, 4114.0, 25760.0, 339750.0, 3681674.0, 123746.0, 13763.0, 2507.0, 611.0, 232.0, 114.0, 74.0, 50.0, 37.0, 37.0, 29.0, 13.0, 11.0, 11.0, 12.0, 3.0, 8.0, 8.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0], "bins": [-27.09375, -26.3681640625, -25.642578125, -24.9169921875, -24.19140625, -23.4658203125, -22.740234375, -22.0146484375, -21.2890625, -20.5634765625, -19.837890625, -19.1123046875, -18.38671875, -17.6611328125, -16.935546875, -16.2099609375, -15.484375, -14.7587890625, -14.033203125, -13.3076171875, -12.58203125, -11.8564453125, -11.130859375, -10.4052734375, -9.6796875, -8.9541015625, -8.228515625, -7.5029296875, -6.77734375, -6.0517578125, -5.326171875, -4.6005859375, -3.875, -3.1494140625, -2.423828125, -1.6982421875, -0.97265625, -0.2470703125, 0.478515625, 1.2041015625, 1.9296875, 2.6552734375, 3.380859375, 4.1064453125, 4.83203125, 5.5576171875, 6.283203125, 7.0087890625, 7.734375, 8.4599609375, 9.185546875, 9.9111328125, 10.63671875, 11.3623046875, 12.087890625, 12.8134765625, 13.5390625, 14.2646484375, 14.990234375, 15.7158203125, 16.44140625, 17.1669921875, 17.892578125, 18.6181640625, 19.34375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 9.0, 14.0, 30.0, 72.0, 97.0, 120.0, 172.0, 179.0, 131.0, 66.0, 47.0, 22.0, 9.0, 12.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.42725372314453, -44.872169494628906, -43.31708526611328, -41.76200485229492, -40.2069206237793, -38.65183639526367, -37.09675598144531, -35.54167175292969, -33.98658752441406, -32.43150329589844, -30.876420974731445, -29.321338653564453, -27.766254425048828, -26.211170196533203, -24.65608787536621, -23.10100555419922, -21.545921325683594, -19.99083709716797, -18.435754776000977, -16.880672454833984, -15.32558822631836, -13.77050495147705, -12.215421676635742, -10.660338401794434, -9.105255126953125, -7.550171852111816, -5.995088577270508, -4.440005302429199, -2.8849220275878906, -1.329838752746582, 0.22524452209472656, 1.7803277969360352, 3.3354110717773438, 4.890494346618652, 6.445577621459961, 8.00066089630127, 9.555744171142578, 11.110827445983887, 12.665910720825195, 14.220993995666504, 15.776077270507812, 17.331161499023438, 18.88624382019043, 20.441326141357422, 21.996410369873047, 23.551494598388672, 25.106576919555664, 26.661659240722656, 28.21674346923828, 29.771827697753906, 31.3269100189209, 32.88199234008789, 34.437076568603516, 35.99216079711914, 37.5472412109375, 39.102325439453125, 40.65740966796875, 42.212493896484375, 43.767578125, 45.32265853881836, 46.877742767333984, 48.43282699584961, 49.98790740966797, 51.542991638183594, 53.09807586669922]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 7.0, 7.0, 11.0, 13.0, 12.0, 15.0, 14.0, 26.0, 26.0, 41.0, 28.0, 36.0, 27.0, 40.0, 46.0, 54.0, 48.0, 46.0, 49.0, 30.0, 43.0, 50.0, 41.0, 40.0, 32.0, 21.0, 17.0, 30.0, 24.0, 16.0, 14.0, 16.0, 15.0, 9.0, 16.0, 5.0, 9.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.067045211791992, -24.29473876953125, -23.522430419921875, -22.750123977661133, -21.97781753540039, -21.20551109313965, -20.433202743530273, -19.66089630126953, -18.88858985900879, -18.116283416748047, -17.343975067138672, -16.57166862487793, -15.799362182617188, -15.027054786682129, -14.25474739074707, -13.482440948486328, -12.71013355255127, -11.937826156616211, -11.165519714355469, -10.39321231842041, -9.620905876159668, -8.84859848022461, -8.076292037963867, -7.303984642028809, -6.531677722930908, -5.759370803833008, -4.987063884735107, -4.214756965637207, -3.4424498081207275, -2.670142889022827, -1.8978357315063477, -1.1255288124084473, -0.3532218933105469, 0.4190850853919983, 1.1913920640945435, 1.9636991024017334, 2.736006021499634, 3.508312940597534, 4.280620098114014, 5.052927017211914, 5.8252339363098145, 6.597540855407715, 7.369847774505615, 8.142154693603516, 8.914462089538574, 9.686768531799316, 10.459075927734375, 11.231382369995117, 12.003689765930176, 12.775997161865234, 13.548303604125977, 14.320611000061035, 15.092917442321777, 15.865224838256836, 16.637531280517578, 17.409839630126953, 18.182146072387695, 18.954452514648438, 19.726760864257812, 20.499067306518555, 21.271373748779297, 22.04368019104004, 22.815988540649414, 23.588294982910156, 24.3606014251709]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 5.0, 6.0, 17.0, 10.0, 15.0, 23.0, 19.0, 26.0, 30.0, 29.0, 27.0, 27.0, 54.0, 41.0, 41.0, 51.0, 45.0, 47.0, 38.0, 42.0, 51.0, 46.0, 35.0, 33.0, 20.0, 37.0, 27.0, 27.0, 16.0, 22.0, 19.0, 15.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.171875, -3.074005126953125, -2.97613525390625, -2.878265380859375, -2.7803955078125, -2.682525634765625, -2.58465576171875, -2.486785888671875, -2.388916015625, -2.291046142578125, -2.19317626953125, -2.095306396484375, -1.9974365234375, -1.899566650390625, -1.80169677734375, -1.703826904296875, -1.60595703125, -1.508087158203125, -1.41021728515625, -1.312347412109375, -1.2144775390625, -1.116607666015625, -1.01873779296875, -0.920867919921875, -0.822998046875, -0.725128173828125, -0.62725830078125, -0.529388427734375, -0.4315185546875, -0.333648681640625, -0.23577880859375, -0.137908935546875, -0.0400390625, 0.057830810546875, 0.15570068359375, 0.253570556640625, 0.3514404296875, 0.449310302734375, 0.54718017578125, 0.645050048828125, 0.742919921875, 0.840789794921875, 0.93865966796875, 1.036529541015625, 1.1343994140625, 1.232269287109375, 1.33013916015625, 1.428009033203125, 1.52587890625, 1.623748779296875, 1.72161865234375, 1.819488525390625, 1.9173583984375, 2.015228271484375, 2.11309814453125, 2.210968017578125, 2.308837890625, 2.406707763671875, 2.50457763671875, 2.602447509765625, 2.7003173828125, 2.798187255859375, 2.89605712890625, 2.993927001953125, 3.091796875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 12.0, 19.0, 17.0, 34.0, 30.0, 58.0, 48.0, 73.0, 111.0, 130.0, 176.0, 262.0, 384.0, 531.0, 732.0, 1053.0, 1446.0, 2225.0, 3469.0, 5939.0, 13468.0, 56814.0, 526579.0, 367296.0, 40773.0, 11307.0, 5430.0, 3244.0, 2006.0, 1451.0, 962.0, 630.0, 479.0, 347.0, 277.0, 203.0, 141.0, 101.0, 72.0, 53.0, 55.0, 29.0, 16.0, 11.0, 17.0, 10.0, 7.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.30078125, -4.17010498046875, -4.0394287109375, -3.90875244140625, -3.778076171875, -3.64739990234375, -3.5167236328125, -3.38604736328125, -3.25537109375, -3.12469482421875, -2.9940185546875, -2.86334228515625, -2.732666015625, -2.60198974609375, -2.4713134765625, -2.34063720703125, -2.2099609375, -2.07928466796875, -1.9486083984375, -1.81793212890625, -1.687255859375, -1.55657958984375, -1.4259033203125, -1.29522705078125, -1.16455078125, -1.03387451171875, -0.9031982421875, -0.77252197265625, -0.641845703125, -0.51116943359375, -0.3804931640625, -0.24981689453125, -0.119140625, 0.01153564453125, 0.1422119140625, 0.27288818359375, 0.403564453125, 0.53424072265625, 0.6649169921875, 0.79559326171875, 0.92626953125, 1.05694580078125, 1.1876220703125, 1.31829833984375, 1.448974609375, 1.57965087890625, 1.7103271484375, 1.84100341796875, 1.9716796875, 2.10235595703125, 2.2330322265625, 2.36370849609375, 2.494384765625, 2.62506103515625, 2.7557373046875, 2.88641357421875, 3.01708984375, 3.14776611328125, 3.2784423828125, 3.40911865234375, 3.539794921875, 3.67047119140625, 3.8011474609375, 3.93182373046875, 4.0625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 16.0, 17.0, 26.0, 20.0, 16.0, 30.0, 42.0, 37.0, 32.0, 29.0, 48.0, 26.0, 31.0, 34.0, 1067.0, 49.0, 39.0, 37.0, 41.0, 36.0, 33.0, 32.0, 29.0, 22.0, 25.0, 18.0, 19.0, 20.0, 19.0, 20.0, 6.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.1060791015625, -2.034423828125, -1.9627685546875, -1.89111328125, -1.8194580078125, -1.747802734375, -1.6761474609375, -1.6044921875, -1.5328369140625, -1.461181640625, -1.3895263671875, -1.31787109375, -1.2462158203125, -1.174560546875, -1.1029052734375, -1.03125, -0.9595947265625, -0.887939453125, -0.8162841796875, -0.74462890625, -0.6729736328125, -0.601318359375, -0.5296630859375, -0.4580078125, -0.3863525390625, -0.314697265625, -0.2430419921875, -0.17138671875, -0.0997314453125, -0.028076171875, 0.0435791015625, 0.115234375, 0.1868896484375, 0.258544921875, 0.3302001953125, 0.40185546875, 0.4735107421875, 0.545166015625, 0.6168212890625, 0.6884765625, 0.7601318359375, 0.831787109375, 0.9034423828125, 0.97509765625, 1.0467529296875, 1.118408203125, 1.1900634765625, 1.26171875, 1.3333740234375, 1.405029296875, 1.4766845703125, 1.54833984375, 1.6199951171875, 1.691650390625, 1.7633056640625, 1.8349609375, 1.9066162109375, 1.978271484375, 2.0499267578125, 2.12158203125, 2.1932373046875, 2.264892578125, 2.3365478515625, 2.408203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 7.0, 7.0, 9.0, 6.0, 19.0, 19.0, 20.0, 27.0, 48.0, 40.0, 72.0, 89.0, 109.0, 164.0, 207.0, 262.0, 363.0, 516.0, 735.0, 1191.0, 2089.0, 4056.0, 11325.0, 85587.0, 1878081.0, 89849.0, 11968.0, 4229.0, 2040.0, 1218.0, 770.0, 541.0, 382.0, 248.0, 187.0, 160.0, 112.0, 103.0, 53.0, 59.0, 43.0, 27.0, 29.0, 18.0, 18.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-3.974609375, -3.855987548828125, -3.73736572265625, -3.618743896484375, -3.5001220703125, -3.381500244140625, -3.26287841796875, -3.144256591796875, -3.025634765625, -2.907012939453125, -2.78839111328125, -2.669769287109375, -2.5511474609375, -2.432525634765625, -2.31390380859375, -2.195281982421875, -2.07666015625, -1.958038330078125, -1.83941650390625, -1.720794677734375, -1.6021728515625, -1.483551025390625, -1.36492919921875, -1.246307373046875, -1.127685546875, -1.009063720703125, -0.89044189453125, -0.771820068359375, -0.6531982421875, -0.534576416015625, -0.41595458984375, -0.297332763671875, -0.1787109375, -0.060089111328125, 0.05853271484375, 0.177154541015625, 0.2957763671875, 0.414398193359375, 0.53302001953125, 0.651641845703125, 0.770263671875, 0.888885498046875, 1.00750732421875, 1.126129150390625, 1.2447509765625, 1.363372802734375, 1.48199462890625, 1.600616455078125, 1.71923828125, 1.837860107421875, 1.95648193359375, 2.075103759765625, 2.1937255859375, 2.312347412109375, 2.43096923828125, 2.549591064453125, 2.668212890625, 2.786834716796875, 2.90545654296875, 3.024078369140625, 3.1427001953125, 3.261322021484375, 3.37994384765625, 3.498565673828125, 3.6171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 15.0, 17.0, 10.0, 32.0, 40.0, 78.0, 132.0, 155.0, 146.0, 101.0, 77.0, 49.0, 25.0, 27.0, 21.0, 7.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.45072174072265625, -0.4365997314453125, -0.42247772216796875, -0.408355712890625, -0.39423370361328125, -0.3801116943359375, -0.36598968505859375, -0.35186767578125, -0.33774566650390625, -0.3236236572265625, -0.30950164794921875, -0.295379638671875, -0.28125762939453125, -0.2671356201171875, -0.25301361083984375, -0.2388916015625, -0.22476959228515625, -0.2106475830078125, -0.19652557373046875, -0.182403564453125, -0.16828155517578125, -0.1541595458984375, -0.14003753662109375, -0.12591552734375, -0.11179351806640625, -0.0976715087890625, -0.08354949951171875, -0.069427490234375, -0.05530548095703125, -0.0411834716796875, -0.02706146240234375, -0.012939453125, 0.00118255615234375, 0.0153045654296875, 0.02942657470703125, 0.043548583984375, 0.05767059326171875, 0.0717926025390625, 0.08591461181640625, 0.10003662109375, 0.11415863037109375, 0.1282806396484375, 0.14240264892578125, 0.156524658203125, 0.17064666748046875, 0.1847686767578125, 0.19889068603515625, 0.2130126953125, 0.22713470458984375, 0.2412567138671875, 0.25537872314453125, 0.269500732421875, 0.28362274169921875, 0.2977447509765625, 0.31186676025390625, 0.32598876953125, 0.34011077880859375, 0.3542327880859375, 0.36835479736328125, 0.382476806640625, 0.39659881591796875, 0.4107208251953125, 0.42484283447265625, 0.43896484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 13.0, 30.0, 34.0, 56.0, 111.0, 378.0, 3271.0, 188902.0, 850654.0, 4317.0, 480.0, 103.0, 56.0, 36.0, 21.0, 23.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.73291015625, -8.4423828125, -8.15185546875, -7.861328125, -7.57080078125, -7.2802734375, -6.98974609375, -6.69921875, -6.40869140625, -6.1181640625, -5.82763671875, -5.537109375, -5.24658203125, -4.9560546875, -4.66552734375, -4.375, -4.08447265625, -3.7939453125, -3.50341796875, -3.212890625, -2.92236328125, -2.6318359375, -2.34130859375, -2.05078125, -1.76025390625, -1.4697265625, -1.17919921875, -0.888671875, -0.59814453125, -0.3076171875, -0.01708984375, 0.2734375, 0.56396484375, 0.8544921875, 1.14501953125, 1.435546875, 1.72607421875, 2.0166015625, 2.30712890625, 2.59765625, 2.88818359375, 3.1787109375, 3.46923828125, 3.759765625, 4.05029296875, 4.3408203125, 4.63134765625, 4.921875, 5.21240234375, 5.5029296875, 5.79345703125, 6.083984375, 6.37451171875, 6.6650390625, 6.95556640625, 7.24609375, 7.53662109375, 7.8271484375, 8.11767578125, 8.408203125, 8.69873046875, 8.9892578125, 9.27978515625, 9.5703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 6.0, 7.0, 22.0, 51.0, 93.0, 178.0, 264.0, 224.0, 85.0, 41.0, 20.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4520385265350342, -0.4051550328731537, -0.3582715392112732, -0.3113880455493927, -0.2645045518875122, -0.2176210582256317, -0.17073756456375122, -0.12385407090187073, -0.07697057723999023, -0.03008708357810974, 0.016796410083770752, 0.06367990374565125, 0.11056339740753174, 0.15744689106941223, 0.20433038473129272, 0.2512138783931732, 0.2980973720550537, 0.3449808657169342, 0.3918643593788147, 0.4387478530406952, 0.4856313467025757, 0.5325148105621338, 0.5793983340263367, 0.6262818574905396, 0.6731653213500977, 0.7200487852096558, 0.7669323086738586, 0.8138158321380615, 0.8606992959976196, 0.9075827598571777, 0.9544662833213806, 1.0013498067855835, 1.0482332706451416, 1.0951167345046997, 1.1420001983642578, 1.1888837814331055, 1.2357672452926636, 1.2826507091522217, 1.3295342922210693, 1.3764177560806274, 1.4233012199401855, 1.4701846837997437, 1.5170681476593018, 1.5639517307281494, 1.6108351945877075, 1.6577186584472656, 1.7046022415161133, 1.7514857053756714, 1.7983691692352295, 1.8452526330947876, 1.8921360969543457, 1.9390196800231934, 1.9859031438827515, 2.0327866077423096, 2.0796701908111572, 2.126553535461426, 2.1734371185302734, 2.220320701599121, 2.2672040462493896, 2.3140876293182373, 2.360970973968506, 2.4078545570373535, 2.454738140106201, 2.5016214847564697, 2.5485050678253174]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 7.0, 2.0, 4.0, 4.0, 6.0, 14.0, 12.0, 19.0, 10.0, 18.0, 19.0, 23.0, 27.0, 29.0, 39.0, 42.0, 35.0, 40.0, 43.0, 47.0, 53.0, 55.0, 38.0, 50.0, 39.0, 32.0, 36.0, 27.0, 34.0, 27.0, 32.0, 24.0, 21.0, 18.0, 25.0, 16.0, 11.0, 6.0, 9.0, 9.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432320773601532, -0.4188823699951172, -0.40544393658638, -0.3920055329799652, -0.3785671293735504, -0.36512869596481323, -0.35169029235839844, -0.33825188875198364, -0.32481348514556885, -0.31137508153915405, -0.29793664813041687, -0.2844982445240021, -0.2710598409175873, -0.2576214075088501, -0.2441830039024353, -0.2307446002960205, -0.21730618178844452, -0.20386776328086853, -0.19042935967445374, -0.17699094116687775, -0.16355253756046295, -0.15011411905288696, -0.13667571544647217, -0.12323729693889618, -0.10979888588190079, -0.0963604748249054, -0.08292206376791, -0.06948365271091461, -0.05604523792862892, -0.04260682314634323, -0.02916841208934784, -0.015730001032352448, -0.0022915899753570557, 0.01114682201296091, 0.024585234001278877, 0.03802364692091942, 0.05146205797791481, 0.0649004727602005, 0.07833888381719589, 0.09177729487419128, 0.10521570593118668, 0.11865411698818207, 0.13209253549575806, 0.14553093910217285, 0.15896935760974884, 0.17240777611732483, 0.18584617972373962, 0.19928458333015442, 0.2127230018377304, 0.2261614203453064, 0.2395998239517212, 0.253038227558136, 0.26647666096687317, 0.27991506457328796, 0.29335346817970276, 0.30679190158843994, 0.32023030519485474, 0.33366870880126953, 0.3471071422100067, 0.3605455458164215, 0.3739839494228363, 0.3874223828315735, 0.4008607864379883, 0.4142991900444031, 0.42773759365081787]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 8.0, 8.0, 14.0, 13.0, 17.0, 13.0, 21.0, 21.0, 30.0, 27.0, 34.0, 39.0, 40.0, 41.0, 41.0, 48.0, 52.0, 43.0, 36.0, 50.0, 52.0, 49.0, 38.0, 38.0, 28.0, 37.0, 25.0, 20.0, 18.0, 25.0, 18.0, 5.0, 13.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.101531982421875, -2.99993896484375, -2.898345947265625, -2.7967529296875, -2.695159912109375, -2.59356689453125, -2.491973876953125, -2.390380859375, -2.288787841796875, -2.18719482421875, -2.085601806640625, -1.9840087890625, -1.882415771484375, -1.78082275390625, -1.679229736328125, -1.57763671875, -1.476043701171875, -1.37445068359375, -1.272857666015625, -1.1712646484375, -1.069671630859375, -0.96807861328125, -0.866485595703125, -0.764892578125, -0.663299560546875, -0.56170654296875, -0.460113525390625, -0.3585205078125, -0.256927490234375, -0.15533447265625, -0.053741455078125, 0.0478515625, 0.149444580078125, 0.25103759765625, 0.352630615234375, 0.4542236328125, 0.555816650390625, 0.65740966796875, 0.759002685546875, 0.860595703125, 0.962188720703125, 1.06378173828125, 1.165374755859375, 1.2669677734375, 1.368560791015625, 1.47015380859375, 1.571746826171875, 1.67333984375, 1.774932861328125, 1.87652587890625, 1.978118896484375, 2.0797119140625, 2.181304931640625, 2.28289794921875, 2.384490966796875, 2.486083984375, 2.587677001953125, 2.68927001953125, 2.790863037109375, 2.8924560546875, 2.994049072265625, 3.09564208984375, 3.197235107421875, 3.298828125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 6.0, 9.0, 9.0, 22.0, 20.0, 41.0, 56.0, 74.0, 90.0, 175.0, 232.0, 284.0, 471.0, 591.0, 900.0, 1295.0, 1934.0, 2830.0, 4508.0, 7087.0, 11979.0, 20823.0, 39538.0, 81988.0, 205175.0, 377068.0, 149504.0, 64158.0, 32093.0, 17405.0, 10104.0, 6228.0, 3778.0, 2568.0, 1674.0, 1174.0, 835.0, 544.0, 364.0, 286.0, 177.0, 138.0, 100.0, 70.0, 56.0, 35.0, 18.0, 18.0, 8.0, 5.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.21484375, -3.112274169921875, -3.00970458984375, -2.907135009765625, -2.8045654296875, -2.701995849609375, -2.59942626953125, -2.496856689453125, -2.394287109375, -2.291717529296875, -2.18914794921875, -2.086578369140625, -1.9840087890625, -1.881439208984375, -1.77886962890625, -1.676300048828125, -1.57373046875, -1.471160888671875, -1.36859130859375, -1.266021728515625, -1.1634521484375, -1.060882568359375, -0.95831298828125, -0.855743408203125, -0.753173828125, -0.650604248046875, -0.54803466796875, -0.445465087890625, -0.3428955078125, -0.240325927734375, -0.13775634765625, -0.035186767578125, 0.0673828125, 0.169952392578125, 0.27252197265625, 0.375091552734375, 0.4776611328125, 0.580230712890625, 0.68280029296875, 0.785369873046875, 0.887939453125, 0.990509033203125, 1.09307861328125, 1.195648193359375, 1.2982177734375, 1.400787353515625, 1.50335693359375, 1.605926513671875, 1.70849609375, 1.811065673828125, 1.91363525390625, 2.016204833984375, 2.1187744140625, 2.221343994140625, 2.32391357421875, 2.426483154296875, 2.529052734375, 2.631622314453125, 2.73419189453125, 2.836761474609375, 2.9393310546875, 3.041900634765625, 3.14447021484375, 3.247039794921875, 3.349609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 11.0, 22.0, 25.0, 14.0, 34.0, 19.0, 35.0, 35.0, 51.0, 56.0, 64.0, 90.0, 184.0, 1389.0, 300.0, 160.0, 110.0, 63.0, 58.0, 50.0, 33.0, 34.0, 25.0, 26.0, 19.0, 21.0, 12.0, 21.0, 10.0, 9.0, 9.0, 9.0, 5.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.34375, -9.998291015625, -9.65283203125, -9.307373046875, -8.9619140625, -8.616455078125, -8.27099609375, -7.925537109375, -7.580078125, -7.234619140625, -6.88916015625, -6.543701171875, -6.1982421875, -5.852783203125, -5.50732421875, -5.161865234375, -4.81640625, -4.470947265625, -4.12548828125, -3.780029296875, -3.4345703125, -3.089111328125, -2.74365234375, -2.398193359375, -2.052734375, -1.707275390625, -1.36181640625, -1.016357421875, -0.6708984375, -0.325439453125, 0.02001953125, 0.365478515625, 0.7109375, 1.056396484375, 1.40185546875, 1.747314453125, 2.0927734375, 2.438232421875, 2.78369140625, 3.129150390625, 3.474609375, 3.820068359375, 4.16552734375, 4.510986328125, 4.8564453125, 5.201904296875, 5.54736328125, 5.892822265625, 6.23828125, 6.583740234375, 6.92919921875, 7.274658203125, 7.6201171875, 7.965576171875, 8.31103515625, 8.656494140625, 9.001953125, 9.347412109375, 9.69287109375, 10.038330078125, 10.3837890625, 10.729248046875, 11.07470703125, 11.420166015625, 11.765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 11.0, 10.0, 13.0, 14.0, 26.0, 10.0, 28.0, 25.0, 42.0, 60.0, 76.0, 95.0, 114.0, 181.0, 242.0, 401.0, 939.0, 2642.0, 11768.0, 119480.0, 2786104.0, 201856.0, 15923.0, 3231.0, 1040.0, 459.0, 265.0, 168.0, 121.0, 89.0, 52.0, 50.0, 39.0, 25.0, 21.0, 18.0, 13.0, 12.0, 12.0, 7.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.28125, -18.7236328125, -18.166015625, -17.6083984375, -17.05078125, -16.4931640625, -15.935546875, -15.3779296875, -14.8203125, -14.2626953125, -13.705078125, -13.1474609375, -12.58984375, -12.0322265625, -11.474609375, -10.9169921875, -10.359375, -9.8017578125, -9.244140625, -8.6865234375, -8.12890625, -7.5712890625, -7.013671875, -6.4560546875, -5.8984375, -5.3408203125, -4.783203125, -4.2255859375, -3.66796875, -3.1103515625, -2.552734375, -1.9951171875, -1.4375, -0.8798828125, -0.322265625, 0.2353515625, 0.79296875, 1.3505859375, 1.908203125, 2.4658203125, 3.0234375, 3.5810546875, 4.138671875, 4.6962890625, 5.25390625, 5.8115234375, 6.369140625, 6.9267578125, 7.484375, 8.0419921875, 8.599609375, 9.1572265625, 9.71484375, 10.2724609375, 10.830078125, 11.3876953125, 11.9453125, 12.5029296875, 13.060546875, 13.6181640625, 14.17578125, 14.7333984375, 15.291015625, 15.8486328125, 16.40625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 618.0, 393.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2069091796875, -579.0357055664062, -568.8645629882812, -558.693359375, -548.5221557617188, -538.3510131835938, -528.1798095703125, -518.0086059570312, -507.8374328613281, -497.666259765625, -487.49505615234375, -477.3238830566406, -467.1527099609375, -456.98150634765625, -446.8103332519531, -436.63916015625, -426.46795654296875, -416.2967834472656, -406.1255798339844, -395.95440673828125, -385.783203125, -375.6120300292969, -365.44085693359375, -355.2696533203125, -345.0984802246094, -334.92730712890625, -324.756103515625, -314.5849304199219, -304.41375732421875, -294.2425537109375, -284.0713806152344, -273.90020751953125, -263.72900390625, -253.5578155517578, -243.38662719726562, -233.2154541015625, -223.0442657470703, -212.87307739257812, -202.701904296875, -192.5307159423828, -182.3595428466797, -172.1883544921875, -162.01718139648438, -151.8459930419922, -141.6748046875, -131.5036163330078, -121.33243560791016, -111.1612548828125, -100.99006652832031, -90.81887817382812, -80.64769744873047, -70.47651672363281, -60.305328369140625, -50.1341438293457, -39.96295928955078, -29.791778564453125, -19.620586395263672, -9.44940185546875, 0.7217826843261719, 10.892967224121094, 21.064151763916016, 31.235336303710938, 41.40652084350586, 51.577701568603516, 61.7488899230957]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 13.0, 20.0, 14.0, 13.0, 25.0, 34.0, 22.0, 26.0, 42.0, 31.0, 32.0, 40.0, 40.0, 51.0, 44.0, 58.0, 45.0, 44.0, 45.0, 32.0, 39.0, 32.0, 21.0, 34.0, 27.0, 29.0, 21.0, 12.0, 20.0, 12.0, 10.0, 15.0, 10.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.83502769470215, -30.820438385009766, -29.805849075317383, -28.791259765625, -27.776670455932617, -26.762081146240234, -25.747493743896484, -24.73290252685547, -23.71831512451172, -22.703725814819336, -21.689136505126953, -20.67454719543457, -19.659957885742188, -18.645368576049805, -17.630779266357422, -16.616191864013672, -15.601600646972656, -14.587011337280273, -13.57242202758789, -12.557832717895508, -11.543243408203125, -10.528654098510742, -9.514065742492676, -8.499476432800293, -7.48488712310791, -6.470297813415527, -5.4557085037231445, -4.44111967086792, -3.426530361175537, -2.4119410514831543, -1.3973522186279297, -0.3827629089355469, 0.6318283081054688, 1.646417498588562, 2.6610066890716553, 3.675595760345459, 4.690185070037842, 5.704774379730225, 6.719363212585449, 7.733952522277832, 8.748541831970215, 9.763131141662598, 10.77772045135498, 11.792308807373047, 12.80689811706543, 13.821487426757812, 14.836076736450195, 15.850666046142578, 16.86525535583496, 17.879844665527344, 18.894433975219727, 19.90902328491211, 20.923612594604492, 21.938201904296875, 22.952789306640625, 23.96738052368164, 24.98196792602539, 25.996557235717773, 27.011146545410156, 28.02573585510254, 29.040325164794922, 30.054914474487305, 31.069503784179688, 32.08409118652344, 33.09868240356445]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 10.0, 9.0, 12.0, 17.0, 23.0, 28.0, 25.0, 30.0, 27.0, 42.0, 35.0, 37.0, 53.0, 47.0, 52.0, 44.0, 51.0, 57.0, 53.0, 42.0, 42.0, 34.0, 27.0, 29.0, 24.0, 29.0, 25.0, 17.0, 14.0, 9.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5625, -3.4490966796875, -3.335693359375, -3.2222900390625, -3.10888671875, -2.9954833984375, -2.882080078125, -2.7686767578125, -2.6552734375, -2.5418701171875, -2.428466796875, -2.3150634765625, -2.20166015625, -2.0882568359375, -1.974853515625, -1.8614501953125, -1.748046875, -1.6346435546875, -1.521240234375, -1.4078369140625, -1.29443359375, -1.1810302734375, -1.067626953125, -0.9542236328125, -0.8408203125, -0.7274169921875, -0.614013671875, -0.5006103515625, -0.38720703125, -0.2738037109375, -0.160400390625, -0.0469970703125, 0.06640625, 0.1798095703125, 0.293212890625, 0.4066162109375, 0.52001953125, 0.6334228515625, 0.746826171875, 0.8602294921875, 0.9736328125, 1.0870361328125, 1.200439453125, 1.3138427734375, 1.42724609375, 1.5406494140625, 1.654052734375, 1.7674560546875, 1.880859375, 1.9942626953125, 2.107666015625, 2.2210693359375, 2.33447265625, 2.4478759765625, 2.561279296875, 2.6746826171875, 2.7880859375, 2.9014892578125, 3.014892578125, 3.1282958984375, 3.24169921875, 3.3551025390625, 3.468505859375, 3.5819091796875, 3.6953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 16.0, 26.0, 45.0, 48.0, 81.0, 112.0, 212.0, 364.0, 592.0, 929.0, 1677.0, 3071.0, 5990.0, 12374.0, 27508.0, 77017.0, 537248.0, 2880165.0, 518450.0, 75922.0, 26745.0, 12218.0, 6032.0, 3118.0, 1667.0, 1033.0, 556.0, 372.0, 223.0, 141.0, 87.0, 68.0, 48.0, 24.0, 19.0, 16.0, 12.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5, -8.2384033203125, -7.976806640625, -7.7152099609375, -7.45361328125, -7.1920166015625, -6.930419921875, -6.6688232421875, -6.4072265625, -6.1456298828125, -5.884033203125, -5.6224365234375, -5.36083984375, -5.0992431640625, -4.837646484375, -4.5760498046875, -4.314453125, -4.0528564453125, -3.791259765625, -3.5296630859375, -3.26806640625, -3.0064697265625, -2.744873046875, -2.4832763671875, -2.2216796875, -1.9600830078125, -1.698486328125, -1.4368896484375, -1.17529296875, -0.9136962890625, -0.652099609375, -0.3905029296875, -0.12890625, 0.1326904296875, 0.394287109375, 0.6558837890625, 0.91748046875, 1.1790771484375, 1.440673828125, 1.7022705078125, 1.9638671875, 2.2254638671875, 2.487060546875, 2.7486572265625, 3.01025390625, 3.2718505859375, 3.533447265625, 3.7950439453125, 4.056640625, 4.3182373046875, 4.579833984375, 4.8414306640625, 5.10302734375, 5.3646240234375, 5.626220703125, 5.8878173828125, 6.1494140625, 6.4110107421875, 6.672607421875, 6.9342041015625, 7.19580078125, 7.4573974609375, 7.718994140625, 7.9805908203125, 8.2421875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 8.0, 10.0, 23.0, 27.0, 32.0, 37.0, 48.0, 98.0, 116.0, 248.0, 431.0, 764.0, 860.0, 510.0, 277.0, 160.0, 107.0, 82.0, 54.0, 38.0, 31.0, 22.0, 18.0, 18.0, 14.0, 7.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.0137939453125, -8.715087890625, -8.4163818359375, -8.11767578125, -7.8189697265625, -7.520263671875, -7.2215576171875, -6.9228515625, -6.6241455078125, -6.325439453125, -6.0267333984375, -5.72802734375, -5.4293212890625, -5.130615234375, -4.8319091796875, -4.533203125, -4.2344970703125, -3.935791015625, -3.6370849609375, -3.33837890625, -3.0396728515625, -2.740966796875, -2.4422607421875, -2.1435546875, -1.8448486328125, -1.546142578125, -1.2474365234375, -0.94873046875, -0.6500244140625, -0.351318359375, -0.0526123046875, 0.24609375, 0.5447998046875, 0.843505859375, 1.1422119140625, 1.44091796875, 1.7396240234375, 2.038330078125, 2.3370361328125, 2.6357421875, 2.9344482421875, 3.233154296875, 3.5318603515625, 3.83056640625, 4.1292724609375, 4.427978515625, 4.7266845703125, 5.025390625, 5.3240966796875, 5.622802734375, 5.9215087890625, 6.22021484375, 6.5189208984375, 6.817626953125, 7.1163330078125, 7.4150390625, 7.7137451171875, 8.012451171875, 8.3111572265625, 8.60986328125, 8.9085693359375, 9.207275390625, 9.5059814453125, 9.8046875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 17.0, 17.0, 20.0, 28.0, 30.0, 55.0, 96.0, 168.0, 377.0, 1310.0, 7880.0, 105315.0, 3889382.0, 176450.0, 10601.0, 1636.0, 444.0, 179.0, 91.0, 48.0, 40.0, 31.0, 13.0, 12.0, 7.0, 8.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.41064453125, -30.4462890625, -29.48193359375, -28.517578125, -27.55322265625, -26.5888671875, -25.62451171875, -24.66015625, -23.69580078125, -22.7314453125, -21.76708984375, -20.802734375, -19.83837890625, -18.8740234375, -17.90966796875, -16.9453125, -15.98095703125, -15.0166015625, -14.05224609375, -13.087890625, -12.12353515625, -11.1591796875, -10.19482421875, -9.23046875, -8.26611328125, -7.3017578125, -6.33740234375, -5.373046875, -4.40869140625, -3.4443359375, -2.47998046875, -1.515625, -0.55126953125, 0.4130859375, 1.37744140625, 2.341796875, 3.30615234375, 4.2705078125, 5.23486328125, 6.19921875, 7.16357421875, 8.1279296875, 9.09228515625, 10.056640625, 11.02099609375, 11.9853515625, 12.94970703125, 13.9140625, 14.87841796875, 15.8427734375, 16.80712890625, 17.771484375, 18.73583984375, 19.7001953125, 20.66455078125, 21.62890625, 22.59326171875, 23.5576171875, 24.52197265625, 25.486328125, 26.45068359375, 27.4150390625, 28.37939453125, 29.34375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 25.0, 23.0, 22.0, 47.0, 81.0, 99.0, 131.0, 110.0, 113.0, 96.0, 83.0, 50.0, 39.0, 23.0, 18.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.63386917114258, -44.47373580932617, -43.31360626220703, -42.153472900390625, -40.99333953857422, -39.83320617675781, -38.67307662963867, -37.512943267822266, -36.352813720703125, -35.19268035888672, -34.03255081176758, -32.87241744995117, -31.712284088134766, -30.552152633666992, -29.39202117919922, -28.231887817382812, -27.071754455566406, -25.911623001098633, -24.751489639282227, -23.591358184814453, -22.431224822998047, -21.271093368530273, -20.1109619140625, -18.950828552246094, -17.79069709777832, -16.630565643310547, -15.47043228149414, -14.310300827026367, -13.150168418884277, -11.990036010742188, -10.829904556274414, -9.669772148132324, -8.509637832641602, -7.349505424499512, -6.18937349319458, -5.029241561889648, -3.8691091537475586, -2.7089767456054688, -1.548844814300537, -0.38871288299560547, 0.7714195251464844, 1.9315516948699951, 3.091683864593506, 4.2518157958984375, 5.411948204040527, 6.572080612182617, 7.732212543487549, 8.89234447479248, 10.05247688293457, 11.21260929107666, 12.37274169921875, 13.532873153686523, 14.693005561828613, 15.853137969970703, 17.013269424438477, 18.17340087890625, 19.333534240722656, 20.49366569519043, 21.653799057006836, 22.81393051147461, 23.974063873291016, 25.13419532775879, 26.294326782226562, 27.45446014404297, 28.614591598510742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 1.0, 5.0, 7.0, 10.0, 12.0, 14.0, 23.0, 36.0, 19.0, 37.0, 38.0, 26.0, 41.0, 45.0, 38.0, 47.0, 31.0, 38.0, 46.0, 50.0, 37.0, 37.0, 38.0, 34.0, 39.0, 40.0, 33.0, 36.0, 24.0, 24.0, 16.0, 13.0, 12.0, 12.0, 2.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.061450958251953, -25.286300659179688, -24.51114845275879, -23.735998153686523, -22.960847854614258, -22.18569564819336, -21.410545349121094, -20.635395050048828, -19.86024284362793, -19.085092544555664, -18.309940338134766, -17.5347900390625, -16.759639739990234, -15.984487533569336, -15.20933723449707, -14.434185981750488, -13.659035682678223, -12.88388442993164, -12.108734130859375, -11.333582878112793, -10.558431625366211, -9.783281326293945, -9.008130073547363, -8.232978820800781, -7.457828044891357, -6.682677268981934, -5.907526016235352, -5.132375240325928, -4.357224464416504, -3.582073211669922, -2.806922435760498, -2.031771183013916, -1.2566204071044922, -0.48146945238113403, 0.2936815023422241, 1.0688323974609375, 1.8439834117889404, 2.6191344261169434, 3.394285202026367, 4.169436454772949, 4.944587230682373, 5.719738006591797, 6.494889259338379, 7.270040035247803, 8.045190811157227, 8.820342063903809, 9.59549331665039, 10.370643615722656, 11.145794868469238, 11.92094612121582, 12.696096420288086, 13.471247673034668, 14.24639892578125, 15.021549224853516, 15.796700477600098, 16.57185173034668, 17.347002029418945, 18.12215232849121, 18.89730453491211, 19.672454833984375, 20.44760513305664, 21.22275733947754, 21.997907638549805, 22.773059844970703, 23.54821014404297]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 6.0, 10.0, 8.0, 12.0, 22.0, 19.0, 21.0, 37.0, 28.0, 35.0, 38.0, 25.0, 36.0, 50.0, 45.0, 44.0, 38.0, 40.0, 33.0, 50.0, 45.0, 43.0, 37.0, 40.0, 33.0, 24.0, 15.0, 17.0, 24.0, 16.0, 16.0, 17.0, 15.0, 6.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84423828125, -2.7490234375, -2.65380859375, -2.55859375, -2.46337890625, -2.3681640625, -2.27294921875, -2.177734375, -2.08251953125, -1.9873046875, -1.89208984375, -1.796875, -1.70166015625, -1.6064453125, -1.51123046875, -1.416015625, -1.32080078125, -1.2255859375, -1.13037109375, -1.03515625, -0.93994140625, -0.8447265625, -0.74951171875, -0.654296875, -0.55908203125, -0.4638671875, -0.36865234375, -0.2734375, -0.17822265625, -0.0830078125, 0.01220703125, 0.107421875, 0.20263671875, 0.2978515625, 0.39306640625, 0.48828125, 0.58349609375, 0.6787109375, 0.77392578125, 0.869140625, 0.96435546875, 1.0595703125, 1.15478515625, 1.25, 1.34521484375, 1.4404296875, 1.53564453125, 1.630859375, 1.72607421875, 1.8212890625, 1.91650390625, 2.01171875, 2.10693359375, 2.2021484375, 2.29736328125, 2.392578125, 2.48779296875, 2.5830078125, 2.67822265625, 2.7734375, 2.86865234375, 2.9638671875, 3.05908203125, 3.154296875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 19.0, 25.0, 32.0, 44.0, 67.0, 92.0, 122.0, 150.0, 219.0, 342.0, 444.0, 662.0, 944.0, 1367.0, 2170.0, 3344.0, 5537.0, 9727.0, 18761.0, 43822.0, 173242.0, 586396.0, 125218.0, 36108.0, 16694.0, 8657.0, 5020.0, 3009.0, 1966.0, 1342.0, 893.0, 626.0, 382.0, 315.0, 221.0, 158.0, 111.0, 85.0, 46.0, 42.0, 32.0, 27.0, 15.0, 16.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.296875, -5.1334228515625, -4.969970703125, -4.8065185546875, -4.64306640625, -4.4796142578125, -4.316162109375, -4.1527099609375, -3.9892578125, -3.8258056640625, -3.662353515625, -3.4989013671875, -3.33544921875, -3.1719970703125, -3.008544921875, -2.8450927734375, -2.681640625, -2.5181884765625, -2.354736328125, -2.1912841796875, -2.02783203125, -1.8643798828125, -1.700927734375, -1.5374755859375, -1.3740234375, -1.2105712890625, -1.047119140625, -0.8836669921875, -0.72021484375, -0.5567626953125, -0.393310546875, -0.2298583984375, -0.06640625, 0.0970458984375, 0.260498046875, 0.4239501953125, 0.58740234375, 0.7508544921875, 0.914306640625, 1.0777587890625, 1.2412109375, 1.4046630859375, 1.568115234375, 1.7315673828125, 1.89501953125, 2.0584716796875, 2.221923828125, 2.3853759765625, 2.548828125, 2.7122802734375, 2.875732421875, 3.0391845703125, 3.20263671875, 3.3660888671875, 3.529541015625, 3.6929931640625, 3.8564453125, 4.0198974609375, 4.183349609375, 4.3468017578125, 4.51025390625, 4.6737060546875, 4.837158203125, 5.0006103515625, 5.1640625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 22.0, 24.0, 18.0, 19.0, 31.0, 28.0, 26.0, 34.0, 37.0, 31.0, 38.0, 36.0, 34.0, 36.0, 1059.0, 39.0, 47.0, 34.0, 39.0, 34.0, 39.0, 35.0, 31.0, 41.0, 20.0, 16.0, 21.0, 14.0, 14.0, 14.0, 17.0, 7.0, 6.0, 4.0, 9.0, 3.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.423828125, -2.347747802734375, -2.27166748046875, -2.195587158203125, -2.1195068359375, -2.043426513671875, -1.96734619140625, -1.891265869140625, -1.815185546875, -1.739105224609375, -1.66302490234375, -1.586944580078125, -1.5108642578125, -1.434783935546875, -1.35870361328125, -1.282623291015625, -1.20654296875, -1.130462646484375, -1.05438232421875, -0.978302001953125, -0.9022216796875, -0.826141357421875, -0.75006103515625, -0.673980712890625, -0.597900390625, -0.521820068359375, -0.44573974609375, -0.369659423828125, -0.2935791015625, -0.217498779296875, -0.14141845703125, -0.065338134765625, 0.0107421875, 0.086822509765625, 0.16290283203125, 0.238983154296875, 0.3150634765625, 0.391143798828125, 0.46722412109375, 0.543304443359375, 0.619384765625, 0.695465087890625, 0.77154541015625, 0.847625732421875, 0.9237060546875, 0.999786376953125, 1.07586669921875, 1.151947021484375, 1.22802734375, 1.304107666015625, 1.38018798828125, 1.456268310546875, 1.5323486328125, 1.608428955078125, 1.68450927734375, 1.760589599609375, 1.836669921875, 1.912750244140625, 1.98883056640625, 2.064910888671875, 2.1409912109375, 2.217071533203125, 2.29315185546875, 2.369232177734375, 2.4453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 10.0, 13.0, 28.0, 42.0, 55.0, 86.0, 131.0, 190.0, 288.0, 466.0, 678.0, 1234.0, 2022.0, 3582.0, 6827.0, 14110.0, 36540.0, 194763.0, 1674104.0, 109512.0, 27206.0, 11628.0, 5765.0, 3125.0, 1840.0, 1099.0, 617.0, 394.0, 273.0, 155.0, 125.0, 79.0, 48.0, 37.0, 20.0, 17.0, 5.0, 9.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.2830810546875, -5.109130859375, -4.9351806640625, -4.76123046875, -4.5872802734375, -4.413330078125, -4.2393798828125, -4.0654296875, -3.8914794921875, -3.717529296875, -3.5435791015625, -3.36962890625, -3.1956787109375, -3.021728515625, -2.8477783203125, -2.673828125, -2.4998779296875, -2.325927734375, -2.1519775390625, -1.97802734375, -1.8040771484375, -1.630126953125, -1.4561767578125, -1.2822265625, -1.1082763671875, -0.934326171875, -0.7603759765625, -0.58642578125, -0.4124755859375, -0.238525390625, -0.0645751953125, 0.109375, 0.2833251953125, 0.457275390625, 0.6312255859375, 0.80517578125, 0.9791259765625, 1.153076171875, 1.3270263671875, 1.5009765625, 1.6749267578125, 1.848876953125, 2.0228271484375, 2.19677734375, 2.3707275390625, 2.544677734375, 2.7186279296875, 2.892578125, 3.0665283203125, 3.240478515625, 3.4144287109375, 3.58837890625, 3.7623291015625, 3.936279296875, 4.1102294921875, 4.2841796875, 4.4581298828125, 4.632080078125, 4.8060302734375, 4.97998046875, 5.1539306640625, 5.327880859375, 5.5018310546875, 5.67578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 28.0, 33.0, 134.0, 342.0, 238.0, 93.0, 31.0, 17.0, 20.0, 9.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9052734375, -1.8489837646484375, -1.792694091796875, -1.7364044189453125, -1.68011474609375, -1.6238250732421875, -1.567535400390625, -1.5112457275390625, -1.4549560546875, -1.3986663818359375, -1.342376708984375, -1.2860870361328125, -1.22979736328125, -1.1735076904296875, -1.117218017578125, -1.0609283447265625, -1.004638671875, -0.9483489990234375, -0.892059326171875, -0.8357696533203125, -0.77947998046875, -0.7231903076171875, -0.666900634765625, -0.6106109619140625, -0.5543212890625, -0.4980316162109375, -0.441741943359375, -0.3854522705078125, -0.32916259765625, -0.2728729248046875, -0.216583251953125, -0.1602935791015625, -0.10400390625, -0.0477142333984375, 0.008575439453125, 0.0648651123046875, 0.12115478515625, 0.1774444580078125, 0.233734130859375, 0.2900238037109375, 0.3463134765625, 0.4026031494140625, 0.458892822265625, 0.5151824951171875, 0.57147216796875, 0.6277618408203125, 0.684051513671875, 0.7403411865234375, 0.796630859375, 0.8529205322265625, 0.909210205078125, 0.9654998779296875, 1.02178955078125, 1.0780792236328125, 1.134368896484375, 1.1906585693359375, 1.2469482421875, 1.3032379150390625, 1.359527587890625, 1.4158172607421875, 1.47210693359375, 1.5283966064453125, 1.584686279296875, 1.6409759521484375, 1.697265625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 5.0, 9.0, 15.0, 37.0, 65.0, 231.0, 1412.0, 41236.0, 1002252.0, 2701.0, 411.0, 77.0, 30.0, 23.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.9375, -31.84521484375, -30.7529296875, -29.66064453125, -28.568359375, -27.47607421875, -26.3837890625, -25.29150390625, -24.19921875, -23.10693359375, -22.0146484375, -20.92236328125, -19.830078125, -18.73779296875, -17.6455078125, -16.55322265625, -15.4609375, -14.36865234375, -13.2763671875, -12.18408203125, -11.091796875, -9.99951171875, -8.9072265625, -7.81494140625, -6.72265625, -5.63037109375, -4.5380859375, -3.44580078125, -2.353515625, -1.26123046875, -0.1689453125, 0.92333984375, 2.015625, 3.10791015625, 4.2001953125, 5.29248046875, 6.384765625, 7.47705078125, 8.5693359375, 9.66162109375, 10.75390625, 11.84619140625, 12.9384765625, 14.03076171875, 15.123046875, 16.21533203125, 17.3076171875, 18.39990234375, 19.4921875, 20.58447265625, 21.6767578125, 22.76904296875, 23.861328125, 24.95361328125, 26.0458984375, 27.13818359375, 28.23046875, 29.32275390625, 30.4150390625, 31.50732421875, 32.599609375, 33.69189453125, 34.7841796875, 35.87646484375, 36.96875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 31.0, 153.0, 664.0, 141.0, 19.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.514542579650879, -1.239621877670288, -0.9647012948989868, -0.6897806525230408, -0.4148600101470947, -0.1399393081665039, 0.13498127460479736, 0.40990185737609863, 0.6848225593566895, 0.9597432017326355, 1.2346638441085815, 1.5095844268798828, 1.7845051288604736, 2.0594258308410645, 2.334346294403076, 2.609266996383667, 2.884187698364258, 3.1591084003448486, 3.4340291023254395, 3.708949565887451, 3.983870267868042, 4.258790969848633, 4.5337114334106445, 4.808631896972656, 5.083552837371826, 5.358473300933838, 5.633394241333008, 5.9083147048950195, 6.183235168457031, 6.458156108856201, 6.733076572418213, 7.007997512817383, 7.282918930053711, 7.557839393615723, 7.832760334014893, 8.107681274414062, 8.382601737976074, 8.657522201538086, 8.932442665100098, 9.20736312866211, 9.482284545898438, 9.75720500946045, 10.032125473022461, 10.307046890258789, 10.5819673538208, 10.856887817382812, 11.131808280944824, 11.406728744506836, 11.681649208068848, 11.95656967163086, 12.231490135192871, 12.5064115524292, 12.781332015991211, 13.056252479553223, 13.331172943115234, 13.606093406677246, 13.881013870239258, 14.15593433380127, 14.430854797363281, 14.70577621459961, 14.980696678161621, 15.255617141723633, 15.530537605285645, 15.805458068847656, 16.080379486083984]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 12.0, 13.0, 19.0, 11.0, 23.0, 24.0, 35.0, 21.0, 25.0, 31.0, 43.0, 32.0, 38.0, 41.0, 36.0, 48.0, 39.0, 41.0, 40.0, 41.0, 30.0, 33.0, 33.0, 32.0, 28.0, 28.0, 31.0, 12.0, 19.0, 20.0, 14.0, 14.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9238834381103516, -0.8947098255157471, -0.8655362129211426, -0.8363626003265381, -0.8071890473365784, -0.7780154347419739, -0.7488418221473694, -0.7196682095527649, -0.6904945969581604, -0.6613209843635559, -0.6321473717689514, -0.6029738187789917, -0.5738002061843872, -0.5446265935897827, -0.5154529809951782, -0.48627936840057373, -0.4571057856082916, -0.42793217301368713, -0.39875859022140503, -0.36958497762680054, -0.34041136503219604, -0.31123775243759155, -0.28206416964530945, -0.25289055705070496, -0.22371695935726166, -0.19454336166381836, -0.16536974906921387, -0.13619615137577057, -0.10702254623174667, -0.07784894108772278, -0.04867534339427948, -0.019501730799674988, 0.00967186689376831, 0.038845472037792206, 0.0680190771818161, 0.0971926748752594, 0.1263662874698639, 0.1555398851633072, 0.1847134828567505, 0.21388709545135498, 0.24306069314479828, 0.2722342908382416, 0.30140790343284607, 0.3305814862251282, 0.35975509881973267, 0.38892871141433716, 0.41810232400894165, 0.44727593660354614, 0.47644951939582825, 0.5056231021881104, 0.5347967147827148, 0.5639703273773193, 0.5931439399719238, 0.6223175525665283, 0.6514911651611328, 0.6806647777557373, 0.709838330745697, 0.7390119433403015, 0.768185555934906, 0.7973591089248657, 0.8265327215194702, 0.8557063341140747, 0.8848799467086792, 0.9140535593032837, 0.9432271718978882]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 10.0, 8.0, 11.0, 14.0, 14.0, 24.0, 24.0, 29.0, 26.0, 20.0, 29.0, 46.0, 42.0, 44.0, 35.0, 47.0, 40.0, 33.0, 38.0, 34.0, 41.0, 51.0, 43.0, 39.0, 33.0, 28.0, 18.0, 17.0, 24.0, 23.0, 11.0, 12.0, 12.0, 9.0, 6.0, 14.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.744140625, -2.653533935546875, -2.56292724609375, -2.472320556640625, -2.3817138671875, -2.291107177734375, -2.20050048828125, -2.109893798828125, -2.019287109375, -1.928680419921875, -1.83807373046875, -1.747467041015625, -1.6568603515625, -1.566253662109375, -1.47564697265625, -1.385040283203125, -1.29443359375, -1.203826904296875, -1.11322021484375, -1.022613525390625, -0.9320068359375, -0.841400146484375, -0.75079345703125, -0.660186767578125, -0.569580078125, -0.478973388671875, -0.38836669921875, -0.297760009765625, -0.2071533203125, -0.116546630859375, -0.02593994140625, 0.064666748046875, 0.1552734375, 0.245880126953125, 0.33648681640625, 0.427093505859375, 0.5177001953125, 0.608306884765625, 0.69891357421875, 0.789520263671875, 0.880126953125, 0.970733642578125, 1.06134033203125, 1.151947021484375, 1.2425537109375, 1.333160400390625, 1.42376708984375, 1.514373779296875, 1.60498046875, 1.695587158203125, 1.78619384765625, 1.876800537109375, 1.9674072265625, 2.058013916015625, 2.14862060546875, 2.239227294921875, 2.329833984375, 2.420440673828125, 2.51104736328125, 2.601654052734375, 2.6922607421875, 2.782867431640625, 2.87347412109375, 2.964080810546875, 3.0546875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 21.0, 34.0, 46.0, 55.0, 97.0, 119.0, 145.0, 231.0, 329.0, 377.0, 538.0, 872.0, 1154.0, 1658.0, 2546.0, 4133.0, 7588.0, 16394.0, 46752.0, 185822.0, 553396.0, 152198.0, 40565.0, 14680.0, 7019.0, 3844.0, 2514.0, 1601.0, 1115.0, 759.0, 550.0, 365.0, 295.0, 194.0, 171.0, 108.0, 68.0, 59.0, 44.0, 33.0, 10.0, 18.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.90679931640625, -3.7784423828125, -3.65008544921875, -3.521728515625, -3.39337158203125, -3.2650146484375, -3.13665771484375, -3.00830078125, -2.87994384765625, -2.7515869140625, -2.62322998046875, -2.494873046875, -2.36651611328125, -2.2381591796875, -2.10980224609375, -1.9814453125, -1.85308837890625, -1.7247314453125, -1.59637451171875, -1.468017578125, -1.33966064453125, -1.2113037109375, -1.08294677734375, -0.95458984375, -0.82623291015625, -0.6978759765625, -0.56951904296875, -0.441162109375, -0.31280517578125, -0.1844482421875, -0.05609130859375, 0.072265625, 0.20062255859375, 0.3289794921875, 0.45733642578125, 0.585693359375, 0.71405029296875, 0.8424072265625, 0.97076416015625, 1.09912109375, 1.22747802734375, 1.3558349609375, 1.48419189453125, 1.612548828125, 1.74090576171875, 1.8692626953125, 1.99761962890625, 2.1259765625, 2.25433349609375, 2.3826904296875, 2.51104736328125, 2.639404296875, 2.76776123046875, 2.8961181640625, 3.02447509765625, 3.15283203125, 3.28118896484375, 3.4095458984375, 3.53790283203125, 3.666259765625, 3.79461669921875, 3.9229736328125, 4.05133056640625, 4.1796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 14.0, 11.0, 18.0, 19.0, 20.0, 17.0, 21.0, 25.0, 28.0, 42.0, 36.0, 44.0, 54.0, 71.0, 86.0, 188.0, 1519.0, 252.0, 113.0, 74.0, 43.0, 40.0, 36.0, 42.0, 33.0, 26.0, 17.0, 28.0, 15.0, 18.0, 18.0, 17.0, 9.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3260498046875, -9.011474609375, -8.6968994140625, -8.38232421875, -8.0677490234375, -7.753173828125, -7.4385986328125, -7.1240234375, -6.8094482421875, -6.494873046875, -6.1802978515625, -5.86572265625, -5.5511474609375, -5.236572265625, -4.9219970703125, -4.607421875, -4.2928466796875, -3.978271484375, -3.6636962890625, -3.34912109375, -3.0345458984375, -2.719970703125, -2.4053955078125, -2.0908203125, -1.7762451171875, -1.461669921875, -1.1470947265625, -0.83251953125, -0.5179443359375, -0.203369140625, 0.1112060546875, 0.42578125, 0.7403564453125, 1.054931640625, 1.3695068359375, 1.68408203125, 1.9986572265625, 2.313232421875, 2.6278076171875, 2.9423828125, 3.2569580078125, 3.571533203125, 3.8861083984375, 4.20068359375, 4.5152587890625, 4.829833984375, 5.1444091796875, 5.458984375, 5.7735595703125, 6.088134765625, 6.4027099609375, 6.71728515625, 7.0318603515625, 7.346435546875, 7.6610107421875, 7.9755859375, 8.2901611328125, 8.604736328125, 8.9193115234375, 9.23388671875, 9.5484619140625, 9.863037109375, 10.1776123046875, 10.4921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 5.0, 1.0, 4.0, 16.0, 15.0, 13.0, 21.0, 24.0, 33.0, 51.0, 59.0, 98.0, 140.0, 264.0, 452.0, 1064.0, 3451.0, 19201.0, 2195394.0, 904992.0, 15230.0, 3020.0, 996.0, 448.0, 257.0, 128.0, 84.0, 53.0, 41.0, 24.0, 32.0, 20.0, 18.0, 11.0, 11.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.862548828125, -21.17822265625, -20.493896484375, -19.8095703125, -19.125244140625, -18.44091796875, -17.756591796875, -17.072265625, -16.387939453125, -15.70361328125, -15.019287109375, -14.3349609375, -13.650634765625, -12.96630859375, -12.281982421875, -11.59765625, -10.913330078125, -10.22900390625, -9.544677734375, -8.8603515625, -8.176025390625, -7.49169921875, -6.807373046875, -6.123046875, -5.438720703125, -4.75439453125, -4.070068359375, -3.3857421875, -2.701416015625, -2.01708984375, -1.332763671875, -0.6484375, 0.035888671875, 0.72021484375, 1.404541015625, 2.0888671875, 2.773193359375, 3.45751953125, 4.141845703125, 4.826171875, 5.510498046875, 6.19482421875, 6.879150390625, 7.5634765625, 8.247802734375, 8.93212890625, 9.616455078125, 10.30078125, 10.985107421875, 11.66943359375, 12.353759765625, 13.0380859375, 13.722412109375, 14.40673828125, 15.091064453125, 15.775390625, 16.459716796875, 17.14404296875, 17.828369140625, 18.5126953125, 19.197021484375, 19.88134765625, 20.565673828125, 21.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 18.0, 144.0, 530.0, 269.0, 47.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.36990737915039, -17.147403717041016, -14.924901962280273, -12.702398300170898, -10.47989559173584, -8.257392883300781, -6.034889221191406, -3.8123865127563477, -1.589883804321289, 0.6326191425323486, 2.8551220893859863, 5.077625274658203, 7.300127983093262, 9.52263069152832, 11.745134353637695, 13.967637062072754, 16.190139770507812, 18.412643432617188, 20.63514518737793, 22.857648849487305, 25.080150604248047, 27.302654266357422, 29.525157928466797, 31.747661590576172, 33.97016143798828, 36.192665100097656, 38.41516876220703, 40.637672424316406, 42.860172271728516, 45.08267593383789, 47.305179595947266, 49.52768325805664, 51.75018310546875, 53.972686767578125, 56.1951904296875, 58.417694091796875, 60.640193939208984, 62.86269760131836, 65.085205078125, 67.30770111083984, 69.53020477294922, 71.7527084350586, 73.97521209716797, 76.19771575927734, 78.42021942138672, 80.64271545410156, 82.86521911621094, 85.08772277832031, 87.31022644042969, 89.53273010253906, 91.75523376464844, 93.97773742675781, 96.20024108886719, 98.42274475097656, 100.64524841308594, 102.86774444580078, 105.09025573730469, 107.31275939941406, 109.53526306152344, 111.75776672363281, 113.98027038574219, 116.20277404785156, 118.42527770996094, 120.64777374267578, 122.87027740478516]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 20.0, 17.0, 36.0, 32.0, 45.0, 33.0, 41.0, 43.0, 46.0, 43.0, 32.0, 35.0, 31.0, 46.0, 34.0, 42.0, 30.0, 40.0, 31.0, 29.0, 24.0, 21.0, 22.0, 18.0, 16.0, 20.0, 6.0, 8.0, 3.0, 7.0, 8.0, 10.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.262863159179688, -22.507118225097656, -21.751375198364258, -20.995630264282227, -20.239887237548828, -19.484142303466797, -18.728397369384766, -17.972652435302734, -17.216909408569336, -16.461164474487305, -15.705421447753906, -14.949676513671875, -14.19393253326416, -13.438188552856445, -12.682443618774414, -11.9266996383667, -11.170955657958984, -10.41521167755127, -9.659467697143555, -8.903722763061523, -8.147978782653809, -7.392234802246094, -6.636490345001221, -5.880745887756348, -5.125001907348633, -4.369257926940918, -3.613513469696045, -2.857769250869751, -2.102025032043457, -1.346280813217163, -0.5905365943908691, 0.1652078628540039, 0.9209537506103516, 1.6766979694366455, 2.4324421882629395, 3.1881864070892334, 3.9439306259155273, 4.699674606323242, 5.455419063568115, 6.211163520812988, 6.966907501220703, 7.722651481628418, 8.478395462036133, 9.234140396118164, 9.989884376525879, 10.745628356933594, 11.501373291015625, 12.25711727142334, 13.012861251831055, 13.76860523223877, 14.524349212646484, 15.280094146728516, 16.035839080810547, 16.791582107543945, 17.547327041625977, 18.303070068359375, 19.058815002441406, 19.814559936523438, 20.570302963256836, 21.326047897338867, 22.081790924072266, 22.837535858154297, 23.593280792236328, 24.34902572631836, 25.104768753051758]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 9.0, 8.0, 9.0, 15.0, 20.0, 30.0, 30.0, 18.0, 27.0, 41.0, 49.0, 49.0, 41.0, 36.0, 49.0, 37.0, 55.0, 49.0, 54.0, 39.0, 39.0, 38.0, 24.0, 35.0, 34.0, 21.0, 16.0, 29.0, 16.0, 16.0, 6.0, 13.0, 4.0, 5.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.56536865234375, -3.4569091796875, -3.34844970703125, -3.239990234375, -3.13153076171875, -3.0230712890625, -2.91461181640625, -2.80615234375, -2.69769287109375, -2.5892333984375, -2.48077392578125, -2.372314453125, -2.26385498046875, -2.1553955078125, -2.04693603515625, -1.9384765625, -1.83001708984375, -1.7215576171875, -1.61309814453125, -1.504638671875, -1.39617919921875, -1.2877197265625, -1.17926025390625, -1.07080078125, -0.96234130859375, -0.8538818359375, -0.74542236328125, -0.636962890625, -0.52850341796875, -0.4200439453125, -0.31158447265625, -0.203125, -0.09466552734375, 0.0137939453125, 0.12225341796875, 0.230712890625, 0.33917236328125, 0.4476318359375, 0.55609130859375, 0.66455078125, 0.77301025390625, 0.8814697265625, 0.98992919921875, 1.098388671875, 1.20684814453125, 1.3153076171875, 1.42376708984375, 1.5322265625, 1.64068603515625, 1.7491455078125, 1.85760498046875, 1.966064453125, 2.07452392578125, 2.1829833984375, 2.29144287109375, 2.39990234375, 2.50836181640625, 2.6168212890625, 2.72528076171875, 2.833740234375, 2.94219970703125, 3.0506591796875, 3.15911865234375, 3.267578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 5.0, 12.0, 14.0, 17.0, 24.0, 63.0, 60.0, 85.0, 135.0, 167.0, 301.0, 378.0, 576.0, 896.0, 1258.0, 1973.0, 3147.0, 4918.0, 8280.0, 14262.0, 27191.0, 58618.0, 190281.0, 1178063.0, 2135071.0, 395863.0, 89187.0, 36980.0, 18682.0, 10697.0, 6093.0, 3855.0, 2438.0, 1602.0, 1006.0, 699.0, 436.0, 323.0, 187.0, 131.0, 103.0, 61.0, 50.0, 28.0, 17.0, 12.0, 15.0, 5.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.21875, -6.02569580078125, -5.8326416015625, -5.63958740234375, -5.446533203125, -5.25347900390625, -5.0604248046875, -4.86737060546875, -4.67431640625, -4.48126220703125, -4.2882080078125, -4.09515380859375, -3.902099609375, -3.70904541015625, -3.5159912109375, -3.32293701171875, -3.1298828125, -2.93682861328125, -2.7437744140625, -2.55072021484375, -2.357666015625, -2.16461181640625, -1.9715576171875, -1.77850341796875, -1.58544921875, -1.39239501953125, -1.1993408203125, -1.00628662109375, -0.813232421875, -0.62017822265625, -0.4271240234375, -0.23406982421875, -0.041015625, 0.15203857421875, 0.3450927734375, 0.53814697265625, 0.731201171875, 0.92425537109375, 1.1173095703125, 1.31036376953125, 1.50341796875, 1.69647216796875, 1.8895263671875, 2.08258056640625, 2.275634765625, 2.46868896484375, 2.6617431640625, 2.85479736328125, 3.0478515625, 3.24090576171875, 3.4339599609375, 3.62701416015625, 3.820068359375, 4.01312255859375, 4.2061767578125, 4.39923095703125, 4.59228515625, 4.78533935546875, 4.9783935546875, 5.17144775390625, 5.364501953125, 5.55755615234375, 5.7506103515625, 5.94366455078125, 6.13671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 1.0, 8.0, 7.0, 5.0, 8.0, 11.0, 13.0, 12.0, 31.0, 22.0, 37.0, 43.0, 47.0, 50.0, 58.0, 67.0, 97.0, 135.0, 215.0, 341.0, 470.0, 619.0, 471.0, 355.0, 237.0, 178.0, 116.0, 84.0, 63.0, 56.0, 32.0, 40.0, 23.0, 19.0, 16.0, 17.0, 13.0, 13.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-6.87109375, -6.67791748046875, -6.4847412109375, -6.29156494140625, -6.098388671875, -5.90521240234375, -5.7120361328125, -5.51885986328125, -5.32568359375, -5.13250732421875, -4.9393310546875, -4.74615478515625, -4.552978515625, -4.35980224609375, -4.1666259765625, -3.97344970703125, -3.7802734375, -3.58709716796875, -3.3939208984375, -3.20074462890625, -3.007568359375, -2.81439208984375, -2.6212158203125, -2.42803955078125, -2.23486328125, -2.04168701171875, -1.8485107421875, -1.65533447265625, -1.462158203125, -1.26898193359375, -1.0758056640625, -0.88262939453125, -0.689453125, -0.49627685546875, -0.3031005859375, -0.10992431640625, 0.083251953125, 0.27642822265625, 0.4696044921875, 0.66278076171875, 0.85595703125, 1.04913330078125, 1.2423095703125, 1.43548583984375, 1.628662109375, 1.82183837890625, 2.0150146484375, 2.20819091796875, 2.4013671875, 2.59454345703125, 2.7877197265625, 2.98089599609375, 3.174072265625, 3.36724853515625, 3.5604248046875, 3.75360107421875, 3.94677734375, 4.13995361328125, 4.3331298828125, 4.52630615234375, 4.719482421875, 4.91265869140625, 5.1058349609375, 5.29901123046875, 5.4921875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 20.0, 10.0, 22.0, 26.0, 38.0, 46.0, 68.0, 75.0, 134.0, 230.0, 643.0, 3621.0, 34842.0, 1746019.0, 2363851.0, 39242.0, 3875.0, 701.0, 237.0, 115.0, 57.0, 55.0, 48.0, 54.0, 39.0, 33.0, 24.0, 25.0, 8.0, 12.0, 7.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.485595703125, -23.61181640625, -22.738037109375, -21.8642578125, -20.990478515625, -20.11669921875, -19.242919921875, -18.369140625, -17.495361328125, -16.62158203125, -15.747802734375, -14.8740234375, -14.000244140625, -13.12646484375, -12.252685546875, -11.37890625, -10.505126953125, -9.63134765625, -8.757568359375, -7.8837890625, -7.010009765625, -6.13623046875, -5.262451171875, -4.388671875, -3.514892578125, -2.64111328125, -1.767333984375, -0.8935546875, -0.019775390625, 0.85400390625, 1.727783203125, 2.6015625, 3.475341796875, 4.34912109375, 5.222900390625, 6.0966796875, 6.970458984375, 7.84423828125, 8.718017578125, 9.591796875, 10.465576171875, 11.33935546875, 12.213134765625, 13.0869140625, 13.960693359375, 14.83447265625, 15.708251953125, 16.58203125, 17.455810546875, 18.32958984375, 19.203369140625, 20.0771484375, 20.950927734375, 21.82470703125, 22.698486328125, 23.572265625, 24.446044921875, 25.31982421875, 26.193603515625, 27.0673828125, 27.941162109375, 28.81494140625, 29.688720703125, 30.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 7.0, 19.0, 62.0, 177.0, 303.0, 284.0, 115.0, 35.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.066129684448242, -24.87198829650879, -21.677846908569336, -18.48370361328125, -15.289563179016113, -12.09542179107666, -8.90127944946289, -5.7071380615234375, -2.5129966735839844, 0.6811449527740479, 3.87528657913208, 7.069428443908691, 10.263569831848145, 13.457711219787598, 16.651853561401367, 19.84599494934082, 23.040136337280273, 26.234277725219727, 29.42841911315918, 32.622562408447266, 35.81670379638672, 39.01084518432617, 42.204986572265625, 45.39912796020508, 48.59326934814453, 51.787410736083984, 54.98155212402344, 58.17569351196289, 61.369834899902344, 64.56398010253906, 67.75811767578125, 70.95226287841797, 74.14640045166016, 77.34054565429688, 80.53468322753906, 83.72882843017578, 86.92296600341797, 90.11711120605469, 93.31124877929688, 96.5053939819336, 99.69953155517578, 102.8936767578125, 106.08781433105469, 109.2819595336914, 112.4760971069336, 115.67024230957031, 118.8643798828125, 122.05852508544922, 125.25267028808594, 128.44680786132812, 131.64096069335938, 134.83509826660156, 138.02923583984375, 141.22337341308594, 144.4175262451172, 147.61166381835938, 150.80580139160156, 153.99993896484375, 157.194091796875, 160.3882293701172, 163.58236694335938, 166.77650451660156, 169.9706573486328, 173.164794921875, 176.3589324951172]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 11.0, 9.0, 12.0, 13.0, 14.0, 11.0, 15.0, 17.0, 20.0, 20.0, 23.0, 27.0, 26.0, 31.0, 43.0, 41.0, 34.0, 36.0, 48.0, 41.0, 45.0, 36.0, 42.0, 41.0, 35.0, 46.0, 34.0, 35.0, 20.0, 28.0, 27.0, 20.0, 19.0, 13.0, 15.0, 13.0, 5.0, 7.0, 16.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.957801818847656, -24.247831344604492, -23.537860870361328, -22.827890396118164, -22.117919921875, -21.407947540283203, -20.69797706604004, -19.988006591796875, -19.27803611755371, -18.568065643310547, -17.858095169067383, -17.14812469482422, -16.438152313232422, -15.728182792663574, -15.018211364746094, -14.30824089050293, -13.598270416259766, -12.888299942016602, -12.178329467773438, -11.468358039855957, -10.758387565612793, -10.048417091369629, -9.338445663452148, -8.628475189208984, -7.91850471496582, -7.208534240722656, -6.498563289642334, -5.788592338562012, -5.078621864318848, -4.368651390075684, -3.6586804389953613, -2.948709487915039, -2.238740921020508, -1.5287702083587646, -0.8187994956970215, -0.10882878303527832, 0.6011419296264648, 1.311112642288208, 2.021083354949951, 2.7310543060302734, 3.4410247802734375, 4.150995254516602, 4.860966205596924, 5.570937156677246, 6.28090763092041, 6.990878105163574, 7.7008490562438965, 8.410820007324219, 9.120790481567383, 9.830760955810547, 10.540731430053711, 11.250702857971191, 11.960673332214355, 12.67064380645752, 13.380615234375, 14.090585708618164, 14.800556182861328, 15.510526657104492, 16.220497131347656, 16.93046760559082, 17.640438079833984, 18.35041046142578, 19.060380935668945, 19.77035140991211, 20.480321884155273]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 13.0, 27.0, 14.0, 14.0, 12.0, 23.0, 21.0, 22.0, 26.0, 40.0, 33.0, 34.0, 42.0, 37.0, 30.0, 46.0, 44.0, 41.0, 41.0, 40.0, 41.0, 42.0, 33.0, 29.0, 30.0, 23.0, 30.0, 25.0, 22.0, 18.0, 16.0, 9.0, 6.0, 8.0, 10.0, 14.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.693359375, -2.60345458984375, -2.5135498046875, -2.42364501953125, -2.333740234375, -2.24383544921875, -2.1539306640625, -2.06402587890625, -1.97412109375, -1.88421630859375, -1.7943115234375, -1.70440673828125, -1.614501953125, -1.52459716796875, -1.4346923828125, -1.34478759765625, -1.2548828125, -1.16497802734375, -1.0750732421875, -0.98516845703125, -0.895263671875, -0.80535888671875, -0.7154541015625, -0.62554931640625, -0.53564453125, -0.44573974609375, -0.3558349609375, -0.26593017578125, -0.176025390625, -0.08612060546875, 0.0037841796875, 0.09368896484375, 0.18359375, 0.27349853515625, 0.3634033203125, 0.45330810546875, 0.543212890625, 0.63311767578125, 0.7230224609375, 0.81292724609375, 0.90283203125, 0.99273681640625, 1.0826416015625, 1.17254638671875, 1.262451171875, 1.35235595703125, 1.4422607421875, 1.53216552734375, 1.6220703125, 1.71197509765625, 1.8018798828125, 1.89178466796875, 1.981689453125, 2.07159423828125, 2.1614990234375, 2.25140380859375, 2.34130859375, 2.43121337890625, 2.5211181640625, 2.61102294921875, 2.700927734375, 2.79083251953125, 2.8807373046875, 2.97064208984375, 3.060546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 7.0, 16.0, 16.0, 29.0, 35.0, 49.0, 69.0, 84.0, 94.0, 148.0, 224.0, 277.0, 402.0, 473.0, 677.0, 920.0, 1292.0, 1865.0, 2634.0, 3950.0, 5825.0, 9487.0, 16601.0, 37772.0, 154652.0, 583999.0, 146131.0, 36349.0, 16044.0, 9245.0, 5997.0, 3892.0, 2644.0, 1860.0, 1322.0, 929.0, 632.0, 493.0, 388.0, 282.0, 198.0, 146.0, 100.0, 83.0, 54.0, 45.0, 34.0, 26.0, 19.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.28515625, -4.1490478515625, -4.012939453125, -3.8768310546875, -3.74072265625, -3.6046142578125, -3.468505859375, -3.3323974609375, -3.1962890625, -3.0601806640625, -2.924072265625, -2.7879638671875, -2.65185546875, -2.5157470703125, -2.379638671875, -2.2435302734375, -2.107421875, -1.9713134765625, -1.835205078125, -1.6990966796875, -1.56298828125, -1.4268798828125, -1.290771484375, -1.1546630859375, -1.0185546875, -0.8824462890625, -0.746337890625, -0.6102294921875, -0.47412109375, -0.3380126953125, -0.201904296875, -0.0657958984375, 0.0703125, 0.2064208984375, 0.342529296875, 0.4786376953125, 0.61474609375, 0.7508544921875, 0.886962890625, 1.0230712890625, 1.1591796875, 1.2952880859375, 1.431396484375, 1.5675048828125, 1.70361328125, 1.8397216796875, 1.975830078125, 2.1119384765625, 2.248046875, 2.3841552734375, 2.520263671875, 2.6563720703125, 2.79248046875, 2.9285888671875, 3.064697265625, 3.2008056640625, 3.3369140625, 3.4730224609375, 3.609130859375, 3.7452392578125, 3.88134765625, 4.0174560546875, 4.153564453125, 4.2896728515625, 4.42578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 8.0, 12.0, 5.0, 5.0, 15.0, 14.0, 19.0, 17.0, 24.0, 27.0, 16.0, 19.0, 33.0, 39.0, 34.0, 46.0, 41.0, 35.0, 43.0, 53.0, 1056.0, 48.0, 26.0, 38.0, 30.0, 30.0, 34.0, 27.0, 36.0, 20.0, 22.0, 24.0, 24.0, 10.0, 16.0, 19.0, 12.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.994659423828125, -1.92291259765625, -1.851165771484375, -1.7794189453125, -1.707672119140625, -1.63592529296875, -1.564178466796875, -1.492431640625, -1.420684814453125, -1.34893798828125, -1.277191162109375, -1.2054443359375, -1.133697509765625, -1.06195068359375, -0.990203857421875, -0.91845703125, -0.846710205078125, -0.77496337890625, -0.703216552734375, -0.6314697265625, -0.559722900390625, -0.48797607421875, -0.416229248046875, -0.344482421875, -0.272735595703125, -0.20098876953125, -0.129241943359375, -0.0574951171875, 0.014251708984375, 0.08599853515625, 0.157745361328125, 0.2294921875, 0.301239013671875, 0.37298583984375, 0.444732666015625, 0.5164794921875, 0.588226318359375, 0.65997314453125, 0.731719970703125, 0.803466796875, 0.875213623046875, 0.94696044921875, 1.018707275390625, 1.0904541015625, 1.162200927734375, 1.23394775390625, 1.305694580078125, 1.37744140625, 1.449188232421875, 1.52093505859375, 1.592681884765625, 1.6644287109375, 1.736175537109375, 1.80792236328125, 1.879669189453125, 1.951416015625, 2.023162841796875, 2.09490966796875, 2.166656494140625, 2.2384033203125, 2.310150146484375, 2.38189697265625, 2.453643798828125, 2.525390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 16.0, 11.0, 33.0, 48.0, 53.0, 93.0, 132.0, 176.0, 299.0, 468.0, 711.0, 1036.0, 1813.0, 3119.0, 5679.0, 11993.0, 30723.0, 148886.0, 1647846.0, 182442.0, 34334.0, 12759.0, 5995.0, 3323.0, 1860.0, 1154.0, 713.0, 430.0, 306.0, 200.0, 133.0, 83.0, 66.0, 47.0, 32.0, 27.0, 16.0, 16.0, 11.0, 1.0, 0.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.912109375, -3.784027099609375, -3.65594482421875, -3.527862548828125, -3.3997802734375, -3.271697998046875, -3.14361572265625, -3.015533447265625, -2.887451171875, -2.759368896484375, -2.63128662109375, -2.503204345703125, -2.3751220703125, -2.247039794921875, -2.11895751953125, -1.990875244140625, -1.86279296875, -1.734710693359375, -1.60662841796875, -1.478546142578125, -1.3504638671875, -1.222381591796875, -1.09429931640625, -0.966217041015625, -0.838134765625, -0.710052490234375, -0.58197021484375, -0.453887939453125, -0.3258056640625, -0.197723388671875, -0.06964111328125, 0.058441162109375, 0.1865234375, 0.314605712890625, 0.44268798828125, 0.570770263671875, 0.6988525390625, 0.826934814453125, 0.95501708984375, 1.083099365234375, 1.211181640625, 1.339263916015625, 1.46734619140625, 1.595428466796875, 1.7235107421875, 1.851593017578125, 1.97967529296875, 2.107757568359375, 2.23583984375, 2.363922119140625, 2.49200439453125, 2.620086669921875, 2.7481689453125, 2.876251220703125, 3.00433349609375, 3.132415771484375, 3.260498046875, 3.388580322265625, 3.51666259765625, 3.644744873046875, 3.7728271484375, 3.900909423828125, 4.02899169921875, 4.157073974609375, 4.28515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 17.0, 21.0, 26.0, 55.0, 120.0, 227.0, 259.0, 106.0, 39.0, 29.0, 21.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4947509765625, -1.449462890625, -1.4041748046875, -1.35888671875, -1.3135986328125, -1.268310546875, -1.2230224609375, -1.177734375, -1.1324462890625, -1.087158203125, -1.0418701171875, -0.99658203125, -0.9512939453125, -0.906005859375, -0.8607177734375, -0.8154296875, -0.7701416015625, -0.724853515625, -0.6795654296875, -0.63427734375, -0.5889892578125, -0.543701171875, -0.4984130859375, -0.453125, -0.4078369140625, -0.362548828125, -0.3172607421875, -0.27197265625, -0.2266845703125, -0.181396484375, -0.1361083984375, -0.0908203125, -0.0455322265625, -0.000244140625, 0.0450439453125, 0.09033203125, 0.1356201171875, 0.180908203125, 0.2261962890625, 0.271484375, 0.3167724609375, 0.362060546875, 0.4073486328125, 0.45263671875, 0.4979248046875, 0.543212890625, 0.5885009765625, 0.6337890625, 0.6790771484375, 0.724365234375, 0.7696533203125, 0.81494140625, 0.8602294921875, 0.905517578125, 0.9508056640625, 0.99609375, 1.0413818359375, 1.086669921875, 1.1319580078125, 1.17724609375, 1.2225341796875, 1.267822265625, 1.3131103515625, 1.3583984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 25.0, 32.0, 68.0, 122.0, 958.0, 83425.0, 961860.0, 1660.0, 192.0, 64.0, 43.0, 23.0, 13.0, 14.0, 5.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.828125, -26.9033203125, -25.978515625, -25.0537109375, -24.12890625, -23.2041015625, -22.279296875, -21.3544921875, -20.4296875, -19.5048828125, -18.580078125, -17.6552734375, -16.73046875, -15.8056640625, -14.880859375, -13.9560546875, -13.03125, -12.1064453125, -11.181640625, -10.2568359375, -9.33203125, -8.4072265625, -7.482421875, -6.5576171875, -5.6328125, -4.7080078125, -3.783203125, -2.8583984375, -1.93359375, -1.0087890625, -0.083984375, 0.8408203125, 1.765625, 2.6904296875, 3.615234375, 4.5400390625, 5.46484375, 6.3896484375, 7.314453125, 8.2392578125, 9.1640625, 10.0888671875, 11.013671875, 11.9384765625, 12.86328125, 13.7880859375, 14.712890625, 15.6376953125, 16.5625, 17.4873046875, 18.412109375, 19.3369140625, 20.26171875, 21.1865234375, 22.111328125, 23.0361328125, 23.9609375, 24.8857421875, 25.810546875, 26.7353515625, 27.66015625, 28.5849609375, 29.509765625, 30.4345703125, 31.359375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 9.0, 12.0, 13.0, 22.0, 32.0, 60.0, 84.0, 113.0, 152.0, 157.0, 129.0, 81.0, 51.0, 38.0, 24.0, 15.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.998117208480835, -1.9491727352142334, -1.9002282619476318, -1.8512837886810303, -1.8023391962051392, -1.7533947229385376, -1.704450249671936, -1.6555057764053345, -1.6065611839294434, -1.5576167106628418, -1.5086722373962402, -1.4597277641296387, -1.4107831716537476, -1.361838698387146, -1.3128942251205444, -1.2639497518539429, -1.2150052785873413, -1.1660608053207397, -1.1171163320541382, -1.068171739578247, -1.0192272663116455, -0.970282793045044, -0.9213383197784424, -0.8723938465118408, -0.8234493136405945, -0.7745048403739929, -0.7255603075027466, -0.676615834236145, -0.6276713609695435, -0.5787268280982971, -0.5297823548316956, -0.4808378517627716, -0.4318934679031372, -0.38294896483421326, -0.3340044617652893, -0.28505998849868774, -0.2361154854297638, -0.18717098236083984, -0.13822650909423828, -0.08928200602531433, -0.04033750295639038, 0.008606992661952972, 0.057551488280296326, 0.10649597644805908, 0.15544047951698303, 0.20438498258590698, 0.25332945585250854, 0.3022739589214325, 0.35121846199035645, 0.4001629650592804, 0.44910746812820435, 0.4980519413948059, 0.5469964742660522, 0.5959409475326538, 0.6448854207992554, 0.6938298940658569, 0.7427744269371033, 0.7917189002037048, 0.8406634330749512, 0.8896079063415527, 0.9385523796081543, 0.9874969124794006, 1.0364413261413574, 1.0853859186172485, 1.13433039188385]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 17.0, 16.0, 9.0, 13.0, 21.0, 22.0, 29.0, 34.0, 40.0, 38.0, 33.0, 34.0, 44.0, 39.0, 37.0, 42.0, 38.0, 45.0, 38.0, 39.0, 42.0, 30.0, 36.0, 26.0, 27.0, 25.0, 25.0, 23.0, 24.0, 20.0, 12.0, 12.0, 10.0, 3.0, 8.0, 7.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8735390901565552, -0.8446713089942932, -0.8158035278320312, -0.7869357466697693, -0.7580679655075073, -0.7292001843452454, -0.7003324031829834, -0.6714646816253662, -0.6425968408584595, -0.6137290596961975, -0.5848612785339355, -0.5559934973716736, -0.5271257162094116, -0.49825793504714966, -0.4693901836872101, -0.4405224025249481, -0.41165465116500854, -0.3827868700027466, -0.3539190888404846, -0.32505130767822266, -0.2961835265159607, -0.26731574535369873, -0.23844799399375916, -0.2095802128314972, -0.18071243166923523, -0.15184465050697327, -0.1229768767952919, -0.09410910308361053, -0.06524132192134857, -0.03637354075908661, -0.00750577449798584, 0.021362006664276123, 0.05022972822189331, 0.07909750938415527, 0.10796528309583664, 0.136833056807518, 0.16570083796977997, 0.19456861913204193, 0.2234363853931427, 0.25230416655540466, 0.2811719477176666, 0.3100397288799286, 0.33890751004219055, 0.3677752614021301, 0.3966430425643921, 0.42551082372665405, 0.454378604888916, 0.483246386051178, 0.5121141672134399, 0.5409819483757019, 0.5698497295379639, 0.5987175107002258, 0.6275852918624878, 0.6564530730247498, 0.6853208541870117, 0.7141885757446289, 0.7430564165115356, 0.7719241976737976, 0.8007919788360596, 0.8296597599983215, 0.8585275411605835, 0.8873953223228455, 0.9162631034851074, 0.9451308250427246, 0.9739986062049866]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 9.0, 11.0, 9.0, 12.0, 20.0, 18.0, 14.0, 20.0, 29.0, 26.0, 40.0, 35.0, 35.0, 35.0, 37.0, 33.0, 37.0, 36.0, 48.0, 40.0, 41.0, 45.0, 38.0, 39.0, 26.0, 21.0, 24.0, 29.0, 26.0, 22.0, 23.0, 14.0, 13.0, 15.0, 10.0, 15.0, 6.0, 13.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.701171875, -2.612457275390625, -2.52374267578125, -2.435028076171875, -2.3463134765625, -2.257598876953125, -2.16888427734375, -2.080169677734375, -1.991455078125, -1.902740478515625, -1.81402587890625, -1.725311279296875, -1.6365966796875, -1.547882080078125, -1.45916748046875, -1.370452880859375, -1.28173828125, -1.193023681640625, -1.10430908203125, -1.015594482421875, -0.9268798828125, -0.838165283203125, -0.74945068359375, -0.660736083984375, -0.572021484375, -0.483306884765625, -0.39459228515625, -0.305877685546875, -0.2171630859375, -0.128448486328125, -0.03973388671875, 0.048980712890625, 0.1376953125, 0.226409912109375, 0.31512451171875, 0.403839111328125, 0.4925537109375, 0.581268310546875, 0.66998291015625, 0.758697509765625, 0.847412109375, 0.936126708984375, 1.02484130859375, 1.113555908203125, 1.2022705078125, 1.290985107421875, 1.37969970703125, 1.468414306640625, 1.55712890625, 1.645843505859375, 1.73455810546875, 1.823272705078125, 1.9119873046875, 2.000701904296875, 2.08941650390625, 2.178131103515625, 2.266845703125, 2.355560302734375, 2.44427490234375, 2.532989501953125, 2.6217041015625, 2.710418701171875, 2.79913330078125, 2.887847900390625, 2.9765625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 13.0, 13.0, 14.0, 31.0, 31.0, 45.0, 50.0, 88.0, 110.0, 166.0, 230.0, 340.0, 570.0, 924.0, 1490.0, 2540.0, 4654.0, 8524.0, 18114.0, 52040.0, 378990.0, 479591.0, 59370.0, 19580.0, 9064.0, 4827.0, 2697.0, 1600.0, 925.0, 635.0, 391.0, 263.0, 152.0, 102.0, 100.0, 64.0, 47.0, 34.0, 29.0, 20.0, 21.0, 11.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.828125, -5.6341552734375, -5.440185546875, -5.2462158203125, -5.05224609375, -4.8582763671875, -4.664306640625, -4.4703369140625, -4.2763671875, -4.0823974609375, -3.888427734375, -3.6944580078125, -3.50048828125, -3.3065185546875, -3.112548828125, -2.9185791015625, -2.724609375, -2.5306396484375, -2.336669921875, -2.1427001953125, -1.94873046875, -1.7547607421875, -1.560791015625, -1.3668212890625, -1.1728515625, -0.9788818359375, -0.784912109375, -0.5909423828125, -0.39697265625, -0.2030029296875, -0.009033203125, 0.1849365234375, 0.37890625, 0.5728759765625, 0.766845703125, 0.9608154296875, 1.15478515625, 1.3487548828125, 1.542724609375, 1.7366943359375, 1.9306640625, 2.1246337890625, 2.318603515625, 2.5125732421875, 2.70654296875, 2.9005126953125, 3.094482421875, 3.2884521484375, 3.482421875, 3.6763916015625, 3.870361328125, 4.0643310546875, 4.25830078125, 4.4522705078125, 4.646240234375, 4.8402099609375, 5.0341796875, 5.2281494140625, 5.422119140625, 5.6160888671875, 5.81005859375, 6.0040283203125, 6.197998046875, 6.3919677734375, 6.5859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 9.0, 24.0, 20.0, 22.0, 34.0, 26.0, 23.0, 41.0, 50.0, 44.0, 77.0, 108.0, 146.0, 1509.0, 261.0, 119.0, 90.0, 74.0, 50.0, 47.0, 35.0, 37.0, 29.0, 25.0, 18.0, 19.0, 10.0, 13.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.3359375, -11.970703125, -11.60546875, -11.240234375, -10.875, -10.509765625, -10.14453125, -9.779296875, -9.4140625, -9.048828125, -8.68359375, -8.318359375, -7.953125, -7.587890625, -7.22265625, -6.857421875, -6.4921875, -6.126953125, -5.76171875, -5.396484375, -5.03125, -4.666015625, -4.30078125, -3.935546875, -3.5703125, -3.205078125, -2.83984375, -2.474609375, -2.109375, -1.744140625, -1.37890625, -1.013671875, -0.6484375, -0.283203125, 0.08203125, 0.447265625, 0.8125, 1.177734375, 1.54296875, 1.908203125, 2.2734375, 2.638671875, 3.00390625, 3.369140625, 3.734375, 4.099609375, 4.46484375, 4.830078125, 5.1953125, 5.560546875, 5.92578125, 6.291015625, 6.65625, 7.021484375, 7.38671875, 7.751953125, 8.1171875, 8.482421875, 8.84765625, 9.212890625, 9.578125, 9.943359375, 10.30859375, 10.673828125, 11.0390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 7.0, 11.0, 15.0, 8.0, 19.0, 26.0, 32.0, 38.0, 53.0, 64.0, 74.0, 125.0, 159.0, 286.0, 828.0, 5503.0, 84324.0, 2962562.0, 84260.0, 5558.0, 833.0, 266.0, 156.0, 120.0, 95.0, 52.0, 53.0, 37.0, 28.0, 25.0, 22.0, 10.0, 13.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.182861328125, -22.39697265625, -21.611083984375, -20.8251953125, -20.039306640625, -19.25341796875, -18.467529296875, -17.681640625, -16.895751953125, -16.10986328125, -15.323974609375, -14.5380859375, -13.752197265625, -12.96630859375, -12.180419921875, -11.39453125, -10.608642578125, -9.82275390625, -9.036865234375, -8.2509765625, -7.465087890625, -6.67919921875, -5.893310546875, -5.107421875, -4.321533203125, -3.53564453125, -2.749755859375, -1.9638671875, -1.177978515625, -0.39208984375, 0.393798828125, 1.1796875, 1.965576171875, 2.75146484375, 3.537353515625, 4.3232421875, 5.109130859375, 5.89501953125, 6.680908203125, 7.466796875, 8.252685546875, 9.03857421875, 9.824462890625, 10.6103515625, 11.396240234375, 12.18212890625, 12.968017578125, 13.75390625, 14.539794921875, 15.32568359375, 16.111572265625, 16.8974609375, 17.683349609375, 18.46923828125, 19.255126953125, 20.041015625, 20.826904296875, 21.61279296875, 22.398681640625, 23.1845703125, 23.970458984375, 24.75634765625, 25.542236328125, 26.328125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 35.0, 102.0, 329.0, 366.0, 138.0, 34.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.385540008544922, -27.14822769165039, -24.91091537475586, -22.673603057861328, -20.436290740966797, -18.198978424072266, -15.961664199829102, -13.72435188293457, -11.487039566040039, -9.249727249145508, -7.012414455413818, -4.775101661682129, -2.5377893447875977, -0.3004770278930664, 1.9368362426757812, 4.1741485595703125, 6.411460876464844, 8.648773193359375, 10.886085510253906, 13.123398780822754, 15.360711097717285, 17.5980224609375, 19.835336685180664, 22.072649002075195, 24.309961318969727, 26.547273635864258, 28.78458595275879, 31.021900177001953, 33.259212493896484, 35.496524810791016, 37.73383712768555, 39.97114944458008, 42.208457946777344, 44.445770263671875, 46.683082580566406, 48.92039489746094, 51.15770721435547, 53.39501953125, 55.63233184814453, 57.86964416503906, 60.106956481933594, 62.344268798828125, 64.58158111572266, 66.81889343261719, 69.05620574951172, 71.29351806640625, 73.53083038330078, 75.76814270019531, 78.00546264648438, 80.2427749633789, 82.48008728027344, 84.71739959716797, 86.9547119140625, 89.19202423095703, 91.42933654785156, 93.6666488647461, 95.90396118164062, 98.14127349853516, 100.37858581542969, 102.61589813232422, 104.85321044921875, 107.09052276611328, 109.32783508300781, 111.56514739990234, 113.80245971679688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 4.0, 6.0, 7.0, 7.0, 11.0, 14.0, 7.0, 14.0, 21.0, 18.0, 16.0, 28.0, 30.0, 24.0, 34.0, 35.0, 38.0, 44.0, 33.0, 48.0, 43.0, 47.0, 40.0, 43.0, 43.0, 33.0, 40.0, 40.0, 31.0, 41.0, 43.0, 19.0, 12.0, 16.0, 10.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.859025955200195, -28.9013614654541, -27.94369888305664, -26.986034393310547, -26.028371810913086, -25.070707321166992, -24.11304473876953, -23.155380249023438, -22.197715759277344, -21.24005126953125, -20.28238868713379, -19.324724197387695, -18.367061614990234, -17.40939712524414, -16.451732635498047, -15.494070053100586, -14.536407470703125, -13.578743934631348, -12.62108039855957, -11.663415908813477, -10.705753326416016, -9.748088836669922, -8.790425300598145, -7.832761764526367, -6.87509822845459, -5.9174346923828125, -4.959771156311035, -4.0021071434021, -3.0444436073303223, -2.086780071258545, -1.1291160583496094, -0.17145252227783203, 0.7862110137939453, 1.7438746690750122, 2.701538324356079, 3.6592020988464355, 4.616865634918213, 5.57452917098999, 6.532193183898926, 7.489856719970703, 8.44752025604248, 9.405183792114258, 10.362847328186035, 11.320510864257812, 12.278175354003906, 13.235837936401367, 14.193502426147461, 15.151165962219238, 16.108829498291016, 17.06649398803711, 18.02415657043457, 18.981821060180664, 19.939483642578125, 20.89714813232422, 21.854812622070312, 22.812475204467773, 23.770137786865234, 24.727802276611328, 25.68546485900879, 26.643129348754883, 27.600791931152344, 28.558456420898438, 29.51612091064453, 30.473783493041992, 31.431447982788086]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 7.0, 11.0, 13.0, 14.0, 17.0, 15.0, 19.0, 23.0, 27.0, 22.0, 23.0, 38.0, 34.0, 32.0, 35.0, 40.0, 32.0, 39.0, 53.0, 34.0, 43.0, 56.0, 47.0, 29.0, 21.0, 36.0, 22.0, 34.0, 27.0, 24.0, 21.0, 23.0, 13.0, 15.0, 12.0, 10.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.938720703125, -2.83642578125, -2.734130859375, -2.6318359375, -2.529541015625, -2.42724609375, -2.324951171875, -2.22265625, -2.120361328125, -2.01806640625, -1.915771484375, -1.8134765625, -1.711181640625, -1.60888671875, -1.506591796875, -1.404296875, -1.302001953125, -1.19970703125, -1.097412109375, -0.9951171875, -0.892822265625, -0.79052734375, -0.688232421875, -0.5859375, -0.483642578125, -0.38134765625, -0.279052734375, -0.1767578125, -0.074462890625, 0.02783203125, 0.130126953125, 0.232421875, 0.334716796875, 0.43701171875, 0.539306640625, 0.6416015625, 0.743896484375, 0.84619140625, 0.948486328125, 1.05078125, 1.153076171875, 1.25537109375, 1.357666015625, 1.4599609375, 1.562255859375, 1.66455078125, 1.766845703125, 1.869140625, 1.971435546875, 2.07373046875, 2.176025390625, 2.2783203125, 2.380615234375, 2.48291015625, 2.585205078125, 2.6875, 2.789794921875, 2.89208984375, 2.994384765625, 3.0966796875, 3.198974609375, 3.30126953125, 3.403564453125, 3.505859375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 6.0, 9.0, 11.0, 11.0, 15.0, 30.0, 34.0, 63.0, 83.0, 111.0, 136.0, 191.0, 298.0, 420.0, 735.0, 1224.0, 2267.0, 4365.0, 9227.0, 21311.0, 62264.0, 451353.0, 2985198.0, 542965.0, 68253.0, 23040.0, 9962.0, 4723.0, 2315.0, 1304.0, 761.0, 502.0, 311.0, 232.0, 153.0, 93.0, 74.0, 61.0, 37.0, 32.0, 30.0, 12.0, 17.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.2109375, -8.9188232421875, -8.626708984375, -8.3345947265625, -8.04248046875, -7.7503662109375, -7.458251953125, -7.1661376953125, -6.8740234375, -6.5819091796875, -6.289794921875, -5.9976806640625, -5.70556640625, -5.4134521484375, -5.121337890625, -4.8292236328125, -4.537109375, -4.2449951171875, -3.952880859375, -3.6607666015625, -3.36865234375, -3.0765380859375, -2.784423828125, -2.4923095703125, -2.2001953125, -1.9080810546875, -1.615966796875, -1.3238525390625, -1.03173828125, -0.7396240234375, -0.447509765625, -0.1553955078125, 0.13671875, 0.4288330078125, 0.720947265625, 1.0130615234375, 1.30517578125, 1.5972900390625, 1.889404296875, 2.1815185546875, 2.4736328125, 2.7657470703125, 3.057861328125, 3.3499755859375, 3.64208984375, 3.9342041015625, 4.226318359375, 4.5184326171875, 4.810546875, 5.1026611328125, 5.394775390625, 5.6868896484375, 5.97900390625, 6.2711181640625, 6.563232421875, 6.8553466796875, 7.1474609375, 7.4395751953125, 7.731689453125, 8.0238037109375, 8.31591796875, 8.6080322265625, 8.900146484375, 9.1922607421875, 9.484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 4.0, 4.0, 8.0, 13.0, 22.0, 27.0, 25.0, 26.0, 43.0, 67.0, 79.0, 81.0, 148.0, 200.0, 350.0, 557.0, 701.0, 543.0, 343.0, 241.0, 125.0, 100.0, 76.0, 64.0, 47.0, 41.0, 31.0, 18.0, 16.0, 9.0, 14.0, 9.0, 10.0, 11.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.15203857421875, -6.9251708984375, -6.69830322265625, -6.471435546875, -6.24456787109375, -6.0177001953125, -5.79083251953125, -5.56396484375, -5.33709716796875, -5.1102294921875, -4.88336181640625, -4.656494140625, -4.42962646484375, -4.2027587890625, -3.97589111328125, -3.7490234375, -3.52215576171875, -3.2952880859375, -3.06842041015625, -2.841552734375, -2.61468505859375, -2.3878173828125, -2.16094970703125, -1.93408203125, -1.70721435546875, -1.4803466796875, -1.25347900390625, -1.026611328125, -0.79974365234375, -0.5728759765625, -0.34600830078125, -0.119140625, 0.10772705078125, 0.3345947265625, 0.56146240234375, 0.788330078125, 1.01519775390625, 1.2420654296875, 1.46893310546875, 1.69580078125, 1.92266845703125, 2.1495361328125, 2.37640380859375, 2.603271484375, 2.83013916015625, 3.0570068359375, 3.28387451171875, 3.5107421875, 3.73760986328125, 3.9644775390625, 4.19134521484375, 4.418212890625, 4.64508056640625, 4.8719482421875, 5.09881591796875, 5.32568359375, 5.55255126953125, 5.7794189453125, 6.00628662109375, 6.233154296875, 6.46002197265625, 6.6868896484375, 6.91375732421875, 7.140625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 9.0, 16.0, 8.0, 21.0, 20.0, 28.0, 41.0, 50.0, 70.0, 71.0, 136.0, 256.0, 854.0, 5022.0, 82183.0, 3880748.0, 213433.0, 9246.0, 1175.0, 328.0, 144.0, 107.0, 80.0, 43.0, 35.0, 27.0, 21.0, 24.0, 23.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.90625, -29.928955078125, -28.95166015625, -27.974365234375, -26.9970703125, -26.019775390625, -25.04248046875, -24.065185546875, -23.087890625, -22.110595703125, -21.13330078125, -20.156005859375, -19.1787109375, -18.201416015625, -17.22412109375, -16.246826171875, -15.26953125, -14.292236328125, -13.31494140625, -12.337646484375, -11.3603515625, -10.383056640625, -9.40576171875, -8.428466796875, -7.451171875, -6.473876953125, -5.49658203125, -4.519287109375, -3.5419921875, -2.564697265625, -1.58740234375, -0.610107421875, 0.3671875, 1.344482421875, 2.32177734375, 3.299072265625, 4.2763671875, 5.253662109375, 6.23095703125, 7.208251953125, 8.185546875, 9.162841796875, 10.14013671875, 11.117431640625, 12.0947265625, 13.072021484375, 14.04931640625, 15.026611328125, 16.00390625, 16.981201171875, 17.95849609375, 18.935791015625, 19.9130859375, 20.890380859375, 21.86767578125, 22.844970703125, 23.822265625, 24.799560546875, 25.77685546875, 26.754150390625, 27.7314453125, 28.708740234375, 29.68603515625, 30.663330078125, 31.640625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 13.0, 21.0, 39.0, 74.0, 139.0, 213.0, 209.0, 130.0, 80.0, 40.0, 23.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62064743041992, -52.782440185546875, -50.944236755371094, -49.10602951049805, -47.267822265625, -45.42961883544922, -43.59141159057617, -41.753204345703125, -39.915000915527344, -38.0767936706543, -36.238590240478516, -34.40038299560547, -32.56217575073242, -30.723970413208008, -28.885765075683594, -27.047557830810547, -25.2093505859375, -23.371145248413086, -21.53293800354004, -19.694732666015625, -17.856525421142578, -16.018320083618164, -14.18011474609375, -12.34190845489502, -10.503702163696289, -8.665495872497559, -6.827290058135986, -4.989084243774414, -3.1508779525756836, -1.3126716613769531, 0.5255336761474609, 2.3637399673461914, 4.201946258544922, 6.040152549743652, 7.878358364105225, 9.716564178466797, 11.554770469665527, 13.392976760864258, 15.231182098388672, 17.06938934326172, 18.907594680786133, 20.745800018310547, 22.584007263183594, 24.422212600708008, 26.260417938232422, 28.09862518310547, 29.936830520629883, 31.775035858154297, 33.613243103027344, 35.45145034790039, 37.28965377807617, 39.12786102294922, 40.966068267822266, 42.80427551269531, 44.642478942871094, 46.48068618774414, 48.31889343261719, 50.157100677490234, 51.995304107666016, 53.83351135253906, 55.67171859741211, 57.509925842285156, 59.34812927246094, 61.186336517333984, 63.024539947509766]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 12.0, 10.0, 17.0, 20.0, 15.0, 24.0, 34.0, 34.0, 42.0, 27.0, 27.0, 44.0, 56.0, 37.0, 39.0, 48.0, 42.0, 37.0, 39.0, 38.0, 33.0, 30.0, 34.0, 30.0, 32.0, 25.0, 15.0, 24.0, 22.0, 19.0, 9.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.095863342285156, -21.375322341918945, -20.6547794342041, -19.93423843383789, -19.213695526123047, -18.493154525756836, -17.772613525390625, -17.05207061767578, -16.33152961730957, -15.610987663269043, -14.890445709228516, -14.169904708862305, -13.449362754821777, -12.72882080078125, -12.008279800415039, -11.287737846374512, -10.567195892333984, -9.846653938293457, -9.12611198425293, -8.405570983886719, -7.685029029846191, -6.964487075805664, -6.243945598602295, -5.523404121398926, -4.802862167358398, -4.082320213317871, -3.361778736114502, -2.6412370204925537, -1.9206953048706055, -1.2001535892486572, -0.479611873626709, 0.24092960357666016, 0.9614734649658203, 1.6820151805877686, 2.402556896209717, 3.123098611831665, 3.8436403274536133, 4.564182281494141, 5.28472375869751, 6.005265235900879, 6.725807189941406, 7.446349143981934, 8.166891098022461, 8.887432098388672, 9.6079740524292, 10.328516006469727, 11.049057006835938, 11.769598960876465, 12.490140914916992, 13.21068286895752, 13.931224822998047, 14.651765823364258, 15.372307777404785, 16.092849731445312, 16.813390731811523, 17.533931732177734, 18.254474639892578, 18.97501564025879, 19.695558547973633, 20.416099548339844, 21.136642456054688, 21.8571834564209, 22.57772445678711, 23.298267364501953, 24.018808364868164]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 4.0, 9.0, 10.0, 16.0, 14.0, 13.0, 14.0, 21.0, 22.0, 25.0, 25.0, 29.0, 33.0, 46.0, 39.0, 49.0, 36.0, 40.0, 42.0, 46.0, 26.0, 52.0, 63.0, 37.0, 35.0, 31.0, 21.0, 20.0, 24.0, 39.0, 16.0, 13.0, 25.0, 9.0, 16.0, 12.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.835906982421875, -2.73040771484375, -2.624908447265625, -2.5194091796875, -2.413909912109375, -2.30841064453125, -2.202911376953125, -2.097412109375, -1.991912841796875, -1.88641357421875, -1.780914306640625, -1.6754150390625, -1.569915771484375, -1.46441650390625, -1.358917236328125, -1.25341796875, -1.147918701171875, -1.04241943359375, -0.936920166015625, -0.8314208984375, -0.725921630859375, -0.62042236328125, -0.514923095703125, -0.409423828125, -0.303924560546875, -0.19842529296875, -0.092926025390625, 0.0125732421875, 0.118072509765625, 0.22357177734375, 0.329071044921875, 0.4345703125, 0.540069580078125, 0.64556884765625, 0.751068115234375, 0.8565673828125, 0.962066650390625, 1.06756591796875, 1.173065185546875, 1.278564453125, 1.384063720703125, 1.48956298828125, 1.595062255859375, 1.7005615234375, 1.806060791015625, 1.91156005859375, 2.017059326171875, 2.12255859375, 2.228057861328125, 2.33355712890625, 2.439056396484375, 2.5445556640625, 2.650054931640625, 2.75555419921875, 2.861053466796875, 2.966552734375, 3.072052001953125, 3.17755126953125, 3.283050537109375, 3.3885498046875, 3.494049072265625, 3.59954833984375, 3.705047607421875, 3.810546875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 20.0, 13.0, 29.0, 70.0, 156.0, 308.0, 610.0, 1424.0, 3555.0, 11157.0, 76747.0, 815142.0, 118219.0, 14017.0, 4024.0, 1623.0, 756.0, 309.0, 157.0, 87.0, 46.0, 24.0, 11.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.44921875, -4.32415771484375, -4.1990966796875, -4.07403564453125, -3.948974609375, -3.82391357421875, -3.6988525390625, -3.57379150390625, -3.44873046875, -3.32366943359375, -3.1986083984375, -3.07354736328125, -2.948486328125, -2.82342529296875, -2.6983642578125, -2.57330322265625, -2.4482421875, -2.32318115234375, -2.1981201171875, -2.07305908203125, -1.947998046875, -1.82293701171875, -1.6978759765625, -1.57281494140625, -1.44775390625, -1.32269287109375, -1.1976318359375, -1.07257080078125, -0.947509765625, -0.82244873046875, -0.6973876953125, -0.57232666015625, -0.447265625, -0.32220458984375, -0.1971435546875, -0.07208251953125, 0.052978515625, 0.17803955078125, 0.3031005859375, 0.42816162109375, 0.55322265625, 0.67828369140625, 0.8033447265625, 0.92840576171875, 1.053466796875, 1.17852783203125, 1.3035888671875, 1.42864990234375, 1.5537109375, 1.67877197265625, 1.8038330078125, 1.92889404296875, 2.053955078125, 2.17901611328125, 2.3040771484375, 2.42913818359375, 2.55419921875, 2.67926025390625, 2.8043212890625, 2.92938232421875, 3.054443359375, 3.17950439453125, 3.3045654296875, 3.42962646484375, 3.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 10.0, 9.0, 11.0, 17.0, 11.0, 16.0, 15.0, 26.0, 21.0, 24.0, 33.0, 24.0, 35.0, 38.0, 25.0, 37.0, 47.0, 1066.0, 34.0, 41.0, 46.0, 45.0, 44.0, 35.0, 31.0, 35.0, 33.0, 25.0, 34.0, 13.0, 18.0, 16.0, 22.0, 10.0, 5.0, 12.0, 7.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.44921875, -2.370208740234375, -2.29119873046875, -2.212188720703125, -2.1331787109375, -2.054168701171875, -1.97515869140625, -1.896148681640625, -1.817138671875, -1.738128662109375, -1.65911865234375, -1.580108642578125, -1.5010986328125, -1.422088623046875, -1.34307861328125, -1.264068603515625, -1.18505859375, -1.106048583984375, -1.02703857421875, -0.948028564453125, -0.8690185546875, -0.790008544921875, -0.71099853515625, -0.631988525390625, -0.552978515625, -0.473968505859375, -0.39495849609375, -0.315948486328125, -0.2369384765625, -0.157928466796875, -0.07891845703125, 9.1552734375e-05, 0.0791015625, 0.158111572265625, 0.23712158203125, 0.316131591796875, 0.3951416015625, 0.474151611328125, 0.55316162109375, 0.632171630859375, 0.711181640625, 0.790191650390625, 0.86920166015625, 0.948211669921875, 1.0272216796875, 1.106231689453125, 1.18524169921875, 1.264251708984375, 1.34326171875, 1.422271728515625, 1.50128173828125, 1.580291748046875, 1.6593017578125, 1.738311767578125, 1.81732177734375, 1.896331787109375, 1.975341796875, 2.054351806640625, 2.13336181640625, 2.212371826171875, 2.2913818359375, 2.370391845703125, 2.44940185546875, 2.528411865234375, 2.607421875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 3.0, 6.0, 5.0, 17.0, 33.0, 48.0, 56.0, 103.0, 131.0, 244.0, 379.0, 569.0, 999.0, 1877.0, 3985.0, 12042.0, 74235.0, 1792372.0, 180284.0, 18799.0, 5510.0, 2288.0, 1223.0, 754.0, 432.0, 248.0, 177.0, 102.0, 71.0, 41.0, 31.0, 20.0, 7.0, 10.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.505859375, -2.4374847412109375, -2.369110107421875, -2.3007354736328125, -2.23236083984375, -2.1639862060546875, -2.095611572265625, -2.0272369384765625, -1.9588623046875, -1.8904876708984375, -1.822113037109375, -1.7537384033203125, -1.68536376953125, -1.6169891357421875, -1.548614501953125, -1.4802398681640625, -1.411865234375, -1.3434906005859375, -1.275115966796875, -1.2067413330078125, -1.13836669921875, -1.0699920654296875, -1.001617431640625, -0.9332427978515625, -0.8648681640625, -0.7964935302734375, -0.728118896484375, -0.6597442626953125, -0.59136962890625, -0.5229949951171875, -0.454620361328125, -0.3862457275390625, -0.31787109375, -0.2494964599609375, -0.181121826171875, -0.1127471923828125, -0.04437255859375, 0.0240020751953125, 0.092376708984375, 0.1607513427734375, 0.2291259765625, 0.2975006103515625, 0.365875244140625, 0.4342498779296875, 0.50262451171875, 0.5709991455078125, 0.639373779296875, 0.7077484130859375, 0.776123046875, 0.8444976806640625, 0.912872314453125, 0.9812469482421875, 1.04962158203125, 1.1179962158203125, 1.186370849609375, 1.2547454833984375, 1.3231201171875, 1.3914947509765625, 1.459869384765625, 1.5282440185546875, 1.59661865234375, 1.6649932861328125, 1.733367919921875, 1.8017425537109375, 1.8701171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 30.0, 37.0, 77.0, 94.0, 207.0, 206.0, 137.0, 72.0, 55.0, 19.0, 25.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4054222106933594, -0.39238739013671875, -0.3793525695800781, -0.3663177490234375, -0.3532829284667969, -0.34024810791015625, -0.3272132873535156, -0.314178466796875, -0.3011436462402344, -0.28810882568359375, -0.2750740051269531, -0.2620391845703125, -0.24900436401367188, -0.23596954345703125, -0.22293472290039062, -0.20989990234375, -0.19686508178710938, -0.18383026123046875, -0.17079544067382812, -0.1577606201171875, -0.14472579956054688, -0.13169097900390625, -0.11865615844726562, -0.105621337890625, -0.09258651733398438, -0.07955169677734375, -0.06651687622070312, -0.0534820556640625, -0.040447235107421875, -0.02741241455078125, -0.014377593994140625, -0.0013427734375, 0.011692047119140625, 0.02472686767578125, 0.037761688232421875, 0.0507965087890625, 0.06383132934570312, 0.07686614990234375, 0.08990097045898438, 0.102935791015625, 0.11597061157226562, 0.12900543212890625, 0.14204025268554688, 0.1550750732421875, 0.16810989379882812, 0.18114471435546875, 0.19417953491210938, 0.20721435546875, 0.22024917602539062, 0.23328399658203125, 0.24631881713867188, 0.2593536376953125, 0.2723884582519531, 0.28542327880859375, 0.2984580993652344, 0.311492919921875, 0.3245277404785156, 0.33756256103515625, 0.3505973815917969, 0.3636322021484375, 0.3766670227050781, 0.38970184326171875, 0.4027366638183594, 0.415771484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 27.0, 36.0, 85.0, 170.0, 1145.0, 226177.0, 819212.0, 1348.0, 162.0, 67.0, 45.0, 21.0, 9.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.62060546875, -8.3427734375, -8.06494140625, -7.787109375, -7.50927734375, -7.2314453125, -6.95361328125, -6.67578125, -6.39794921875, -6.1201171875, -5.84228515625, -5.564453125, -5.28662109375, -5.0087890625, -4.73095703125, -4.453125, -4.17529296875, -3.8974609375, -3.61962890625, -3.341796875, -3.06396484375, -2.7861328125, -2.50830078125, -2.23046875, -1.95263671875, -1.6748046875, -1.39697265625, -1.119140625, -0.84130859375, -0.5634765625, -0.28564453125, -0.0078125, 0.27001953125, 0.5478515625, 0.82568359375, 1.103515625, 1.38134765625, 1.6591796875, 1.93701171875, 2.21484375, 2.49267578125, 2.7705078125, 3.04833984375, 3.326171875, 3.60400390625, 3.8818359375, 4.15966796875, 4.4375, 4.71533203125, 4.9931640625, 5.27099609375, 5.548828125, 5.82666015625, 6.1044921875, 6.38232421875, 6.66015625, 6.93798828125, 7.2158203125, 7.49365234375, 7.771484375, 8.04931640625, 8.3271484375, 8.60498046875, 8.8828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 22.0, 28.0, 23.0, 52.0, 79.0, 121.0, 136.0, 161.0, 99.0, 82.0, 54.0, 41.0, 26.0, 22.0, 14.0, 14.0, 8.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18939897418022156, -0.1777198165655136, -0.16604065895080566, -0.1543615162372589, -0.14268234372138977, -0.13100320100784302, -0.11932404339313507, -0.10764488577842712, -0.09596572816371918, -0.08428657054901123, -0.07260741293430328, -0.060928262770175934, -0.04924910515546799, -0.03756994754076004, -0.02589079737663269, -0.014211639761924744, -0.002532482147216797, 0.009146673604846, 0.020825829356908798, 0.03250498324632645, 0.04418414086103439, 0.05586329847574234, 0.06754244863986969, 0.07922160625457764, 0.09090076386928558, 0.10257992148399353, 0.11425907909870148, 0.12593823671340942, 0.13761737942695618, 0.14929655194282532, 0.16097569465637207, 0.17265485227108002, 0.18433398008346558, 0.19601313769817352, 0.20769229531288147, 0.21937143802642822, 0.23105061054229736, 0.24272975325584412, 0.25440889596939087, 0.26608806848526, 0.27776724100112915, 0.2894463837146759, 0.30112555623054504, 0.3128046989440918, 0.32448387145996094, 0.3361630141735077, 0.34784215688705444, 0.3595213294029236, 0.37120047211647034, 0.3828796148300171, 0.39455878734588623, 0.406237930059433, 0.4179171025753021, 0.4295962452888489, 0.441275417804718, 0.45295456051826477, 0.4646337032318115, 0.4763128459453583, 0.4879920184612274, 0.49967116117477417, 0.5113503336906433, 0.5230295062065125, 0.5347086191177368, 0.546387791633606, 0.5580669641494751]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 4.0, 14.0, 16.0, 18.0, 16.0, 22.0, 30.0, 17.0, 28.0, 29.0, 29.0, 31.0, 40.0, 38.0, 39.0, 39.0, 44.0, 44.0, 34.0, 37.0, 31.0, 35.0, 29.0, 28.0, 38.0, 34.0, 21.0, 21.0, 21.0, 18.0, 19.0, 14.0, 14.0, 15.0, 11.0, 7.0, 12.0, 5.0, 2.0, 1.0, 4.0, 9.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.17023152112960815, -0.16418780386447906, -0.15814407169818878, -0.1521003544330597, -0.1460566222667694, -0.14001290500164032, -0.13396918773651123, -0.12792545557022095, -0.12188173830509186, -0.11583801358938217, -0.10979428887367249, -0.1037505716085434, -0.09770684689283371, -0.09166312217712402, -0.08561940491199493, -0.07957568019628525, -0.07353195548057556, -0.06748823076486588, -0.06144450977444649, -0.0554007887840271, -0.04935706406831741, -0.04331333935260773, -0.03726961836218834, -0.03122589737176895, -0.025182172656059265, -0.019138449802994728, -0.013094726949930191, -0.007051004096865654, -0.001007281243801117, 0.00503644160926342, 0.011080164462327957, 0.017123885452747345, 0.02316761016845703, 0.02921133302152157, 0.035255055874586105, 0.04129877686500549, 0.04734250158071518, 0.053386226296424866, 0.059429947286844254, 0.06547366827726364, 0.07151739299297333, 0.07756111770868301, 0.0836048424243927, 0.08964855968952179, 0.09569228440523148, 0.10173600912094116, 0.10777972638607025, 0.11382345110177994, 0.11986717581748962, 0.1259108930826187, 0.131954625248909, 0.13799834251403809, 0.14404207468032837, 0.15008579194545746, 0.15612950921058655, 0.16217324137687683, 0.16821695864200592, 0.174260675907135, 0.1803044080734253, 0.18634812533855438, 0.19239184260368347, 0.19843557476997375, 0.20447929203510284, 0.21052300930023193, 0.21656674146652222]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 5.0, 7.0, 11.0, 10.0, 20.0, 20.0, 16.0, 22.0, 27.0, 29.0, 28.0, 34.0, 44.0, 32.0, 39.0, 40.0, 36.0, 35.0, 43.0, 43.0, 48.0, 46.0, 35.0, 33.0, 35.0, 29.0, 34.0, 30.0, 20.0, 10.0, 25.0, 21.0, 15.0, 18.0, 9.0, 8.0, 5.0, 6.0, 2.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.061492919921875, -2.96087646484375, -2.860260009765625, -2.7596435546875, -2.659027099609375, -2.55841064453125, -2.457794189453125, -2.357177734375, -2.256561279296875, -2.15594482421875, -2.055328369140625, -1.9547119140625, -1.854095458984375, -1.75347900390625, -1.652862548828125, -1.55224609375, -1.451629638671875, -1.35101318359375, -1.250396728515625, -1.1497802734375, -1.049163818359375, -0.94854736328125, -0.847930908203125, -0.747314453125, -0.646697998046875, -0.54608154296875, -0.445465087890625, -0.3448486328125, -0.244232177734375, -0.14361572265625, -0.042999267578125, 0.0576171875, 0.158233642578125, 0.25885009765625, 0.359466552734375, 0.4600830078125, 0.560699462890625, 0.66131591796875, 0.761932373046875, 0.862548828125, 0.963165283203125, 1.06378173828125, 1.164398193359375, 1.2650146484375, 1.365631103515625, 1.46624755859375, 1.566864013671875, 1.66748046875, 1.768096923828125, 1.86871337890625, 1.969329833984375, 2.0699462890625, 2.170562744140625, 2.27117919921875, 2.371795654296875, 2.472412109375, 2.573028564453125, 2.67364501953125, 2.774261474609375, 2.8748779296875, 2.975494384765625, 3.07611083984375, 3.176727294921875, 3.27734375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 11.0, 15.0, 25.0, 42.0, 59.0, 87.0, 157.0, 204.0, 301.0, 446.0, 727.0, 1149.0, 1844.0, 2985.0, 4821.0, 8380.0, 14807.0, 28000.0, 58374.0, 166206.0, 493608.0, 150768.0, 54672.0, 26346.0, 14061.0, 7995.0, 4713.0, 2917.0, 1746.0, 1043.0, 730.0, 451.0, 283.0, 202.0, 118.0, 98.0, 47.0, 31.0, 18.0, 16.0, 16.0, 13.0, 12.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.18878173828125, -5.0064697265625, -4.82415771484375, -4.641845703125, -4.45953369140625, -4.2772216796875, -4.09490966796875, -3.91259765625, -3.73028564453125, -3.5479736328125, -3.36566162109375, -3.183349609375, -3.00103759765625, -2.8187255859375, -2.63641357421875, -2.4541015625, -2.27178955078125, -2.0894775390625, -1.90716552734375, -1.724853515625, -1.54254150390625, -1.3602294921875, -1.17791748046875, -0.99560546875, -0.81329345703125, -0.6309814453125, -0.44866943359375, -0.266357421875, -0.08404541015625, 0.0982666015625, 0.28057861328125, 0.462890625, 0.64520263671875, 0.8275146484375, 1.00982666015625, 1.192138671875, 1.37445068359375, 1.5567626953125, 1.73907470703125, 1.92138671875, 2.10369873046875, 2.2860107421875, 2.46832275390625, 2.650634765625, 2.83294677734375, 3.0152587890625, 3.19757080078125, 3.3798828125, 3.56219482421875, 3.7445068359375, 3.92681884765625, 4.109130859375, 4.29144287109375, 4.4737548828125, 4.65606689453125, 4.83837890625, 5.02069091796875, 5.2030029296875, 5.38531494140625, 5.567626953125, 5.74993896484375, 5.9322509765625, 6.11456298828125, 6.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 4.0, 4.0, 4.0, 10.0, 7.0, 16.0, 17.0, 16.0, 17.0, 19.0, 29.0, 29.0, 33.0, 39.0, 45.0, 52.0, 48.0, 84.0, 131.0, 241.0, 1467.0, 196.0, 94.0, 68.0, 60.0, 38.0, 39.0, 28.0, 31.0, 27.0, 29.0, 20.0, 11.0, 11.0, 13.0, 13.0, 10.0, 9.0, 5.0, 8.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.1171875, -9.8043212890625, -9.491455078125, -9.1785888671875, -8.86572265625, -8.5528564453125, -8.239990234375, -7.9271240234375, -7.6142578125, -7.3013916015625, -6.988525390625, -6.6756591796875, -6.36279296875, -6.0499267578125, -5.737060546875, -5.4241943359375, -5.111328125, -4.7984619140625, -4.485595703125, -4.1727294921875, -3.85986328125, -3.5469970703125, -3.234130859375, -2.9212646484375, -2.6083984375, -2.2955322265625, -1.982666015625, -1.6697998046875, -1.35693359375, -1.0440673828125, -0.731201171875, -0.4183349609375, -0.10546875, 0.2073974609375, 0.520263671875, 0.8331298828125, 1.14599609375, 1.4588623046875, 1.771728515625, 2.0845947265625, 2.3974609375, 2.7103271484375, 3.023193359375, 3.3360595703125, 3.64892578125, 3.9617919921875, 4.274658203125, 4.5875244140625, 4.900390625, 5.2132568359375, 5.526123046875, 5.8389892578125, 6.15185546875, 6.4647216796875, 6.777587890625, 7.0904541015625, 7.4033203125, 7.7161865234375, 8.029052734375, 8.3419189453125, 8.65478515625, 8.9676513671875, 9.280517578125, 9.5933837890625, 9.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 10.0, 23.0, 13.0, 32.0, 36.0, 41.0, 75.0, 125.0, 184.0, 313.0, 862.0, 4628.0, 59142.0, 2921844.0, 148044.0, 7972.0, 1324.0, 381.0, 209.0, 125.0, 82.0, 70.0, 45.0, 30.0, 25.0, 14.0, 12.0, 11.0, 10.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.63818359375, -17.7763671875, -16.91455078125, -16.052734375, -15.19091796875, -14.3291015625, -13.46728515625, -12.60546875, -11.74365234375, -10.8818359375, -10.02001953125, -9.158203125, -8.29638671875, -7.4345703125, -6.57275390625, -5.7109375, -4.84912109375, -3.9873046875, -3.12548828125, -2.263671875, -1.40185546875, -0.5400390625, 0.32177734375, 1.18359375, 2.04541015625, 2.9072265625, 3.76904296875, 4.630859375, 5.49267578125, 6.3544921875, 7.21630859375, 8.078125, 8.93994140625, 9.8017578125, 10.66357421875, 11.525390625, 12.38720703125, 13.2490234375, 14.11083984375, 14.97265625, 15.83447265625, 16.6962890625, 17.55810546875, 18.419921875, 19.28173828125, 20.1435546875, 21.00537109375, 21.8671875, 22.72900390625, 23.5908203125, 24.45263671875, 25.314453125, 26.17626953125, 27.0380859375, 27.89990234375, 28.76171875, 29.62353515625, 30.4853515625, 31.34716796875, 32.208984375, 33.07080078125, 33.9326171875, 34.79443359375, 35.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 200.0, 716.0, 91.0, 0.0, 2.0], "bins": [-305.0229797363281, -299.96630859375, -294.90960693359375, -289.8529357910156, -284.7962646484375, -279.73956298828125, -274.6828918457031, -269.626220703125, -264.56951904296875, -259.5128479003906, -254.45616149902344, -249.39947509765625, -244.34278869628906, -239.28610229492188, -234.22943115234375, -229.17274475097656, -224.11605834960938, -219.0593719482422, -214.00270080566406, -208.94601440429688, -203.8893280029297, -198.8326416015625, -193.77597045898438, -188.7192840576172, -183.66261291503906, -178.60592651367188, -173.54925537109375, -168.49256896972656, -163.43588256835938, -158.3791961669922, -153.32252502441406, -148.26583862304688, -143.2091522216797, -138.1524658203125, -133.09579467773438, -128.0391082763672, -122.982421875, -117.92574310302734, -112.86906433105469, -107.8123779296875, -102.75569152832031, -97.69901275634766, -92.64232635498047, -87.58564758300781, -82.52896118164062, -77.47228240966797, -72.41560363769531, -67.35891723632812, -62.30223846435547, -57.24555587768555, -52.188873291015625, -47.13219451904297, -42.07550811767578, -37.018829345703125, -31.962146759033203, -26.90546417236328, -21.84878158569336, -16.792098999023438, -11.735417366027832, -6.678735733032227, -1.6220531463623047, 3.434629440307617, 8.491310119628906, 13.547992706298828, 18.60467529296875]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 11.0, 13.0, 11.0, 8.0, 14.0, 18.0, 18.0, 14.0, 29.0, 28.0, 30.0, 38.0, 39.0, 43.0, 52.0, 47.0, 46.0, 42.0, 48.0, 38.0, 42.0, 34.0, 42.0, 38.0, 32.0, 38.0, 31.0, 25.0, 15.0, 25.0, 20.0, 17.0, 18.0, 8.0, 6.0, 6.0, 8.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.94982147216797, -27.997146606445312, -27.04447364807129, -26.091798782348633, -25.139123916625977, -24.186450958251953, -23.233776092529297, -22.28110122680664, -21.328428268432617, -20.37575340270996, -19.423080444335938, -18.47040557861328, -17.517730712890625, -16.5650577545166, -15.612382888793945, -14.659708976745605, -13.70703411102295, -12.75436019897461, -11.801685333251953, -10.849011421203613, -9.896337509155273, -8.943662643432617, -7.990988731384277, -7.0383148193359375, -6.0856404304504395, -5.132966041564941, -4.180292129516602, -3.2276177406311035, -2.2749435901641846, -1.3222694396972656, -0.3695950508117676, 0.5830788612365723, 1.5357532501220703, 2.4884274005889893, 3.441101551055908, 4.393775939941406, 5.346449851989746, 6.299124240875244, 7.251798629760742, 8.204472541809082, 9.157146453857422, 10.109820365905762, 11.062495231628418, 12.015169143676758, 12.967843055725098, 13.920516967773438, 14.873191833496094, 15.825865745544434, 16.778541564941406, 17.731216430664062, 18.683889389038086, 19.636564254760742, 20.5892391204834, 21.541912078857422, 22.494586944580078, 23.447261810302734, 24.399934768676758, 25.352609634399414, 26.305282592773438, 27.257957458496094, 28.21063232421875, 29.163305282592773, 30.11598014831543, 31.068653106689453, 32.02132797241211]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 13.0, 7.0, 9.0, 14.0, 18.0, 21.0, 16.0, 25.0, 39.0, 43.0, 25.0, 45.0, 42.0, 37.0, 52.0, 39.0, 65.0, 50.0, 43.0, 48.0, 38.0, 40.0, 33.0, 31.0, 27.0, 26.0, 24.0, 17.0, 28.0, 17.0, 10.0, 16.0, 3.0, 7.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.2890625, -4.16485595703125, -4.0406494140625, -3.91644287109375, -3.792236328125, -3.66802978515625, -3.5438232421875, -3.41961669921875, -3.29541015625, -3.17120361328125, -3.0469970703125, -2.92279052734375, -2.798583984375, -2.67437744140625, -2.5501708984375, -2.42596435546875, -2.3017578125, -2.17755126953125, -2.0533447265625, -1.92913818359375, -1.804931640625, -1.68072509765625, -1.5565185546875, -1.43231201171875, -1.30810546875, -1.18389892578125, -1.0596923828125, -0.93548583984375, -0.811279296875, -0.68707275390625, -0.5628662109375, -0.43865966796875, -0.314453125, -0.19024658203125, -0.0660400390625, 0.05816650390625, 0.182373046875, 0.30657958984375, 0.4307861328125, 0.55499267578125, 0.67919921875, 0.80340576171875, 0.9276123046875, 1.05181884765625, 1.176025390625, 1.30023193359375, 1.4244384765625, 1.54864501953125, 1.6728515625, 1.79705810546875, 1.9212646484375, 2.04547119140625, 2.169677734375, 2.29388427734375, 2.4180908203125, 2.54229736328125, 2.66650390625, 2.79071044921875, 2.9149169921875, 3.03912353515625, 3.163330078125, 3.28753662109375, 3.4117431640625, 3.53594970703125, 3.66015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 11.0, 15.0, 16.0, 26.0, 26.0, 40.0, 65.0, 111.0, 145.0, 224.0, 346.0, 637.0, 1069.0, 1867.0, 3475.0, 6897.0, 15332.0, 39470.0, 173760.0, 1586846.0, 2057125.0, 227335.0, 45902.0, 16956.0, 7757.0, 3805.0, 2019.0, 1164.0, 678.0, 410.0, 255.0, 170.0, 100.0, 60.0, 47.0, 33.0, 24.0, 16.0, 14.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-8.8125, -8.56817626953125, -8.3238525390625, -8.07952880859375, -7.835205078125, -7.59088134765625, -7.3465576171875, -7.10223388671875, -6.85791015625, -6.61358642578125, -6.3692626953125, -6.12493896484375, -5.880615234375, -5.63629150390625, -5.3919677734375, -5.14764404296875, -4.9033203125, -4.65899658203125, -4.4146728515625, -4.17034912109375, -3.926025390625, -3.68170166015625, -3.4373779296875, -3.19305419921875, -2.94873046875, -2.70440673828125, -2.4600830078125, -2.21575927734375, -1.971435546875, -1.72711181640625, -1.4827880859375, -1.23846435546875, -0.994140625, -0.74981689453125, -0.5054931640625, -0.26116943359375, -0.016845703125, 0.22747802734375, 0.4718017578125, 0.71612548828125, 0.96044921875, 1.20477294921875, 1.4490966796875, 1.69342041015625, 1.937744140625, 2.18206787109375, 2.4263916015625, 2.67071533203125, 2.9150390625, 3.15936279296875, 3.4036865234375, 3.64801025390625, 3.892333984375, 4.13665771484375, 4.3809814453125, 4.62530517578125, 4.86962890625, 5.11395263671875, 5.3582763671875, 5.60260009765625, 5.846923828125, 6.09124755859375, 6.3355712890625, 6.57989501953125, 6.82421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 9.0, 6.0, 12.0, 14.0, 23.0, 34.0, 34.0, 39.0, 47.0, 75.0, 83.0, 139.0, 251.0, 398.0, 590.0, 774.0, 524.0, 347.0, 201.0, 123.0, 79.0, 84.0, 38.0, 31.0, 32.0, 20.0, 15.0, 11.0, 3.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.6162109375, -7.373046875, -7.1298828125, -6.88671875, -6.6435546875, -6.400390625, -6.1572265625, -5.9140625, -5.6708984375, -5.427734375, -5.1845703125, -4.94140625, -4.6982421875, -4.455078125, -4.2119140625, -3.96875, -3.7255859375, -3.482421875, -3.2392578125, -2.99609375, -2.7529296875, -2.509765625, -2.2666015625, -2.0234375, -1.7802734375, -1.537109375, -1.2939453125, -1.05078125, -0.8076171875, -0.564453125, -0.3212890625, -0.078125, 0.1650390625, 0.408203125, 0.6513671875, 0.89453125, 1.1376953125, 1.380859375, 1.6240234375, 1.8671875, 2.1103515625, 2.353515625, 2.5966796875, 2.83984375, 3.0830078125, 3.326171875, 3.5693359375, 3.8125, 4.0556640625, 4.298828125, 4.5419921875, 4.78515625, 5.0283203125, 5.271484375, 5.5146484375, 5.7578125, 6.0009765625, 6.244140625, 6.4873046875, 6.73046875, 6.9736328125, 7.216796875, 7.4599609375, 7.703125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 2.0, 10.0, 16.0, 20.0, 38.0, 17.0, 31.0, 74.0, 92.0, 100.0, 227.0, 707.0, 6785.0, 465423.0, 3699645.0, 18995.0, 1284.0, 288.0, 136.0, 82.0, 63.0, 51.0, 35.0, 33.0, 28.0, 22.0, 15.0, 9.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.53125, -39.27099609375, -38.0107421875, -36.75048828125, -35.490234375, -34.22998046875, -32.9697265625, -31.70947265625, -30.44921875, -29.18896484375, -27.9287109375, -26.66845703125, -25.408203125, -24.14794921875, -22.8876953125, -21.62744140625, -20.3671875, -19.10693359375, -17.8466796875, -16.58642578125, -15.326171875, -14.06591796875, -12.8056640625, -11.54541015625, -10.28515625, -9.02490234375, -7.7646484375, -6.50439453125, -5.244140625, -3.98388671875, -2.7236328125, -1.46337890625, -0.203125, 1.05712890625, 2.3173828125, 3.57763671875, 4.837890625, 6.09814453125, 7.3583984375, 8.61865234375, 9.87890625, 11.13916015625, 12.3994140625, 13.65966796875, 14.919921875, 16.18017578125, 17.4404296875, 18.70068359375, 19.9609375, 21.22119140625, 22.4814453125, 23.74169921875, 25.001953125, 26.26220703125, 27.5224609375, 28.78271484375, 30.04296875, 31.30322265625, 32.5634765625, 33.82373046875, 35.083984375, 36.34423828125, 37.6044921875, 38.86474609375, 40.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 17.0, 17.0, 56.0, 83.0, 131.0, 173.0, 182.0, 145.0, 101.0, 53.0, 24.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.73108673095703, -54.26681137084961, -52.80253982543945, -51.33826446533203, -49.873992919921875, -48.40971755981445, -46.94544219970703, -45.481170654296875, -44.01689910888672, -42.5526237487793, -41.08835220336914, -39.62407684326172, -38.15980529785156, -36.69552993774414, -35.23125457763672, -33.76698303222656, -32.30270767211914, -30.83843421936035, -29.374160766601562, -27.90988540649414, -26.445613861083984, -24.981338500976562, -23.517065048217773, -22.052791595458984, -20.588518142700195, -19.124244689941406, -17.659971237182617, -16.195697784423828, -14.731423377990723, -13.267149925231934, -11.802875518798828, -10.338602066040039, -8.874324798583984, -7.410051345825195, -5.945777416229248, -4.481503486633301, -3.0172300338745117, -1.5529565811157227, -0.08868217468261719, 1.3755912780761719, 2.839864730834961, 4.30413818359375, 5.768412113189697, 7.2326860427856445, 8.696959495544434, 10.161232948303223, 11.625507354736328, 13.089780807495117, 14.554054260253906, 16.018327713012695, 17.482601165771484, 18.946876525878906, 20.411148071289062, 21.875423431396484, 23.339696884155273, 24.803970336914062, 26.26824378967285, 27.73251724243164, 29.19679069519043, 30.66106414794922, 32.12533950805664, 33.5896110534668, 35.05388641357422, 36.518157958984375, 37.9824333190918]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 5.0, 8.0, 20.0, 11.0, 19.0, 15.0, 17.0, 18.0, 32.0, 46.0, 41.0, 41.0, 34.0, 36.0, 37.0, 54.0, 42.0, 46.0, 40.0, 42.0, 43.0, 40.0, 32.0, 39.0, 26.0, 25.0, 21.0, 30.0, 14.0, 20.0, 19.0, 7.0, 20.0, 15.0, 6.0, 5.0, 9.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.172319412231445, -21.4759464263916, -20.77957534790039, -20.083202362060547, -19.386831283569336, -18.690458297729492, -17.99408721923828, -17.297714233398438, -16.601341247558594, -15.904969215393066, -15.208597183227539, -14.512224197387695, -13.815853118896484, -13.11948013305664, -12.423108100891113, -11.726736068725586, -11.030364990234375, -10.333992958068848, -9.63762092590332, -8.941247940063477, -8.244876861572266, -7.54850435256958, -6.8521318435668945, -6.155759811401367, -5.45938777923584, -4.7630157470703125, -4.066643714904785, -3.3702712059020996, -2.6738991737365723, -1.977527141571045, -1.2811546325683594, -0.584782600402832, 0.11159133911132812, 0.807963490486145, 1.504335641860962, 2.2007079124450684, 2.8970799446105957, 3.593451976776123, 4.289824485778809, 4.986196517944336, 5.682568550109863, 6.378940582275391, 7.075312614440918, 7.7716851234436035, 8.468057632446289, 9.1644287109375, 9.860801696777344, 10.557173728942871, 11.253545761108398, 11.949917793273926, 12.646289825439453, 13.342662811279297, 14.039033889770508, 14.735406875610352, 15.431778907775879, 16.128150939941406, 16.82452392578125, 17.520896911621094, 18.217267990112305, 18.91364097595215, 19.61001205444336, 20.306385040283203, 21.002758026123047, 21.699129104614258, 22.39550018310547]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 17.0, 6.0, 18.0, 16.0, 16.0, 28.0, 31.0, 33.0, 31.0, 34.0, 40.0, 39.0, 35.0, 39.0, 54.0, 39.0, 42.0, 36.0, 58.0, 38.0, 48.0, 33.0, 39.0, 28.0, 23.0, 28.0, 20.0, 18.0, 14.0, 11.0, 12.0, 7.0, 12.0, 6.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.23089599609375, -3.1180419921875, -3.00518798828125, -2.892333984375, -2.77947998046875, -2.6666259765625, -2.55377197265625, -2.44091796875, -2.32806396484375, -2.2152099609375, -2.10235595703125, -1.989501953125, -1.87664794921875, -1.7637939453125, -1.65093994140625, -1.5380859375, -1.42523193359375, -1.3123779296875, -1.19952392578125, -1.086669921875, -0.97381591796875, -0.8609619140625, -0.74810791015625, -0.63525390625, -0.52239990234375, -0.4095458984375, -0.29669189453125, -0.183837890625, -0.07098388671875, 0.0418701171875, 0.15472412109375, 0.267578125, 0.38043212890625, 0.4932861328125, 0.60614013671875, 0.718994140625, 0.83184814453125, 0.9447021484375, 1.05755615234375, 1.17041015625, 1.28326416015625, 1.3961181640625, 1.50897216796875, 1.621826171875, 1.73468017578125, 1.8475341796875, 1.96038818359375, 2.0732421875, 2.18609619140625, 2.2989501953125, 2.41180419921875, 2.524658203125, 2.63751220703125, 2.7503662109375, 2.86322021484375, 2.97607421875, 3.08892822265625, 3.2017822265625, 3.31463623046875, 3.427490234375, 3.54034423828125, 3.6531982421875, 3.76605224609375, 3.87890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 13.0, 13.0, 33.0, 47.0, 107.0, 213.0, 442.0, 950.0, 2286.0, 6374.0, 27335.0, 222177.0, 690795.0, 77704.0, 13288.0, 3932.0, 1534.0, 697.0, 303.0, 154.0, 68.0, 37.0, 23.0, 13.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.55487060546875, -4.4417724609375, -4.32867431640625, -4.215576171875, -4.10247802734375, -3.9893798828125, -3.87628173828125, -3.76318359375, -3.65008544921875, -3.5369873046875, -3.42388916015625, -3.310791015625, -3.19769287109375, -3.0845947265625, -2.97149658203125, -2.8583984375, -2.74530029296875, -2.6322021484375, -2.51910400390625, -2.406005859375, -2.29290771484375, -2.1798095703125, -2.06671142578125, -1.95361328125, -1.84051513671875, -1.7274169921875, -1.61431884765625, -1.501220703125, -1.38812255859375, -1.2750244140625, -1.16192626953125, -1.048828125, -0.93572998046875, -0.8226318359375, -0.70953369140625, -0.596435546875, -0.48333740234375, -0.3702392578125, -0.25714111328125, -0.14404296875, -0.03094482421875, 0.0821533203125, 0.19525146484375, 0.308349609375, 0.42144775390625, 0.5345458984375, 0.64764404296875, 0.7607421875, 0.87384033203125, 0.9869384765625, 1.10003662109375, 1.213134765625, 1.32623291015625, 1.4393310546875, 1.55242919921875, 1.66552734375, 1.77862548828125, 1.8917236328125, 2.00482177734375, 2.117919921875, 2.23101806640625, 2.3441162109375, 2.45721435546875, 2.5703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 10.0, 17.0, 9.0, 12.0, 12.0, 16.0, 29.0, 22.0, 26.0, 28.0, 28.0, 26.0, 40.0, 44.0, 36.0, 49.0, 35.0, 31.0, 1063.0, 44.0, 32.0, 33.0, 37.0, 33.0, 27.0, 31.0, 29.0, 27.0, 21.0, 31.0, 20.0, 12.0, 14.0, 19.0, 10.0, 4.0, 3.0, 9.0, 9.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.720703125, -2.641082763671875, -2.56146240234375, -2.481842041015625, -2.4022216796875, -2.322601318359375, -2.24298095703125, -2.163360595703125, -2.083740234375, -2.004119873046875, -1.92449951171875, -1.844879150390625, -1.7652587890625, -1.685638427734375, -1.60601806640625, -1.526397705078125, -1.44677734375, -1.367156982421875, -1.28753662109375, -1.207916259765625, -1.1282958984375, -1.048675537109375, -0.96905517578125, -0.889434814453125, -0.809814453125, -0.730194091796875, -0.65057373046875, -0.570953369140625, -0.4913330078125, -0.411712646484375, -0.33209228515625, -0.252471923828125, -0.1728515625, -0.093231201171875, -0.01361083984375, 0.066009521484375, 0.1456298828125, 0.225250244140625, 0.30487060546875, 0.384490966796875, 0.464111328125, 0.543731689453125, 0.62335205078125, 0.702972412109375, 0.7825927734375, 0.862213134765625, 0.94183349609375, 1.021453857421875, 1.10107421875, 1.180694580078125, 1.26031494140625, 1.339935302734375, 1.4195556640625, 1.499176025390625, 1.57879638671875, 1.658416748046875, 1.738037109375, 1.817657470703125, 1.89727783203125, 1.976898193359375, 2.0565185546875, 2.136138916015625, 2.21575927734375, 2.295379638671875, 2.375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 12.0, 11.0, 13.0, 17.0, 32.0, 55.0, 62.0, 81.0, 107.0, 160.0, 261.0, 394.0, 611.0, 938.0, 1681.0, 2806.0, 5719.0, 12732.0, 36895.0, 166233.0, 1503100.0, 283130.0, 50761.0, 16300.0, 6913.0, 3321.0, 1746.0, 1034.0, 676.0, 437.0, 287.0, 199.0, 124.0, 77.0, 51.0, 42.0, 28.0, 16.0, 12.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5556640625, -1.5093994140625, -1.463134765625, -1.4168701171875, -1.37060546875, -1.3243408203125, -1.278076171875, -1.2318115234375, -1.185546875, -1.1392822265625, -1.093017578125, -1.0467529296875, -1.00048828125, -0.9542236328125, -0.907958984375, -0.8616943359375, -0.8154296875, -0.7691650390625, -0.722900390625, -0.6766357421875, -0.63037109375, -0.5841064453125, -0.537841796875, -0.4915771484375, -0.4453125, -0.3990478515625, -0.352783203125, -0.3065185546875, -0.26025390625, -0.2139892578125, -0.167724609375, -0.1214599609375, -0.0751953125, -0.0289306640625, 0.017333984375, 0.0635986328125, 0.10986328125, 0.1561279296875, 0.202392578125, 0.2486572265625, 0.294921875, 0.3411865234375, 0.387451171875, 0.4337158203125, 0.47998046875, 0.5262451171875, 0.572509765625, 0.6187744140625, 0.6650390625, 0.7113037109375, 0.757568359375, 0.8038330078125, 0.85009765625, 0.8963623046875, 0.942626953125, 0.9888916015625, 1.03515625, 1.0814208984375, 1.127685546875, 1.1739501953125, 1.22021484375, 1.2664794921875, 1.312744140625, 1.3590087890625, 1.4052734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 8.0, 7.0, 3.0, 13.0, 7.0, 13.0, 15.0, 31.0, 78.0, 171.0, 311.0, 147.0, 71.0, 28.0, 25.0, 17.0, 12.0, 7.0, 3.0, 10.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5035934448242188, -0.4852142333984375, -0.46683502197265625, -0.448455810546875, -0.43007659912109375, -0.4116973876953125, -0.39331817626953125, -0.37493896484375, -0.35655975341796875, -0.3381805419921875, -0.31980133056640625, -0.301422119140625, -0.28304290771484375, -0.2646636962890625, -0.24628448486328125, -0.2279052734375, -0.20952606201171875, -0.1911468505859375, -0.17276763916015625, -0.154388427734375, -0.13600921630859375, -0.1176300048828125, -0.09925079345703125, -0.08087158203125, -0.06249237060546875, -0.0441131591796875, -0.02573394775390625, -0.007354736328125, 0.01102447509765625, 0.0294036865234375, 0.04778289794921875, 0.066162109375, 0.08454132080078125, 0.1029205322265625, 0.12129974365234375, 0.139678955078125, 0.15805816650390625, 0.1764373779296875, 0.19481658935546875, 0.21319580078125, 0.23157501220703125, 0.2499542236328125, 0.26833343505859375, 0.286712646484375, 0.30509185791015625, 0.3234710693359375, 0.34185028076171875, 0.3602294921875, 0.37860870361328125, 0.3969879150390625, 0.41536712646484375, 0.433746337890625, 0.45212554931640625, 0.4705047607421875, 0.48888397216796875, 0.50726318359375, 0.5256423950195312, 0.5440216064453125, 0.5624008178710938, 0.580780029296875, 0.5991592407226562, 0.6175384521484375, 0.6359176635742188, 0.654296875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 6.0, 20.0, 24.0, 40.0, 71.0, 183.0, 2126.0, 992771.0, 52037.0, 941.0, 128.0, 65.0, 32.0, 21.0, 16.0, 8.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.921875, -13.5225830078125, -13.123291015625, -12.7239990234375, -12.32470703125, -11.9254150390625, -11.526123046875, -11.1268310546875, -10.7275390625, -10.3282470703125, -9.928955078125, -9.5296630859375, -9.13037109375, -8.7310791015625, -8.331787109375, -7.9324951171875, -7.533203125, -7.1339111328125, -6.734619140625, -6.3353271484375, -5.93603515625, -5.5367431640625, -5.137451171875, -4.7381591796875, -4.3388671875, -3.9395751953125, -3.540283203125, -3.1409912109375, -2.74169921875, -2.3424072265625, -1.943115234375, -1.5438232421875, -1.14453125, -0.7452392578125, -0.345947265625, 0.0533447265625, 0.45263671875, 0.8519287109375, 1.251220703125, 1.6505126953125, 2.0498046875, 2.4490966796875, 2.848388671875, 3.2476806640625, 3.64697265625, 4.0462646484375, 4.445556640625, 4.8448486328125, 5.244140625, 5.6434326171875, 6.042724609375, 6.4420166015625, 6.84130859375, 7.2406005859375, 7.639892578125, 8.0391845703125, 8.4384765625, 8.8377685546875, 9.237060546875, 9.6363525390625, 10.03564453125, 10.4349365234375, 10.834228515625, 11.2335205078125, 11.6328125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 6.0, 3.0, 10.0, 23.0, 26.0, 63.0, 93.0, 157.0, 172.0, 169.0, 117.0, 66.0, 31.0, 30.0, 13.0, 10.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41232261061668396, -0.38766157627105713, -0.3630005717277527, -0.33833953738212585, -0.313678503036499, -0.2890174984931946, -0.26435646414756775, -0.2396954447031021, -0.21503442525863647, -0.19037340581417084, -0.1657123863697052, -0.14105135202407837, -0.11639033257961273, -0.0917293131351471, -0.06706827878952026, -0.042407259345054626, -0.01774623990058899, 0.006914783269166946, 0.03157580643892288, 0.056236833333969116, 0.08089785277843475, 0.10555887222290039, 0.13021990656852722, 0.15488092601299286, 0.1795419454574585, 0.20420296490192413, 0.22886398434638977, 0.2535250186920166, 0.27818602323532104, 0.3028470575809479, 0.3275080919265747, 0.35216909646987915, 0.3768301010131836, 0.4014911353588104, 0.42615213990211487, 0.4508131742477417, 0.47547417879104614, 0.5001351833343506, 0.5247962474822998, 0.5494572520256042, 0.5741182565689087, 0.5987792611122131, 0.6234403252601624, 0.6481013298034668, 0.6727623343467712, 0.6974233388900757, 0.7220844030380249, 0.7467454075813293, 0.7714064717292786, 0.796067476272583, 0.8207285404205322, 0.8453895449638367, 0.8700505495071411, 0.8947116136550903, 0.9193726181983948, 0.9440336227416992, 0.9686946868896484, 0.9933556914329529, 1.0180166959762573, 1.0426777601242065, 1.0673388242721558, 1.0919997692108154, 1.1166608333587646, 1.1413218975067139, 1.1659828424453735]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 4.0, 9.0, 6.0, 14.0, 11.0, 16.0, 15.0, 22.0, 29.0, 19.0, 32.0, 35.0, 26.0, 28.0, 35.0, 46.0, 39.0, 41.0, 36.0, 40.0, 41.0, 35.0, 41.0, 28.0, 44.0, 41.0, 36.0, 30.0, 21.0, 28.0, 19.0, 16.0, 20.0, 19.0, 14.0, 9.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.3948132395744324, -0.383027046918869, -0.37124085426330566, -0.3594546616077423, -0.34766846895217896, -0.3358822464942932, -0.32409605383872986, -0.3123098611831665, -0.30052366852760315, -0.2887374758720398, -0.27695128321647644, -0.2651650905609131, -0.25337886810302734, -0.24159269034862518, -0.22980648279190063, -0.21802029013633728, -0.20623409748077393, -0.19444790482521057, -0.18266171216964722, -0.17087550461292267, -0.15908931195735931, -0.14730311930179596, -0.1355169117450714, -0.12373071908950806, -0.1119445264339447, -0.10015833377838135, -0.0883721336722374, -0.07658593356609344, -0.06479974091053009, -0.05301354452967644, -0.041227348148822784, -0.029441148042678833, -0.01765495538711548, -0.0058687590062618256, 0.005917437374591827, 0.01770363375544548, 0.029489830136299133, 0.041276026517152786, 0.05306222289800644, 0.06484842300415039, 0.07663461565971375, 0.0884208083152771, 0.10020700842142105, 0.111993208527565, 0.12377940118312836, 0.1355655938386917, 0.14735180139541626, 0.15913799405097961, 0.17092418670654297, 0.18271037936210632, 0.19449657201766968, 0.20628277957439423, 0.21806897222995758, 0.22985516488552094, 0.24164137244224548, 0.25342756509780884, 0.2652137577533722, 0.27699995040893555, 0.2887861430644989, 0.30057233572006226, 0.312358558177948, 0.32414475083351135, 0.3359309434890747, 0.34771713614463806, 0.3595033288002014]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 14.0, 11.0, 11.0, 17.0, 20.0, 19.0, 25.0, 25.0, 24.0, 26.0, 28.0, 38.0, 35.0, 28.0, 41.0, 30.0, 51.0, 44.0, 42.0, 45.0, 29.0, 45.0, 34.0, 30.0, 47.0, 31.0, 25.0, 26.0, 14.0, 20.0, 20.0, 10.0, 10.0, 11.0, 10.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.98828125, -2.88323974609375, -2.7781982421875, -2.67315673828125, -2.568115234375, -2.46307373046875, -2.3580322265625, -2.25299072265625, -2.14794921875, -2.04290771484375, -1.9378662109375, -1.83282470703125, -1.727783203125, -1.62274169921875, -1.5177001953125, -1.41265869140625, -1.3076171875, -1.20257568359375, -1.0975341796875, -0.99249267578125, -0.887451171875, -0.78240966796875, -0.6773681640625, -0.57232666015625, -0.46728515625, -0.36224365234375, -0.2572021484375, -0.15216064453125, -0.047119140625, 0.05792236328125, 0.1629638671875, 0.26800537109375, 0.373046875, 0.47808837890625, 0.5831298828125, 0.68817138671875, 0.793212890625, 0.89825439453125, 1.0032958984375, 1.10833740234375, 1.21337890625, 1.31842041015625, 1.4234619140625, 1.52850341796875, 1.633544921875, 1.73858642578125, 1.8436279296875, 1.94866943359375, 2.0537109375, 2.15875244140625, 2.2637939453125, 2.36883544921875, 2.473876953125, 2.57891845703125, 2.6839599609375, 2.78900146484375, 2.89404296875, 2.99908447265625, 3.1041259765625, 3.20916748046875, 3.314208984375, 3.41925048828125, 3.5242919921875, 3.62933349609375, 3.734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 10.0, 22.0, 27.0, 31.0, 58.0, 85.0, 107.0, 172.0, 279.0, 407.0, 611.0, 1036.0, 1718.0, 3095.0, 5687.0, 11369.0, 26765.0, 77764.0, 433051.0, 368740.0, 69230.0, 24608.0, 10827.0, 5469.0, 2932.0, 1718.0, 964.0, 629.0, 370.0, 254.0, 162.0, 112.0, 70.0, 61.0, 31.0, 21.0, 20.0, 10.0, 4.0, 8.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.8046875, -5.64324951171875, -5.4818115234375, -5.32037353515625, -5.158935546875, -4.99749755859375, -4.8360595703125, -4.67462158203125, -4.51318359375, -4.35174560546875, -4.1903076171875, -4.02886962890625, -3.867431640625, -3.70599365234375, -3.5445556640625, -3.38311767578125, -3.2216796875, -3.06024169921875, -2.8988037109375, -2.73736572265625, -2.575927734375, -2.41448974609375, -2.2530517578125, -2.09161376953125, -1.93017578125, -1.76873779296875, -1.6072998046875, -1.44586181640625, -1.284423828125, -1.12298583984375, -0.9615478515625, -0.80010986328125, -0.638671875, -0.47723388671875, -0.3157958984375, -0.15435791015625, 0.007080078125, 0.16851806640625, 0.3299560546875, 0.49139404296875, 0.65283203125, 0.81427001953125, 0.9757080078125, 1.13714599609375, 1.298583984375, 1.46002197265625, 1.6214599609375, 1.78289794921875, 1.9443359375, 2.10577392578125, 2.2672119140625, 2.42864990234375, 2.590087890625, 2.75152587890625, 2.9129638671875, 3.07440185546875, 3.23583984375, 3.39727783203125, 3.5587158203125, 3.72015380859375, 3.881591796875, 4.04302978515625, 4.2044677734375, 4.36590576171875, 4.52734375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 21.0, 26.0, 31.0, 39.0, 39.0, 39.0, 39.0, 46.0, 63.0, 93.0, 236.0, 1624.0, 208.0, 100.0, 58.0, 47.0, 39.0, 43.0, 32.0, 34.0, 20.0, 22.0, 19.0, 16.0, 9.0, 14.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -10.9981689453125, -10.582275390625, -10.1663818359375, -9.75048828125, -9.3345947265625, -8.918701171875, -8.5028076171875, -8.0869140625, -7.6710205078125, -7.255126953125, -6.8392333984375, -6.42333984375, -6.0074462890625, -5.591552734375, -5.1756591796875, -4.759765625, -4.3438720703125, -3.927978515625, -3.5120849609375, -3.09619140625, -2.6802978515625, -2.264404296875, -1.8485107421875, -1.4326171875, -1.0167236328125, -0.600830078125, -0.1849365234375, 0.23095703125, 0.6468505859375, 1.062744140625, 1.4786376953125, 1.89453125, 2.3104248046875, 2.726318359375, 3.1422119140625, 3.55810546875, 3.9739990234375, 4.389892578125, 4.8057861328125, 5.2216796875, 5.6375732421875, 6.053466796875, 6.4693603515625, 6.88525390625, 7.3011474609375, 7.717041015625, 8.1329345703125, 8.548828125, 8.9647216796875, 9.380615234375, 9.7965087890625, 10.21240234375, 10.6282958984375, 11.044189453125, 11.4600830078125, 11.8759765625, 12.2918701171875, 12.707763671875, 13.1236572265625, 13.53955078125, 13.9554443359375, 14.371337890625, 14.7872314453125, 15.203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 11.0, 24.0, 20.0, 22.0, 22.0, 33.0, 49.0, 79.0, 102.0, 179.0, 493.0, 1866.0, 12365.0, 568579.0, 2538229.0, 19847.0, 2492.0, 607.0, 200.0, 111.0, 76.0, 56.0, 48.0, 36.0, 30.0, 24.0, 17.0, 12.0, 18.0, 7.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.779052734375, -26.96435546875, -26.149658203125, -25.3349609375, -24.520263671875, -23.70556640625, -22.890869140625, -22.076171875, -21.261474609375, -20.44677734375, -19.632080078125, -18.8173828125, -18.002685546875, -17.18798828125, -16.373291015625, -15.55859375, -14.743896484375, -13.92919921875, -13.114501953125, -12.2998046875, -11.485107421875, -10.67041015625, -9.855712890625, -9.041015625, -8.226318359375, -7.41162109375, -6.596923828125, -5.7822265625, -4.967529296875, -4.15283203125, -3.338134765625, -2.5234375, -1.708740234375, -0.89404296875, -0.079345703125, 0.7353515625, 1.550048828125, 2.36474609375, 3.179443359375, 3.994140625, 4.808837890625, 5.62353515625, 6.438232421875, 7.2529296875, 8.067626953125, 8.88232421875, 9.697021484375, 10.51171875, 11.326416015625, 12.14111328125, 12.955810546875, 13.7705078125, 14.585205078125, 15.39990234375, 16.214599609375, 17.029296875, 17.843994140625, 18.65869140625, 19.473388671875, 20.2880859375, 21.102783203125, 21.91748046875, 22.732177734375, 23.546875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [3.0, 8.0, 17.0, 51.0, 139.0, 240.0, 267.0, 175.0, 66.0, 34.0, 15.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.217764377593994, -6.045231819152832, -4.872698783874512, -3.7001659870147705, -2.5276331901550293, -1.355100154876709, -0.18256759643554688, 0.9899649620056152, 2.1624979972839355, 3.3350307941436768, 4.507563591003418, 5.680096626281738, 6.8526291847229, 8.025161743164062, 9.197694778442383, 10.370227813720703, 11.542760848999023, 12.715293884277344, 13.887826919555664, 15.060359001159668, 16.232891082763672, 17.405426025390625, 18.577957153320312, 19.750490188598633, 20.923023223876953, 22.095556259155273, 23.268089294433594, 24.440622329711914, 25.613155364990234, 26.785686492919922, 27.958219528198242, 29.130752563476562, 30.30328369140625, 31.47581672668457, 32.64834976196289, 33.82088088989258, 34.99341583251953, 36.16594696044922, 37.33848190307617, 38.51101303100586, 39.68354797363281, 40.8560791015625, 42.02861404418945, 43.20114517211914, 44.373680114746094, 45.54621124267578, 46.718746185302734, 47.89127731323242, 49.06380844116211, 50.2363395690918, 51.40887451171875, 52.58140563964844, 53.75394058227539, 54.92647171020508, 56.09900665283203, 57.27153778076172, 58.444068908691406, 59.616600036621094, 60.78913497924805, 61.961666107177734, 63.13420104980469, 64.30673217773438, 65.47926330566406, 66.65179443359375, 67.82433319091797]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 9.0, 6.0, 6.0, 8.0, 11.0, 10.0, 18.0, 18.0, 15.0, 21.0, 27.0, 36.0, 28.0, 26.0, 33.0, 36.0, 36.0, 40.0, 40.0, 38.0, 54.0, 37.0, 56.0, 31.0, 38.0, 31.0, 39.0, 25.0, 28.0, 25.0, 22.0, 32.0, 24.0, 12.0, 20.0, 10.0, 5.0, 7.0, 10.0, 11.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-39.971099853515625, -38.82118606567383, -37.67127227783203, -36.5213623046875, -35.3714485168457, -34.221534729003906, -33.07162094116211, -31.921707153320312, -30.77179527282715, -29.62188148498535, -28.471969604492188, -27.32205581665039, -26.172142028808594, -25.02223014831543, -23.872316360473633, -22.72240447998047, -21.572490692138672, -20.422576904296875, -19.27266502380371, -18.122751235961914, -16.97283935546875, -15.822925567626953, -14.673011779785156, -13.523098945617676, -12.373186111450195, -11.223273277282715, -10.073360443115234, -8.923446655273438, -7.773533821105957, -6.623620986938477, -5.473707675933838, -4.323794364929199, -3.173877716064453, -2.0239646434783936, -0.874051570892334, 0.2758615016937256, 1.4257745742797852, 2.5756874084472656, 3.7256007194519043, 4.875514030456543, 6.025426864624023, 7.175339698791504, 8.325252532958984, 9.475166320800781, 10.625079154968262, 11.774991989135742, 12.924905776977539, 14.07481861114502, 15.2247314453125, 16.374645233154297, 17.52455711364746, 18.674470901489258, 19.824382781982422, 20.97429656982422, 22.124210357666016, 23.274124145507812, 24.424036026000977, 25.573949813842773, 26.723861694335938, 27.873775482177734, 29.02368927001953, 30.173601150512695, 31.323514938354492, 32.473426818847656, 33.62334060668945]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 13.0, 8.0, 14.0, 20.0, 24.0, 17.0, 20.0, 25.0, 33.0, 34.0, 28.0, 38.0, 37.0, 30.0, 40.0, 36.0, 41.0, 40.0, 42.0, 45.0, 45.0, 40.0, 39.0, 32.0, 31.0, 28.0, 36.0, 26.0, 13.0, 15.0, 19.0, 14.0, 10.0, 7.0, 11.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.71484375, -3.595703125, -3.4765625, -3.357421875, -3.23828125, -3.119140625, -3.0, -2.880859375, -2.76171875, -2.642578125, -2.5234375, -2.404296875, -2.28515625, -2.166015625, -2.046875, -1.927734375, -1.80859375, -1.689453125, -1.5703125, -1.451171875, -1.33203125, -1.212890625, -1.09375, -0.974609375, -0.85546875, -0.736328125, -0.6171875, -0.498046875, -0.37890625, -0.259765625, -0.140625, -0.021484375, 0.09765625, 0.216796875, 0.3359375, 0.455078125, 0.57421875, 0.693359375, 0.8125, 0.931640625, 1.05078125, 1.169921875, 1.2890625, 1.408203125, 1.52734375, 1.646484375, 1.765625, 1.884765625, 2.00390625, 2.123046875, 2.2421875, 2.361328125, 2.48046875, 2.599609375, 2.71875, 2.837890625, 2.95703125, 3.076171875, 3.1953125, 3.314453125, 3.43359375, 3.552734375, 3.671875, 3.791015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 7.0, 12.0, 18.0, 30.0, 36.0, 58.0, 96.0, 149.0, 232.0, 347.0, 512.0, 887.0, 1247.0, 1871.0, 2994.0, 4831.0, 7747.0, 13456.0, 24074.0, 50770.0, 138139.0, 514330.0, 1583751.0, 1286502.0, 368674.0, 102099.0, 40680.0, 20229.0, 11446.0, 6858.0, 4240.0, 2727.0, 1823.0, 1136.0, 769.0, 505.0, 313.0, 222.0, 146.0, 85.0, 69.0, 62.0, 28.0, 14.0, 13.0, 11.0, 4.0, 8.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.90625, -4.7523193359375, -4.598388671875, -4.4444580078125, -4.29052734375, -4.1365966796875, -3.982666015625, -3.8287353515625, -3.6748046875, -3.5208740234375, -3.366943359375, -3.2130126953125, -3.05908203125, -2.9051513671875, -2.751220703125, -2.5972900390625, -2.443359375, -2.2894287109375, -2.135498046875, -1.9815673828125, -1.82763671875, -1.6737060546875, -1.519775390625, -1.3658447265625, -1.2119140625, -1.0579833984375, -0.904052734375, -0.7501220703125, -0.59619140625, -0.4422607421875, -0.288330078125, -0.1343994140625, 0.01953125, 0.1734619140625, 0.327392578125, 0.4813232421875, 0.63525390625, 0.7891845703125, 0.943115234375, 1.0970458984375, 1.2509765625, 1.4049072265625, 1.558837890625, 1.7127685546875, 1.86669921875, 2.0206298828125, 2.174560546875, 2.3284912109375, 2.482421875, 2.6363525390625, 2.790283203125, 2.9442138671875, 3.09814453125, 3.2520751953125, 3.406005859375, 3.5599365234375, 3.7138671875, 3.8677978515625, 4.021728515625, 4.1756591796875, 4.32958984375, 4.4835205078125, 4.637451171875, 4.7913818359375, 4.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 11.0, 12.0, 19.0, 25.0, 35.0, 50.0, 53.0, 80.0, 97.0, 165.0, 232.0, 387.0, 594.0, 698.0, 533.0, 365.0, 206.0, 143.0, 102.0, 77.0, 40.0, 37.0, 31.0, 20.0, 15.0, 8.0, 6.0, 3.0, 4.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3580322265625, -8.083251953125, -7.8084716796875, -7.53369140625, -7.2589111328125, -6.984130859375, -6.7093505859375, -6.4345703125, -6.1597900390625, -5.885009765625, -5.6102294921875, -5.33544921875, -5.0606689453125, -4.785888671875, -4.5111083984375, -4.236328125, -3.9615478515625, -3.686767578125, -3.4119873046875, -3.13720703125, -2.8624267578125, -2.587646484375, -2.3128662109375, -2.0380859375, -1.7633056640625, -1.488525390625, -1.2137451171875, -0.93896484375, -0.6641845703125, -0.389404296875, -0.1146240234375, 0.16015625, 0.4349365234375, 0.709716796875, 0.9844970703125, 1.25927734375, 1.5340576171875, 1.808837890625, 2.0836181640625, 2.3583984375, 2.6331787109375, 2.907958984375, 3.1827392578125, 3.45751953125, 3.7322998046875, 4.007080078125, 4.2818603515625, 4.556640625, 4.8314208984375, 5.106201171875, 5.3809814453125, 5.65576171875, 5.9305419921875, 6.205322265625, 6.4801025390625, 6.7548828125, 7.0296630859375, 7.304443359375, 7.5792236328125, 7.85400390625, 8.1287841796875, 8.403564453125, 8.6783447265625, 8.953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 4.0, 2.0, 11.0, 9.0, 19.0, 29.0, 38.0, 34.0, 83.0, 123.0, 229.0, 478.0, 1680.0, 13166.0, 797864.0, 3349702.0, 26944.0, 2529.0, 631.0, 265.0, 131.0, 88.0, 55.0, 53.0, 26.0, 24.0, 18.0, 15.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.396484375, -31.35546875, -30.314453125, -29.2734375, -28.232421875, -27.19140625, -26.150390625, -25.109375, -24.068359375, -23.02734375, -21.986328125, -20.9453125, -19.904296875, -18.86328125, -17.822265625, -16.78125, -15.740234375, -14.69921875, -13.658203125, -12.6171875, -11.576171875, -10.53515625, -9.494140625, -8.453125, -7.412109375, -6.37109375, -5.330078125, -4.2890625, -3.248046875, -2.20703125, -1.166015625, -0.125, 0.916015625, 1.95703125, 2.998046875, 4.0390625, 5.080078125, 6.12109375, 7.162109375, 8.203125, 9.244140625, 10.28515625, 11.326171875, 12.3671875, 13.408203125, 14.44921875, 15.490234375, 16.53125, 17.572265625, 18.61328125, 19.654296875, 20.6953125, 21.736328125, 22.77734375, 23.818359375, 24.859375, 25.900390625, 26.94140625, 27.982421875, 29.0234375, 30.064453125, 31.10546875, 32.146484375, 33.1875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 18.0, 80.0, 230.0, 373.0, 238.0, 44.0, 21.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.60581970214844, -123.48200225830078, -120.3581771850586, -117.23435974121094, -114.11053466796875, -110.9867172241211, -107.86289978027344, -104.73907470703125, -101.61524963378906, -98.4914321899414, -95.36760711669922, -92.24378967285156, -89.11996459960938, -85.99614715576172, -82.87232971191406, -79.74850463867188, -76.62468719482422, -73.50086975097656, -70.37704467773438, -67.25322723388672, -64.12940216064453, -61.005584716796875, -57.88176345825195, -54.75794219970703, -51.63412094116211, -48.51029968261719, -45.386478424072266, -42.262657165527344, -39.13883972167969, -36.0150146484375, -32.891197204589844, -29.767375946044922, -26.64354705810547, -23.519725799560547, -20.395904541015625, -17.272085189819336, -14.148263931274414, -11.024442672729492, -7.900623321533203, -4.776802062988281, -1.6529808044433594, 1.4708399772644043, 4.594660758972168, 7.718481063842773, 10.842302322387695, 13.966123580932617, 17.089942932128906, 20.213764190673828, 23.33758544921875, 26.461406707763672, 29.585227966308594, 32.70904541015625, 35.83287048339844, 38.956687927246094, 42.080509185791016, 45.20433044433594, 48.32815170288086, 51.45197296142578, 54.5757942199707, 57.699615478515625, 60.82343292236328, 63.94725799560547, 67.07107543945312, 70.19490051269531, 73.31871795654297]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 1.0, 8.0, 7.0, 19.0, 14.0, 17.0, 23.0, 19.0, 34.0, 19.0, 32.0, 25.0, 39.0, 43.0, 33.0, 42.0, 43.0, 33.0, 45.0, 45.0, 49.0, 43.0, 53.0, 40.0, 34.0, 29.0, 23.0, 29.0, 24.0, 21.0, 17.0, 19.0, 8.0, 8.0, 7.0, 7.0, 4.0, 6.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.01807403564453, -20.24705696105957, -19.476041793823242, -18.70502471923828, -17.934009552001953, -17.162992477416992, -16.39197540283203, -15.620959281921387, -14.849943161010742, -14.078927040100098, -13.307910919189453, -12.536893844604492, -11.765877723693848, -10.994861602783203, -10.223844528198242, -9.452828407287598, -8.681812286376953, -7.910796165466309, -7.139779567718506, -6.368762969970703, -5.597746849060059, -4.826730728149414, -4.055714130401611, -3.2846975326538086, -2.513681411743164, -1.7426650524139404, -0.9716486930847168, -0.20063233375549316, 0.5703840255737305, 1.341400384902954, 2.1124167442321777, 2.8834333419799805, 3.654449462890625, 4.4254655838012695, 5.196482181549072, 5.967498779296875, 6.7385149002075195, 7.509531021118164, 8.280548095703125, 9.05156421661377, 9.822580337524414, 10.593596458435059, 11.364612579345703, 12.135629653930664, 12.906645774841309, 13.677661895751953, 14.448678970336914, 15.219695091247559, 15.990711212158203, 16.761728286743164, 17.532743453979492, 18.303760528564453, 19.07477569580078, 19.845792770385742, 20.616809844970703, 21.38782501220703, 22.158842086791992, 22.929859161376953, 23.70087432861328, 24.471891403198242, 25.242908477783203, 26.01392364501953, 26.784940719604492, 27.555957794189453, 28.32697296142578]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 15.0, 14.0, 9.0, 27.0, 23.0, 24.0, 28.0, 24.0, 18.0, 39.0, 43.0, 41.0, 30.0, 36.0, 49.0, 52.0, 50.0, 44.0, 47.0, 35.0, 43.0, 34.0, 34.0, 26.0, 20.0, 25.0, 21.0, 18.0, 25.0, 15.0, 17.0, 14.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.666748046875, -3.55224609375, -3.437744140625, -3.3232421875, -3.208740234375, -3.09423828125, -2.979736328125, -2.865234375, -2.750732421875, -2.63623046875, -2.521728515625, -2.4072265625, -2.292724609375, -2.17822265625, -2.063720703125, -1.94921875, -1.834716796875, -1.72021484375, -1.605712890625, -1.4912109375, -1.376708984375, -1.26220703125, -1.147705078125, -1.033203125, -0.918701171875, -0.80419921875, -0.689697265625, -0.5751953125, -0.460693359375, -0.34619140625, -0.231689453125, -0.1171875, -0.002685546875, 0.11181640625, 0.226318359375, 0.3408203125, 0.455322265625, 0.56982421875, 0.684326171875, 0.798828125, 0.913330078125, 1.02783203125, 1.142333984375, 1.2568359375, 1.371337890625, 1.48583984375, 1.600341796875, 1.71484375, 1.829345703125, 1.94384765625, 2.058349609375, 2.1728515625, 2.287353515625, 2.40185546875, 2.516357421875, 2.630859375, 2.745361328125, 2.85986328125, 2.974365234375, 3.0888671875, 3.203369140625, 3.31787109375, 3.432373046875, 3.546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 12.0, 24.0, 36.0, 42.0, 45.0, 82.0, 137.0, 273.0, 338.0, 591.0, 1079.0, 2083.0, 4417.0, 10657.0, 31108.0, 147097.0, 640125.0, 157377.0, 32733.0, 10800.0, 4573.0, 2128.0, 1121.0, 634.0, 362.0, 234.0, 137.0, 86.0, 73.0, 41.0, 31.0, 21.0, 12.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.200408935546875, -3.10198974609375, -3.003570556640625, -2.9051513671875, -2.806732177734375, -2.70831298828125, -2.609893798828125, -2.511474609375, -2.413055419921875, -2.31463623046875, -2.216217041015625, -2.1177978515625, -2.019378662109375, -1.92095947265625, -1.822540283203125, -1.72412109375, -1.625701904296875, -1.52728271484375, -1.428863525390625, -1.3304443359375, -1.232025146484375, -1.13360595703125, -1.035186767578125, -0.936767578125, -0.838348388671875, -0.73992919921875, -0.641510009765625, -0.5430908203125, -0.444671630859375, -0.34625244140625, -0.247833251953125, -0.1494140625, -0.050994873046875, 0.04742431640625, 0.145843505859375, 0.2442626953125, 0.342681884765625, 0.44110107421875, 0.539520263671875, 0.637939453125, 0.736358642578125, 0.83477783203125, 0.933197021484375, 1.0316162109375, 1.130035400390625, 1.22845458984375, 1.326873779296875, 1.42529296875, 1.523712158203125, 1.62213134765625, 1.720550537109375, 1.8189697265625, 1.917388916015625, 2.01580810546875, 2.114227294921875, 2.212646484375, 2.311065673828125, 2.40948486328125, 2.507904052734375, 2.6063232421875, 2.704742431640625, 2.80316162109375, 2.901580810546875, 3.0]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 11.0, 10.0, 16.0, 13.0, 20.0, 17.0, 25.0, 21.0, 22.0, 30.0, 33.0, 24.0, 27.0, 44.0, 34.0, 39.0, 1058.0, 46.0, 54.0, 33.0, 36.0, 35.0, 39.0, 36.0, 45.0, 37.0, 25.0, 21.0, 23.0, 17.0, 24.0, 15.0, 11.0, 10.0, 10.0, 7.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.111602783203125, -2.02984619140625, -1.948089599609375, -1.8663330078125, -1.784576416015625, -1.70281982421875, -1.621063232421875, -1.539306640625, -1.457550048828125, -1.37579345703125, -1.294036865234375, -1.2122802734375, -1.130523681640625, -1.04876708984375, -0.967010498046875, -0.88525390625, -0.803497314453125, -0.72174072265625, -0.639984130859375, -0.5582275390625, -0.476470947265625, -0.39471435546875, -0.312957763671875, -0.231201171875, -0.149444580078125, -0.06768798828125, 0.014068603515625, 0.0958251953125, 0.177581787109375, 0.25933837890625, 0.341094970703125, 0.4228515625, 0.504608154296875, 0.58636474609375, 0.668121337890625, 0.7498779296875, 0.831634521484375, 0.91339111328125, 0.995147705078125, 1.076904296875, 1.158660888671875, 1.24041748046875, 1.322174072265625, 1.4039306640625, 1.485687255859375, 1.56744384765625, 1.649200439453125, 1.73095703125, 1.812713623046875, 1.89447021484375, 1.976226806640625, 2.0579833984375, 2.139739990234375, 2.22149658203125, 2.303253173828125, 2.385009765625, 2.466766357421875, 2.54852294921875, 2.630279541015625, 2.7120361328125, 2.793792724609375, 2.87554931640625, 2.957305908203125, 3.0390625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 18.0, 16.0, 27.0, 36.0, 52.0, 52.0, 84.0, 141.0, 234.0, 335.0, 525.0, 901.0, 1542.0, 2788.0, 5153.0, 10731.0, 26888.0, 103292.0, 1543672.0, 320409.0, 47713.0, 16172.0, 7414.0, 3759.0, 2083.0, 1150.0, 700.0, 413.0, 258.0, 186.0, 113.0, 86.0, 47.0, 51.0, 29.0, 11.0, 18.0, 6.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.948394775390625, -1.88702392578125, -1.825653076171875, -1.7642822265625, -1.702911376953125, -1.64154052734375, -1.580169677734375, -1.518798828125, -1.457427978515625, -1.39605712890625, -1.334686279296875, -1.2733154296875, -1.211944580078125, -1.15057373046875, -1.089202880859375, -1.02783203125, -0.966461181640625, -0.90509033203125, -0.843719482421875, -0.7823486328125, -0.720977783203125, -0.65960693359375, -0.598236083984375, -0.536865234375, -0.475494384765625, -0.41412353515625, -0.352752685546875, -0.2913818359375, -0.230010986328125, -0.16864013671875, -0.107269287109375, -0.0458984375, 0.015472412109375, 0.07684326171875, 0.138214111328125, 0.1995849609375, 0.260955810546875, 0.32232666015625, 0.383697509765625, 0.445068359375, 0.506439208984375, 0.56781005859375, 0.629180908203125, 0.6905517578125, 0.751922607421875, 0.81329345703125, 0.874664306640625, 0.93603515625, 0.997406005859375, 1.05877685546875, 1.120147705078125, 1.1815185546875, 1.242889404296875, 1.30426025390625, 1.365631103515625, 1.427001953125, 1.488372802734375, 1.54974365234375, 1.611114501953125, 1.6724853515625, 1.733856201171875, 1.79522705078125, 1.856597900390625, 1.91796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 7.0, 4.0, 14.0, 20.0, 47.0, 99.0, 277.0, 276.0, 117.0, 36.0, 23.0, 15.0, 12.0, 5.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.662109375, -0.6426773071289062, -0.6232452392578125, -0.6038131713867188, -0.584381103515625, -0.5649490356445312, -0.5455169677734375, -0.5260848999023438, -0.50665283203125, -0.48722076416015625, -0.4677886962890625, -0.44835662841796875, -0.428924560546875, -0.40949249267578125, -0.3900604248046875, -0.37062835693359375, -0.3511962890625, -0.33176422119140625, -0.3123321533203125, -0.29290008544921875, -0.273468017578125, -0.25403594970703125, -0.2346038818359375, -0.21517181396484375, -0.19573974609375, -0.17630767822265625, -0.1568756103515625, -0.13744354248046875, -0.118011474609375, -0.09857940673828125, -0.0791473388671875, -0.05971527099609375, -0.040283203125, -0.02085113525390625, -0.0014190673828125, 0.01801300048828125, 0.037445068359375, 0.05687713623046875, 0.0763092041015625, 0.09574127197265625, 0.11517333984375, 0.13460540771484375, 0.1540374755859375, 0.17346954345703125, 0.192901611328125, 0.21233367919921875, 0.2317657470703125, 0.25119781494140625, 0.2706298828125, 0.29006195068359375, 0.3094940185546875, 0.32892608642578125, 0.348358154296875, 0.36779022216796875, 0.3872222900390625, 0.40665435791015625, 0.42608642578125, 0.44551849365234375, 0.4649505615234375, 0.48438262939453125, 0.503814697265625, 0.5232467651367188, 0.5426788330078125, 0.5621109008789062, 0.58154296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 2.0, 8.0, 13.0, 10.0, 24.0, 31.0, 44.0, 143.0, 639.0, 3580.0, 875802.0, 164320.0, 3118.0, 567.0, 105.0, 44.0, 25.0, 18.0, 8.0, 6.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.03125, -10.6630859375, -10.294921875, -9.9267578125, -9.55859375, -9.1904296875, -8.822265625, -8.4541015625, -8.0859375, -7.7177734375, -7.349609375, -6.9814453125, -6.61328125, -6.2451171875, -5.876953125, -5.5087890625, -5.140625, -4.7724609375, -4.404296875, -4.0361328125, -3.66796875, -3.2998046875, -2.931640625, -2.5634765625, -2.1953125, -1.8271484375, -1.458984375, -1.0908203125, -0.72265625, -0.3544921875, 0.013671875, 0.3818359375, 0.75, 1.1181640625, 1.486328125, 1.8544921875, 2.22265625, 2.5908203125, 2.958984375, 3.3271484375, 3.6953125, 4.0634765625, 4.431640625, 4.7998046875, 5.16796875, 5.5361328125, 5.904296875, 6.2724609375, 6.640625, 7.0087890625, 7.376953125, 7.7451171875, 8.11328125, 8.4814453125, 8.849609375, 9.2177734375, 9.5859375, 9.9541015625, 10.322265625, 10.6904296875, 11.05859375, 11.4267578125, 11.794921875, 12.1630859375, 12.53125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 10.0, 13.0, 15.0, 39.0, 52.0, 111.0, 211.0, 257.0, 144.0, 61.0, 44.0, 24.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6177295446395874, -0.5797190070152283, -0.5417084693908691, -0.50369793176651, -0.4656873941421509, -0.42767685651779175, -0.3896663188934326, -0.3516557812690735, -0.31364524364471436, -0.2756347060203552, -0.2376241683959961, -0.19961363077163696, -0.16160309314727783, -0.1235925555229187, -0.08558201789855957, -0.04757148027420044, -0.009560942649841309, 0.028449594974517822, 0.06646013259887695, 0.10447067022323608, 0.14248120784759521, 0.18049174547195435, 0.21850228309631348, 0.2565128207206726, 0.29452335834503174, 0.33253389596939087, 0.37054443359375, 0.40855497121810913, 0.44656550884246826, 0.4845760464668274, 0.5225865840911865, 0.5605971217155457, 0.5986077785491943, 0.6366183161735535, 0.6746288537979126, 0.7126393914222717, 0.7506499290466309, 0.78866046667099, 0.8266710042953491, 0.8646815419197083, 0.9026920795440674, 0.9407026171684265, 0.9787131547927856, 1.0167236328125, 1.054734230041504, 1.0927448272705078, 1.1307553052902222, 1.1687657833099365, 1.2067763805389404, 1.2447869777679443, 1.2827974557876587, 1.320807933807373, 1.358818531036377, 1.3968291282653809, 1.4348396062850952, 1.4728500843048096, 1.5108606815338135, 1.5488712787628174, 1.5868817567825317, 1.624892234802246, 1.66290283203125, 1.700913429260254, 1.7389239072799683, 1.7769343852996826, 1.8149449825286865]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 8.0, 8.0, 8.0, 12.0, 19.0, 19.0, 24.0, 19.0, 20.0, 23.0, 16.0, 31.0, 40.0, 30.0, 35.0, 35.0, 33.0, 41.0, 36.0, 38.0, 35.0, 37.0, 39.0, 37.0, 33.0, 30.0, 28.0, 24.0, 28.0, 15.0, 17.0, 26.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 8.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35305070877075195, -0.3404378592967987, -0.32782498002052307, -0.3152121305465698, -0.3025992512702942, -0.28998640179634094, -0.2773735225200653, -0.26476067304611206, -0.2521477937698364, -0.23953492939472198, -0.22692206501960754, -0.2143092006444931, -0.20169633626937866, -0.18908348679542542, -0.17647060751914978, -0.16385775804519653, -0.1512448936700821, -0.13863202929496765, -0.1260191649198532, -0.11340630054473877, -0.10079343616962433, -0.08818057924509048, -0.07556771486997604, -0.0629548504948616, -0.05034198611974716, -0.03772912174463272, -0.02511625923216343, -0.012503396719694138, 0.00010946765542030334, 0.012722328305244446, 0.025335192680358887, 0.03794805705547333, 0.05056092143058777, 0.06317378580570221, 0.07578665018081665, 0.08839951455593109, 0.10101237893104553, 0.11362523585557938, 0.12623810768127441, 0.13885095715522766, 0.1514638364315033, 0.16407670080661774, 0.17668956518173218, 0.18930242955684662, 0.20191529393196106, 0.2145281434059143, 0.22714102268218994, 0.2397538721561432, 0.25236672163009644, 0.2649795711040497, 0.2775924503803253, 0.29020529985427856, 0.3028181791305542, 0.31543102860450745, 0.3280439078807831, 0.34065675735473633, 0.35326963663101196, 0.3658824861049652, 0.37849536538124084, 0.3911082148551941, 0.4037210941314697, 0.416333943605423, 0.4289468228816986, 0.44155967235565186, 0.4541725516319275]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 10.0, 19.0, 11.0, 22.0, 20.0, 18.0, 25.0, 18.0, 30.0, 31.0, 32.0, 39.0, 38.0, 43.0, 30.0, 44.0, 37.0, 40.0, 47.0, 45.0, 52.0, 46.0, 34.0, 21.0, 25.0, 26.0, 16.0, 30.0, 24.0, 18.0, 14.0, 12.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.541015625, -3.43310546875, -3.3251953125, -3.21728515625, -3.109375, -3.00146484375, -2.8935546875, -2.78564453125, -2.677734375, -2.56982421875, -2.4619140625, -2.35400390625, -2.24609375, -2.13818359375, -2.0302734375, -1.92236328125, -1.814453125, -1.70654296875, -1.5986328125, -1.49072265625, -1.3828125, -1.27490234375, -1.1669921875, -1.05908203125, -0.951171875, -0.84326171875, -0.7353515625, -0.62744140625, -0.51953125, -0.41162109375, -0.3037109375, -0.19580078125, -0.087890625, 0.02001953125, 0.1279296875, 0.23583984375, 0.34375, 0.45166015625, 0.5595703125, 0.66748046875, 0.775390625, 0.88330078125, 0.9912109375, 1.09912109375, 1.20703125, 1.31494140625, 1.4228515625, 1.53076171875, 1.638671875, 1.74658203125, 1.8544921875, 1.96240234375, 2.0703125, 2.17822265625, 2.2861328125, 2.39404296875, 2.501953125, 2.60986328125, 2.7177734375, 2.82568359375, 2.93359375, 3.04150390625, 3.1494140625, 3.25732421875, 3.365234375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 7.0, 11.0, 27.0, 34.0, 55.0, 84.0, 159.0, 205.0, 320.0, 483.0, 753.0, 1251.0, 2051.0, 3504.0, 5985.0, 10574.0, 20265.0, 45513.0, 140850.0, 456701.0, 235080.0, 66329.0, 26841.0, 13250.0, 7390.0, 4140.0, 2566.0, 1489.0, 954.0, 587.0, 354.0, 250.0, 150.0, 90.0, 67.0, 46.0, 43.0, 27.0, 9.0, 15.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.94921875, -5.7672119140625, -5.585205078125, -5.4031982421875, -5.22119140625, -5.0391845703125, -4.857177734375, -4.6751708984375, -4.4931640625, -4.3111572265625, -4.129150390625, -3.9471435546875, -3.76513671875, -3.5831298828125, -3.401123046875, -3.2191162109375, -3.037109375, -2.8551025390625, -2.673095703125, -2.4910888671875, -2.30908203125, -2.1270751953125, -1.945068359375, -1.7630615234375, -1.5810546875, -1.3990478515625, -1.217041015625, -1.0350341796875, -0.85302734375, -0.6710205078125, -0.489013671875, -0.3070068359375, -0.125, 0.0570068359375, 0.239013671875, 0.4210205078125, 0.60302734375, 0.7850341796875, 0.967041015625, 1.1490478515625, 1.3310546875, 1.5130615234375, 1.695068359375, 1.8770751953125, 2.05908203125, 2.2410888671875, 2.423095703125, 2.6051025390625, 2.787109375, 2.9691162109375, 3.151123046875, 3.3331298828125, 3.51513671875, 3.6971435546875, 3.879150390625, 4.0611572265625, 4.2431640625, 4.4251708984375, 4.607177734375, 4.7891845703125, 4.97119140625, 5.1531982421875, 5.335205078125, 5.5172119140625, 5.69921875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 12.0, 14.0, 30.0, 34.0, 35.0, 37.0, 36.0, 63.0, 52.0, 67.0, 88.0, 227.0, 1577.0, 248.0, 89.0, 63.0, 63.0, 49.0, 41.0, 35.0, 30.0, 25.0, 17.0, 23.0, 12.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8851318359375, -11.418701171875, -10.9522705078125, -10.48583984375, -10.0194091796875, -9.552978515625, -9.0865478515625, -8.6201171875, -8.1536865234375, -7.687255859375, -7.2208251953125, -6.75439453125, -6.2879638671875, -5.821533203125, -5.3551025390625, -4.888671875, -4.4222412109375, -3.955810546875, -3.4893798828125, -3.02294921875, -2.5565185546875, -2.090087890625, -1.6236572265625, -1.1572265625, -0.6907958984375, -0.224365234375, 0.2420654296875, 0.70849609375, 1.1749267578125, 1.641357421875, 2.1077880859375, 2.57421875, 3.0406494140625, 3.507080078125, 3.9735107421875, 4.43994140625, 4.9063720703125, 5.372802734375, 5.8392333984375, 6.3056640625, 6.7720947265625, 7.238525390625, 7.7049560546875, 8.17138671875, 8.6378173828125, 9.104248046875, 9.5706787109375, 10.037109375, 10.5035400390625, 10.969970703125, 11.4364013671875, 11.90283203125, 12.3692626953125, 12.835693359375, 13.3021240234375, 13.7685546875, 14.2349853515625, 14.701416015625, 15.1678466796875, 15.63427734375, 16.1007080078125, 16.567138671875, 17.0335693359375, 17.5]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 20.0, 28.0, 28.0, 42.0, 73.0, 86.0, 139.0, 263.0, 542.0, 1650.0, 6831.0, 48085.0, 2506483.0, 550360.0, 24668.0, 4179.0, 1086.0, 448.0, 197.0, 139.0, 87.0, 74.0, 51.0, 27.0, 18.0, 22.0, 9.0, 9.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.03125, -22.40625, -21.78125, -21.15625, -20.53125, -19.90625, -19.28125, -18.65625, -18.03125, -17.40625, -16.78125, -16.15625, -15.53125, -14.90625, -14.28125, -13.65625, -13.03125, -12.40625, -11.78125, -11.15625, -10.53125, -9.90625, -9.28125, -8.65625, -8.03125, -7.40625, -6.78125, -6.15625, -5.53125, -4.90625, -4.28125, -3.65625, -3.03125, -2.40625, -1.78125, -1.15625, -0.53125, 0.09375, 0.71875, 1.34375, 1.96875, 2.59375, 3.21875, 3.84375, 4.46875, 5.09375, 5.71875, 6.34375, 6.96875, 7.59375, 8.21875, 8.84375, 9.46875, 10.09375, 10.71875, 11.34375, 11.96875, 12.59375, 13.21875, 13.84375, 14.46875, 15.09375, 15.71875, 16.34375, 16.96875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 15.0, 59.0, 185.0, 314.0, 251.0, 106.0, 50.0, 14.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46574020385742, -60.84966278076172, -59.23358154296875, -57.61750411987305, -56.00142288208008, -54.385345458984375, -52.769264221191406, -51.1531867980957, -49.537105560302734, -47.92102813720703, -46.30494689941406, -44.68886947631836, -43.07278823852539, -41.45671081542969, -39.84062957763672, -38.224552154541016, -36.60847473144531, -34.99239730834961, -33.37631607055664, -31.760236740112305, -30.14415740966797, -28.528079986572266, -26.911998748779297, -25.295921325683594, -23.679840087890625, -22.06376075744629, -20.447681427001953, -18.831602096557617, -17.21552276611328, -15.599444389343262, -13.983365058898926, -12.36728572845459, -10.751205444335938, -9.135126113891602, -7.519046783447266, -5.902967929840088, -4.286888599395752, -2.670809745788574, -1.0547304153442383, 0.5613489151000977, 2.1774282455444336, 3.7935075759887695, 5.4095869064331055, 7.025665760040283, 8.641744613647461, 10.257823944091797, 11.873903274536133, 13.489982604980469, 15.106061935424805, 16.72214126586914, 18.338220596313477, 19.954299926757812, 21.57037925720215, 23.186458587646484, 24.802536010742188, 26.418617248535156, 28.03469467163086, 29.650774002075195, 31.26685333251953, 32.882930755615234, 34.4990119934082, 36.115089416503906, 37.731170654296875, 39.34724807739258, 40.96332931518555]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 6.0, 10.0, 8.0, 14.0, 11.0, 20.0, 15.0, 11.0, 13.0, 23.0, 23.0, 15.0, 25.0, 30.0, 28.0, 40.0, 37.0, 32.0, 41.0, 46.0, 39.0, 34.0, 34.0, 28.0, 33.0, 34.0, 24.0, 40.0, 29.0, 36.0, 17.0, 29.0, 15.0, 28.0, 22.0, 14.0, 18.0, 12.0, 16.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-30.805992126464844, -29.864938735961914, -28.923887252807617, -27.982833862304688, -27.04178237915039, -26.10072898864746, -25.159677505493164, -24.218624114990234, -23.277572631835938, -22.336519241333008, -21.39546775817871, -20.45441436767578, -19.513362884521484, -18.572309494018555, -17.631258010864258, -16.690204620361328, -15.749152183532715, -14.808099746704102, -13.867047309875488, -12.925994873046875, -11.984942436218262, -11.043889999389648, -10.102836608886719, -9.161785125732422, -8.220731735229492, -7.279679298400879, -6.338626861572266, -5.397574424743652, -4.456521987915039, -3.5154690742492676, -2.5744166374206543, -1.633364200592041, -0.6923122406005859, 0.24874025583267212, 1.1897927522659302, 2.130845308303833, 3.0718977451324463, 4.012950420379639, 4.954002857208252, 5.895055294036865, 6.8361077308654785, 7.777160167694092, 8.718213081359863, 9.659265518188477, 10.60031795501709, 11.541370391845703, 12.482422828674316, 13.42347526550293, 14.364527702331543, 15.305580139160156, 16.246633529663086, 17.187685012817383, 18.128738403320312, 19.06978988647461, 20.01084327697754, 20.951894760131836, 21.892948150634766, 22.834001541137695, 23.775053024291992, 24.716106414794922, 25.65715789794922, 26.59821128845215, 27.539262771606445, 28.480316162109375, 29.421367645263672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 10.0, 6.0, 8.0, 9.0, 11.0, 14.0, 15.0, 15.0, 18.0, 26.0, 29.0, 20.0, 31.0, 20.0, 37.0, 34.0, 45.0, 43.0, 51.0, 49.0, 50.0, 39.0, 37.0, 35.0, 43.0, 39.0, 27.0, 33.0, 29.0, 27.0, 26.0, 16.0, 22.0, 11.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.822265625, -3.706298828125, -3.59033203125, -3.474365234375, -3.3583984375, -3.242431640625, -3.12646484375, -3.010498046875, -2.89453125, -2.778564453125, -2.66259765625, -2.546630859375, -2.4306640625, -2.314697265625, -2.19873046875, -2.082763671875, -1.966796875, -1.850830078125, -1.73486328125, -1.618896484375, -1.5029296875, -1.386962890625, -1.27099609375, -1.155029296875, -1.0390625, -0.923095703125, -0.80712890625, -0.691162109375, -0.5751953125, -0.459228515625, -0.34326171875, -0.227294921875, -0.111328125, 0.004638671875, 0.12060546875, 0.236572265625, 0.3525390625, 0.468505859375, 0.58447265625, 0.700439453125, 0.81640625, 0.932373046875, 1.04833984375, 1.164306640625, 1.2802734375, 1.396240234375, 1.51220703125, 1.628173828125, 1.744140625, 1.860107421875, 1.97607421875, 2.092041015625, 2.2080078125, 2.323974609375, 2.43994140625, 2.555908203125, 2.671875, 2.787841796875, 2.90380859375, 3.019775390625, 3.1357421875, 3.251708984375, 3.36767578125, 3.483642578125, 3.599609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 12.0, 12.0, 21.0, 39.0, 50.0, 72.0, 96.0, 122.0, 206.0, 304.0, 416.0, 626.0, 1091.0, 1907.0, 3450.0, 7515.0, 16705.0, 43227.0, 177252.0, 1437154.0, 2130138.0, 280435.0, 55451.0, 19836.0, 8627.0, 3962.0, 2136.0, 1225.0, 726.0, 469.0, 291.0, 194.0, 148.0, 120.0, 62.0, 46.0, 36.0, 30.0, 14.0, 10.0, 9.0, 11.0, 11.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.3936767578125, -6.166259765625, -5.9388427734375, -5.71142578125, -5.4840087890625, -5.256591796875, -5.0291748046875, -4.8017578125, -4.5743408203125, -4.346923828125, -4.1195068359375, -3.89208984375, -3.6646728515625, -3.437255859375, -3.2098388671875, -2.982421875, -2.7550048828125, -2.527587890625, -2.3001708984375, -2.07275390625, -1.8453369140625, -1.617919921875, -1.3905029296875, -1.1630859375, -0.9356689453125, -0.708251953125, -0.4808349609375, -0.25341796875, -0.0260009765625, 0.201416015625, 0.4288330078125, 0.65625, 0.8836669921875, 1.111083984375, 1.3385009765625, 1.56591796875, 1.7933349609375, 2.020751953125, 2.2481689453125, 2.4755859375, 2.7030029296875, 2.930419921875, 3.1578369140625, 3.38525390625, 3.6126708984375, 3.840087890625, 4.0675048828125, 4.294921875, 4.5223388671875, 4.749755859375, 4.9771728515625, 5.20458984375, 5.4320068359375, 5.659423828125, 5.8868408203125, 6.1142578125, 6.3416748046875, 6.569091796875, 6.7965087890625, 7.02392578125, 7.2513427734375, 7.478759765625, 7.7061767578125, 7.93359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 11.0, 7.0, 7.0, 12.0, 9.0, 19.0, 24.0, 29.0, 25.0, 42.0, 58.0, 90.0, 90.0, 106.0, 163.0, 221.0, 410.0, 564.0, 614.0, 476.0, 290.0, 218.0, 156.0, 106.0, 71.0, 55.0, 46.0, 43.0, 23.0, 24.0, 11.0, 10.0, 7.0, 5.0, 3.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.84765625, -7.64752197265625, -7.4473876953125, -7.24725341796875, -7.047119140625, -6.84698486328125, -6.6468505859375, -6.44671630859375, -6.24658203125, -6.04644775390625, -5.8463134765625, -5.64617919921875, -5.446044921875, -5.24591064453125, -5.0457763671875, -4.84564208984375, -4.6455078125, -4.44537353515625, -4.2452392578125, -4.04510498046875, -3.844970703125, -3.64483642578125, -3.4447021484375, -3.24456787109375, -3.04443359375, -2.84429931640625, -2.6441650390625, -2.44403076171875, -2.243896484375, -2.04376220703125, -1.8436279296875, -1.64349365234375, -1.443359375, -1.24322509765625, -1.0430908203125, -0.84295654296875, -0.642822265625, -0.44268798828125, -0.2425537109375, -0.04241943359375, 0.15771484375, 0.35784912109375, 0.5579833984375, 0.75811767578125, 0.958251953125, 1.15838623046875, 1.3585205078125, 1.55865478515625, 1.7587890625, 1.95892333984375, 2.1590576171875, 2.35919189453125, 2.559326171875, 2.75946044921875, 2.9595947265625, 3.15972900390625, 3.35986328125, 3.55999755859375, 3.7601318359375, 3.96026611328125, 4.160400390625, 4.36053466796875, 4.5606689453125, 4.76080322265625, 4.9609375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 9.0, 12.0, 17.0, 24.0, 37.0, 50.0, 66.0, 113.0, 130.0, 249.0, 523.0, 2178.0, 15399.0, 269974.0, 3772044.0, 121885.0, 9031.0, 1373.0, 425.0, 207.0, 142.0, 108.0, 58.0, 49.0, 32.0, 27.0, 23.0, 17.0, 13.0, 8.0, 4.0, 12.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.236572265625, -17.48876953125, -16.740966796875, -15.9931640625, -15.245361328125, -14.49755859375, -13.749755859375, -13.001953125, -12.254150390625, -11.50634765625, -10.758544921875, -10.0107421875, -9.262939453125, -8.51513671875, -7.767333984375, -7.01953125, -6.271728515625, -5.52392578125, -4.776123046875, -4.0283203125, -3.280517578125, -2.53271484375, -1.784912109375, -1.037109375, -0.289306640625, 0.45849609375, 1.206298828125, 1.9541015625, 2.701904296875, 3.44970703125, 4.197509765625, 4.9453125, 5.693115234375, 6.44091796875, 7.188720703125, 7.9365234375, 8.684326171875, 9.43212890625, 10.179931640625, 10.927734375, 11.675537109375, 12.42333984375, 13.171142578125, 13.9189453125, 14.666748046875, 15.41455078125, 16.162353515625, 16.91015625, 17.657958984375, 18.40576171875, 19.153564453125, 19.9013671875, 20.649169921875, 21.39697265625, 22.144775390625, 22.892578125, 23.640380859375, 24.38818359375, 25.135986328125, 25.8837890625, 26.631591796875, 27.37939453125, 28.127197265625, 28.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 32.0, 97.0, 250.0, 348.0, 201.0, 66.0, 11.0, 6.0], "bins": [-150.67547607421875, -148.13961791992188, -145.603759765625, -143.0679168701172, -140.5320587158203, -137.99620056152344, -135.46034240722656, -132.9244842529297, -130.38864135742188, -127.852783203125, -125.31693267822266, -122.78107452392578, -120.24522399902344, -117.70936584472656, -115.17350769042969, -112.63765716552734, -110.10179138183594, -107.56593322753906, -105.03008270263672, -102.49422454833984, -99.9583740234375, -97.42251586914062, -94.88665771484375, -92.3508071899414, -89.81495666503906, -87.27909851074219, -84.74324798583984, -82.20738983154297, -79.67153930664062, -77.13568115234375, -74.59982299804688, -72.06397247314453, -69.52810668945312, -66.99224853515625, -64.4563980102539, -61.92053985595703, -59.38468551635742, -56.84883117675781, -54.3129768371582, -51.777122497558594, -49.24127197265625, -46.70541763305664, -44.16956329345703, -41.633705139160156, -39.09785079956055, -36.56199645996094, -34.02614212036133, -31.490285873413086, -28.954429626464844, -26.418575286865234, -23.882719039916992, -21.346864700317383, -18.81100845336914, -16.27515411376953, -13.739299774169922, -11.20344352722168, -8.66758918762207, -6.1317338943481445, -3.595879077911377, -1.0600242614746094, 1.4758310317993164, 4.011686325073242, 6.547540664672852, 9.083396911621094, 11.619251251220703]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 7.0, 5.0, 11.0, 13.0, 22.0, 19.0, 29.0, 30.0, 22.0, 31.0, 44.0, 43.0, 33.0, 38.0, 42.0, 44.0, 38.0, 31.0, 50.0, 47.0, 38.0, 45.0, 40.0, 27.0, 34.0, 25.0, 33.0, 21.0, 25.0, 19.0, 26.0, 12.0, 14.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.054899215698242, -26.296161651611328, -25.537424087524414, -24.7786865234375, -24.019948959350586, -23.261211395263672, -22.502471923828125, -21.74373435974121, -20.984996795654297, -20.226259231567383, -19.46752166748047, -18.708784103393555, -17.95004653930664, -17.191307067871094, -16.432571411132812, -15.673831939697266, -14.915095329284668, -14.156357765197754, -13.39762020111084, -12.63888168334961, -11.880144119262695, -11.121406555175781, -10.362668991088867, -9.603931427001953, -8.845193862915039, -8.086456298828125, -7.327718257904053, -6.568980693817139, -5.810242652893066, -5.051505088806152, -4.292767524719238, -3.534029483795166, -2.7752914428710938, -2.0165536403656006, -1.257815957069397, -0.49907827377319336, 0.2596595287322998, 1.018397331237793, 1.777134895324707, 2.5358729362487793, 3.2946105003356934, 4.053348064422607, 4.81208610534668, 5.570823669433594, 6.329561233520508, 7.08829927444458, 7.847036838531494, 8.605774879455566, 9.36451244354248, 10.123250007629395, 10.881987571716309, 11.640726089477539, 12.399463653564453, 13.158201217651367, 13.916938781738281, 14.675676345825195, 15.43441390991211, 16.193151473999023, 16.951889038085938, 17.71062660217285, 18.469364166259766, 19.228103637695312, 19.986839294433594, 20.74557876586914, 21.504316329956055]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 2.0, 6.0, 4.0, 13.0, 14.0, 11.0, 11.0, 17.0, 20.0, 20.0, 35.0, 25.0, 18.0, 34.0, 27.0, 42.0, 35.0, 47.0, 35.0, 58.0, 48.0, 38.0, 43.0, 43.0, 43.0, 31.0, 35.0, 32.0, 35.0, 23.0, 25.0, 23.0, 21.0, 15.0, 9.0, 7.0, 7.0, 8.0, 4.0, 5.0, 6.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.453125, -3.338043212890625, -3.22296142578125, -3.107879638671875, -2.9927978515625, -2.877716064453125, -2.76263427734375, -2.647552490234375, -2.532470703125, -2.417388916015625, -2.30230712890625, -2.187225341796875, -2.0721435546875, -1.957061767578125, -1.84197998046875, -1.726898193359375, -1.61181640625, -1.496734619140625, -1.38165283203125, -1.266571044921875, -1.1514892578125, -1.036407470703125, -0.92132568359375, -0.806243896484375, -0.691162109375, -0.576080322265625, -0.46099853515625, -0.345916748046875, -0.2308349609375, -0.115753173828125, -0.00067138671875, 0.114410400390625, 0.2294921875, 0.344573974609375, 0.45965576171875, 0.574737548828125, 0.6898193359375, 0.804901123046875, 0.91998291015625, 1.035064697265625, 1.150146484375, 1.265228271484375, 1.38031005859375, 1.495391845703125, 1.6104736328125, 1.725555419921875, 1.84063720703125, 1.955718994140625, 2.07080078125, 2.185882568359375, 2.30096435546875, 2.416046142578125, 2.5311279296875, 2.646209716796875, 2.76129150390625, 2.876373291015625, 2.991455078125, 3.106536865234375, 3.22161865234375, 3.336700439453125, 3.4517822265625, 3.566864013671875, 3.68194580078125, 3.797027587890625, 3.912109375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 16.0, 24.0, 28.0, 42.0, 56.0, 61.0, 101.0, 128.0, 204.0, 262.0, 306.0, 483.0, 659.0, 959.0, 1494.0, 2259.0, 4016.0, 9393.0, 41793.0, 493535.0, 435727.0, 37489.0, 8716.0, 3872.0, 2259.0, 1336.0, 967.0, 653.0, 469.0, 312.0, 250.0, 170.0, 127.0, 96.0, 60.0, 59.0, 42.0, 36.0, 22.0, 16.0, 14.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.58984375, -2.5062255859375, -2.422607421875, -2.3389892578125, -2.25537109375, -2.1717529296875, -2.088134765625, -2.0045166015625, -1.9208984375, -1.8372802734375, -1.753662109375, -1.6700439453125, -1.58642578125, -1.5028076171875, -1.419189453125, -1.3355712890625, -1.251953125, -1.1683349609375, -1.084716796875, -1.0010986328125, -0.91748046875, -0.8338623046875, -0.750244140625, -0.6666259765625, -0.5830078125, -0.4993896484375, -0.415771484375, -0.3321533203125, -0.24853515625, -0.1649169921875, -0.081298828125, 0.0023193359375, 0.0859375, 0.1695556640625, 0.253173828125, 0.3367919921875, 0.42041015625, 0.5040283203125, 0.587646484375, 0.6712646484375, 0.7548828125, 0.8385009765625, 0.922119140625, 1.0057373046875, 1.08935546875, 1.1729736328125, 1.256591796875, 1.3402099609375, 1.423828125, 1.5074462890625, 1.591064453125, 1.6746826171875, 1.75830078125, 1.8419189453125, 1.925537109375, 2.0091552734375, 2.0927734375, 2.1763916015625, 2.260009765625, 2.3436279296875, 2.42724609375, 2.5108642578125, 2.594482421875, 2.6781005859375, 2.76171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 11.0, 4.0, 13.0, 12.0, 14.0, 16.0, 16.0, 29.0, 25.0, 21.0, 40.0, 35.0, 19.0, 41.0, 49.0, 43.0, 43.0, 43.0, 1069.0, 50.0, 35.0, 43.0, 32.0, 45.0, 35.0, 41.0, 23.0, 33.0, 22.0, 23.0, 18.0, 15.0, 18.0, 14.0, 7.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.090667724609375, -2.99774169921875, -2.904815673828125, -2.8118896484375, -2.718963623046875, -2.62603759765625, -2.533111572265625, -2.440185546875, -2.347259521484375, -2.25433349609375, -2.161407470703125, -2.0684814453125, -1.975555419921875, -1.88262939453125, -1.789703369140625, -1.69677734375, -1.603851318359375, -1.51092529296875, -1.417999267578125, -1.3250732421875, -1.232147216796875, -1.13922119140625, -1.046295166015625, -0.953369140625, -0.860443115234375, -0.76751708984375, -0.674591064453125, -0.5816650390625, -0.488739013671875, -0.39581298828125, -0.302886962890625, -0.2099609375, -0.117034912109375, -0.02410888671875, 0.068817138671875, 0.1617431640625, 0.254669189453125, 0.34759521484375, 0.440521240234375, 0.533447265625, 0.626373291015625, 0.71929931640625, 0.812225341796875, 0.9051513671875, 0.998077392578125, 1.09100341796875, 1.183929443359375, 1.27685546875, 1.369781494140625, 1.46270751953125, 1.555633544921875, 1.6485595703125, 1.741485595703125, 1.83441162109375, 1.927337646484375, 2.020263671875, 2.113189697265625, 2.20611572265625, 2.299041748046875, 2.3919677734375, 2.484893798828125, 2.57781982421875, 2.670745849609375, 2.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 6.0, 5.0, 5.0, 11.0, 11.0, 13.0, 14.0, 26.0, 38.0, 42.0, 67.0, 92.0, 150.0, 136.0, 228.0, 331.0, 567.0, 938.0, 1635.0, 3623.0, 12454.0, 162782.0, 1847369.0, 52739.0, 7625.0, 2724.0, 1342.0, 751.0, 409.0, 270.0, 200.0, 127.0, 94.0, 87.0, 49.0, 46.0, 26.0, 22.0, 18.0, 7.0, 11.0, 6.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-2.658203125, -2.580780029296875, -2.50335693359375, -2.425933837890625, -2.3485107421875, -2.271087646484375, -2.19366455078125, -2.116241455078125, -2.038818359375, -1.961395263671875, -1.88397216796875, -1.806549072265625, -1.7291259765625, -1.651702880859375, -1.57427978515625, -1.496856689453125, -1.41943359375, -1.342010498046875, -1.26458740234375, -1.187164306640625, -1.1097412109375, -1.032318115234375, -0.95489501953125, -0.877471923828125, -0.800048828125, -0.722625732421875, -0.64520263671875, -0.567779541015625, -0.4903564453125, -0.412933349609375, -0.33551025390625, -0.258087158203125, -0.1806640625, -0.103240966796875, -0.02581787109375, 0.051605224609375, 0.1290283203125, 0.206451416015625, 0.28387451171875, 0.361297607421875, 0.438720703125, 0.516143798828125, 0.59356689453125, 0.670989990234375, 0.7484130859375, 0.825836181640625, 0.90325927734375, 0.980682373046875, 1.05810546875, 1.135528564453125, 1.21295166015625, 1.290374755859375, 1.3677978515625, 1.445220947265625, 1.52264404296875, 1.600067138671875, 1.677490234375, 1.754913330078125, 1.83233642578125, 1.909759521484375, 1.9871826171875, 2.064605712890625, 2.14202880859375, 2.219451904296875, 2.296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 11.0, 34.0, 51.0, 125.0, 224.0, 244.0, 135.0, 66.0, 27.0, 14.0, 18.0, 9.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.34619140625, -0.33469390869140625, -0.3231964111328125, -0.31169891357421875, -0.300201416015625, -0.28870391845703125, -0.2772064208984375, -0.26570892333984375, -0.25421142578125, -0.24271392822265625, -0.2312164306640625, -0.21971893310546875, -0.208221435546875, -0.19672393798828125, -0.1852264404296875, -0.17372894287109375, -0.1622314453125, -0.15073394775390625, -0.1392364501953125, -0.12773895263671875, -0.116241455078125, -0.10474395751953125, -0.0932464599609375, -0.08174896240234375, -0.07025146484375, -0.05875396728515625, -0.0472564697265625, -0.03575897216796875, -0.024261474609375, -0.01276397705078125, -0.0012664794921875, 0.01023101806640625, 0.021728515625, 0.03322601318359375, 0.0447235107421875, 0.05622100830078125, 0.067718505859375, 0.07921600341796875, 0.0907135009765625, 0.10221099853515625, 0.11370849609375, 0.12520599365234375, 0.1367034912109375, 0.14820098876953125, 0.159698486328125, 0.17119598388671875, 0.1826934814453125, 0.19419097900390625, 0.2056884765625, 0.21718597412109375, 0.2286834716796875, 0.24018096923828125, 0.251678466796875, 0.26317596435546875, 0.2746734619140625, 0.28617095947265625, 0.29766845703125, 0.30916595458984375, 0.3206634521484375, 0.33216094970703125, 0.343658447265625, 0.35515594482421875, 0.3666534423828125, 0.37815093994140625, 0.3896484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 21.0, 12.0, 29.0, 39.0, 92.0, 264.0, 2707.0, 1031748.0, 12615.0, 712.0, 125.0, 62.0, 43.0, 22.0, 7.0, 9.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.10400390625, -7.8564453125, -7.60888671875, -7.361328125, -7.11376953125, -6.8662109375, -6.61865234375, -6.37109375, -6.12353515625, -5.8759765625, -5.62841796875, -5.380859375, -5.13330078125, -4.8857421875, -4.63818359375, -4.390625, -4.14306640625, -3.8955078125, -3.64794921875, -3.400390625, -3.15283203125, -2.9052734375, -2.65771484375, -2.41015625, -2.16259765625, -1.9150390625, -1.66748046875, -1.419921875, -1.17236328125, -0.9248046875, -0.67724609375, -0.4296875, -0.18212890625, 0.0654296875, 0.31298828125, 0.560546875, 0.80810546875, 1.0556640625, 1.30322265625, 1.55078125, 1.79833984375, 2.0458984375, 2.29345703125, 2.541015625, 2.78857421875, 3.0361328125, 3.28369140625, 3.53125, 3.77880859375, 4.0263671875, 4.27392578125, 4.521484375, 4.76904296875, 5.0166015625, 5.26416015625, 5.51171875, 5.75927734375, 6.0068359375, 6.25439453125, 6.501953125, 6.74951171875, 6.9970703125, 7.24462890625, 7.4921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 26.0, 227.0, 667.0, 76.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296105146408081, -3.2330474853515625, -3.169989824295044, -3.1069321632385254, -3.043874502182007, -2.9808168411254883, -2.9177591800689697, -2.854701519012451, -2.7916440963745117, -2.728586435317993, -2.6655287742614746, -2.602471113204956, -2.5394134521484375, -2.476355791091919, -2.4132981300354004, -2.350240707397461, -2.2871828079223633, -2.2241251468658447, -2.161067485809326, -2.0980098247528076, -2.034952163696289, -1.9718945026397705, -1.9088369607925415, -1.845779299736023, -1.7827216386795044, -1.7196639776229858, -1.6566063165664673, -1.5935486555099487, -1.5304911136627197, -1.4674334526062012, -1.4043757915496826, -1.341318130493164, -1.2782602310180664, -1.2152025699615479, -1.1521449089050293, -1.0890872478485107, -1.0260295867919922, -0.9629719853401184, -0.8999143838882446, -0.8368567228317261, -0.7737990617752075, -0.710741400718689, -0.6476837396621704, -0.5846261382102966, -0.5215684771537781, -0.4585108160972595, -0.39545318484306335, -0.3323955535888672, -0.26933789253234863, -0.20628024637699127, -0.1432226002216339, -0.08016495406627655, -0.01710730791091919, 0.045950353145599365, 0.10900798439979553, 0.1720656156539917, 0.23512327671051025, 0.2981809377670288, 0.361238569021225, 0.42429620027542114, 0.4873538613319397, 0.5504115223884583, 0.613469123840332, 0.6765267848968506, 0.7395844459533691]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 13.0, 15.0, 10.0, 16.0, 15.0, 23.0, 27.0, 26.0, 21.0, 30.0, 32.0, 37.0, 42.0, 34.0, 42.0, 53.0, 47.0, 33.0, 38.0, 37.0, 51.0, 41.0, 34.0, 33.0, 26.0, 34.0, 24.0, 22.0, 28.0, 17.0, 8.0, 18.0, 14.0, 4.0, 8.0, 4.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2493683099746704, -0.2419174164533615, -0.2344665229320526, -0.2270156294107437, -0.21956473588943481, -0.21211384236812592, -0.20466294884681702, -0.19721205532550812, -0.18976116180419922, -0.18231026828289032, -0.17485937476158142, -0.16740848124027252, -0.15995758771896362, -0.15250669419765472, -0.14505580067634583, -0.13760490715503693, -0.13015401363372803, -0.12270312011241913, -0.11525222659111023, -0.10780133306980133, -0.10035043954849243, -0.09289954602718353, -0.08544865250587463, -0.07799775898456573, -0.07054686546325684, -0.06309597194194794, -0.05564507842063904, -0.04819418489933014, -0.04074329137802124, -0.03329239785671234, -0.025841504335403442, -0.018390610814094543, -0.010939717292785645, -0.0034888237714767456, 0.003962069749832153, 0.011412963271141052, 0.01886385679244995, 0.02631475031375885, 0.03376564383506775, 0.04121653735637665, 0.04866743087768555, 0.056118324398994446, 0.06356921792030334, 0.07102011144161224, 0.07847100496292114, 0.08592189848423004, 0.09337279200553894, 0.10082368552684784, 0.10827457904815674, 0.11572547256946564, 0.12317636609077454, 0.13062725961208344, 0.13807815313339233, 0.14552904665470123, 0.15297994017601013, 0.16043083369731903, 0.16788172721862793, 0.17533262073993683, 0.18278351426124573, 0.19023440778255463, 0.19768530130386353, 0.20513619482517242, 0.21258708834648132, 0.22003798186779022, 0.22748887538909912]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 7.0, 8.0, 7.0, 7.0, 13.0, 14.0, 19.0, 15.0, 24.0, 26.0, 21.0, 33.0, 35.0, 31.0, 40.0, 56.0, 42.0, 38.0, 55.0, 60.0, 49.0, 50.0, 28.0, 40.0, 35.0, 33.0, 35.0, 23.0, 29.0, 25.0, 19.0, 14.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.425628662109375, -3.30242919921875, -3.179229736328125, -3.0560302734375, -2.932830810546875, -2.80963134765625, -2.686431884765625, -2.563232421875, -2.440032958984375, -2.31683349609375, -2.193634033203125, -2.0704345703125, -1.947235107421875, -1.82403564453125, -1.700836181640625, -1.57763671875, -1.454437255859375, -1.33123779296875, -1.208038330078125, -1.0848388671875, -0.961639404296875, -0.83843994140625, -0.715240478515625, -0.592041015625, -0.468841552734375, -0.34564208984375, -0.222442626953125, -0.0992431640625, 0.023956298828125, 0.14715576171875, 0.270355224609375, 0.3935546875, 0.516754150390625, 0.63995361328125, 0.763153076171875, 0.8863525390625, 1.009552001953125, 1.13275146484375, 1.255950927734375, 1.379150390625, 1.502349853515625, 1.62554931640625, 1.748748779296875, 1.8719482421875, 1.995147705078125, 2.11834716796875, 2.241546630859375, 2.36474609375, 2.487945556640625, 2.61114501953125, 2.734344482421875, 2.8575439453125, 2.980743408203125, 3.10394287109375, 3.227142333984375, 3.350341796875, 3.473541259765625, 3.59674072265625, 3.719940185546875, 3.8431396484375, 3.966339111328125, 4.08953857421875, 4.212738037109375, 4.3359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 14.0, 28.0, 23.0, 33.0, 51.0, 80.0, 105.0, 137.0, 203.0, 306.0, 430.0, 727.0, 1139.0, 1860.0, 3549.0, 7405.0, 16719.0, 45549.0, 183530.0, 558476.0, 156305.0, 41319.0, 15442.0, 6774.0, 3371.0, 1843.0, 1037.0, 680.0, 435.0, 281.0, 205.0, 150.0, 93.0, 66.0, 51.0, 33.0, 24.0, 16.0, 16.0, 7.0, 10.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.31561279296875, -5.1351318359375, -4.95465087890625, -4.774169921875, -4.59368896484375, -4.4132080078125, -4.23272705078125, -4.05224609375, -3.87176513671875, -3.6912841796875, -3.51080322265625, -3.330322265625, -3.14984130859375, -2.9693603515625, -2.78887939453125, -2.6083984375, -2.42791748046875, -2.2474365234375, -2.06695556640625, -1.886474609375, -1.70599365234375, -1.5255126953125, -1.34503173828125, -1.16455078125, -0.98406982421875, -0.8035888671875, -0.62310791015625, -0.442626953125, -0.26214599609375, -0.0816650390625, 0.09881591796875, 0.279296875, 0.45977783203125, 0.6402587890625, 0.82073974609375, 1.001220703125, 1.18170166015625, 1.3621826171875, 1.54266357421875, 1.72314453125, 1.90362548828125, 2.0841064453125, 2.26458740234375, 2.445068359375, 2.62554931640625, 2.8060302734375, 2.98651123046875, 3.1669921875, 3.34747314453125, 3.5279541015625, 3.70843505859375, 3.888916015625, 4.06939697265625, 4.2498779296875, 4.43035888671875, 4.61083984375, 4.79132080078125, 4.9718017578125, 5.15228271484375, 5.332763671875, 5.51324462890625, 5.6937255859375, 5.87420654296875, 6.0546875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 12.0, 13.0, 8.0, 17.0, 17.0, 20.0, 29.0, 24.0, 36.0, 27.0, 31.0, 44.0, 49.0, 54.0, 66.0, 165.0, 1464.0, 367.0, 124.0, 52.0, 69.0, 51.0, 35.0, 29.0, 38.0, 28.0, 22.0, 16.0, 10.0, 18.0, 12.0, 12.0, 15.0, 6.0, 8.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.26220703125, -9.9072265625, -9.55224609375, -9.197265625, -8.84228515625, -8.4873046875, -8.13232421875, -7.77734375, -7.42236328125, -7.0673828125, -6.71240234375, -6.357421875, -6.00244140625, -5.6474609375, -5.29248046875, -4.9375, -4.58251953125, -4.2275390625, -3.87255859375, -3.517578125, -3.16259765625, -2.8076171875, -2.45263671875, -2.09765625, -1.74267578125, -1.3876953125, -1.03271484375, -0.677734375, -0.32275390625, 0.0322265625, 0.38720703125, 0.7421875, 1.09716796875, 1.4521484375, 1.80712890625, 2.162109375, 2.51708984375, 2.8720703125, 3.22705078125, 3.58203125, 3.93701171875, 4.2919921875, 4.64697265625, 5.001953125, 5.35693359375, 5.7119140625, 6.06689453125, 6.421875, 6.77685546875, 7.1318359375, 7.48681640625, 7.841796875, 8.19677734375, 8.5517578125, 8.90673828125, 9.26171875, 9.61669921875, 9.9716796875, 10.32666015625, 10.681640625, 11.03662109375, 11.3916015625, 11.74658203125, 12.1015625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 10.0, 9.0, 15.0, 22.0, 23.0, 15.0, 26.0, 28.0, 41.0, 66.0, 82.0, 120.0, 164.0, 298.0, 664.0, 2009.0, 10694.0, 137560.0, 2882449.0, 99004.0, 9033.0, 1810.0, 603.0, 280.0, 190.0, 94.0, 93.0, 60.0, 47.0, 45.0, 21.0, 29.0, 13.0, 18.0, 17.0, 11.0, 7.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.890625, -17.371337890625, -16.85205078125, -16.332763671875, -15.8134765625, -15.294189453125, -14.77490234375, -14.255615234375, -13.736328125, -13.217041015625, -12.69775390625, -12.178466796875, -11.6591796875, -11.139892578125, -10.62060546875, -10.101318359375, -9.58203125, -9.062744140625, -8.54345703125, -8.024169921875, -7.5048828125, -6.985595703125, -6.46630859375, -5.947021484375, -5.427734375, -4.908447265625, -4.38916015625, -3.869873046875, -3.3505859375, -2.831298828125, -2.31201171875, -1.792724609375, -1.2734375, -0.754150390625, -0.23486328125, 0.284423828125, 0.8037109375, 1.322998046875, 1.84228515625, 2.361572265625, 2.880859375, 3.400146484375, 3.91943359375, 4.438720703125, 4.9580078125, 5.477294921875, 5.99658203125, 6.515869140625, 7.03515625, 7.554443359375, 8.07373046875, 8.593017578125, 9.1123046875, 9.631591796875, 10.15087890625, 10.670166015625, 11.189453125, 11.708740234375, 12.22802734375, 12.747314453125, 13.2666015625, 13.785888671875, 14.30517578125, 14.824462890625, 15.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 11.0, 300.0, 674.0, 30.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.324481010437012, -9.159858703613281, -4.995236396789551, -0.8306140899658203, 3.33400821685791, 7.498631477355957, 11.663252830505371, 15.827874183654785, 19.992496490478516, 24.157119750976562, 28.321741104125977, 32.48636245727539, 36.65098571777344, 40.815608978271484, 44.98023223876953, 49.14485168457031, 53.30947494506836, 57.474098205566406, 61.63871765136719, 65.8033447265625, 69.96796417236328, 74.13258361816406, 78.29721069335938, 82.46183013916016, 86.62645721435547, 90.79107666015625, 94.95570373535156, 99.12032318115234, 103.28494262695312, 107.44956970214844, 111.61418914794922, 115.77880859375, 119.94343566894531, 124.1080551147461, 128.27267456054688, 132.4373016357422, 136.6019287109375, 140.76654052734375, 144.93116760253906, 149.09579467773438, 153.26040649414062, 157.42503356933594, 161.5896453857422, 165.7542724609375, 169.9188995361328, 174.08352661132812, 178.24813842773438, 182.4127655029297, 186.577392578125, 190.7420196533203, 194.90663146972656, 199.07125854492188, 203.2358856201172, 207.4005126953125, 211.56512451171875, 215.72975158691406, 219.89437866210938, 224.0590057373047, 228.22361755371094, 232.38824462890625, 236.55287170410156, 240.71749877929688, 244.88211059570312, 249.04673767089844, 253.2113494873047]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 3.0, 10.0, 6.0, 7.0, 7.0, 14.0, 8.0, 15.0, 22.0, 34.0, 25.0, 33.0, 37.0, 26.0, 35.0, 43.0, 52.0, 43.0, 45.0, 40.0, 44.0, 47.0, 22.0, 42.0, 24.0, 37.0, 31.0, 32.0, 30.0, 28.0, 30.0, 23.0, 23.0, 16.0, 17.0, 8.0, 7.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.405521392822266, -29.41016960144043, -28.414817810058594, -27.41946792602539, -26.424116134643555, -25.42876434326172, -24.433412551879883, -23.438060760498047, -22.442710876464844, -21.447359085083008, -20.452007293701172, -19.45665740966797, -18.461305618286133, -17.465953826904297, -16.47060203552246, -15.475250244140625, -14.479898452758789, -13.484546661376953, -12.489195823669434, -11.493844032287598, -10.498493194580078, -9.503141403198242, -8.507789611816406, -7.5124382972717285, -6.517086982727051, -5.521735668182373, -4.526384353637695, -3.5310325622558594, -2.5356812477111816, -1.540329933166504, -0.544978141784668, 0.45037317276000977, 1.4457244873046875, 2.4410758018493652, 3.436427354812622, 4.431778907775879, 5.427130222320557, 6.422481536865234, 7.41783332824707, 8.413185119628906, 9.408535957336426, 10.403887748718262, 11.399238586425781, 12.394590377807617, 13.389942169189453, 14.385293006896973, 15.380644798278809, 16.375995635986328, 17.371347427368164, 18.36669921875, 19.362051010131836, 20.357402801513672, 21.352752685546875, 22.34810447692871, 23.343456268310547, 24.338808059692383, 25.33415985107422, 26.329511642456055, 27.32486343383789, 28.320213317871094, 29.31556510925293, 30.310916900634766, 31.3062686920166, 32.30162048339844, 33.29697036743164]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 6.0, 14.0, 10.0, 8.0, 8.0, 19.0, 16.0, 18.0, 15.0, 22.0, 25.0, 30.0, 40.0, 28.0, 40.0, 41.0, 45.0, 37.0, 44.0, 49.0, 32.0, 49.0, 31.0, 47.0, 37.0, 24.0, 16.0, 29.0, 37.0, 23.0, 26.0, 23.0, 11.0, 25.0, 10.0, 6.0, 7.0, 11.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.298828125, -3.183013916015625, -3.06719970703125, -2.951385498046875, -2.8355712890625, -2.719757080078125, -2.60394287109375, -2.488128662109375, -2.372314453125, -2.256500244140625, -2.14068603515625, -2.024871826171875, -1.9090576171875, -1.793243408203125, -1.67742919921875, -1.561614990234375, -1.44580078125, -1.329986572265625, -1.21417236328125, -1.098358154296875, -0.9825439453125, -0.866729736328125, -0.75091552734375, -0.635101318359375, -0.519287109375, -0.403472900390625, -0.28765869140625, -0.171844482421875, -0.0560302734375, 0.059783935546875, 0.17559814453125, 0.291412353515625, 0.4072265625, 0.523040771484375, 0.63885498046875, 0.754669189453125, 0.8704833984375, 0.986297607421875, 1.10211181640625, 1.217926025390625, 1.333740234375, 1.449554443359375, 1.56536865234375, 1.681182861328125, 1.7969970703125, 1.912811279296875, 2.02862548828125, 2.144439697265625, 2.26025390625, 2.376068115234375, 2.49188232421875, 2.607696533203125, 2.7235107421875, 2.839324951171875, 2.95513916015625, 3.070953369140625, 3.186767578125, 3.302581787109375, 3.41839599609375, 3.534210205078125, 3.6500244140625, 3.765838623046875, 3.88165283203125, 3.997467041015625, 4.11328125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 22.0, 18.0, 43.0, 60.0, 74.0, 124.0, 181.0, 276.0, 509.0, 759.0, 1196.0, 2065.0, 3902.0, 7297.0, 14377.0, 35169.0, 123656.0, 695213.0, 2307131.0, 797066.0, 133994.0, 37574.0, 15421.0, 7815.0, 4077.0, 2378.0, 1401.0, 885.0, 548.0, 341.0, 211.0, 154.0, 117.0, 68.0, 42.0, 37.0, 13.0, 21.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.05181884765625, -4.8614501953125, -4.67108154296875, -4.480712890625, -4.29034423828125, -4.0999755859375, -3.90960693359375, -3.71923828125, -3.52886962890625, -3.3385009765625, -3.14813232421875, -2.957763671875, -2.76739501953125, -2.5770263671875, -2.38665771484375, -2.1962890625, -2.00592041015625, -1.8155517578125, -1.62518310546875, -1.434814453125, -1.24444580078125, -1.0540771484375, -0.86370849609375, -0.67333984375, -0.48297119140625, -0.2926025390625, -0.10223388671875, 0.088134765625, 0.27850341796875, 0.4688720703125, 0.65924072265625, 0.849609375, 1.03997802734375, 1.2303466796875, 1.42071533203125, 1.611083984375, 1.80145263671875, 1.9918212890625, 2.18218994140625, 2.37255859375, 2.56292724609375, 2.7532958984375, 2.94366455078125, 3.134033203125, 3.32440185546875, 3.5147705078125, 3.70513916015625, 3.8955078125, 4.08587646484375, 4.2762451171875, 4.46661376953125, 4.656982421875, 4.84735107421875, 5.0377197265625, 5.22808837890625, 5.41845703125, 5.60882568359375, 5.7991943359375, 5.98956298828125, 6.179931640625, 6.37030029296875, 6.5606689453125, 6.75103759765625, 6.94140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 8.0, 4.0, 7.0, 12.0, 15.0, 23.0, 28.0, 28.0, 51.0, 53.0, 99.0, 120.0, 161.0, 248.0, 434.0, 619.0, 669.0, 509.0, 314.0, 198.0, 117.0, 86.0, 71.0, 36.0, 49.0, 29.0, 11.0, 16.0, 18.0, 11.0, 6.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.50384521484375, -5.2850341796875, -5.06622314453125, -4.847412109375, -4.62860107421875, -4.4097900390625, -4.19097900390625, -3.97216796875, -3.75335693359375, -3.5345458984375, -3.31573486328125, -3.096923828125, -2.87811279296875, -2.6593017578125, -2.44049072265625, -2.2216796875, -2.00286865234375, -1.7840576171875, -1.56524658203125, -1.346435546875, -1.12762451171875, -0.9088134765625, -0.69000244140625, -0.47119140625, -0.25238037109375, -0.0335693359375, 0.18524169921875, 0.404052734375, 0.62286376953125, 0.8416748046875, 1.06048583984375, 1.279296875, 1.49810791015625, 1.7169189453125, 1.93572998046875, 2.154541015625, 2.37335205078125, 2.5921630859375, 2.81097412109375, 3.02978515625, 3.24859619140625, 3.4674072265625, 3.68621826171875, 3.905029296875, 4.12384033203125, 4.3426513671875, 4.56146240234375, 4.7802734375, 4.99908447265625, 5.2178955078125, 5.43670654296875, 5.655517578125, 5.87432861328125, 6.0931396484375, 6.31195068359375, 6.53076171875, 6.74957275390625, 6.9683837890625, 7.18719482421875, 7.406005859375, 7.62481689453125, 7.8436279296875, 8.06243896484375, 8.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 14.0, 19.0, 21.0, 29.0, 38.0, 83.0, 88.0, 133.0, 257.0, 625.0, 2119.0, 11889.0, 140730.0, 3681257.0, 331721.0, 20339.0, 3182.0, 866.0, 318.0, 182.0, 103.0, 67.0, 46.0, 41.0, 25.0, 20.0, 12.0, 10.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.859375, -23.24169921875, -22.6240234375, -22.00634765625, -21.388671875, -20.77099609375, -20.1533203125, -19.53564453125, -18.91796875, -18.30029296875, -17.6826171875, -17.06494140625, -16.447265625, -15.82958984375, -15.2119140625, -14.59423828125, -13.9765625, -13.35888671875, -12.7412109375, -12.12353515625, -11.505859375, -10.88818359375, -10.2705078125, -9.65283203125, -9.03515625, -8.41748046875, -7.7998046875, -7.18212890625, -6.564453125, -5.94677734375, -5.3291015625, -4.71142578125, -4.09375, -3.47607421875, -2.8583984375, -2.24072265625, -1.623046875, -1.00537109375, -0.3876953125, 0.22998046875, 0.84765625, 1.46533203125, 2.0830078125, 2.70068359375, 3.318359375, 3.93603515625, 4.5537109375, 5.17138671875, 5.7890625, 6.40673828125, 7.0244140625, 7.64208984375, 8.259765625, 8.87744140625, 9.4951171875, 10.11279296875, 10.73046875, 11.34814453125, 11.9658203125, 12.58349609375, 13.201171875, 13.81884765625, 14.4365234375, 15.05419921875, 15.671875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 37.0, 91.0, 166.0, 242.0, 235.0, 120.0, 71.0, 26.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.61666488647461, -52.90502166748047, -51.19337463378906, -49.48173141479492, -47.770084381103516, -46.058441162109375, -44.34679412841797, -42.63515090942383, -40.92350387573242, -39.21186065673828, -37.500213623046875, -35.788570404052734, -34.07692337036133, -32.36528015136719, -30.65363311767578, -28.94198989868164, -27.230344772338867, -25.518699645996094, -23.80705451965332, -22.095409393310547, -20.383764266967773, -18.672119140625, -16.96047592163086, -15.24882984161377, -13.537184715270996, -11.825539588928223, -10.11389446258545, -8.402250289916992, -6.6906046867370605, -4.978960037231445, -3.267314910888672, -1.5556697845458984, 0.155975341796875, 1.8676203489303589, 3.5792653560638428, 5.290910243988037, 7.0025553703308105, 8.714200019836426, 10.4258451461792, 12.137490272521973, 13.849135398864746, 15.56078052520752, 17.272424697875977, 18.98406982421875, 20.695714950561523, 22.407360076904297, 24.11900520324707, 25.830650329589844, 27.542295455932617, 29.25394058227539, 30.965585708618164, 32.67723083496094, 34.38887405395508, 36.100521087646484, 37.812164306640625, 39.52381134033203, 41.23545455932617, 42.94709777832031, 44.65874481201172, 46.37038803100586, 48.082035064697266, 49.793678283691406, 51.50532531738281, 53.21696853637695, 54.92861557006836]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 2.0, 5.0, 6.0, 12.0, 9.0, 11.0, 18.0, 19.0, 19.0, 22.0, 31.0, 30.0, 30.0, 32.0, 44.0, 41.0, 51.0, 38.0, 45.0, 55.0, 39.0, 41.0, 40.0, 44.0, 30.0, 44.0, 42.0, 29.0, 31.0, 31.0, 21.0, 14.0, 16.0, 11.0, 8.0, 7.0, 8.0, 2.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.89798927307129, -25.143157958984375, -24.388328552246094, -23.63349723815918, -22.878665924072266, -22.123836517333984, -21.36900520324707, -20.614173889160156, -19.859344482421875, -19.10451316833496, -18.34968376159668, -17.594852447509766, -16.840023040771484, -16.08519172668457, -15.330360412597656, -14.575530052185059, -13.820699691772461, -13.065869331359863, -12.311038970947266, -11.556207656860352, -10.801377296447754, -10.046546936035156, -9.291715621948242, -8.536885261535645, -7.782054901123047, -7.027224540710449, -6.272393703460693, -5.5175628662109375, -4.76273250579834, -4.007902145385742, -3.2530713081359863, -2.4982404708862305, -1.743408203125, -0.9885776042938232, -0.23374700546264648, 0.5210835933685303, 1.275914192199707, 2.030744791030884, 2.7855753898620605, 3.5404062271118164, 4.295236587524414, 5.050066947937012, 5.804897785186768, 6.559728622436523, 7.314558982849121, 8.069389343261719, 8.824220657348633, 9.57905101776123, 10.333881378173828, 11.088711738586426, 11.843542098999023, 12.598373413085938, 13.353203773498535, 14.108034133911133, 14.862865447998047, 15.617695808410645, 16.372526168823242, 17.127357482910156, 17.882186889648438, 18.63701820373535, 19.391849517822266, 20.146678924560547, 20.90151023864746, 21.656341552734375, 22.411170959472656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 4.0, 10.0, 10.0, 4.0, 8.0, 15.0, 10.0, 14.0, 26.0, 26.0, 28.0, 23.0, 23.0, 26.0, 50.0, 39.0, 35.0, 34.0, 32.0, 40.0, 31.0, 44.0, 44.0, 42.0, 39.0, 45.0, 34.0, 36.0, 28.0, 29.0, 25.0, 21.0, 14.0, 18.0, 9.0, 12.0, 10.0, 13.0, 7.0, 12.0, 2.0, 4.0, 4.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.318359375, -3.210540771484375, -3.10272216796875, -2.994903564453125, -2.8870849609375, -2.779266357421875, -2.67144775390625, -2.563629150390625, -2.455810546875, -2.347991943359375, -2.24017333984375, -2.132354736328125, -2.0245361328125, -1.916717529296875, -1.80889892578125, -1.701080322265625, -1.59326171875, -1.485443115234375, -1.37762451171875, -1.269805908203125, -1.1619873046875, -1.054168701171875, -0.94635009765625, -0.838531494140625, -0.730712890625, -0.622894287109375, -0.51507568359375, -0.407257080078125, -0.2994384765625, -0.191619873046875, -0.08380126953125, 0.024017333984375, 0.1318359375, 0.239654541015625, 0.34747314453125, 0.455291748046875, 0.5631103515625, 0.670928955078125, 0.77874755859375, 0.886566162109375, 0.994384765625, 1.102203369140625, 1.21002197265625, 1.317840576171875, 1.4256591796875, 1.533477783203125, 1.64129638671875, 1.749114990234375, 1.85693359375, 1.964752197265625, 2.07257080078125, 2.180389404296875, 2.2882080078125, 2.396026611328125, 2.50384521484375, 2.611663818359375, 2.719482421875, 2.827301025390625, 2.93511962890625, 3.042938232421875, 3.1507568359375, 3.258575439453125, 3.36639404296875, 3.474212646484375, 3.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 10.0, 12.0, 10.0, 21.0, 21.0, 26.0, 46.0, 56.0, 74.0, 101.0, 138.0, 187.0, 272.0, 395.0, 556.0, 863.0, 1339.0, 1961.0, 3167.0, 5679.0, 10921.0, 26002.0, 325245.0, 610730.0, 32172.0, 12172.0, 6365.0, 3625.0, 2056.0, 1323.0, 930.0, 568.0, 444.0, 314.0, 204.0, 149.0, 122.0, 92.0, 47.0, 29.0, 36.0, 18.0, 20.0, 7.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6015625, -4.466552734375, -4.33154296875, -4.196533203125, -4.0615234375, -3.926513671875, -3.79150390625, -3.656494140625, -3.521484375, -3.386474609375, -3.25146484375, -3.116455078125, -2.9814453125, -2.846435546875, -2.71142578125, -2.576416015625, -2.44140625, -2.306396484375, -2.17138671875, -2.036376953125, -1.9013671875, -1.766357421875, -1.63134765625, -1.496337890625, -1.361328125, -1.226318359375, -1.09130859375, -0.956298828125, -0.8212890625, -0.686279296875, -0.55126953125, -0.416259765625, -0.28125, -0.146240234375, -0.01123046875, 0.123779296875, 0.2587890625, 0.393798828125, 0.52880859375, 0.663818359375, 0.798828125, 0.933837890625, 1.06884765625, 1.203857421875, 1.3388671875, 1.473876953125, 1.60888671875, 1.743896484375, 1.87890625, 2.013916015625, 2.14892578125, 2.283935546875, 2.4189453125, 2.553955078125, 2.68896484375, 2.823974609375, 2.958984375, 3.093994140625, 3.22900390625, 3.364013671875, 3.4990234375, 3.634033203125, 3.76904296875, 3.904052734375, 4.0390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 11.0, 5.0, 11.0, 10.0, 17.0, 12.0, 17.0, 15.0, 21.0, 25.0, 23.0, 34.0, 40.0, 33.0, 37.0, 27.0, 41.0, 49.0, 41.0, 44.0, 1068.0, 41.0, 45.0, 41.0, 36.0, 36.0, 34.0, 23.0, 18.0, 15.0, 21.0, 24.0, 14.0, 17.0, 13.0, 14.0, 8.0, 4.0, 10.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.365234375, -2.287109375, -2.208984375, -2.130859375, -2.052734375, -1.974609375, -1.896484375, -1.818359375, -1.740234375, -1.662109375, -1.583984375, -1.505859375, -1.427734375, -1.349609375, -1.271484375, -1.193359375, -1.115234375, -1.037109375, -0.958984375, -0.880859375, -0.802734375, -0.724609375, -0.646484375, -0.568359375, -0.490234375, -0.412109375, -0.333984375, -0.255859375, -0.177734375, -0.099609375, -0.021484375, 0.056640625, 0.134765625, 0.212890625, 0.291015625, 0.369140625, 0.447265625, 0.525390625, 0.603515625, 0.681640625, 0.759765625, 0.837890625, 0.916015625, 0.994140625, 1.072265625, 1.150390625, 1.228515625, 1.306640625, 1.384765625, 1.462890625, 1.541015625, 1.619140625, 1.697265625, 1.775390625, 1.853515625, 1.931640625, 2.009765625, 2.087890625, 2.166015625, 2.244140625, 2.322265625, 2.400390625, 2.478515625, 2.556640625, 2.634765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 14.0, 7.0, 10.0, 24.0, 22.0, 23.0, 41.0, 53.0, 68.0, 84.0, 105.0, 147.0, 191.0, 282.0, 418.0, 560.0, 866.0, 1394.0, 2218.0, 3776.0, 6980.0, 16241.0, 58201.0, 1621715.0, 325566.0, 32290.0, 11571.0, 5611.0, 2983.0, 1883.0, 1165.0, 724.0, 514.0, 355.0, 250.0, 188.0, 131.0, 107.0, 76.0, 55.0, 45.0, 34.0, 28.0, 16.0, 13.0, 14.0, 14.0, 15.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.0078125, -1.9447021484375, -1.881591796875, -1.8184814453125, -1.75537109375, -1.6922607421875, -1.629150390625, -1.5660400390625, -1.5029296875, -1.4398193359375, -1.376708984375, -1.3135986328125, -1.25048828125, -1.1873779296875, -1.124267578125, -1.0611572265625, -0.998046875, -0.9349365234375, -0.871826171875, -0.8087158203125, -0.74560546875, -0.6824951171875, -0.619384765625, -0.5562744140625, -0.4931640625, -0.4300537109375, -0.366943359375, -0.3038330078125, -0.24072265625, -0.1776123046875, -0.114501953125, -0.0513916015625, 0.01171875, 0.0748291015625, 0.137939453125, 0.2010498046875, 0.26416015625, 0.3272705078125, 0.390380859375, 0.4534912109375, 0.5166015625, 0.5797119140625, 0.642822265625, 0.7059326171875, 0.76904296875, 0.8321533203125, 0.895263671875, 0.9583740234375, 1.021484375, 1.0845947265625, 1.147705078125, 1.2108154296875, 1.27392578125, 1.3370361328125, 1.400146484375, 1.4632568359375, 1.5263671875, 1.5894775390625, 1.652587890625, 1.7156982421875, 1.77880859375, 1.8419189453125, 1.905029296875, 1.9681396484375, 2.03125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 12.0, 20.0, 16.0, 54.0, 188.0, 469.0, 84.0, 41.0, 18.0, 16.0, 9.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.485107421875, -0.4709625244140625, -0.456817626953125, -0.4426727294921875, -0.42852783203125, -0.4143829345703125, -0.400238037109375, -0.3860931396484375, -0.3719482421875, -0.3578033447265625, -0.343658447265625, -0.3295135498046875, -0.31536865234375, -0.3012237548828125, -0.287078857421875, -0.2729339599609375, -0.2587890625, -0.2446441650390625, -0.230499267578125, -0.2163543701171875, -0.20220947265625, -0.1880645751953125, -0.173919677734375, -0.1597747802734375, -0.1456298828125, -0.1314849853515625, -0.117340087890625, -0.1031951904296875, -0.08905029296875, -0.0749053955078125, -0.060760498046875, -0.0466156005859375, -0.032470703125, -0.0183258056640625, -0.004180908203125, 0.0099639892578125, 0.02410888671875, 0.0382537841796875, 0.052398681640625, 0.0665435791015625, 0.0806884765625, 0.0948333740234375, 0.108978271484375, 0.1231231689453125, 0.13726806640625, 0.1514129638671875, 0.165557861328125, 0.1797027587890625, 0.19384765625, 0.2079925537109375, 0.222137451171875, 0.2362823486328125, 0.25042724609375, 0.2645721435546875, 0.278717041015625, 0.2928619384765625, 0.3070068359375, 0.3211517333984375, 0.335296630859375, 0.3494415283203125, 0.36358642578125, 0.3777313232421875, 0.391876220703125, 0.4060211181640625, 0.420166015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 20.0, 36.0, 52.0, 121.0, 746.0, 41394.0, 1004242.0, 1498.0, 172.0, 63.0, 56.0, 25.0, 24.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 1.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-9.9765625, -9.6453857421875, -9.314208984375, -8.9830322265625, -8.65185546875, -8.3206787109375, -7.989501953125, -7.6583251953125, -7.3271484375, -6.9959716796875, -6.664794921875, -6.3336181640625, -6.00244140625, -5.6712646484375, -5.340087890625, -5.0089111328125, -4.677734375, -4.3465576171875, -4.015380859375, -3.6842041015625, -3.35302734375, -3.0218505859375, -2.690673828125, -2.3594970703125, -2.0283203125, -1.6971435546875, -1.365966796875, -1.0347900390625, -0.70361328125, -0.3724365234375, -0.041259765625, 0.2899169921875, 0.62109375, 0.9522705078125, 1.283447265625, 1.6146240234375, 1.94580078125, 2.2769775390625, 2.608154296875, 2.9393310546875, 3.2705078125, 3.6016845703125, 3.932861328125, 4.2640380859375, 4.59521484375, 4.9263916015625, 5.257568359375, 5.5887451171875, 5.919921875, 6.2510986328125, 6.582275390625, 6.9134521484375, 7.24462890625, 7.5758056640625, 7.906982421875, 8.2381591796875, 8.5693359375, 8.9005126953125, 9.231689453125, 9.5628662109375, 9.89404296875, 10.2252197265625, 10.556396484375, 10.8875732421875, 11.21875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 25.0, 60.0, 208.0, 361.0, 210.0, 84.0, 28.0, 15.0, 14.0, 4.0], "bins": [-1.8845131397247314, -1.8517507314682007, -1.81898832321167, -1.7862260341644287, -1.753463625907898, -1.7207012176513672, -1.6879388093948364, -1.6551764011383057, -1.6224141120910645, -1.5896517038345337, -1.556889295578003, -1.5241270065307617, -1.491364598274231, -1.4586021900177002, -1.4258397817611694, -1.3930773735046387, -1.3603150844573975, -1.3275526762008667, -1.294790267944336, -1.2620279788970947, -1.229265570640564, -1.1965031623840332, -1.1637407541275024, -1.1309783458709717, -1.098215937614441, -1.0654535293579102, -1.0326911211013794, -0.9999287724494934, -0.9671664237976074, -0.9344040155410767, -0.9016416072845459, -0.8688792586326599, -0.8361169099807739, -0.8033545017242432, -0.7705921530723572, -0.7378297448158264, -0.7050673961639404, -0.6723049879074097, -0.6395425796508789, -0.6067802309989929, -0.5740178823471069, -0.5412554740905762, -0.5084931254386902, -0.4757307171821594, -0.44296836853027344, -0.4102059602737427, -0.3774435818195343, -0.3446812033653259, -0.31191879510879517, -0.2791564166545868, -0.24639403820037842, -0.21363164484500885, -0.18086926639080048, -0.1481068879365921, -0.11534449458122253, -0.08258211612701416, -0.04981975257396698, -0.017057370394468307, 0.015705011785030365, 0.048467397689819336, 0.08122977614402771, 0.11399215459823608, 0.14675454795360565, 0.17951692640781403, 0.2122793048620224]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 14.0, 1.0, 16.0, 11.0, 16.0, 24.0, 17.0, 23.0, 28.0, 23.0, 23.0, 31.0, 37.0, 32.0, 29.0, 39.0, 28.0, 36.0, 28.0, 30.0, 45.0, 43.0, 42.0, 36.0, 29.0, 30.0, 28.0, 25.0, 24.0, 21.0, 22.0, 21.0, 17.0, 13.0, 11.0, 13.0, 13.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.29606109857559204, -0.2868116796016693, -0.2775622308254242, -0.26831281185150146, -0.25906336307525635, -0.24981392920017242, -0.2405644953250885, -0.23131507635116577, -0.22206562757492065, -0.21281619369983673, -0.2035667598247528, -0.19431732594966888, -0.18506789207458496, -0.17581845819950104, -0.16656902432441711, -0.15731960535049438, -0.14807017147541046, -0.13882073760032654, -0.12957130372524261, -0.12032186985015869, -0.11107243597507477, -0.10182300209999084, -0.09257357567548752, -0.0833241418004036, -0.07407470792531967, -0.06482527405023575, -0.055575840175151825, -0.0463264100253582, -0.03707697615027428, -0.027827542275190353, -0.01857811212539673, -0.009328678250312805, -7.924437522888184e-05, 0.009170188568532467, 0.018419621512293816, 0.02766905352473259, 0.03691848739981651, 0.046167921274900436, 0.05541735142469406, 0.06466678529977798, 0.07391621917486191, 0.08316565304994583, 0.09241508692502975, 0.10166451334953308, 0.110913947224617, 0.12016338109970093, 0.12941281497478485, 0.13866224884986877, 0.1479116827249527, 0.15716111660003662, 0.16641055047512054, 0.17565998435020447, 0.1849094182252884, 0.19415885210037231, 0.20340827107429504, 0.21265771985054016, 0.2219071388244629, 0.23115657269954681, 0.24040600657463074, 0.24965544044971466, 0.2589048743247986, 0.2681542932987213, 0.27740374207496643, 0.28665316104888916, 0.2959026098251343]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 12.0, 9.0, 6.0, 14.0, 7.0, 23.0, 21.0, 21.0, 24.0, 36.0, 20.0, 24.0, 39.0, 31.0, 38.0, 39.0, 36.0, 36.0, 38.0, 48.0, 40.0, 41.0, 35.0, 39.0, 43.0, 23.0, 29.0, 22.0, 23.0, 29.0, 19.0, 13.0, 14.0, 12.0, 15.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.453125, -3.34478759765625, -3.2364501953125, -3.12811279296875, -3.019775390625, -2.91143798828125, -2.8031005859375, -2.69476318359375, -2.58642578125, -2.47808837890625, -2.3697509765625, -2.26141357421875, -2.153076171875, -2.04473876953125, -1.9364013671875, -1.82806396484375, -1.7197265625, -1.61138916015625, -1.5030517578125, -1.39471435546875, -1.286376953125, -1.17803955078125, -1.0697021484375, -0.96136474609375, -0.85302734375, -0.74468994140625, -0.6363525390625, -0.52801513671875, -0.419677734375, -0.31134033203125, -0.2030029296875, -0.09466552734375, 0.013671875, 0.12200927734375, 0.2303466796875, 0.33868408203125, 0.447021484375, 0.55535888671875, 0.6636962890625, 0.77203369140625, 0.88037109375, 0.98870849609375, 1.0970458984375, 1.20538330078125, 1.313720703125, 1.42205810546875, 1.5303955078125, 1.63873291015625, 1.7470703125, 1.85540771484375, 1.9637451171875, 2.07208251953125, 2.180419921875, 2.28875732421875, 2.3970947265625, 2.50543212890625, 2.61376953125, 2.72210693359375, 2.8304443359375, 2.93878173828125, 3.047119140625, 3.15545654296875, 3.2637939453125, 3.37213134765625, 3.48046875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 10.0, 14.0, 11.0, 25.0, 29.0, 32.0, 54.0, 84.0, 125.0, 196.0, 353.0, 525.0, 837.0, 1493.0, 2437.0, 4392.0, 8184.0, 15934.0, 35915.0, 147168.0, 659841.0, 108590.0, 31004.0, 14077.0, 7207.0, 4005.0, 2367.0, 1430.0, 810.0, 488.0, 317.0, 197.0, 124.0, 78.0, 59.0, 43.0, 24.0, 11.0, 7.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.60546875, -7.384521484375, -7.16357421875, -6.942626953125, -6.7216796875, -6.500732421875, -6.27978515625, -6.058837890625, -5.837890625, -5.616943359375, -5.39599609375, -5.175048828125, -4.9541015625, -4.733154296875, -4.51220703125, -4.291259765625, -4.0703125, -3.849365234375, -3.62841796875, -3.407470703125, -3.1865234375, -2.965576171875, -2.74462890625, -2.523681640625, -2.302734375, -2.081787109375, -1.86083984375, -1.639892578125, -1.4189453125, -1.197998046875, -0.97705078125, -0.756103515625, -0.53515625, -0.314208984375, -0.09326171875, 0.127685546875, 0.3486328125, 0.569580078125, 0.79052734375, 1.011474609375, 1.232421875, 1.453369140625, 1.67431640625, 1.895263671875, 2.1162109375, 2.337158203125, 2.55810546875, 2.779052734375, 3.0, 3.220947265625, 3.44189453125, 3.662841796875, 3.8837890625, 4.104736328125, 4.32568359375, 4.546630859375, 4.767578125, 4.988525390625, 5.20947265625, 5.430419921875, 5.6513671875, 5.872314453125, 6.09326171875, 6.314208984375, 6.53515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 7.0, 9.0, 10.0, 16.0, 15.0, 14.0, 29.0, 25.0, 27.0, 27.0, 36.0, 42.0, 51.0, 52.0, 88.0, 111.0, 257.0, 1569.0, 170.0, 67.0, 59.0, 59.0, 41.0, 29.0, 37.0, 19.0, 23.0, 34.0, 25.0, 14.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0390625, -10.6748046875, -10.310546875, -9.9462890625, -9.58203125, -9.2177734375, -8.853515625, -8.4892578125, -8.125, -7.7607421875, -7.396484375, -7.0322265625, -6.66796875, -6.3037109375, -5.939453125, -5.5751953125, -5.2109375, -4.8466796875, -4.482421875, -4.1181640625, -3.75390625, -3.3896484375, -3.025390625, -2.6611328125, -2.296875, -1.9326171875, -1.568359375, -1.2041015625, -0.83984375, -0.4755859375, -0.111328125, 0.2529296875, 0.6171875, 0.9814453125, 1.345703125, 1.7099609375, 2.07421875, 2.4384765625, 2.802734375, 3.1669921875, 3.53125, 3.8955078125, 4.259765625, 4.6240234375, 4.98828125, 5.3525390625, 5.716796875, 6.0810546875, 6.4453125, 6.8095703125, 7.173828125, 7.5380859375, 7.90234375, 8.2666015625, 8.630859375, 8.9951171875, 9.359375, 9.7236328125, 10.087890625, 10.4521484375, 10.81640625, 11.1806640625, 11.544921875, 11.9091796875, 12.2734375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 7.0, 9.0, 17.0, 17.0, 32.0, 37.0, 51.0, 86.0, 92.0, 186.0, 372.0, 929.0, 3016.0, 15479.0, 233159.0, 2831181.0, 51387.0, 6663.0, 1592.0, 619.0, 268.0, 140.0, 76.0, 84.0, 43.0, 45.0, 27.0, 17.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.468017578125, -17.85791015625, -17.247802734375, -16.6376953125, -16.027587890625, -15.41748046875, -14.807373046875, -14.197265625, -13.587158203125, -12.97705078125, -12.366943359375, -11.7568359375, -11.146728515625, -10.53662109375, -9.926513671875, -9.31640625, -8.706298828125, -8.09619140625, -7.486083984375, -6.8759765625, -6.265869140625, -5.65576171875, -5.045654296875, -4.435546875, -3.825439453125, -3.21533203125, -2.605224609375, -1.9951171875, -1.385009765625, -0.77490234375, -0.164794921875, 0.4453125, 1.055419921875, 1.66552734375, 2.275634765625, 2.8857421875, 3.495849609375, 4.10595703125, 4.716064453125, 5.326171875, 5.936279296875, 6.54638671875, 7.156494140625, 7.7666015625, 8.376708984375, 8.98681640625, 9.596923828125, 10.20703125, 10.817138671875, 11.42724609375, 12.037353515625, 12.6474609375, 13.257568359375, 13.86767578125, 14.477783203125, 15.087890625, 15.697998046875, 16.30810546875, 16.918212890625, 17.5283203125, 18.138427734375, 18.74853515625, 19.358642578125, 19.96875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 21.0, 30.0, 116.0, 254.0, 277.0, 195.0, 74.0, 32.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.020174026489258, -14.71348762512207, -13.406801223754883, -12.100114822387695, -10.793428421020508, -9.48674201965332, -8.180055618286133, -6.873369216918945, -5.566682815551758, -4.25999641418457, -2.953310012817383, -1.6466236114501953, -0.3399372100830078, 0.9667491912841797, 2.273435592651367, 3.5801219940185547, 4.886808395385742, 6.19349479675293, 7.500181198120117, 8.806867599487305, 10.113554000854492, 11.42024040222168, 12.726926803588867, 14.033613204956055, 15.340299606323242, 16.64698600769043, 17.953672409057617, 19.260358810424805, 20.567045211791992, 21.87373161315918, 23.180418014526367, 24.487104415893555, 25.793792724609375, 27.100479125976562, 28.40716552734375, 29.713851928710938, 31.020538330078125, 32.32722473144531, 33.6339111328125, 34.94059753417969, 36.247283935546875, 37.55397033691406, 38.86065673828125, 40.16734313964844, 41.474029541015625, 42.78071594238281, 44.08740234375, 45.39408874511719, 46.700775146484375, 48.00746154785156, 49.31414794921875, 50.62083435058594, 51.927520751953125, 53.23420715332031, 54.5408935546875, 55.84757995605469, 57.154266357421875, 58.46095275878906, 59.76763916015625, 61.07432556152344, 62.381011962890625, 63.68769836425781, 64.994384765625, 66.30107116699219, 67.60775756835938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 4.0, 9.0, 4.0, 8.0, 12.0, 15.0, 26.0, 27.0, 18.0, 29.0, 35.0, 32.0, 29.0, 37.0, 46.0, 48.0, 48.0, 38.0, 43.0, 44.0, 46.0, 41.0, 38.0, 43.0, 28.0, 39.0, 25.0, 23.0, 26.0, 17.0, 18.0, 19.0, 13.0, 15.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.587955474853516, -35.603729248046875, -34.619503021240234, -33.635276794433594, -32.65105056762695, -31.666824340820312, -30.682598114013672, -29.6983699798584, -28.714143753051758, -27.729917526245117, -26.745691299438477, -25.761465072631836, -24.777238845825195, -23.793010711669922, -22.80878448486328, -21.82455825805664, -20.84033203125, -19.85610580444336, -18.87187957763672, -17.887653350830078, -16.903427124023438, -15.91919994354248, -14.93497371673584, -13.950746536254883, -12.966522216796875, -11.982295989990234, -10.998069763183594, -10.013843536376953, -9.029616355895996, -8.045390129089355, -7.061163902282715, -6.076937198638916, -5.092710494995117, -4.108484268188477, -3.1242575645446777, -2.140031337738037, -1.1558048725128174, -0.17157840728759766, 0.812647819519043, 1.7968745231628418, 2.7811007499694824, 3.765327215194702, 4.749553680419922, 5.7337799072265625, 6.718006134033203, 7.702232837677002, 8.686458587646484, 9.670685768127441, 10.654911994934082, 11.639138221740723, 12.623364448547363, 13.60759162902832, 14.591817855834961, 15.576044082641602, 16.560270309448242, 17.544496536254883, 18.528722763061523, 19.512948989868164, 20.497175216674805, 21.481401443481445, 22.465627670288086, 23.44985580444336, 24.43408203125, 25.41830825805664, 26.40253448486328]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 7.0, 11.0, 12.0, 12.0, 17.0, 18.0, 13.0, 14.0, 20.0, 29.0, 25.0, 29.0, 29.0, 26.0, 34.0, 43.0, 42.0, 31.0, 42.0, 41.0, 50.0, 30.0, 45.0, 39.0, 41.0, 32.0, 28.0, 30.0, 33.0, 21.0, 26.0, 12.0, 15.0, 17.0, 10.0, 17.0, 8.0, 5.0, 8.0, 6.0, 8.0, 4.0, 3.0, 10.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.478515625, -3.365692138671875, -3.25286865234375, -3.140045166015625, -3.0272216796875, -2.914398193359375, -2.80157470703125, -2.688751220703125, -2.575927734375, -2.463104248046875, -2.35028076171875, -2.237457275390625, -2.1246337890625, -2.011810302734375, -1.89898681640625, -1.786163330078125, -1.67333984375, -1.560516357421875, -1.44769287109375, -1.334869384765625, -1.2220458984375, -1.109222412109375, -0.99639892578125, -0.883575439453125, -0.770751953125, -0.657928466796875, -0.54510498046875, -0.432281494140625, -0.3194580078125, -0.206634521484375, -0.09381103515625, 0.019012451171875, 0.1318359375, 0.244659423828125, 0.35748291015625, 0.470306396484375, 0.5831298828125, 0.695953369140625, 0.80877685546875, 0.921600341796875, 1.034423828125, 1.147247314453125, 1.26007080078125, 1.372894287109375, 1.4857177734375, 1.598541259765625, 1.71136474609375, 1.824188232421875, 1.93701171875, 2.049835205078125, 2.16265869140625, 2.275482177734375, 2.3883056640625, 2.501129150390625, 2.61395263671875, 2.726776123046875, 2.839599609375, 2.952423095703125, 3.06524658203125, 3.178070068359375, 3.2908935546875, 3.403717041015625, 3.51654052734375, 3.629364013671875, 3.7421875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 6.0, 18.0, 18.0, 27.0, 40.0, 48.0, 85.0, 136.0, 221.0, 366.0, 600.0, 1083.0, 1885.0, 3800.0, 7936.0, 17823.0, 48403.0, 232222.0, 1652444.0, 1876167.0, 261764.0, 52319.0, 18795.0, 8609.0, 4223.0, 2252.0, 1187.0, 670.0, 409.0, 263.0, 174.0, 88.0, 67.0, 43.0, 23.0, 17.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.4761962890625, -6.253173828125, -6.0301513671875, -5.80712890625, -5.5841064453125, -5.361083984375, -5.1380615234375, -4.9150390625, -4.6920166015625, -4.468994140625, -4.2459716796875, -4.02294921875, -3.7999267578125, -3.576904296875, -3.3538818359375, -3.130859375, -2.9078369140625, -2.684814453125, -2.4617919921875, -2.23876953125, -2.0157470703125, -1.792724609375, -1.5697021484375, -1.3466796875, -1.1236572265625, -0.900634765625, -0.6776123046875, -0.45458984375, -0.2315673828125, -0.008544921875, 0.2144775390625, 0.4375, 0.6605224609375, 0.883544921875, 1.1065673828125, 1.32958984375, 1.5526123046875, 1.775634765625, 1.9986572265625, 2.2216796875, 2.4447021484375, 2.667724609375, 2.8907470703125, 3.11376953125, 3.3367919921875, 3.559814453125, 3.7828369140625, 4.005859375, 4.2288818359375, 4.451904296875, 4.6749267578125, 4.89794921875, 5.1209716796875, 5.343994140625, 5.5670166015625, 5.7900390625, 6.0130615234375, 6.236083984375, 6.4591064453125, 6.68212890625, 6.9051513671875, 7.128173828125, 7.3511962890625, 7.57421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 8.0, 5.0, 12.0, 20.0, 17.0, 29.0, 36.0, 52.0, 94.0, 118.0, 157.0, 324.0, 531.0, 765.0, 686.0, 430.0, 257.0, 159.0, 110.0, 67.0, 46.0, 42.0, 27.0, 19.0, 18.0, 10.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.65234375, -7.39569091796875, -7.1390380859375, -6.88238525390625, -6.625732421875, -6.36907958984375, -6.1124267578125, -5.85577392578125, -5.59912109375, -5.34246826171875, -5.0858154296875, -4.82916259765625, -4.572509765625, -4.31585693359375, -4.0592041015625, -3.80255126953125, -3.5458984375, -3.28924560546875, -3.0325927734375, -2.77593994140625, -2.519287109375, -2.26263427734375, -2.0059814453125, -1.74932861328125, -1.49267578125, -1.23602294921875, -0.9793701171875, -0.72271728515625, -0.466064453125, -0.20941162109375, 0.0472412109375, 0.30389404296875, 0.560546875, 0.81719970703125, 1.0738525390625, 1.33050537109375, 1.587158203125, 1.84381103515625, 2.1004638671875, 2.35711669921875, 2.61376953125, 2.87042236328125, 3.1270751953125, 3.38372802734375, 3.640380859375, 3.89703369140625, 4.1536865234375, 4.41033935546875, 4.6669921875, 4.92364501953125, 5.1802978515625, 5.43695068359375, 5.693603515625, 5.95025634765625, 6.2069091796875, 6.46356201171875, 6.72021484375, 6.97686767578125, 7.2335205078125, 7.49017333984375, 7.746826171875, 8.00347900390625, 8.2601318359375, 8.51678466796875, 8.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 60.0, 82.0, 141.0, 278.0, 622.0, 2339.0, 17320.0, 564935.0, 3549130.0, 52812.0, 4631.0, 979.0, 366.0, 193.0, 94.0, 58.0, 34.0, 18.0, 27.0, 13.0, 6.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.390625, -25.618896484375, -24.84716796875, -24.075439453125, -23.3037109375, -22.531982421875, -21.76025390625, -20.988525390625, -20.216796875, -19.445068359375, -18.67333984375, -17.901611328125, -17.1298828125, -16.358154296875, -15.58642578125, -14.814697265625, -14.04296875, -13.271240234375, -12.49951171875, -11.727783203125, -10.9560546875, -10.184326171875, -9.41259765625, -8.640869140625, -7.869140625, -7.097412109375, -6.32568359375, -5.553955078125, -4.7822265625, -4.010498046875, -3.23876953125, -2.467041015625, -1.6953125, -0.923583984375, -0.15185546875, 0.619873046875, 1.3916015625, 2.163330078125, 2.93505859375, 3.706787109375, 4.478515625, 5.250244140625, 6.02197265625, 6.793701171875, 7.5654296875, 8.337158203125, 9.10888671875, 9.880615234375, 10.65234375, 11.424072265625, 12.19580078125, 12.967529296875, 13.7392578125, 14.510986328125, 15.28271484375, 16.054443359375, 16.826171875, 17.597900390625, 18.36962890625, 19.141357421875, 19.9130859375, 20.684814453125, 21.45654296875, 22.228271484375, 23.0]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 59.0, 278.0, 515.0, 128.0, 23.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-216.75743103027344, -212.90518188476562, -209.0529327392578, -205.20069885253906, -201.34844970703125, -197.49620056152344, -193.64395141601562, -189.79171752929688, -185.93946838378906, -182.08721923828125, -178.23497009277344, -174.3827362060547, -170.53048706054688, -166.67823791503906, -162.82598876953125, -158.9737548828125, -155.1215057373047, -151.26925659179688, -147.41700744628906, -143.5647735595703, -139.7125244140625, -135.8602752685547, -132.00802612304688, -128.15579223632812, -124.30353546142578, -120.45128631591797, -116.59904479980469, -112.74679565429688, -108.8945541381836, -105.04230499267578, -101.1900634765625, -97.33781433105469, -93.48558044433594, -89.63333129882812, -85.78108978271484, -81.92884063720703, -78.07659912109375, -74.22434997558594, -70.37210845947266, -66.51985931396484, -62.66761016845703, -58.815364837646484, -54.96311950683594, -51.11087417602539, -47.258628845214844, -43.40637969970703, -39.55413818359375, -35.70188903808594, -31.849647521972656, -27.99740219116211, -24.145156860351562, -20.292911529541016, -16.44066619873047, -12.588418960571289, -8.736173629760742, -4.883928298950195, -1.0316829681396484, 2.8205626010894775, 6.6728081703186035, 10.525053977966309, 14.377299308776855, 18.22954559326172, 22.081790924072266, 25.934036254882812, 29.78628158569336]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 10.0, 14.0, 6.0, 22.0, 18.0, 20.0, 35.0, 28.0, 38.0, 37.0, 40.0, 38.0, 42.0, 42.0, 45.0, 48.0, 53.0, 44.0, 36.0, 44.0, 42.0, 29.0, 40.0, 23.0, 26.0, 26.0, 21.0, 22.0, 21.0, 19.0, 9.0, 6.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.454151153564453, -22.71558380126953, -21.977014541625977, -21.238447189331055, -20.4998779296875, -19.761310577392578, -19.022743225097656, -18.284175872802734, -17.54560661315918, -16.807039260864258, -16.068470001220703, -15.329902648925781, -14.591334342956543, -13.852766036987305, -13.114198684692383, -12.375630378723145, -11.637062072753906, -10.898493766784668, -10.15992546081543, -9.421358108520508, -8.68278980255127, -7.944221496582031, -7.205653667449951, -6.467085838317871, -5.728517532348633, -4.9899492263793945, -4.2513813972473145, -3.5128133296966553, -2.774245262145996, -2.035677194595337, -1.2971091270446777, -0.5585412979125977, 0.18002891540527344, 0.9185969829559326, 1.6571650505065918, 2.395733118057251, 3.13430118560791, 3.8728692531585693, 4.6114373207092285, 5.350005149841309, 6.088573455810547, 6.827141761779785, 7.565709590911865, 8.304277420043945, 9.042845726013184, 9.781414031982422, 10.519981384277344, 11.258549690246582, 11.99711799621582, 12.735686302185059, 13.474254608154297, 14.212821960449219, 14.951390266418457, 15.689958572387695, 16.428525924682617, 17.167095184326172, 17.905662536621094, 18.644229888916016, 19.38279914855957, 20.121366500854492, 20.859935760498047, 21.59850311279297, 22.33707046508789, 23.075637817382812, 23.814207077026367]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 9.0, 10.0, 16.0, 22.0, 14.0, 28.0, 28.0, 27.0, 31.0, 42.0, 36.0, 42.0, 47.0, 45.0, 44.0, 49.0, 41.0, 42.0, 47.0, 40.0, 43.0, 29.0, 31.0, 31.0, 38.0, 28.0, 16.0, 15.0, 16.0, 16.0, 12.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.15234375, -4.02862548828125, -3.9049072265625, -3.78118896484375, -3.657470703125, -3.53375244140625, -3.4100341796875, -3.28631591796875, -3.16259765625, -3.03887939453125, -2.9151611328125, -2.79144287109375, -2.667724609375, -2.54400634765625, -2.4202880859375, -2.29656982421875, -2.1728515625, -2.04913330078125, -1.9254150390625, -1.80169677734375, -1.677978515625, -1.55426025390625, -1.4305419921875, -1.30682373046875, -1.18310546875, -1.05938720703125, -0.9356689453125, -0.81195068359375, -0.688232421875, -0.56451416015625, -0.4407958984375, -0.31707763671875, -0.193359375, -0.06964111328125, 0.0540771484375, 0.17779541015625, 0.301513671875, 0.42523193359375, 0.5489501953125, 0.67266845703125, 0.79638671875, 0.92010498046875, 1.0438232421875, 1.16754150390625, 1.291259765625, 1.41497802734375, 1.5386962890625, 1.66241455078125, 1.7861328125, 1.90985107421875, 2.0335693359375, 2.15728759765625, 2.281005859375, 2.40472412109375, 2.5284423828125, 2.65216064453125, 2.77587890625, 2.89959716796875, 3.0233154296875, 3.14703369140625, 3.270751953125, 3.39447021484375, 3.5181884765625, 3.64190673828125, 3.765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 12.0, 28.0, 37.0, 47.0, 58.0, 101.0, 150.0, 175.0, 236.0, 333.0, 456.0, 658.0, 962.0, 1445.0, 2505.0, 5621.0, 45421.0, 927898.0, 49286.0, 5743.0, 2502.0, 1529.0, 997.0, 656.0, 488.0, 371.0, 224.0, 181.0, 130.0, 99.0, 66.0, 40.0, 33.0, 19.0, 15.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.5400390625, -4.400390625, -4.2607421875, -4.12109375, -3.9814453125, -3.841796875, -3.7021484375, -3.5625, -3.4228515625, -3.283203125, -3.1435546875, -3.00390625, -2.8642578125, -2.724609375, -2.5849609375, -2.4453125, -2.3056640625, -2.166015625, -2.0263671875, -1.88671875, -1.7470703125, -1.607421875, -1.4677734375, -1.328125, -1.1884765625, -1.048828125, -0.9091796875, -0.76953125, -0.6298828125, -0.490234375, -0.3505859375, -0.2109375, -0.0712890625, 0.068359375, 0.2080078125, 0.34765625, 0.4873046875, 0.626953125, 0.7666015625, 0.90625, 1.0458984375, 1.185546875, 1.3251953125, 1.46484375, 1.6044921875, 1.744140625, 1.8837890625, 2.0234375, 2.1630859375, 2.302734375, 2.4423828125, 2.58203125, 2.7216796875, 2.861328125, 3.0009765625, 3.140625, 3.2802734375, 3.419921875, 3.5595703125, 3.69921875, 3.8388671875, 3.978515625, 4.1181640625, 4.2578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 1.0, 12.0, 14.0, 17.0, 10.0, 10.0, 11.0, 18.0, 26.0, 27.0, 17.0, 32.0, 32.0, 43.0, 41.0, 37.0, 31.0, 52.0, 1058.0, 49.0, 42.0, 41.0, 30.0, 35.0, 39.0, 26.0, 36.0, 33.0, 36.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 9.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.66796875, -2.588836669921875, -2.50970458984375, -2.430572509765625, -2.3514404296875, -2.272308349609375, -2.19317626953125, -2.114044189453125, -2.034912109375, -1.955780029296875, -1.87664794921875, -1.797515869140625, -1.7183837890625, -1.639251708984375, -1.56011962890625, -1.480987548828125, -1.40185546875, -1.322723388671875, -1.24359130859375, -1.164459228515625, -1.0853271484375, -1.006195068359375, -0.92706298828125, -0.847930908203125, -0.768798828125, -0.689666748046875, -0.61053466796875, -0.531402587890625, -0.4522705078125, -0.373138427734375, -0.29400634765625, -0.214874267578125, -0.1357421875, -0.056610107421875, 0.02252197265625, 0.101654052734375, 0.1807861328125, 0.259918212890625, 0.33905029296875, 0.418182373046875, 0.497314453125, 0.576446533203125, 0.65557861328125, 0.734710693359375, 0.8138427734375, 0.892974853515625, 0.97210693359375, 1.051239013671875, 1.13037109375, 1.209503173828125, 1.28863525390625, 1.367767333984375, 1.4468994140625, 1.526031494140625, 1.60516357421875, 1.684295654296875, 1.763427734375, 1.842559814453125, 1.92169189453125, 2.000823974609375, 2.0799560546875, 2.159088134765625, 2.23822021484375, 2.317352294921875, 2.396484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 5.0, 9.0, 6.0, 13.0, 19.0, 39.0, 48.0, 63.0, 81.0, 137.0, 185.0, 257.0, 390.0, 578.0, 797.0, 1393.0, 2353.0, 5039.0, 18022.0, 406766.0, 1620585.0, 27345.0, 5955.0, 2713.0, 1430.0, 944.0, 568.0, 416.0, 287.0, 198.0, 163.0, 104.0, 64.0, 42.0, 35.0, 23.0, 20.0, 12.0, 11.0, 6.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.13671875, -2.0758514404296875, -2.014984130859375, -1.9541168212890625, -1.89324951171875, -1.8323822021484375, -1.771514892578125, -1.7106475830078125, -1.6497802734375, -1.5889129638671875, -1.528045654296875, -1.4671783447265625, -1.40631103515625, -1.3454437255859375, -1.284576416015625, -1.2237091064453125, -1.162841796875, -1.1019744873046875, -1.041107177734375, -0.9802398681640625, -0.91937255859375, -0.8585052490234375, -0.797637939453125, -0.7367706298828125, -0.6759033203125, -0.6150360107421875, -0.554168701171875, -0.4933013916015625, -0.43243408203125, -0.3715667724609375, -0.310699462890625, -0.2498321533203125, -0.18896484375, -0.1280975341796875, -0.067230224609375, -0.0063629150390625, 0.05450439453125, 0.1153717041015625, 0.176239013671875, 0.2371063232421875, 0.2979736328125, 0.3588409423828125, 0.419708251953125, 0.4805755615234375, 0.54144287109375, 0.6023101806640625, 0.663177490234375, 0.7240447998046875, 0.784912109375, 0.8457794189453125, 0.906646728515625, 0.9675140380859375, 1.02838134765625, 1.0892486572265625, 1.150115966796875, 1.2109832763671875, 1.2718505859375, 1.3327178955078125, 1.393585205078125, 1.4544525146484375, 1.51531982421875, 1.5761871337890625, 1.637054443359375, 1.6979217529296875, 1.7587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 6.0, 9.0, 18.0, 18.0, 8.0, 20.0, 26.0, 31.0, 48.0, 100.0, 206.0, 168.0, 95.0, 63.0, 43.0, 28.0, 21.0, 14.0, 14.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09587287902832031, -0.09305191040039062, -0.09023094177246094, -0.08740997314453125, -0.08458900451660156, -0.08176803588867188, -0.07894706726074219, -0.0761260986328125, -0.07330513000488281, -0.07048416137695312, -0.06766319274902344, -0.06484222412109375, -0.06202125549316406, -0.059200286865234375, -0.05637931823730469, -0.053558349609375, -0.05073738098144531, -0.047916412353515625, -0.04509544372558594, -0.04227447509765625, -0.03945350646972656, -0.036632537841796875, -0.03381156921386719, -0.0309906005859375, -0.028169631958007812, -0.025348663330078125, -0.022527694702148438, -0.01970672607421875, -0.016885757446289062, -0.014064788818359375, -0.011243820190429688, -0.0084228515625, -0.0056018829345703125, -0.002780914306640625, 4.00543212890625e-05, 0.00286102294921875, 0.0056819915771484375, 0.008502960205078125, 0.011323928833007812, 0.0141448974609375, 0.016965866088867188, 0.019786834716796875, 0.022607803344726562, 0.02542877197265625, 0.028249740600585938, 0.031070709228515625, 0.03389167785644531, 0.036712646484375, 0.03953361511230469, 0.042354583740234375, 0.04517555236816406, 0.04799652099609375, 0.05081748962402344, 0.053638458251953125, 0.05645942687988281, 0.0592803955078125, 0.06210136413574219, 0.06492233276367188, 0.06774330139160156, 0.07056427001953125, 0.07338523864746094, 0.07620620727539062, 0.07902717590332031, 0.08184814453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 14.0, 18.0, 38.0, 49.0, 104.0, 221.0, 1116.0, 1040445.0, 5819.0, 336.0, 124.0, 62.0, 41.0, 26.0, 13.0, 19.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.962249755859375, -1.89129638671875, -1.820343017578125, -1.7493896484375, -1.678436279296875, -1.60748291015625, -1.536529541015625, -1.465576171875, -1.394622802734375, -1.32366943359375, -1.252716064453125, -1.1817626953125, -1.110809326171875, -1.03985595703125, -0.968902587890625, -0.89794921875, -0.826995849609375, -0.75604248046875, -0.685089111328125, -0.6141357421875, -0.543182373046875, -0.47222900390625, -0.401275634765625, -0.330322265625, -0.259368896484375, -0.18841552734375, -0.117462158203125, -0.0465087890625, 0.024444580078125, 0.09539794921875, 0.166351318359375, 0.2373046875, 0.308258056640625, 0.37921142578125, 0.450164794921875, 0.5211181640625, 0.592071533203125, 0.66302490234375, 0.733978271484375, 0.804931640625, 0.875885009765625, 0.94683837890625, 1.017791748046875, 1.0887451171875, 1.159698486328125, 1.23065185546875, 1.301605224609375, 1.37255859375, 1.443511962890625, 1.51446533203125, 1.585418701171875, 1.6563720703125, 1.727325439453125, 1.79827880859375, 1.869232177734375, 1.940185546875, 2.011138916015625, 2.08209228515625, 2.153045654296875, 2.2239990234375, 2.294952392578125, 2.36590576171875, 2.436859130859375, 2.5078125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 6.0, 34.0, 92.0, 325.0, 385.0, 135.0, 28.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06273401528596878, -0.05401284620165825, -0.04529167711734772, -0.036570508033037186, -0.027849338948726654, -0.019128169864416122, -0.01040700078010559, -0.0016858316957950592, 0.007035337388515472, 0.015756506472826004, 0.024477675557136536, 0.03319884464144707, 0.0419200137257576, 0.05064118281006813, 0.05936235189437866, 0.06808352470397949, 0.07680469006299973, 0.08552585542201996, 0.09424702823162079, 0.10296820104122162, 0.11168936640024185, 0.12041053175926208, 0.12913170456886292, 0.13785287737846375, 0.14657405018806458, 0.1552952229976654, 0.16401639580726624, 0.17273755371570587, 0.1814587265253067, 0.19017989933490753, 0.19890105724334717, 0.207622230052948, 0.21634337306022644, 0.22506454586982727, 0.2337857186794281, 0.24250687658786774, 0.2512280344963074, 0.2599492073059082, 0.26867038011550903, 0.27739155292510986, 0.2861127257347107, 0.2948338985443115, 0.30355507135391235, 0.3122762441635132, 0.320997416973114, 0.32971855998039246, 0.3384397327899933, 0.3471609055995941, 0.35588207840919495, 0.3646032512187958, 0.3733244240283966, 0.38204559683799744, 0.3907667398452759, 0.3994879126548767, 0.40820908546447754, 0.41693025827407837, 0.4256514310836792, 0.43437260389328003, 0.44309377670288086, 0.4518149495124817, 0.4605361223220825, 0.46925726532936096, 0.4779784381389618, 0.4866996109485626, 0.49542078375816345]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 11.0, 13.0, 3.0, 13.0, 15.0, 25.0, 11.0, 25.0, 21.0, 33.0, 38.0, 36.0, 39.0, 43.0, 54.0, 33.0, 53.0, 49.0, 47.0, 47.0, 34.0, 37.0, 31.0, 42.0, 34.0, 30.0, 27.0, 23.0, 18.0, 27.0, 16.0, 11.0, 10.0, 8.0, 9.0, 9.0, 9.0, 10.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07050657272338867, -0.06814620643854141, -0.06578584015369415, -0.06342548131942749, -0.06106511503458023, -0.05870474874973297, -0.05634438619017601, -0.05398402363061905, -0.05162365734577179, -0.04926329106092453, -0.04690292850136757, -0.04454256594181061, -0.04218219965696335, -0.03982183337211609, -0.03746147081255913, -0.03510110825300217, -0.03274074196815491, -0.030380377545952797, -0.028020013123750687, -0.025659648701548576, -0.023299284279346466, -0.020938919857144356, -0.018578555434942245, -0.016218191012740135, -0.013857826590538025, -0.011497462168335915, -0.009137097746133804, -0.006776733323931694, -0.004416368901729584, -0.0020560044795274734, 0.00030435994267463684, 0.002664724364876747, 0.005025088787078857, 0.007385453209280968, 0.009745817631483078, 0.012106182053685188, 0.014466546475887299, 0.01682691089808941, 0.01918727532029152, 0.02154763974249363, 0.02390800416469574, 0.02626836858689785, 0.02862873300909996, 0.03098909743130207, 0.03334946185350418, 0.03570982813835144, 0.0380701906979084, 0.04043055325746536, 0.04279091954231262, 0.04515128582715988, 0.04751164838671684, 0.049872010946273804, 0.05223237723112106, 0.05459274351596832, 0.056953106075525284, 0.059313468635082245, 0.061673834919929504, 0.06403420120477676, 0.06639456748962402, 0.06875492632389069, 0.07111529260873795, 0.0734756588935852, 0.07583601772785187, 0.07819638401269913, 0.08055675029754639]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 14.0, 13.0, 12.0, 23.0, 33.0, 22.0, 25.0, 36.0, 30.0, 43.0, 42.0, 39.0, 40.0, 45.0, 34.0, 39.0, 33.0, 44.0, 52.0, 46.0, 38.0, 40.0, 26.0, 27.0, 26.0, 37.0, 20.0, 20.0, 20.0, 10.0, 6.0, 13.0, 10.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.830535888671875, -3.70989990234375, -3.589263916015625, -3.4686279296875, -3.347991943359375, -3.22735595703125, -3.106719970703125, -2.986083984375, -2.865447998046875, -2.74481201171875, -2.624176025390625, -2.5035400390625, -2.382904052734375, -2.26226806640625, -2.141632080078125, -2.02099609375, -1.900360107421875, -1.77972412109375, -1.659088134765625, -1.5384521484375, -1.417816162109375, -1.29718017578125, -1.176544189453125, -1.055908203125, -0.935272216796875, -0.81463623046875, -0.694000244140625, -0.5733642578125, -0.452728271484375, -0.33209228515625, -0.211456298828125, -0.0908203125, 0.029815673828125, 0.15045166015625, 0.271087646484375, 0.3917236328125, 0.512359619140625, 0.63299560546875, 0.753631591796875, 0.874267578125, 0.994903564453125, 1.11553955078125, 1.236175537109375, 1.3568115234375, 1.477447509765625, 1.59808349609375, 1.718719482421875, 1.83935546875, 1.959991455078125, 2.08062744140625, 2.201263427734375, 2.3218994140625, 2.442535400390625, 2.56317138671875, 2.683807373046875, 2.804443359375, 2.925079345703125, 3.04571533203125, 3.166351318359375, 3.2869873046875, 3.407623291015625, 3.52825927734375, 3.648895263671875, 3.76953125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 8.0, 10.0, 14.0, 22.0, 15.0, 36.0, 51.0, 98.0, 182.0, 263.0, 467.0, 814.0, 1392.0, 2553.0, 4555.0, 8625.0, 16743.0, 33556.0, 70581.0, 170923.0, 386490.0, 196624.0, 78662.0, 36677.0, 18382.0, 9366.0, 5042.0, 2701.0, 1507.0, 922.0, 495.0, 293.0, 161.0, 114.0, 70.0, 36.0, 29.0, 19.0, 13.0, 14.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.65234375, -6.45416259765625, -6.2559814453125, -6.05780029296875, -5.859619140625, -5.66143798828125, -5.4632568359375, -5.26507568359375, -5.06689453125, -4.86871337890625, -4.6705322265625, -4.47235107421875, -4.274169921875, -4.07598876953125, -3.8778076171875, -3.67962646484375, -3.4814453125, -3.28326416015625, -3.0850830078125, -2.88690185546875, -2.688720703125, -2.49053955078125, -2.2923583984375, -2.09417724609375, -1.89599609375, -1.69781494140625, -1.4996337890625, -1.30145263671875, -1.103271484375, -0.90509033203125, -0.7069091796875, -0.50872802734375, -0.310546875, -0.11236572265625, 0.0858154296875, 0.28399658203125, 0.482177734375, 0.68035888671875, 0.8785400390625, 1.07672119140625, 1.27490234375, 1.47308349609375, 1.6712646484375, 1.86944580078125, 2.067626953125, 2.26580810546875, 2.4639892578125, 2.66217041015625, 2.8603515625, 3.05853271484375, 3.2567138671875, 3.45489501953125, 3.653076171875, 3.85125732421875, 4.0494384765625, 4.24761962890625, 4.44580078125, 4.64398193359375, 4.8421630859375, 5.04034423828125, 5.238525390625, 5.43670654296875, 5.6348876953125, 5.83306884765625, 6.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 8.0, 11.0, 17.0, 13.0, 19.0, 17.0, 23.0, 31.0, 24.0, 33.0, 45.0, 46.0, 48.0, 56.0, 90.0, 104.0, 169.0, 1367.0, 245.0, 144.0, 91.0, 44.0, 43.0, 36.0, 35.0, 40.0, 25.0, 24.0, 25.0, 23.0, 27.0, 15.0, 19.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 7.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.43505859375, -9.1279296875, -8.82080078125, -8.513671875, -8.20654296875, -7.8994140625, -7.59228515625, -7.28515625, -6.97802734375, -6.6708984375, -6.36376953125, -6.056640625, -5.74951171875, -5.4423828125, -5.13525390625, -4.828125, -4.52099609375, -4.2138671875, -3.90673828125, -3.599609375, -3.29248046875, -2.9853515625, -2.67822265625, -2.37109375, -2.06396484375, -1.7568359375, -1.44970703125, -1.142578125, -0.83544921875, -0.5283203125, -0.22119140625, 0.0859375, 0.39306640625, 0.7001953125, 1.00732421875, 1.314453125, 1.62158203125, 1.9287109375, 2.23583984375, 2.54296875, 2.85009765625, 3.1572265625, 3.46435546875, 3.771484375, 4.07861328125, 4.3857421875, 4.69287109375, 5.0, 5.30712890625, 5.6142578125, 5.92138671875, 6.228515625, 6.53564453125, 6.8427734375, 7.14990234375, 7.45703125, 7.76416015625, 8.0712890625, 8.37841796875, 8.685546875, 8.99267578125, 9.2998046875, 9.60693359375, 9.9140625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 15.0, 9.0, 19.0, 15.0, 36.0, 32.0, 69.0, 112.0, 187.0, 376.0, 701.0, 1793.0, 4835.0, 18409.0, 118770.0, 2476881.0, 465775.0, 43428.0, 9224.0, 2744.0, 1123.0, 513.0, 267.0, 143.0, 71.0, 44.0, 29.0, 22.0, 20.0, 8.0, 7.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.234375, -13.721435546875, -13.20849609375, -12.695556640625, -12.1826171875, -11.669677734375, -11.15673828125, -10.643798828125, -10.130859375, -9.617919921875, -9.10498046875, -8.592041015625, -8.0791015625, -7.566162109375, -7.05322265625, -6.540283203125, -6.02734375, -5.514404296875, -5.00146484375, -4.488525390625, -3.9755859375, -3.462646484375, -2.94970703125, -2.436767578125, -1.923828125, -1.410888671875, -0.89794921875, -0.385009765625, 0.1279296875, 0.640869140625, 1.15380859375, 1.666748046875, 2.1796875, 2.692626953125, 3.20556640625, 3.718505859375, 4.2314453125, 4.744384765625, 5.25732421875, 5.770263671875, 6.283203125, 6.796142578125, 7.30908203125, 7.822021484375, 8.3349609375, 8.847900390625, 9.36083984375, 9.873779296875, 10.38671875, 10.899658203125, 11.41259765625, 11.925537109375, 12.4384765625, 12.951416015625, 13.46435546875, 13.977294921875, 14.490234375, 15.003173828125, 15.51611328125, 16.029052734375, 16.5419921875, 17.054931640625, 17.56787109375, 18.080810546875, 18.59375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 17.0, 205.0, 531.0, 226.0, 30.0, 5.0, 1.0], "bins": [-228.764404296875, -224.92250061035156, -221.08059692382812, -217.23870849609375, -213.3968048095703, -209.55490112304688, -205.71299743652344, -201.87110900878906, -198.02920532226562, -194.1873016357422, -190.34539794921875, -186.50350952148438, -182.66160583496094, -178.8197021484375, -174.97779846191406, -171.1359100341797, -167.29400634765625, -163.4521026611328, -159.61019897460938, -155.768310546875, -151.92640686035156, -148.08450317382812, -144.2425994873047, -140.4007110595703, -136.55880737304688, -132.71690368652344, -128.875, -125.0331039428711, -121.19120788574219, -117.34930419921875, -113.50740814208984, -109.6655044555664, -105.82360076904297, -101.98169708251953, -98.13980102539062, -94.29789733886719, -90.45600128173828, -86.61409759521484, -82.77220153808594, -78.9302978515625, -75.08839416503906, -71.24649047851562, -67.40459442138672, -63.56269454956055, -59.720794677734375, -55.87889099121094, -52.03699493408203, -48.195091247558594, -44.35319519042969, -40.511295318603516, -36.669395446777344, -32.82749557495117, -28.985595703125, -25.143693923950195, -21.301794052124023, -17.45989418029785, -13.617996215820312, -9.77609634399414, -5.9341959953308105, -2.0922956466674805, 1.7496042251586914, 5.59150505065918, 9.433404922485352, 13.275304794311523, 17.117204666137695]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 14.0, 22.0, 15.0, 20.0, 13.0, 28.0, 26.0, 24.0, 35.0, 43.0, 39.0, 40.0, 43.0, 44.0, 37.0, 43.0, 43.0, 42.0, 40.0, 33.0, 31.0, 31.0, 28.0, 37.0, 17.0, 23.0, 30.0, 22.0, 14.0, 21.0, 12.0, 9.0, 11.0, 8.0, 7.0, 5.0, 10.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.797935485839844, -23.97972297668457, -23.161510467529297, -22.343297958374023, -21.52508544921875, -20.706871032714844, -19.888660430908203, -19.070446014404297, -18.252233505249023, -17.43402099609375, -16.615808486938477, -15.797595977783203, -14.979382514953613, -14.16117000579834, -13.342957496643066, -12.524744033813477, -11.70653247833252, -10.888319969177246, -10.070107460021973, -9.251893997192383, -8.43368148803711, -7.615468978881836, -6.7972564697265625, -5.979043483734131, -5.160830974578857, -4.342618465423584, -3.5244054794311523, -2.706192970275879, -1.8879802227020264, -1.0697674751281738, -0.2515549659729004, 0.5666580200195312, 1.3848705291748047, 2.2030832767486572, 3.0212960243225098, 3.839508533477783, 4.657721519470215, 5.475934028625488, 6.294146537780762, 7.112359523773193, 7.930572032928467, 8.748785018920898, 9.566997528076172, 10.385210037231445, 11.203422546386719, 12.021635055541992, 12.839847564697266, 13.658061027526855, 14.476273536682129, 15.294486045837402, 16.112699508666992, 16.930912017822266, 17.74912452697754, 18.567337036132812, 19.385549545288086, 20.20376205444336, 21.021974563598633, 21.840187072753906, 22.65839958190918, 23.476612091064453, 24.294824600219727, 25.113037109375, 25.931251525878906, 26.74946403503418, 27.567676544189453]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 5.0, 9.0, 12.0, 18.0, 12.0, 22.0, 14.0, 29.0, 19.0, 18.0, 33.0, 27.0, 25.0, 28.0, 28.0, 34.0, 33.0, 52.0, 42.0, 43.0, 38.0, 40.0, 44.0, 43.0, 32.0, 32.0, 27.0, 24.0, 32.0, 19.0, 21.0, 17.0, 8.0, 13.0, 18.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-3.341796875, -3.23211669921875, -3.1224365234375, -3.01275634765625, -2.903076171875, -2.79339599609375, -2.6837158203125, -2.57403564453125, -2.46435546875, -2.35467529296875, -2.2449951171875, -2.13531494140625, -2.025634765625, -1.91595458984375, -1.8062744140625, -1.69659423828125, -1.5869140625, -1.47723388671875, -1.3675537109375, -1.25787353515625, -1.148193359375, -1.03851318359375, -0.9288330078125, -0.81915283203125, -0.70947265625, -0.59979248046875, -0.4901123046875, -0.38043212890625, -0.270751953125, -0.16107177734375, -0.0513916015625, 0.05828857421875, 0.16796875, 0.27764892578125, 0.3873291015625, 0.49700927734375, 0.606689453125, 0.71636962890625, 0.8260498046875, 0.93572998046875, 1.04541015625, 1.15509033203125, 1.2647705078125, 1.37445068359375, 1.484130859375, 1.59381103515625, 1.7034912109375, 1.81317138671875, 1.9228515625, 2.03253173828125, 2.1422119140625, 2.25189208984375, 2.361572265625, 2.47125244140625, 2.5809326171875, 2.69061279296875, 2.80029296875, 2.90997314453125, 3.0196533203125, 3.12933349609375, 3.239013671875, 3.34869384765625, 3.4583740234375, 3.56805419921875, 3.677734375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 7.0, 13.0, 15.0, 16.0, 17.0, 25.0, 22.0, 32.0, 41.0, 35.0, 54.0, 55.0, 90.0, 167.0, 326.0, 948.0, 4247.0, 34799.0, 3086677.0, 1042467.0, 19597.0, 3026.0, 742.0, 278.0, 141.0, 85.0, 54.0, 34.0, 50.0, 30.0, 24.0, 20.0, 25.0, 18.0, 10.0, 12.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 2.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.635498046875, -20.91162109375, -20.187744140625, -19.4638671875, -18.739990234375, -18.01611328125, -17.292236328125, -16.568359375, -15.844482421875, -15.12060546875, -14.396728515625, -13.6728515625, -12.948974609375, -12.22509765625, -11.501220703125, -10.77734375, -10.053466796875, -9.32958984375, -8.605712890625, -7.8818359375, -7.157958984375, -6.43408203125, -5.710205078125, -4.986328125, -4.262451171875, -3.53857421875, -2.814697265625, -2.0908203125, -1.366943359375, -0.64306640625, 0.080810546875, 0.8046875, 1.528564453125, 2.25244140625, 2.976318359375, 3.7001953125, 4.424072265625, 5.14794921875, 5.871826171875, 6.595703125, 7.319580078125, 8.04345703125, 8.767333984375, 9.4912109375, 10.215087890625, 10.93896484375, 11.662841796875, 12.38671875, 13.110595703125, 13.83447265625, 14.558349609375, 15.2822265625, 16.006103515625, 16.72998046875, 17.453857421875, 18.177734375, 18.901611328125, 19.62548828125, 20.349365234375, 21.0732421875, 21.797119140625, 22.52099609375, 23.244873046875, 23.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 12.0, 8.0, 19.0, 18.0, 26.0, 31.0, 29.0, 58.0, 66.0, 88.0, 124.0, 202.0, 262.0, 442.0, 581.0, 607.0, 467.0, 271.0, 209.0, 130.0, 100.0, 74.0, 42.0, 48.0, 24.0, 27.0, 18.0, 9.0, 22.0, 10.0, 9.0, 8.0, 4.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.2452392578125, -4.052978515625, -3.8607177734375, -3.66845703125, -3.4761962890625, -3.283935546875, -3.0916748046875, -2.8994140625, -2.7071533203125, -2.514892578125, -2.3226318359375, -2.13037109375, -1.9381103515625, -1.745849609375, -1.5535888671875, -1.361328125, -1.1690673828125, -0.976806640625, -0.7845458984375, -0.59228515625, -0.4000244140625, -0.207763671875, -0.0155029296875, 0.1767578125, 0.3690185546875, 0.561279296875, 0.7535400390625, 0.94580078125, 1.1380615234375, 1.330322265625, 1.5225830078125, 1.71484375, 1.9071044921875, 2.099365234375, 2.2916259765625, 2.48388671875, 2.6761474609375, 2.868408203125, 3.0606689453125, 3.2529296875, 3.4451904296875, 3.637451171875, 3.8297119140625, 4.02197265625, 4.2142333984375, 4.406494140625, 4.5987548828125, 4.791015625, 4.9832763671875, 5.175537109375, 5.3677978515625, 5.56005859375, 5.7523193359375, 5.944580078125, 6.1368408203125, 6.3291015625, 6.5213623046875, 6.713623046875, 6.9058837890625, 7.09814453125, 7.2904052734375, 7.482666015625, 7.6749267578125, 7.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 4.0, 12.0, 13.0, 10.0, 16.0, 26.0, 24.0, 31.0, 37.0, 86.0, 120.0, 223.0, 715.0, 4107.0, 48352.0, 2920003.0, 1185259.0, 30887.0, 3116.0, 617.0, 238.0, 119.0, 58.0, 42.0, 34.0, 20.0, 16.0, 12.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.517333984375, -19.83154296875, -19.145751953125, -18.4599609375, -17.774169921875, -17.08837890625, -16.402587890625, -15.716796875, -15.031005859375, -14.34521484375, -13.659423828125, -12.9736328125, -12.287841796875, -11.60205078125, -10.916259765625, -10.23046875, -9.544677734375, -8.85888671875, -8.173095703125, -7.4873046875, -6.801513671875, -6.11572265625, -5.429931640625, -4.744140625, -4.058349609375, -3.37255859375, -2.686767578125, -2.0009765625, -1.315185546875, -0.62939453125, 0.056396484375, 0.7421875, 1.427978515625, 2.11376953125, 2.799560546875, 3.4853515625, 4.171142578125, 4.85693359375, 5.542724609375, 6.228515625, 6.914306640625, 7.60009765625, 8.285888671875, 8.9716796875, 9.657470703125, 10.34326171875, 11.029052734375, 11.71484375, 12.400634765625, 13.08642578125, 13.772216796875, 14.4580078125, 15.143798828125, 15.82958984375, 16.515380859375, 17.201171875, 17.886962890625, 18.57275390625, 19.258544921875, 19.9443359375, 20.630126953125, 21.31591796875, 22.001708984375, 22.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 17.0, 39.0, 81.0, 181.0, 249.0, 234.0, 123.0, 50.0, 24.0, 12.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.815486907958984, -53.194007873535156, -51.572532653808594, -49.951053619384766, -48.32957458496094, -46.708099365234375, -45.08662033081055, -43.46514129638672, -41.843666076660156, -40.22218704223633, -38.600711822509766, -36.97923278808594, -35.35775375366211, -33.73627471923828, -32.11479949951172, -30.49332046508789, -28.871841430664062, -27.250364303588867, -25.62888526916504, -24.007408142089844, -22.385929107666016, -20.76445198059082, -19.142974853515625, -17.521495819091797, -15.900018692016602, -14.27854061126709, -12.657062530517578, -11.035585403442383, -9.414107322692871, -7.792629241943359, -6.171152114868164, -4.549674034118652, -2.928192138671875, -1.3067142963409424, 0.31476354598999023, 1.9362411499023438, 3.5577192306518555, 5.179197311401367, 6.8006744384765625, 8.422152519226074, 10.043630599975586, 11.665108680725098, 13.28658676147461, 14.908063888549805, 16.529541015625, 18.151020050048828, 19.772497177124023, 21.39397430419922, 23.015453338623047, 24.636930465698242, 26.25840950012207, 27.879886627197266, 29.501365661621094, 31.12284278869629, 32.744319915771484, 34.36579895019531, 35.987274169921875, 37.6087532043457, 39.230228424072266, 40.851707458496094, 42.47318649291992, 44.09466552734375, 45.71614074707031, 47.33761978149414, 48.95909881591797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 8.0, 5.0, 5.0, 7.0, 10.0, 8.0, 15.0, 19.0, 12.0, 15.0, 18.0, 15.0, 18.0, 22.0, 31.0, 28.0, 24.0, 31.0, 27.0, 33.0, 43.0, 25.0, 23.0, 30.0, 47.0, 39.0, 26.0, 47.0, 33.0, 17.0, 44.0, 28.0, 34.0, 31.0, 17.0, 15.0, 20.0, 13.0, 15.0, 19.0, 7.0, 9.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.015356063842773, -16.481029510498047, -15.94670295715332, -15.412375450134277, -14.87804889678955, -14.343722343444824, -13.809394836425781, -13.275068283081055, -12.740741729736328, -12.206415176391602, -11.672088623046875, -11.137761116027832, -10.603434562683105, -10.069108009338379, -9.534780502319336, -9.00045394897461, -8.466127395629883, -7.931800842285156, -7.3974738121032715, -6.863146781921387, -6.32882022857666, -5.794493675231934, -5.260166645050049, -4.725839614868164, -4.1915130615234375, -3.657186269760132, -3.122859477996826, -2.5885326862335205, -2.054205894470215, -1.5198791027069092, -0.9855523109436035, -0.45122551918029785, 0.08310317993164062, 0.6174299716949463, 1.151756763458252, 1.6860835552215576, 2.2204103469848633, 2.754737138748169, 3.2890639305114746, 3.8233907222747803, 4.357717514038086, 4.8920440673828125, 5.426371097564697, 5.960698127746582, 6.495024681091309, 7.029351234436035, 7.56367826461792, 8.098005294799805, 8.632331848144531, 9.166658401489258, 9.700984954833984, 10.235312461853027, 10.769639015197754, 11.30396556854248, 11.838293075561523, 12.37261962890625, 12.906946182250977, 13.441272735595703, 13.97559928894043, 14.509926795959473, 15.0442533493042, 15.578579902648926, 16.11290740966797, 16.647233963012695, 17.181560516357422]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 10.0, 17.0, 13.0, 22.0, 15.0, 17.0, 19.0, 25.0, 27.0, 23.0, 30.0, 40.0, 34.0, 38.0, 40.0, 39.0, 52.0, 42.0, 51.0, 36.0, 35.0, 39.0, 30.0, 31.0, 37.0, 26.0, 27.0, 23.0, 22.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.326690673828125, -3.21002197265625, -3.093353271484375, -2.9766845703125, -2.860015869140625, -2.74334716796875, -2.626678466796875, -2.510009765625, -2.393341064453125, -2.27667236328125, -2.160003662109375, -2.0433349609375, -1.926666259765625, -1.80999755859375, -1.693328857421875, -1.57666015625, -1.459991455078125, -1.34332275390625, -1.226654052734375, -1.1099853515625, -0.993316650390625, -0.87664794921875, -0.759979248046875, -0.643310546875, -0.526641845703125, -0.40997314453125, -0.293304443359375, -0.1766357421875, -0.059967041015625, 0.05670166015625, 0.173370361328125, 0.2900390625, 0.406707763671875, 0.52337646484375, 0.640045166015625, 0.7567138671875, 0.873382568359375, 0.99005126953125, 1.106719970703125, 1.223388671875, 1.340057373046875, 1.45672607421875, 1.573394775390625, 1.6900634765625, 1.806732177734375, 1.92340087890625, 2.040069580078125, 2.15673828125, 2.273406982421875, 2.39007568359375, 2.506744384765625, 2.6234130859375, 2.740081787109375, 2.85675048828125, 2.973419189453125, 3.090087890625, 3.206756591796875, 3.32342529296875, 3.440093994140625, 3.5567626953125, 3.673431396484375, 3.79010009765625, 3.906768798828125, 4.0234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 12.0, 22.0, 24.0, 46.0, 66.0, 92.0, 125.0, 225.0, 312.0, 451.0, 798.0, 1211.0, 2059.0, 3612.0, 6373.0, 12117.0, 23867.0, 48701.0, 105548.0, 228162.0, 297256.0, 167144.0, 75469.0, 35508.0, 17512.0, 9451.0, 4994.0, 2934.0, 1648.0, 990.0, 647.0, 401.0, 233.0, 199.0, 102.0, 75.0, 47.0, 41.0, 29.0, 10.0, 12.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62841796875, -0.6089553833007812, -0.5894927978515625, -0.5700302124023438, -0.550567626953125, -0.5311050415039062, -0.5116424560546875, -0.49217987060546875, -0.47271728515625, -0.45325469970703125, -0.4337921142578125, -0.41432952880859375, -0.394866943359375, -0.37540435791015625, -0.3559417724609375, -0.33647918701171875, -0.3170166015625, -0.29755401611328125, -0.2780914306640625, -0.25862884521484375, -0.239166259765625, -0.21970367431640625, -0.2002410888671875, -0.18077850341796875, -0.16131591796875, -0.14185333251953125, -0.1223907470703125, -0.10292816162109375, -0.083465576171875, -0.06400299072265625, -0.0445404052734375, -0.02507781982421875, -0.005615234375, 0.01384735107421875, 0.0333099365234375, 0.05277252197265625, 0.072235107421875, 0.09169769287109375, 0.1111602783203125, 0.13062286376953125, 0.15008544921875, 0.16954803466796875, 0.1890106201171875, 0.20847320556640625, 0.227935791015625, 0.24739837646484375, 0.2668609619140625, 0.28632354736328125, 0.3057861328125, 0.32524871826171875, 0.3447113037109375, 0.36417388916015625, 0.383636474609375, 0.40309906005859375, 0.4225616455078125, 0.44202423095703125, 0.46148681640625, 0.48094940185546875, 0.5004119873046875, 0.5198745727539062, 0.539337158203125, 0.5587997436523438, 0.5782623291015625, 0.5977249145507812, 0.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 9.0, 5.0, 9.0, 8.0, 14.0, 12.0, 18.0, 17.0, 18.0, 26.0, 30.0, 26.0, 28.0, 35.0, 26.0, 30.0, 45.0, 40.0, 35.0, 43.0, 1068.0, 37.0, 40.0, 44.0, 22.0, 33.0, 34.0, 26.0, 30.0, 31.0, 25.0, 20.0, 21.0, 20.0, 16.0, 14.0, 13.0, 7.0, 9.0, 7.0, 5.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.349609375, -2.27178955078125, -2.1939697265625, -2.11614990234375, -2.038330078125, -1.96051025390625, -1.8826904296875, -1.80487060546875, -1.72705078125, -1.64923095703125, -1.5714111328125, -1.49359130859375, -1.415771484375, -1.33795166015625, -1.2601318359375, -1.18231201171875, -1.1044921875, -1.02667236328125, -0.9488525390625, -0.87103271484375, -0.793212890625, -0.71539306640625, -0.6375732421875, -0.55975341796875, -0.48193359375, -0.40411376953125, -0.3262939453125, -0.24847412109375, -0.170654296875, -0.09283447265625, -0.0150146484375, 0.06280517578125, 0.140625, 0.21844482421875, 0.2962646484375, 0.37408447265625, 0.451904296875, 0.52972412109375, 0.6075439453125, 0.68536376953125, 0.76318359375, 0.84100341796875, 0.9188232421875, 0.99664306640625, 1.074462890625, 1.15228271484375, 1.2301025390625, 1.30792236328125, 1.3857421875, 1.46356201171875, 1.5413818359375, 1.61920166015625, 1.697021484375, 1.77484130859375, 1.8526611328125, 1.93048095703125, 2.00830078125, 2.08612060546875, 2.1639404296875, 2.24176025390625, 2.319580078125, 2.39739990234375, 2.4752197265625, 2.55303955078125, 2.630859375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 14.0, 10.0, 22.0, 52.0, 68.0, 94.0, 150.0, 263.0, 460.0, 875.0, 1841.0, 4058.0, 10031.0, 27741.0, 88276.0, 369074.0, 1330679.0, 182731.0, 51305.0, 17344.0, 6428.0, 2728.0, 1279.0, 659.0, 347.0, 220.0, 115.0, 78.0, 42.0, 28.0, 21.0, 25.0, 15.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.646484375, -0.62762451171875, -0.6087646484375, -0.58990478515625, -0.571044921875, -0.55218505859375, -0.5333251953125, -0.51446533203125, -0.49560546875, -0.47674560546875, -0.4578857421875, -0.43902587890625, -0.420166015625, -0.40130615234375, -0.3824462890625, -0.36358642578125, -0.3447265625, -0.32586669921875, -0.3070068359375, -0.28814697265625, -0.269287109375, -0.25042724609375, -0.2315673828125, -0.21270751953125, -0.19384765625, -0.17498779296875, -0.1561279296875, -0.13726806640625, -0.118408203125, -0.09954833984375, -0.0806884765625, -0.06182861328125, -0.04296875, -0.02410888671875, -0.0052490234375, 0.01361083984375, 0.032470703125, 0.05133056640625, 0.0701904296875, 0.08905029296875, 0.10791015625, 0.12677001953125, 0.1456298828125, 0.16448974609375, 0.183349609375, 0.20220947265625, 0.2210693359375, 0.23992919921875, 0.2587890625, 0.27764892578125, 0.2965087890625, 0.31536865234375, 0.334228515625, 0.35308837890625, 0.3719482421875, 0.39080810546875, 0.40966796875, 0.42852783203125, 0.4473876953125, 0.46624755859375, 0.485107421875, 0.50396728515625, 0.5228271484375, 0.54168701171875, 0.560546875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 13.0, 18.0, 21.0, 27.0, 29.0, 48.0, 72.0, 131.0, 155.0, 140.0, 87.0, 67.0, 33.0, 22.0, 25.0, 14.0, 14.0, 8.0, 15.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10052490234375, -0.09778881072998047, -0.09505271911621094, -0.0923166275024414, -0.08958053588867188, -0.08684444427490234, -0.08410835266113281, -0.08137226104736328, -0.07863616943359375, -0.07590007781982422, -0.07316398620605469, -0.07042789459228516, -0.06769180297851562, -0.0649557113647461, -0.06221961975097656, -0.05948352813720703, -0.0567474365234375, -0.05401134490966797, -0.05127525329589844, -0.048539161682128906, -0.045803070068359375, -0.043066978454589844, -0.04033088684082031, -0.03759479522705078, -0.03485870361328125, -0.03212261199951172, -0.029386520385742188, -0.026650428771972656, -0.023914337158203125, -0.021178245544433594, -0.018442153930664062, -0.01570606231689453, -0.012969970703125, -0.010233879089355469, -0.0074977874755859375, -0.004761695861816406, -0.002025604248046875, 0.0007104873657226562, 0.0034465789794921875, 0.006182670593261719, 0.00891876220703125, 0.011654853820800781, 0.014390945434570312, 0.017127037048339844, 0.019863128662109375, 0.022599220275878906, 0.025335311889648438, 0.02807140350341797, 0.0308074951171875, 0.03354358673095703, 0.03627967834472656, 0.039015769958496094, 0.041751861572265625, 0.044487953186035156, 0.04722404479980469, 0.04996013641357422, 0.05269622802734375, 0.05543231964111328, 0.05816841125488281, 0.060904502868652344, 0.06364059448242188, 0.0663766860961914, 0.06911277770996094, 0.07184886932373047, 0.0745849609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 4.0, 5.0, 8.0, 6.0, 15.0, 16.0, 31.0, 38.0, 68.0, 108.0, 196.0, 487.0, 10561.0, 1032639.0, 3488.0, 399.0, 183.0, 87.0, 65.0, 39.0, 29.0, 21.0, 14.0, 3.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6268157958984375, -1.565155029296875, -1.5034942626953125, -1.44183349609375, -1.3801727294921875, -1.318511962890625, -1.2568511962890625, -1.1951904296875, -1.1335296630859375, -1.071868896484375, -1.0102081298828125, -0.94854736328125, -0.8868865966796875, -0.825225830078125, -0.7635650634765625, -0.701904296875, -0.6402435302734375, -0.578582763671875, -0.5169219970703125, -0.45526123046875, -0.3936004638671875, -0.331939697265625, -0.2702789306640625, -0.2086181640625, -0.1469573974609375, -0.085296630859375, -0.0236358642578125, 0.03802490234375, 0.0996856689453125, 0.161346435546875, 0.2230072021484375, 0.28466796875, 0.3463287353515625, 0.407989501953125, 0.4696502685546875, 0.53131103515625, 0.5929718017578125, 0.654632568359375, 0.7162933349609375, 0.7779541015625, 0.8396148681640625, 0.901275634765625, 0.9629364013671875, 1.02459716796875, 1.0862579345703125, 1.147918701171875, 1.2095794677734375, 1.271240234375, 1.3329010009765625, 1.394561767578125, 1.4562225341796875, 1.51788330078125, 1.5795440673828125, 1.641204833984375, 1.7028656005859375, 1.7645263671875, 1.8261871337890625, 1.887847900390625, 1.9495086669921875, 2.01116943359375, 2.0728302001953125, 2.134490966796875, 2.1961517333984375, 2.2578125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 18.0, 50.0, 127.0, 292.0, 307.0, 139.0, 39.0, 20.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19680680334568024, -0.18978610634803772, -0.1827654093503952, -0.17574471235275269, -0.16872401535511017, -0.16170331835746765, -0.15468262135982513, -0.14766192436218262, -0.1406412273645401, -0.13362053036689758, -0.12659983336925507, -0.11957913637161255, -0.11255843937397003, -0.10553774237632751, -0.098517045378685, -0.09149634838104248, -0.08447565138339996, -0.07745495438575745, -0.07043425738811493, -0.06341356039047241, -0.056392863392829895, -0.04937216639518738, -0.04235146939754486, -0.035330772399902344, -0.028310075402259827, -0.02128937840461731, -0.014268681406974792, -0.007247984409332275, -0.0002272874116897583, 0.006793409585952759, 0.013814106583595276, 0.020834803581237793, 0.027855515480041504, 0.03487621247768402, 0.04189690947532654, 0.048917606472969055, 0.05593830347061157, 0.06295900046825409, 0.0699796974658966, 0.07700039446353912, 0.08402109146118164, 0.09104178845882416, 0.09806248545646667, 0.10508318245410919, 0.11210387945175171, 0.11912457644939423, 0.12614527344703674, 0.13316597044467926, 0.14018666744232178, 0.1472073644399643, 0.1542280614376068, 0.16124875843524933, 0.16826945543289185, 0.17529015243053436, 0.18231084942817688, 0.1893315464258194, 0.19635224342346191, 0.20337294042110443, 0.21039363741874695, 0.21741433441638947, 0.22443503141403198, 0.2314557284116745, 0.23847642540931702, 0.24549712240695953, 0.25251781940460205]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 8.0, 4.0, 14.0, 13.0, 15.0, 19.0, 17.0, 22.0, 27.0, 35.0, 19.0, 16.0, 34.0, 28.0, 39.0, 36.0, 49.0, 29.0, 40.0, 42.0, 43.0, 32.0, 36.0, 32.0, 35.0, 25.0, 30.0, 34.0, 36.0, 38.0, 21.0, 20.0, 9.0, 16.0, 6.0, 17.0, 8.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.05887115001678467, -0.05697086825966835, -0.05507058650255203, -0.053170304745435715, -0.0512700229883194, -0.04936974123120308, -0.04746945947408676, -0.045569177716970444, -0.043668895959854126, -0.04176861420273781, -0.03986833244562149, -0.03796805068850517, -0.036067768931388855, -0.03416748717427254, -0.03226720541715622, -0.0303669236600399, -0.028466641902923584, -0.026566360145807266, -0.02466607838869095, -0.02276579663157463, -0.020865514874458313, -0.018965233117341995, -0.017064951360225677, -0.01516466960310936, -0.013264387845993042, -0.011364106088876724, -0.009463824331760406, -0.007563542574644089, -0.005663260817527771, -0.0037629790604114532, -0.0018626973032951355, 3.758445382118225e-05, 0.0019378662109375, 0.0038381479680538177, 0.0057384297251701355, 0.007638711482286453, 0.009538993239402771, 0.011439274996519089, 0.013339556753635406, 0.015239838510751724, 0.017140120267868042, 0.01904040202498436, 0.020940683782100677, 0.022840965539216995, 0.024741247296333313, 0.02664152905344963, 0.02854181081056595, 0.030442092567682266, 0.032342374324798584, 0.0342426560819149, 0.03614293783903122, 0.03804321959614754, 0.039943501353263855, 0.04184378311038017, 0.04374406486749649, 0.04564434662461281, 0.047544628381729126, 0.049444910138845444, 0.05134519189596176, 0.05324547365307808, 0.0551457554101944, 0.057046037167310715, 0.05894631892442703, 0.06084660068154335, 0.06274688243865967]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 10.0, 10.0, 13.0, 13.0, 15.0, 12.0, 19.0, 28.0, 27.0, 29.0, 25.0, 28.0, 36.0, 40.0, 31.0, 38.0, 53.0, 33.0, 41.0, 36.0, 46.0, 35.0, 40.0, 50.0, 26.0, 28.0, 32.0, 24.0, 21.0, 16.0, 10.0, 17.0, 10.0, 15.0, 9.0, 13.0, 10.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.46484375, -3.351806640625, -3.23876953125, -3.125732421875, -3.0126953125, -2.899658203125, -2.78662109375, -2.673583984375, -2.560546875, -2.447509765625, -2.33447265625, -2.221435546875, -2.1083984375, -1.995361328125, -1.88232421875, -1.769287109375, -1.65625, -1.543212890625, -1.43017578125, -1.317138671875, -1.2041015625, -1.091064453125, -0.97802734375, -0.864990234375, -0.751953125, -0.638916015625, -0.52587890625, -0.412841796875, -0.2998046875, -0.186767578125, -0.07373046875, 0.039306640625, 0.15234375, 0.265380859375, 0.37841796875, 0.491455078125, 0.6044921875, 0.717529296875, 0.83056640625, 0.943603515625, 1.056640625, 1.169677734375, 1.28271484375, 1.395751953125, 1.5087890625, 1.621826171875, 1.73486328125, 1.847900390625, 1.9609375, 2.073974609375, 2.18701171875, 2.300048828125, 2.4130859375, 2.526123046875, 2.63916015625, 2.752197265625, 2.865234375, 2.978271484375, 3.09130859375, 3.204345703125, 3.3173828125, 3.430419921875, 3.54345703125, 3.656494140625, 3.76953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 13.0, 7.0, 22.0, 33.0, 34.0, 46.0, 75.0, 95.0, 143.0, 218.0, 318.0, 459.0, 633.0, 1098.0, 1560.0, 2568.0, 4209.0, 7114.0, 12260.0, 21829.0, 41952.0, 86594.0, 197439.0, 337472.0, 170293.0, 76044.0, 37525.0, 19880.0, 11169.0, 6599.0, 3872.0, 2507.0, 1562.0, 941.0, 663.0, 437.0, 277.0, 200.0, 123.0, 67.0, 71.0, 45.0, 33.0, 15.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.70550537109375, -4.5399169921875, -4.37432861328125, -4.208740234375, -4.04315185546875, -3.8775634765625, -3.71197509765625, -3.54638671875, -3.38079833984375, -3.2152099609375, -3.04962158203125, -2.884033203125, -2.71844482421875, -2.5528564453125, -2.38726806640625, -2.2216796875, -2.05609130859375, -1.8905029296875, -1.72491455078125, -1.559326171875, -1.39373779296875, -1.2281494140625, -1.06256103515625, -0.89697265625, -0.73138427734375, -0.5657958984375, -0.40020751953125, -0.234619140625, -0.06903076171875, 0.0965576171875, 0.26214599609375, 0.427734375, 0.59332275390625, 0.7589111328125, 0.92449951171875, 1.090087890625, 1.25567626953125, 1.4212646484375, 1.58685302734375, 1.75244140625, 1.91802978515625, 2.0836181640625, 2.24920654296875, 2.414794921875, 2.58038330078125, 2.7459716796875, 2.91156005859375, 3.0771484375, 3.24273681640625, 3.4083251953125, 3.57391357421875, 3.739501953125, 3.90509033203125, 4.0706787109375, 4.23626708984375, 4.40185546875, 4.56744384765625, 4.7330322265625, 4.89862060546875, 5.064208984375, 5.22979736328125, 5.3953857421875, 5.56097412109375, 5.7265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 1.0, 6.0, 6.0, 7.0, 16.0, 16.0, 17.0, 21.0, 16.0, 27.0, 31.0, 31.0, 45.0, 31.0, 70.0, 82.0, 113.0, 182.0, 1390.0, 291.0, 133.0, 87.0, 66.0, 41.0, 40.0, 39.0, 29.0, 28.0, 31.0, 22.0, 21.0, 17.0, 15.0, 13.0, 19.0, 11.0, 5.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.03125, -9.70556640625, -9.3798828125, -9.05419921875, -8.728515625, -8.40283203125, -8.0771484375, -7.75146484375, -7.42578125, -7.10009765625, -6.7744140625, -6.44873046875, -6.123046875, -5.79736328125, -5.4716796875, -5.14599609375, -4.8203125, -4.49462890625, -4.1689453125, -3.84326171875, -3.517578125, -3.19189453125, -2.8662109375, -2.54052734375, -2.21484375, -1.88916015625, -1.5634765625, -1.23779296875, -0.912109375, -0.58642578125, -0.2607421875, 0.06494140625, 0.390625, 0.71630859375, 1.0419921875, 1.36767578125, 1.693359375, 2.01904296875, 2.3447265625, 2.67041015625, 2.99609375, 3.32177734375, 3.6474609375, 3.97314453125, 4.298828125, 4.62451171875, 4.9501953125, 5.27587890625, 5.6015625, 5.92724609375, 6.2529296875, 6.57861328125, 6.904296875, 7.22998046875, 7.5556640625, 7.88134765625, 8.20703125, 8.53271484375, 8.8583984375, 9.18408203125, 9.509765625, 9.83544921875, 10.1611328125, 10.48681640625, 10.8125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 12.0, 9.0, 13.0, 13.0, 20.0, 22.0, 38.0, 49.0, 81.0, 91.0, 161.0, 260.0, 500.0, 1167.0, 3992.0, 20739.0, 246759.0, 2732080.0, 120657.0, 13908.0, 3068.0, 959.0, 449.0, 224.0, 144.0, 80.0, 67.0, 36.0, 26.0, 23.0, 16.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.50537109375, -15.9794921875, -15.45361328125, -14.927734375, -14.40185546875, -13.8759765625, -13.35009765625, -12.82421875, -12.29833984375, -11.7724609375, -11.24658203125, -10.720703125, -10.19482421875, -9.6689453125, -9.14306640625, -8.6171875, -8.09130859375, -7.5654296875, -7.03955078125, -6.513671875, -5.98779296875, -5.4619140625, -4.93603515625, -4.41015625, -3.88427734375, -3.3583984375, -2.83251953125, -2.306640625, -1.78076171875, -1.2548828125, -0.72900390625, -0.203125, 0.32275390625, 0.8486328125, 1.37451171875, 1.900390625, 2.42626953125, 2.9521484375, 3.47802734375, 4.00390625, 4.52978515625, 5.0556640625, 5.58154296875, 6.107421875, 6.63330078125, 7.1591796875, 7.68505859375, 8.2109375, 8.73681640625, 9.2626953125, 9.78857421875, 10.314453125, 10.84033203125, 11.3662109375, 11.89208984375, 12.41796875, 12.94384765625, 13.4697265625, 13.99560546875, 14.521484375, 15.04736328125, 15.5732421875, 16.09912109375, 16.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 24.0, 99.0, 332.0, 364.0, 153.0, 32.0, 12.0], "bins": [-138.59930419921875, -136.29335021972656, -133.98741149902344, -131.68145751953125, -129.37551879882812, -127.06956481933594, -124.76361846923828, -122.45767211914062, -120.15171813964844, -117.84577178955078, -115.53982543945312, -113.23387145996094, -110.92792510986328, -108.62197875976562, -106.31603240966797, -104.01008605957031, -101.70413970947266, -99.398193359375, -97.09224700927734, -94.78629302978516, -92.4803466796875, -90.17440032958984, -87.86845397949219, -85.56250762939453, -83.25656127929688, -80.95061492919922, -78.64466857910156, -76.33871459960938, -74.03276824951172, -71.72682189941406, -69.4208755493164, -67.11492919921875, -64.8089828491211, -62.50303649902344, -60.197086334228516, -57.89113998413086, -55.58518981933594, -53.27924346923828, -50.973297119140625, -48.66735076904297, -46.36140060424805, -44.05545425415039, -41.74950408935547, -39.44355773925781, -37.137611389160156, -34.831661224365234, -32.52571487426758, -30.21976661682129, -27.913818359375, -25.60787010192871, -23.301921844482422, -20.995975494384766, -18.690027236938477, -16.384078979492188, -14.078131675720215, -11.772184371948242, -9.466236114501953, -7.160288333892822, -4.854340553283691, -2.5483927726745605, -0.2424449920654297, 2.0635032653808594, 4.369450569152832, 6.675397872924805, 8.981346130371094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 9.0, 10.0, 10.0, 14.0, 13.0, 15.0, 23.0, 27.0, 34.0, 34.0, 28.0, 29.0, 21.0, 26.0, 31.0, 49.0, 59.0, 51.0, 41.0, 41.0, 50.0, 44.0, 23.0, 23.0, 41.0, 30.0, 30.0, 32.0, 16.0, 22.0, 11.0, 17.0, 9.0, 9.0, 14.0, 17.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.878116607666016, -23.134761810302734, -22.39140510559082, -21.64805030822754, -20.904693603515625, -20.161338806152344, -19.417984008789062, -18.67462921142578, -17.931272506713867, -17.187917709350586, -16.444561004638672, -15.70120620727539, -14.957850456237793, -14.214494705200195, -13.471139907836914, -12.727784156799316, -11.984428405761719, -11.241072654724121, -10.497716903686523, -9.754362106323242, -9.011006355285645, -8.267650604248047, -7.524295330047607, -6.780940055847168, -6.03758430480957, -5.294228553771973, -4.550873279571533, -3.8075177669525146, -3.064162254333496, -2.3208067417144775, -1.577451229095459, -0.8340959548950195, -0.09074020385742188, 0.6526153087615967, 1.3959708213806152, 2.139326333999634, 2.8826818466186523, 3.626037359237671, 4.3693928718566895, 5.112748146057129, 5.856103897094727, 6.599459648132324, 7.342814922332764, 8.086170196533203, 8.8295259475708, 9.572881698608398, 10.31623649597168, 11.059592247009277, 11.802947998046875, 12.546303749084473, 13.28965950012207, 14.033014297485352, 14.77637004852295, 15.519725799560547, 16.263080596923828, 17.00643539428711, 17.749792098999023, 18.493146896362305, 19.23650360107422, 19.9798583984375, 20.72321319580078, 21.466569900512695, 22.209924697875977, 22.95328140258789, 23.696636199951172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 3.0, 2.0, 8.0, 9.0, 12.0, 10.0, 11.0, 16.0, 18.0, 12.0, 19.0, 26.0, 34.0, 23.0, 27.0, 49.0, 38.0, 40.0, 37.0, 43.0, 45.0, 36.0, 40.0, 40.0, 38.0, 37.0, 32.0, 24.0, 34.0, 31.0, 25.0, 23.0, 24.0, 11.0, 14.0, 16.0, 19.0, 9.0, 9.0, 4.0, 8.0, 8.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.46484375, -3.351715087890625, -3.23858642578125, -3.125457763671875, -3.0123291015625, -2.899200439453125, -2.78607177734375, -2.672943115234375, -2.559814453125, -2.446685791015625, -2.33355712890625, -2.220428466796875, -2.1072998046875, -1.994171142578125, -1.88104248046875, -1.767913818359375, -1.65478515625, -1.541656494140625, -1.42852783203125, -1.315399169921875, -1.2022705078125, -1.089141845703125, -0.97601318359375, -0.862884521484375, -0.749755859375, -0.636627197265625, -0.52349853515625, -0.410369873046875, -0.2972412109375, -0.184112548828125, -0.07098388671875, 0.042144775390625, 0.1552734375, 0.268402099609375, 0.38153076171875, 0.494659423828125, 0.6077880859375, 0.720916748046875, 0.83404541015625, 0.947174072265625, 1.060302734375, 1.173431396484375, 1.28656005859375, 1.399688720703125, 1.5128173828125, 1.625946044921875, 1.73907470703125, 1.852203369140625, 1.96533203125, 2.078460693359375, 2.19158935546875, 2.304718017578125, 2.4178466796875, 2.530975341796875, 2.64410400390625, 2.757232666015625, 2.870361328125, 2.983489990234375, 3.09661865234375, 3.209747314453125, 3.3228759765625, 3.436004638671875, 3.54913330078125, 3.662261962890625, 3.775390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 7.0, 4.0, 5.0, 11.0, 7.0, 27.0, 32.0, 32.0, 32.0, 44.0, 71.0, 91.0, 130.0, 150.0, 233.0, 374.0, 769.0, 6690.0, 3621492.0, 558804.0, 3548.0, 612.0, 307.0, 206.0, 142.0, 106.0, 87.0, 63.0, 32.0, 30.0, 30.0, 31.0, 23.0, 7.0, 3.0, 5.0, 6.0, 8.0, 4.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.9375, -37.634765625, -36.33203125, -35.029296875, -33.7265625, -32.423828125, -31.12109375, -29.818359375, -28.515625, -27.212890625, -25.91015625, -24.607421875, -23.3046875, -22.001953125, -20.69921875, -19.396484375, -18.09375, -16.791015625, -15.48828125, -14.185546875, -12.8828125, -11.580078125, -10.27734375, -8.974609375, -7.671875, -6.369140625, -5.06640625, -3.763671875, -2.4609375, -1.158203125, 0.14453125, 1.447265625, 2.75, 4.052734375, 5.35546875, 6.658203125, 7.9609375, 9.263671875, 10.56640625, 11.869140625, 13.171875, 14.474609375, 15.77734375, 17.080078125, 18.3828125, 19.685546875, 20.98828125, 22.291015625, 23.59375, 24.896484375, 26.19921875, 27.501953125, 28.8046875, 30.107421875, 31.41015625, 32.712890625, 34.015625, 35.318359375, 36.62109375, 37.923828125, 39.2265625, 40.529296875, 41.83203125, 43.134765625, 44.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 14.0, 14.0, 26.0, 35.0, 38.0, 62.0, 81.0, 104.0, 171.0, 287.0, 493.0, 719.0, 724.0, 453.0, 263.0, 162.0, 91.0, 68.0, 56.0, 32.0, 45.0, 27.0, 23.0, 13.0, 10.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.125, -6.91534423828125, -6.7056884765625, -6.49603271484375, -6.286376953125, -6.07672119140625, -5.8670654296875, -5.65740966796875, -5.44775390625, -5.23809814453125, -5.0284423828125, -4.81878662109375, -4.609130859375, -4.39947509765625, -4.1898193359375, -3.98016357421875, -3.7705078125, -3.56085205078125, -3.3511962890625, -3.14154052734375, -2.931884765625, -2.72222900390625, -2.5125732421875, -2.30291748046875, -2.09326171875, -1.88360595703125, -1.6739501953125, -1.46429443359375, -1.254638671875, -1.04498291015625, -0.8353271484375, -0.62567138671875, -0.416015625, -0.20635986328125, 0.0032958984375, 0.21295166015625, 0.422607421875, 0.63226318359375, 0.8419189453125, 1.05157470703125, 1.26123046875, 1.47088623046875, 1.6805419921875, 1.89019775390625, 2.099853515625, 2.30950927734375, 2.5191650390625, 2.72882080078125, 2.9384765625, 3.14813232421875, 3.3577880859375, 3.56744384765625, 3.777099609375, 3.98675537109375, 4.1964111328125, 4.40606689453125, 4.61572265625, 4.82537841796875, 5.0350341796875, 5.24468994140625, 5.454345703125, 5.66400146484375, 5.8736572265625, 6.08331298828125, 6.29296875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 4.0, 6.0, 17.0, 14.0, 23.0, 20.0, 38.0, 55.0, 91.0, 131.0, 339.0, 1219.0, 13591.0, 704841.0, 3438725.0, 32247.0, 2040.0, 428.0, 169.0, 99.0, 63.0, 40.0, 19.0, 12.0, 9.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53125, -23.767822265625, -23.00439453125, -22.240966796875, -21.4775390625, -20.714111328125, -19.95068359375, -19.187255859375, -18.423828125, -17.660400390625, -16.89697265625, -16.133544921875, -15.3701171875, -14.606689453125, -13.84326171875, -13.079833984375, -12.31640625, -11.552978515625, -10.78955078125, -10.026123046875, -9.2626953125, -8.499267578125, -7.73583984375, -6.972412109375, -6.208984375, -5.445556640625, -4.68212890625, -3.918701171875, -3.1552734375, -2.391845703125, -1.62841796875, -0.864990234375, -0.1015625, 0.661865234375, 1.42529296875, 2.188720703125, 2.9521484375, 3.715576171875, 4.47900390625, 5.242431640625, 6.005859375, 6.769287109375, 7.53271484375, 8.296142578125, 9.0595703125, 9.822998046875, 10.58642578125, 11.349853515625, 12.11328125, 12.876708984375, 13.64013671875, 14.403564453125, 15.1669921875, 15.930419921875, 16.69384765625, 17.457275390625, 18.220703125, 18.984130859375, 19.74755859375, 20.510986328125, 21.2744140625, 22.037841796875, 22.80126953125, 23.564697265625, 24.328125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 19.0, 9.0, 28.0, 28.0, 44.0, 63.0, 86.0, 110.0, 109.0, 105.0, 109.0, 82.0, 76.0, 51.0, 30.0, 14.0, 11.0, 16.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.738236427307129, -9.052277565002441, -8.36631965637207, -7.680360794067383, -6.994401931762695, -6.308443546295166, -5.622485160827637, -4.936526298522949, -4.25056791305542, -3.5646092891693115, -2.878650665283203, -2.192692279815674, -1.5067336559295654, -0.820775032043457, -0.13481664657592773, 0.5511422157287598, 1.237100601196289, 1.9230592250823975, 2.609017848968506, 3.294976234436035, 3.9809348583221436, 4.666893482208252, 5.352851867675781, 6.038810729980469, 6.724769115447998, 7.410727500915527, 8.096686363220215, 8.782644271850586, 9.468603134155273, 10.154561996459961, 10.840520858764648, 11.526479721069336, 12.212438583374023, 12.898397445678711, 13.584355354309082, 14.27031421661377, 14.956273078918457, 15.642230987548828, 16.328189849853516, 17.014148712158203, 17.70010757446289, 18.386066436767578, 19.072025299072266, 19.757984161376953, 20.443941116333008, 21.129899978637695, 21.815858840942383, 22.50181770324707, 23.187774658203125, 23.873733520507812, 24.5596923828125, 25.245651245117188, 25.931608200073242, 26.61756706237793, 27.303525924682617, 27.989484786987305, 28.675443649291992, 29.36140251159668, 30.047361373901367, 30.733318328857422, 31.41927719116211, 32.1052360534668, 32.791194915771484, 33.47715377807617, 34.16311264038086]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 1.0, 4.0, 7.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 19.0, 27.0, 12.0, 22.0, 21.0, 34.0, 33.0, 36.0, 26.0, 41.0, 39.0, 32.0, 42.0, 52.0, 40.0, 42.0, 35.0, 52.0, 40.0, 38.0, 29.0, 31.0, 28.0, 20.0, 28.0, 14.0, 13.0, 20.0, 12.0, 11.0, 10.0, 9.0, 0.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.44189453125, -17.84846305847168, -17.255033493041992, -16.661602020263672, -16.06817054748535, -15.474740028381348, -14.881309509277344, -14.287878036499023, -13.694446563720703, -13.1010160446167, -12.507584571838379, -11.914154052734375, -11.320722579956055, -10.72729206085205, -10.133861541748047, -9.540430068969727, -8.946999549865723, -8.353569030761719, -7.760137557983398, -7.1667070388793945, -6.573275566101074, -5.97984504699707, -5.386414051055908, -4.792983055114746, -4.199552059173584, -3.606121063232422, -3.0126900672912598, -2.4192593097686768, -1.8258283138275146, -1.2323973178863525, -0.6389665603637695, -0.04553556442260742, 0.5478954315185547, 1.1413264274597168, 1.7347573041915894, 2.328188180923462, 2.921619176864624, 3.515050172805786, 4.108480930328369, 4.701911926269531, 5.295342922210693, 5.8887739181518555, 6.482204914093018, 7.07563591003418, 7.669066429138184, 8.262497901916504, 8.855928421020508, 9.449359893798828, 10.042790412902832, 10.636220932006836, 11.229652404785156, 11.82308292388916, 12.41651439666748, 13.009944915771484, 13.603376388549805, 14.196806907653809, 14.790237426757812, 15.383667945861816, 15.977099418640137, 16.57052993774414, 17.16396141052246, 17.75739288330078, 18.35082244873047, 18.94425392150879, 19.53768539428711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 8.0, 8.0, 14.0, 11.0, 19.0, 12.0, 12.0, 26.0, 39.0, 26.0, 35.0, 32.0, 36.0, 46.0, 37.0, 37.0, 39.0, 49.0, 46.0, 52.0, 31.0, 39.0, 49.0, 34.0, 17.0, 29.0, 22.0, 13.0, 24.0, 26.0, 24.0, 12.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.677734375, -3.562835693359375, -3.44793701171875, -3.333038330078125, -3.2181396484375, -3.103240966796875, -2.98834228515625, -2.873443603515625, -2.758544921875, -2.643646240234375, -2.52874755859375, -2.413848876953125, -2.2989501953125, -2.184051513671875, -2.06915283203125, -1.954254150390625, -1.83935546875, -1.724456787109375, -1.60955810546875, -1.494659423828125, -1.3797607421875, -1.264862060546875, -1.14996337890625, -1.035064697265625, -0.920166015625, -0.805267333984375, -0.69036865234375, -0.575469970703125, -0.4605712890625, -0.345672607421875, -0.23077392578125, -0.115875244140625, -0.0009765625, 0.113922119140625, 0.22882080078125, 0.343719482421875, 0.4586181640625, 0.573516845703125, 0.68841552734375, 0.803314208984375, 0.918212890625, 1.033111572265625, 1.14801025390625, 1.262908935546875, 1.3778076171875, 1.492706298828125, 1.60760498046875, 1.722503662109375, 1.83740234375, 1.952301025390625, 2.06719970703125, 2.182098388671875, 2.2969970703125, 2.411895751953125, 2.52679443359375, 2.641693115234375, 2.756591796875, 2.871490478515625, 2.98638916015625, 3.101287841796875, 3.2161865234375, 3.331085205078125, 3.44598388671875, 3.560882568359375, 3.67578125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 12.0, 18.0, 24.0, 41.0, 66.0, 101.0, 137.0, 196.0, 282.0, 381.0, 573.0, 779.0, 1272.0, 1838.0, 2791.0, 4243.0, 6749.0, 11006.0, 18316.0, 32160.0, 60418.0, 124574.0, 250718.0, 256991.0, 128787.0, 62636.0, 33417.0, 18827.0, 11238.0, 6883.0, 4372.0, 2860.0, 1832.0, 1287.0, 868.0, 547.0, 437.0, 257.0, 195.0, 136.0, 99.0, 67.0, 46.0, 26.0, 21.0, 13.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.966796875, -0.9375228881835938, -0.9082489013671875, -0.8789749145507812, -0.849700927734375, -0.8204269409179688, -0.7911529541015625, -0.7618789672851562, -0.73260498046875, -0.7033309936523438, -0.6740570068359375, -0.6447830200195312, -0.615509033203125, -0.5862350463867188, -0.5569610595703125, -0.5276870727539062, -0.4984130859375, -0.46913909912109375, -0.4398651123046875, -0.41059112548828125, -0.381317138671875, -0.35204315185546875, -0.3227691650390625, -0.29349517822265625, -0.26422119140625, -0.23494720458984375, -0.2056732177734375, -0.17639923095703125, -0.147125244140625, -0.11785125732421875, -0.0885772705078125, -0.05930328369140625, -0.030029296875, -0.00075531005859375, 0.0285186767578125, 0.05779266357421875, 0.087066650390625, 0.11634063720703125, 0.1456146240234375, 0.17488861083984375, 0.20416259765625, 0.23343658447265625, 0.2627105712890625, 0.29198455810546875, 0.321258544921875, 0.35053253173828125, 0.3798065185546875, 0.40908050537109375, 0.4383544921875, 0.46762847900390625, 0.4969024658203125, 0.5261764526367188, 0.555450439453125, 0.5847244262695312, 0.6139984130859375, 0.6432723999023438, 0.67254638671875, 0.7018203735351562, 0.7310943603515625, 0.7603683471679688, 0.789642333984375, 0.8189163208007812, 0.8481903076171875, 0.8774642944335938, 0.90673828125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 6.0, 8.0, 7.0, 13.0, 14.0, 13.0, 13.0, 23.0, 17.0, 28.0, 29.0, 29.0, 29.0, 38.0, 29.0, 45.0, 45.0, 33.0, 47.0, 1061.0, 34.0, 46.0, 48.0, 47.0, 39.0, 32.0, 36.0, 29.0, 30.0, 25.0, 19.0, 19.0, 14.0, 9.0, 12.0, 9.0, 11.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.88543701171875, -2.7982177734375, -2.71099853515625, -2.623779296875, -2.53656005859375, -2.4493408203125, -2.36212158203125, -2.27490234375, -2.18768310546875, -2.1004638671875, -2.01324462890625, -1.926025390625, -1.83880615234375, -1.7515869140625, -1.66436767578125, -1.5771484375, -1.48992919921875, -1.4027099609375, -1.31549072265625, -1.228271484375, -1.14105224609375, -1.0538330078125, -0.96661376953125, -0.87939453125, -0.79217529296875, -0.7049560546875, -0.61773681640625, -0.530517578125, -0.44329833984375, -0.3560791015625, -0.26885986328125, -0.181640625, -0.09442138671875, -0.0072021484375, 0.08001708984375, 0.167236328125, 0.25445556640625, 0.3416748046875, 0.42889404296875, 0.51611328125, 0.60333251953125, 0.6905517578125, 0.77777099609375, 0.864990234375, 0.95220947265625, 1.0394287109375, 1.12664794921875, 1.2138671875, 1.30108642578125, 1.3883056640625, 1.47552490234375, 1.562744140625, 1.64996337890625, 1.7371826171875, 1.82440185546875, 1.91162109375, 1.99884033203125, 2.0860595703125, 2.17327880859375, 2.260498046875, 2.34771728515625, 2.4349365234375, 2.52215576171875, 2.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 11.0, 17.0, 21.0, 39.0, 61.0, 85.0, 150.0, 269.0, 471.0, 893.0, 1734.0, 3808.0, 9192.0, 27240.0, 119766.0, 1428486.0, 417500.0, 58950.0, 16754.0, 6204.0, 2605.0, 1274.0, 654.0, 348.0, 211.0, 131.0, 89.0, 44.0, 36.0, 34.0, 12.0, 13.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4755859375, -1.4276580810546875, -1.379730224609375, -1.3318023681640625, -1.28387451171875, -1.2359466552734375, -1.188018798828125, -1.1400909423828125, -1.0921630859375, -1.0442352294921875, -0.996307373046875, -0.9483795166015625, -0.90045166015625, -0.8525238037109375, -0.804595947265625, -0.7566680908203125, -0.708740234375, -0.6608123779296875, -0.612884521484375, -0.5649566650390625, -0.51702880859375, -0.4691009521484375, -0.421173095703125, -0.3732452392578125, -0.3253173828125, -0.2773895263671875, -0.229461669921875, -0.1815338134765625, -0.13360595703125, -0.0856781005859375, -0.037750244140625, 0.0101776123046875, 0.05810546875, 0.1060333251953125, 0.153961181640625, 0.2018890380859375, 0.24981689453125, 0.2977447509765625, 0.345672607421875, 0.3936004638671875, 0.4415283203125, 0.4894561767578125, 0.537384033203125, 0.5853118896484375, 0.63323974609375, 0.6811676025390625, 0.729095458984375, 0.7770233154296875, 0.824951171875, 0.8728790283203125, 0.920806884765625, 0.9687347412109375, 1.01666259765625, 1.0645904541015625, 1.112518310546875, 1.1604461669921875, 1.2083740234375, 1.2563018798828125, 1.304229736328125, 1.3521575927734375, 1.40008544921875, 1.4480133056640625, 1.495941162109375, 1.5438690185546875, 1.591796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 8.0, 7.0, 12.0, 14.0, 21.0, 28.0, 41.0, 69.0, 131.0, 148.0, 182.0, 115.0, 76.0, 46.0, 25.0, 17.0, 14.0, 14.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3879966735839844, -0.37584686279296875, -0.3636970520019531, -0.3515472412109375, -0.3393974304199219, -0.32724761962890625, -0.3150978088378906, -0.302947998046875, -0.2907981872558594, -0.27864837646484375, -0.2664985656738281, -0.2543487548828125, -0.24219894409179688, -0.23004913330078125, -0.21789932250976562, -0.20574951171875, -0.19359970092773438, -0.18144989013671875, -0.16930007934570312, -0.1571502685546875, -0.14500045776367188, -0.13285064697265625, -0.12070083618164062, -0.108551025390625, -0.09640121459960938, -0.08425140380859375, -0.07210159301757812, -0.0599517822265625, -0.047801971435546875, -0.03565216064453125, -0.023502349853515625, -0.0113525390625, 0.000797271728515625, 0.01294708251953125, 0.025096893310546875, 0.0372467041015625, 0.049396514892578125, 0.06154632568359375, 0.07369613647460938, 0.085845947265625, 0.09799575805664062, 0.11014556884765625, 0.12229537963867188, 0.1344451904296875, 0.14659500122070312, 0.15874481201171875, 0.17089462280273438, 0.18304443359375, 0.19519424438476562, 0.20734405517578125, 0.21949386596679688, 0.2316436767578125, 0.24379348754882812, 0.25594329833984375, 0.2680931091308594, 0.280242919921875, 0.2923927307128906, 0.30454254150390625, 0.3166923522949219, 0.3288421630859375, 0.3409919738769531, 0.35314178466796875, 0.3652915954589844, 0.37744140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 21.0, 29.0, 54.0, 93.0, 200.0, 492.0, 11757.0, 1033877.0, 1393.0, 274.0, 120.0, 70.0, 40.0, 30.0, 16.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.857666015625, -7.59814453125, -7.338623046875, -7.0791015625, -6.819580078125, -6.56005859375, -6.300537109375, -6.041015625, -5.781494140625, -5.52197265625, -5.262451171875, -5.0029296875, -4.743408203125, -4.48388671875, -4.224365234375, -3.96484375, -3.705322265625, -3.44580078125, -3.186279296875, -2.9267578125, -2.667236328125, -2.40771484375, -2.148193359375, -1.888671875, -1.629150390625, -1.36962890625, -1.110107421875, -0.8505859375, -0.591064453125, -0.33154296875, -0.072021484375, 0.1875, 0.447021484375, 0.70654296875, 0.966064453125, 1.2255859375, 1.485107421875, 1.74462890625, 2.004150390625, 2.263671875, 2.523193359375, 2.78271484375, 3.042236328125, 3.3017578125, 3.561279296875, 3.82080078125, 4.080322265625, 4.33984375, 4.599365234375, 4.85888671875, 5.118408203125, 5.3779296875, 5.637451171875, 5.89697265625, 6.156494140625, 6.416015625, 6.675537109375, 6.93505859375, 7.194580078125, 7.4541015625, 7.713623046875, 7.97314453125, 8.232666015625, 8.4921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 40.0, 258.0, 540.0, 130.0, 19.0, 13.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423232913017273, -1.3887617588043213, -1.35429048538208, -1.3198192119598389, -1.2853480577468872, -1.2508769035339355, -1.2164056301116943, -1.1819343566894531, -1.1474632024765015, -1.1129920482635498, -1.0785207748413086, -1.0440495014190674, -1.0095783472061157, -0.9751071333885193, -0.9406359195709229, -0.9061647057533264, -0.87169349193573, -0.8372222781181335, -0.8027510643005371, -0.7682798504829407, -0.7338086366653442, -0.6993374228477478, -0.6648662090301514, -0.6303949952125549, -0.5959237813949585, -0.5614525675773621, -0.5269813537597656, -0.4925101399421692, -0.45803892612457275, -0.4235677123069763, -0.3890964984893799, -0.35462528467178345, -0.3201541304588318, -0.28568291664123535, -0.2512117028236389, -0.21674048900604248, -0.18226927518844604, -0.1477980613708496, -0.11332684755325317, -0.07885563373565674, -0.0443844199180603, -0.009913206100463867, 0.02455800771713257, 0.059029221534729004, 0.09350043535232544, 0.12797164916992188, 0.1624428629875183, 0.19691407680511475, 0.23138529062271118, 0.2658565044403076, 0.30032771825790405, 0.3347989320755005, 0.3692701458930969, 0.40374135971069336, 0.4382125735282898, 0.47268378734588623, 0.5071550011634827, 0.5416262149810791, 0.5760974287986755, 0.610568642616272, 0.6450398564338684, 0.6795110702514648, 0.7139822840690613, 0.7484534978866577, 0.7829247117042542]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 10.0, 9.0, 15.0, 13.0, 16.0, 13.0, 21.0, 26.0, 36.0, 24.0, 37.0, 45.0, 36.0, 42.0, 39.0, 34.0, 45.0, 31.0, 36.0, 41.0, 40.0, 48.0, 23.0, 35.0, 30.0, 24.0, 43.0, 25.0, 29.0, 17.0, 12.0, 12.0, 13.0, 9.0, 13.0, 8.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2747429609298706, -0.26545190811157227, -0.2561608552932739, -0.24686981737613678, -0.23757877945899963, -0.2282877266407013, -0.21899667382240295, -0.2097056359052658, -0.20041459798812866, -0.19112354516983032, -0.18183250725269318, -0.17254145443439484, -0.1632504165172577, -0.15395936369895935, -0.144668310880661, -0.13537727296352386, -0.12608622014522552, -0.11679517477750778, -0.10750412940979004, -0.0982130765914917, -0.08892203867435455, -0.07963098585605621, -0.07033994048833847, -0.06104889512062073, -0.051757849752902985, -0.04246680438518524, -0.0331757590174675, -0.023884709924459457, -0.014593664556741714, -0.0053026191890239716, 0.00398842990398407, 0.013279475271701813, 0.022570520639419556, 0.0318615660071373, 0.04115261137485504, 0.05044366046786308, 0.059734705835580826, 0.06902575492858887, 0.07831680029630661, 0.08760784566402435, 0.0968988910317421, 0.10618993639945984, 0.11548098176717758, 0.12477202713489532, 0.13406307995319366, 0.1433541178703308, 0.15264517068862915, 0.1619362235069275, 0.17122726142406464, 0.18051831424236298, 0.18980935215950012, 0.19910040497779846, 0.2083914428949356, 0.21768249571323395, 0.2269735336303711, 0.23626458644866943, 0.24555563926696777, 0.2548466920852661, 0.26413774490356445, 0.2734287679195404, 0.28271982073783875, 0.2920108735561371, 0.3013019263744354, 0.3105929493904114, 0.3198840022087097]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 11.0, 14.0, 12.0, 25.0, 26.0, 23.0, 30.0, 30.0, 25.0, 38.0, 33.0, 54.0, 58.0, 44.0, 46.0, 57.0, 34.0, 53.0, 47.0, 31.0, 35.0, 25.0, 25.0, 27.0, 25.0, 19.0, 21.0, 18.0, 27.0, 10.0, 14.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.609466552734375, -3.48651123046875, -3.363555908203125, -3.2406005859375, -3.117645263671875, -2.99468994140625, -2.871734619140625, -2.748779296875, -2.625823974609375, -2.50286865234375, -2.379913330078125, -2.2569580078125, -2.134002685546875, -2.01104736328125, -1.888092041015625, -1.76513671875, -1.642181396484375, -1.51922607421875, -1.396270751953125, -1.2733154296875, -1.150360107421875, -1.02740478515625, -0.904449462890625, -0.781494140625, -0.658538818359375, -0.53558349609375, -0.412628173828125, -0.2896728515625, -0.166717529296875, -0.04376220703125, 0.079193115234375, 0.2021484375, 0.325103759765625, 0.44805908203125, 0.571014404296875, 0.6939697265625, 0.816925048828125, 0.93988037109375, 1.062835693359375, 1.185791015625, 1.308746337890625, 1.43170166015625, 1.554656982421875, 1.6776123046875, 1.800567626953125, 1.92352294921875, 2.046478271484375, 2.16943359375, 2.292388916015625, 2.41534423828125, 2.538299560546875, 2.6612548828125, 2.784210205078125, 2.90716552734375, 3.030120849609375, 3.153076171875, 3.276031494140625, 3.39898681640625, 3.521942138671875, 3.6448974609375, 3.767852783203125, 3.89080810546875, 4.013763427734375, 4.13671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 13.0, 28.0, 24.0, 35.0, 79.0, 75.0, 106.0, 198.0, 315.0, 430.0, 624.0, 1073.0, 1685.0, 2820.0, 4806.0, 8945.0, 16816.0, 33790.0, 73748.0, 181310.0, 365130.0, 199208.0, 80284.0, 36727.0, 17801.0, 9546.0, 5093.0, 2958.0, 1736.0, 1059.0, 704.0, 418.0, 297.0, 194.0, 137.0, 86.0, 67.0, 50.0, 36.0, 27.0, 13.0, 13.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7890625, -4.63726806640625, -4.4854736328125, -4.33367919921875, -4.181884765625, -4.03009033203125, -3.8782958984375, -3.72650146484375, -3.57470703125, -3.42291259765625, -3.2711181640625, -3.11932373046875, -2.967529296875, -2.81573486328125, -2.6639404296875, -2.51214599609375, -2.3603515625, -2.20855712890625, -2.0567626953125, -1.90496826171875, -1.753173828125, -1.60137939453125, -1.4495849609375, -1.29779052734375, -1.14599609375, -0.99420166015625, -0.8424072265625, -0.69061279296875, -0.538818359375, -0.38702392578125, -0.2352294921875, -0.08343505859375, 0.068359375, 0.22015380859375, 0.3719482421875, 0.52374267578125, 0.675537109375, 0.82733154296875, 0.9791259765625, 1.13092041015625, 1.28271484375, 1.43450927734375, 1.5863037109375, 1.73809814453125, 1.889892578125, 2.04168701171875, 2.1934814453125, 2.34527587890625, 2.4970703125, 2.64886474609375, 2.8006591796875, 2.95245361328125, 3.104248046875, 3.25604248046875, 3.4078369140625, 3.55963134765625, 3.71142578125, 3.86322021484375, 4.0150146484375, 4.16680908203125, 4.318603515625, 4.47039794921875, 4.6221923828125, 4.77398681640625, 4.92578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 8.0, 7.0, 10.0, 11.0, 14.0, 22.0, 28.0, 26.0, 33.0, 20.0, 28.0, 40.0, 53.0, 65.0, 91.0, 194.0, 1412.0, 341.0, 168.0, 84.0, 56.0, 50.0, 47.0, 25.0, 38.0, 31.0, 23.0, 20.0, 14.0, 23.0, 19.0, 8.0, 9.0, 8.0, 7.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-11.8515625, -11.5390625, -11.2265625, -10.9140625, -10.6015625, -10.2890625, -9.9765625, -9.6640625, -9.3515625, -9.0390625, -8.7265625, -8.4140625, -8.1015625, -7.7890625, -7.4765625, -7.1640625, -6.8515625, -6.5390625, -6.2265625, -5.9140625, -5.6015625, -5.2890625, -4.9765625, -4.6640625, -4.3515625, -4.0390625, -3.7265625, -3.4140625, -3.1015625, -2.7890625, -2.4765625, -2.1640625, -1.8515625, -1.5390625, -1.2265625, -0.9140625, -0.6015625, -0.2890625, 0.0234375, 0.3359375, 0.6484375, 0.9609375, 1.2734375, 1.5859375, 1.8984375, 2.2109375, 2.5234375, 2.8359375, 3.1484375, 3.4609375, 3.7734375, 4.0859375, 4.3984375, 4.7109375, 5.0234375, 5.3359375, 5.6484375, 5.9609375, 6.2734375, 6.5859375, 6.8984375, 7.2109375, 7.5234375, 7.8359375, 8.1484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 6.0, 7.0, 17.0, 14.0, 20.0, 24.0, 35.0, 39.0, 41.0, 61.0, 96.0, 145.0, 236.0, 360.0, 626.0, 1828.0, 18223.0, 2969360.0, 147951.0, 4268.0, 983.0, 470.0, 257.0, 181.0, 126.0, 71.0, 47.0, 38.0, 31.0, 17.0, 20.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0], "bins": [-25.890625, -25.145263671875, -24.39990234375, -23.654541015625, -22.9091796875, -22.163818359375, -21.41845703125, -20.673095703125, -19.927734375, -19.182373046875, -18.43701171875, -17.691650390625, -16.9462890625, -16.200927734375, -15.45556640625, -14.710205078125, -13.96484375, -13.219482421875, -12.47412109375, -11.728759765625, -10.9833984375, -10.238037109375, -9.49267578125, -8.747314453125, -8.001953125, -7.256591796875, -6.51123046875, -5.765869140625, -5.0205078125, -4.275146484375, -3.52978515625, -2.784423828125, -2.0390625, -1.293701171875, -0.54833984375, 0.197021484375, 0.9423828125, 1.687744140625, 2.43310546875, 3.178466796875, 3.923828125, 4.669189453125, 5.41455078125, 6.159912109375, 6.9052734375, 7.650634765625, 8.39599609375, 9.141357421875, 9.88671875, 10.632080078125, 11.37744140625, 12.122802734375, 12.8681640625, 13.613525390625, 14.35888671875, 15.104248046875, 15.849609375, 16.594970703125, 17.34033203125, 18.085693359375, 18.8310546875, 19.576416015625, 20.32177734375, 21.067138671875, 21.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 17.0, 125.0, 341.0, 372.0, 129.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.57786560058594, -113.2703628540039, -110.96285247802734, -108.65534973144531, -106.34784698486328, -104.04034423828125, -101.73283386230469, -99.42533111572266, -97.11782836914062, -94.8103256225586, -92.50281524658203, -90.1953125, -87.88780975341797, -85.58030700683594, -83.27279663085938, -80.96529388427734, -78.65778350830078, -76.35028076171875, -74.04277038574219, -71.73526763916016, -69.42776489257812, -67.12025451660156, -64.81275177001953, -62.5052490234375, -60.1977424621582, -57.890235900878906, -55.582733154296875, -53.27522659301758, -50.96772003173828, -48.66021728515625, -46.35271072387695, -44.045204162597656, -41.737701416015625, -39.43019485473633, -37.1226921081543, -34.815185546875, -32.50768280029297, -30.200176239013672, -27.892669677734375, -25.58516502380371, -23.277660369873047, -20.970155715942383, -18.66265106201172, -16.355144500732422, -14.047639846801758, -11.740135192871094, -9.432629585266113, -7.125123977661133, -4.817619323730469, -2.5101141929626465, -0.20260906219482422, 2.104896068572998, 4.41240119934082, 6.719905853271484, 9.027411460876465, 11.334917068481445, 13.64242172241211, 15.949926376342773, 18.257431030273438, 20.564937591552734, 22.8724422454834, 25.179946899414062, 27.48745346069336, 29.794958114624023, 32.10246276855469]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 3.0, 7.0, 7.0, 10.0, 8.0, 18.0, 9.0, 20.0, 15.0, 29.0, 24.0, 30.0, 37.0, 34.0, 38.0, 36.0, 50.0, 46.0, 47.0, 45.0, 36.0, 49.0, 46.0, 39.0, 38.0, 32.0, 21.0, 26.0, 28.0, 23.0, 26.0, 20.0, 26.0, 10.0, 21.0, 10.0, 11.0, 4.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.476526260375977, -25.670103073120117, -24.863679885864258, -24.057254791259766, -23.250831604003906, -22.444408416748047, -21.637985229492188, -20.831562042236328, -20.02513885498047, -19.21871566772461, -18.41229248046875, -17.60586929321289, -16.7994441986084, -15.993021011352539, -15.18659782409668, -14.38017463684082, -13.573750495910645, -12.767327308654785, -11.96090316772461, -11.15447998046875, -10.34805679321289, -9.541633605957031, -8.735209465026855, -7.928786277770996, -7.1223626136779785, -6.315938949584961, -5.509515762329102, -4.703092098236084, -3.8966686725616455, -3.090245246887207, -2.2838215827941895, -1.47739839553833, -0.6709747314453125, 0.13544875383377075, 0.941872239112854, 1.748295783996582, 2.5547192096710205, 3.361142635345459, 4.167566299438477, 4.973989486694336, 5.7804131507873535, 6.586836814880371, 7.3932600021362305, 8.199684143066406, 9.006107330322266, 9.812530517578125, 10.618953704833984, 11.425376892089844, 12.23180103302002, 13.038224220275879, 13.844648361206055, 14.651071548461914, 15.457494735717773, 16.263917922973633, 17.070343017578125, 17.876766204833984, 18.683189392089844, 19.489612579345703, 20.296035766601562, 21.102458953857422, 21.908884048461914, 22.715307235717773, 23.521730422973633, 24.328153610229492, 25.13457679748535]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 12.0, 13.0, 15.0, 17.0, 21.0, 31.0, 24.0, 35.0, 38.0, 47.0, 34.0, 45.0, 57.0, 43.0, 56.0, 54.0, 39.0, 46.0, 44.0, 36.0, 41.0, 35.0, 30.0, 29.0, 22.0, 24.0, 21.0, 12.0, 20.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13739013671875, -4.0013427734375, -3.86529541015625, -3.729248046875, -3.59320068359375, -3.4571533203125, -3.32110595703125, -3.18505859375, -3.04901123046875, -2.9129638671875, -2.77691650390625, -2.640869140625, -2.50482177734375, -2.3687744140625, -2.23272705078125, -2.0966796875, -1.96063232421875, -1.8245849609375, -1.68853759765625, -1.552490234375, -1.41644287109375, -1.2803955078125, -1.14434814453125, -1.00830078125, -0.87225341796875, -0.7362060546875, -0.60015869140625, -0.464111328125, -0.32806396484375, -0.1920166015625, -0.05596923828125, 0.080078125, 0.21612548828125, 0.3521728515625, 0.48822021484375, 0.624267578125, 0.76031494140625, 0.8963623046875, 1.03240966796875, 1.16845703125, 1.30450439453125, 1.4405517578125, 1.57659912109375, 1.712646484375, 1.84869384765625, 1.9847412109375, 2.12078857421875, 2.2568359375, 2.39288330078125, 2.5289306640625, 2.66497802734375, 2.801025390625, 2.93707275390625, 3.0731201171875, 3.20916748046875, 3.34521484375, 3.48126220703125, 3.6173095703125, 3.75335693359375, 3.889404296875, 4.02545166015625, 4.1614990234375, 4.29754638671875, 4.43359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 5.0, 3.0, 2.0, 10.0, 15.0, 24.0, 22.0, 29.0, 52.0, 63.0, 89.0, 117.0, 162.0, 235.0, 302.0, 466.0, 638.0, 898.0, 1370.0, 2175.0, 3787.0, 6985.0, 14283.0, 35694.0, 115746.0, 430163.0, 1408792.0, 1530492.0, 458715.0, 115234.0, 34971.0, 14786.0, 7065.0, 3946.0, 2294.0, 1475.0, 935.0, 635.0, 485.0, 296.0, 191.0, 169.0, 128.0, 100.0, 70.0, 51.0, 37.0, 19.0, 22.0, 11.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0], "bins": [-4.83203125, -4.69000244140625, -4.5479736328125, -4.40594482421875, -4.263916015625, -4.12188720703125, -3.9798583984375, -3.83782958984375, -3.69580078125, -3.55377197265625, -3.4117431640625, -3.26971435546875, -3.127685546875, -2.98565673828125, -2.8436279296875, -2.70159912109375, -2.5595703125, -2.41754150390625, -2.2755126953125, -2.13348388671875, -1.991455078125, -1.84942626953125, -1.7073974609375, -1.56536865234375, -1.42333984375, -1.28131103515625, -1.1392822265625, -0.99725341796875, -0.855224609375, -0.71319580078125, -0.5711669921875, -0.42913818359375, -0.287109375, -0.14508056640625, -0.0030517578125, 0.13897705078125, 0.281005859375, 0.42303466796875, 0.5650634765625, 0.70709228515625, 0.84912109375, 0.99114990234375, 1.1331787109375, 1.27520751953125, 1.417236328125, 1.55926513671875, 1.7012939453125, 1.84332275390625, 1.9853515625, 2.12738037109375, 2.2694091796875, 2.41143798828125, 2.553466796875, 2.69549560546875, 2.8375244140625, 2.97955322265625, 3.12158203125, 3.26361083984375, 3.4056396484375, 3.54766845703125, 3.689697265625, 3.83172607421875, 3.9737548828125, 4.11578369140625, 4.2578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 15.0, 8.0, 9.0, 26.0, 22.0, 37.0, 30.0, 52.0, 87.0, 110.0, 103.0, 140.0, 195.0, 301.0, 467.0, 562.0, 523.0, 381.0, 244.0, 180.0, 122.0, 88.0, 79.0, 65.0, 53.0, 41.0, 35.0, 27.0, 11.0, 22.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.8863525390625, -6.682861328125, -6.4793701171875, -6.27587890625, -6.0723876953125, -5.868896484375, -5.6654052734375, -5.4619140625, -5.2584228515625, -5.054931640625, -4.8514404296875, -4.64794921875, -4.4444580078125, -4.240966796875, -4.0374755859375, -3.833984375, -3.6304931640625, -3.427001953125, -3.2235107421875, -3.02001953125, -2.8165283203125, -2.613037109375, -2.4095458984375, -2.2060546875, -2.0025634765625, -1.799072265625, -1.5955810546875, -1.39208984375, -1.1885986328125, -0.985107421875, -0.7816162109375, -0.578125, -0.3746337890625, -0.171142578125, 0.0323486328125, 0.23583984375, 0.4393310546875, 0.642822265625, 0.8463134765625, 1.0498046875, 1.2532958984375, 1.456787109375, 1.6602783203125, 1.86376953125, 2.0672607421875, 2.270751953125, 2.4742431640625, 2.677734375, 2.8812255859375, 3.084716796875, 3.2882080078125, 3.49169921875, 3.6951904296875, 3.898681640625, 4.1021728515625, 4.3056640625, 4.5091552734375, 4.712646484375, 4.9161376953125, 5.11962890625, 5.3231201171875, 5.526611328125, 5.7301025390625, 5.93359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 10.0, 8.0, 18.0, 21.0, 17.0, 28.0, 31.0, 62.0, 83.0, 127.0, 208.0, 288.0, 480.0, 782.0, 1301.0, 2523.0, 5991.0, 18329.0, 78661.0, 446471.0, 2885271.0, 615516.0, 101235.0, 23016.0, 7131.0, 2901.0, 1496.0, 833.0, 515.0, 322.0, 197.0, 130.0, 102.0, 56.0, 32.0, 27.0, 19.0, 13.0, 10.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1875, -6.9268798828125, -6.666259765625, -6.4056396484375, -6.14501953125, -5.8843994140625, -5.623779296875, -5.3631591796875, -5.1025390625, -4.8419189453125, -4.581298828125, -4.3206787109375, -4.06005859375, -3.7994384765625, -3.538818359375, -3.2781982421875, -3.017578125, -2.7569580078125, -2.496337890625, -2.2357177734375, -1.97509765625, -1.7144775390625, -1.453857421875, -1.1932373046875, -0.9326171875, -0.6719970703125, -0.411376953125, -0.1507568359375, 0.10986328125, 0.3704833984375, 0.631103515625, 0.8917236328125, 1.15234375, 1.4129638671875, 1.673583984375, 1.9342041015625, 2.19482421875, 2.4554443359375, 2.716064453125, 2.9766845703125, 3.2373046875, 3.4979248046875, 3.758544921875, 4.0191650390625, 4.27978515625, 4.5404052734375, 4.801025390625, 5.0616455078125, 5.322265625, 5.5828857421875, 5.843505859375, 6.1041259765625, 6.36474609375, 6.6253662109375, 6.885986328125, 7.1466064453125, 7.4072265625, 7.6678466796875, 7.928466796875, 8.1890869140625, 8.44970703125, 8.7103271484375, 8.970947265625, 9.2315673828125, 9.4921875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 19.0, 222.0, 553.0, 196.0, 17.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.85098266601562, -154.71749877929688, -150.58399963378906, -146.4505157470703, -142.31703186035156, -138.1835479736328, -134.050048828125, -129.91656494140625, -125.7830810546875, -121.64958953857422, -117.51610565185547, -113.38261413574219, -109.24913024902344, -105.11563873291016, -100.98214721679688, -96.84866333007812, -92.71517181396484, -88.58168029785156, -84.44819641113281, -80.31470489501953, -76.18122100830078, -72.0477294921875, -67.91424560546875, -63.78075408935547, -59.64726638793945, -55.51377868652344, -51.38029098510742, -47.246803283691406, -43.113311767578125, -38.979827880859375, -34.846336364746094, -30.712848663330078, -26.579360961914062, -22.445873260498047, -18.31238555908203, -14.178895950317383, -10.045408248901367, -5.911920547485352, -1.7784309387207031, 2.3550567626953125, 6.488544464111328, 10.622032165527344, 14.755520820617676, 18.889009475708008, 23.022497177124023, 27.15598487854004, 31.289474487304688, 35.4229621887207, 39.55644989013672, 43.689937591552734, 47.82342529296875, 51.95691680908203, 56.09040069580078, 60.22389221191406, 64.35737609863281, 68.4908676147461, 72.62435913085938, 76.75785064697266, 80.8913345336914, 85.02482604980469, 89.15830993652344, 93.29180145263672, 97.42529296875, 101.55877685546875, 105.6922607421875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 3.0, 3.0, 7.0, 11.0, 14.0, 7.0, 11.0, 21.0, 20.0, 21.0, 20.0, 25.0, 30.0, 32.0, 33.0, 35.0, 38.0, 28.0, 40.0, 40.0, 30.0, 44.0, 41.0, 46.0, 42.0, 56.0, 38.0, 39.0, 31.0, 25.0, 33.0, 14.0, 18.0, 18.0, 18.0, 14.0, 11.0, 12.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.935544967651367, -23.193965911865234, -22.45238494873047, -21.710805892944336, -20.96922492980957, -20.227645874023438, -19.486064910888672, -18.74448585510254, -18.002906799316406, -17.261327743530273, -16.519746780395508, -15.778167724609375, -15.036587715148926, -14.295007705688477, -13.553427696228027, -12.811847686767578, -12.070267677307129, -11.32868766784668, -10.58710765838623, -9.845527648925781, -9.103948593139648, -8.3623685836792, -7.62078857421875, -6.879209041595459, -6.13762903213501, -5.3960490226745605, -4.6544694900512695, -3.9128894805908203, -3.17130970954895, -2.42972993850708, -1.6881499290466309, -0.9465703964233398, -0.20499038696289062, 0.5365894436836243, 1.2781692743301392, 2.019749164581299, 2.761328935623169, 3.502908706665039, 4.244488716125488, 4.986068248748779, 5.7276482582092285, 6.469228267669678, 7.210807800292969, 7.952387809753418, 8.693967819213867, 9.435546875, 10.177127838134766, 10.918706893920898, 11.660286903381348, 12.401866912841797, 13.143446922302246, 13.885026931762695, 14.626605987548828, 15.368185997009277, 16.109766006469727, 16.85134506225586, 17.592926025390625, 18.334505081176758, 19.076086044311523, 19.817665100097656, 20.559246063232422, 21.300825119018555, 22.042404174804688, 22.783985137939453, 23.525564193725586]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 16.0, 19.0, 19.0, 15.0, 22.0, 30.0, 34.0, 23.0, 36.0, 37.0, 29.0, 36.0, 38.0, 40.0, 37.0, 37.0, 32.0, 33.0, 39.0, 40.0, 37.0, 29.0, 36.0, 28.0, 18.0, 28.0, 21.0, 19.0, 20.0, 19.0, 12.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0], "bins": [-2.810546875, -2.7255859375, -2.640625, -2.5556640625, -2.470703125, -2.3857421875, -2.30078125, -2.2158203125, -2.130859375, -2.0458984375, -1.9609375, -1.8759765625, -1.791015625, -1.7060546875, -1.62109375, -1.5361328125, -1.451171875, -1.3662109375, -1.28125, -1.1962890625, -1.111328125, -1.0263671875, -0.94140625, -0.8564453125, -0.771484375, -0.6865234375, -0.6015625, -0.5166015625, -0.431640625, -0.3466796875, -0.26171875, -0.1767578125, -0.091796875, -0.0068359375, 0.078125, 0.1630859375, 0.248046875, 0.3330078125, 0.41796875, 0.5029296875, 0.587890625, 0.6728515625, 0.7578125, 0.8427734375, 0.927734375, 1.0126953125, 1.09765625, 1.1826171875, 1.267578125, 1.3525390625, 1.4375, 1.5224609375, 1.607421875, 1.6923828125, 1.77734375, 1.8623046875, 1.947265625, 2.0322265625, 2.1171875, 2.2021484375, 2.287109375, 2.3720703125, 2.45703125, 2.5419921875, 2.626953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 31.0, 41.0, 50.0, 77.0, 115.0, 171.0, 252.0, 372.0, 554.0, 818.0, 1189.0, 1943.0, 3036.0, 4958.0, 7892.0, 12653.0, 21952.0, 37743.0, 65510.0, 113168.0, 185345.0, 220414.0, 152409.0, 90633.0, 52283.0, 29595.0, 17629.0, 10443.0, 6301.0, 3779.0, 2466.0, 1550.0, 1000.0, 686.0, 469.0, 310.0, 224.0, 134.0, 113.0, 75.0, 41.0, 31.0, 27.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.378662109375, -0.36728668212890625, -0.3559112548828125, -0.34453582763671875, -0.333160400390625, -0.32178497314453125, -0.3104095458984375, -0.29903411865234375, -0.28765869140625, -0.27628326416015625, -0.2649078369140625, -0.25353240966796875, -0.242156982421875, -0.23078155517578125, -0.2194061279296875, -0.20803070068359375, -0.1966552734375, -0.18527984619140625, -0.1739044189453125, -0.16252899169921875, -0.151153564453125, -0.13977813720703125, -0.1284027099609375, -0.11702728271484375, -0.10565185546875, -0.09427642822265625, -0.0829010009765625, -0.07152557373046875, -0.060150146484375, -0.04877471923828125, -0.0373992919921875, -0.02602386474609375, -0.0146484375, -0.00327301025390625, 0.0081024169921875, 0.01947784423828125, 0.030853271484375, 0.04222869873046875, 0.0536041259765625, 0.06497955322265625, 0.07635498046875, 0.08773040771484375, 0.0991058349609375, 0.11048126220703125, 0.121856689453125, 0.13323211669921875, 0.1446075439453125, 0.15598297119140625, 0.1673583984375, 0.17873382568359375, 0.1901092529296875, 0.20148468017578125, 0.212860107421875, 0.22423553466796875, 0.2356109619140625, 0.24698638916015625, 0.25836181640625, 0.26973724365234375, 0.2811126708984375, 0.29248809814453125, 0.303863525390625, 0.31523895263671875, 0.3266143798828125, 0.33798980712890625, 0.349365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 4.0, 9.0, 7.0, 15.0, 8.0, 15.0, 23.0, 14.0, 16.0, 24.0, 31.0, 31.0, 37.0, 37.0, 38.0, 38.0, 28.0, 33.0, 39.0, 45.0, 1069.0, 35.0, 43.0, 37.0, 40.0, 26.0, 37.0, 24.0, 40.0, 23.0, 22.0, 22.0, 23.0, 19.0, 10.0, 13.0, 10.0, 6.0, 2.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.14959716796875, -2.0784912109375, -2.00738525390625, -1.936279296875, -1.86517333984375, -1.7940673828125, -1.72296142578125, -1.65185546875, -1.58074951171875, -1.5096435546875, -1.43853759765625, -1.367431640625, -1.29632568359375, -1.2252197265625, -1.15411376953125, -1.0830078125, -1.01190185546875, -0.9407958984375, -0.86968994140625, -0.798583984375, -0.72747802734375, -0.6563720703125, -0.58526611328125, -0.51416015625, -0.44305419921875, -0.3719482421875, -0.30084228515625, -0.229736328125, -0.15863037109375, -0.0875244140625, -0.01641845703125, 0.0546875, 0.12579345703125, 0.1968994140625, 0.26800537109375, 0.339111328125, 0.41021728515625, 0.4813232421875, 0.55242919921875, 0.62353515625, 0.69464111328125, 0.7657470703125, 0.83685302734375, 0.907958984375, 0.97906494140625, 1.0501708984375, 1.12127685546875, 1.1923828125, 1.26348876953125, 1.3345947265625, 1.40570068359375, 1.476806640625, 1.54791259765625, 1.6190185546875, 1.69012451171875, 1.76123046875, 1.83233642578125, 1.9034423828125, 1.97454833984375, 2.045654296875, 2.11676025390625, 2.1878662109375, 2.25897216796875, 2.330078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 16.0, 25.0, 49.0, 67.0, 121.0, 176.0, 342.0, 706.0, 1634.0, 4252.0, 12901.0, 50466.0, 248536.0, 1489727.0, 222880.0, 46285.0, 12175.0, 3798.0, 1490.0, 653.0, 345.0, 197.0, 105.0, 55.0, 34.0, 17.0, 14.0, 16.0, 13.0, 2.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6912612915039062, -0.6706085205078125, -0.6499557495117188, -0.629302978515625, -0.6086502075195312, -0.5879974365234375, -0.5673446655273438, -0.54669189453125, -0.5260391235351562, -0.5053863525390625, -0.48473358154296875, -0.464080810546875, -0.44342803955078125, -0.4227752685546875, -0.40212249755859375, -0.3814697265625, -0.36081695556640625, -0.3401641845703125, -0.31951141357421875, -0.298858642578125, -0.27820587158203125, -0.2575531005859375, -0.23690032958984375, -0.21624755859375, -0.19559478759765625, -0.1749420166015625, -0.15428924560546875, -0.133636474609375, -0.11298370361328125, -0.0923309326171875, -0.07167816162109375, -0.051025390625, -0.03037261962890625, -0.0097198486328125, 0.01093292236328125, 0.031585693359375, 0.05223846435546875, 0.0728912353515625, 0.09354400634765625, 0.11419677734375, 0.13484954833984375, 0.1555023193359375, 0.17615509033203125, 0.196807861328125, 0.21746063232421875, 0.2381134033203125, 0.25876617431640625, 0.2794189453125, 0.30007171630859375, 0.3207244873046875, 0.34137725830078125, 0.362030029296875, 0.38268280029296875, 0.4033355712890625, 0.42398834228515625, 0.44464111328125, 0.46529388427734375, 0.4859466552734375, 0.5065994262695312, 0.527252197265625, 0.5479049682617188, 0.5685577392578125, 0.5892105102539062, 0.60986328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 10.0, 17.0, 18.0, 24.0, 27.0, 62.0, 61.0, 88.0, 133.0, 139.0, 132.0, 68.0, 41.0, 26.0, 29.0, 14.0, 13.0, 10.0, 9.0, 6.0, 14.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.090576171875, -0.0881357192993164, -0.08569526672363281, -0.08325481414794922, -0.08081436157226562, -0.07837390899658203, -0.07593345642089844, -0.07349300384521484, -0.07105255126953125, -0.06861209869384766, -0.06617164611816406, -0.06373119354248047, -0.061290740966796875, -0.05885028839111328, -0.05640983581542969, -0.053969383239746094, -0.0515289306640625, -0.049088478088378906, -0.04664802551269531, -0.04420757293701172, -0.041767120361328125, -0.03932666778564453, -0.03688621520996094, -0.034445762634277344, -0.03200531005859375, -0.029564857482910156, -0.027124404907226562, -0.02468395233154297, -0.022243499755859375, -0.01980304718017578, -0.017362594604492188, -0.014922142028808594, -0.012481689453125, -0.010041236877441406, -0.0076007843017578125, -0.005160331726074219, -0.002719879150390625, -0.00027942657470703125, 0.0021610260009765625, 0.004601478576660156, 0.00704193115234375, 0.009482383728027344, 0.011922836303710938, 0.014363288879394531, 0.016803741455078125, 0.01924419403076172, 0.021684646606445312, 0.024125099182128906, 0.0265655517578125, 0.029006004333496094, 0.03144645690917969, 0.03388690948486328, 0.036327362060546875, 0.03876781463623047, 0.04120826721191406, 0.043648719787597656, 0.04608917236328125, 0.048529624938964844, 0.05097007751464844, 0.05341053009033203, 0.055850982666015625, 0.05829143524169922, 0.06073188781738281, 0.0631723403930664, 0.06561279296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 4.0, 7.0, 13.0, 10.0, 18.0, 35.0, 27.0, 32.0, 61.0, 83.0, 171.0, 317.0, 1021.0, 1026617.0, 18845.0, 568.0, 267.0, 123.0, 92.0, 54.0, 42.0, 30.0, 20.0, 17.0, 13.0, 6.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.646484375, -1.593017578125, -1.53955078125, -1.486083984375, -1.4326171875, -1.379150390625, -1.32568359375, -1.272216796875, -1.21875, -1.165283203125, -1.11181640625, -1.058349609375, -1.0048828125, -0.951416015625, -0.89794921875, -0.844482421875, -0.791015625, -0.737548828125, -0.68408203125, -0.630615234375, -0.5771484375, -0.523681640625, -0.47021484375, -0.416748046875, -0.36328125, -0.309814453125, -0.25634765625, -0.202880859375, -0.1494140625, -0.095947265625, -0.04248046875, 0.010986328125, 0.064453125, 0.117919921875, 0.17138671875, 0.224853515625, 0.2783203125, 0.331787109375, 0.38525390625, 0.438720703125, 0.4921875, 0.545654296875, 0.59912109375, 0.652587890625, 0.7060546875, 0.759521484375, 0.81298828125, 0.866455078125, 0.919921875, 0.973388671875, 1.02685546875, 1.080322265625, 1.1337890625, 1.187255859375, 1.24072265625, 1.294189453125, 1.34765625, 1.401123046875, 1.45458984375, 1.508056640625, 1.5615234375, 1.614990234375, 1.66845703125, 1.721923828125, 1.775390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 67.0, 617.0, 297.0, 27.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23715998232364655, -0.22576290369033813, -0.21436583995819092, -0.2029687613248825, -0.1915716826915741, -0.18017460405826569, -0.16877752542495728, -0.15738046169281006, -0.14598338305950165, -0.13458630442619324, -0.12318923324346542, -0.11179216206073761, -0.1003950834274292, -0.08899800479412079, -0.07760093361139297, -0.06620386242866516, -0.05480678379535675, -0.04340970888733864, -0.032012633979320526, -0.020615559071302414, -0.009218484163284302, 0.0021785907447338104, 0.013575665652751923, 0.024972736835479736, 0.03636981546878815, 0.04776689037680626, 0.05916396528482437, 0.07056103646755219, 0.0819581151008606, 0.093355193734169, 0.10475226491689682, 0.11614933609962463, 0.12754639983177185, 0.13894347846508026, 0.15034055709838867, 0.1617376208305359, 0.1731346994638443, 0.1845317780971527, 0.19592884182929993, 0.20732592046260834, 0.21872299909591675, 0.23012007772922516, 0.24151715636253357, 0.2529142200946808, 0.2643113136291504, 0.2757083773612976, 0.2871054410934448, 0.29850250482559204, 0.30989959836006165, 0.32129666209220886, 0.33269375562667847, 0.3440908193588257, 0.3554878830909729, 0.3668849766254425, 0.3782820403575897, 0.3896791338920593, 0.40107619762420654, 0.41247326135635376, 0.42387035489082336, 0.4352674186229706, 0.4466645121574402, 0.4580615758895874, 0.4694586396217346, 0.48085570335388184, 0.49225279688835144]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 13.0, 8.0, 9.0, 20.0, 13.0, 18.0, 23.0, 20.0, 38.0, 33.0, 44.0, 31.0, 42.0, 37.0, 44.0, 47.0, 50.0, 46.0, 36.0, 55.0, 48.0, 44.0, 38.0, 27.0, 35.0, 31.0, 22.0, 23.0, 28.0, 19.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05618172883987427, -0.05404782295227051, -0.051913920789957047, -0.049780018627643585, -0.047646112740039825, -0.045512206852436066, -0.043378304690122604, -0.04124440252780914, -0.03911049664020538, -0.036976590752601624, -0.03484268859028816, -0.0327087864279747, -0.03057488054037094, -0.02844097651541233, -0.02630707249045372, -0.02417316846549511, -0.0220392644405365, -0.01990536041557789, -0.017771456390619278, -0.015637552365660667, -0.013503648340702057, -0.011369744315743446, -0.009235840290784836, -0.007101936265826225, -0.004968032240867615, -0.002834128215909004, -0.0007002241909503937, 0.0014336798340082169, 0.0035675838589668274, 0.005701487883925438, 0.007835391908884048, 0.009969295933842659, 0.01210319995880127, 0.01423710398375988, 0.01637100800871849, 0.0185049120336771, 0.02063881605863571, 0.022772720083594322, 0.024906624108552933, 0.027040528133511543, 0.029174432158470154, 0.031308338046073914, 0.033442240208387375, 0.035576142370700836, 0.037710048258304596, 0.039843954145908356, 0.04197785630822182, 0.04411175847053528, 0.04624566435813904, 0.0483795702457428, 0.05051347240805626, 0.05264737457036972, 0.05478128045797348, 0.05691518634557724, 0.0590490885078907, 0.06118299067020416, 0.06331689655780792, 0.06545080244541168, 0.06758470833301544, 0.0697186067700386, 0.07185251265764236, 0.07398641854524612, 0.07612031698226929, 0.07825422286987305, 0.0803881287574768]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 0.0, 4.0, 1.0, 8.0, 9.0, 6.0, 11.0, 12.0, 18.0, 13.0, 21.0, 26.0, 33.0, 24.0, 31.0, 34.0, 41.0, 33.0, 43.0, 36.0, 46.0, 36.0, 49.0, 42.0, 30.0, 41.0, 40.0, 34.0, 37.0, 21.0, 29.0, 35.0, 23.0, 13.0, 27.0, 23.0, 18.0, 12.0, 9.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0], "bins": [-3.279296875, -3.18701171875, -3.0947265625, -3.00244140625, -2.91015625, -2.81787109375, -2.7255859375, -2.63330078125, -2.541015625, -2.44873046875, -2.3564453125, -2.26416015625, -2.171875, -2.07958984375, -1.9873046875, -1.89501953125, -1.802734375, -1.71044921875, -1.6181640625, -1.52587890625, -1.43359375, -1.34130859375, -1.2490234375, -1.15673828125, -1.064453125, -0.97216796875, -0.8798828125, -0.78759765625, -0.6953125, -0.60302734375, -0.5107421875, -0.41845703125, -0.326171875, -0.23388671875, -0.1416015625, -0.04931640625, 0.04296875, 0.13525390625, 0.2275390625, 0.31982421875, 0.412109375, 0.50439453125, 0.5966796875, 0.68896484375, 0.78125, 0.87353515625, 0.9658203125, 1.05810546875, 1.150390625, 1.24267578125, 1.3349609375, 1.42724609375, 1.51953125, 1.61181640625, 1.7041015625, 1.79638671875, 1.888671875, 1.98095703125, 2.0732421875, 2.16552734375, 2.2578125, 2.35009765625, 2.4423828125, 2.53466796875, 2.626953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 13.0, 15.0, 18.0, 32.0, 48.0, 65.0, 83.0, 122.0, 173.0, 267.0, 435.0, 698.0, 1106.0, 1843.0, 3475.0, 6632.0, 13107.0, 28071.0, 70064.0, 247232.0, 464830.0, 125851.0, 44263.0, 19315.0, 9263.0, 4871.0, 2616.0, 1538.0, 909.0, 524.0, 316.0, 238.0, 148.0, 107.0, 60.0, 58.0, 45.0, 24.0, 19.0, 13.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.6671142578125, -4.517822265625, -4.3685302734375, -4.21923828125, -4.0699462890625, -3.920654296875, -3.7713623046875, -3.6220703125, -3.4727783203125, -3.323486328125, -3.1741943359375, -3.02490234375, -2.8756103515625, -2.726318359375, -2.5770263671875, -2.427734375, -2.2784423828125, -2.129150390625, -1.9798583984375, -1.83056640625, -1.6812744140625, -1.531982421875, -1.3826904296875, -1.2333984375, -1.0841064453125, -0.934814453125, -0.7855224609375, -0.63623046875, -0.4869384765625, -0.337646484375, -0.1883544921875, -0.0390625, 0.1102294921875, 0.259521484375, 0.4088134765625, 0.55810546875, 0.7073974609375, 0.856689453125, 1.0059814453125, 1.1552734375, 1.3045654296875, 1.453857421875, 1.6031494140625, 1.75244140625, 1.9017333984375, 2.051025390625, 2.2003173828125, 2.349609375, 2.4989013671875, 2.648193359375, 2.7974853515625, 2.94677734375, 3.0960693359375, 3.245361328125, 3.3946533203125, 3.5439453125, 3.6932373046875, 3.842529296875, 3.9918212890625, 4.14111328125, 4.2904052734375, 4.439697265625, 4.5889892578125, 4.73828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 7.0, 3.0, 7.0, 12.0, 11.0, 13.0, 22.0, 25.0, 33.0, 34.0, 32.0, 46.0, 57.0, 44.0, 87.0, 158.0, 370.0, 1473.0, 151.0, 108.0, 60.0, 39.0, 28.0, 37.0, 32.0, 23.0, 21.0, 18.0, 12.0, 14.0, 14.0, 13.0, 10.0, 7.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.18896484375, -6.9326171875, -6.67626953125, -6.419921875, -6.16357421875, -5.9072265625, -5.65087890625, -5.39453125, -5.13818359375, -4.8818359375, -4.62548828125, -4.369140625, -4.11279296875, -3.8564453125, -3.60009765625, -3.34375, -3.08740234375, -2.8310546875, -2.57470703125, -2.318359375, -2.06201171875, -1.8056640625, -1.54931640625, -1.29296875, -1.03662109375, -0.7802734375, -0.52392578125, -0.267578125, -0.01123046875, 0.2451171875, 0.50146484375, 0.7578125, 1.01416015625, 1.2705078125, 1.52685546875, 1.783203125, 2.03955078125, 2.2958984375, 2.55224609375, 2.80859375, 3.06494140625, 3.3212890625, 3.57763671875, 3.833984375, 4.09033203125, 4.3466796875, 4.60302734375, 4.859375, 5.11572265625, 5.3720703125, 5.62841796875, 5.884765625, 6.14111328125, 6.3974609375, 6.65380859375, 6.91015625, 7.16650390625, 7.4228515625, 7.67919921875, 7.935546875, 8.19189453125, 8.4482421875, 8.70458984375, 8.9609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 12.0, 12.0, 9.0, 10.0, 11.0, 20.0, 34.0, 30.0, 61.0, 87.0, 121.0, 217.0, 293.0, 497.0, 1095.0, 9267.0, 2981498.0, 147223.0, 3147.0, 802.0, 429.0, 247.0, 158.0, 109.0, 86.0, 62.0, 37.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.46875, -21.783935546875, -21.09912109375, -20.414306640625, -19.7294921875, -19.044677734375, -18.35986328125, -17.675048828125, -16.990234375, -16.305419921875, -15.62060546875, -14.935791015625, -14.2509765625, -13.566162109375, -12.88134765625, -12.196533203125, -11.51171875, -10.826904296875, -10.14208984375, -9.457275390625, -8.7724609375, -8.087646484375, -7.40283203125, -6.718017578125, -6.033203125, -5.348388671875, -4.66357421875, -3.978759765625, -3.2939453125, -2.609130859375, -1.92431640625, -1.239501953125, -0.5546875, 0.130126953125, 0.81494140625, 1.499755859375, 2.1845703125, 2.869384765625, 3.55419921875, 4.239013671875, 4.923828125, 5.608642578125, 6.29345703125, 6.978271484375, 7.6630859375, 8.347900390625, 9.03271484375, 9.717529296875, 10.40234375, 11.087158203125, 11.77197265625, 12.456787109375, 13.1416015625, 13.826416015625, 14.51123046875, 15.196044921875, 15.880859375, 16.565673828125, 17.25048828125, 17.935302734375, 18.6201171875, 19.304931640625, 19.98974609375, 20.674560546875, 21.359375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 15.0, 34.0, 103.0, 142.0, 205.0, 192.0, 130.0, 88.0, 44.0, 18.0, 12.0, 3.0, 4.0], "bins": [-57.1346435546875, -56.117767333984375, -55.10089111328125, -54.08401107788086, -53.067134857177734, -52.05025863647461, -51.033382415771484, -50.01650619506836, -48.99962615966797, -47.982749938964844, -46.96587371826172, -45.94899368286133, -44.9321174621582, -43.91524124145508, -42.89836502075195, -41.88148880004883, -40.8646125793457, -39.84773635864258, -38.83086013793945, -37.81398010253906, -36.79710388183594, -35.78022766113281, -34.76335144042969, -33.74647521972656, -32.72959899902344, -31.712722778320312, -30.695844650268555, -29.67896842956543, -28.662090301513672, -27.645214080810547, -26.628337860107422, -25.611461639404297, -24.59458351135254, -23.577707290649414, -22.560829162597656, -21.54395294189453, -20.527076721191406, -19.51019859313965, -18.493322372436523, -17.476444244384766, -16.45956802368164, -15.4426908493042, -14.425813674926758, -13.408937454223633, -12.392060279846191, -11.37518310546875, -10.358306884765625, -9.341429710388184, -8.324552536010742, -7.307675361633301, -6.290798664093018, -5.273921966552734, -4.257044792175293, -3.2401676177978516, -2.2232909202575684, -1.2064142227172852, -0.18953657150268555, 0.8273403644561768, 1.844217300415039, 2.8610942363739014, 3.8779711723327637, 4.894848346710205, 5.911725044250488, 6.9286017417907715, 7.945478916168213]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 13.0, 14.0, 15.0, 19.0, 13.0, 24.0, 29.0, 26.0, 28.0, 24.0, 28.0, 37.0, 46.0, 36.0, 52.0, 39.0, 37.0, 37.0, 47.0, 41.0, 28.0, 38.0, 39.0, 34.0, 29.0, 26.0, 31.0, 19.0, 15.0, 19.0, 13.0, 17.0, 13.0, 5.0, 10.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.634201049804688, -22.898351669311523, -22.16250228881836, -21.426652908325195, -20.69080352783203, -19.9549560546875, -19.219104766845703, -18.483257293701172, -17.747407913208008, -17.011558532714844, -16.27570915222168, -15.539859771728516, -14.804011344909668, -14.068161964416504, -13.33231258392334, -12.596464157104492, -11.860613822937012, -11.124764442443848, -10.388915061950684, -9.653066635131836, -8.917217254638672, -8.181367874145508, -7.445518493652344, -6.709669589996338, -5.973820209503174, -5.23797082901001, -4.502121925354004, -3.76627254486084, -3.030423402786255, -2.29457426071167, -1.5587248802185059, -0.8228759765625, -0.08702659606933594, 0.6488226056098938, 1.3846718072891235, 2.120521068572998, 2.856370210647583, 3.592219352722168, 4.328068733215332, 5.063917636871338, 5.799767017364502, 6.535616397857666, 7.271465301513672, 8.007314682006836, 8.7431640625, 9.479013442993164, 10.214862823486328, 10.950711250305176, 11.68656063079834, 12.422410011291504, 13.158259391784668, 13.894107818603516, 14.62995719909668, 15.365806579589844, 16.101655960083008, 16.837505340576172, 17.573354721069336, 18.3092041015625, 19.045053482055664, 19.780902862548828, 20.516752243041992, 21.252601623535156, 21.988449096679688, 22.72429847717285, 23.460147857666016]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 14.0, 17.0, 17.0, 12.0, 17.0, 21.0, 25.0, 21.0, 33.0, 44.0, 42.0, 45.0, 40.0, 46.0, 55.0, 46.0, 47.0, 46.0, 50.0, 42.0, 37.0, 27.0, 36.0, 22.0, 26.0, 26.0, 18.0, 19.0, 12.0, 13.0, 20.0, 12.0, 10.0, 10.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20172119140625, -3.0909423828125, -2.98016357421875, -2.869384765625, -2.75860595703125, -2.6478271484375, -2.53704833984375, -2.42626953125, -2.31549072265625, -2.2047119140625, -2.09393310546875, -1.983154296875, -1.87237548828125, -1.7615966796875, -1.65081787109375, -1.5400390625, -1.42926025390625, -1.3184814453125, -1.20770263671875, -1.096923828125, -0.98614501953125, -0.8753662109375, -0.76458740234375, -0.65380859375, -0.54302978515625, -0.4322509765625, -0.32147216796875, -0.210693359375, -0.09991455078125, 0.0108642578125, 0.12164306640625, 0.232421875, 0.34320068359375, 0.4539794921875, 0.56475830078125, 0.675537109375, 0.78631591796875, 0.8970947265625, 1.00787353515625, 1.11865234375, 1.22943115234375, 1.3402099609375, 1.45098876953125, 1.561767578125, 1.67254638671875, 1.7833251953125, 1.89410400390625, 2.0048828125, 2.11566162109375, 2.2264404296875, 2.33721923828125, 2.447998046875, 2.55877685546875, 2.6695556640625, 2.78033447265625, 2.89111328125, 3.00189208984375, 3.1126708984375, 3.22344970703125, 3.334228515625, 3.44500732421875, 3.5557861328125, 3.66656494140625, 3.77734375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 11.0, 26.0, 26.0, 47.0, 53.0, 74.0, 117.0, 166.0, 315.0, 534.0, 1082.0, 2276.0, 5476.0, 19693.0, 511298.0, 3447242.0, 183814.0, 13588.0, 4378.0, 1870.0, 873.0, 465.0, 293.0, 166.0, 104.0, 72.0, 61.0, 36.0, 28.0, 17.0, 12.0, 12.0, 4.0, 16.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.15625, -12.8043212890625, -12.452392578125, -12.1004638671875, -11.74853515625, -11.3966064453125, -11.044677734375, -10.6927490234375, -10.3408203125, -9.9888916015625, -9.636962890625, -9.2850341796875, -8.93310546875, -8.5811767578125, -8.229248046875, -7.8773193359375, -7.525390625, -7.1734619140625, -6.821533203125, -6.4696044921875, -6.11767578125, -5.7657470703125, -5.413818359375, -5.0618896484375, -4.7099609375, -4.3580322265625, -4.006103515625, -3.6541748046875, -3.30224609375, -2.9503173828125, -2.598388671875, -2.2464599609375, -1.89453125, -1.5426025390625, -1.190673828125, -0.8387451171875, -0.48681640625, -0.1348876953125, 0.217041015625, 0.5689697265625, 0.9208984375, 1.2728271484375, 1.624755859375, 1.9766845703125, 2.32861328125, 2.6805419921875, 3.032470703125, 3.3843994140625, 3.736328125, 4.0882568359375, 4.440185546875, 4.7921142578125, 5.14404296875, 5.4959716796875, 5.847900390625, 6.1998291015625, 6.5517578125, 6.9036865234375, 7.255615234375, 7.6075439453125, 7.95947265625, 8.3114013671875, 8.663330078125, 9.0152587890625, 9.3671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 11.0, 12.0, 13.0, 25.0, 24.0, 58.0, 61.0, 77.0, 85.0, 123.0, 142.0, 208.0, 273.0, 392.0, 447.0, 487.0, 386.0, 319.0, 222.0, 171.0, 132.0, 93.0, 81.0, 62.0, 46.0, 35.0, 23.0, 13.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.06787109375, -3.9130859375, -3.75830078125, -3.603515625, -3.44873046875, -3.2939453125, -3.13916015625, -2.984375, -2.82958984375, -2.6748046875, -2.52001953125, -2.365234375, -2.21044921875, -2.0556640625, -1.90087890625, -1.74609375, -1.59130859375, -1.4365234375, -1.28173828125, -1.126953125, -0.97216796875, -0.8173828125, -0.66259765625, -0.5078125, -0.35302734375, -0.1982421875, -0.04345703125, 0.111328125, 0.26611328125, 0.4208984375, 0.57568359375, 0.73046875, 0.88525390625, 1.0400390625, 1.19482421875, 1.349609375, 1.50439453125, 1.6591796875, 1.81396484375, 1.96875, 2.12353515625, 2.2783203125, 2.43310546875, 2.587890625, 2.74267578125, 2.8974609375, 3.05224609375, 3.20703125, 3.36181640625, 3.5166015625, 3.67138671875, 3.826171875, 3.98095703125, 4.1357421875, 4.29052734375, 4.4453125, 4.60009765625, 4.7548828125, 4.90966796875, 5.064453125, 5.21923828125, 5.3740234375, 5.52880859375, 5.68359375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 12.0, 7.0, 22.0, 28.0, 48.0, 61.0, 85.0, 154.0, 246.0, 496.0, 1003.0, 2605.0, 9259.0, 86348.0, 3019085.0, 1025990.0, 38825.0, 5963.0, 1979.0, 918.0, 411.0, 266.0, 161.0, 88.0, 70.0, 42.0, 29.0, 22.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9140625, -12.5728759765625, -12.231689453125, -11.8905029296875, -11.54931640625, -11.2081298828125, -10.866943359375, -10.5257568359375, -10.1845703125, -9.8433837890625, -9.502197265625, -9.1610107421875, -8.81982421875, -8.4786376953125, -8.137451171875, -7.7962646484375, -7.455078125, -7.1138916015625, -6.772705078125, -6.4315185546875, -6.09033203125, -5.7491455078125, -5.407958984375, -5.0667724609375, -4.7255859375, -4.3843994140625, -4.043212890625, -3.7020263671875, -3.36083984375, -3.0196533203125, -2.678466796875, -2.3372802734375, -1.99609375, -1.6549072265625, -1.313720703125, -0.9725341796875, -0.63134765625, -0.2901611328125, 0.051025390625, 0.3922119140625, 0.7333984375, 1.0745849609375, 1.415771484375, 1.7569580078125, 2.09814453125, 2.4393310546875, 2.780517578125, 3.1217041015625, 3.462890625, 3.8040771484375, 4.145263671875, 4.4864501953125, 4.82763671875, 5.1688232421875, 5.510009765625, 5.8511962890625, 6.1923828125, 6.5335693359375, 6.874755859375, 7.2159423828125, 7.55712890625, 7.8983154296875, 8.239501953125, 8.5806884765625, 8.921875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 53.0, 312.0, 465.0, 137.0, 33.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.54766082763672, -120.54611206054688, -117.5445556640625, -114.54300689697266, -111.54145812988281, -108.53990173339844, -105.5383529663086, -102.53680419921875, -99.53524780273438, -96.53369903564453, -93.53214263916016, -90.53059387207031, -87.52904510498047, -84.5274887084961, -81.52593994140625, -78.52438354492188, -75.52284240722656, -72.52129364013672, -69.51973724365234, -66.5181884765625, -63.51663589477539, -60.51508331298828, -57.51353454589844, -54.51198196411133, -51.51042938232422, -48.50887680053711, -45.507328033447266, -42.505775451660156, -39.50422286987305, -36.50267028808594, -33.501121520996094, -30.499568939208984, -27.498016357421875, -24.4964656829834, -21.49491310119629, -18.493362426757812, -15.49181079864502, -12.490259170532227, -9.48870849609375, -6.487155914306641, -3.485605239868164, -0.4840538501739502, 2.5174975395202637, 5.519048690795898, 8.520600318908691, 11.522151947021484, 14.523702621459961, 17.52525520324707, 20.526805877685547, 23.528356552124023, 26.529909133911133, 29.53145980834961, 32.53301239013672, 35.53456115722656, 38.53611373901367, 41.53766632080078, 44.539215087890625, 47.540767669677734, 50.54231643676758, 53.54386901855469, 56.5454216003418, 59.546974182128906, 62.54852294921875, 65.55007934570312, 68.55162811279297]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 7.0, 15.0, 6.0, 11.0, 10.0, 17.0, 16.0, 21.0, 21.0, 34.0, 15.0, 35.0, 27.0, 28.0, 37.0, 37.0, 30.0, 39.0, 35.0, 29.0, 48.0, 43.0, 35.0, 41.0, 39.0, 30.0, 28.0, 36.0, 30.0, 25.0, 25.0, 24.0, 14.0, 15.0, 12.0, 15.0, 11.0, 12.0, 6.0, 10.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-21.14389419555664, -20.527685165405273, -19.911476135253906, -19.295265197753906, -18.67905616760254, -18.062847137451172, -17.446636199951172, -16.830427169799805, -16.214218139648438, -15.59800910949707, -14.981799125671387, -14.365589141845703, -13.749380111694336, -13.133171081542969, -12.516961097717285, -11.900751113891602, -11.284542083740234, -10.668333053588867, -10.052123069763184, -9.4359130859375, -8.819704055786133, -8.203495025634766, -7.587285041809082, -6.971075534820557, -6.354866027832031, -5.738656520843506, -5.1224470138549805, -4.506237506866455, -3.8900279998779297, -3.2738184928894043, -2.657608985900879, -2.0413994789123535, -1.4251899719238281, -0.8089804649353027, -0.19277095794677734, 0.42343854904174805, 1.0396480560302734, 1.6558575630187988, 2.272067070007324, 2.8882765769958496, 3.504486083984375, 4.1206955909729, 4.736905097961426, 5.353114604949951, 5.969324111938477, 6.585533618927002, 7.201743125915527, 7.817952632904053, 8.434162139892578, 9.050371170043945, 9.666581153869629, 10.282791137695312, 10.89900016784668, 11.515209197998047, 12.13141918182373, 12.747629165649414, 13.363838195800781, 13.980047225952148, 14.596257209777832, 15.212467193603516, 15.828676223754883, 16.44488525390625, 17.06109619140625, 17.677305221557617, 18.293514251708984]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 5.0, 8.0, 13.0, 17.0, 18.0, 23.0, 23.0, 32.0, 38.0, 28.0, 33.0, 49.0, 59.0, 43.0, 59.0, 57.0, 50.0, 54.0, 50.0, 45.0, 39.0, 38.0, 48.0, 24.0, 29.0, 23.0, 18.0, 19.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.099884033203125, -2.99859619140625, -2.897308349609375, -2.7960205078125, -2.694732666015625, -2.59344482421875, -2.492156982421875, -2.390869140625, -2.289581298828125, -2.18829345703125, -2.087005615234375, -1.9857177734375, -1.884429931640625, -1.78314208984375, -1.681854248046875, -1.58056640625, -1.479278564453125, -1.37799072265625, -1.276702880859375, -1.1754150390625, -1.074127197265625, -0.97283935546875, -0.871551513671875, -0.770263671875, -0.668975830078125, -0.56768798828125, -0.466400146484375, -0.3651123046875, -0.263824462890625, -0.16253662109375, -0.061248779296875, 0.0400390625, 0.141326904296875, 0.24261474609375, 0.343902587890625, 0.4451904296875, 0.546478271484375, 0.64776611328125, 0.749053955078125, 0.850341796875, 0.951629638671875, 1.05291748046875, 1.154205322265625, 1.2554931640625, 1.356781005859375, 1.45806884765625, 1.559356689453125, 1.66064453125, 1.761932373046875, 1.86322021484375, 1.964508056640625, 2.0657958984375, 2.167083740234375, 2.26837158203125, 2.369659423828125, 2.470947265625, 2.572235107421875, 2.67352294921875, 2.774810791015625, 2.8760986328125, 2.977386474609375, 3.07867431640625, 3.179962158203125, 3.28125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 10.0, 5.0, 8.0, 17.0, 11.0, 27.0, 60.0, 84.0, 116.0, 192.0, 277.0, 411.0, 639.0, 1125.0, 1806.0, 3001.0, 5433.0, 9860.0, 19505.0, 43727.0, 122384.0, 402828.0, 284987.0, 84734.0, 32958.0, 15175.0, 8073.0, 4439.0, 2553.0, 1571.0, 910.0, 554.0, 399.0, 247.0, 148.0, 90.0, 63.0, 35.0, 34.0, 13.0, 19.0, 7.0, 9.0, 9.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7116470336914062, -0.6869659423828125, -0.6622848510742188, -0.637603759765625, -0.6129226684570312, -0.5882415771484375, -0.5635604858398438, -0.53887939453125, -0.5141983032226562, -0.4895172119140625, -0.46483612060546875, -0.440155029296875, -0.41547393798828125, -0.3907928466796875, -0.36611175537109375, -0.3414306640625, -0.31674957275390625, -0.2920684814453125, -0.26738739013671875, -0.242706298828125, -0.21802520751953125, -0.1933441162109375, -0.16866302490234375, -0.14398193359375, -0.11930084228515625, -0.0946197509765625, -0.06993865966796875, -0.045257568359375, -0.02057647705078125, 0.0041046142578125, 0.02878570556640625, 0.053466796875, 0.07814788818359375, 0.1028289794921875, 0.12751007080078125, 0.152191162109375, 0.17687225341796875, 0.2015533447265625, 0.22623443603515625, 0.25091552734375, 0.27559661865234375, 0.3002777099609375, 0.32495880126953125, 0.349639892578125, 0.37432098388671875, 0.3990020751953125, 0.42368316650390625, 0.4483642578125, 0.47304534912109375, 0.4977264404296875, 0.5224075317382812, 0.547088623046875, 0.5717697143554688, 0.5964508056640625, 0.6211318969726562, 0.64581298828125, 0.6704940795898438, 0.6951751708984375, 0.7198562622070312, 0.744537353515625, 0.7692184448242188, 0.7938995361328125, 0.8185806274414062, 0.84326171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 18.0, 16.0, 17.0, 16.0, 12.0, 12.0, 19.0, 31.0, 33.0, 44.0, 51.0, 30.0, 41.0, 39.0, 52.0, 49.0, 1070.0, 38.0, 50.0, 47.0, 31.0, 38.0, 36.0, 32.0, 29.0, 30.0, 22.0, 27.0, 18.0, 7.0, 17.0, 11.0, 6.0, 6.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.33984375, -2.2772064208984375, -2.214569091796875, -2.1519317626953125, -2.08929443359375, -2.0266571044921875, -1.964019775390625, -1.9013824462890625, -1.8387451171875, -1.7761077880859375, -1.713470458984375, -1.6508331298828125, -1.58819580078125, -1.5255584716796875, -1.462921142578125, -1.4002838134765625, -1.337646484375, -1.2750091552734375, -1.212371826171875, -1.1497344970703125, -1.08709716796875, -1.0244598388671875, -0.961822509765625, -0.8991851806640625, -0.8365478515625, -0.7739105224609375, -0.711273193359375, -0.6486358642578125, -0.58599853515625, -0.5233612060546875, -0.460723876953125, -0.3980865478515625, -0.33544921875, -0.2728118896484375, -0.210174560546875, -0.1475372314453125, -0.08489990234375, -0.0222625732421875, 0.040374755859375, 0.1030120849609375, 0.1656494140625, 0.2282867431640625, 0.290924072265625, 0.3535614013671875, 0.41619873046875, 0.4788360595703125, 0.541473388671875, 0.6041107177734375, 0.666748046875, 0.7293853759765625, 0.792022705078125, 0.8546600341796875, 0.91729736328125, 0.9799346923828125, 1.042572021484375, 1.1052093505859375, 1.1678466796875, 1.2304840087890625, 1.293121337890625, 1.3557586669921875, 1.41839599609375, 1.4810333251953125, 1.543670654296875, 1.6063079833984375, 1.6689453125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 13.0, 9.0, 22.0, 33.0, 47.0, 69.0, 107.0, 144.0, 198.0, 283.0, 424.0, 630.0, 983.0, 1711.0, 3000.0, 5655.0, 12262.0, 30611.0, 100832.0, 623720.0, 1128978.0, 122917.0, 35879.0, 13728.0, 6422.0, 3326.0, 1815.0, 1153.0, 738.0, 429.0, 294.0, 203.0, 159.0, 76.0, 62.0, 43.0, 37.0, 28.0, 25.0, 13.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5236740112304688, -0.5068206787109375, -0.48996734619140625, -0.473114013671875, -0.45626068115234375, -0.4394073486328125, -0.42255401611328125, -0.40570068359375, -0.38884735107421875, -0.3719940185546875, -0.35514068603515625, -0.338287353515625, -0.32143402099609375, -0.3045806884765625, -0.28772735595703125, -0.2708740234375, -0.25402069091796875, -0.2371673583984375, -0.22031402587890625, -0.203460693359375, -0.18660736083984375, -0.1697540283203125, -0.15290069580078125, -0.13604736328125, -0.11919403076171875, -0.1023406982421875, -0.08548736572265625, -0.068634033203125, -0.05178070068359375, -0.0349273681640625, -0.01807403564453125, -0.001220703125, 0.01563262939453125, 0.0324859619140625, 0.04933929443359375, 0.066192626953125, 0.08304595947265625, 0.0998992919921875, 0.11675262451171875, 0.13360595703125, 0.15045928955078125, 0.1673126220703125, 0.18416595458984375, 0.201019287109375, 0.21787261962890625, 0.2347259521484375, 0.25157928466796875, 0.2684326171875, 0.28528594970703125, 0.3021392822265625, 0.31899261474609375, 0.335845947265625, 0.35269927978515625, 0.3695526123046875, 0.38640594482421875, 0.40325927734375, 0.42011260986328125, 0.4369659423828125, 0.45381927490234375, 0.470672607421875, 0.48752593994140625, 0.5043792724609375, 0.5212326049804688, 0.5380859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 15.0, 16.0, 15.0, 10.0, 22.0, 21.0, 37.0, 41.0, 90.0, 161.0, 186.0, 139.0, 55.0, 30.0, 21.0, 27.0, 18.0, 15.0, 16.0, 10.0, 8.0, 7.0, 1.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08339881896972656, -0.08110427856445312, -0.07880973815917969, -0.07651519775390625, -0.07422065734863281, -0.07192611694335938, -0.06963157653808594, -0.0673370361328125, -0.06504249572753906, -0.06274795532226562, -0.06045341491699219, -0.05815887451171875, -0.05586433410644531, -0.053569793701171875, -0.05127525329589844, -0.048980712890625, -0.04668617248535156, -0.044391632080078125, -0.04209709167480469, -0.03980255126953125, -0.03750801086425781, -0.035213470458984375, -0.03291893005371094, -0.0306243896484375, -0.028329849243164062, -0.026035308837890625, -0.023740768432617188, -0.02144622802734375, -0.019151687622070312, -0.016857147216796875, -0.014562606811523438, -0.01226806640625, -0.009973526000976562, -0.007678985595703125, -0.0053844451904296875, -0.00308990478515625, -0.0007953643798828125, 0.001499176025390625, 0.0037937164306640625, 0.0060882568359375, 0.008382797241210938, 0.010677337646484375, 0.012971878051757812, 0.01526641845703125, 0.017560958862304688, 0.019855499267578125, 0.022150039672851562, 0.024444580078125, 0.026739120483398438, 0.029033660888671875, 0.03132820129394531, 0.03362274169921875, 0.03591728210449219, 0.038211822509765625, 0.04050636291503906, 0.0428009033203125, 0.04509544372558594, 0.047389984130859375, 0.04968452453613281, 0.05197906494140625, 0.05427360534667969, 0.056568145751953125, 0.05886268615722656, 0.0611572265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 6.0, 11.0, 8.0, 14.0, 26.0, 26.0, 29.0, 48.0, 55.0, 74.0, 126.0, 212.0, 422.0, 2074.0, 1021993.0, 21895.0, 692.0, 274.0, 184.0, 86.0, 56.0, 48.0, 44.0, 40.0, 21.0, 17.0, 13.0, 12.0, 7.0, 7.0, 4.0, 6.0, 8.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1769256591796875, -1.131195068359375, -1.0854644775390625, -1.03973388671875, -0.9940032958984375, -0.948272705078125, -0.9025421142578125, -0.8568115234375, -0.8110809326171875, -0.765350341796875, -0.7196197509765625, -0.67388916015625, -0.6281585693359375, -0.582427978515625, -0.5366973876953125, -0.490966796875, -0.4452362060546875, -0.399505615234375, -0.3537750244140625, -0.30804443359375, -0.2623138427734375, -0.216583251953125, -0.1708526611328125, -0.1251220703125, -0.0793914794921875, -0.033660888671875, 0.0120697021484375, 0.05780029296875, 0.1035308837890625, 0.149261474609375, 0.1949920654296875, 0.24072265625, 0.2864532470703125, 0.332183837890625, 0.3779144287109375, 0.42364501953125, 0.4693756103515625, 0.515106201171875, 0.5608367919921875, 0.6065673828125, 0.6522979736328125, 0.698028564453125, 0.7437591552734375, 0.78948974609375, 0.8352203369140625, 0.880950927734375, 0.9266815185546875, 0.972412109375, 1.0181427001953125, 1.063873291015625, 1.1096038818359375, 1.15533447265625, 1.2010650634765625, 1.246795654296875, 1.2925262451171875, 1.3382568359375, 1.3839874267578125, 1.429718017578125, 1.4754486083984375, 1.52117919921875, 1.5669097900390625, 1.612640380859375, 1.6583709716796875, 1.7041015625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 48.0, 716.0, 239.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27755460143089294, -0.2641831934452057, -0.25081175565719604, -0.2374403476715088, -0.22406893968582153, -0.21069751679897308, -0.19732609391212463, -0.18395468592643738, -0.17058326303958893, -0.15721184015274048, -0.14384043216705322, -0.13046900928020477, -0.11709759384393692, -0.10372617840766907, -0.09035475552082062, -0.07698334008455276, -0.06361192464828491, -0.05024050921201706, -0.03686909005045891, -0.023497670888900757, -0.010126255452632904, 0.0032451599836349487, 0.0166165828704834, 0.02998799830675125, 0.043359413743019104, 0.05673082917928696, 0.07010224461555481, 0.08347366750240326, 0.09684508293867111, 0.11021649837493896, 0.12358792126178741, 0.13695934414863586, 0.15033072233200073, 0.16370214521884918, 0.17707355320453644, 0.1904449760913849, 0.20381638407707214, 0.2171878069639206, 0.23055922985076904, 0.2439306378364563, 0.25730204582214355, 0.2706734538078308, 0.28404489159584045, 0.2974162995815277, 0.31078770756721497, 0.3241591453552246, 0.33753055334091187, 0.3509019613265991, 0.36427339911460876, 0.377644807100296, 0.39101624488830566, 0.4043876528739929, 0.4177590608596802, 0.43113046884536743, 0.4445019066333771, 0.45787331461906433, 0.471244752407074, 0.48461616039276123, 0.4979875981807709, 0.5113589763641357, 0.5247304439544678, 0.538101851940155, 0.5514732599258423, 0.5648446679115295, 0.5782160758972168]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 11.0, 24.0, 19.0, 19.0, 25.0, 28.0, 31.0, 34.0, 32.0, 34.0, 38.0, 41.0, 39.0, 60.0, 45.0, 47.0, 48.0, 41.0, 37.0, 34.0, 44.0, 28.0, 29.0, 21.0, 20.0, 25.0, 20.0, 13.0, 13.0, 15.0, 16.0, 8.0, 4.0, 10.0, 6.0, 7.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-0.09314745664596558, -0.09059496223926544, -0.0880424752831459, -0.08548998087644577, -0.08293749392032623, -0.0803849995136261, -0.07783250510692596, -0.07528001070022583, -0.07272752374410629, -0.07017502933740616, -0.06762254238128662, -0.06507004797458649, -0.06251755356788635, -0.059965066611766815, -0.05741257220506668, -0.054860081523656845, -0.05230759084224701, -0.04975510016083717, -0.04720260947942734, -0.0446501150727272, -0.04209762439131737, -0.03954513370990753, -0.0369926393032074, -0.03444014862179756, -0.031887657940387726, -0.02933516725897789, -0.026782674714922905, -0.02423018217086792, -0.021677691489458084, -0.01912520080804825, -0.016572708263993263, -0.014020215719938278, -0.011467725038528442, -0.008915233425796032, -0.0063627418130636215, -0.003810250200331211, -0.0012577585875988007, 0.0012947330251336098, 0.00384722463786602, 0.006399717181921005, 0.008952207863330841, 0.011504699476063251, 0.014057191088795662, 0.016609683632850647, 0.019162174314260483, 0.02171466499567032, 0.024267157539725304, 0.02681965008378029, 0.029372140765190125, 0.03192463144659996, 0.034477122128009796, 0.03702961653470993, 0.039582107216119766, 0.0421345978975296, 0.044687092304229736, 0.04723958298563957, 0.04979207366704941, 0.052344564348459244, 0.05489705502986908, 0.057449549436569214, 0.06000204011797905, 0.06255453079938889, 0.06510702520608902, 0.06765951216220856, 0.07021200656890869]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 11.0, 8.0, 15.0, 17.0, 14.0, 17.0, 30.0, 21.0, 27.0, 32.0, 38.0, 42.0, 38.0, 51.0, 50.0, 60.0, 56.0, 53.0, 53.0, 39.0, 48.0, 39.0, 45.0, 39.0, 27.0, 25.0, 23.0, 15.0, 12.0, 15.0, 10.0, 11.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.443359375, -3.34259033203125, -3.2418212890625, -3.14105224609375, -3.040283203125, -2.93951416015625, -2.8387451171875, -2.73797607421875, -2.63720703125, -2.53643798828125, -2.4356689453125, -2.33489990234375, -2.234130859375, -2.13336181640625, -2.0325927734375, -1.93182373046875, -1.8310546875, -1.73028564453125, -1.6295166015625, -1.52874755859375, -1.427978515625, -1.32720947265625, -1.2264404296875, -1.12567138671875, -1.02490234375, -0.92413330078125, -0.8233642578125, -0.72259521484375, -0.621826171875, -0.52105712890625, -0.4202880859375, -0.31951904296875, -0.21875, -0.11798095703125, -0.0172119140625, 0.08355712890625, 0.184326171875, 0.28509521484375, 0.3858642578125, 0.48663330078125, 0.58740234375, 0.68817138671875, 0.7889404296875, 0.88970947265625, 0.990478515625, 1.09124755859375, 1.1920166015625, 1.29278564453125, 1.3935546875, 1.49432373046875, 1.5950927734375, 1.69586181640625, 1.796630859375, 1.89739990234375, 1.9981689453125, 2.09893798828125, 2.19970703125, 2.30047607421875, 2.4012451171875, 2.50201416015625, 2.602783203125, 2.70355224609375, 2.8043212890625, 2.90509033203125, 3.005859375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 9.0, 6.0, 8.0, 14.0, 18.0, 33.0, 41.0, 69.0, 78.0, 95.0, 167.0, 250.0, 374.0, 569.0, 905.0, 1574.0, 2725.0, 5337.0, 11255.0, 27577.0, 83778.0, 291965.0, 411097.0, 137682.0, 41363.0, 15774.0, 7082.0, 3625.0, 1993.0, 1104.0, 688.0, 433.0, 253.0, 182.0, 134.0, 85.0, 64.0, 34.0, 33.0, 27.0, 19.0, 6.0, 13.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.056640625, -2.967254638671875, -2.87786865234375, -2.788482666015625, -2.6990966796875, -2.609710693359375, -2.52032470703125, -2.430938720703125, -2.341552734375, -2.252166748046875, -2.16278076171875, -2.073394775390625, -1.9840087890625, -1.894622802734375, -1.80523681640625, -1.715850830078125, -1.62646484375, -1.537078857421875, -1.44769287109375, -1.358306884765625, -1.2689208984375, -1.179534912109375, -1.09014892578125, -1.000762939453125, -0.911376953125, -0.821990966796875, -0.73260498046875, -0.643218994140625, -0.5538330078125, -0.464447021484375, -0.37506103515625, -0.285675048828125, -0.1962890625, -0.106903076171875, -0.01751708984375, 0.071868896484375, 0.1612548828125, 0.250640869140625, 0.34002685546875, 0.429412841796875, 0.518798828125, 0.608184814453125, 0.69757080078125, 0.786956787109375, 0.8763427734375, 0.965728759765625, 1.05511474609375, 1.144500732421875, 1.23388671875, 1.323272705078125, 1.41265869140625, 1.502044677734375, 1.5914306640625, 1.680816650390625, 1.77020263671875, 1.859588623046875, 1.948974609375, 2.038360595703125, 2.12774658203125, 2.217132568359375, 2.3065185546875, 2.395904541015625, 2.48529052734375, 2.574676513671875, 2.6640625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 12.0, 17.0, 19.0, 18.0, 23.0, 22.0, 25.0, 35.0, 30.0, 50.0, 70.0, 65.0, 151.0, 342.0, 1516.0, 173.0, 88.0, 59.0, 47.0, 44.0, 38.0, 31.0, 25.0, 30.0, 20.0, 17.0, 20.0, 8.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.81170654296875, -7.5609130859375, -7.31011962890625, -7.059326171875, -6.80853271484375, -6.5577392578125, -6.30694580078125, -6.05615234375, -5.80535888671875, -5.5545654296875, -5.30377197265625, -5.052978515625, -4.80218505859375, -4.5513916015625, -4.30059814453125, -4.0498046875, -3.79901123046875, -3.5482177734375, -3.29742431640625, -3.046630859375, -2.79583740234375, -2.5450439453125, -2.29425048828125, -2.04345703125, -1.79266357421875, -1.5418701171875, -1.29107666015625, -1.040283203125, -0.78948974609375, -0.5386962890625, -0.28790283203125, -0.037109375, 0.21368408203125, 0.4644775390625, 0.71527099609375, 0.966064453125, 1.21685791015625, 1.4676513671875, 1.71844482421875, 1.96923828125, 2.22003173828125, 2.4708251953125, 2.72161865234375, 2.972412109375, 3.22320556640625, 3.4739990234375, 3.72479248046875, 3.9755859375, 4.22637939453125, 4.4771728515625, 4.72796630859375, 4.978759765625, 5.22955322265625, 5.4803466796875, 5.73114013671875, 5.98193359375, 6.23272705078125, 6.4835205078125, 6.73431396484375, 6.985107421875, 7.23590087890625, 7.4866943359375, 7.73748779296875, 7.98828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 7.0, 8.0, 9.0, 14.0, 17.0, 33.0, 32.0, 33.0, 61.0, 83.0, 95.0, 192.0, 281.0, 517.0, 1243.0, 49335.0, 3087497.0, 4384.0, 786.0, 393.0, 213.0, 133.0, 96.0, 60.0, 39.0, 36.0, 31.0, 20.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.671142578125, -16.17041015625, -15.669677734375, -15.1689453125, -14.668212890625, -14.16748046875, -13.666748046875, -13.166015625, -12.665283203125, -12.16455078125, -11.663818359375, -11.1630859375, -10.662353515625, -10.16162109375, -9.660888671875, -9.16015625, -8.659423828125, -8.15869140625, -7.657958984375, -7.1572265625, -6.656494140625, -6.15576171875, -5.655029296875, -5.154296875, -4.653564453125, -4.15283203125, -3.652099609375, -3.1513671875, -2.650634765625, -2.14990234375, -1.649169921875, -1.1484375, -0.647705078125, -0.14697265625, 0.353759765625, 0.8544921875, 1.355224609375, 1.85595703125, 2.356689453125, 2.857421875, 3.358154296875, 3.85888671875, 4.359619140625, 4.8603515625, 5.361083984375, 5.86181640625, 6.362548828125, 6.86328125, 7.364013671875, 7.86474609375, 8.365478515625, 8.8662109375, 9.366943359375, 9.86767578125, 10.368408203125, 10.869140625, 11.369873046875, 11.87060546875, 12.371337890625, 12.8720703125, 13.372802734375, 13.87353515625, 14.374267578125, 14.875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 88.0, 791.0, 132.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.147857666015625, -21.607765197753906, -19.06767463684082, -16.5275821685791, -13.9874906539917, -11.447399139404297, -8.907306671142578, -6.367216110229492, -3.8271236419677734, -1.287031888961792, 1.2530598640441895, 3.79315185546875, 6.333243370056152, 8.873334884643555, 11.413427352905273, 13.95351791381836, 16.493610382080078, 19.033702850341797, 21.573793411254883, 24.1138858795166, 26.653976440429688, 29.194068908691406, 31.734161376953125, 34.274253845214844, 36.81434631347656, 39.35443878173828, 41.89453125, 44.43462371826172, 46.97471237182617, 49.51480484008789, 52.05489730834961, 54.59498596191406, 57.13507843017578, 59.6751708984375, 62.21526336669922, 64.75535583496094, 67.29544830322266, 69.83554077148438, 72.37562561035156, 74.91571807861328, 77.455810546875, 79.99590301513672, 82.53599548339844, 85.07608795166016, 87.61618041992188, 90.15626525878906, 92.69636535644531, 95.2364501953125, 97.77655029296875, 100.31664276123047, 102.85673522949219, 105.3968276977539, 107.93692016601562, 110.47700500488281, 113.01710510253906, 115.55718994140625, 118.09728240966797, 120.63737487792969, 123.1774673461914, 125.71755981445312, 128.2576446533203, 130.79774475097656, 133.33782958984375, 135.8779296875, 138.4180145263672]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 5.0, 3.0, 5.0, 21.0, 10.0, 7.0, 16.0, 32.0, 20.0, 24.0, 34.0, 34.0, 40.0, 41.0, 44.0, 57.0, 45.0, 48.0, 32.0, 56.0, 46.0, 42.0, 42.0, 42.0, 37.0, 39.0, 31.0, 22.0, 22.0, 21.0, 15.0, 13.0, 9.0, 9.0, 7.0, 4.0, 8.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.396127700805664, -14.830148696899414, -14.264169692993164, -13.698189735412598, -13.132210731506348, -12.566231727600098, -12.000251770019531, -11.434272766113281, -10.868293762207031, -10.302314758300781, -9.736335754394531, -9.170355796813965, -8.604376792907715, -8.038397789001465, -7.472418308258057, -6.906438827514648, -6.340459823608398, -5.774480819702148, -5.20850133895874, -4.642521858215332, -4.076542854309082, -3.510563611984253, -2.944584369659424, -2.3786051273345947, -1.8126258850097656, -1.2466466426849365, -0.6806674003601074, -0.11468815803527832, 0.4512910842895508, 1.0172703266143799, 1.583249568939209, 2.149228811264038, 2.7152099609375, 3.281189203262329, 3.847168445587158, 4.413147926330566, 4.979126930236816, 5.545105934143066, 6.111085414886475, 6.677064895629883, 7.243043899536133, 7.809022903442383, 8.375001907348633, 8.9409818649292, 9.50696086883545, 10.0729398727417, 10.638919830322266, 11.204898834228516, 11.770877838134766, 12.336856842041016, 12.902835845947266, 13.468815803527832, 14.034794807434082, 14.600773811340332, 15.166753768920898, 15.732732772827148, 16.2987117767334, 16.86469078063965, 17.4306697845459, 17.99664878845215, 18.56262969970703, 19.12860870361328, 19.69458770751953, 20.26056671142578, 20.82654571533203]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 18.0, 15.0, 14.0, 20.0, 22.0, 30.0, 31.0, 46.0, 37.0, 35.0, 34.0, 53.0, 51.0, 47.0, 36.0, 31.0, 52.0, 34.0, 34.0, 47.0, 39.0, 36.0, 28.0, 30.0, 28.0, 19.0, 19.0, 13.0, 12.0, 15.0, 12.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.12890625, -3.03179931640625, -2.9346923828125, -2.83758544921875, -2.740478515625, -2.64337158203125, -2.5462646484375, -2.44915771484375, -2.35205078125, -2.25494384765625, -2.1578369140625, -2.06072998046875, -1.963623046875, -1.86651611328125, -1.7694091796875, -1.67230224609375, -1.5751953125, -1.47808837890625, -1.3809814453125, -1.28387451171875, -1.186767578125, -1.08966064453125, -0.9925537109375, -0.89544677734375, -0.79833984375, -0.70123291015625, -0.6041259765625, -0.50701904296875, -0.409912109375, -0.31280517578125, -0.2156982421875, -0.11859130859375, -0.021484375, 0.07562255859375, 0.1727294921875, 0.26983642578125, 0.366943359375, 0.46405029296875, 0.5611572265625, 0.65826416015625, 0.75537109375, 0.85247802734375, 0.9495849609375, 1.04669189453125, 1.143798828125, 1.24090576171875, 1.3380126953125, 1.43511962890625, 1.5322265625, 1.62933349609375, 1.7264404296875, 1.82354736328125, 1.920654296875, 2.01776123046875, 2.1148681640625, 2.21197509765625, 2.30908203125, 2.40618896484375, 2.5032958984375, 2.60040283203125, 2.697509765625, 2.79461669921875, 2.8917236328125, 2.98883056640625, 3.0859375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 5.0, 7.0, 19.0, 22.0, 26.0, 40.0, 50.0, 74.0, 98.0, 113.0, 173.0, 213.0, 292.0, 366.0, 518.0, 841.0, 1391.0, 3111.0, 8229.0, 33605.0, 969166.0, 3073720.0, 79142.0, 13253.0, 4460.0, 1955.0, 1020.0, 658.0, 450.0, 332.0, 235.0, 165.0, 139.0, 100.0, 60.0, 65.0, 39.0, 35.0, 24.0, 14.0, 9.0, 14.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.375, -13.928466796875, -13.48193359375, -13.035400390625, -12.5888671875, -12.142333984375, -11.69580078125, -11.249267578125, -10.802734375, -10.356201171875, -9.90966796875, -9.463134765625, -9.0166015625, -8.570068359375, -8.12353515625, -7.677001953125, -7.23046875, -6.783935546875, -6.33740234375, -5.890869140625, -5.4443359375, -4.997802734375, -4.55126953125, -4.104736328125, -3.658203125, -3.211669921875, -2.76513671875, -2.318603515625, -1.8720703125, -1.425537109375, -0.97900390625, -0.532470703125, -0.0859375, 0.360595703125, 0.80712890625, 1.253662109375, 1.7001953125, 2.146728515625, 2.59326171875, 3.039794921875, 3.486328125, 3.932861328125, 4.37939453125, 4.825927734375, 5.2724609375, 5.718994140625, 6.16552734375, 6.612060546875, 7.05859375, 7.505126953125, 7.95166015625, 8.398193359375, 8.8447265625, 9.291259765625, 9.73779296875, 10.184326171875, 10.630859375, 11.077392578125, 11.52392578125, 11.970458984375, 12.4169921875, 12.863525390625, 13.31005859375, 13.756591796875, 14.203125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 9.0, 11.0, 21.0, 13.0, 31.0, 46.0, 74.0, 143.0, 195.0, 335.0, 581.0, 730.0, 683.0, 442.0, 286.0, 160.0, 112.0, 59.0, 41.0, 31.0, 23.0, 16.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.08966064453125, -5.8629150390625, -5.63616943359375, -5.409423828125, -5.18267822265625, -4.9559326171875, -4.72918701171875, -4.50244140625, -4.27569580078125, -4.0489501953125, -3.82220458984375, -3.595458984375, -3.36871337890625, -3.1419677734375, -2.91522216796875, -2.6884765625, -2.46173095703125, -2.2349853515625, -2.00823974609375, -1.781494140625, -1.55474853515625, -1.3280029296875, -1.10125732421875, -0.87451171875, -0.64776611328125, -0.4210205078125, -0.19427490234375, 0.032470703125, 0.25921630859375, 0.4859619140625, 0.71270751953125, 0.939453125, 1.16619873046875, 1.3929443359375, 1.61968994140625, 1.846435546875, 2.07318115234375, 2.2999267578125, 2.52667236328125, 2.75341796875, 2.98016357421875, 3.2069091796875, 3.43365478515625, 3.660400390625, 3.88714599609375, 4.1138916015625, 4.34063720703125, 4.5673828125, 4.79412841796875, 5.0208740234375, 5.24761962890625, 5.474365234375, 5.70111083984375, 5.9278564453125, 6.15460205078125, 6.38134765625, 6.60809326171875, 6.8348388671875, 7.06158447265625, 7.288330078125, 7.51507568359375, 7.7418212890625, 7.96856689453125, 8.1953125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 26.0, 34.0, 97.0, 227.0, 639.0, 2397.0, 12262.0, 136039.0, 3671862.0, 345138.0, 20665.0, 3483.0, 886.0, 284.0, 121.0, 59.0, 16.0, 12.0, 5.0, 4.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.3397216796875, -13.937255859375, -13.5347900390625, -13.13232421875, -12.7298583984375, -12.327392578125, -11.9249267578125, -11.5224609375, -11.1199951171875, -10.717529296875, -10.3150634765625, -9.91259765625, -9.5101318359375, -9.107666015625, -8.7052001953125, -8.302734375, -7.9002685546875, -7.497802734375, -7.0953369140625, -6.69287109375, -6.2904052734375, -5.887939453125, -5.4854736328125, -5.0830078125, -4.6805419921875, -4.278076171875, -3.8756103515625, -3.47314453125, -3.0706787109375, -2.668212890625, -2.2657470703125, -1.86328125, -1.4608154296875, -1.058349609375, -0.6558837890625, -0.25341796875, 0.1490478515625, 0.551513671875, 0.9539794921875, 1.3564453125, 1.7589111328125, 2.161376953125, 2.5638427734375, 2.96630859375, 3.3687744140625, 3.771240234375, 4.1737060546875, 4.576171875, 4.9786376953125, 5.381103515625, 5.7835693359375, 6.18603515625, 6.5885009765625, 6.990966796875, 7.3934326171875, 7.7958984375, 8.1983642578125, 8.600830078125, 9.0032958984375, 9.40576171875, 9.8082275390625, 10.210693359375, 10.6131591796875, 11.015625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 3.0, 14.0, 20.0, 41.0, 64.0, 88.0, 95.0, 96.0, 124.0, 106.0, 105.0, 82.0, 48.0, 29.0, 33.0, 14.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.936784744262695, -19.583702087402344, -18.230619430541992, -16.87753677368164, -15.524456024169922, -14.17137336730957, -12.818290710449219, -11.465209007263184, -10.112126350402832, -8.75904369354248, -7.405961990356445, -6.052879333496094, -4.6997971534729, -3.346714973449707, -1.9936323165893555, -0.6405506134033203, 0.7125320434570312, 2.0656142234802246, 3.418696641921997, 4.7717790603637695, 6.124861240386963, 7.477943420410156, 8.831026077270508, 10.184107780456543, 11.537190437316895, 12.890273094177246, 14.243354797363281, 15.596437454223633, 16.949520111083984, 18.302600860595703, 19.655685424804688, 21.008766174316406, 22.36185073852539, 23.714933395385742, 25.068016052246094, 26.421096801757812, 27.774179458618164, 29.127262115478516, 30.480344772338867, 31.83342742919922, 33.18650817871094, 34.539588928222656, 35.89267349243164, 37.24575424194336, 38.598838806152344, 39.95191955566406, 41.30500030517578, 42.658084869384766, 44.01116943359375, 45.36425018310547, 46.71733474731445, 48.07041549682617, 49.423500061035156, 50.776580810546875, 52.129661560058594, 53.48274612426758, 54.8358268737793, 56.188907623291016, 57.5419921875, 58.89507293701172, 60.2481575012207, 61.60123825073242, 62.954322814941406, 64.30740356445312, 65.66048431396484]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 11.0, 12.0, 16.0, 17.0, 13.0, 26.0, 16.0, 27.0, 31.0, 34.0, 37.0, 47.0, 41.0, 44.0, 43.0, 43.0, 55.0, 34.0, 48.0, 33.0, 34.0, 40.0, 29.0, 31.0, 37.0, 34.0, 22.0, 16.0, 23.0, 10.0, 10.0, 12.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.79792594909668, -19.13520050048828, -18.47247314453125, -17.80974578857422, -17.14702033996582, -16.484294891357422, -15.82156753540039, -15.158841133117676, -14.496114730834961, -13.833388328552246, -13.170661926269531, -12.507935523986816, -11.845209121704102, -11.182482719421387, -10.519756317138672, -9.857029914855957, -9.194303512573242, -8.531577110290527, -7.8688507080078125, -7.206124305725098, -6.543397903442383, -5.880671501159668, -5.217945098876953, -4.555218696594238, -3.8924922943115234, -3.2297658920288086, -2.5670394897460938, -1.904313087463379, -1.241586685180664, -0.5788602828979492, 0.08386611938476562, 0.7465925216674805, 1.4093189239501953, 2.07204532623291, 2.734771728515625, 3.39749813079834, 4.060224533081055, 4.7229509353637695, 5.385677337646484, 6.048403739929199, 6.711130142211914, 7.373856544494629, 8.036582946777344, 8.699309349060059, 9.362035751342773, 10.024762153625488, 10.687488555908203, 11.350214958190918, 12.012941360473633, 12.675667762756348, 13.338394165039062, 14.001120567321777, 14.663846969604492, 15.326573371887207, 15.989299774169922, 16.652027130126953, 17.31475257873535, 17.97747802734375, 18.64020538330078, 19.302932739257812, 19.96565818786621, 20.62838363647461, 21.29111099243164, 21.953838348388672, 22.61656379699707]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 10.0, 22.0, 20.0, 20.0, 25.0, 26.0, 34.0, 40.0, 29.0, 41.0, 43.0, 51.0, 49.0, 60.0, 56.0, 58.0, 48.0, 43.0, 33.0, 43.0, 33.0, 34.0, 27.0, 21.0, 20.0, 15.0, 18.0, 13.0, 8.0, 9.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.81884765625, -45.2001953125, -43.58154296875, -41.962890625, -40.34423828125, -38.7255859375, -37.10693359375, -35.48828125, -33.86962890625, -32.2509765625, -30.63232421875, -29.013671875, -27.39501953125, -25.7763671875, -24.15771484375, -22.5390625, -20.92041015625, -19.3017578125, -17.68310546875, -16.064453125, -14.44580078125, -12.8271484375, -11.20849609375, -9.58984375, -7.97119140625, -6.3525390625, -4.73388671875, -3.115234375, -1.49658203125, 0.1220703125, 1.74072265625, 3.359375, 4.97802734375, 6.5966796875, 8.21533203125, 9.833984375, 11.45263671875, 13.0712890625, 14.68994140625, 16.30859375, 17.92724609375, 19.5458984375, 21.16455078125, 22.783203125, 24.40185546875, 26.0205078125, 27.63916015625, 29.2578125, 30.87646484375, 32.4951171875, 34.11376953125, 35.732421875, 37.35107421875, 38.9697265625, 40.58837890625, 42.20703125, 43.82568359375, 45.4443359375, 47.06298828125, 48.681640625, 50.30029296875, 51.9189453125, 53.53759765625, 55.15625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 24.0, 32.0, 53.0, 65.0, 103.0, 131.0, 215.0, 332.0, 467.0, 612.0, 926.0, 1371.0, 2107.0, 3306.0, 5035.0, 7847.0, 12210.0, 19513.0, 31071.0, 49947.0, 80042.0, 127820.0, 189079.0, 185208.0, 123221.0, 76773.0, 48549.0, 30078.0, 18694.0, 11881.0, 7554.0, 4762.0, 3141.0, 2128.0, 1383.0, 927.0, 613.0, 410.0, 270.0, 186.0, 149.0, 92.0, 60.0, 46.0, 33.0, 25.0, 15.0, 15.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.409027099609375, -1.36199951171875, -1.314971923828125, -1.2679443359375, -1.220916748046875, -1.17388916015625, -1.126861572265625, -1.079833984375, -1.032806396484375, -0.98577880859375, -0.938751220703125, -0.8917236328125, -0.844696044921875, -0.79766845703125, -0.750640869140625, -0.70361328125, -0.656585693359375, -0.60955810546875, -0.562530517578125, -0.5155029296875, -0.468475341796875, -0.42144775390625, -0.374420166015625, -0.327392578125, -0.280364990234375, -0.23333740234375, -0.186309814453125, -0.1392822265625, -0.092254638671875, -0.04522705078125, 0.001800537109375, 0.048828125, 0.095855712890625, 0.14288330078125, 0.189910888671875, 0.2369384765625, 0.283966064453125, 0.33099365234375, 0.378021240234375, 0.425048828125, 0.472076416015625, 0.51910400390625, 0.566131591796875, 0.6131591796875, 0.660186767578125, 0.70721435546875, 0.754241943359375, 0.80126953125, 0.848297119140625, 0.89532470703125, 0.942352294921875, 0.9893798828125, 1.036407470703125, 1.08343505859375, 1.130462646484375, 1.177490234375, 1.224517822265625, 1.27154541015625, 1.318572998046875, 1.3656005859375, 1.412628173828125, 1.45965576171875, 1.506683349609375, 1.5537109375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 10.0, 13.0, 12.0, 23.0, 16.0, 27.0, 18.0, 24.0, 30.0, 42.0, 40.0, 38.0, 46.0, 36.0, 46.0, 40.0, 1062.0, 46.0, 37.0, 36.0, 37.0, 37.0, 42.0, 26.0, 31.0, 31.0, 22.0, 23.0, 27.0, 15.0, 14.0, 12.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.078125, -28.218505859375, -27.35888671875, -26.499267578125, -25.6396484375, -24.780029296875, -23.92041015625, -23.060791015625, -22.201171875, -21.341552734375, -20.48193359375, -19.622314453125, -18.7626953125, -17.903076171875, -17.04345703125, -16.183837890625, -15.32421875, -14.464599609375, -13.60498046875, -12.745361328125, -11.8857421875, -11.026123046875, -10.16650390625, -9.306884765625, -8.447265625, -7.587646484375, -6.72802734375, -5.868408203125, -5.0087890625, -4.149169921875, -3.28955078125, -2.429931640625, -1.5703125, -0.710693359375, 0.14892578125, 1.008544921875, 1.8681640625, 2.727783203125, 3.58740234375, 4.447021484375, 5.306640625, 6.166259765625, 7.02587890625, 7.885498046875, 8.7451171875, 9.604736328125, 10.46435546875, 11.323974609375, 12.18359375, 13.043212890625, 13.90283203125, 14.762451171875, 15.6220703125, 16.481689453125, 17.34130859375, 18.200927734375, 19.060546875, 19.920166015625, 20.77978515625, 21.639404296875, 22.4990234375, 23.358642578125, 24.21826171875, 25.077880859375, 25.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 17.0, 31.0, 41.0, 72.0, 111.0, 174.0, 271.0, 362.0, 574.0, 896.0, 1350.0, 2141.0, 3227.0, 4941.0, 7400.0, 11538.0, 17318.0, 26223.0, 40243.0, 60883.0, 92070.0, 140712.0, 1173072.0, 199507.0, 106519.0, 70916.0, 46974.0, 30595.0, 20261.0, 13395.0, 8761.0, 5805.0, 3790.0, 2330.0, 1548.0, 1067.0, 695.0, 438.0, 304.0, 184.0, 122.0, 70.0, 57.0, 43.0, 20.0, 12.0, 15.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.220703125, -1.1795806884765625, -1.138458251953125, -1.0973358154296875, -1.05621337890625, -1.0150909423828125, -0.973968505859375, -0.9328460693359375, -0.8917236328125, -0.8506011962890625, -0.809478759765625, -0.7683563232421875, -0.72723388671875, -0.6861114501953125, -0.644989013671875, -0.6038665771484375, -0.562744140625, -0.5216217041015625, -0.480499267578125, -0.4393768310546875, -0.39825439453125, -0.3571319580078125, -0.316009521484375, -0.2748870849609375, -0.2337646484375, -0.1926422119140625, -0.151519775390625, -0.1103973388671875, -0.06927490234375, -0.0281524658203125, 0.012969970703125, 0.0540924072265625, 0.09521484375, 0.1363372802734375, 0.177459716796875, 0.2185821533203125, 0.25970458984375, 0.3008270263671875, 0.341949462890625, 0.3830718994140625, 0.4241943359375, 0.4653167724609375, 0.506439208984375, 0.5475616455078125, 0.58868408203125, 0.6298065185546875, 0.670928955078125, 0.7120513916015625, 0.753173828125, 0.7942962646484375, 0.835418701171875, 0.8765411376953125, 0.91766357421875, 0.9587860107421875, 0.999908447265625, 1.0410308837890625, 1.0821533203125, 1.1232757568359375, 1.164398193359375, 1.2055206298828125, 1.24664306640625, 1.2877655029296875, 1.328887939453125, 1.3700103759765625, 1.4111328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 13.0, 10.0, 8.0, 18.0, 12.0, 16.0, 19.0, 19.0, 25.0, 34.0, 27.0, 49.0, 51.0, 42.0, 64.0, 54.0, 50.0, 62.0, 55.0, 48.0, 43.0, 40.0, 30.0, 25.0, 22.0, 26.0, 12.0, 14.0, 13.0, 13.0, 12.0, 10.0, 5.0, 10.0, 6.0, 3.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.027862548828125, -0.027006864547729492, -0.026151180267333984, -0.025295495986938477, -0.02443981170654297, -0.02358412742614746, -0.022728443145751953, -0.021872758865356445, -0.021017074584960938, -0.02016139030456543, -0.019305706024169922, -0.018450021743774414, -0.017594337463378906, -0.0167386531829834, -0.01588296890258789, -0.015027284622192383, -0.014171600341796875, -0.013315916061401367, -0.01246023178100586, -0.011604547500610352, -0.010748863220214844, -0.009893178939819336, -0.009037494659423828, -0.00818181037902832, -0.0073261260986328125, -0.006470441818237305, -0.005614757537841797, -0.004759073257446289, -0.0039033889770507812, -0.0030477046966552734, -0.0021920204162597656, -0.0013363361358642578, -0.00048065185546875, 0.0003750324249267578, 0.0012307167053222656, 0.0020864009857177734, 0.0029420852661132812, 0.003797769546508789, 0.004653453826904297, 0.005509138107299805, 0.0063648223876953125, 0.00722050666809082, 0.008076190948486328, 0.008931875228881836, 0.009787559509277344, 0.010643243789672852, 0.01149892807006836, 0.012354612350463867, 0.013210296630859375, 0.014065980911254883, 0.01492166519165039, 0.0157773494720459, 0.016633033752441406, 0.017488718032836914, 0.018344402313232422, 0.01920008659362793, 0.020055770874023438, 0.020911455154418945, 0.021767139434814453, 0.02262282371520996, 0.02347850799560547, 0.024334192276000977, 0.025189876556396484, 0.026045560836791992, 0.0269012451171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 11.0, 18.0, 29.0, 41.0, 67.0, 78.0, 133.0, 160.0, 286.0, 484.0, 819.0, 1410.0, 2950.0, 6612.0, 16926.0, 52741.0, 200815.0, 475048.0, 205228.0, 54140.0, 17193.0, 6655.0, 3048.0, 1468.0, 818.0, 468.0, 298.0, 182.0, 121.0, 97.0, 48.0, 37.0, 29.0, 25.0, 18.0, 10.0, 7.0, 5.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1968212127685547, -0.19015121459960938, -0.18348121643066406, -0.17681121826171875, -0.17014122009277344, -0.16347122192382812, -0.1568012237548828, -0.1501312255859375, -0.1434612274169922, -0.13679122924804688, -0.13012123107910156, -0.12345123291015625, -0.11678123474121094, -0.11011123657226562, -0.10344123840332031, -0.096771240234375, -0.09010124206542969, -0.08343124389648438, -0.07676124572753906, -0.07009124755859375, -0.06342124938964844, -0.056751251220703125, -0.05008125305175781, -0.0434112548828125, -0.03674125671386719, -0.030071258544921875, -0.023401260375976562, -0.01673126220703125, -0.010061264038085938, -0.003391265869140625, 0.0032787322998046875, 0.00994873046875, 0.016618728637695312, 0.023288726806640625, 0.029958724975585938, 0.03662872314453125, 0.04329872131347656, 0.049968719482421875, 0.05663871765136719, 0.0633087158203125, 0.06997871398925781, 0.07664871215820312, 0.08331871032714844, 0.08998870849609375, 0.09665870666503906, 0.10332870483398438, 0.10999870300292969, 0.116668701171875, 0.12333869934082031, 0.13000869750976562, 0.13667869567871094, 0.14334869384765625, 0.15001869201660156, 0.15668869018554688, 0.1633586883544922, 0.1700286865234375, 0.1766986846923828, 0.18336868286132812, 0.19003868103027344, 0.19670867919921875, 0.20337867736816406, 0.21004867553710938, 0.2167186737060547, 0.223388671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 19.0, 47.0, 81.0, 168.0, 253.0, 201.0, 94.0, 56.0, 31.0, 18.0, 9.0, 9.0, 8.0, 0.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073527030646801, -0.0676354467868805, -0.061743855476379395, -0.055852267891168594, -0.049960680305957794, -0.044069092720746994, -0.038177505135536194, -0.032285917550325394, -0.026394329965114594, -0.020502742379903793, -0.014611154794692993, -0.008719567209482193, -0.002827979624271393, 0.0030636079609394073, 0.008955195546150208, 0.014846783131361008, 0.020738370716571808, 0.026629958301782608, 0.03252154588699341, 0.03841313347220421, 0.04430472105741501, 0.05019630864262581, 0.05608789622783661, 0.06197948381304741, 0.06787107139825821, 0.07376265525817871, 0.07965424656867981, 0.08554583787918091, 0.09143742173910141, 0.09732900559902191, 0.10322059690952301, 0.10911218822002411, 0.11500376462936401, 0.12089535593986511, 0.1267869472503662, 0.13267852365970612, 0.13857011497020721, 0.1444617062807083, 0.15035328269004822, 0.15624487400054932, 0.16213646531105042, 0.1680280566215515, 0.1739196479320526, 0.17981122434139252, 0.18570281565189362, 0.19159440696239471, 0.19748598337173462, 0.20337757468223572, 0.20926916599273682, 0.21516075730323792, 0.221052348613739, 0.22694392502307892, 0.23283551633358002, 0.23872710764408112, 0.24461868405342102, 0.2505102753639221, 0.2564018666744232, 0.2622934579849243, 0.2681850492954254, 0.2740766406059265, 0.2799682021141052, 0.2858597934246063, 0.2917513847351074, 0.2976429760456085, 0.3035345673561096]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 8.0, 19.0, 17.0, 17.0, 20.0, 13.0, 28.0, 28.0, 33.0, 27.0, 32.0, 41.0, 32.0, 30.0, 41.0, 31.0, 37.0, 35.0, 50.0, 45.0, 39.0, 30.0, 33.0, 36.0, 28.0, 22.0, 27.0, 18.0, 22.0, 16.0, 21.0, 17.0, 15.0, 8.0, 12.0, 5.0, 14.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04460030794143677, -0.0431242436170578, -0.041648175567388535, -0.04017210751771927, -0.0386960431933403, -0.037219978868961334, -0.03574391081929207, -0.0342678427696228, -0.032791778445243835, -0.03131571412086487, -0.029839646071195602, -0.028363579884171486, -0.02688751369714737, -0.025411447510123253, -0.023935381323099136, -0.02245931513607502, -0.020983248949050903, -0.019507182762026787, -0.01803111657500267, -0.016555050387978554, -0.015078984200954437, -0.01360291801393032, -0.012126851826906204, -0.010650785639882088, -0.009174719452857971, -0.007698653265833855, -0.006222587078809738, -0.004746520891785622, -0.003270454704761505, -0.0017943885177373886, -0.0003183223307132721, 0.0011577438563108444, 0.002633810043334961, 0.0041098762303590775, 0.005585942417383194, 0.0070620086044073105, 0.008538074791431427, 0.010014140978455544, 0.01149020716547966, 0.012966273352503777, 0.014442339539527893, 0.01591840572655201, 0.017394471913576126, 0.018870538100600243, 0.02034660428762436, 0.021822670474648476, 0.023298736661672592, 0.02477480284869671, 0.026250869035720825, 0.02772693522274494, 0.029203001409769058, 0.030679067596793175, 0.03215513378381729, 0.03363119810819626, 0.035107266157865524, 0.03658333420753479, 0.03805939853191376, 0.039535462856292725, 0.04101153090596199, 0.042487598955631256, 0.04396366328001022, 0.04543972760438919, 0.046915795654058456, 0.04839186370372772, 0.04986792802810669]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 10.0, 12.0, 14.0, 9.0, 10.0, 19.0, 23.0, 21.0, 25.0, 30.0, 39.0, 46.0, 41.0, 48.0, 37.0, 48.0, 53.0, 57.0, 45.0, 51.0, 42.0, 36.0, 43.0, 40.0, 32.0, 26.0, 23.0, 29.0, 16.0, 15.0, 7.0, 11.0, 10.0, 10.0, 2.0, 1.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.71875, -46.12744140625, -44.5361328125, -42.94482421875, -41.353515625, -39.76220703125, -38.1708984375, -36.57958984375, -34.98828125, -33.39697265625, -31.8056640625, -30.21435546875, -28.623046875, -27.03173828125, -25.4404296875, -23.84912109375, -22.2578125, -20.66650390625, -19.0751953125, -17.48388671875, -15.892578125, -14.30126953125, -12.7099609375, -11.11865234375, -9.52734375, -7.93603515625, -6.3447265625, -4.75341796875, -3.162109375, -1.57080078125, 0.0205078125, 1.61181640625, 3.203125, 4.79443359375, 6.3857421875, 7.97705078125, 9.568359375, 11.15966796875, 12.7509765625, 14.34228515625, 15.93359375, 17.52490234375, 19.1162109375, 20.70751953125, 22.298828125, 23.89013671875, 25.4814453125, 27.07275390625, 28.6640625, 30.25537109375, 31.8466796875, 33.43798828125, 35.029296875, 36.62060546875, 38.2119140625, 39.80322265625, 41.39453125, 42.98583984375, 44.5771484375, 46.16845703125, 47.759765625, 49.35107421875, 50.9423828125, 52.53369140625, 54.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 16.0, 22.0, 26.0, 25.0, 43.0, 32.0, 67.0, 79.0, 112.0, 190.0, 430.0, 1066.0, 4057.0, 22589.0, 171148.0, 636515.0, 181928.0, 23756.0, 4189.0, 1145.0, 406.0, 202.0, 113.0, 72.0, 60.0, 43.0, 41.0, 29.0, 25.0, 20.0, 20.0, 17.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.98046875, -7.71893310546875, -7.4573974609375, -7.19586181640625, -6.934326171875, -6.67279052734375, -6.4112548828125, -6.14971923828125, -5.88818359375, -5.62664794921875, -5.3651123046875, -5.10357666015625, -4.842041015625, -4.58050537109375, -4.3189697265625, -4.05743408203125, -3.7958984375, -3.53436279296875, -3.2728271484375, -3.01129150390625, -2.749755859375, -2.48822021484375, -2.2266845703125, -1.96514892578125, -1.70361328125, -1.44207763671875, -1.1805419921875, -0.91900634765625, -0.657470703125, -0.39593505859375, -0.1343994140625, 0.12713623046875, 0.388671875, 0.65020751953125, 0.9117431640625, 1.17327880859375, 1.434814453125, 1.69635009765625, 1.9578857421875, 2.21942138671875, 2.48095703125, 2.74249267578125, 3.0040283203125, 3.26556396484375, 3.527099609375, 3.78863525390625, 4.0501708984375, 4.31170654296875, 4.5732421875, 4.83477783203125, 5.0963134765625, 5.35784912109375, 5.619384765625, 5.88092041015625, 6.1424560546875, 6.40399169921875, 6.66552734375, 6.92706298828125, 7.1885986328125, 7.45013427734375, 7.711669921875, 7.97320556640625, 8.2347412109375, 8.49627685546875, 8.7578125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 5.0, 13.0, 15.0, 19.0, 26.0, 44.0, 45.0, 52.0, 49.0, 61.0, 52.0, 75.0, 2117.0, 75.0, 80.0, 66.0, 51.0, 46.0, 33.0, 27.0, 27.0, 15.0, 15.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-105.4375, -102.5517578125, -99.666015625, -96.7802734375, -93.89453125, -91.0087890625, -88.123046875, -85.2373046875, -82.3515625, -79.4658203125, -76.580078125, -73.6943359375, -70.80859375, -67.9228515625, -65.037109375, -62.1513671875, -59.265625, -56.3798828125, -53.494140625, -50.6083984375, -47.72265625, -44.8369140625, -41.951171875, -39.0654296875, -36.1796875, -33.2939453125, -30.408203125, -27.5224609375, -24.63671875, -21.7509765625, -18.865234375, -15.9794921875, -13.09375, -10.2080078125, -7.322265625, -4.4365234375, -1.55078125, 1.3349609375, 4.220703125, 7.1064453125, 9.9921875, 12.8779296875, 15.763671875, 18.6494140625, 21.53515625, 24.4208984375, 27.306640625, 30.1923828125, 33.078125, 35.9638671875, 38.849609375, 41.7353515625, 44.62109375, 47.5068359375, 50.392578125, 53.2783203125, 56.1640625, 59.0498046875, 61.935546875, 64.8212890625, 67.70703125, 70.5927734375, 73.478515625, 76.3642578125, 79.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 19.0, 34.0, 43.0, 46.0, 92.0, 162.0, 315.0, 446.0, 877.0, 1976.0, 5950.0, 29657.0, 228575.0, 2731176.0, 121407.0, 17484.0, 4072.0, 1487.0, 761.0, 407.0, 247.0, 143.0, 90.0, 63.0, 34.0, 35.0, 14.0, 13.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40264892578125, -6.1685791015625, -5.93450927734375, -5.700439453125, -5.46636962890625, -5.2322998046875, -4.99822998046875, -4.76416015625, -4.53009033203125, -4.2960205078125, -4.06195068359375, -3.827880859375, -3.59381103515625, -3.3597412109375, -3.12567138671875, -2.8916015625, -2.65753173828125, -2.4234619140625, -2.18939208984375, -1.955322265625, -1.72125244140625, -1.4871826171875, -1.25311279296875, -1.01904296875, -0.78497314453125, -0.5509033203125, -0.31683349609375, -0.082763671875, 0.15130615234375, 0.3853759765625, 0.61944580078125, 0.853515625, 1.08758544921875, 1.3216552734375, 1.55572509765625, 1.789794921875, 2.02386474609375, 2.2579345703125, 2.49200439453125, 2.72607421875, 2.96014404296875, 3.1942138671875, 3.42828369140625, 3.662353515625, 3.89642333984375, 4.1304931640625, 4.36456298828125, 4.5986328125, 4.83270263671875, 5.0667724609375, 5.30084228515625, 5.534912109375, 5.76898193359375, 6.0030517578125, 6.23712158203125, 6.47119140625, 6.70526123046875, 6.9393310546875, 7.17340087890625, 7.407470703125, 7.64154052734375, 7.8756103515625, 8.10968017578125, 8.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 34.0, 96.0, 342.0, 331.0, 102.0, 39.0, 23.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.48118591308594, -124.69154357910156, -116.90190124511719, -109.11225891113281, -101.32261657714844, -93.53297424316406, -85.74333190917969, -77.95368957519531, -70.16404724121094, -62.37440490722656, -54.58476257324219, -46.79512023925781, -39.00547790527344, -31.215835571289062, -23.426193237304688, -15.636550903320312, -7.8469085693359375, -0.0572662353515625, 7.7323760986328125, 15.522018432617188, 23.311660766601562, 31.101303100585938, 38.89094543457031, 46.68058776855469, 54.47023010253906, 62.25987243652344, 70.04951477050781, 77.83915710449219, 85.62879943847656, 93.41844177246094, 101.20808410644531, 108.99772644042969, 116.787353515625, 124.57699584960938, 132.36663818359375, 140.15628051757812, 147.9459228515625, 155.73556518554688, 163.52520751953125, 171.31484985351562, 179.1044921875, 186.89413452148438, 194.68377685546875, 202.47341918945312, 210.2630615234375, 218.05270385742188, 225.84234619140625, 233.63198852539062, 241.421630859375, 249.21127319335938, 257.00091552734375, 264.7905578613281, 272.5802001953125, 280.3698425292969, 288.15948486328125, 295.9491271972656, 303.73876953125, 311.5284118652344, 319.31805419921875, 327.1076965332031, 334.8973388671875, 342.6869812011719, 350.47662353515625, 358.2662658691406, 366.055908203125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 11.0, 12.0, 12.0, 14.0, 16.0, 23.0, 25.0, 28.0, 26.0, 36.0, 46.0, 37.0, 47.0, 46.0, 46.0, 52.0, 48.0, 31.0, 42.0, 33.0, 26.0, 44.0, 40.0, 29.0, 25.0, 23.0, 24.0, 15.0, 22.0, 26.0, 10.0, 11.0, 6.0, 11.0, 9.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.71125030517578, -78.79401397705078, -75.87677001953125, -72.95953369140625, -70.04229736328125, -67.12506103515625, -64.20781707763672, -61.29058074951172, -58.37334442138672, -55.45610427856445, -52.53886795043945, -49.62162780761719, -46.70439147949219, -43.78715133666992, -40.869911193847656, -37.952674865722656, -35.03543472290039, -32.118194580078125, -29.200958251953125, -26.28371810913086, -23.36648178100586, -20.449241638183594, -17.53200340270996, -14.614765167236328, -11.697526931762695, -8.780288696289062, -5.8630499839782715, -2.9458112716674805, -0.028573036193847656, 2.888665199279785, 5.805904388427734, 8.723142623901367, 11.640380859375, 14.557619094848633, 17.474857330322266, 20.39209747314453, 23.30933380126953, 26.226573944091797, 29.14381217956543, 32.06105041503906, 34.97828674316406, 37.89552688598633, 40.81276321411133, 43.730003356933594, 46.647239685058594, 49.56447982788086, 52.481719970703125, 55.398956298828125, 58.31619644165039, 61.233436584472656, 64.15067291259766, 67.06790924072266, 69.98515319824219, 72.90238952636719, 75.81962585449219, 78.73686218261719, 81.65410614013672, 84.57134246826172, 87.48858642578125, 90.40582275390625, 93.32305908203125, 96.24029541015625, 99.15753936767578, 102.07477569580078, 104.99201202392578]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 9.0, 13.0, 20.0, 16.0, 15.0, 22.0, 35.0, 43.0, 56.0, 78.0, 103.0, 127.0, 185.0, 285.0, 475.0, 731.0, 1338.0, 3104.0, 1025392.0, 11026.0, 2426.0, 1023.0, 634.0, 398.0, 293.0, 168.0, 126.0, 85.0, 65.0, 48.0, 53.0, 32.0, 27.0, 21.0, 23.0, 14.0, 12.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.460712432861328, -25.603782653808594, -24.74685287475586, -23.889923095703125, -23.032995223999023, -22.17606544494629, -21.319135665893555, -20.46220588684082, -19.60527801513672, -18.748348236083984, -17.89141845703125, -17.034488677978516, -16.177560806274414, -15.32063102722168, -14.463701248168945, -13.606771469116211, -12.749841690063477, -11.892911911010742, -11.035983085632324, -10.17905330657959, -9.322124481201172, -8.465194702148438, -7.608264923095703, -6.751335620880127, -5.894406318664551, -5.037477016448975, -4.180547714233398, -3.323617935180664, -2.466688632965088, -1.6097593307495117, -0.7528295516967773, 0.10409975051879883, 0.9610271453857422, 1.817956566810608, 2.6748859882354736, 3.531815528869629, 4.388744831085205, 5.245674133300781, 6.102603912353516, 6.959533214569092, 7.816462516784668, 8.673392295837402, 9.53032112121582, 10.387250900268555, 11.244180679321289, 12.101109504699707, 12.958039283752441, 13.81496810913086, 14.671897888183594, 15.528827667236328, 16.385757446289062, 17.242687225341797, 18.0996150970459, 18.956544876098633, 19.813474655151367, 20.6704044342041, 21.527332305908203, 22.384262084960938, 23.241191864013672, 24.098121643066406, 24.955049514770508, 25.811979293823242, 26.668909072875977, 27.52583885192871, 28.382768630981445]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 39.0, 596.0, 51462116.0, 354.0, 23.0, 9.0, 0.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3868.11083984375, -3772.389892578125, -3676.668701171875, -3580.94775390625, -3485.226806640625, -3389.505859375, -3293.78466796875, -3198.063720703125, -3102.3427734375, -3006.621826171875, -2910.900634765625, -2815.1796875, -2719.458740234375, -2623.73779296875, -2528.0166015625, -2432.295654296875, -2336.574462890625, -2240.853515625, -2145.13232421875, -2049.411376953125, -1953.6904296875, -1857.9693603515625, -1762.248291015625, -1666.52734375, -1570.8062744140625, -1475.085205078125, -1379.3642578125, -1283.6431884765625, -1187.922119140625, -1092.201171875, -996.4801025390625, -900.7590942382812, -805.037841796875, -709.3168334960938, -613.5958251953125, -517.874755859375, -422.15374755859375, -326.4327392578125, -230.711669921875, -134.99066162109375, -39.2696533203125, 56.45137023925781, 152.17239379882812, 247.8934326171875, 343.61444091796875, 439.33544921875, 535.0565185546875, 630.7775268554688, 726.49853515625, 822.2195434570312, 917.9405517578125, 1013.66162109375, 1109.382568359375, 1205.1036376953125, 1300.82470703125, 1396.545654296875, 1492.2667236328125, 1587.98779296875, 1683.708740234375, 1779.4298095703125, 1875.15087890625, 1970.871826171875, 2066.5927734375, 2162.31396484375, 2258.034912109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 21.0, 36.0, 50.0, 81.0, 133.0, 181.0, 272.0, 431.0, 680.0, 1070.0, 1775.0, 2839.0, 4880.0, 8802.0, 15621.0, 29268.0, 58469.0, 125211.0, 297986.0, 919622.0, 3504103.0, 808701.0, 275663.0, 117125.0, 54991.0, 27986.0, 14940.0, 8423.0, 4700.0, 2698.0, 1703.0, 1092.0, 639.0, 429.0, 236.0, 182.0, 113.0, 77.0, 58.0, 28.0, 24.0, 17.0, 14.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.265625, -15.71337890625, -15.1611328125, -14.60888671875, -14.056640625, -13.50439453125, -12.9521484375, -12.39990234375, -11.84765625, -11.29541015625, -10.7431640625, -10.19091796875, -9.638671875, -9.08642578125, -8.5341796875, -7.98193359375, -7.4296875, -6.87744140625, -6.3251953125, -5.77294921875, -5.220703125, -4.66845703125, -4.1162109375, -3.56396484375, -3.01171875, -2.45947265625, -1.9072265625, -1.35498046875, -0.802734375, -0.25048828125, 0.3017578125, 0.85400390625, 1.40625, 1.95849609375, 2.5107421875, 3.06298828125, 3.615234375, 4.16748046875, 4.7197265625, 5.27197265625, 5.82421875, 6.37646484375, 6.9287109375, 7.48095703125, 8.033203125, 8.58544921875, 9.1376953125, 9.68994140625, 10.2421875, 10.79443359375, 11.3466796875, 11.89892578125, 12.451171875, 13.00341796875, 13.5556640625, 14.10791015625, 14.66015625, 15.21240234375, 15.7646484375, 16.31689453125, 16.869140625, 17.42138671875, 17.9736328125, 18.52587890625, 19.078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 10.0, 5.0, 12.0, 21.0, 18.0, 11.0, 20.0, 18.0, 32.0, 34.0, 21.0, 25.0, 31.0, 39.0, 45.0, 72.0, 130.0, 296.0, 459.0, 207.0, 93.0, 58.0, 42.0, 38.0, 32.0, 40.0, 34.0, 28.0, 20.0, 19.0, 23.0, 18.0, 13.0, 12.0, 9.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.625, -21.96484375, -21.3046875, -20.64453125, -19.984375, -19.32421875, -18.6640625, -18.00390625, -17.34375, -16.68359375, -16.0234375, -15.36328125, -14.703125, -14.04296875, -13.3828125, -12.72265625, -12.0625, -11.40234375, -10.7421875, -10.08203125, -9.421875, -8.76171875, -8.1015625, -7.44140625, -6.78125, -6.12109375, -5.4609375, -4.80078125, -4.140625, -3.48046875, -2.8203125, -2.16015625, -1.5, -0.83984375, -0.1796875, 0.48046875, 1.140625, 1.80078125, 2.4609375, 3.12109375, 3.78125, 4.44140625, 5.1015625, 5.76171875, 6.421875, 7.08203125, 7.7421875, 8.40234375, 9.0625, 9.72265625, 10.3828125, 11.04296875, 11.703125, 12.36328125, 13.0234375, 13.68359375, 14.34375, 15.00390625, 15.6640625, 16.32421875, 16.984375, 17.64453125, 18.3046875, 18.96484375, 19.625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 13.0, 26.0, 36.0, 55.0, 73.0, 93.0, 146.0, 207.0, 327.0, 408.0, 621.0, 870.0, 1382.0, 2039.0, 3249.0, 4947.0, 7784.0, 12736.0, 20596.0, 34537.0, 58981.0, 100216.0, 173628.0, 296755.0, 556631.0, 2300921.0, 1597311.0, 475200.0, 264279.0, 153846.0, 89678.0, 52171.0, 31039.0, 18677.0, 11342.0, 7031.0, 4501.0, 2861.0, 1966.0, 1322.0, 896.0, 615.0, 419.0, 307.0, 213.0, 148.0, 96.0, 91.0, 52.0, 37.0, 20.0, 17.0, 3.0, 8.0, 5.0, 1.0, 4.0], "bins": [-7.18359375, -6.96514892578125, -6.7467041015625, -6.52825927734375, -6.309814453125, -6.09136962890625, -5.8729248046875, -5.65447998046875, -5.43603515625, -5.21759033203125, -4.9991455078125, -4.78070068359375, -4.562255859375, -4.34381103515625, -4.1253662109375, -3.90692138671875, -3.6884765625, -3.47003173828125, -3.2515869140625, -3.03314208984375, -2.814697265625, -2.59625244140625, -2.3778076171875, -2.15936279296875, -1.94091796875, -1.72247314453125, -1.5040283203125, -1.28558349609375, -1.067138671875, -0.84869384765625, -0.6302490234375, -0.41180419921875, -0.193359375, 0.02508544921875, 0.2435302734375, 0.46197509765625, 0.680419921875, 0.89886474609375, 1.1173095703125, 1.33575439453125, 1.55419921875, 1.77264404296875, 1.9910888671875, 2.20953369140625, 2.427978515625, 2.64642333984375, 2.8648681640625, 3.08331298828125, 3.3017578125, 3.52020263671875, 3.7386474609375, 3.95709228515625, 4.175537109375, 4.39398193359375, 4.6124267578125, 4.83087158203125, 5.04931640625, 5.26776123046875, 5.4862060546875, 5.70465087890625, 5.923095703125, 6.14154052734375, 6.3599853515625, 6.57843017578125, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 8.0, 5.0, 19.0, 21.0, 22.0, 29.0, 24.0, 35.0, 34.0, 45.0, 36.0, 55.0, 68.0, 174.0, 542.0, 351.0, 114.0, 60.0, 50.0, 38.0, 36.0, 34.0, 35.0, 34.0, 25.0, 28.0, 16.0, 14.0, 15.0, 13.0, 5.0, 3.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.24853515625, -35.9970703125, -34.74560546875, -33.494140625, -32.24267578125, -30.9912109375, -29.73974609375, -28.48828125, -27.23681640625, -25.9853515625, -24.73388671875, -23.482421875, -22.23095703125, -20.9794921875, -19.72802734375, -18.4765625, -17.22509765625, -15.9736328125, -14.72216796875, -13.470703125, -12.21923828125, -10.9677734375, -9.71630859375, -8.46484375, -7.21337890625, -5.9619140625, -4.71044921875, -3.458984375, -2.20751953125, -0.9560546875, 0.29541015625, 1.546875, 2.79833984375, 4.0498046875, 5.30126953125, 6.552734375, 7.80419921875, 9.0556640625, 10.30712890625, 11.55859375, 12.81005859375, 14.0615234375, 15.31298828125, 16.564453125, 17.81591796875, 19.0673828125, 20.31884765625, 21.5703125, 22.82177734375, 24.0732421875, 25.32470703125, 26.576171875, 27.82763671875, 29.0791015625, 30.33056640625, 31.58203125, 32.83349609375, 34.0849609375, 35.33642578125, 36.587890625, 37.83935546875, 39.0908203125, 40.34228515625, 41.59375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 14.0, 16.0, 12.0, 35.0, 48.0, 81.0, 108.0, 126.0, 190.0, 258.0, 377.0, 542.0, 773.0, 1241.0, 1934.0, 3044.0, 5519.0, 11276.0, 26282.0, 67939.0, 227579.0, 5735172.0, 126301.0, 44862.0, 17998.0, 8226.0, 4295.0, 2454.0, 1506.0, 989.0, 651.0, 469.0, 312.0, 212.0, 177.0, 110.0, 83.0, 43.0, 42.0, 26.0, 26.0, 18.0, 14.0, 8.0, 4.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0], "bins": [-39.90625, -38.67041015625, -37.4345703125, -36.19873046875, -34.962890625, -33.72705078125, -32.4912109375, -31.25537109375, -30.01953125, -28.78369140625, -27.5478515625, -26.31201171875, -25.076171875, -23.84033203125, -22.6044921875, -21.36865234375, -20.1328125, -18.89697265625, -17.6611328125, -16.42529296875, -15.189453125, -13.95361328125, -12.7177734375, -11.48193359375, -10.24609375, -9.01025390625, -7.7744140625, -6.53857421875, -5.302734375, -4.06689453125, -2.8310546875, -1.59521484375, -0.359375, 0.87646484375, 2.1123046875, 3.34814453125, 4.583984375, 5.81982421875, 7.0556640625, 8.29150390625, 9.52734375, 10.76318359375, 11.9990234375, 13.23486328125, 14.470703125, 15.70654296875, 16.9423828125, 18.17822265625, 19.4140625, 20.64990234375, 21.8857421875, 23.12158203125, 24.357421875, 25.59326171875, 26.8291015625, 28.06494140625, 29.30078125, 30.53662109375, 31.7724609375, 33.00830078125, 34.244140625, 35.47998046875, 36.7158203125, 37.95166015625, 39.1875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 7.0, 4.0, 4.0, 6.0, 10.0, 8.0, 18.0, 6.0, 19.0, 14.0, 16.0, 17.0, 29.0, 31.0, 39.0, 28.0, 32.0, 27.0, 33.0, 56.0, 119.0, 703.0, 291.0, 81.0, 36.0, 31.0, 36.0, 40.0, 28.0, 26.0, 26.0, 20.0, 22.0, 22.0, 25.0, 19.0, 8.0, 9.0, 23.0, 11.0, 9.0, 9.0, 5.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3388671875, -60.240234375, -58.1416015625, -56.04296875, -53.9443359375, -51.845703125, -49.7470703125, -47.6484375, -45.5498046875, -43.451171875, -41.3525390625, -39.25390625, -37.1552734375, -35.056640625, -32.9580078125, -30.859375, -28.7607421875, -26.662109375, -24.5634765625, -22.46484375, -20.3662109375, -18.267578125, -16.1689453125, -14.0703125, -11.9716796875, -9.873046875, -7.7744140625, -5.67578125, -3.5771484375, -1.478515625, 0.6201171875, 2.71875, 4.8173828125, 6.916015625, 9.0146484375, 11.11328125, 13.2119140625, 15.310546875, 17.4091796875, 19.5078125, 21.6064453125, 23.705078125, 25.8037109375, 27.90234375, 30.0009765625, 32.099609375, 34.1982421875, 36.296875, 38.3955078125, 40.494140625, 42.5927734375, 44.69140625, 46.7900390625, 48.888671875, 50.9873046875, 53.0859375, 55.1845703125, 57.283203125, 59.3818359375, 61.48046875, 63.5791015625, 65.677734375, 67.7763671875, 69.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 35.0, 461.0, 433.0, 29.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.9376831054688, -490.0948486328125, -461.25201416015625, -432.4091796875, -403.56634521484375, -374.7235107421875, -345.8807067871094, -317.0378723144531, -288.1950378417969, -259.3522033691406, -230.50936889648438, -201.6665496826172, -172.82371520996094, -143.9808807373047, -115.1380615234375, -86.29522705078125, -57.452392578125, -28.609561920166016, 0.23326873779296875, 29.076095581054688, 57.91893005371094, 86.76176452636719, 115.60458374023438, 144.44741821289062, 173.29025268554688, 202.13308715820312, 230.97592163085938, 259.8187255859375, 288.66156005859375, 317.50439453125, 346.34722900390625, 375.1900634765625, 404.0328369140625, 432.87567138671875, 461.718505859375, 490.56134033203125, 519.4041748046875, 548.2470092773438, 577.08984375, 605.9326171875, 634.7755126953125, 663.6183471679688, 692.461181640625, 721.3040161132812, 750.1468505859375, 778.9896850585938, 807.83251953125, 836.67529296875, 865.5181274414062, 894.3609619140625, 923.2037963867188, 952.046630859375, 980.8894653320312, 1009.7322998046875, 1038.5750732421875, 1067.41796875, 1096.2607421875, 1125.103515625, 1153.9464111328125, 1182.7891845703125, 1211.632080078125, 1240.474853515625, 1269.3177490234375, 1298.1605224609375, 1327.00341796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 8.0, 12.0, 15.0, 17.0, 18.0, 24.0, 71.0, 425.0, 234.0, 37.0, 24.0, 14.0, 20.0, 10.0, 7.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-519.654296875, -503.79681396484375, -487.9393310546875, -472.08184814453125, -456.224365234375, -440.36688232421875, -424.5093994140625, -408.65191650390625, -392.79443359375, -376.93695068359375, -361.0794677734375, -345.22198486328125, -329.364501953125, -313.50701904296875, -297.6495361328125, -281.79205322265625, -265.9345703125, -250.07708740234375, -234.2196044921875, -218.36212158203125, -202.504638671875, -186.64715576171875, -170.7896728515625, -154.93218994140625, -139.07467651367188, -123.21719360351562, -107.35971069335938, -91.50222778320312, -75.64474487304688, -59.787254333496094, -43.929771423339844, -28.072288513183594, -12.214813232421875, 3.6426706314086914, 19.500154495239258, 35.35763931274414, 51.21512222290039, 67.0726089477539, 82.93009185791016, 98.7875747680664, 114.64505767822266, 130.50254821777344, 146.3600311279297, 162.21751403808594, 178.0749969482422, 193.93247985839844, 209.7899627685547, 225.64744567871094, 241.5049285888672, 257.3624267578125, 273.21990966796875, 289.077392578125, 304.93487548828125, 320.7923583984375, 336.64984130859375, 352.50732421875, 368.36480712890625, 384.2222900390625, 400.07977294921875, 415.937255859375, 431.79473876953125, 447.6522216796875, 463.50970458984375, 479.3671875, 495.22467041015625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 16.0, 14.0, 18.0, 38.0, 52.0, 74.0, 98.0, 163.0, 242.0, 392.0, 673.0, 1194.0, 2144.0, 4426.0, 11405.0, 63006.0, 4059775.0, 33895.0, 8474.0, 3643.0, 1737.0, 1028.0, 602.0, 414.0, 259.0, 146.0, 94.0, 74.0, 55.0, 34.0, 35.0, 19.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8590087890625, -2.764892578125, -2.6707763671875, -2.57666015625, -2.4825439453125, -2.388427734375, -2.2943115234375, -2.2001953125, -2.1060791015625, -2.011962890625, -1.9178466796875, -1.82373046875, -1.7296142578125, -1.635498046875, -1.5413818359375, -1.447265625, -1.3531494140625, -1.259033203125, -1.1649169921875, -1.07080078125, -0.9766845703125, -0.882568359375, -0.7884521484375, -0.6943359375, -0.6002197265625, -0.506103515625, -0.4119873046875, -0.31787109375, -0.2237548828125, -0.129638671875, -0.0355224609375, 0.05859375, 0.1527099609375, 0.246826171875, 0.3409423828125, 0.43505859375, 0.5291748046875, 0.623291015625, 0.7174072265625, 0.8115234375, 0.9056396484375, 0.999755859375, 1.0938720703125, 1.18798828125, 1.2821044921875, 1.376220703125, 1.4703369140625, 1.564453125, 1.6585693359375, 1.752685546875, 1.8468017578125, 1.94091796875, 2.0350341796875, 2.129150390625, 2.2232666015625, 2.3173828125, 2.4114990234375, 2.505615234375, 2.5997314453125, 2.69384765625, 2.7879638671875, 2.882080078125, 2.9761962890625, 3.0703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 9.0, 12.0, 13.0, 12.0, 17.0, 113.0, 649.0, 35.0, 14.0, 10.0, 9.0, 5.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8466796875, -0.814453125, -0.7822265625, -0.75, -0.7177734375, -0.685546875, -0.6533203125, -0.62109375, -0.5888671875, -0.556640625, -0.5244140625, -0.4921875, -0.4599609375, -0.427734375, -0.3955078125, -0.36328125, -0.3310546875, -0.298828125, -0.2666015625, -0.234375, -0.2021484375, -0.169921875, -0.1376953125, -0.10546875, -0.0732421875, -0.041015625, -0.0087890625, 0.0234375, 0.0556640625, 0.087890625, 0.1201171875, 0.15234375, 0.1845703125, 0.216796875, 0.2490234375, 0.28125, 0.3134765625, 0.345703125, 0.3779296875, 0.41015625, 0.4423828125, 0.474609375, 0.5068359375, 0.5390625, 0.5712890625, 0.603515625, 0.6357421875, 0.66796875, 0.7001953125, 0.732421875, 0.7646484375, 0.796875, 0.8291015625, 0.861328125, 0.8935546875, 0.92578125, 0.9580078125, 0.990234375, 1.0224609375, 1.0546875, 1.0869140625, 1.119140625, 1.1513671875, 1.18359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 17.0, 24.0, 18.0, 28.0, 46.0, 71.0, 128.0, 214.0, 381.0, 684.0, 1344.0, 2533.0, 5148.0, 11090.0, 28513.0, 101133.0, 3090342.0, 831353.0, 77627.0, 23925.0, 9816.0, 4644.0, 2338.0, 1192.0, 689.0, 359.0, 222.0, 128.0, 80.0, 61.0, 40.0, 19.0, 12.0, 10.0, 11.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.816009521484375, -2.72186279296875, -2.627716064453125, -2.5335693359375, -2.439422607421875, -2.34527587890625, -2.251129150390625, -2.156982421875, -2.062835693359375, -1.96868896484375, -1.874542236328125, -1.7803955078125, -1.686248779296875, -1.59210205078125, -1.497955322265625, -1.40380859375, -1.309661865234375, -1.21551513671875, -1.121368408203125, -1.0272216796875, -0.933074951171875, -0.83892822265625, -0.744781494140625, -0.650634765625, -0.556488037109375, -0.46234130859375, -0.368194580078125, -0.2740478515625, -0.179901123046875, -0.08575439453125, 0.008392333984375, 0.1025390625, 0.196685791015625, 0.29083251953125, 0.384979248046875, 0.4791259765625, 0.573272705078125, 0.66741943359375, 0.761566162109375, 0.855712890625, 0.949859619140625, 1.04400634765625, 1.138153076171875, 1.2322998046875, 1.326446533203125, 1.42059326171875, 1.514739990234375, 1.60888671875, 1.703033447265625, 1.79718017578125, 1.891326904296875, 1.9854736328125, 2.079620361328125, 2.17376708984375, 2.267913818359375, 2.362060546875, 2.456207275390625, 2.55035400390625, 2.644500732421875, 2.7386474609375, 2.832794189453125, 2.92694091796875, 3.021087646484375, 3.115234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 9.0, 6.0, 9.0, 14.0, 19.0, 25.0, 35.0, 34.0, 56.0, 84.0, 115.0, 229.0, 802.0, 1739.0, 337.0, 154.0, 101.0, 67.0, 40.0, 34.0, 23.0, 27.0, 15.0, 11.0, 14.0, 12.0, 5.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.896484375, -0.8677520751953125, -0.839019775390625, -0.8102874755859375, -0.78155517578125, -0.7528228759765625, -0.724090576171875, -0.6953582763671875, -0.6666259765625, -0.6378936767578125, -0.609161376953125, -0.5804290771484375, -0.55169677734375, -0.5229644775390625, -0.494232177734375, -0.4654998779296875, -0.436767578125, -0.4080352783203125, -0.379302978515625, -0.3505706787109375, -0.32183837890625, -0.2931060791015625, -0.264373779296875, -0.2356414794921875, -0.2069091796875, -0.1781768798828125, -0.149444580078125, -0.1207122802734375, -0.09197998046875, -0.0632476806640625, -0.034515380859375, -0.0057830810546875, 0.02294921875, 0.0516815185546875, 0.080413818359375, 0.1091461181640625, 0.13787841796875, 0.1666107177734375, 0.195343017578125, 0.2240753173828125, 0.2528076171875, 0.2815399169921875, 0.310272216796875, 0.3390045166015625, 0.36773681640625, 0.3964691162109375, 0.425201416015625, 0.4539337158203125, 0.482666015625, 0.5113983154296875, 0.540130615234375, 0.5688629150390625, 0.59759521484375, 0.6263275146484375, 0.655059814453125, 0.6837921142578125, 0.7125244140625, 0.7412567138671875, 0.769989013671875, 0.7987213134765625, 0.82745361328125, 0.8561859130859375, 0.884918212890625, 0.9136505126953125, 0.9423828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 12.0, 114.0, 493.0, 328.0, 40.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.387290000915527, -10.665428161621094, -9.943567276000977, -9.221705436706543, -8.49984359741211, -7.777982711791992, -7.056120872497559, -6.334259510040283, -5.612398147583008, -4.890536785125732, -4.168675422668457, -3.4468135833740234, -2.724952220916748, -2.0030908584594727, -1.281229019165039, -0.5593676567077637, 0.16249370574951172, 0.8843551874160767, 1.6062166690826416, 2.328078269958496, 3.0499396324157715, 3.771800994873047, 4.4936628341674805, 5.215524196624756, 5.937385559082031, 6.659246921539307, 7.381108283996582, 8.102970123291016, 8.824831008911133, 9.546692848205566, 10.2685546875, 10.990415573120117, 11.712276458740234, 12.434138298034668, 13.155999183654785, 13.877861022949219, 14.599721908569336, 15.32158374786377, 16.043445587158203, 16.76530647277832, 17.487167358398438, 18.209028244018555, 18.930891036987305, 19.652751922607422, 20.37461280822754, 21.096473693847656, 21.818336486816406, 22.540197372436523, 23.262060165405273, 23.98392105102539, 24.70578384399414, 25.427644729614258, 26.149505615234375, 26.871368408203125, 27.593229293823242, 28.31509017944336, 29.03695297241211, 29.758813858032227, 30.480676651000977, 31.202537536621094, 31.92439842224121, 32.64625930786133, 33.36812210083008, 34.08998489379883, 34.81184387207031]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 3.0, 9.0, 5.0, 6.0, 16.0, 17.0, 20.0, 24.0, 29.0, 35.0, 62.0, 51.0, 49.0, 30.0, 51.0, 59.0, 60.0, 54.0, 53.0, 56.0, 52.0, 42.0, 31.0, 44.0, 39.0, 22.0, 21.0, 16.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.881981134414673, -2.762664556503296, -2.643348217010498, -2.524031639099121, -2.4047152996063232, -2.2853987216949463, -2.1660823822021484, -2.0467658042907715, -1.927449345588684, -1.8081328868865967, -1.6888164281845093, -1.5694999694824219, -1.450183391571045, -1.330867052078247, -1.2115504741668701, -1.0922340154647827, -0.9729175567626953, -0.8536010980606079, -0.7342846393585205, -0.6149681210517883, -0.4956516623497009, -0.3763352036476135, -0.25701868534088135, -0.13770222663879395, -0.018385767936706543, 0.10093070566654205, 0.22024717926979065, 0.33956366777420044, 0.45888012647628784, 0.5781965851783752, 0.6975131034851074, 0.8168295621871948, 0.9361462593078613, 1.0554627180099487, 1.1747791767120361, 1.294095754623413, 1.413412094116211, 1.532728672027588, 1.6520451307296753, 1.7713615894317627, 1.89067804813385, 2.0099945068359375, 2.1293110847473145, 2.2486274242401123, 2.3679440021514893, 2.487260341644287, 2.606576919555664, 2.725893497467041, 2.845209836959839, 2.964526414871216, 3.0838427543640137, 3.2031593322753906, 3.3224756717681885, 3.4417922496795654, 3.5611085891723633, 3.6804251670837402, 3.799741744995117, 3.919058322906494, 4.038374900817871, 4.15769100189209, 4.277007579803467, 4.396324157714844, 4.515640735626221, 4.634957313537598, 4.754273414611816]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 11.0, 12.0, 15.0, 25.0, 36.0, 44.0, 87.0, 96.0, 146.0, 213.0, 347.0, 496.0, 746.0, 1116.0, 1710.0, 2821.0, 4319.0, 7288.0, 12899.0, 25208.0, 72145.0, 835237.0, 39005.0, 18473.0, 10201.0, 5763.0, 3567.0, 2166.0, 1491.0, 973.0, 566.0, 424.0, 330.0, 199.0, 123.0, 76.0, 61.0, 44.0, 29.0, 17.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.591796875, -2.52227783203125, -2.4527587890625, -2.38323974609375, -2.313720703125, -2.24420166015625, -2.1746826171875, -2.10516357421875, -2.03564453125, -1.96612548828125, -1.8966064453125, -1.82708740234375, -1.757568359375, -1.68804931640625, -1.6185302734375, -1.54901123046875, -1.4794921875, -1.40997314453125, -1.3404541015625, -1.27093505859375, -1.201416015625, -1.13189697265625, -1.0623779296875, -0.99285888671875, -0.92333984375, -0.85382080078125, -0.7843017578125, -0.71478271484375, -0.645263671875, -0.57574462890625, -0.5062255859375, -0.43670654296875, -0.3671875, -0.29766845703125, -0.2281494140625, -0.15863037109375, -0.089111328125, -0.01959228515625, 0.0499267578125, 0.11944580078125, 0.18896484375, 0.25848388671875, 0.3280029296875, 0.39752197265625, 0.467041015625, 0.53656005859375, 0.6060791015625, 0.67559814453125, 0.7451171875, 0.81463623046875, 0.8841552734375, 0.95367431640625, 1.023193359375, 1.09271240234375, 1.1622314453125, 1.23175048828125, 1.30126953125, 1.37078857421875, 1.4403076171875, 1.50982666015625, 1.579345703125, 1.64886474609375, 1.7183837890625, 1.78790283203125, 1.857421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 11.0, 11.0, 129.0, 553.0, 116.0, 12.0, 13.0, 12.0, 6.0, 7.0, 5.0, 4.0, 8.0, 6.0, 2.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8037109375, -0.773284912109375, -0.74285888671875, -0.712432861328125, -0.6820068359375, -0.651580810546875, -0.62115478515625, -0.590728759765625, -0.560302734375, -0.529876708984375, -0.49945068359375, -0.469024658203125, -0.4385986328125, -0.408172607421875, -0.37774658203125, -0.347320556640625, -0.31689453125, -0.286468505859375, -0.25604248046875, -0.225616455078125, -0.1951904296875, -0.164764404296875, -0.13433837890625, -0.103912353515625, -0.073486328125, -0.043060302734375, -0.01263427734375, 0.017791748046875, 0.0482177734375, 0.078643798828125, 0.10906982421875, 0.139495849609375, 0.169921875, 0.200347900390625, 0.23077392578125, 0.261199951171875, 0.2916259765625, 0.322052001953125, 0.35247802734375, 0.382904052734375, 0.413330078125, 0.443756103515625, 0.47418212890625, 0.504608154296875, 0.5350341796875, 0.565460205078125, 0.59588623046875, 0.626312255859375, 0.65673828125, 0.687164306640625, 0.71759033203125, 0.748016357421875, 0.7784423828125, 0.808868408203125, 0.83929443359375, 0.869720458984375, 0.900146484375, 0.930572509765625, 0.96099853515625, 0.991424560546875, 1.0218505859375, 1.052276611328125, 1.08270263671875, 1.113128662109375, 1.1435546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 10.0, 6.0, 14.0, 17.0, 18.0, 22.0, 35.0, 53.0, 87.0, 119.0, 189.0, 351.0, 753.0, 1618.0, 3931.0, 11433.0, 39126.0, 176126.0, 576732.0, 179234.0, 39854.0, 11497.0, 3995.0, 1606.0, 714.0, 371.0, 213.0, 145.0, 92.0, 44.0, 31.0, 29.0, 19.0, 21.0, 11.0, 7.0, 8.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.4671630859375, -2.383544921875, -2.2999267578125, -2.21630859375, -2.1326904296875, -2.049072265625, -1.9654541015625, -1.8818359375, -1.7982177734375, -1.714599609375, -1.6309814453125, -1.54736328125, -1.4637451171875, -1.380126953125, -1.2965087890625, -1.212890625, -1.1292724609375, -1.045654296875, -0.9620361328125, -0.87841796875, -0.7947998046875, -0.711181640625, -0.6275634765625, -0.5439453125, -0.4603271484375, -0.376708984375, -0.2930908203125, -0.20947265625, -0.1258544921875, -0.042236328125, 0.0413818359375, 0.125, 0.2086181640625, 0.292236328125, 0.3758544921875, 0.45947265625, 0.5430908203125, 0.626708984375, 0.7103271484375, 0.7939453125, 0.8775634765625, 0.961181640625, 1.0447998046875, 1.12841796875, 1.2120361328125, 1.295654296875, 1.3792724609375, 1.462890625, 1.5465087890625, 1.630126953125, 1.7137451171875, 1.79736328125, 1.8809814453125, 1.964599609375, 2.0482177734375, 2.1318359375, 2.2154541015625, 2.299072265625, 2.3826904296875, 2.46630859375, 2.5499267578125, 2.633544921875, 2.7171630859375, 2.80078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 17.0, 31.0, 20.0, 20.0, 36.0, 24.0, 37.0, 29.0, 35.0, 34.0, 39.0, 42.0, 43.0, 43.0, 55.0, 55.0, 39.0, 52.0, 33.0, 42.0, 29.0, 28.0, 32.0, 25.0, 25.0, 25.0, 9.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0], "bins": [-4.734375, -4.611480712890625, -4.48858642578125, -4.365692138671875, -4.2427978515625, -4.119903564453125, -3.99700927734375, -3.874114990234375, -3.751220703125, -3.628326416015625, -3.50543212890625, -3.382537841796875, -3.2596435546875, -3.136749267578125, -3.01385498046875, -2.890960693359375, -2.76806640625, -2.645172119140625, -2.52227783203125, -2.399383544921875, -2.2764892578125, -2.153594970703125, -2.03070068359375, -1.907806396484375, -1.784912109375, -1.662017822265625, -1.53912353515625, -1.416229248046875, -1.2933349609375, -1.170440673828125, -1.04754638671875, -0.924652099609375, -0.8017578125, -0.678863525390625, -0.55596923828125, -0.433074951171875, -0.3101806640625, -0.187286376953125, -0.06439208984375, 0.058502197265625, 0.181396484375, 0.304290771484375, 0.42718505859375, 0.550079345703125, 0.6729736328125, 0.795867919921875, 0.91876220703125, 1.041656494140625, 1.16455078125, 1.287445068359375, 1.41033935546875, 1.533233642578125, 1.6561279296875, 1.779022216796875, 1.90191650390625, 2.024810791015625, 2.147705078125, 2.270599365234375, 2.39349365234375, 2.516387939453125, 2.6392822265625, 2.762176513671875, 2.88507080078125, 3.007965087890625, 3.130859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 14.0, 17.0, 31.0, 35.0, 62.0, 93.0, 150.0, 303.0, 522.0, 1226.0, 2982.0, 8955.0, 36460.0, 327064.0, 590653.0, 60423.0, 12429.0, 3998.0, 1610.0, 722.0, 342.0, 164.0, 114.0, 54.0, 26.0, 29.0, 24.0, 10.0, 8.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.340484619140625, -2.24737548828125, -2.154266357421875, -2.0611572265625, -1.968048095703125, -1.87493896484375, -1.781829833984375, -1.688720703125, -1.595611572265625, -1.50250244140625, -1.409393310546875, -1.3162841796875, -1.223175048828125, -1.13006591796875, -1.036956787109375, -0.94384765625, -0.850738525390625, -0.75762939453125, -0.664520263671875, -0.5714111328125, -0.478302001953125, -0.38519287109375, -0.292083740234375, -0.198974609375, -0.105865478515625, -0.01275634765625, 0.080352783203125, 0.1734619140625, 0.266571044921875, 0.35968017578125, 0.452789306640625, 0.5458984375, 0.639007568359375, 0.73211669921875, 0.825225830078125, 0.9183349609375, 1.011444091796875, 1.10455322265625, 1.197662353515625, 1.290771484375, 1.383880615234375, 1.47698974609375, 1.570098876953125, 1.6632080078125, 1.756317138671875, 1.84942626953125, 1.942535400390625, 2.03564453125, 2.128753662109375, 2.22186279296875, 2.314971923828125, 2.4080810546875, 2.501190185546875, 2.59429931640625, 2.687408447265625, 2.780517578125, 2.873626708984375, 2.96673583984375, 3.059844970703125, 3.1529541015625, 3.246063232421875, 3.33917236328125, 3.432281494140625, 3.525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 5.0, 11.0, 15.0, 23.0, 28.0, 39.0, 52.0, 62.0, 79.0, 68.0, 94.0, 91.0, 86.0, 60.0, 61.0, 41.0, 36.0, 40.0, 23.0, 14.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011790171265602112, -0.00011301785707473755, -0.00010813400149345398, -0.00010325014591217041, -9.836629033088684e-05, -9.348243474960327e-05, -8.85985791683197e-05, -8.371472358703613e-05, -7.883086800575256e-05, -7.3947012424469e-05, -6.906315684318542e-05, -6.417930126190186e-05, -5.9295445680618286e-05, -5.441159009933472e-05, -4.952773451805115e-05, -4.464387893676758e-05, -3.976002335548401e-05, -3.487616777420044e-05, -2.999231219291687e-05, -2.51084566116333e-05, -2.022460103034973e-05, -1.5340745449066162e-05, -1.0456889867782593e-05, -5.5730342864990234e-06, -6.891787052154541e-07, 4.194676876068115e-06, 9.078532457351685e-06, 1.3962388038635254e-05, 1.8846243619918823e-05, 2.3730099201202393e-05, 2.8613954782485962e-05, 3.349781036376953e-05, 3.83816659450531e-05, 4.326552152633667e-05, 4.814937710762024e-05, 5.303323268890381e-05, 5.791708827018738e-05, 6.280094385147095e-05, 6.768479943275452e-05, 7.256865501403809e-05, 7.745251059532166e-05, 8.233636617660522e-05, 8.72202217578888e-05, 9.210407733917236e-05, 9.698793292045593e-05, 0.0001018717885017395, 0.00010675564408302307, 0.00011163949966430664, 0.00011652335524559021, 0.00012140721082687378, 0.00012629106640815735, 0.00013117492198944092, 0.0001360587775707245, 0.00014094263315200806, 0.00014582648873329163, 0.0001507103443145752, 0.00015559419989585876, 0.00016047805547714233, 0.0001653619110584259, 0.00017024576663970947, 0.00017512962222099304, 0.0001800134778022766, 0.00018489733338356018, 0.00018978118896484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 16.0, 12.0, 24.0, 31.0, 64.0, 113.0, 197.0, 446.0, 1017.0, 2667.0, 9912.0, 73714.0, 773111.0, 164765.0, 16152.0, 3893.0, 1268.0, 544.0, 257.0, 142.0, 81.0, 46.0, 30.0, 12.0, 10.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.593963623046875, -4.46136474609375, -4.328765869140625, -4.1961669921875, -4.063568115234375, -3.93096923828125, -3.798370361328125, -3.665771484375, -3.533172607421875, -3.40057373046875, -3.267974853515625, -3.1353759765625, -3.002777099609375, -2.87017822265625, -2.737579345703125, -2.60498046875, -2.472381591796875, -2.33978271484375, -2.207183837890625, -2.0745849609375, -1.941986083984375, -1.80938720703125, -1.676788330078125, -1.544189453125, -1.411590576171875, -1.27899169921875, -1.146392822265625, -1.0137939453125, -0.881195068359375, -0.74859619140625, -0.615997314453125, -0.4833984375, -0.350799560546875, -0.21820068359375, -0.085601806640625, 0.0469970703125, 0.179595947265625, 0.31219482421875, 0.444793701171875, 0.577392578125, 0.709991455078125, 0.84259033203125, 0.975189208984375, 1.1077880859375, 1.240386962890625, 1.37298583984375, 1.505584716796875, 1.63818359375, 1.770782470703125, 1.90338134765625, 2.035980224609375, 2.1685791015625, 2.301177978515625, 2.43377685546875, 2.566375732421875, 2.698974609375, 2.831573486328125, 2.96417236328125, 3.096771240234375, 3.2293701171875, 3.361968994140625, 3.49456787109375, 3.627166748046875, 3.759765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 11.0, 20.0, 23.0, 38.0, 43.0, 47.0, 76.0, 86.0, 86.0, 114.0, 104.0, 89.0, 62.0, 47.0, 38.0, 33.0, 17.0, 18.0, 11.0, 13.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.326080322265625, -2.26153564453125, -2.196990966796875, -2.1324462890625, -2.067901611328125, -2.00335693359375, -1.938812255859375, -1.874267578125, -1.809722900390625, -1.74517822265625, -1.680633544921875, -1.6160888671875, -1.551544189453125, -1.48699951171875, -1.422454833984375, -1.35791015625, -1.293365478515625, -1.22882080078125, -1.164276123046875, -1.0997314453125, -1.035186767578125, -0.97064208984375, -0.906097412109375, -0.841552734375, -0.777008056640625, -0.71246337890625, -0.647918701171875, -0.5833740234375, -0.518829345703125, -0.45428466796875, -0.389739990234375, -0.3251953125, -0.260650634765625, -0.19610595703125, -0.131561279296875, -0.0670166015625, -0.002471923828125, 0.06207275390625, 0.126617431640625, 0.191162109375, 0.255706787109375, 0.32025146484375, 0.384796142578125, 0.4493408203125, 0.513885498046875, 0.57843017578125, 0.642974853515625, 0.70751953125, 0.772064208984375, 0.83660888671875, 0.901153564453125, 0.9656982421875, 1.030242919921875, 1.09478759765625, 1.159332275390625, 1.223876953125, 1.288421630859375, 1.35296630859375, 1.417510986328125, 1.4820556640625, 1.546600341796875, 1.61114501953125, 1.675689697265625, 1.740234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 16.0, 52.0, 371.0, 491.0, 59.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.24732971191406, -120.71041107177734, -117.17349243164062, -113.63656616210938, -110.09964752197266, -106.56272888183594, -103.02580261230469, -99.48888397216797, -95.95196533203125, -92.41504669189453, -88.87812805175781, -85.34120178222656, -81.80428314208984, -78.26736450195312, -74.73043823242188, -71.19351959228516, -67.65660095214844, -64.11968231201172, -60.582759857177734, -57.04583740234375, -53.50891876220703, -49.97200012207031, -46.43507766723633, -42.898155212402344, -39.361236572265625, -35.824317932128906, -32.28739547729492, -28.75047492980957, -25.21355438232422, -21.676633834838867, -18.139713287353516, -14.602792739868164, -11.065872192382812, -7.528951644897461, -3.9920310974121094, -0.4551105499267578, 3.0818099975585938, 6.618730545043945, 10.155651092529297, 13.692571640014648, 17.2294921875, 20.76641273498535, 24.303333282470703, 27.840253829956055, 31.377174377441406, 34.914093017578125, 38.45101547241211, 41.987937927246094, 45.52485656738281, 49.06177520751953, 52.598697662353516, 56.1356201171875, 59.67253875732422, 63.20945739746094, 66.74638366699219, 70.2833023071289, 73.82022094726562, 77.35713958740234, 80.89405822753906, 84.43098449707031, 87.96790313720703, 91.50482177734375, 95.041748046875, 98.57866668701172, 102.11558532714844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 3.0, 7.0, 9.0, 12.0, 20.0, 29.0, 38.0, 64.0, 109.0, 123.0, 150.0, 117.0, 87.0, 72.0, 36.0, 16.0, 12.0, 12.0, 15.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.0882339477539, -61.97610855102539, -59.863983154296875, -57.751861572265625, -55.63973617553711, -53.527610778808594, -51.41548538208008, -49.30335998535156, -47.19123840332031, -45.0791130065918, -42.96698760986328, -40.85486602783203, -38.742740631103516, -36.630615234375, -34.518489837646484, -32.40636444091797, -30.294239044189453, -28.182113647460938, -26.069990158081055, -23.95786476135254, -21.845741271972656, -19.73361587524414, -17.621490478515625, -15.509366035461426, -13.397241592407227, -11.285117149353027, -9.172992706298828, -7.0608673095703125, -4.948742866516113, -2.836618423461914, -0.7244930267333984, 1.3876314163208008, 3.499755859375, 5.611880302429199, 7.724005222320557, 9.836130142211914, 11.948254585266113, 14.060379028320312, 16.172504425048828, 18.284629821777344, 20.396753311157227, 22.508878707885742, 24.621002197265625, 26.73312759399414, 28.845252990722656, 30.95737648010254, 33.06950378417969, 35.18162536621094, 37.29375076293945, 39.40587615966797, 41.518001556396484, 43.630126953125, 45.74224853515625, 47.854373931884766, 49.96649932861328, 52.0786247253418, 54.19075012207031, 56.30287551879883, 58.415000915527344, 60.527122497558594, 62.63924789428711, 64.75137329101562, 66.86349487304688, 68.97562408447266, 71.0877456665039]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 6.0, 10.0, 14.0, 23.0, 46.0, 46.0, 71.0, 98.0, 121.0, 202.0, 299.0, 429.0, 677.0, 1101.0, 1763.0, 3029.0, 5592.0, 12177.0, 35067.0, 3594586.0, 486835.0, 29786.0, 10367.0, 4822.0, 2644.0, 1499.0, 941.0, 588.0, 432.0, 298.0, 203.0, 148.0, 77.0, 71.0, 44.0, 37.0, 29.0, 23.0, 17.0, 8.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.87890625, -7.65972900390625, -7.4405517578125, -7.22137451171875, -7.002197265625, -6.78302001953125, -6.5638427734375, -6.34466552734375, -6.12548828125, -5.90631103515625, -5.6871337890625, -5.46795654296875, -5.248779296875, -5.02960205078125, -4.8104248046875, -4.59124755859375, -4.3720703125, -4.15289306640625, -3.9337158203125, -3.71453857421875, -3.495361328125, -3.27618408203125, -3.0570068359375, -2.83782958984375, -2.61865234375, -2.39947509765625, -2.1802978515625, -1.96112060546875, -1.741943359375, -1.52276611328125, -1.3035888671875, -1.08441162109375, -0.865234375, -0.64605712890625, -0.4268798828125, -0.20770263671875, 0.011474609375, 0.23065185546875, 0.4498291015625, 0.66900634765625, 0.88818359375, 1.10736083984375, 1.3265380859375, 1.54571533203125, 1.764892578125, 1.98406982421875, 2.2032470703125, 2.42242431640625, 2.6416015625, 2.86077880859375, 3.0799560546875, 3.29913330078125, 3.518310546875, 3.73748779296875, 3.9566650390625, 4.17584228515625, 4.39501953125, 4.61419677734375, 4.8333740234375, 5.05255126953125, 5.271728515625, 5.49090576171875, 5.7100830078125, 5.92926025390625, 6.1484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 16.0, 14.0, 9.0, 19.0, 22.0, 140.0, 357.0, 244.0, 61.0, 19.0, 12.0, 12.0, 7.0, 8.0, 9.0, 6.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6816787719726562, -0.6529083251953125, -0.6241378784179688, -0.595367431640625, -0.5665969848632812, -0.5378265380859375, -0.5090560913085938, -0.48028564453125, -0.45151519775390625, -0.4227447509765625, -0.39397430419921875, -0.365203857421875, -0.33643341064453125, -0.3076629638671875, -0.27889251708984375, -0.2501220703125, -0.22135162353515625, -0.1925811767578125, -0.16381072998046875, -0.135040283203125, -0.10626983642578125, -0.0774993896484375, -0.04872894287109375, -0.01995849609375, 0.00881195068359375, 0.0375823974609375, 0.06635284423828125, 0.095123291015625, 0.12389373779296875, 0.1526641845703125, 0.18143463134765625, 0.210205078125, 0.23897552490234375, 0.2677459716796875, 0.29651641845703125, 0.325286865234375, 0.35405731201171875, 0.3828277587890625, 0.41159820556640625, 0.44036865234375, 0.46913909912109375, 0.4979095458984375, 0.5266799926757812, 0.555450439453125, 0.5842208862304688, 0.6129913330078125, 0.6417617797851562, 0.6705322265625, 0.6993026733398438, 0.7280731201171875, 0.7568435668945312, 0.785614013671875, 0.8143844604492188, 0.8431549072265625, 0.8719253540039062, 0.90069580078125, 0.9294662475585938, 0.9582366943359375, 0.9870071411132812, 1.015777587890625, 1.0445480346679688, 1.0733184814453125, 1.1020889282226562, 1.130859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 7.0, 17.0, 25.0, 33.0, 51.0, 61.0, 138.0, 222.0, 448.0, 988.0, 2234.0, 5843.0, 17948.0, 84015.0, 3640573.0, 383782.0, 40267.0, 10724.0, 3909.0, 1570.0, 654.0, 361.0, 167.0, 90.0, 48.0, 36.0, 22.0, 12.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.59552001953125, -7.3707275390625, -7.14593505859375, -6.921142578125, -6.69635009765625, -6.4715576171875, -6.24676513671875, -6.02197265625, -5.79718017578125, -5.5723876953125, -5.34759521484375, -5.122802734375, -4.89801025390625, -4.6732177734375, -4.44842529296875, -4.2236328125, -3.99884033203125, -3.7740478515625, -3.54925537109375, -3.324462890625, -3.09967041015625, -2.8748779296875, -2.65008544921875, -2.42529296875, -2.20050048828125, -1.9757080078125, -1.75091552734375, -1.526123046875, -1.30133056640625, -1.0765380859375, -0.85174560546875, -0.626953125, -0.40216064453125, -0.1773681640625, 0.04742431640625, 0.272216796875, 0.49700927734375, 0.7218017578125, 0.94659423828125, 1.17138671875, 1.39617919921875, 1.6209716796875, 1.84576416015625, 2.070556640625, 2.29534912109375, 2.5201416015625, 2.74493408203125, 2.9697265625, 3.19451904296875, 3.4193115234375, 3.64410400390625, 3.868896484375, 4.09368896484375, 4.3184814453125, 4.54327392578125, 4.76806640625, 4.99285888671875, 5.2176513671875, 5.44244384765625, 5.667236328125, 5.89202880859375, 6.1168212890625, 6.34161376953125, 6.56640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 14.0, 18.0, 14.0, 19.0, 33.0, 59.0, 93.0, 178.0, 325.0, 2147.0, 615.0, 214.0, 134.0, 66.0, 37.0, 30.0, 24.0, 20.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2167816162109375, -1.184539794921875, -1.1522979736328125, -1.12005615234375, -1.0878143310546875, -1.055572509765625, -1.0233306884765625, -0.9910888671875, -0.9588470458984375, -0.926605224609375, -0.8943634033203125, -0.86212158203125, -0.8298797607421875, -0.797637939453125, -0.7653961181640625, -0.733154296875, -0.7009124755859375, -0.668670654296875, -0.6364288330078125, -0.60418701171875, -0.5719451904296875, -0.539703369140625, -0.5074615478515625, -0.4752197265625, -0.4429779052734375, -0.410736083984375, -0.3784942626953125, -0.34625244140625, -0.3140106201171875, -0.281768798828125, -0.2495269775390625, -0.21728515625, -0.1850433349609375, -0.152801513671875, -0.1205596923828125, -0.08831787109375, -0.0560760498046875, -0.023834228515625, 0.0084075927734375, 0.0406494140625, 0.0728912353515625, 0.105133056640625, 0.1373748779296875, 0.16961669921875, 0.2018585205078125, 0.234100341796875, 0.2663421630859375, 0.298583984375, 0.3308258056640625, 0.363067626953125, 0.3953094482421875, 0.42755126953125, 0.4597930908203125, 0.492034912109375, 0.5242767333984375, 0.5565185546875, 0.5887603759765625, 0.621002197265625, 0.6532440185546875, 0.68548583984375, 0.7177276611328125, 0.749969482421875, 0.7822113037109375, 0.814453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 48.0, 169.0, 450.0, 246.0, 56.0, 16.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.364155769348145, -9.9586820602417, -9.553208351135254, -9.147734642028809, -8.742260932922363, -8.336787223815918, -7.9313130378723145, -7.525839328765869, -7.120365619659424, -6.7148919105529785, -6.309418201446533, -5.90394401550293, -5.498470306396484, -5.092996597290039, -4.687522888183594, -4.282049179077148, -3.876575469970703, -3.471101760864258, -3.0656280517578125, -2.660154104232788, -2.2546803951263428, -1.8492066860198975, -1.443732738494873, -1.0382590293884277, -0.6327853202819824, -0.22731155157089233, 0.17816221714019775, 0.5836360454559326, 0.9891097545623779, 1.3945834636688232, 1.8000574111938477, 2.205531120300293, 2.611003875732422, 3.016477584838867, 3.4219512939453125, 3.827425241470337, 4.232898712158203, 4.638372421264648, 5.043846607208252, 5.449320316314697, 5.854794025421143, 6.260267734527588, 6.665741443634033, 7.071215629577637, 7.476689338684082, 7.882163047790527, 8.287636756896973, 8.693110466003418, 9.098584175109863, 9.504057884216309, 9.909531593322754, 10.3150053024292, 10.720479011535645, 11.12595272064209, 11.531427383422852, 11.936901092529297, 12.342374801635742, 12.747848510742188, 13.153322219848633, 13.558795928955078, 13.964269638061523, 14.369743347167969, 14.775217056274414, 15.18069076538086, 15.586164474487305]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 10.0, 8.0, 11.0, 16.0, 15.0, 34.0, 34.0, 34.0, 44.0, 63.0, 80.0, 65.0, 75.0, 68.0, 55.0, 79.0, 43.0, 58.0, 37.0, 28.0, 24.0, 25.0, 19.0, 16.0, 11.0, 9.0, 2.0, 4.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.959841251373291, -3.85481333732605, -3.7497856616973877, -3.6447577476501465, -3.5397298336029053, -3.434701919555664, -3.329674243927002, -3.2246463298797607, -3.1196184158325195, -3.0145905017852783, -2.909562826156616, -2.804534912109375, -2.699506998062134, -2.5944790840148926, -2.4894514083862305, -2.3844234943389893, -2.279395818710327, -2.174367904663086, -2.069340229034424, -1.9643123149871826, -1.8592844009399414, -1.7542566061019897, -1.649228811264038, -1.5442008972167969, -1.4391731023788452, -1.3341453075408936, -1.2291173934936523, -1.1240895986557007, -1.019061803817749, -0.9140338897705078, -0.8090060949325562, -0.7039782404899597, -0.5989501476287842, -0.49392229318618774, -0.3888944685459137, -0.28386664390563965, -0.1788387894630432, -0.07381093502044678, 0.031216859817504883, 0.13624471426010132, 0.24127256870269775, 0.3463004231452942, 0.45132824778556824, 0.5563560724258423, 0.6613839268684387, 0.7664117813110352, 0.8714395761489868, 0.9764674305915833, 1.0814952850341797, 1.1865230798721313, 1.2915509939193726, 1.3965787887573242, 1.5016067028045654, 1.606634497642517, 1.7116622924804688, 1.81669020652771, 1.9217180013656616, 2.0267457962036133, 2.1317737102508545, 2.2368016242980957, 2.341829299926758, 2.446857213973999, 2.5518851280212402, 2.6569128036499023, 2.7619407176971436]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 12.0, 8.0, 12.0, 16.0, 21.0, 24.0, 30.0, 46.0, 55.0, 94.0, 142.0, 164.0, 233.0, 374.0, 569.0, 936.0, 1510.0, 2494.0, 4326.0, 8399.0, 19191.0, 71619.0, 816896.0, 81192.0, 20206.0, 8621.0, 4401.0, 2520.0, 1565.0, 1001.0, 620.0, 359.0, 273.0, 193.0, 120.0, 93.0, 64.0, 38.0, 29.0, 28.0, 17.0, 13.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.9375, -4.79022216796875, -4.6429443359375, -4.49566650390625, -4.348388671875, -4.20111083984375, -4.0538330078125, -3.90655517578125, -3.75927734375, -3.61199951171875, -3.4647216796875, -3.31744384765625, -3.170166015625, -3.02288818359375, -2.8756103515625, -2.72833251953125, -2.5810546875, -2.43377685546875, -2.2864990234375, -2.13922119140625, -1.991943359375, -1.84466552734375, -1.6973876953125, -1.55010986328125, -1.40283203125, -1.25555419921875, -1.1082763671875, -0.96099853515625, -0.813720703125, -0.66644287109375, -0.5191650390625, -0.37188720703125, -0.224609375, -0.07733154296875, 0.0699462890625, 0.21722412109375, 0.364501953125, 0.51177978515625, 0.6590576171875, 0.80633544921875, 0.95361328125, 1.10089111328125, 1.2481689453125, 1.39544677734375, 1.542724609375, 1.69000244140625, 1.8372802734375, 1.98455810546875, 2.1318359375, 2.27911376953125, 2.4263916015625, 2.57366943359375, 2.720947265625, 2.86822509765625, 3.0155029296875, 3.16278076171875, 3.31005859375, 3.45733642578125, 3.6046142578125, 3.75189208984375, 3.899169921875, 4.04644775390625, 4.1937255859375, 4.34100341796875, 4.48828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 10.0, 3.0, 7.0, 18.0, 13.0, 27.0, 80.0, 221.0, 335.0, 161.0, 35.0, 19.0, 8.0, 11.0, 13.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7085494995117188, -0.6793060302734375, -0.6500625610351562, -0.620819091796875, -0.5915756225585938, -0.5623321533203125, -0.5330886840820312, -0.50384521484375, -0.47460174560546875, -0.4453582763671875, -0.41611480712890625, -0.386871337890625, -0.35762786865234375, -0.3283843994140625, -0.29914093017578125, -0.2698974609375, -0.24065399169921875, -0.2114105224609375, -0.18216705322265625, -0.152923583984375, -0.12368011474609375, -0.0944366455078125, -0.06519317626953125, -0.03594970703125, -0.00670623779296875, 0.0225372314453125, 0.05178070068359375, 0.081024169921875, 0.11026763916015625, 0.1395111083984375, 0.16875457763671875, 0.197998046875, 0.22724151611328125, 0.2564849853515625, 0.28572845458984375, 0.314971923828125, 0.34421539306640625, 0.3734588623046875, 0.40270233154296875, 0.43194580078125, 0.46118927001953125, 0.4904327392578125, 0.5196762084960938, 0.548919677734375, 0.5781631469726562, 0.6074066162109375, 0.6366500854492188, 0.6658935546875, 0.6951370239257812, 0.7243804931640625, 0.7536239624023438, 0.782867431640625, 0.8121109008789062, 0.8413543701171875, 0.8705978393554688, 0.89984130859375, 0.9290847778320312, 0.9583282470703125, 0.9875717163085938, 1.016815185546875, 1.0460586547851562, 1.0753021240234375, 1.1045455932617188, 1.1337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 11.0, 28.0, 39.0, 50.0, 93.0, 130.0, 266.0, 508.0, 1103.0, 2501.0, 6683.0, 23871.0, 171364.0, 706805.0, 109010.0, 17475.0, 4996.0, 1870.0, 804.0, 399.0, 209.0, 116.0, 74.0, 50.0, 24.0, 9.0, 13.0, 15.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.33843994140625, -4.2003173828125, -4.06219482421875, -3.924072265625, -3.78594970703125, -3.6478271484375, -3.50970458984375, -3.37158203125, -3.23345947265625, -3.0953369140625, -2.95721435546875, -2.819091796875, -2.68096923828125, -2.5428466796875, -2.40472412109375, -2.2666015625, -2.12847900390625, -1.9903564453125, -1.85223388671875, -1.714111328125, -1.57598876953125, -1.4378662109375, -1.29974365234375, -1.16162109375, -1.02349853515625, -0.8853759765625, -0.74725341796875, -0.609130859375, -0.47100830078125, -0.3328857421875, -0.19476318359375, -0.056640625, 0.08148193359375, 0.2196044921875, 0.35772705078125, 0.495849609375, 0.63397216796875, 0.7720947265625, 0.91021728515625, 1.04833984375, 1.18646240234375, 1.3245849609375, 1.46270751953125, 1.600830078125, 1.73895263671875, 1.8770751953125, 2.01519775390625, 2.1533203125, 2.29144287109375, 2.4295654296875, 2.56768798828125, 2.705810546875, 2.84393310546875, 2.9820556640625, 3.12017822265625, 3.25830078125, 3.39642333984375, 3.5345458984375, 3.67266845703125, 3.810791015625, 3.94891357421875, 4.0870361328125, 4.22515869140625, 4.36328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 10.0, 7.0, 17.0, 20.0, 29.0, 33.0, 30.0, 59.0, 46.0, 50.0, 54.0, 50.0, 56.0, 57.0, 49.0, 59.0, 57.0, 52.0, 55.0, 33.0, 38.0, 24.0, 20.0, 13.0, 17.0, 9.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.311767578125, -2.23095703125, -2.150146484375, -2.0693359375, -1.988525390625, -1.90771484375, -1.826904296875, -1.74609375, -1.665283203125, -1.58447265625, -1.503662109375, -1.4228515625, -1.342041015625, -1.26123046875, -1.180419921875, -1.099609375, -1.018798828125, -0.93798828125, -0.857177734375, -0.7763671875, -0.695556640625, -0.61474609375, -0.533935546875, -0.453125, -0.372314453125, -0.29150390625, -0.210693359375, -0.1298828125, -0.049072265625, 0.03173828125, 0.112548828125, 0.193359375, 0.274169921875, 0.35498046875, 0.435791015625, 0.5166015625, 0.597412109375, 0.67822265625, 0.759033203125, 0.83984375, 0.920654296875, 1.00146484375, 1.082275390625, 1.1630859375, 1.243896484375, 1.32470703125, 1.405517578125, 1.486328125, 1.567138671875, 1.64794921875, 1.728759765625, 1.8095703125, 1.890380859375, 1.97119140625, 2.052001953125, 2.1328125, 2.213623046875, 2.29443359375, 2.375244140625, 2.4560546875, 2.536865234375, 2.61767578125, 2.698486328125, 2.779296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 2.0, 4.0, 6.0, 13.0, 16.0, 27.0, 33.0, 42.0, 83.0, 96.0, 158.0, 200.0, 344.0, 504.0, 855.0, 1437.0, 2501.0, 5119.0, 10919.0, 28276.0, 93382.0, 376147.0, 382392.0, 94680.0, 28702.0, 11088.0, 5105.0, 2602.0, 1454.0, 860.0, 455.0, 328.0, 231.0, 145.0, 90.0, 72.0, 41.0, 30.0, 31.0, 22.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.865234375, -2.769744873046875, -2.67425537109375, -2.578765869140625, -2.4832763671875, -2.387786865234375, -2.29229736328125, -2.196807861328125, -2.101318359375, -2.005828857421875, -1.91033935546875, -1.814849853515625, -1.7193603515625, -1.623870849609375, -1.52838134765625, -1.432891845703125, -1.33740234375, -1.241912841796875, -1.14642333984375, -1.050933837890625, -0.9554443359375, -0.859954833984375, -0.76446533203125, -0.668975830078125, -0.573486328125, -0.477996826171875, -0.38250732421875, -0.287017822265625, -0.1915283203125, -0.096038818359375, -0.00054931640625, 0.094940185546875, 0.1904296875, 0.285919189453125, 0.38140869140625, 0.476898193359375, 0.5723876953125, 0.667877197265625, 0.76336669921875, 0.858856201171875, 0.954345703125, 1.049835205078125, 1.14532470703125, 1.240814208984375, 1.3363037109375, 1.431793212890625, 1.52728271484375, 1.622772216796875, 1.71826171875, 1.813751220703125, 1.90924072265625, 2.004730224609375, 2.1002197265625, 2.195709228515625, 2.29119873046875, 2.386688232421875, 2.482177734375, 2.577667236328125, 2.67315673828125, 2.768646240234375, 2.8641357421875, 2.959625244140625, 3.05511474609375, 3.150604248046875, 3.24609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 10.0, 15.0, 18.0, 32.0, 63.0, 120.0, 213.0, 187.0, 140.0, 76.0, 41.0, 24.0, 14.0, 9.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006275177001953125, -0.0006133057177066803, -0.0005990937352180481, -0.0005848817527294159, -0.0005706697702407837, -0.0005564577877521515, -0.0005422458052635193, -0.0005280338227748871, -0.0005138218402862549, -0.0004996098577976227, -0.0004853978753089905, -0.0004711858928203583, -0.0004569739103317261, -0.00044276192784309387, -0.00042854994535446167, -0.00041433796286582947, -0.00040012598037719727, -0.00038591399788856506, -0.00037170201539993286, -0.00035749003291130066, -0.00034327805042266846, -0.00032906606793403625, -0.00031485408544540405, -0.00030064210295677185, -0.00028643012046813965, -0.00027221813797950745, -0.00025800615549087524, -0.00024379417300224304, -0.00022958219051361084, -0.00021537020802497864, -0.00020115822553634644, -0.00018694624304771423, -0.00017273426055908203, -0.00015852227807044983, -0.00014431029558181763, -0.00013009831309318542, -0.00011588633060455322, -0.00010167434811592102, -8.746236562728882e-05, -7.325038313865662e-05, -5.9038400650024414e-05, -4.482641816139221e-05, -3.061443567276001e-05, -1.6402453184127808e-05, -2.1904706954956055e-06, 1.2021511793136597e-05, 2.62334942817688e-05, 4.0445476770401e-05, 5.46574592590332e-05, 6.88694417476654e-05, 8.308142423629761e-05, 9.729340672492981e-05, 0.00011150538921356201, 0.00012571737170219421, 0.00013992935419082642, 0.00015414133667945862, 0.00016835331916809082, 0.00018256530165672302, 0.00019677728414535522, 0.00021098926663398743, 0.00022520124912261963, 0.00023941323161125183, 0.00025362521409988403, 0.00026783719658851624, 0.00028204917907714844]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 6.0, 6.0, 9.0, 21.0, 24.0, 28.0, 27.0, 60.0, 98.0, 135.0, 220.0, 373.0, 653.0, 1156.0, 2226.0, 4661.0, 10747.0, 30802.0, 114591.0, 448379.0, 320218.0, 75375.0, 22356.0, 8429.0, 3635.0, 1818.0, 1024.0, 544.0, 312.0, 190.0, 119.0, 85.0, 53.0, 45.0, 30.0, 24.0, 16.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.2236328125, -3.119140625, -3.0146484375, -2.91015625, -2.8056640625, -2.701171875, -2.5966796875, -2.4921875, -2.3876953125, -2.283203125, -2.1787109375, -2.07421875, -1.9697265625, -1.865234375, -1.7607421875, -1.65625, -1.5517578125, -1.447265625, -1.3427734375, -1.23828125, -1.1337890625, -1.029296875, -0.9248046875, -0.8203125, -0.7158203125, -0.611328125, -0.5068359375, -0.40234375, -0.2978515625, -0.193359375, -0.0888671875, 0.015625, 0.1201171875, 0.224609375, 0.3291015625, 0.43359375, 0.5380859375, 0.642578125, 0.7470703125, 0.8515625, 0.9560546875, 1.060546875, 1.1650390625, 1.26953125, 1.3740234375, 1.478515625, 1.5830078125, 1.6875, 1.7919921875, 1.896484375, 2.0009765625, 2.10546875, 2.2099609375, 2.314453125, 2.4189453125, 2.5234375, 2.6279296875, 2.732421875, 2.8369140625, 2.94140625, 3.0458984375, 3.150390625, 3.2548828125, 3.359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 8.0, 11.0, 11.0, 9.0, 25.0, 19.0, 38.0, 43.0, 48.0, 59.0, 58.0, 97.0, 82.0, 70.0, 70.0, 54.0, 46.0, 47.0, 37.0, 35.0, 26.0, 21.0, 21.0, 9.0, 9.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.79913330078125, -1.7388916015625, -1.67864990234375, -1.618408203125, -1.55816650390625, -1.4979248046875, -1.43768310546875, -1.37744140625, -1.31719970703125, -1.2569580078125, -1.19671630859375, -1.136474609375, -1.07623291015625, -1.0159912109375, -0.95574951171875, -0.8955078125, -0.83526611328125, -0.7750244140625, -0.71478271484375, -0.654541015625, -0.59429931640625, -0.5340576171875, -0.47381591796875, -0.41357421875, -0.35333251953125, -0.2930908203125, -0.23284912109375, -0.172607421875, -0.11236572265625, -0.0521240234375, 0.00811767578125, 0.068359375, 0.12860107421875, 0.1888427734375, 0.24908447265625, 0.309326171875, 0.36956787109375, 0.4298095703125, 0.49005126953125, 0.55029296875, 0.61053466796875, 0.6707763671875, 0.73101806640625, 0.791259765625, 0.85150146484375, 0.9117431640625, 0.97198486328125, 1.0322265625, 1.09246826171875, 1.1527099609375, 1.21295166015625, 1.273193359375, 1.33343505859375, 1.3936767578125, 1.45391845703125, 1.51416015625, 1.57440185546875, 1.6346435546875, 1.69488525390625, 1.755126953125, 1.81536865234375, 1.8756103515625, 1.93585205078125, 1.99609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 24.0, 46.0, 92.0, 181.0, 258.0, 190.0, 110.0, 47.0, 24.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.348005294799805, -16.413665771484375, -15.479326248168945, -14.544986724853516, -13.610647201538086, -12.676307678222656, -11.741968154907227, -10.807628631591797, -9.873289108276367, -8.938949584960938, -8.004610061645508, -7.070270538330078, -6.135931015014648, -5.201591491699219, -4.267251968383789, -3.3329124450683594, -2.3985729217529297, -1.4642333984375, -0.5298938751220703, 0.4044456481933594, 1.338785171508789, 2.2731246948242188, 3.2074642181396484, 4.141803741455078, 5.076143264770508, 6.0104827880859375, 6.944822311401367, 7.879161834716797, 8.813501358032227, 9.747840881347656, 10.682180404663086, 11.616519927978516, 12.550857543945312, 13.485197067260742, 14.419536590576172, 15.353876113891602, 16.28821563720703, 17.22255516052246, 18.15689468383789, 19.09123420715332, 20.02557373046875, 20.95991325378418, 21.89425277709961, 22.82859230041504, 23.76293182373047, 24.6972713470459, 25.631610870361328, 26.565950393676758, 27.500289916992188, 28.434629440307617, 29.368968963623047, 30.303308486938477, 31.237648010253906, 32.17198944091797, 33.106327056884766, 34.04066467285156, 34.975006103515625, 35.90934753417969, 36.843685150146484, 37.77802276611328, 38.712364196777344, 39.646705627441406, 40.5810432434082, 41.515380859375, 42.44972229003906]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 12.0, 11.0, 11.0, 15.0, 22.0, 31.0, 34.0, 48.0, 43.0, 50.0, 63.0, 81.0, 68.0, 64.0, 69.0, 61.0, 57.0, 71.0, 40.0, 28.0, 26.0, 28.0, 13.0, 10.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.886821746826172, -17.308025360107422, -16.729228973388672, -16.150432586669922, -15.571636199951172, -14.992839813232422, -14.414044380187988, -13.835247993469238, -13.256451606750488, -12.677655220031738, -12.098858833312988, -11.520062446594238, -10.941267013549805, -10.362470626831055, -9.783674240112305, -9.204877853393555, -8.626081466674805, -8.047285079956055, -7.468488693237305, -6.889692783355713, -6.310896396636963, -5.732100009918213, -5.153304100036621, -4.574507713317871, -3.995711326599121, -3.416914939880371, -2.8381187915802, -2.2593226432800293, -1.6805262565612793, -1.1017298698425293, -0.5229337215423584, 0.0558624267578125, 0.6346588134765625, 1.213455080986023, 1.7922513484954834, 2.3710474967956543, 2.9498438835144043, 3.5286402702331543, 4.107436180114746, 4.686232566833496, 5.265028953552246, 5.843825340270996, 6.422621726989746, 7.001417636871338, 7.580214023590088, 8.15900993347168, 8.73780632019043, 9.31660270690918, 9.89539909362793, 10.47419548034668, 11.05299186706543, 11.63178825378418, 12.21058464050293, 12.78938102722168, 13.368176460266113, 13.946972846984863, 14.525769233703613, 15.104565620422363, 15.683362007141113, 16.262157440185547, 16.840953826904297, 17.419750213623047, 17.998546600341797, 18.577342987060547, 19.156139373779297]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 22.0, 21.0, 42.0, 51.0, 77.0, 100.0, 145.0, 225.0, 355.0, 448.0, 753.0, 1253.0, 2364.0, 4718.0, 11505.0, 45814.0, 3873722.0, 217062.0, 20971.0, 7079.0, 3088.0, 1709.0, 954.0, 607.0, 369.0, 256.0, 156.0, 111.0, 72.0, 65.0, 35.0, 22.0, 22.0, 12.0, 19.0, 6.0, 9.0, 3.0, 4.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9921875, -11.6370849609375, -11.281982421875, -10.9268798828125, -10.57177734375, -10.2166748046875, -9.861572265625, -9.5064697265625, -9.1513671875, -8.7962646484375, -8.441162109375, -8.0860595703125, -7.73095703125, -7.3758544921875, -7.020751953125, -6.6656494140625, -6.310546875, -5.9554443359375, -5.600341796875, -5.2452392578125, -4.89013671875, -4.5350341796875, -4.179931640625, -3.8248291015625, -3.4697265625, -3.1146240234375, -2.759521484375, -2.4044189453125, -2.04931640625, -1.6942138671875, -1.339111328125, -0.9840087890625, -0.62890625, -0.2738037109375, 0.081298828125, 0.4364013671875, 0.79150390625, 1.1466064453125, 1.501708984375, 1.8568115234375, 2.2119140625, 2.5670166015625, 2.922119140625, 3.2772216796875, 3.63232421875, 3.9874267578125, 4.342529296875, 4.6976318359375, 5.052734375, 5.4078369140625, 5.762939453125, 6.1180419921875, 6.47314453125, 6.8282470703125, 7.183349609375, 7.5384521484375, 7.8935546875, 8.2486572265625, 8.603759765625, 8.9588623046875, 9.31396484375, 9.6690673828125, 10.024169921875, 10.3792724609375, 10.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 11.0, 7.0, 18.0, 31.0, 54.0, 171.0, 287.0, 208.0, 101.0, 31.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7702255249023438, -0.7401580810546875, -0.7100906372070312, -0.680023193359375, -0.6499557495117188, -0.6198883056640625, -0.5898208618164062, -0.55975341796875, -0.5296859741210938, -0.4996185302734375, -0.46955108642578125, -0.439483642578125, -0.40941619873046875, -0.3793487548828125, -0.34928131103515625, -0.3192138671875, -0.28914642333984375, -0.2590789794921875, -0.22901153564453125, -0.198944091796875, -0.16887664794921875, -0.1388092041015625, -0.10874176025390625, -0.07867431640625, -0.04860687255859375, -0.0185394287109375, 0.01152801513671875, 0.041595458984375, 0.07166290283203125, 0.1017303466796875, 0.13179779052734375, 0.161865234375, 0.19193267822265625, 0.2220001220703125, 0.25206756591796875, 0.282135009765625, 0.31220245361328125, 0.3422698974609375, 0.37233734130859375, 0.40240478515625, 0.43247222900390625, 0.4625396728515625, 0.49260711669921875, 0.522674560546875, 0.5527420043945312, 0.5828094482421875, 0.6128768920898438, 0.6429443359375, 0.6730117797851562, 0.7030792236328125, 0.7331466674804688, 0.763214111328125, 0.7932815551757812, 0.8233489990234375, 0.8534164428710938, 0.88348388671875, 0.9135513305664062, 0.9436187744140625, 0.9736862182617188, 1.003753662109375, 1.0338211059570312, 1.0638885498046875, 1.0939559936523438, 1.1240234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 19.0, 34.0, 48.0, 86.0, 181.0, 335.0, 702.0, 1723.0, 4663.0, 15274.0, 63631.0, 653954.0, 3311489.0, 108230.0, 22858.0, 6786.0, 2382.0, 972.0, 400.0, 211.0, 118.0, 68.0, 36.0, 25.0, 10.0, 5.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.6072998046875, -8.339599609375, -8.0718994140625, -7.80419921875, -7.5364990234375, -7.268798828125, -7.0010986328125, -6.7333984375, -6.4656982421875, -6.197998046875, -5.9302978515625, -5.66259765625, -5.3948974609375, -5.127197265625, -4.8594970703125, -4.591796875, -4.3240966796875, -4.056396484375, -3.7886962890625, -3.52099609375, -3.2532958984375, -2.985595703125, -2.7178955078125, -2.4501953125, -2.1824951171875, -1.914794921875, -1.6470947265625, -1.37939453125, -1.1116943359375, -0.843994140625, -0.5762939453125, -0.30859375, -0.0408935546875, 0.226806640625, 0.4945068359375, 0.76220703125, 1.0299072265625, 1.297607421875, 1.5653076171875, 1.8330078125, 2.1007080078125, 2.368408203125, 2.6361083984375, 2.90380859375, 3.1715087890625, 3.439208984375, 3.7069091796875, 3.974609375, 4.2423095703125, 4.510009765625, 4.7777099609375, 5.04541015625, 5.3131103515625, 5.580810546875, 5.8485107421875, 6.1162109375, 6.3839111328125, 6.651611328125, 6.9193115234375, 7.18701171875, 7.4547119140625, 7.722412109375, 7.9901123046875, 8.2578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 7.0, 13.0, 20.0, 11.0, 25.0, 33.0, 50.0, 58.0, 112.0, 172.0, 293.0, 640.0, 1705.0, 383.0, 157.0, 111.0, 69.0, 45.0, 43.0, 27.0, 21.0, 11.0, 15.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.203125, -1.169891357421875, -1.13665771484375, -1.103424072265625, -1.0701904296875, -1.036956787109375, -1.00372314453125, -0.970489501953125, -0.937255859375, -0.904022216796875, -0.87078857421875, -0.837554931640625, -0.8043212890625, -0.771087646484375, -0.73785400390625, -0.704620361328125, -0.67138671875, -0.638153076171875, -0.60491943359375, -0.571685791015625, -0.5384521484375, -0.505218505859375, -0.47198486328125, -0.438751220703125, -0.405517578125, -0.372283935546875, -0.33905029296875, -0.305816650390625, -0.2725830078125, -0.239349365234375, -0.20611572265625, -0.172882080078125, -0.1396484375, -0.106414794921875, -0.07318115234375, -0.039947509765625, -0.0067138671875, 0.026519775390625, 0.05975341796875, 0.092987060546875, 0.126220703125, 0.159454345703125, 0.19268798828125, 0.225921630859375, 0.2591552734375, 0.292388916015625, 0.32562255859375, 0.358856201171875, 0.39208984375, 0.425323486328125, 0.45855712890625, 0.491790771484375, 0.5250244140625, 0.558258056640625, 0.59149169921875, 0.624725341796875, 0.657958984375, 0.691192626953125, 0.72442626953125, 0.757659912109375, 0.7908935546875, 0.824127197265625, 0.85736083984375, 0.890594482421875, 0.923828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 12.0, 30.0, 42.0, 113.0, 169.0, 245.0, 185.0, 96.0, 51.0, 26.0, 15.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.81429672241211, -16.46824836730957, -16.1221981048584, -15.776148796081543, -15.430099487304688, -15.084050178527832, -14.738000869750977, -14.391952514648438, -14.045902252197266, -13.69985294342041, -13.353803634643555, -13.0077543258667, -12.661705017089844, -12.315655708312988, -11.969606399536133, -11.623558044433594, -11.277508735656738, -10.931459426879883, -10.585410118103027, -10.239360809326172, -9.893311500549316, -9.547262191772461, -9.201213836669922, -8.85516357421875, -8.509115219116211, -8.163065910339355, -7.8170166015625, -7.4709672927856445, -7.124917984008789, -6.778868675231934, -6.432819843292236, -6.086770534515381, -5.740721702575684, -5.394672393798828, -5.048623085021973, -4.702573776245117, -4.356524467468262, -4.010475158691406, -3.664426326751709, -3.3183770179748535, -2.972327709197998, -2.6262784004211426, -2.280229091644287, -1.9341800212860107, -1.5881307125091553, -1.2420814037322998, -0.8960323333740234, -0.549983024597168, -0.2039337158203125, 0.1421155333518982, 0.4881647825241089, 0.8342139720916748, 1.1802632808685303, 1.5263125896453857, 1.872361660003662, 2.2184109687805176, 2.564460277557373, 2.9105095863342285, 3.256558895111084, 3.6026079654693604, 3.948657274246216, 4.294706344604492, 4.640755653381348, 4.986804962158203, 5.332854270935059]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 7.0, 6.0, 10.0, 14.0, 13.0, 14.0, 24.0, 21.0, 34.0, 28.0, 25.0, 27.0, 36.0, 40.0, 36.0, 47.0, 43.0, 34.0, 40.0, 35.0, 40.0, 46.0, 34.0, 34.0, 32.0, 42.0, 41.0, 23.0, 25.0, 20.0, 28.0, 14.0, 14.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2092902660369873, -3.1037561893463135, -2.9982218742370605, -2.8926877975463867, -2.787153720855713, -2.681619644165039, -2.5760855674743652, -2.4705512523651123, -2.3650171756744385, -2.2594830989837646, -2.1539487838745117, -2.048414707183838, -1.942880630493164, -1.8373465538024902, -1.7318123579025269, -1.6262781620025635, -1.5207440853118896, -1.4152100086212158, -1.3096758127212524, -1.204141616821289, -1.0986075401306152, -0.9930734038352966, -0.887539267539978, -0.7820051312446594, -0.6764709949493408, -0.5709368586540222, -0.4654027223587036, -0.359868586063385, -0.2543344497680664, -0.1488003134727478, -0.0432661771774292, 0.062267959117889404, 0.1678023338317871, 0.2733364701271057, 0.3788706064224243, 0.4844047427177429, 0.5899388790130615, 0.6954730153083801, 0.8010071516036987, 0.9065412878990173, 1.012075424194336, 1.1176095008850098, 1.2231436967849731, 1.3286778926849365, 1.4342119693756104, 1.5397460460662842, 1.6452802419662476, 1.750814437866211, 1.8563485145568848, 1.9618825912475586, 2.0674166679382324, 2.1729509830474854, 2.278485059738159, 2.384019136428833, 2.489553451538086, 2.5950875282287598, 2.7006216049194336, 2.8061556816101074, 2.9116897583007812, 3.017224073410034, 3.122758150100708, 3.228292226791382, 3.3338265419006348, 3.4393606185913086, 3.5448946952819824]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 13.0, 16.0, 19.0, 24.0, 31.0, 54.0, 73.0, 87.0, 109.0, 153.0, 238.0, 350.0, 523.0, 720.0, 1019.0, 1721.0, 2740.0, 5000.0, 10529.0, 28765.0, 145161.0, 653135.0, 145427.0, 28923.0, 10583.0, 5234.0, 2829.0, 1640.0, 1092.0, 681.0, 472.0, 340.0, 252.0, 166.0, 129.0, 90.0, 56.0, 38.0, 37.0, 22.0, 16.0, 13.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.953125, -5.76995849609375, -5.5867919921875, -5.40362548828125, -5.220458984375, -5.03729248046875, -4.8541259765625, -4.67095947265625, -4.48779296875, -4.30462646484375, -4.1214599609375, -3.93829345703125, -3.755126953125, -3.57196044921875, -3.3887939453125, -3.20562744140625, -3.0224609375, -2.83929443359375, -2.6561279296875, -2.47296142578125, -2.289794921875, -2.10662841796875, -1.9234619140625, -1.74029541015625, -1.55712890625, -1.37396240234375, -1.1907958984375, -1.00762939453125, -0.824462890625, -0.64129638671875, -0.4581298828125, -0.27496337890625, -0.091796875, 0.09136962890625, 0.2745361328125, 0.45770263671875, 0.640869140625, 0.82403564453125, 1.0072021484375, 1.19036865234375, 1.37353515625, 1.55670166015625, 1.7398681640625, 1.92303466796875, 2.106201171875, 2.28936767578125, 2.4725341796875, 2.65570068359375, 2.8388671875, 3.02203369140625, 3.2052001953125, 3.38836669921875, 3.571533203125, 3.75469970703125, 3.9378662109375, 4.12103271484375, 4.30419921875, 4.48736572265625, 4.6705322265625, 4.85369873046875, 5.036865234375, 5.22003173828125, 5.4031982421875, 5.58636474609375, 5.76953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 8.0, 23.0, 39.0, 100.0, 181.0, 232.0, 184.0, 106.0, 40.0, 22.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.771484375, -0.74224853515625, -0.7130126953125, -0.68377685546875, -0.654541015625, -0.62530517578125, -0.5960693359375, -0.56683349609375, -0.53759765625, -0.50836181640625, -0.4791259765625, -0.44989013671875, -0.420654296875, -0.39141845703125, -0.3621826171875, -0.33294677734375, -0.3037109375, -0.27447509765625, -0.2452392578125, -0.21600341796875, -0.186767578125, -0.15753173828125, -0.1282958984375, -0.09906005859375, -0.06982421875, -0.04058837890625, -0.0113525390625, 0.01788330078125, 0.047119140625, 0.07635498046875, 0.1055908203125, 0.13482666015625, 0.1640625, 0.19329833984375, 0.2225341796875, 0.25177001953125, 0.281005859375, 0.31024169921875, 0.3394775390625, 0.36871337890625, 0.39794921875, 0.42718505859375, 0.4564208984375, 0.48565673828125, 0.514892578125, 0.54412841796875, 0.5733642578125, 0.60260009765625, 0.6318359375, 0.66107177734375, 0.6903076171875, 0.71954345703125, 0.748779296875, 0.77801513671875, 0.8072509765625, 0.83648681640625, 0.86572265625, 0.89495849609375, 0.9241943359375, 0.95343017578125, 0.982666015625, 1.01190185546875, 1.0411376953125, 1.07037353515625, 1.099609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 2.0, 9.0, 9.0, 12.0, 15.0, 29.0, 34.0, 36.0, 81.0, 99.0, 124.0, 249.0, 370.0, 654.0, 1230.0, 2689.0, 6844.0, 21901.0, 87491.0, 390794.0, 407232.0, 93030.0, 22956.0, 6888.0, 2684.0, 1278.0, 681.0, 363.0, 239.0, 175.0, 93.0, 64.0, 48.0, 44.0, 25.0, 17.0, 12.0, 11.0, 9.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.48046875, -6.29541015625, -6.1103515625, -5.92529296875, -5.740234375, -5.55517578125, -5.3701171875, -5.18505859375, -5.0, -4.81494140625, -4.6298828125, -4.44482421875, -4.259765625, -4.07470703125, -3.8896484375, -3.70458984375, -3.51953125, -3.33447265625, -3.1494140625, -2.96435546875, -2.779296875, -2.59423828125, -2.4091796875, -2.22412109375, -2.0390625, -1.85400390625, -1.6689453125, -1.48388671875, -1.298828125, -1.11376953125, -0.9287109375, -0.74365234375, -0.55859375, -0.37353515625, -0.1884765625, -0.00341796875, 0.181640625, 0.36669921875, 0.5517578125, 0.73681640625, 0.921875, 1.10693359375, 1.2919921875, 1.47705078125, 1.662109375, 1.84716796875, 2.0322265625, 2.21728515625, 2.40234375, 2.58740234375, 2.7724609375, 2.95751953125, 3.142578125, 3.32763671875, 3.5126953125, 3.69775390625, 3.8828125, 4.06787109375, 4.2529296875, 4.43798828125, 4.623046875, 4.80810546875, 4.9931640625, 5.17822265625, 5.36328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 5.0, 13.0, 9.0, 19.0, 23.0, 13.0, 29.0, 29.0, 30.0, 38.0, 54.0, 45.0, 61.0, 51.0, 47.0, 39.0, 52.0, 53.0, 45.0, 42.0, 47.0, 39.0, 27.0, 19.0, 38.0, 18.0, 19.0, 16.0, 14.0, 8.0, 10.0, 4.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.95703125, -2.875640869140625, -2.79425048828125, -2.712860107421875, -2.6314697265625, -2.550079345703125, -2.46868896484375, -2.387298583984375, -2.305908203125, -2.224517822265625, -2.14312744140625, -2.061737060546875, -1.9803466796875, -1.898956298828125, -1.81756591796875, -1.736175537109375, -1.65478515625, -1.573394775390625, -1.49200439453125, -1.410614013671875, -1.3292236328125, -1.247833251953125, -1.16644287109375, -1.085052490234375, -1.003662109375, -0.922271728515625, -0.84088134765625, -0.759490966796875, -0.6781005859375, -0.596710205078125, -0.51531982421875, -0.433929443359375, -0.3525390625, -0.271148681640625, -0.18975830078125, -0.108367919921875, -0.0269775390625, 0.054412841796875, 0.13580322265625, 0.217193603515625, 0.298583984375, 0.379974365234375, 0.46136474609375, 0.542755126953125, 0.6241455078125, 0.705535888671875, 0.78692626953125, 0.868316650390625, 0.94970703125, 1.031097412109375, 1.11248779296875, 1.193878173828125, 1.2752685546875, 1.356658935546875, 1.43804931640625, 1.519439697265625, 1.600830078125, 1.682220458984375, 1.76361083984375, 1.845001220703125, 1.9263916015625, 2.007781982421875, 2.08917236328125, 2.170562744140625, 2.251953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 18.0, 21.0, 33.0, 59.0, 81.0, 131.0, 174.0, 293.0, 490.0, 840.0, 1589.0, 3063.0, 6688.0, 15785.0, 48731.0, 234242.0, 568875.0, 116137.0, 30152.0, 10957.0, 4837.0, 2325.0, 1213.0, 670.0, 405.0, 241.0, 155.0, 104.0, 62.0, 39.0, 32.0, 21.0, 19.0, 8.0, 12.0, 4.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.54296875, -6.36273193359375, -6.1824951171875, -6.00225830078125, -5.822021484375, -5.64178466796875, -5.4615478515625, -5.28131103515625, -5.10107421875, -4.92083740234375, -4.7406005859375, -4.56036376953125, -4.380126953125, -4.19989013671875, -4.0196533203125, -3.83941650390625, -3.6591796875, -3.47894287109375, -3.2987060546875, -3.11846923828125, -2.938232421875, -2.75799560546875, -2.5777587890625, -2.39752197265625, -2.21728515625, -2.03704833984375, -1.8568115234375, -1.67657470703125, -1.496337890625, -1.31610107421875, -1.1358642578125, -0.95562744140625, -0.775390625, -0.59515380859375, -0.4149169921875, -0.23468017578125, -0.054443359375, 0.12579345703125, 0.3060302734375, 0.48626708984375, 0.66650390625, 0.84674072265625, 1.0269775390625, 1.20721435546875, 1.387451171875, 1.56768798828125, 1.7479248046875, 1.92816162109375, 2.1083984375, 2.28863525390625, 2.4688720703125, 2.64910888671875, 2.829345703125, 3.00958251953125, 3.1898193359375, 3.37005615234375, 3.55029296875, 3.73052978515625, 3.9107666015625, 4.09100341796875, 4.271240234375, 4.45147705078125, 4.6317138671875, 4.81195068359375, 4.9921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 10.0, 20.0, 30.0, 47.0, 66.0, 125.0, 172.0, 162.0, 101.0, 57.0, 49.0, 41.0, 16.0, 21.0, 13.0, 7.0, 6.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000965118408203125, -0.0009358823299407959, -0.0009066462516784668, -0.0008774101734161377, -0.0008481740951538086, -0.0008189380168914795, -0.0007897019386291504, -0.0007604658603668213, -0.0007312297821044922, -0.0007019937038421631, -0.000672757625579834, -0.0006435215473175049, -0.0006142854690551758, -0.0005850493907928467, -0.0005558133125305176, -0.0005265772342681885, -0.0004973411560058594, -0.0004681050777435303, -0.00043886899948120117, -0.00040963292121887207, -0.00038039684295654297, -0.00035116076469421387, -0.00032192468643188477, -0.00029268860816955566, -0.00026345252990722656, -0.00023421645164489746, -0.00020498037338256836, -0.00017574429512023926, -0.00014650821685791016, -0.00011727213859558105, -8.803606033325195e-05, -5.879998207092285e-05, -2.956390380859375e-05, -3.2782554626464844e-07, 2.8908252716064453e-05, 5.8144330978393555e-05, 8.738040924072266e-05, 0.00011661648750305176, 0.00014585256576538086, 0.00017508864402770996, 0.00020432472229003906, 0.00023356080055236816, 0.00026279687881469727, 0.00029203295707702637, 0.00032126903533935547, 0.00035050511360168457, 0.00037974119186401367, 0.0004089772701263428, 0.0004382133483886719, 0.000467449426651001, 0.0004966855049133301, 0.0005259215831756592, 0.0005551576614379883, 0.0005843937397003174, 0.0006136298179626465, 0.0006428658962249756, 0.0006721019744873047, 0.0007013380527496338, 0.0007305741310119629, 0.000759810209274292, 0.0007890462875366211, 0.0008182823657989502, 0.0008475184440612793, 0.0008767545223236084, 0.0009059906005859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 11.0, 14.0, 15.0, 19.0, 21.0, 38.0, 64.0, 90.0, 105.0, 202.0, 323.0, 558.0, 1041.0, 2177.0, 4694.0, 12211.0, 41054.0, 301913.0, 593989.0, 62293.0, 16286.0, 5886.0, 2580.0, 1188.0, 711.0, 366.0, 233.0, 131.0, 79.0, 69.0, 52.0, 28.0, 35.0, 13.0, 13.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.947998046875, -7.70068359375, -7.453369140625, -7.2060546875, -6.958740234375, -6.71142578125, -6.464111328125, -6.216796875, -5.969482421875, -5.72216796875, -5.474853515625, -5.2275390625, -4.980224609375, -4.73291015625, -4.485595703125, -4.23828125, -3.990966796875, -3.74365234375, -3.496337890625, -3.2490234375, -3.001708984375, -2.75439453125, -2.507080078125, -2.259765625, -2.012451171875, -1.76513671875, -1.517822265625, -1.2705078125, -1.023193359375, -0.77587890625, -0.528564453125, -0.28125, -0.033935546875, 0.21337890625, 0.460693359375, 0.7080078125, 0.955322265625, 1.20263671875, 1.449951171875, 1.697265625, 1.944580078125, 2.19189453125, 2.439208984375, 2.6865234375, 2.933837890625, 3.18115234375, 3.428466796875, 3.67578125, 3.923095703125, 4.17041015625, 4.417724609375, 4.6650390625, 4.912353515625, 5.15966796875, 5.406982421875, 5.654296875, 5.901611328125, 6.14892578125, 6.396240234375, 6.6435546875, 6.890869140625, 7.13818359375, 7.385498046875, 7.6328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 13.0, 11.0, 14.0, 14.0, 22.0, 28.0, 26.0, 60.0, 86.0, 102.0, 126.0, 120.0, 94.0, 66.0, 33.0, 32.0, 23.0, 21.0, 14.0, 16.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.265625, -3.165283203125, -3.06494140625, -2.964599609375, -2.8642578125, -2.763916015625, -2.66357421875, -2.563232421875, -2.462890625, -2.362548828125, -2.26220703125, -2.161865234375, -2.0615234375, -1.961181640625, -1.86083984375, -1.760498046875, -1.66015625, -1.559814453125, -1.45947265625, -1.359130859375, -1.2587890625, -1.158447265625, -1.05810546875, -0.957763671875, -0.857421875, -0.757080078125, -0.65673828125, -0.556396484375, -0.4560546875, -0.355712890625, -0.25537109375, -0.155029296875, -0.0546875, 0.045654296875, 0.14599609375, 0.246337890625, 0.3466796875, 0.447021484375, 0.54736328125, 0.647705078125, 0.748046875, 0.848388671875, 0.94873046875, 1.049072265625, 1.1494140625, 1.249755859375, 1.35009765625, 1.450439453125, 1.55078125, 1.651123046875, 1.75146484375, 1.851806640625, 1.9521484375, 2.052490234375, 2.15283203125, 2.253173828125, 2.353515625, 2.453857421875, 2.55419921875, 2.654541015625, 2.7548828125, 2.855224609375, 2.95556640625, 3.055908203125, 3.15625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 9.0, 8.0, 13.0, 23.0, 56.0, 136.0, 213.0, 258.0, 169.0, 60.0, 34.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.481258392333984, -39.60136795043945, -37.721473693847656, -35.841583251953125, -33.961692810058594, -32.08180236816406, -30.201908111572266, -28.322017669677734, -26.44212532043457, -24.562232971191406, -22.682342529296875, -20.80245018005371, -18.922557830810547, -17.042667388916016, -15.162775039672852, -13.282883644104004, -11.402992248535156, -9.523100852966309, -7.643208980560303, -5.763317108154297, -3.883425712585449, -2.0035343170166016, -0.1236419677734375, 1.7562494277954102, 3.636140823364258, 5.5160322189331055, 7.395924091339111, 9.275815963745117, 11.155707359313965, 13.035598754882812, 14.915491104125977, 16.79538345336914, 18.675270080566406, 20.55516242980957, 22.4350528717041, 24.314945220947266, 26.194835662841797, 28.07472801208496, 29.954620361328125, 31.834510803222656, 33.71440124511719, 35.59429168701172, 37.474185943603516, 39.35407638549805, 41.23396682739258, 43.113861083984375, 44.993751525878906, 46.87364196777344, 48.753536224365234, 50.633426666259766, 52.51332092285156, 54.393211364746094, 56.273101806640625, 58.152992248535156, 60.03288650512695, 61.912776947021484, 63.79267120361328, 65.67256164550781, 67.55245208740234, 69.43234252929688, 71.31224060058594, 73.19213104248047, 75.072021484375, 76.95191192626953, 78.83180236816406]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 10.0, 12.0, 10.0, 27.0, 14.0, 31.0, 44.0, 42.0, 36.0, 37.0, 62.0, 59.0, 49.0, 62.0, 51.0, 62.0, 72.0, 49.0, 35.0, 39.0, 38.0, 30.0, 27.0, 18.0, 22.0, 9.0, 11.0, 13.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.923093795776367, -19.154081344604492, -18.385068893432617, -17.616056442260742, -16.847043991088867, -16.078033447265625, -15.309020042419434, -14.540008544921875, -13.77099609375, -13.001983642578125, -12.23297119140625, -11.463958740234375, -10.694947242736816, -9.925934791564941, -9.156922340393066, -8.387910842895508, -7.618897438049316, -6.849884986877441, -6.080873012542725, -5.31186056137085, -4.542848587036133, -3.773836135864258, -3.004823684692383, -2.235811710357666, -1.466799259185791, -0.6977869868278503, 0.07122528553009033, 0.8402376174926758, 1.6092498302459717, 2.3782620429992676, 3.1472744941711426, 3.9162864685058594, 4.685298919677734, 5.454311370849609, 6.223323345184326, 6.992335796356201, 7.761347770690918, 8.530360221862793, 9.299372673034668, 10.068384170532227, 10.837396621704102, 11.606409072875977, 12.375421524047852, 13.144433975219727, 13.913445472717285, 14.68245792388916, 15.451470375061035, 16.220481872558594, 16.98949432373047, 17.758506774902344, 18.52751922607422, 19.296531677246094, 20.06554412841797, 20.834556579589844, 21.60356903076172, 22.37257957458496, 23.14159393310547, 23.910606384277344, 24.67961883544922, 25.448631286621094, 26.21764373779297, 26.986656188964844, 27.75566864013672, 28.52467918395996, 29.293691635131836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 59.0, 103.0, 188.0, 462.0, 1393.0, 6387.0, 145844.0, 4020212.0, 16420.0, 2106.0, 592.0, 244.0, 111.0, 43.0, 25.0, 15.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.372314453125, -20.55712890625, -19.741943359375, -18.9267578125, -18.111572265625, -17.29638671875, -16.481201171875, -15.666015625, -14.850830078125, -14.03564453125, -13.220458984375, -12.4052734375, -11.590087890625, -10.77490234375, -9.959716796875, -9.14453125, -8.329345703125, -7.51416015625, -6.698974609375, -5.8837890625, -5.068603515625, -4.25341796875, -3.438232421875, -2.623046875, -1.807861328125, -0.99267578125, -0.177490234375, 0.6376953125, 1.452880859375, 2.26806640625, 3.083251953125, 3.8984375, 4.713623046875, 5.52880859375, 6.343994140625, 7.1591796875, 7.974365234375, 8.78955078125, 9.604736328125, 10.419921875, 11.235107421875, 12.05029296875, 12.865478515625, 13.6806640625, 14.495849609375, 15.31103515625, 16.126220703125, 16.94140625, 17.756591796875, 18.57177734375, 19.386962890625, 20.2021484375, 21.017333984375, 21.83251953125, 22.647705078125, 23.462890625, 24.278076171875, 25.09326171875, 25.908447265625, 26.7236328125, 27.538818359375, 28.35400390625, 29.169189453125, 29.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 10.0, 29.0, 54.0, 83.0, 153.0, 202.0, 184.0, 127.0, 57.0, 41.0, 21.0, 5.0, 5.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06781005859375, -1.0291748046875, -0.99053955078125, -0.951904296875, -0.91326904296875, -0.8746337890625, -0.83599853515625, -0.79736328125, -0.75872802734375, -0.7200927734375, -0.68145751953125, -0.642822265625, -0.60418701171875, -0.5655517578125, -0.52691650390625, -0.48828125, -0.44964599609375, -0.4110107421875, -0.37237548828125, -0.333740234375, -0.29510498046875, -0.2564697265625, -0.21783447265625, -0.17919921875, -0.14056396484375, -0.1019287109375, -0.06329345703125, -0.024658203125, 0.01397705078125, 0.0526123046875, 0.09124755859375, 0.1298828125, 0.16851806640625, 0.2071533203125, 0.24578857421875, 0.284423828125, 0.32305908203125, 0.3616943359375, 0.40032958984375, 0.43896484375, 0.47760009765625, 0.5162353515625, 0.55487060546875, 0.593505859375, 0.63214111328125, 0.6707763671875, 0.70941162109375, 0.748046875, 0.78668212890625, 0.8253173828125, 0.86395263671875, 0.902587890625, 0.94122314453125, 0.9798583984375, 1.01849365234375, 1.05712890625, 1.09576416015625, 1.1343994140625, 1.17303466796875, 1.211669921875, 1.25030517578125, 1.2889404296875, 1.32757568359375, 1.3662109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 14.0, 15.0, 24.0, 31.0, 47.0, 92.0, 122.0, 252.0, 467.0, 893.0, 2000.0, 5125.0, 14209.0, 49329.0, 265451.0, 3451968.0, 322015.0, 56395.0, 16041.0, 5547.0, 2209.0, 960.0, 484.0, 240.0, 127.0, 90.0, 41.0, 38.0, 22.0, 17.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.6640625, -8.43328857421875, -8.2025146484375, -7.97174072265625, -7.740966796875, -7.51019287109375, -7.2794189453125, -7.04864501953125, -6.81787109375, -6.58709716796875, -6.3563232421875, -6.12554931640625, -5.894775390625, -5.66400146484375, -5.4332275390625, -5.20245361328125, -4.9716796875, -4.74090576171875, -4.5101318359375, -4.27935791015625, -4.048583984375, -3.81781005859375, -3.5870361328125, -3.35626220703125, -3.12548828125, -2.89471435546875, -2.6639404296875, -2.43316650390625, -2.202392578125, -1.97161865234375, -1.7408447265625, -1.51007080078125, -1.279296875, -1.04852294921875, -0.8177490234375, -0.58697509765625, -0.356201171875, -0.12542724609375, 0.1053466796875, 0.33612060546875, 0.56689453125, 0.79766845703125, 1.0284423828125, 1.25921630859375, 1.489990234375, 1.72076416015625, 1.9515380859375, 2.18231201171875, 2.4130859375, 2.64385986328125, 2.8746337890625, 3.10540771484375, 3.336181640625, 3.56695556640625, 3.7977294921875, 4.02850341796875, 4.25927734375, 4.49005126953125, 4.7208251953125, 4.95159912109375, 5.182373046875, 5.41314697265625, 5.6439208984375, 5.87469482421875, 6.10546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 12.0, 11.0, 13.0, 15.0, 36.0, 44.0, 74.0, 84.0, 132.0, 222.0, 452.0, 1610.0, 575.0, 288.0, 141.0, 102.0, 58.0, 48.0, 31.0, 31.0, 14.0, 11.0, 15.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5686492919921875, -1.526947021484375, -1.4852447509765625, -1.44354248046875, -1.4018402099609375, -1.360137939453125, -1.3184356689453125, -1.2767333984375, -1.2350311279296875, -1.193328857421875, -1.1516265869140625, -1.10992431640625, -1.0682220458984375, -1.026519775390625, -0.9848175048828125, -0.943115234375, -0.9014129638671875, -0.859710693359375, -0.8180084228515625, -0.77630615234375, -0.7346038818359375, -0.692901611328125, -0.6511993408203125, -0.6094970703125, -0.5677947998046875, -0.526092529296875, -0.4843902587890625, -0.44268798828125, -0.4009857177734375, -0.359283447265625, -0.3175811767578125, -0.27587890625, -0.2341766357421875, -0.192474365234375, -0.1507720947265625, -0.10906982421875, -0.0673675537109375, -0.025665283203125, 0.0160369873046875, 0.0577392578125, 0.0994415283203125, 0.141143798828125, 0.1828460693359375, 0.22454833984375, 0.2662506103515625, 0.307952880859375, 0.3496551513671875, 0.391357421875, 0.4330596923828125, 0.474761962890625, 0.5164642333984375, 0.55816650390625, 0.5998687744140625, 0.641571044921875, 0.6832733154296875, 0.7249755859375, 0.7666778564453125, 0.808380126953125, 0.8500823974609375, 0.89178466796875, 0.9334869384765625, 0.975189208984375, 1.0168914794921875, 1.05859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 8.0, 18.0, 30.0, 81.0, 100.0, 177.0, 197.0, 165.0, 104.0, 62.0, 28.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.885089874267578, -17.483036041259766, -17.080982208251953, -16.678926467895508, -16.276872634887695, -15.874818801879883, -15.47276496887207, -15.070710182189941, -14.668655395507812, -14.2666015625, -13.864546775817871, -13.462492942810059, -13.06043815612793, -12.658384323120117, -12.256330490112305, -11.854275703430176, -11.452221870422363, -11.05016803741455, -10.648113250732422, -10.24605941772461, -9.84400463104248, -9.441950798034668, -9.039896011352539, -8.637842178344727, -8.235788345336914, -7.833734035491943, -7.431679725646973, -7.02962589263916, -6.627571105957031, -6.225517272949219, -5.823462963104248, -5.421408653259277, -5.019352912902832, -4.617298603057861, -4.215244293212891, -3.813190221786499, -3.4111359119415283, -3.0090816020965576, -2.607027530670166, -2.2049732208251953, -1.8029189109802246, -1.400864601135254, -0.9988104104995728, -0.5967562198638916, -0.1947019100189209, 0.2073523998260498, 0.6094064712524414, 1.011460781097412, 1.4135150909423828, 1.8155694007873535, 2.217623710632324, 2.619677782058716, 3.0217320919036865, 3.4237864017486572, 3.825840473175049, 4.2278947830200195, 4.62994909286499, 5.032003402709961, 5.434057712554932, 5.836112022399902, 6.238165855407715, 6.640220642089844, 7.042274475097656, 7.444328784942627, 7.846383094787598]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 9.0, 6.0, 8.0, 14.0, 10.0, 12.0, 16.0, 18.0, 19.0, 26.0, 26.0, 22.0, 28.0, 29.0, 34.0, 35.0, 32.0, 37.0, 28.0, 38.0, 41.0, 39.0, 28.0, 39.0, 31.0, 26.0, 35.0, 34.0, 20.0, 24.0, 24.0, 32.0, 22.0, 23.0, 20.0, 14.0, 20.0, 14.0, 7.0, 5.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.4001901149749756, -3.2787041664123535, -3.1572182178497314, -3.0357322692871094, -2.914246082305908, -2.792760133743286, -2.671274185180664, -2.549788236618042, -2.42830228805542, -2.306816339492798, -2.185330390930176, -2.0638442039489746, -1.9423582553863525, -1.8208723068237305, -1.6993863582611084, -1.5779004096984863, -1.4564142227172852, -1.334928274154663, -1.2134422063827515, -1.0919562578201294, -0.9704702496528625, -0.8489842414855957, -0.7274982929229736, -0.6060122847557068, -0.48452627658843994, -0.3630402684211731, -0.24155429005622864, -0.12006831169128418, 0.001417696475982666, 0.12290370464324951, 0.24438965320587158, 0.3658756613731384, 0.4873619079589844, 0.6088479161262512, 0.7303339242935181, 0.8518198728561401, 0.973305881023407, 1.0947918891906738, 1.216277837753296, 1.337763786315918, 1.4592498540878296, 1.5807358026504517, 1.7022218704223633, 1.8237078189849854, 1.9451937675476074, 2.0666799545288086, 2.1881656646728516, 2.3096518516540527, 2.431137800216675, 2.552623748779297, 2.674109697341919, 2.795595645904541, 2.917081832885742, 3.0385677814483643, 3.1600537300109863, 3.2815396785736084, 3.4030256271362305, 3.5245115756988525, 3.6459975242614746, 3.767483711242676, 3.888969659805298, 4.01045560836792, 4.131941795349121, 4.253427505493164, 4.374913692474365]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 4.0, 12.0, 19.0, 17.0, 42.0, 46.0, 59.0, 111.0, 160.0, 237.0, 419.0, 680.0, 1180.0, 2105.0, 4493.0, 11510.0, 42890.0, 239968.0, 571687.0, 130760.0, 26437.0, 8082.0, 3373.0, 1699.0, 1022.0, 603.0, 323.0, 178.0, 151.0, 80.0, 68.0, 48.0, 23.0, 15.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.86737060546875, -5.6527099609375, -5.43804931640625, -5.223388671875, -5.00872802734375, -4.7940673828125, -4.57940673828125, -4.36474609375, -4.15008544921875, -3.9354248046875, -3.72076416015625, -3.506103515625, -3.29144287109375, -3.0767822265625, -2.86212158203125, -2.6474609375, -2.43280029296875, -2.2181396484375, -2.00347900390625, -1.788818359375, -1.57415771484375, -1.3594970703125, -1.14483642578125, -0.93017578125, -0.71551513671875, -0.5008544921875, -0.28619384765625, -0.071533203125, 0.14312744140625, 0.3577880859375, 0.57244873046875, 0.787109375, 1.00177001953125, 1.2164306640625, 1.43109130859375, 1.645751953125, 1.86041259765625, 2.0750732421875, 2.28973388671875, 2.50439453125, 2.71905517578125, 2.9337158203125, 3.14837646484375, 3.363037109375, 3.57769775390625, 3.7923583984375, 4.00701904296875, 4.2216796875, 4.43634033203125, 4.6510009765625, 4.86566162109375, 5.080322265625, 5.29498291015625, 5.5096435546875, 5.72430419921875, 5.93896484375, 6.15362548828125, 6.3682861328125, 6.58294677734375, 6.797607421875, 7.01226806640625, 7.2269287109375, 7.44158935546875, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 7.0, 11.0, 14.0, 28.0, 42.0, 75.0, 129.0, 152.0, 188.0, 125.0, 113.0, 53.0, 31.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0396575927734375, -1.001190185546875, -0.9627227783203125, -0.92425537109375, -0.8857879638671875, -0.847320556640625, -0.8088531494140625, -0.7703857421875, -0.7319183349609375, -0.693450927734375, -0.6549835205078125, -0.61651611328125, -0.5780487060546875, -0.539581298828125, -0.5011138916015625, -0.462646484375, -0.4241790771484375, -0.385711669921875, -0.3472442626953125, -0.30877685546875, -0.2703094482421875, -0.231842041015625, -0.1933746337890625, -0.1549072265625, -0.1164398193359375, -0.077972412109375, -0.0395050048828125, -0.00103759765625, 0.0374298095703125, 0.075897216796875, 0.1143646240234375, 0.15283203125, 0.1912994384765625, 0.229766845703125, 0.2682342529296875, 0.30670166015625, 0.3451690673828125, 0.383636474609375, 0.4221038818359375, 0.4605712890625, 0.4990386962890625, 0.537506103515625, 0.5759735107421875, 0.61444091796875, 0.6529083251953125, 0.691375732421875, 0.7298431396484375, 0.768310546875, 0.8067779541015625, 0.845245361328125, 0.8837127685546875, 0.92218017578125, 0.9606475830078125, 0.999114990234375, 1.0375823974609375, 1.0760498046875, 1.1145172119140625, 1.152984619140625, 1.1914520263671875, 1.22991943359375, 1.2683868408203125, 1.306854248046875, 1.3453216552734375, 1.3837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 15.0, 23.0, 38.0, 56.0, 86.0, 141.0, 256.0, 479.0, 903.0, 2403.0, 7191.0, 32804.0, 203136.0, 625222.0, 142090.0, 24083.0, 5758.0, 2002.0, 824.0, 404.0, 232.0, 134.0, 70.0, 65.0, 30.0, 18.0, 13.0, 11.0, 11.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70050048828125, -8.4400634765625, -8.17962646484375, -7.919189453125, -7.65875244140625, -7.3983154296875, -7.13787841796875, -6.87744140625, -6.61700439453125, -6.3565673828125, -6.09613037109375, -5.835693359375, -5.57525634765625, -5.3148193359375, -5.05438232421875, -4.7939453125, -4.53350830078125, -4.2730712890625, -4.01263427734375, -3.752197265625, -3.49176025390625, -3.2313232421875, -2.97088623046875, -2.71044921875, -2.45001220703125, -2.1895751953125, -1.92913818359375, -1.668701171875, -1.40826416015625, -1.1478271484375, -0.88739013671875, -0.626953125, -0.36651611328125, -0.1060791015625, 0.15435791015625, 0.414794921875, 0.67523193359375, 0.9356689453125, 1.19610595703125, 1.45654296875, 1.71697998046875, 1.9774169921875, 2.23785400390625, 2.498291015625, 2.75872802734375, 3.0191650390625, 3.27960205078125, 3.5400390625, 3.80047607421875, 4.0609130859375, 4.32135009765625, 4.581787109375, 4.84222412109375, 5.1026611328125, 5.36309814453125, 5.62353515625, 5.88397216796875, 6.1444091796875, 6.40484619140625, 6.665283203125, 6.92572021484375, 7.1861572265625, 7.44659423828125, 7.70703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 10.0, 7.0, 15.0, 15.0, 33.0, 34.0, 47.0, 40.0, 36.0, 45.0, 48.0, 62.0, 67.0, 67.0, 53.0, 53.0, 45.0, 46.0, 42.0, 31.0, 39.0, 28.0, 23.0, 14.0, 18.0, 14.0, 12.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.33526611328125, -3.2135009765625, -3.09173583984375, -2.969970703125, -2.84820556640625, -2.7264404296875, -2.60467529296875, -2.48291015625, -2.36114501953125, -2.2393798828125, -2.11761474609375, -1.995849609375, -1.87408447265625, -1.7523193359375, -1.63055419921875, -1.5087890625, -1.38702392578125, -1.2652587890625, -1.14349365234375, -1.021728515625, -0.89996337890625, -0.7781982421875, -0.65643310546875, -0.53466796875, -0.41290283203125, -0.2911376953125, -0.16937255859375, -0.047607421875, 0.07415771484375, 0.1959228515625, 0.31768798828125, 0.439453125, 0.56121826171875, 0.6829833984375, 0.80474853515625, 0.926513671875, 1.04827880859375, 1.1700439453125, 1.29180908203125, 1.41357421875, 1.53533935546875, 1.6571044921875, 1.77886962890625, 1.900634765625, 2.02239990234375, 2.1441650390625, 2.26593017578125, 2.3876953125, 2.50946044921875, 2.6312255859375, 2.75299072265625, 2.874755859375, 2.99652099609375, 3.1182861328125, 3.24005126953125, 3.36181640625, 3.48358154296875, 3.6053466796875, 3.72711181640625, 3.848876953125, 3.97064208984375, 4.0924072265625, 4.21417236328125, 4.3359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 11.0, 18.0, 26.0, 31.0, 44.0, 55.0, 80.0, 109.0, 189.0, 301.0, 474.0, 700.0, 1161.0, 2024.0, 3493.0, 6328.0, 11906.0, 25485.0, 59884.0, 169111.0, 423191.0, 211939.0, 72035.0, 29632.0, 13778.0, 7043.0, 3785.0, 2205.0, 1284.0, 780.0, 476.0, 283.0, 226.0, 134.0, 91.0, 77.0, 45.0, 30.0, 20.0, 17.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.00830078125, -2.9130859375, -2.81787109375, -2.72265625, -2.62744140625, -2.5322265625, -2.43701171875, -2.341796875, -2.24658203125, -2.1513671875, -2.05615234375, -1.9609375, -1.86572265625, -1.7705078125, -1.67529296875, -1.580078125, -1.48486328125, -1.3896484375, -1.29443359375, -1.19921875, -1.10400390625, -1.0087890625, -0.91357421875, -0.818359375, -0.72314453125, -0.6279296875, -0.53271484375, -0.4375, -0.34228515625, -0.2470703125, -0.15185546875, -0.056640625, 0.03857421875, 0.1337890625, 0.22900390625, 0.32421875, 0.41943359375, 0.5146484375, 0.60986328125, 0.705078125, 0.80029296875, 0.8955078125, 0.99072265625, 1.0859375, 1.18115234375, 1.2763671875, 1.37158203125, 1.466796875, 1.56201171875, 1.6572265625, 1.75244140625, 1.84765625, 1.94287109375, 2.0380859375, 2.13330078125, 2.228515625, 2.32373046875, 2.4189453125, 2.51416015625, 2.609375, 2.70458984375, 2.7998046875, 2.89501953125, 2.990234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 25.0, 23.0, 27.0, 56.0, 83.0, 98.0, 164.0, 130.0, 88.0, 56.0, 38.0, 31.0, 29.0, 23.0, 14.0, 16.0, 9.0, 11.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006909370422363281, -0.0006668046116828918, -0.0006426721811294556, -0.0006185397505760193, -0.000594407320022583, -0.0005702748894691467, -0.0005461424589157104, -0.0005220100283622742, -0.0004978775978088379, -0.0004737451672554016, -0.00044961273670196533, -0.00042548030614852905, -0.0004013478755950928, -0.0003772154450416565, -0.0003530830144882202, -0.00032895058393478394, -0.00030481815338134766, -0.0002806857228279114, -0.0002565532922744751, -0.00023242086172103882, -0.00020828843116760254, -0.00018415600061416626, -0.00016002357006072998, -0.0001358911395072937, -0.00011175870895385742, -8.762627840042114e-05, -6.349384784698486e-05, -3.9361417293548584e-05, -1.5228986740112305e-05, 8.903443813323975e-06, 3.3035874366760254e-05, 5.716830492019653e-05, 8.130073547363281e-05, 0.00010543316602706909, 0.00012956559658050537, 0.00015369802713394165, 0.00017783045768737793, 0.0002019628882408142, 0.0002260953187942505, 0.00025022774934768677, 0.00027436017990112305, 0.0002984926104545593, 0.0003226250410079956, 0.0003467574715614319, 0.00037088990211486816, 0.00039502233266830444, 0.0004191547632217407, 0.000443287193775177, 0.0004674196243286133, 0.0004915520548820496, 0.0005156844854354858, 0.0005398169159889221, 0.0005639493465423584, 0.0005880817770957947, 0.000612214207649231, 0.0006363466382026672, 0.0006604790687561035, 0.0006846114993095398, 0.0007087439298629761, 0.0007328763604164124, 0.0007570087909698486, 0.0007811412215232849, 0.0008052736520767212, 0.0008294060826301575, 0.0008535385131835938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 16.0, 25.0, 39.0, 41.0, 93.0, 160.0, 327.0, 676.0, 1715.0, 5229.0, 20304.0, 132743.0, 761225.0, 101652.0, 17079.0, 4424.0, 1496.0, 579.0, 292.0, 153.0, 77.0, 48.0, 32.0, 26.0, 18.0, 13.0, 5.0, 3.0, 4.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-9.0625, -8.79150390625, -8.5205078125, -8.24951171875, -7.978515625, -7.70751953125, -7.4365234375, -7.16552734375, -6.89453125, -6.62353515625, -6.3525390625, -6.08154296875, -5.810546875, -5.53955078125, -5.2685546875, -4.99755859375, -4.7265625, -4.45556640625, -4.1845703125, -3.91357421875, -3.642578125, -3.37158203125, -3.1005859375, -2.82958984375, -2.55859375, -2.28759765625, -2.0166015625, -1.74560546875, -1.474609375, -1.20361328125, -0.9326171875, -0.66162109375, -0.390625, -0.11962890625, 0.1513671875, 0.42236328125, 0.693359375, 0.96435546875, 1.2353515625, 1.50634765625, 1.77734375, 2.04833984375, 2.3193359375, 2.59033203125, 2.861328125, 3.13232421875, 3.4033203125, 3.67431640625, 3.9453125, 4.21630859375, 4.4873046875, 4.75830078125, 5.029296875, 5.30029296875, 5.5712890625, 5.84228515625, 6.11328125, 6.38427734375, 6.6552734375, 6.92626953125, 7.197265625, 7.46826171875, 7.7392578125, 8.01025390625, 8.28125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 10.0, 9.0, 19.0, 20.0, 16.0, 24.0, 32.0, 50.0, 82.0, 104.0, 135.0, 128.0, 99.0, 58.0, 42.0, 31.0, 32.0, 14.0, 17.0, 8.0, 8.0, 7.0, 5.0, 7.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.515625, -3.40191650390625, -3.2882080078125, -3.17449951171875, -3.060791015625, -2.94708251953125, -2.8333740234375, -2.71966552734375, -2.60595703125, -2.49224853515625, -2.3785400390625, -2.26483154296875, -2.151123046875, -2.03741455078125, -1.9237060546875, -1.80999755859375, -1.6962890625, -1.58258056640625, -1.4688720703125, -1.35516357421875, -1.241455078125, -1.12774658203125, -1.0140380859375, -0.90032958984375, -0.78662109375, -0.67291259765625, -0.5592041015625, -0.44549560546875, -0.331787109375, -0.21807861328125, -0.1043701171875, 0.00933837890625, 0.123046875, 0.23675537109375, 0.3504638671875, 0.46417236328125, 0.577880859375, 0.69158935546875, 0.8052978515625, 0.91900634765625, 1.03271484375, 1.14642333984375, 1.2601318359375, 1.37384033203125, 1.487548828125, 1.60125732421875, 1.7149658203125, 1.82867431640625, 1.9423828125, 2.05609130859375, 2.1697998046875, 2.28350830078125, 2.397216796875, 2.51092529296875, 2.6246337890625, 2.73834228515625, 2.85205078125, 2.96575927734375, 3.0794677734375, 3.19317626953125, 3.306884765625, 3.42059326171875, 3.5343017578125, 3.64801025390625, 3.76171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 20.0, 49.0, 117.0, 194.0, 278.0, 187.0, 90.0, 29.0, 16.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.77375411987305, -57.32360076904297, -54.87344741821289, -52.42329406738281, -49.97313690185547, -47.522987365722656, -45.07283020019531, -42.622676849365234, -40.172523498535156, -37.72237014770508, -35.272216796875, -32.82206344604492, -30.37190818786621, -27.921754837036133, -25.471599578857422, -23.021446228027344, -20.571292877197266, -18.121139526367188, -15.670985221862793, -13.220830917358398, -10.77067756652832, -8.320524215698242, -5.870369911193848, -3.420215606689453, -0.970062255859375, 1.4800915718078613, 3.9302453994750977, 6.380399227142334, 8.83055305480957, 11.280706405639648, 13.730860710144043, 16.181015014648438, 18.63116455078125, 21.081317901611328, 23.531471252441406, 25.981626510620117, 28.431779861450195, 30.881933212280273, 33.332088470458984, 35.78224182128906, 38.23239517211914, 40.68254852294922, 43.1327018737793, 45.582855224609375, 48.03301239013672, 50.48316192626953, 52.933319091796875, 55.38347244262695, 57.83362579345703, 60.28377914428711, 62.73393249511719, 65.18408966064453, 67.63423919677734, 70.08439636230469, 72.5345458984375, 74.98470306396484, 77.43486022949219, 79.88501739501953, 82.33516693115234, 84.78532409667969, 87.2354736328125, 89.68563079833984, 92.13578033447266, 94.5859375, 97.03608703613281]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 17.0, 18.0, 23.0, 13.0, 29.0, 35.0, 39.0, 35.0, 35.0, 43.0, 60.0, 58.0, 54.0, 45.0, 64.0, 51.0, 50.0, 46.0, 40.0, 37.0, 38.0, 36.0, 14.0, 27.0, 19.0, 12.0, 12.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.994770050048828, -28.134937286376953, -27.275104522705078, -26.415271759033203, -25.555437088012695, -24.69560432434082, -23.835771560668945, -22.97593879699707, -22.116104125976562, -21.256271362304688, -20.396438598632812, -19.536605834960938, -18.67677116394043, -17.816938400268555, -16.95710563659668, -16.097272872924805, -15.23744010925293, -14.377607345581055, -13.517773628234863, -12.657940864562988, -11.798107147216797, -10.938274383544922, -10.078441619873047, -9.218608856201172, -8.35877513885498, -7.498941898345947, -6.639108657836914, -5.779275894165039, -4.919442653656006, -4.059609413146973, -3.1997766494750977, -2.3399434089660645, -1.480112075805664, -0.6202789545059204, 0.23955416679382324, 1.0993871688842773, 1.9592204093933105, 2.8190536499023438, 3.6788864135742188, 4.538719654083252, 5.398552894592285, 6.258386135101318, 7.118219375610352, 7.978052139282227, 8.837884902954102, 9.697718620300293, 10.557551383972168, 11.41738510131836, 12.277217864990234, 13.13705062866211, 13.9968843460083, 14.856717109680176, 15.716550827026367, 16.576383590698242, 17.436216354370117, 18.296049118041992, 19.1558837890625, 20.015716552734375, 20.87554931640625, 21.735382080078125, 22.595216751098633, 23.455049514770508, 24.314882278442383, 25.174715042114258, 26.034547805786133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 16.0, 22.0, 58.0, 58.0, 118.0, 194.0, 324.0, 782.0, 1832.0, 5656.0, 27244.0, 626878.0, 3481757.0, 38190.0, 7131.0, 2134.0, 860.0, 436.0, 213.0, 108.0, 79.0, 49.0, 35.0, 20.0, 12.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.05926513671875, -6.7396240234375, -6.41998291015625, -6.100341796875, -5.78070068359375, -5.4610595703125, -5.14141845703125, -4.82177734375, -4.50213623046875, -4.1824951171875, -3.86285400390625, -3.543212890625, -3.22357177734375, -2.9039306640625, -2.58428955078125, -2.2646484375, -1.94500732421875, -1.6253662109375, -1.30572509765625, -0.986083984375, -0.66644287109375, -0.3468017578125, -0.02716064453125, 0.29248046875, 0.61212158203125, 0.9317626953125, 1.25140380859375, 1.571044921875, 1.89068603515625, 2.2103271484375, 2.52996826171875, 2.849609375, 3.16925048828125, 3.4888916015625, 3.80853271484375, 4.128173828125, 4.44781494140625, 4.7674560546875, 5.08709716796875, 5.40673828125, 5.72637939453125, 6.0460205078125, 6.36566162109375, 6.685302734375, 7.00494384765625, 7.3245849609375, 7.64422607421875, 7.9638671875, 8.28350830078125, 8.6031494140625, 8.92279052734375, 9.242431640625, 9.56207275390625, 9.8817138671875, 10.20135498046875, 10.52099609375, 10.84063720703125, 11.1602783203125, 11.47991943359375, 11.799560546875, 12.11920166015625, 12.4388427734375, 12.75848388671875, 13.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 16.0, 30.0, 46.0, 55.0, 95.0, 98.0, 138.0, 135.0, 111.0, 78.0, 72.0, 50.0, 25.0, 11.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.01593017578125, -0.9752197265625, -0.93450927734375, -0.893798828125, -0.85308837890625, -0.8123779296875, -0.77166748046875, -0.73095703125, -0.69024658203125, -0.6495361328125, -0.60882568359375, -0.568115234375, -0.52740478515625, -0.4866943359375, -0.44598388671875, -0.4052734375, -0.36456298828125, -0.3238525390625, -0.28314208984375, -0.242431640625, -0.20172119140625, -0.1610107421875, -0.12030029296875, -0.07958984375, -0.03887939453125, 0.0018310546875, 0.04254150390625, 0.083251953125, 0.12396240234375, 0.1646728515625, 0.20538330078125, 0.24609375, 0.28680419921875, 0.3275146484375, 0.36822509765625, 0.408935546875, 0.44964599609375, 0.4903564453125, 0.53106689453125, 0.57177734375, 0.61248779296875, 0.6531982421875, 0.69390869140625, 0.734619140625, 0.77532958984375, 0.8160400390625, 0.85675048828125, 0.8974609375, 0.93817138671875, 0.9788818359375, 1.01959228515625, 1.060302734375, 1.10101318359375, 1.1417236328125, 1.18243408203125, 1.22314453125, 1.26385498046875, 1.3045654296875, 1.34527587890625, 1.385986328125, 1.42669677734375, 1.4674072265625, 1.50811767578125, 1.548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 0.0, 7.0, 12.0, 25.0, 29.0, 42.0, 57.0, 98.0, 148.0, 222.0, 372.0, 648.0, 1113.0, 1958.0, 3672.0, 7020.0, 14395.0, 33207.0, 96828.0, 500747.0, 3151702.0, 266699.0, 66730.0, 24830.0, 11204.0, 5696.0, 2902.0, 1566.0, 906.0, 503.0, 319.0, 206.0, 140.0, 82.0, 45.0, 42.0, 34.0, 17.0, 14.0, 12.0, 14.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.18359375, -4.05010986328125, -3.9166259765625, -3.78314208984375, -3.649658203125, -3.51617431640625, -3.3826904296875, -3.24920654296875, -3.11572265625, -2.98223876953125, -2.8487548828125, -2.71527099609375, -2.581787109375, -2.44830322265625, -2.3148193359375, -2.18133544921875, -2.0478515625, -1.91436767578125, -1.7808837890625, -1.64739990234375, -1.513916015625, -1.38043212890625, -1.2469482421875, -1.11346435546875, -0.97998046875, -0.84649658203125, -0.7130126953125, -0.57952880859375, -0.446044921875, -0.31256103515625, -0.1790771484375, -0.04559326171875, 0.087890625, 0.22137451171875, 0.3548583984375, 0.48834228515625, 0.621826171875, 0.75531005859375, 0.8887939453125, 1.02227783203125, 1.15576171875, 1.28924560546875, 1.4227294921875, 1.55621337890625, 1.689697265625, 1.82318115234375, 1.9566650390625, 2.09014892578125, 2.2236328125, 2.35711669921875, 2.4906005859375, 2.62408447265625, 2.757568359375, 2.89105224609375, 3.0245361328125, 3.15802001953125, 3.29150390625, 3.42498779296875, 3.5584716796875, 3.69195556640625, 3.825439453125, 3.95892333984375, 4.0924072265625, 4.22589111328125, 4.359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 10.0, 8.0, 11.0, 16.0, 28.0, 34.0, 50.0, 67.0, 109.0, 158.0, 291.0, 731.0, 1479.0, 377.0, 212.0, 132.0, 80.0, 50.0, 57.0, 25.0, 19.0, 16.0, 14.0, 16.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9782867431640625, -0.940948486328125, -0.9036102294921875, -0.86627197265625, -0.8289337158203125, -0.791595458984375, -0.7542572021484375, -0.7169189453125, -0.6795806884765625, -0.642242431640625, -0.6049041748046875, -0.56756591796875, -0.5302276611328125, -0.492889404296875, -0.4555511474609375, -0.418212890625, -0.3808746337890625, -0.343536376953125, -0.3061981201171875, -0.26885986328125, -0.2315216064453125, -0.194183349609375, -0.1568450927734375, -0.1195068359375, -0.0821685791015625, -0.044830322265625, -0.0074920654296875, 0.02984619140625, 0.0671844482421875, 0.104522705078125, 0.1418609619140625, 0.17919921875, 0.2165374755859375, 0.253875732421875, 0.2912139892578125, 0.32855224609375, 0.3658905029296875, 0.403228759765625, 0.4405670166015625, 0.4779052734375, 0.5152435302734375, 0.552581787109375, 0.5899200439453125, 0.62725830078125, 0.6645965576171875, 0.701934814453125, 0.7392730712890625, 0.776611328125, 0.8139495849609375, 0.851287841796875, 0.8886260986328125, 0.92596435546875, 0.9633026123046875, 1.000640869140625, 1.0379791259765625, 1.0753173828125, 1.1126556396484375, 1.149993896484375, 1.1873321533203125, 1.22467041015625, 1.2620086669921875, 1.299346923828125, 1.3366851806640625, 1.3740234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 21.0, 19.0, 33.0, 67.0, 128.0, 181.0, 198.0, 145.0, 90.0, 53.0, 36.0, 14.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.241500854492188, -19.847503662109375, -19.45350456237793, -19.059507369995117, -18.665508270263672, -18.27151107788086, -17.877513885498047, -17.4835147857666, -17.08951759338379, -16.695520401000977, -16.30152130126953, -15.907524108886719, -15.51352596282959, -15.119527816772461, -14.725530624389648, -14.33153247833252, -13.93753433227539, -13.543536186218262, -13.149538040161133, -12.75554084777832, -12.361542701721191, -11.967544555664062, -11.57354736328125, -11.179549217224121, -10.785551071166992, -10.391552925109863, -9.997554779052734, -9.603557586669922, -9.209559440612793, -8.815561294555664, -8.421564102172852, -8.027565956115723, -7.633566856384277, -7.239568710327148, -6.845571041107178, -6.451573371887207, -6.057575225830078, -5.663577079772949, -5.2695794105529785, -4.875581741333008, -4.481583595275879, -4.08758544921875, -3.6935877799987793, -3.2995898723602295, -2.9055919647216797, -2.51159405708313, -2.11759614944458, -1.7235982418060303, -1.3296003341674805, -0.9356024265289307, -0.5416045188903809, -0.14760661125183105, 0.24639129638671875, 0.6403892040252686, 1.0343871116638184, 1.4283850193023682, 1.822382926940918, 2.2163808345794678, 2.6103787422180176, 3.0043766498565674, 3.398374557495117, 3.792372465133667, 4.186370372772217, 4.5803680419921875, 4.974366188049316]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 7.0, 6.0, 7.0, 7.0, 13.0, 9.0, 9.0, 13.0, 17.0, 25.0, 33.0, 25.0, 30.0, 35.0, 48.0, 49.0, 45.0, 45.0, 54.0, 41.0, 64.0, 50.0, 41.0, 37.0, 48.0, 28.0, 42.0, 25.0, 28.0, 18.0, 23.0, 20.0, 18.0, 7.0, 14.0, 6.0, 10.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.262031316757202, -3.100661277770996, -2.93929123878479, -2.777921199798584, -2.616550922393799, -2.455181121826172, -2.2938108444213867, -2.1324408054351807, -1.9710707664489746, -1.8097007274627686, -1.6483306884765625, -1.486960530281067, -1.3255904912948608, -1.1642204523086548, -1.0028502941131592, -0.8414802551269531, -0.6801102161407471, -0.518740177154541, -0.3573700785636902, -0.19600000977516174, -0.0346299409866333, 0.12674009799957275, 0.2881101965904236, 0.4494802951812744, 0.6108503341674805, 0.7722203731536865, 0.9335904717445374, 1.0949605703353882, 1.2563306093215942, 1.4177006483078003, 1.579070806503296, 1.740440845489502, 1.901810646057129, 2.063180685043335, 2.224550724029541, 2.385920763015747, 2.547290802001953, 2.7086610794067383, 2.8700311183929443, 3.0314011573791504, 3.1927711963653564, 3.3541412353515625, 3.5155112743377686, 3.6768813133239746, 3.8382515907287598, 3.9996213912963867, 4.160991668701172, 4.322361946105957, 4.483731746673584, 4.645102024078369, 4.806471824645996, 4.967842102050781, 5.129211902618408, 5.290582180023193, 5.45195198059082, 5.6133222579956055, 5.774692535400391, 5.936062812805176, 6.097432613372803, 6.258802890777588, 6.420172691345215, 6.58154296875, 6.742912769317627, 6.904283046722412, 7.065652847290039]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 9.0, 4.0, 6.0, 14.0, 21.0, 28.0, 36.0, 59.0, 66.0, 125.0, 157.0, 253.0, 430.0, 605.0, 1049.0, 1742.0, 3388.0, 7162.0, 17812.0, 50655.0, 161836.0, 431787.0, 249894.0, 75936.0, 25553.0, 9890.0, 4519.0, 2169.0, 1207.0, 745.0, 444.0, 291.0, 222.0, 117.0, 95.0, 71.0, 29.0, 29.0, 25.0, 11.0, 14.0, 10.0, 11.0, 4.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.8125, -4.66961669921875, -4.5267333984375, -4.38385009765625, -4.240966796875, -4.09808349609375, -3.9552001953125, -3.81231689453125, -3.66943359375, -3.52655029296875, -3.3836669921875, -3.24078369140625, -3.097900390625, -2.95501708984375, -2.8121337890625, -2.66925048828125, -2.5263671875, -2.38348388671875, -2.2406005859375, -2.09771728515625, -1.954833984375, -1.81195068359375, -1.6690673828125, -1.52618408203125, -1.38330078125, -1.24041748046875, -1.0975341796875, -0.95465087890625, -0.811767578125, -0.66888427734375, -0.5260009765625, -0.38311767578125, -0.240234375, -0.09735107421875, 0.0455322265625, 0.18841552734375, 0.331298828125, 0.47418212890625, 0.6170654296875, 0.75994873046875, 0.90283203125, 1.04571533203125, 1.1885986328125, 1.33148193359375, 1.474365234375, 1.61724853515625, 1.7601318359375, 1.90301513671875, 2.0458984375, 2.18878173828125, 2.3316650390625, 2.47454833984375, 2.617431640625, 2.76031494140625, 2.9031982421875, 3.04608154296875, 3.18896484375, 3.33184814453125, 3.4747314453125, 3.61761474609375, 3.760498046875, 3.90338134765625, 4.0462646484375, 4.18914794921875, 4.33203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 5.0, 10.0, 12.0, 25.0, 30.0, 69.0, 70.0, 91.0, 117.0, 131.0, 112.0, 94.0, 84.0, 55.0, 36.0, 31.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.062347412109375, -1.02215576171875, -0.981964111328125, -0.9417724609375, -0.901580810546875, -0.86138916015625, -0.821197509765625, -0.781005859375, -0.740814208984375, -0.70062255859375, -0.660430908203125, -0.6202392578125, -0.580047607421875, -0.53985595703125, -0.499664306640625, -0.45947265625, -0.419281005859375, -0.37908935546875, -0.338897705078125, -0.2987060546875, -0.258514404296875, -0.21832275390625, -0.178131103515625, -0.137939453125, -0.097747802734375, -0.05755615234375, -0.017364501953125, 0.0228271484375, 0.063018798828125, 0.10321044921875, 0.143402099609375, 0.18359375, 0.223785400390625, 0.26397705078125, 0.304168701171875, 0.3443603515625, 0.384552001953125, 0.42474365234375, 0.464935302734375, 0.505126953125, 0.545318603515625, 0.58551025390625, 0.625701904296875, 0.6658935546875, 0.706085205078125, 0.74627685546875, 0.786468505859375, 0.82666015625, 0.866851806640625, 0.90704345703125, 0.947235107421875, 0.9874267578125, 1.027618408203125, 1.06781005859375, 1.108001708984375, 1.148193359375, 1.188385009765625, 1.22857666015625, 1.268768310546875, 1.3089599609375, 1.349151611328125, 1.38934326171875, 1.429534912109375, 1.4697265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 1.0, 6.0, 4.0, 4.0, 11.0, 15.0, 25.0, 39.0, 40.0, 86.0, 137.0, 210.0, 366.0, 739.0, 1474.0, 3810.0, 12596.0, 52643.0, 259240.0, 532264.0, 142092.0, 29710.0, 7937.0, 2642.0, 1102.0, 556.0, 264.0, 178.0, 102.0, 80.0, 61.0, 30.0, 20.0, 18.0, 13.0, 10.0, 9.0, 1.0, 2.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.6798095703125, -5.492431640625, -5.3050537109375, -5.11767578125, -4.9302978515625, -4.742919921875, -4.5555419921875, -4.3681640625, -4.1807861328125, -3.993408203125, -3.8060302734375, -3.61865234375, -3.4312744140625, -3.243896484375, -3.0565185546875, -2.869140625, -2.6817626953125, -2.494384765625, -2.3070068359375, -2.11962890625, -1.9322509765625, -1.744873046875, -1.5574951171875, -1.3701171875, -1.1827392578125, -0.995361328125, -0.8079833984375, -0.62060546875, -0.4332275390625, -0.245849609375, -0.0584716796875, 0.12890625, 0.3162841796875, 0.503662109375, 0.6910400390625, 0.87841796875, 1.0657958984375, 1.253173828125, 1.4405517578125, 1.6279296875, 1.8153076171875, 2.002685546875, 2.1900634765625, 2.37744140625, 2.5648193359375, 2.752197265625, 2.9395751953125, 3.126953125, 3.3143310546875, 3.501708984375, 3.6890869140625, 3.87646484375, 4.0638427734375, 4.251220703125, 4.4385986328125, 4.6259765625, 4.8133544921875, 5.000732421875, 5.1881103515625, 5.37548828125, 5.5628662109375, 5.750244140625, 5.9376220703125, 6.125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 11.0, 9.0, 10.0, 15.0, 15.0, 29.0, 17.0, 32.0, 40.0, 39.0, 40.0, 50.0, 44.0, 34.0, 43.0, 44.0, 56.0, 48.0, 46.0, 34.0, 46.0, 37.0, 36.0, 36.0, 18.0, 22.0, 27.0, 19.0, 12.0, 19.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.604583740234375, -3.49237060546875, -3.380157470703125, -3.2679443359375, -3.155731201171875, -3.04351806640625, -2.931304931640625, -2.819091796875, -2.706878662109375, -2.59466552734375, -2.482452392578125, -2.3702392578125, -2.258026123046875, -2.14581298828125, -2.033599853515625, -1.92138671875, -1.809173583984375, -1.69696044921875, -1.584747314453125, -1.4725341796875, -1.360321044921875, -1.24810791015625, -1.135894775390625, -1.023681640625, -0.911468505859375, -0.79925537109375, -0.687042236328125, -0.5748291015625, -0.462615966796875, -0.35040283203125, -0.238189697265625, -0.1259765625, -0.013763427734375, 0.09844970703125, 0.210662841796875, 0.3228759765625, 0.435089111328125, 0.54730224609375, 0.659515380859375, 0.771728515625, 0.883941650390625, 0.99615478515625, 1.108367919921875, 1.2205810546875, 1.332794189453125, 1.44500732421875, 1.557220458984375, 1.66943359375, 1.781646728515625, 1.89385986328125, 2.006072998046875, 2.1182861328125, 2.230499267578125, 2.34271240234375, 2.454925537109375, 2.567138671875, 2.679351806640625, 2.79156494140625, 2.903778076171875, 3.0159912109375, 3.128204345703125, 3.24041748046875, 3.352630615234375, 3.46484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 9.0, 19.0, 41.0, 40.0, 68.0, 103.0, 179.0, 287.0, 505.0, 983.0, 1942.0, 3864.0, 9139.0, 21850.0, 61417.0, 198992.0, 431662.0, 211673.0, 64951.0, 23139.0, 9180.0, 4166.0, 1977.0, 974.0, 528.0, 315.0, 183.0, 110.0, 64.0, 55.0, 36.0, 18.0, 23.0, 13.0, 6.0, 10.0, 3.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.33258056640625, -2.2608642578125, -2.18914794921875, -2.117431640625, -2.04571533203125, -1.9739990234375, -1.90228271484375, -1.83056640625, -1.75885009765625, -1.6871337890625, -1.61541748046875, -1.543701171875, -1.47198486328125, -1.4002685546875, -1.32855224609375, -1.2568359375, -1.18511962890625, -1.1134033203125, -1.04168701171875, -0.969970703125, -0.89825439453125, -0.8265380859375, -0.75482177734375, -0.68310546875, -0.61138916015625, -0.5396728515625, -0.46795654296875, -0.396240234375, -0.32452392578125, -0.2528076171875, -0.18109130859375, -0.109375, -0.03765869140625, 0.0340576171875, 0.10577392578125, 0.177490234375, 0.24920654296875, 0.3209228515625, 0.39263916015625, 0.46435546875, 0.53607177734375, 0.6077880859375, 0.67950439453125, 0.751220703125, 0.82293701171875, 0.8946533203125, 0.96636962890625, 1.0380859375, 1.10980224609375, 1.1815185546875, 1.25323486328125, 1.324951171875, 1.39666748046875, 1.4683837890625, 1.54010009765625, 1.61181640625, 1.68353271484375, 1.7552490234375, 1.82696533203125, 1.898681640625, 1.97039794921875, 2.0421142578125, 2.11383056640625, 2.185546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 6.0, 11.0, 18.0, 14.0, 22.0, 18.0, 40.0, 40.0, 62.0, 83.0, 96.0, 142.0, 103.0, 86.0, 62.0, 43.0, 36.0, 20.0, 19.0, 15.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006465911865234375, -0.0006297975778579712, -0.0006130039691925049, -0.0005962103605270386, -0.0005794167518615723, -0.000562623143196106, -0.0005458295345306396, -0.0005290359258651733, -0.000512242317199707, -0.0004954487085342407, -0.0004786550998687744, -0.0004618614912033081, -0.0004450678825378418, -0.0004282742738723755, -0.0004114806652069092, -0.00039468705654144287, -0.00037789344787597656, -0.00036109983921051025, -0.00034430623054504395, -0.00032751262187957764, -0.00031071901321411133, -0.000293925404548645, -0.0002771317958831787, -0.0002603381872177124, -0.0002435445785522461, -0.00022675096988677979, -0.00020995736122131348, -0.00019316375255584717, -0.00017637014389038086, -0.00015957653522491455, -0.00014278292655944824, -0.00012598931789398193, -0.00010919570922851562, -9.240210056304932e-05, -7.560849189758301e-05, -5.88148832321167e-05, -4.202127456665039e-05, -2.5227665901184082e-05, -8.434057235717773e-06, 8.359551429748535e-06, 2.5153160095214844e-05, 4.194676876068115e-05, 5.874037742614746e-05, 7.553398609161377e-05, 9.232759475708008e-05, 0.00010912120342254639, 0.0001259148120880127, 0.000142708420753479, 0.0001595020294189453, 0.00017629563808441162, 0.00019308924674987793, 0.00020988285541534424, 0.00022667646408081055, 0.00024347007274627686, 0.00026026368141174316, 0.00027705729007720947, 0.0002938508987426758, 0.0003106445074081421, 0.0003274381160736084, 0.0003442317247390747, 0.000361025333404541, 0.0003778189420700073, 0.00039461255073547363, 0.00041140615940093994, 0.00042819976806640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 17.0, 26.0, 33.0, 81.0, 136.0, 283.0, 661.0, 1782.0, 6038.0, 29931.0, 266575.0, 653319.0, 72826.0, 12132.0, 2916.0, 952.0, 397.0, 175.0, 104.0, 55.0, 27.0, 20.0, 13.0, 9.0, 5.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4493408203125, -4.297119140625, -4.1448974609375, -3.99267578125, -3.8404541015625, -3.688232421875, -3.5360107421875, -3.3837890625, -3.2315673828125, -3.079345703125, -2.9271240234375, -2.77490234375, -2.6226806640625, -2.470458984375, -2.3182373046875, -2.166015625, -2.0137939453125, -1.861572265625, -1.7093505859375, -1.55712890625, -1.4049072265625, -1.252685546875, -1.1004638671875, -0.9482421875, -0.7960205078125, -0.643798828125, -0.4915771484375, -0.33935546875, -0.1871337890625, -0.034912109375, 0.1173095703125, 0.26953125, 0.4217529296875, 0.573974609375, 0.7261962890625, 0.87841796875, 1.0306396484375, 1.182861328125, 1.3350830078125, 1.4873046875, 1.6395263671875, 1.791748046875, 1.9439697265625, 2.09619140625, 2.2484130859375, 2.400634765625, 2.5528564453125, 2.705078125, 2.8572998046875, 3.009521484375, 3.1617431640625, 3.31396484375, 3.4661865234375, 3.618408203125, 3.7706298828125, 3.9228515625, 4.0750732421875, 4.227294921875, 4.3795166015625, 4.53173828125, 4.6839599609375, 4.836181640625, 4.9884033203125, 5.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 5.0, 8.0, 4.0, 10.0, 8.0, 10.0, 18.0, 20.0, 14.0, 23.0, 36.0, 46.0, 56.0, 59.0, 63.0, 81.0, 86.0, 67.0, 83.0, 55.0, 55.0, 41.0, 32.0, 30.0, 18.0, 14.0, 10.0, 15.0, 7.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6953125, -1.63916015625, -1.5830078125, -1.52685546875, -1.470703125, -1.41455078125, -1.3583984375, -1.30224609375, -1.24609375, -1.18994140625, -1.1337890625, -1.07763671875, -1.021484375, -0.96533203125, -0.9091796875, -0.85302734375, -0.796875, -0.74072265625, -0.6845703125, -0.62841796875, -0.572265625, -0.51611328125, -0.4599609375, -0.40380859375, -0.34765625, -0.29150390625, -0.2353515625, -0.17919921875, -0.123046875, -0.06689453125, -0.0107421875, 0.04541015625, 0.1015625, 0.15771484375, 0.2138671875, 0.27001953125, 0.326171875, 0.38232421875, 0.4384765625, 0.49462890625, 0.55078125, 0.60693359375, 0.6630859375, 0.71923828125, 0.775390625, 0.83154296875, 0.8876953125, 0.94384765625, 1.0, 1.05615234375, 1.1123046875, 1.16845703125, 1.224609375, 1.28076171875, 1.3369140625, 1.39306640625, 1.44921875, 1.50537109375, 1.5615234375, 1.61767578125, 1.673828125, 1.72998046875, 1.7861328125, 1.84228515625, 1.8984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 10.0, 25.0, 46.0, 86.0, 192.0, 213.0, 219.0, 107.0, 70.0, 21.0, 13.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.60674285888672, -48.90692901611328, -47.20711898803711, -45.50730514526367, -43.807491302490234, -42.10768127441406, -40.407867431640625, -38.70805358886719, -37.00823974609375, -35.30842590332031, -33.60861587524414, -31.908802032470703, -30.208988189697266, -28.50917625427246, -26.809364318847656, -25.10955047607422, -23.409740447998047, -21.709928512573242, -20.010114669799805, -18.310302734375, -16.610488891601562, -14.910676956176758, -13.210865020751953, -11.511052131652832, -9.811239242553711, -8.11142635345459, -6.411613941192627, -4.711801528930664, -3.011988639831543, -1.3121757507324219, 0.3876361846923828, 2.087449073791504, 3.7872581481933594, 5.4870710372924805, 7.186883449554443, 8.886695861816406, 10.586508750915527, 12.286321640014648, 13.986133575439453, 15.685946464538574, 17.385759353637695, 19.0855712890625, 20.785385131835938, 22.485197067260742, 24.185009002685547, 25.884822845458984, 27.58463478088379, 29.284446716308594, 30.98426055908203, 32.68407440185547, 34.38388442993164, 36.08369827270508, 37.783512115478516, 39.48332214355469, 41.183135986328125, 42.88294982910156, 44.582763671875, 46.28257751464844, 47.98238754272461, 49.68220138549805, 51.382015228271484, 53.081825256347656, 54.781639099121094, 56.48145294189453, 58.1812629699707]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 16.0, 16.0, 17.0, 28.0, 28.0, 34.0, 31.0, 49.0, 33.0, 40.0, 49.0, 51.0, 39.0, 40.0, 40.0, 35.0, 45.0, 32.0, 35.0, 28.0, 22.0, 30.0, 16.0, 28.0, 23.0, 18.0, 14.0, 15.0, 12.0, 9.0, 10.0, 5.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.762094497680664, -18.190765380859375, -17.61943817138672, -17.04810905456543, -16.47677993774414, -15.905450820922852, -15.334122657775879, -14.762794494628906, -14.191465377807617, -13.620136260986328, -13.048808097839355, -12.477479934692383, -11.906150817871094, -11.334821701049805, -10.763493537902832, -10.19216537475586, -9.62083625793457, -9.049507141113281, -8.478178977966309, -7.906850337982178, -7.335521697998047, -6.764193058013916, -6.192864418029785, -5.621535778045654, -5.050207138061523, -4.478878498077393, -3.9075498580932617, -3.336221218109131, -2.764892578125, -2.193563938140869, -1.6222352981567383, -1.0509066581726074, -0.47957611083984375, 0.09175252914428711, 0.663081169128418, 1.2344098091125488, 1.8057384490966797, 2.3770670890808105, 2.9483957290649414, 3.5197243690490723, 4.091053009033203, 4.662381649017334, 5.233710289001465, 5.805038928985596, 6.376367568969727, 6.947696208953857, 7.519024848937988, 8.090353012084961, 8.66168212890625, 9.233011245727539, 9.804339408874512, 10.375667572021484, 10.946996688842773, 11.518325805664062, 12.089653968811035, 12.660982131958008, 13.232311248779297, 13.803640365600586, 14.374968528747559, 14.946296691894531, 15.51762580871582, 16.08895492553711, 16.660282135009766, 17.231611251831055, 17.802940368652344]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 10.0, 5.0, 16.0, 18.0, 32.0, 58.0, 124.0, 172.0, 375.0, 849.0, 2433.0, 8437.0, 52844.0, 3877006.0, 226523.0, 18629.0, 4189.0, 1348.0, 567.0, 281.0, 147.0, 85.0, 49.0, 26.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.73583984375, -8.4091796875, -8.08251953125, -7.755859375, -7.42919921875, -7.1025390625, -6.77587890625, -6.44921875, -6.12255859375, -5.7958984375, -5.46923828125, -5.142578125, -4.81591796875, -4.4892578125, -4.16259765625, -3.8359375, -3.50927734375, -3.1826171875, -2.85595703125, -2.529296875, -2.20263671875, -1.8759765625, -1.54931640625, -1.22265625, -0.89599609375, -0.5693359375, -0.24267578125, 0.083984375, 0.41064453125, 0.7373046875, 1.06396484375, 1.390625, 1.71728515625, 2.0439453125, 2.37060546875, 2.697265625, 3.02392578125, 3.3505859375, 3.67724609375, 4.00390625, 4.33056640625, 4.6572265625, 4.98388671875, 5.310546875, 5.63720703125, 5.9638671875, 6.29052734375, 6.6171875, 6.94384765625, 7.2705078125, 7.59716796875, 7.923828125, 8.25048828125, 8.5771484375, 8.90380859375, 9.23046875, 9.55712890625, 9.8837890625, 10.21044921875, 10.537109375, 10.86376953125, 11.1904296875, 11.51708984375, 11.84375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 11.0, 12.0, 16.0, 36.0, 45.0, 67.0, 69.0, 85.0, 101.0, 114.0, 95.0, 91.0, 74.0, 57.0, 48.0, 27.0, 15.0, 16.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.2063446044921875, -1.166595458984375, -1.1268463134765625, -1.08709716796875, -1.0473480224609375, -1.007598876953125, -0.9678497314453125, -0.9281005859375, -0.8883514404296875, -0.848602294921875, -0.8088531494140625, -0.76910400390625, -0.7293548583984375, -0.689605712890625, -0.6498565673828125, -0.610107421875, -0.5703582763671875, -0.530609130859375, -0.4908599853515625, -0.45111083984375, -0.4113616943359375, -0.371612548828125, -0.3318634033203125, -0.2921142578125, -0.2523651123046875, -0.212615966796875, -0.1728668212890625, -0.13311767578125, -0.0933685302734375, -0.053619384765625, -0.0138702392578125, 0.02587890625, 0.0656280517578125, 0.105377197265625, 0.1451263427734375, 0.18487548828125, 0.2246246337890625, 0.264373779296875, 0.3041229248046875, 0.3438720703125, 0.3836212158203125, 0.423370361328125, 0.4631195068359375, 0.50286865234375, 0.5426177978515625, 0.582366943359375, 0.6221160888671875, 0.661865234375, 0.7016143798828125, 0.741363525390625, 0.7811126708984375, 0.82086181640625, 0.8606109619140625, 0.900360107421875, 0.9401092529296875, 0.9798583984375, 1.0196075439453125, 1.059356689453125, 1.0991058349609375, 1.13885498046875, 1.1786041259765625, 1.218353271484375, 1.2581024169921875, 1.2978515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 8.0, 11.0, 29.0, 43.0, 83.0, 104.0, 164.0, 272.0, 429.0, 768.0, 1307.0, 2433.0, 5325.0, 12096.0, 31155.0, 106755.0, 858664.0, 2940553.0, 161164.0, 42999.0, 15817.0, 6814.0, 3344.0, 1757.0, 933.0, 496.0, 281.0, 195.0, 98.0, 58.0, 37.0, 23.0, 25.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.29296875, -5.150421142578125, -5.00787353515625, -4.865325927734375, -4.7227783203125, -4.580230712890625, -4.43768310546875, -4.295135498046875, -4.152587890625, -4.010040283203125, -3.86749267578125, -3.724945068359375, -3.5823974609375, -3.439849853515625, -3.29730224609375, -3.154754638671875, -3.01220703125, -2.869659423828125, -2.72711181640625, -2.584564208984375, -2.4420166015625, -2.299468994140625, -2.15692138671875, -2.014373779296875, -1.871826171875, -1.729278564453125, -1.58673095703125, -1.444183349609375, -1.3016357421875, -1.159088134765625, -1.01654052734375, -0.873992919921875, -0.7314453125, -0.588897705078125, -0.44635009765625, -0.303802490234375, -0.1612548828125, -0.018707275390625, 0.12384033203125, 0.266387939453125, 0.408935546875, 0.551483154296875, 0.69403076171875, 0.836578369140625, 0.9791259765625, 1.121673583984375, 1.26422119140625, 1.406768798828125, 1.54931640625, 1.691864013671875, 1.83441162109375, 1.976959228515625, 2.1195068359375, 2.262054443359375, 2.40460205078125, 2.547149658203125, 2.689697265625, 2.832244873046875, 2.97479248046875, 3.117340087890625, 3.2598876953125, 3.402435302734375, 3.54498291015625, 3.687530517578125, 3.830078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 12.0, 12.0, 18.0, 29.0, 24.0, 50.0, 51.0, 90.0, 149.0, 234.0, 600.0, 1646.0, 481.0, 199.0, 146.0, 76.0, 60.0, 38.0, 31.0, 26.0, 16.0, 9.0, 22.0, 10.0, 0.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.3683929443359375, -1.328582763671875, -1.2887725830078125, -1.24896240234375, -1.2091522216796875, -1.169342041015625, -1.1295318603515625, -1.0897216796875, -1.0499114990234375, -1.010101318359375, -0.9702911376953125, -0.93048095703125, -0.8906707763671875, -0.850860595703125, -0.8110504150390625, -0.771240234375, -0.7314300537109375, -0.691619873046875, -0.6518096923828125, -0.61199951171875, -0.5721893310546875, -0.532379150390625, -0.4925689697265625, -0.4527587890625, -0.4129486083984375, -0.373138427734375, -0.3333282470703125, -0.29351806640625, -0.2537078857421875, -0.213897705078125, -0.1740875244140625, -0.13427734375, -0.0944671630859375, -0.054656982421875, -0.0148468017578125, 0.02496337890625, 0.0647735595703125, 0.104583740234375, 0.1443939208984375, 0.1842041015625, 0.2240142822265625, 0.263824462890625, 0.3036346435546875, 0.34344482421875, 0.3832550048828125, 0.423065185546875, 0.4628753662109375, 0.502685546875, 0.5424957275390625, 0.582305908203125, 0.6221160888671875, 0.66192626953125, 0.7017364501953125, 0.741546630859375, 0.7813568115234375, 0.8211669921875, 0.8609771728515625, 0.900787353515625, 0.9405975341796875, 0.98040771484375, 1.0202178955078125, 1.060028076171875, 1.0998382568359375, 1.1396484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 23.0, 39.0, 103.0, 199.0, 244.0, 201.0, 122.0, 43.0, 14.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.255008697509766, -8.690715789794922, -8.126422882080078, -7.562129974365234, -6.997837066650391, -6.433544158935547, -5.869251251220703, -5.304958343505859, -4.740665435791016, -4.176372528076172, -3.612079620361328, -3.0477867126464844, -2.4834938049316406, -1.9192008972167969, -1.3549079895019531, -0.7906150817871094, -0.22632217407226562, 0.3379707336425781, 0.9022636413574219, 1.4665565490722656, 2.0308494567871094, 2.595142364501953, 3.159435272216797, 3.7237281799316406, 4.288021087646484, 4.852313995361328, 5.416606903076172, 5.980899810791016, 6.545192718505859, 7.109485626220703, 7.673778533935547, 8.23807144165039, 8.802366256713867, 9.366659164428711, 9.930952072143555, 10.495244979858398, 11.059537887573242, 11.623830795288086, 12.18812370300293, 12.752416610717773, 13.316709518432617, 13.881002426147461, 14.445295333862305, 15.009588241577148, 15.573881149291992, 16.138174057006836, 16.70246696472168, 17.266759872436523, 17.831052780151367, 18.39534568786621, 18.959638595581055, 19.5239315032959, 20.088224411010742, 20.652517318725586, 21.21681022644043, 21.781103134155273, 22.345396041870117, 22.90968894958496, 23.473981857299805, 24.03827476501465, 24.602567672729492, 25.166860580444336, 25.73115348815918, 26.295446395874023, 26.859739303588867]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 8.0, 7.0, 13.0, 5.0, 13.0, 16.0, 19.0, 19.0, 16.0, 12.0, 25.0, 40.0, 30.0, 34.0, 48.0, 34.0, 49.0, 39.0, 49.0, 55.0, 48.0, 54.0, 43.0, 44.0, 34.0, 33.0, 27.0, 23.0, 31.0, 15.0, 20.0, 19.0, 11.0, 15.0, 9.0, 11.0, 8.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.036235809326172, -4.883856296539307, -4.7314772605896, -4.579097747802734, -4.426718711853027, -4.274339199066162, -4.121959686279297, -3.9695804119110107, -3.8172011375427246, -3.6648218631744385, -3.5124425888061523, -3.360063076019287, -3.207683801651001, -3.055304527282715, -2.9029250144958496, -2.7505457401275635, -2.5981664657592773, -2.445787191390991, -2.293407917022705, -2.14102840423584, -1.9886491298675537, -1.8362698554992676, -1.683890461921692, -1.5315110683441162, -1.37913179397583, -1.226752519607544, -1.0743731260299683, -0.9219937920570374, -0.7696144580841064, -0.6172351241111755, -0.46485579013824463, -0.31247639656066895, -0.1600966453552246, -0.007717311382293701, 0.1446620225906372, 0.2970413565635681, 0.449420690536499, 0.6018000245094299, 0.7541793584823608, 0.9065587520599365, 1.0589380264282227, 1.2113173007965088, 1.3636966943740845, 1.5160760879516602, 1.6684553623199463, 1.8208346366882324, 1.973214030265808, 2.125593423843384, 2.27797269821167, 2.430351972579956, 2.582731246948242, 2.7351107597351074, 2.8874900341033936, 3.0398693084716797, 3.192248821258545, 3.344628095626831, 3.497007369995117, 3.6493866443634033, 3.8017659187316895, 3.9541454315185547, 4.106524467468262, 4.258903980255127, 4.411283493041992, 4.563662528991699, 4.7160420417785645]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 12.0, 20.0, 21.0, 35.0, 56.0, 67.0, 138.0, 224.0, 403.0, 637.0, 1264.0, 2524.0, 5935.0, 16749.0, 58984.0, 249263.0, 507625.0, 147737.0, 36771.0, 11397.0, 4421.0, 1929.0, 949.0, 570.0, 303.0, 177.0, 116.0, 73.0, 44.0, 39.0, 17.0, 9.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.71539306640625, -4.5362548828125, -4.35711669921875, -4.177978515625, -3.99884033203125, -3.8197021484375, -3.64056396484375, -3.46142578125, -3.28228759765625, -3.1031494140625, -2.92401123046875, -2.744873046875, -2.56573486328125, -2.3865966796875, -2.20745849609375, -2.0283203125, -1.84918212890625, -1.6700439453125, -1.49090576171875, -1.311767578125, -1.13262939453125, -0.9534912109375, -0.77435302734375, -0.59521484375, -0.41607666015625, -0.2369384765625, -0.05780029296875, 0.121337890625, 0.30047607421875, 0.4796142578125, 0.65875244140625, 0.837890625, 1.01702880859375, 1.1961669921875, 1.37530517578125, 1.554443359375, 1.73358154296875, 1.9127197265625, 2.09185791015625, 2.27099609375, 2.45013427734375, 2.6292724609375, 2.80841064453125, 2.987548828125, 3.16668701171875, 3.3458251953125, 3.52496337890625, 3.7041015625, 3.88323974609375, 4.0623779296875, 4.24151611328125, 4.420654296875, 4.59979248046875, 4.7789306640625, 4.95806884765625, 5.13720703125, 5.31634521484375, 5.4954833984375, 5.67462158203125, 5.853759765625, 6.03289794921875, 6.2120361328125, 6.39117431640625, 6.5703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 9.0, 14.0, 21.0, 26.0, 60.0, 52.0, 63.0, 68.0, 95.0, 99.0, 99.0, 88.0, 77.0, 61.0, 51.0, 32.0, 25.0, 21.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.0929718017578125, -1.056060791015625, -1.0191497802734375, -0.98223876953125, -0.9453277587890625, -0.908416748046875, -0.8715057373046875, -0.8345947265625, -0.7976837158203125, -0.760772705078125, -0.7238616943359375, -0.68695068359375, -0.6500396728515625, -0.613128662109375, -0.5762176513671875, -0.539306640625, -0.5023956298828125, -0.465484619140625, -0.4285736083984375, -0.39166259765625, -0.3547515869140625, -0.317840576171875, -0.2809295654296875, -0.2440185546875, -0.2071075439453125, -0.170196533203125, -0.1332855224609375, -0.09637451171875, -0.0594635009765625, -0.022552490234375, 0.0143585205078125, 0.05126953125, 0.0881805419921875, 0.125091552734375, 0.1620025634765625, 0.19891357421875, 0.2358245849609375, 0.272735595703125, 0.3096466064453125, 0.3465576171875, 0.3834686279296875, 0.420379638671875, 0.4572906494140625, 0.49420166015625, 0.5311126708984375, 0.568023681640625, 0.6049346923828125, 0.641845703125, 0.6787567138671875, 0.715667724609375, 0.7525787353515625, 0.78948974609375, 0.8264007568359375, 0.863311767578125, 0.9002227783203125, 0.9371337890625, 0.9740447998046875, 1.010955810546875, 1.0478668212890625, 1.08477783203125, 1.1216888427734375, 1.158599853515625, 1.1955108642578125, 1.232421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 7.0, 6.0, 14.0, 12.0, 16.0, 13.0, 32.0, 33.0, 51.0, 77.0, 127.0, 221.0, 357.0, 604.0, 1232.0, 3127.0, 10091.0, 45702.0, 255098.0, 563580.0, 132593.0, 24930.0, 6258.0, 2169.0, 953.0, 485.0, 281.0, 167.0, 92.0, 60.0, 48.0, 25.0, 16.0, 20.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.30078125, -6.11163330078125, -5.9224853515625, -5.73333740234375, -5.544189453125, -5.35504150390625, -5.1658935546875, -4.97674560546875, -4.78759765625, -4.59844970703125, -4.4093017578125, -4.22015380859375, -4.031005859375, -3.84185791015625, -3.6527099609375, -3.46356201171875, -3.2744140625, -3.08526611328125, -2.8961181640625, -2.70697021484375, -2.517822265625, -2.32867431640625, -2.1395263671875, -1.95037841796875, -1.76123046875, -1.57208251953125, -1.3829345703125, -1.19378662109375, -1.004638671875, -0.81549072265625, -0.6263427734375, -0.43719482421875, -0.248046875, -0.05889892578125, 0.1302490234375, 0.31939697265625, 0.508544921875, 0.69769287109375, 0.8868408203125, 1.07598876953125, 1.26513671875, 1.45428466796875, 1.6434326171875, 1.83258056640625, 2.021728515625, 2.21087646484375, 2.4000244140625, 2.58917236328125, 2.7783203125, 2.96746826171875, 3.1566162109375, 3.34576416015625, 3.534912109375, 3.72406005859375, 3.9132080078125, 4.10235595703125, 4.29150390625, 4.48065185546875, 4.6697998046875, 4.85894775390625, 5.048095703125, 5.23724365234375, 5.4263916015625, 5.61553955078125, 5.8046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 2.0, 9.0, 7.0, 13.0, 4.0, 15.0, 13.0, 16.0, 17.0, 33.0, 27.0, 33.0, 23.0, 38.0, 29.0, 32.0, 34.0, 34.0, 35.0, 33.0, 43.0, 41.0, 44.0, 26.0, 39.0, 39.0, 29.0, 34.0, 26.0, 35.0, 34.0, 27.0, 20.0, 26.0, 10.0, 9.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.947265625, -2.85589599609375, -2.7645263671875, -2.67315673828125, -2.581787109375, -2.49041748046875, -2.3990478515625, -2.30767822265625, -2.21630859375, -2.12493896484375, -2.0335693359375, -1.94219970703125, -1.850830078125, -1.75946044921875, -1.6680908203125, -1.57672119140625, -1.4853515625, -1.39398193359375, -1.3026123046875, -1.21124267578125, -1.119873046875, -1.02850341796875, -0.9371337890625, -0.84576416015625, -0.75439453125, -0.66302490234375, -0.5716552734375, -0.48028564453125, -0.388916015625, -0.29754638671875, -0.2061767578125, -0.11480712890625, -0.0234375, 0.06793212890625, 0.1593017578125, 0.25067138671875, 0.342041015625, 0.43341064453125, 0.5247802734375, 0.61614990234375, 0.70751953125, 0.79888916015625, 0.8902587890625, 0.98162841796875, 1.072998046875, 1.16436767578125, 1.2557373046875, 1.34710693359375, 1.4384765625, 1.52984619140625, 1.6212158203125, 1.71258544921875, 1.803955078125, 1.89532470703125, 1.9866943359375, 2.07806396484375, 2.16943359375, 2.26080322265625, 2.3521728515625, 2.44354248046875, 2.534912109375, 2.62628173828125, 2.7176513671875, 2.80902099609375, 2.900390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 12.0, 38.0, 57.0, 106.0, 251.0, 595.0, 1508.0, 4319.0, 20946.0, 250414.0, 706343.0, 51986.0, 7984.0, 2411.0, 861.0, 371.0, 152.0, 71.0, 39.0, 23.0, 15.0, 12.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.647216796875, -5.46630859375, -5.285400390625, -5.1044921875, -4.923583984375, -4.74267578125, -4.561767578125, -4.380859375, -4.199951171875, -4.01904296875, -3.838134765625, -3.6572265625, -3.476318359375, -3.29541015625, -3.114501953125, -2.93359375, -2.752685546875, -2.57177734375, -2.390869140625, -2.2099609375, -2.029052734375, -1.84814453125, -1.667236328125, -1.486328125, -1.305419921875, -1.12451171875, -0.943603515625, -0.7626953125, -0.581787109375, -0.40087890625, -0.219970703125, -0.0390625, 0.141845703125, 0.32275390625, 0.503662109375, 0.6845703125, 0.865478515625, 1.04638671875, 1.227294921875, 1.408203125, 1.589111328125, 1.77001953125, 1.950927734375, 2.1318359375, 2.312744140625, 2.49365234375, 2.674560546875, 2.85546875, 3.036376953125, 3.21728515625, 3.398193359375, 3.5791015625, 3.760009765625, 3.94091796875, 4.121826171875, 4.302734375, 4.483642578125, 4.66455078125, 4.845458984375, 5.0263671875, 5.207275390625, 5.38818359375, 5.569091796875, 5.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 5.0, 14.0, 10.0, 23.0, 37.0, 50.0, 87.0, 138.0, 214.0, 157.0, 86.0, 50.0, 35.0, 33.0, 16.0, 13.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010004043579101562, -0.0009697899222373962, -0.0009391754865646362, -0.0009085610508918762, -0.0008779466152191162, -0.0008473321795463562, -0.0008167177438735962, -0.0007861033082008362, -0.0007554888725280762, -0.0007248744368553162, -0.0006942600011825562, -0.0006636455655097961, -0.0006330311298370361, -0.0006024166941642761, -0.0005718022584915161, -0.0005411878228187561, -0.0005105733871459961, -0.0004799589514732361, -0.0004493445158004761, -0.00041873008012771606, -0.00038811564445495605, -0.00035750120878219604, -0.00032688677310943604, -0.000296272337436676, -0.000265657901763916, -0.000235043466091156, -0.000204429030418396, -0.00017381459474563599, -0.00014320015907287598, -0.00011258572340011597, -8.197128772735596e-05, -5.135685205459595e-05, -2.0742416381835938e-05, 9.872019290924072e-06, 4.048645496368408e-05, 7.110089063644409e-05, 0.0001017153263092041, 0.0001323297619819641, 0.00016294419765472412, 0.00019355863332748413, 0.00022417306900024414, 0.00025478750467300415, 0.00028540194034576416, 0.00031601637601852417, 0.0003466308116912842, 0.0003772452473640442, 0.0004078596830368042, 0.0004384741187095642, 0.0004690885543823242, 0.0004997029900550842, 0.0005303174257278442, 0.0005609318614006042, 0.0005915462970733643, 0.0006221607327461243, 0.0006527751684188843, 0.0006833896040916443, 0.0007140040397644043, 0.0007446184754371643, 0.0007752329111099243, 0.0008058473467826843, 0.0008364617824554443, 0.0008670762181282043, 0.0008976906538009644, 0.0009283050894737244, 0.0009589195251464844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 21.0, 30.0, 46.0, 95.0, 165.0, 430.0, 943.0, 2772.0, 12141.0, 201717.0, 793554.0, 29205.0, 4933.0, 1426.0, 515.0, 259.0, 131.0, 72.0, 19.0, 13.0, 19.0, 4.0, 7.0, 12.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.95574951171875, -7.7161865234375, -7.47662353515625, -7.237060546875, -6.99749755859375, -6.7579345703125, -6.51837158203125, -6.27880859375, -6.03924560546875, -5.7996826171875, -5.56011962890625, -5.320556640625, -5.08099365234375, -4.8414306640625, -4.60186767578125, -4.3623046875, -4.12274169921875, -3.8831787109375, -3.64361572265625, -3.404052734375, -3.16448974609375, -2.9249267578125, -2.68536376953125, -2.44580078125, -2.20623779296875, -1.9666748046875, -1.72711181640625, -1.487548828125, -1.24798583984375, -1.0084228515625, -0.76885986328125, -0.529296875, -0.28973388671875, -0.0501708984375, 0.18939208984375, 0.428955078125, 0.66851806640625, 0.9080810546875, 1.14764404296875, 1.38720703125, 1.62677001953125, 1.8663330078125, 2.10589599609375, 2.345458984375, 2.58502197265625, 2.8245849609375, 3.06414794921875, 3.3037109375, 3.54327392578125, 3.7828369140625, 4.02239990234375, 4.261962890625, 4.50152587890625, 4.7410888671875, 4.98065185546875, 5.22021484375, 5.45977783203125, 5.6993408203125, 5.93890380859375, 6.178466796875, 6.41802978515625, 6.6575927734375, 6.89715576171875, 7.13671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 4.0, 10.0, 8.0, 11.0, 24.0, 30.0, 61.0, 112.0, 140.0, 170.0, 145.0, 108.0, 48.0, 29.0, 19.0, 21.0, 13.0, 9.0, 8.0, 3.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4765625, -3.36602783203125, -3.2554931640625, -3.14495849609375, -3.034423828125, -2.92388916015625, -2.8133544921875, -2.70281982421875, -2.59228515625, -2.48175048828125, -2.3712158203125, -2.26068115234375, -2.150146484375, -2.03961181640625, -1.9290771484375, -1.81854248046875, -1.7080078125, -1.59747314453125, -1.4869384765625, -1.37640380859375, -1.265869140625, -1.15533447265625, -1.0447998046875, -0.93426513671875, -0.82373046875, -0.71319580078125, -0.6026611328125, -0.49212646484375, -0.381591796875, -0.27105712890625, -0.1605224609375, -0.04998779296875, 0.060546875, 0.17108154296875, 0.2816162109375, 0.39215087890625, 0.502685546875, 0.61322021484375, 0.7237548828125, 0.83428955078125, 0.94482421875, 1.05535888671875, 1.1658935546875, 1.27642822265625, 1.386962890625, 1.49749755859375, 1.6080322265625, 1.71856689453125, 1.8291015625, 1.93963623046875, 2.0501708984375, 2.16070556640625, 2.271240234375, 2.38177490234375, 2.4923095703125, 2.60284423828125, 2.71337890625, 2.82391357421875, 2.9344482421875, 3.04498291015625, 3.155517578125, 3.26605224609375, 3.3765869140625, 3.48712158203125, 3.59765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 22.0, 32.0, 56.0, 79.0, 121.0, 123.0, 134.0, 132.0, 101.0, 69.0, 30.0, 24.0, 20.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.876922607421875, -17.836334228515625, -16.795745849609375, -15.755155563354492, -14.714567184448242, -13.673978805541992, -12.633389472961426, -11.59280014038086, -10.55221176147461, -9.51162338256836, -8.471034049987793, -7.430445194244385, -6.389856338500977, -5.349267482757568, -4.30867862701416, -3.268089771270752, -2.2275009155273438, -1.1869120597839355, -0.14632320404052734, 0.8942656517028809, 1.934854507446289, 2.9754433631896973, 4.0160322189331055, 5.056621074676514, 6.097209930419922, 7.13779878616333, 8.178387641906738, 9.218976974487305, 10.259565353393555, 11.300153732299805, 12.340743064880371, 13.381332397460938, 14.421920776367188, 15.462509155273438, 16.503097534179688, 17.54368782043457, 18.58427619934082, 19.62486457824707, 20.665454864501953, 21.706043243408203, 22.746631622314453, 23.787220001220703, 24.827808380126953, 25.868398666381836, 26.908987045288086, 27.949575424194336, 28.99016571044922, 30.03075408935547, 31.07134246826172, 32.11193084716797, 33.15251922607422, 34.19310760498047, 35.23369598388672, 36.274288177490234, 37.314876556396484, 38.355464935302734, 39.396053314208984, 40.436641693115234, 41.477230072021484, 42.517818450927734, 43.55841064453125, 44.5989990234375, 45.63958740234375, 46.68017578125, 47.72076416015625]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 8.0, 3.0, 7.0, 8.0, 12.0, 9.0, 16.0, 11.0, 16.0, 14.0, 21.0, 21.0, 33.0, 35.0, 37.0, 41.0, 44.0, 34.0, 51.0, 51.0, 52.0, 50.0, 53.0, 54.0, 37.0, 37.0, 41.0, 34.0, 31.0, 24.0, 24.0, 22.0, 11.0, 15.0, 7.0, 6.0, 6.0, 5.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.13074493408203, -19.472129821777344, -18.813514709472656, -18.1549015045166, -17.496286392211914, -16.837671279907227, -16.179058074951172, -15.520442962646484, -14.861827850341797, -14.20321273803711, -13.544598579406738, -12.885984420776367, -12.22736930847168, -11.568754196166992, -10.910140037536621, -10.25152587890625, -9.592910766601562, -8.934295654296875, -8.275681495666504, -7.617066860198975, -6.958452224731445, -6.299837589263916, -5.641222953796387, -4.982608318328857, -4.323993682861328, -3.665379047393799, -3.0067644119262695, -2.3481497764587402, -1.689535140991211, -1.0309205055236816, -0.37230587005615234, 0.28630876541137695, 0.9449214935302734, 1.6035361289978027, 2.262150764465332, 2.9207653999328613, 3.5793800354003906, 4.23799467086792, 4.896609306335449, 5.5552239418029785, 6.213838577270508, 6.872453212738037, 7.531067848205566, 8.189682006835938, 8.848297119140625, 9.506912231445312, 10.165526390075684, 10.824140548706055, 11.482755661010742, 12.14137077331543, 12.7999849319458, 13.458599090576172, 14.11721420288086, 14.775829315185547, 15.434443473815918, 16.09305763244629, 16.751672744750977, 17.410287857055664, 18.06890106201172, 18.727516174316406, 19.386131286621094, 20.04474639892578, 20.70336151123047, 21.361974716186523, 22.02058982849121]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 15.0, 14.0, 32.0, 56.0, 89.0, 171.0, 323.0, 782.0, 2145.0, 7431.0, 37323.0, 728180.0, 3346537.0, 56766.0, 9883.0, 2724.0, 974.0, 398.0, 179.0, 93.0, 57.0, 29.0, 30.0, 13.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.25238037109375, -4.9774169921875, -4.70245361328125, -4.427490234375, -4.15252685546875, -3.8775634765625, -3.60260009765625, -3.32763671875, -3.05267333984375, -2.7777099609375, -2.50274658203125, -2.227783203125, -1.95281982421875, -1.6778564453125, -1.40289306640625, -1.1279296875, -0.85296630859375, -0.5780029296875, -0.30303955078125, -0.028076171875, 0.24688720703125, 0.5218505859375, 0.79681396484375, 1.07177734375, 1.34674072265625, 1.6217041015625, 1.89666748046875, 2.171630859375, 2.44659423828125, 2.7215576171875, 2.99652099609375, 3.271484375, 3.54644775390625, 3.8214111328125, 4.09637451171875, 4.371337890625, 4.64630126953125, 4.9212646484375, 5.19622802734375, 5.47119140625, 5.74615478515625, 6.0211181640625, 6.29608154296875, 6.571044921875, 6.84600830078125, 7.1209716796875, 7.39593505859375, 7.6708984375, 7.94586181640625, 8.2208251953125, 8.49578857421875, 8.770751953125, 9.04571533203125, 9.3206787109375, 9.59564208984375, 9.87060546875, 10.14556884765625, 10.4205322265625, 10.69549560546875, 10.970458984375, 11.24542236328125, 11.5203857421875, 11.79534912109375, 12.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 16.0, 20.0, 27.0, 45.0, 54.0, 55.0, 76.0, 69.0, 88.0, 86.0, 98.0, 74.0, 70.0, 53.0, 44.0, 30.0, 30.0, 17.0, 7.0, 3.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1135101318359375, -1.076629638671875, -1.0397491455078125, -1.00286865234375, -0.9659881591796875, -0.929107666015625, -0.8922271728515625, -0.8553466796875, -0.8184661865234375, -0.781585693359375, -0.7447052001953125, -0.70782470703125, -0.6709442138671875, -0.634063720703125, -0.5971832275390625, -0.560302734375, -0.5234222412109375, -0.486541748046875, -0.4496612548828125, -0.41278076171875, -0.3759002685546875, -0.339019775390625, -0.3021392822265625, -0.2652587890625, -0.2283782958984375, -0.191497802734375, -0.1546173095703125, -0.11773681640625, -0.0808563232421875, -0.043975830078125, -0.0070953369140625, 0.02978515625, 0.0666656494140625, 0.103546142578125, 0.1404266357421875, 0.17730712890625, 0.2141876220703125, 0.251068115234375, 0.2879486083984375, 0.3248291015625, 0.3617095947265625, 0.398590087890625, 0.4354705810546875, 0.47235107421875, 0.5092315673828125, 0.546112060546875, 0.5829925537109375, 0.619873046875, 0.6567535400390625, 0.693634033203125, 0.7305145263671875, 0.76739501953125, 0.8042755126953125, 0.841156005859375, 0.8780364990234375, 0.9149169921875, 0.9517974853515625, 0.988677978515625, 1.0255584716796875, 1.06243896484375, 1.0993194580078125, 1.136199951171875, 1.1730804443359375, 1.2099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 17.0, 15.0, 18.0, 34.0, 31.0, 38.0, 71.0, 113.0, 162.0, 246.0, 410.0, 702.0, 1271.0, 2203.0, 4345.0, 9463.0, 22310.0, 63793.0, 228615.0, 2433427.0, 1171587.0, 169443.0, 50498.0, 18662.0, 8103.0, 3994.0, 1928.0, 1060.0, 611.0, 397.0, 224.0, 146.0, 90.0, 72.0, 49.0, 26.0, 27.0, 12.0, 9.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.92578125, -3.809967041015625, -3.69415283203125, -3.578338623046875, -3.4625244140625, -3.346710205078125, -3.23089599609375, -3.115081787109375, -2.999267578125, -2.883453369140625, -2.76763916015625, -2.651824951171875, -2.5360107421875, -2.420196533203125, -2.30438232421875, -2.188568115234375, -2.07275390625, -1.956939697265625, -1.84112548828125, -1.725311279296875, -1.6094970703125, -1.493682861328125, -1.37786865234375, -1.262054443359375, -1.146240234375, -1.030426025390625, -0.91461181640625, -0.798797607421875, -0.6829833984375, -0.567169189453125, -0.45135498046875, -0.335540771484375, -0.2197265625, -0.103912353515625, 0.01190185546875, 0.127716064453125, 0.2435302734375, 0.359344482421875, 0.47515869140625, 0.590972900390625, 0.706787109375, 0.822601318359375, 0.93841552734375, 1.054229736328125, 1.1700439453125, 1.285858154296875, 1.40167236328125, 1.517486572265625, 1.63330078125, 1.749114990234375, 1.86492919921875, 1.980743408203125, 2.0965576171875, 2.212371826171875, 2.32818603515625, 2.444000244140625, 2.559814453125, 2.675628662109375, 2.79144287109375, 2.907257080078125, 3.0230712890625, 3.138885498046875, 3.25469970703125, 3.370513916015625, 3.486328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 21.0, 18.0, 21.0, 36.0, 48.0, 58.0, 71.0, 112.0, 198.0, 298.0, 687.0, 1234.0, 471.0, 231.0, 166.0, 91.0, 72.0, 59.0, 39.0, 29.0, 18.0, 22.0, 10.0, 6.0, 10.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.625244140625, -1.56982421875, -1.514404296875, -1.458984375, -1.403564453125, -1.34814453125, -1.292724609375, -1.2373046875, -1.181884765625, -1.12646484375, -1.071044921875, -1.015625, -0.960205078125, -0.90478515625, -0.849365234375, -0.7939453125, -0.738525390625, -0.68310546875, -0.627685546875, -0.572265625, -0.516845703125, -0.46142578125, -0.406005859375, -0.3505859375, -0.295166015625, -0.23974609375, -0.184326171875, -0.12890625, -0.073486328125, -0.01806640625, 0.037353515625, 0.0927734375, 0.148193359375, 0.20361328125, 0.259033203125, 0.314453125, 0.369873046875, 0.42529296875, 0.480712890625, 0.5361328125, 0.591552734375, 0.64697265625, 0.702392578125, 0.7578125, 0.813232421875, 0.86865234375, 0.924072265625, 0.9794921875, 1.034912109375, 1.09033203125, 1.145751953125, 1.201171875, 1.256591796875, 1.31201171875, 1.367431640625, 1.4228515625, 1.478271484375, 1.53369140625, 1.589111328125, 1.64453125, 1.699951171875, 1.75537109375, 1.810791015625, 1.8662109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 13.0, 10.0, 17.0, 12.0, 27.0, 45.0, 70.0, 63.0, 72.0, 97.0, 91.0, 87.0, 73.0, 72.0, 65.0, 61.0, 31.0, 23.0, 19.0, 11.0, 1.0, 7.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.557207107543945, -12.254907608032227, -11.952608108520508, -11.650307655334473, -11.348008155822754, -11.045708656311035, -10.743408203125, -10.441108703613281, -10.138809204101562, -9.836509704589844, -9.534210205078125, -9.23190975189209, -8.929610252380371, -8.627310752868652, -8.325010299682617, -8.022710800170898, -7.72041130065918, -7.418111801147461, -7.115811824798584, -6.813511848449707, -6.511212348937988, -6.2089128494262695, -5.906612873077393, -5.604312896728516, -5.302013397216797, -4.999713897705078, -4.697413921356201, -4.395113945007324, -4.0928144454956055, -3.7905147075653076, -3.4882149696350098, -3.185915231704712, -2.8836164474487305, -2.5813167095184326, -2.2790169715881348, -1.976717233657837, -1.674417495727539, -1.3721177577972412, -1.0698180198669434, -0.7675182819366455, -0.46521854400634766, -0.1629188060760498, 0.13938093185424805, 0.4416806697845459, 0.7439804077148438, 1.0462801456451416, 1.3485798835754395, 1.6508796215057373, 1.9531793594360352, 2.255479097366333, 2.557778835296631, 2.8600785732269287, 3.1623783111572266, 3.4646780490875244, 3.7669777870178223, 4.069277763366699, 4.371577262878418, 4.673876762390137, 4.976176738739014, 5.278476715087891, 5.580776214599609, 5.883075714111328, 6.185375690460205, 6.487675666809082, 6.789975166320801]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 13.0, 10.0, 13.0, 19.0, 20.0, 23.0, 24.0, 21.0, 39.0, 28.0, 36.0, 38.0, 42.0, 43.0, 42.0, 52.0, 35.0, 20.0, 40.0, 31.0, 37.0, 34.0, 43.0, 39.0, 22.0, 27.0, 21.0, 26.0, 26.0, 23.0, 13.0, 14.0, 8.0, 10.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.001309394836426, -5.808198928833008, -5.61508846282959, -5.421977996826172, -5.228867530822754, -5.035757064819336, -4.842646598815918, -4.649536609649658, -4.45642614364624, -4.263315677642822, -4.070205211639404, -3.8770947456359863, -3.6839845180511475, -3.4908740520477295, -3.2977635860443115, -3.1046533584594727, -2.9115426540374756, -2.7184321880340576, -2.5253217220306396, -2.332211494445801, -2.139101028442383, -1.9459905624389648, -1.7528800964355469, -1.5597697496414185, -1.3666592836380005, -1.1735488176345825, -0.9804384708404541, -0.7873280048370361, -0.5942175984382629, -0.40110719203948975, -0.20799672603607178, -0.01488637924194336, 0.1782240867614746, 0.3713344931602478, 0.564444899559021, 0.757555365562439, 0.9506657719612122, 1.1437761783599854, 1.3368866443634033, 1.5299969911575317, 1.7231074571609497, 1.9162179231643677, 2.109328269958496, 2.302438735961914, 2.495549201965332, 2.68865966796875, 2.881770133972168, 3.074880361557007, 3.267990827560425, 3.4611012935638428, 3.6542117595672607, 3.8473219871520996, 4.040432453155518, 4.2335429191589355, 4.4266533851623535, 4.6197638511657715, 4.8128743171691895, 5.005984783172607, 5.199095249176025, 5.392205715179443, 5.585316181182861, 5.778426170349121, 5.971536636352539, 6.164647102355957, 6.357757568359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 18.0, 23.0, 37.0, 61.0, 66.0, 116.0, 205.0, 350.0, 529.0, 931.0, 1829.0, 3563.0, 7608.0, 17744.0, 46329.0, 143289.0, 461900.0, 245233.0, 72031.0, 26134.0, 10571.0, 4680.0, 2273.0, 1190.0, 691.0, 418.0, 230.0, 149.0, 108.0, 62.0, 41.0, 33.0, 18.0, 14.0, 9.0, 15.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.6484375, -5.498626708984375, -5.34881591796875, -5.199005126953125, -5.0491943359375, -4.899383544921875, -4.74957275390625, -4.599761962890625, -4.449951171875, -4.300140380859375, -4.15032958984375, -4.000518798828125, -3.8507080078125, -3.700897216796875, -3.55108642578125, -3.401275634765625, -3.25146484375, -3.101654052734375, -2.95184326171875, -2.802032470703125, -2.6522216796875, -2.502410888671875, -2.35260009765625, -2.202789306640625, -2.052978515625, -1.903167724609375, -1.75335693359375, -1.603546142578125, -1.4537353515625, -1.303924560546875, -1.15411376953125, -1.004302978515625, -0.8544921875, -0.704681396484375, -0.55487060546875, -0.405059814453125, -0.2552490234375, -0.105438232421875, 0.04437255859375, 0.194183349609375, 0.343994140625, 0.493804931640625, 0.64361572265625, 0.793426513671875, 0.9432373046875, 1.093048095703125, 1.24285888671875, 1.392669677734375, 1.54248046875, 1.692291259765625, 1.84210205078125, 1.991912841796875, 2.1417236328125, 2.291534423828125, 2.44134521484375, 2.591156005859375, 2.740966796875, 2.890777587890625, 3.04058837890625, 3.190399169921875, 3.3402099609375, 3.490020751953125, 3.63983154296875, 3.789642333984375, 3.939453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 13.0, 13.0, 21.0, 29.0, 39.0, 45.0, 44.0, 64.0, 74.0, 77.0, 92.0, 83.0, 70.0, 80.0, 65.0, 49.0, 43.0, 25.0, 24.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.09783935546875, -1.0609130859375, -1.02398681640625, -0.987060546875, -0.95013427734375, -0.9132080078125, -0.87628173828125, -0.83935546875, -0.80242919921875, -0.7655029296875, -0.72857666015625, -0.691650390625, -0.65472412109375, -0.6177978515625, -0.58087158203125, -0.5439453125, -0.50701904296875, -0.4700927734375, -0.43316650390625, -0.396240234375, -0.35931396484375, -0.3223876953125, -0.28546142578125, -0.24853515625, -0.21160888671875, -0.1746826171875, -0.13775634765625, -0.100830078125, -0.06390380859375, -0.0269775390625, 0.00994873046875, 0.046875, 0.08380126953125, 0.1207275390625, 0.15765380859375, 0.194580078125, 0.23150634765625, 0.2684326171875, 0.30535888671875, 0.34228515625, 0.37921142578125, 0.4161376953125, 0.45306396484375, 0.489990234375, 0.52691650390625, 0.5638427734375, 0.60076904296875, 0.6376953125, 0.67462158203125, 0.7115478515625, 0.74847412109375, 0.785400390625, 0.82232666015625, 0.8592529296875, 0.89617919921875, 0.93310546875, 0.97003173828125, 1.0069580078125, 1.04388427734375, 1.080810546875, 1.11773681640625, 1.1546630859375, 1.19158935546875, 1.228515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 11.0, 13.0, 18.0, 32.0, 40.0, 55.0, 81.0, 149.0, 232.0, 409.0, 810.0, 1687.0, 4137.0, 13064.0, 47918.0, 224149.0, 578638.0, 131655.0, 30762.0, 8697.0, 3118.0, 1271.0, 637.0, 343.0, 199.0, 114.0, 85.0, 50.0, 46.0, 29.0, 27.0, 15.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.890625, -4.71173095703125, -4.5328369140625, -4.35394287109375, -4.175048828125, -3.99615478515625, -3.8172607421875, -3.63836669921875, -3.45947265625, -3.28057861328125, -3.1016845703125, -2.92279052734375, -2.743896484375, -2.56500244140625, -2.3861083984375, -2.20721435546875, -2.0283203125, -1.84942626953125, -1.6705322265625, -1.49163818359375, -1.312744140625, -1.13385009765625, -0.9549560546875, -0.77606201171875, -0.59716796875, -0.41827392578125, -0.2393798828125, -0.06048583984375, 0.118408203125, 0.29730224609375, 0.4761962890625, 0.65509033203125, 0.833984375, 1.01287841796875, 1.1917724609375, 1.37066650390625, 1.549560546875, 1.72845458984375, 1.9073486328125, 2.08624267578125, 2.26513671875, 2.44403076171875, 2.6229248046875, 2.80181884765625, 2.980712890625, 3.15960693359375, 3.3385009765625, 3.51739501953125, 3.6962890625, 3.87518310546875, 4.0540771484375, 4.23297119140625, 4.411865234375, 4.59075927734375, 4.7696533203125, 4.94854736328125, 5.12744140625, 5.30633544921875, 5.4852294921875, 5.66412353515625, 5.843017578125, 6.02191162109375, 6.2008056640625, 6.37969970703125, 6.55859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 8.0, 15.0, 19.0, 14.0, 16.0, 25.0, 23.0, 38.0, 36.0, 40.0, 49.0, 52.0, 43.0, 50.0, 56.0, 53.0, 45.0, 48.0, 50.0, 53.0, 35.0, 40.0, 24.0, 25.0, 23.0, 19.0, 25.0, 11.0, 8.0, 6.0, 9.0, 11.0, 1.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.977783203125, -3.84619140625, -3.714599609375, -3.5830078125, -3.451416015625, -3.31982421875, -3.188232421875, -3.056640625, -2.925048828125, -2.79345703125, -2.661865234375, -2.5302734375, -2.398681640625, -2.26708984375, -2.135498046875, -2.00390625, -1.872314453125, -1.74072265625, -1.609130859375, -1.4775390625, -1.345947265625, -1.21435546875, -1.082763671875, -0.951171875, -0.819580078125, -0.68798828125, -0.556396484375, -0.4248046875, -0.293212890625, -0.16162109375, -0.030029296875, 0.1015625, 0.233154296875, 0.36474609375, 0.496337890625, 0.6279296875, 0.759521484375, 0.89111328125, 1.022705078125, 1.154296875, 1.285888671875, 1.41748046875, 1.549072265625, 1.6806640625, 1.812255859375, 1.94384765625, 2.075439453125, 2.20703125, 2.338623046875, 2.47021484375, 2.601806640625, 2.7333984375, 2.864990234375, 2.99658203125, 3.128173828125, 3.259765625, 3.391357421875, 3.52294921875, 3.654541015625, 3.7861328125, 3.917724609375, 4.04931640625, 4.180908203125, 4.3125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 14.0, 18.0, 28.0, 52.0, 80.0, 167.0, 340.0, 733.0, 1689.0, 5140.0, 22475.0, 180985.0, 720277.0, 95582.0, 14499.0, 3878.0, 1386.0, 609.0, 251.0, 140.0, 79.0, 36.0, 26.0, 15.0, 10.0, 9.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.85247802734375, -5.6658935546875, -5.47930908203125, -5.292724609375, -5.10614013671875, -4.9195556640625, -4.73297119140625, -4.54638671875, -4.35980224609375, -4.1732177734375, -3.98663330078125, -3.800048828125, -3.61346435546875, -3.4268798828125, -3.24029541015625, -3.0537109375, -2.86712646484375, -2.6805419921875, -2.49395751953125, -2.307373046875, -2.12078857421875, -1.9342041015625, -1.74761962890625, -1.56103515625, -1.37445068359375, -1.1878662109375, -1.00128173828125, -0.814697265625, -0.62811279296875, -0.4415283203125, -0.25494384765625, -0.068359375, 0.11822509765625, 0.3048095703125, 0.49139404296875, 0.677978515625, 0.86456298828125, 1.0511474609375, 1.23773193359375, 1.42431640625, 1.61090087890625, 1.7974853515625, 1.98406982421875, 2.170654296875, 2.35723876953125, 2.5438232421875, 2.73040771484375, 2.9169921875, 3.10357666015625, 3.2901611328125, 3.47674560546875, 3.663330078125, 3.84991455078125, 4.0364990234375, 4.22308349609375, 4.40966796875, 4.59625244140625, 4.7828369140625, 4.96942138671875, 5.156005859375, 5.34259033203125, 5.5291748046875, 5.71575927734375, 5.90234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 19.0, 21.0, 22.0, 36.0, 84.0, 180.0, 257.0, 126.0, 83.0, 48.0, 29.0, 16.0, 14.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.0009905099868774414, -0.0009529590606689453, -0.0009154081344604492, -0.0008778572082519531, -0.000840306282043457, -0.0008027553558349609, -0.0007652044296264648, -0.0007276535034179688, -0.0006901025772094727, -0.0006525516510009766, -0.0006150007247924805, -0.0005774497985839844, -0.0005398988723754883, -0.0005023479461669922, -0.0004647970199584961, -0.00042724609375, -0.0003896951675415039, -0.0003521442413330078, -0.0003145933151245117, -0.0002770423889160156, -0.00023949146270751953, -0.00020194053649902344, -0.00016438961029052734, -0.00012683868408203125, -8.928775787353516e-05, -5.173683166503906e-05, -1.4185905456542969e-05, 2.3365020751953125e-05, 6.091594696044922e-05, 9.846687316894531e-05, 0.0001360177993774414, 0.0001735687255859375, 0.0002111196517944336, 0.0002486705780029297, 0.0002862215042114258, 0.0003237724304199219, 0.00036132335662841797, 0.00039887428283691406, 0.00043642520904541016, 0.00047397613525390625, 0.0005115270614624023, 0.0005490779876708984, 0.0005866289138793945, 0.0006241798400878906, 0.0006617307662963867, 0.0006992816925048828, 0.0007368326187133789, 0.000774383544921875, 0.0008119344711303711, 0.0008494853973388672, 0.0008870363235473633, 0.0009245872497558594, 0.0009621381759643555, 0.0009996891021728516, 0.0010372400283813477, 0.0010747909545898438, 0.0011123418807983398, 0.001149892807006836, 0.001187443733215332, 0.0012249946594238281, 0.0012625455856323242, 0.0013000965118408203, 0.0013376474380493164, 0.0013751983642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 6.0, 8.0, 10.0, 12.0, 23.0, 41.0, 33.0, 48.0, 112.0, 211.0, 509.0, 1216.0, 3551.0, 13769.0, 88331.0, 731933.0, 178599.0, 22049.0, 5269.0, 1581.0, 605.0, 292.0, 129.0, 88.0, 44.0, 30.0, 18.0, 17.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.9296875, -6.7503662109375, -6.571044921875, -6.3917236328125, -6.21240234375, -6.0330810546875, -5.853759765625, -5.6744384765625, -5.4951171875, -5.3157958984375, -5.136474609375, -4.9571533203125, -4.77783203125, -4.5985107421875, -4.419189453125, -4.2398681640625, -4.060546875, -3.8812255859375, -3.701904296875, -3.5225830078125, -3.34326171875, -3.1639404296875, -2.984619140625, -2.8052978515625, -2.6259765625, -2.4466552734375, -2.267333984375, -2.0880126953125, -1.90869140625, -1.7293701171875, -1.550048828125, -1.3707275390625, -1.19140625, -1.0120849609375, -0.832763671875, -0.6534423828125, -0.47412109375, -0.2947998046875, -0.115478515625, 0.0638427734375, 0.2431640625, 0.4224853515625, 0.601806640625, 0.7811279296875, 0.96044921875, 1.1397705078125, 1.319091796875, 1.4984130859375, 1.677734375, 1.8570556640625, 2.036376953125, 2.2156982421875, 2.39501953125, 2.5743408203125, 2.753662109375, 2.9329833984375, 3.1123046875, 3.2916259765625, 3.470947265625, 3.6502685546875, 3.82958984375, 4.0089111328125, 4.188232421875, 4.3675537109375, 4.546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 6.0, 14.0, 23.0, 30.0, 52.0, 60.0, 81.0, 132.0, 153.0, 121.0, 77.0, 54.0, 39.0, 33.0, 22.0, 19.0, 14.0, 14.0, 6.0, 5.0, 2.0, 1.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.91156005859375, -3.8074951171875, -3.70343017578125, -3.599365234375, -3.49530029296875, -3.3912353515625, -3.28717041015625, -3.18310546875, -3.07904052734375, -2.9749755859375, -2.87091064453125, -2.766845703125, -2.66278076171875, -2.5587158203125, -2.45465087890625, -2.3505859375, -2.24652099609375, -2.1424560546875, -2.03839111328125, -1.934326171875, -1.83026123046875, -1.7261962890625, -1.62213134765625, -1.51806640625, -1.41400146484375, -1.3099365234375, -1.20587158203125, -1.101806640625, -0.99774169921875, -0.8936767578125, -0.78961181640625, -0.685546875, -0.58148193359375, -0.4774169921875, -0.37335205078125, -0.269287109375, -0.16522216796875, -0.0611572265625, 0.04290771484375, 0.14697265625, 0.25103759765625, 0.3551025390625, 0.45916748046875, 0.563232421875, 0.66729736328125, 0.7713623046875, 0.87542724609375, 0.9794921875, 1.08355712890625, 1.1876220703125, 1.29168701171875, 1.395751953125, 1.49981689453125, 1.6038818359375, 1.70794677734375, 1.81201171875, 1.91607666015625, 2.0201416015625, 2.12420654296875, 2.228271484375, 2.33233642578125, 2.4364013671875, 2.54046630859375, 2.64453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 16.0, 30.0, 33.0, 46.0, 97.0, 138.0, 122.0, 125.0, 96.0, 101.0, 68.0, 46.0, 32.0, 17.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.55727767944336, -18.358530044555664, -17.15978240966797, -15.961034774780273, -14.762287139892578, -13.563539505004883, -12.364792823791504, -11.166045188903809, -9.967297554016113, -8.768549919128418, -7.569802284240723, -6.3710551261901855, -5.17230749130249, -3.973559856414795, -2.774812698364258, -1.5760650634765625, -0.3773174285888672, 0.8214300870895386, 2.0201776027679443, 3.2189249992370605, 4.417672634124756, 5.616420269012451, 6.815167427062988, 8.013915061950684, 9.212662696838379, 10.411410331726074, 11.61015796661377, 12.808904647827148, 14.007652282714844, 15.206399917602539, 16.405147552490234, 17.60389518737793, 18.802642822265625, 20.00139045715332, 21.200138092041016, 22.39888572692871, 23.597633361816406, 24.7963809967041, 25.995128631591797, 27.19387435913086, 28.392623901367188, 29.591371536254883, 30.790119171142578, 31.988866806030273, 33.18761444091797, 34.38636016845703, 35.58510971069336, 36.78385543823242, 37.98260498046875, 39.18135070800781, 40.38010025024414, 41.5788459777832, 42.77759552001953, 43.976341247558594, 45.17509078979492, 46.373836517333984, 47.57258224487305, 48.77132797241211, 49.97007751464844, 51.1688232421875, 52.36757278442383, 53.56631851196289, 54.76506805419922, 55.96381378173828, 57.16256332397461]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 4.0, 6.0, 7.0, 15.0, 7.0, 13.0, 18.0, 21.0, 17.0, 21.0, 26.0, 40.0, 31.0, 35.0, 51.0, 41.0, 46.0, 57.0, 55.0, 53.0, 42.0, 44.0, 45.0, 43.0, 42.0, 28.0, 34.0, 28.0, 17.0, 21.0, 15.0, 10.0, 9.0, 9.0, 13.0, 7.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.261754989624023, -22.515945434570312, -21.770137786865234, -21.024328231811523, -20.278520584106445, -19.532711029052734, -18.786903381347656, -18.041093826293945, -17.295284271240234, -16.549474716186523, -15.803667068481445, -15.057857513427734, -14.312049865722656, -13.566240310668945, -12.82043170928955, -12.074623107910156, -11.328815460205078, -10.583006858825684, -9.837198257446289, -9.091388702392578, -8.3455810546875, -7.599771976470947, -6.8539628982543945, -6.108154296875, -5.3623456954956055, -4.616537094116211, -3.8707282543182373, -3.1249194145202637, -2.379110813140869, -1.6333022117614746, -0.8874931335449219, -0.14168453216552734, 0.6041259765625, 1.349934697151184, 2.095743417739868, 2.841552257537842, 3.5873608589172363, 4.333169460296631, 5.078978538513184, 5.824787139892578, 6.570595741271973, 7.316404342651367, 8.062212944030762, 8.808021545410156, 9.553831100463867, 10.299638748168945, 11.045448303222656, 11.79125690460205, 12.537065505981445, 13.28287410736084, 14.028682708740234, 14.774492263793945, 15.520299911499023, 16.266109466552734, 17.011917114257812, 17.757726669311523, 18.503536224365234, 19.249345779418945, 19.995153427124023, 20.740962982177734, 21.486770629882812, 22.232580184936523, 22.978389739990234, 23.724197387695312, 24.47000503540039]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 13.0, 37.0, 44.0, 70.0, 129.0, 190.0, 315.0, 656.0, 1445.0, 3117.0, 8351.0, 28304.0, 147610.0, 3687280.0, 259215.0, 39554.0, 10922.0, 3875.0, 1561.0, 712.0, 360.0, 200.0, 96.0, 51.0, 44.0, 34.0, 25.0, 10.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.3046875, -6.0987548828125, -5.892822265625, -5.6868896484375, -5.48095703125, -5.2750244140625, -5.069091796875, -4.8631591796875, -4.6572265625, -4.4512939453125, -4.245361328125, -4.0394287109375, -3.83349609375, -3.6275634765625, -3.421630859375, -3.2156982421875, -3.009765625, -2.8038330078125, -2.597900390625, -2.3919677734375, -2.18603515625, -1.9801025390625, -1.774169921875, -1.5682373046875, -1.3623046875, -1.1563720703125, -0.950439453125, -0.7445068359375, -0.53857421875, -0.3326416015625, -0.126708984375, 0.0792236328125, 0.28515625, 0.4910888671875, 0.697021484375, 0.9029541015625, 1.10888671875, 1.3148193359375, 1.520751953125, 1.7266845703125, 1.9326171875, 2.1385498046875, 2.344482421875, 2.5504150390625, 2.75634765625, 2.9622802734375, 3.168212890625, 3.3741455078125, 3.580078125, 3.7860107421875, 3.991943359375, 4.1978759765625, 4.40380859375, 4.6097412109375, 4.815673828125, 5.0216064453125, 5.2275390625, 5.4334716796875, 5.639404296875, 5.8453369140625, 6.05126953125, 6.2572021484375, 6.463134765625, 6.6690673828125, 6.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 14.0, 24.0, 30.0, 21.0, 28.0, 49.0, 51.0, 72.0, 72.0, 75.0, 71.0, 68.0, 59.0, 68.0, 59.0, 44.0, 36.0, 35.0, 29.0, 22.0, 13.0, 7.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.090240478515625, -1.05352783203125, -1.016815185546875, -0.9801025390625, -0.943389892578125, -0.90667724609375, -0.869964599609375, -0.833251953125, -0.796539306640625, -0.75982666015625, -0.723114013671875, -0.6864013671875, -0.649688720703125, -0.61297607421875, -0.576263427734375, -0.53955078125, -0.502838134765625, -0.46612548828125, -0.429412841796875, -0.3927001953125, -0.355987548828125, -0.31927490234375, -0.282562255859375, -0.245849609375, -0.209136962890625, -0.17242431640625, -0.135711669921875, -0.0989990234375, -0.062286376953125, -0.02557373046875, 0.011138916015625, 0.0478515625, 0.084564208984375, 0.12127685546875, 0.157989501953125, 0.1947021484375, 0.231414794921875, 0.26812744140625, 0.304840087890625, 0.341552734375, 0.378265380859375, 0.41497802734375, 0.451690673828125, 0.4884033203125, 0.525115966796875, 0.56182861328125, 0.598541259765625, 0.63525390625, 0.671966552734375, 0.70867919921875, 0.745391845703125, 0.7821044921875, 0.818817138671875, 0.85552978515625, 0.892242431640625, 0.928955078125, 0.965667724609375, 1.00238037109375, 1.039093017578125, 1.0758056640625, 1.112518310546875, 1.14923095703125, 1.185943603515625, 1.22265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 17.0, 22.0, 19.0, 29.0, 61.0, 90.0, 127.0, 165.0, 298.0, 445.0, 760.0, 1339.0, 2495.0, 4737.0, 10565.0, 26543.0, 79723.0, 372464.0, 3268576.0, 309986.0, 71362.0, 24352.0, 9928.0, 4515.0, 2311.0, 1270.0, 776.0, 433.0, 266.0, 183.0, 118.0, 81.0, 65.0, 43.0, 18.0, 18.0, 19.0, 11.0, 6.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0234375, -4.86865234375, -4.7138671875, -4.55908203125, -4.404296875, -4.24951171875, -4.0947265625, -3.93994140625, -3.78515625, -3.63037109375, -3.4755859375, -3.32080078125, -3.166015625, -3.01123046875, -2.8564453125, -2.70166015625, -2.546875, -2.39208984375, -2.2373046875, -2.08251953125, -1.927734375, -1.77294921875, -1.6181640625, -1.46337890625, -1.30859375, -1.15380859375, -0.9990234375, -0.84423828125, -0.689453125, -0.53466796875, -0.3798828125, -0.22509765625, -0.0703125, 0.08447265625, 0.2392578125, 0.39404296875, 0.548828125, 0.70361328125, 0.8583984375, 1.01318359375, 1.16796875, 1.32275390625, 1.4775390625, 1.63232421875, 1.787109375, 1.94189453125, 2.0966796875, 2.25146484375, 2.40625, 2.56103515625, 2.7158203125, 2.87060546875, 3.025390625, 3.18017578125, 3.3349609375, 3.48974609375, 3.64453125, 3.79931640625, 3.9541015625, 4.10888671875, 4.263671875, 4.41845703125, 4.5732421875, 4.72802734375, 4.8828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 15.0, 25.0, 39.0, 51.0, 72.0, 109.0, 174.0, 403.0, 1709.0, 755.0, 273.0, 155.0, 83.0, 46.0, 35.0, 37.0, 17.0, 13.0, 4.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.705322265625, -2.62744140625, -2.549560546875, -2.4716796875, -2.393798828125, -2.31591796875, -2.238037109375, -2.16015625, -2.082275390625, -2.00439453125, -1.926513671875, -1.8486328125, -1.770751953125, -1.69287109375, -1.614990234375, -1.537109375, -1.459228515625, -1.38134765625, -1.303466796875, -1.2255859375, -1.147705078125, -1.06982421875, -0.991943359375, -0.9140625, -0.836181640625, -0.75830078125, -0.680419921875, -0.6025390625, -0.524658203125, -0.44677734375, -0.368896484375, -0.291015625, -0.213134765625, -0.13525390625, -0.057373046875, 0.0205078125, 0.098388671875, 0.17626953125, 0.254150390625, 0.33203125, 0.409912109375, 0.48779296875, 0.565673828125, 0.6435546875, 0.721435546875, 0.79931640625, 0.877197265625, 0.955078125, 1.032958984375, 1.11083984375, 1.188720703125, 1.2666015625, 1.344482421875, 1.42236328125, 1.500244140625, 1.578125, 1.656005859375, 1.73388671875, 1.811767578125, 1.8896484375, 1.967529296875, 2.04541015625, 2.123291015625, 2.201171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 30.0, 80.0, 171.0, 237.0, 230.0, 137.0, 60.0, 18.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.856782913208008, -29.00043296813965, -28.14408302307129, -27.28773307800293, -26.431381225585938, -25.575031280517578, -24.71868133544922, -23.86233139038086, -23.0059814453125, -22.14963150024414, -21.29328155517578, -20.436931610107422, -19.580581665039062, -18.724231719970703, -17.86787986755371, -17.01152992248535, -16.155179977416992, -15.298830032348633, -14.442480087280273, -13.586129188537598, -12.729779243469238, -11.873429298400879, -11.017078399658203, -10.160728454589844, -9.304378509521484, -8.448028564453125, -7.591678142547607, -6.73532772064209, -5.8789777755737305, -5.022627830505371, -4.1662774085998535, -3.309926986694336, -2.4535751342773438, -1.5972249507904053, -0.7408747673034668, 0.11547541618347168, 0.9718255996704102, 1.8281755447387695, 2.684525966644287, 3.5408763885498047, 4.397226333618164, 5.253576278686523, 6.109926700592041, 6.966277122497559, 7.822627067565918, 8.678977012634277, 9.535327911376953, 10.391677856445312, 11.248027801513672, 12.104377746582031, 12.96072769165039, 13.817078590393066, 14.673428535461426, 15.529778480529785, 16.38612937927246, 17.24247932434082, 18.09882926940918, 18.95517921447754, 19.8115291595459, 20.667879104614258, 21.52423095703125, 22.38058090209961, 23.23693084716797, 24.093280792236328, 24.949630737304688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 2.0, 11.0, 19.0, 17.0, 24.0, 22.0, 32.0, 29.0, 43.0, 35.0, 47.0, 38.0, 63.0, 52.0, 47.0, 48.0, 48.0, 56.0, 35.0, 41.0, 45.0, 33.0, 32.0, 33.0, 26.0, 20.0, 19.0, 17.0, 11.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.195155143737793, -7.932441234588623, -7.669727325439453, -7.407013893127441, -7.1442999839782715, -6.881586074829102, -6.61887264251709, -6.35615873336792, -6.09344482421875, -5.83073091506958, -5.56801700592041, -5.305303573608398, -5.0425896644592285, -4.779875755310059, -4.517162322998047, -4.254448413848877, -3.991734504699707, -3.729020595550537, -3.4663069248199463, -3.2035932540893555, -2.9408793449401855, -2.6781654357910156, -2.415451765060425, -2.152738094329834, -1.890024185180664, -1.6273103952407837, -1.3645966053009033, -1.101882815361023, -0.8391690254211426, -0.5764552354812622, -0.31374144554138184, -0.051027655601501465, 0.2116870880126953, 0.4744008779525757, 0.737114667892456, 0.9998284578323364, 1.2625422477722168, 1.5252560377120972, 1.7879698276519775, 2.0506834983825684, 2.3133974075317383, 2.576111316680908, 2.838824987411499, 3.10153865814209, 3.3642525672912598, 3.6269664764404297, 3.8896801471710205, 4.152393817901611, 4.415107727050781, 4.677821636199951, 4.940535545349121, 5.203248977661133, 5.465962886810303, 5.728676795959473, 5.991390228271484, 6.254104137420654, 6.516818046569824, 6.779531955718994, 7.042245864868164, 7.304959297180176, 7.567673206329346, 7.830387115478516, 8.093100547790527, 8.355814933776855, 8.618528366088867]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 8.0, 19.0, 18.0, 20.0, 35.0, 51.0, 88.0, 122.0, 223.0, 342.0, 608.0, 1307.0, 2633.0, 5583.0, 13045.0, 32509.0, 88298.0, 278579.0, 413352.0, 132316.0, 46381.0, 18195.0, 7632.0, 3457.0, 1757.0, 847.0, 435.0, 250.0, 135.0, 98.0, 68.0, 49.0, 25.0, 21.0, 9.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.87591552734375, -4.7088623046875, -4.54180908203125, -4.374755859375, -4.20770263671875, -4.0406494140625, -3.87359619140625, -3.70654296875, -3.53948974609375, -3.3724365234375, -3.20538330078125, -3.038330078125, -2.87127685546875, -2.7042236328125, -2.53717041015625, -2.3701171875, -2.20306396484375, -2.0360107421875, -1.86895751953125, -1.701904296875, -1.53485107421875, -1.3677978515625, -1.20074462890625, -1.03369140625, -0.86663818359375, -0.6995849609375, -0.53253173828125, -0.365478515625, -0.19842529296875, -0.0313720703125, 0.13568115234375, 0.302734375, 0.46978759765625, 0.6368408203125, 0.80389404296875, 0.970947265625, 1.13800048828125, 1.3050537109375, 1.47210693359375, 1.63916015625, 1.80621337890625, 1.9732666015625, 2.14031982421875, 2.307373046875, 2.47442626953125, 2.6414794921875, 2.80853271484375, 2.9755859375, 3.14263916015625, 3.3096923828125, 3.47674560546875, 3.643798828125, 3.81085205078125, 3.9779052734375, 4.14495849609375, 4.31201171875, 4.47906494140625, 4.6461181640625, 4.81317138671875, 4.980224609375, 5.14727783203125, 5.3143310546875, 5.48138427734375, 5.6484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 6.0, 10.0, 13.0, 16.0, 11.0, 21.0, 21.0, 23.0, 31.0, 33.0, 44.0, 52.0, 61.0, 76.0, 56.0, 62.0, 57.0, 61.0, 55.0, 44.0, 41.0, 39.0, 40.0, 35.0, 19.0, 20.0, 8.0, 13.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.898040771484375, -0.86541748046875, -0.832794189453125, -0.8001708984375, -0.767547607421875, -0.73492431640625, -0.702301025390625, -0.669677734375, -0.637054443359375, -0.60443115234375, -0.571807861328125, -0.5391845703125, -0.506561279296875, -0.47393798828125, -0.441314697265625, -0.40869140625, -0.376068115234375, -0.34344482421875, -0.310821533203125, -0.2781982421875, -0.245574951171875, -0.21295166015625, -0.180328369140625, -0.147705078125, -0.115081787109375, -0.08245849609375, -0.049835205078125, -0.0172119140625, 0.015411376953125, 0.04803466796875, 0.080657958984375, 0.11328125, 0.145904541015625, 0.17852783203125, 0.211151123046875, 0.2437744140625, 0.276397705078125, 0.30902099609375, 0.341644287109375, 0.374267578125, 0.406890869140625, 0.43951416015625, 0.472137451171875, 0.5047607421875, 0.537384033203125, 0.57000732421875, 0.602630615234375, 0.63525390625, 0.667877197265625, 0.70050048828125, 0.733123779296875, 0.7657470703125, 0.798370361328125, 0.83099365234375, 0.863616943359375, 0.896240234375, 0.928863525390625, 0.96148681640625, 0.994110107421875, 1.0267333984375, 1.059356689453125, 1.09197998046875, 1.124603271484375, 1.1572265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 13.0, 10.0, 11.0, 15.0, 34.0, 33.0, 54.0, 75.0, 111.0, 196.0, 346.0, 583.0, 1245.0, 3311.0, 13385.0, 79009.0, 573452.0, 319610.0, 43967.0, 8559.0, 2387.0, 963.0, 434.0, 240.0, 161.0, 109.0, 81.0, 32.0, 30.0, 18.0, 15.0, 14.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.89306640625, -6.6455078125, -6.39794921875, -6.150390625, -5.90283203125, -5.6552734375, -5.40771484375, -5.16015625, -4.91259765625, -4.6650390625, -4.41748046875, -4.169921875, -3.92236328125, -3.6748046875, -3.42724609375, -3.1796875, -2.93212890625, -2.6845703125, -2.43701171875, -2.189453125, -1.94189453125, -1.6943359375, -1.44677734375, -1.19921875, -0.95166015625, -0.7041015625, -0.45654296875, -0.208984375, 0.03857421875, 0.2861328125, 0.53369140625, 0.78125, 1.02880859375, 1.2763671875, 1.52392578125, 1.771484375, 2.01904296875, 2.2666015625, 2.51416015625, 2.76171875, 3.00927734375, 3.2568359375, 3.50439453125, 3.751953125, 3.99951171875, 4.2470703125, 4.49462890625, 4.7421875, 4.98974609375, 5.2373046875, 5.48486328125, 5.732421875, 5.97998046875, 6.2275390625, 6.47509765625, 6.72265625, 6.97021484375, 7.2177734375, 7.46533203125, 7.712890625, 7.96044921875, 8.2080078125, 8.45556640625, 8.703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 5.0, 10.0, 7.0, 12.0, 11.0, 15.0, 16.0, 21.0, 35.0, 32.0, 30.0, 30.0, 53.0, 44.0, 49.0, 61.0, 54.0, 45.0, 57.0, 42.0, 60.0, 33.0, 41.0, 48.0, 34.0, 29.0, 16.0, 28.0, 11.0, 16.0, 17.0, 11.0, 4.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.222412109375, -4.07763671875, -3.932861328125, -3.7880859375, -3.643310546875, -3.49853515625, -3.353759765625, -3.208984375, -3.064208984375, -2.91943359375, -2.774658203125, -2.6298828125, -2.485107421875, -2.34033203125, -2.195556640625, -2.05078125, -1.906005859375, -1.76123046875, -1.616455078125, -1.4716796875, -1.326904296875, -1.18212890625, -1.037353515625, -0.892578125, -0.747802734375, -0.60302734375, -0.458251953125, -0.3134765625, -0.168701171875, -0.02392578125, 0.120849609375, 0.265625, 0.410400390625, 0.55517578125, 0.699951171875, 0.8447265625, 0.989501953125, 1.13427734375, 1.279052734375, 1.423828125, 1.568603515625, 1.71337890625, 1.858154296875, 2.0029296875, 2.147705078125, 2.29248046875, 2.437255859375, 2.58203125, 2.726806640625, 2.87158203125, 3.016357421875, 3.1611328125, 3.305908203125, 3.45068359375, 3.595458984375, 3.740234375, 3.885009765625, 4.02978515625, 4.174560546875, 4.3193359375, 4.464111328125, 4.60888671875, 4.753662109375, 4.8984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 5.0, 17.0, 15.0, 34.0, 40.0, 60.0, 99.0, 130.0, 219.0, 448.0, 1001.0, 2514.0, 9453.0, 84466.0, 836295.0, 98544.0, 10387.0, 2634.0, 1051.0, 480.0, 241.0, 141.0, 93.0, 44.0, 42.0, 30.0, 19.0, 13.0, 6.0, 6.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58203125, -7.29620361328125, -7.0103759765625, -6.72454833984375, -6.438720703125, -6.15289306640625, -5.8670654296875, -5.58123779296875, -5.29541015625, -5.00958251953125, -4.7237548828125, -4.43792724609375, -4.152099609375, -3.86627197265625, -3.5804443359375, -3.29461669921875, -3.0087890625, -2.72296142578125, -2.4371337890625, -2.15130615234375, -1.865478515625, -1.57965087890625, -1.2938232421875, -1.00799560546875, -0.72216796875, -0.43634033203125, -0.1505126953125, 0.13531494140625, 0.421142578125, 0.70697021484375, 0.9927978515625, 1.27862548828125, 1.564453125, 1.85028076171875, 2.1361083984375, 2.42193603515625, 2.707763671875, 2.99359130859375, 3.2794189453125, 3.56524658203125, 3.85107421875, 4.13690185546875, 4.4227294921875, 4.70855712890625, 4.994384765625, 5.28021240234375, 5.5660400390625, 5.85186767578125, 6.1376953125, 6.42352294921875, 6.7093505859375, 6.99517822265625, 7.281005859375, 7.56683349609375, 7.8526611328125, 8.13848876953125, 8.42431640625, 8.71014404296875, 8.9959716796875, 9.28179931640625, 9.567626953125, 9.85345458984375, 10.1392822265625, 10.42510986328125, 10.7109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 13.0, 12.0, 17.0, 24.0, 43.0, 41.0, 61.0, 134.0, 141.0, 142.0, 91.0, 43.0, 45.0, 29.0, 19.0, 19.0, 21.0, 10.0, 6.0, 10.0, 3.0, 8.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008206367492675781, -0.0007954463362693787, -0.0007702559232711792, -0.0007450655102729797, -0.0007198750972747803, -0.0006946846842765808, -0.0006694942712783813, -0.0006443038582801819, -0.0006191134452819824, -0.000593923032283783, -0.0005687326192855835, -0.000543542206287384, -0.0005183517932891846, -0.0004931613802909851, -0.00046797096729278564, -0.0004427805542945862, -0.0004175901412963867, -0.00039239972829818726, -0.0003672093152999878, -0.00034201890230178833, -0.00031682848930358887, -0.0002916380763053894, -0.00026644766330718994, -0.00024125725030899048, -0.00021606683731079102, -0.00019087642431259155, -0.0001656860113143921, -0.00014049559831619263, -0.00011530518531799316, -9.01147723197937e-05, -6.492435932159424e-05, -3.9733946323394775e-05, -1.4543533325195312e-05, 1.064687967300415e-05, 3.583729267120361e-05, 6.1027705669403076e-05, 8.621811866760254e-05, 0.000111408531665802, 0.00013659894466400146, 0.00016178935766220093, 0.0001869797706604004, 0.00021217018365859985, 0.00023736059665679932, 0.0002625510096549988, 0.00028774142265319824, 0.0003129318356513977, 0.00033812224864959717, 0.00036331266164779663, 0.0003885030746459961, 0.00041369348764419556, 0.000438883900642395, 0.0004640743136405945, 0.0004892647266387939, 0.0005144551396369934, 0.0005396455526351929, 0.0005648359656333923, 0.0005900263786315918, 0.0006152167916297913, 0.0006404072046279907, 0.0006655976176261902, 0.0006907880306243896, 0.0007159784436225891, 0.0007411688566207886, 0.000766359269618988, 0.0007915496826171875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 27.0, 32.0, 74.0, 124.0, 284.0, 772.0, 2704.0, 15629.0, 792614.0, 225289.0, 8176.0, 1681.0, 621.0, 235.0, 121.0, 56.0, 26.0, 18.0, 16.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.015625, -15.592529296875, -15.16943359375, -14.746337890625, -14.3232421875, -13.900146484375, -13.47705078125, -13.053955078125, -12.630859375, -12.207763671875, -11.78466796875, -11.361572265625, -10.9384765625, -10.515380859375, -10.09228515625, -9.669189453125, -9.24609375, -8.822998046875, -8.39990234375, -7.976806640625, -7.5537109375, -7.130615234375, -6.70751953125, -6.284423828125, -5.861328125, -5.438232421875, -5.01513671875, -4.592041015625, -4.1689453125, -3.745849609375, -3.32275390625, -2.899658203125, -2.4765625, -2.053466796875, -1.63037109375, -1.207275390625, -0.7841796875, -0.361083984375, 0.06201171875, 0.485107421875, 0.908203125, 1.331298828125, 1.75439453125, 2.177490234375, 2.6005859375, 3.023681640625, 3.44677734375, 3.869873046875, 4.29296875, 4.716064453125, 5.13916015625, 5.562255859375, 5.9853515625, 6.408447265625, 6.83154296875, 7.254638671875, 7.677734375, 8.100830078125, 8.52392578125, 8.947021484375, 9.3701171875, 9.793212890625, 10.21630859375, 10.639404296875, 11.0625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 7.0, 18.0, 21.0, 32.0, 71.0, 96.0, 130.0, 168.0, 135.0, 95.0, 69.0, 51.0, 29.0, 9.0, 14.0, 5.0, 10.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.33721923828125, -4.1744384765625, -4.01165771484375, -3.848876953125, -3.68609619140625, -3.5233154296875, -3.36053466796875, -3.19775390625, -3.03497314453125, -2.8721923828125, -2.70941162109375, -2.546630859375, -2.38385009765625, -2.2210693359375, -2.05828857421875, -1.8955078125, -1.73272705078125, -1.5699462890625, -1.40716552734375, -1.244384765625, -1.08160400390625, -0.9188232421875, -0.75604248046875, -0.59326171875, -0.43048095703125, -0.2677001953125, -0.10491943359375, 0.057861328125, 0.22064208984375, 0.3834228515625, 0.54620361328125, 0.708984375, 0.87176513671875, 1.0345458984375, 1.19732666015625, 1.360107421875, 1.52288818359375, 1.6856689453125, 1.84844970703125, 2.01123046875, 2.17401123046875, 2.3367919921875, 2.49957275390625, 2.662353515625, 2.82513427734375, 2.9879150390625, 3.15069580078125, 3.3134765625, 3.47625732421875, 3.6390380859375, 3.80181884765625, 3.964599609375, 4.12738037109375, 4.2901611328125, 4.45294189453125, 4.61572265625, 4.77850341796875, 4.9412841796875, 5.10406494140625, 5.266845703125, 5.42962646484375, 5.5924072265625, 5.75518798828125, 5.91796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 13.0, 37.0, 150.0, 317.0, 277.0, 149.0, 39.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.17984008789062, -138.70510864257812, -135.23037719726562, -131.7556610107422, -128.2809295654297, -124.80619812011719, -121.33146667480469, -117.85674285888672, -114.38201141357422, -110.90727996826172, -107.43255615234375, -103.95782470703125, -100.48310089111328, -97.00836944580078, -93.53364562988281, -90.05891418457031, -86.58418273925781, -83.10945129394531, -79.63472747802734, -76.15999603271484, -72.68527221679688, -69.21054077148438, -65.73580932617188, -62.261085510253906, -58.78636169433594, -55.3116340637207, -51.83690643310547, -48.36217498779297, -44.887447357177734, -41.4127197265625, -37.937992095947266, -34.46326446533203, -30.98853302001953, -27.513805389404297, -24.03907585144043, -20.564348220825195, -17.089618682861328, -13.614891052246094, -10.14016342163086, -6.665433883666992, -3.190706253051758, 0.28402209281921387, 3.7587504386901855, 7.233478546142578, 10.708207130432129, 14.18293571472168, 17.657663345336914, 21.13239288330078, 24.607120513916016, 28.08184814453125, 31.556577682495117, 35.03130340576172, 38.50603485107422, 41.98076248168945, 45.45549011230469, 48.93022155761719, 52.404945373535156, 55.87967300415039, 59.354400634765625, 62.829132080078125, 66.3038558959961, 69.7785873413086, 73.25331115722656, 76.72804260253906, 80.20277404785156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 13.0, 10.0, 14.0, 8.0, 25.0, 23.0, 18.0, 24.0, 22.0, 34.0, 24.0, 35.0, 30.0, 54.0, 40.0, 42.0, 43.0, 45.0, 39.0, 45.0, 45.0, 33.0, 45.0, 31.0, 23.0, 32.0, 28.0, 15.0, 16.0, 18.0, 11.0, 12.0, 16.0, 20.0, 7.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.59099769592285, -21.890220642089844, -21.189443588256836, -20.488666534423828, -19.78788948059082, -19.087112426757812, -18.386335372924805, -17.685558319091797, -16.98478126525879, -16.28400421142578, -15.583227157592773, -14.882450103759766, -14.181673049926758, -13.48089599609375, -12.780118942260742, -12.079341888427734, -11.378564834594727, -10.677787780761719, -9.977010726928711, -9.276233673095703, -8.575456619262695, -7.8746795654296875, -7.17390251159668, -6.473125457763672, -5.772348403930664, -5.071571350097656, -4.370794296264648, -3.6700172424316406, -2.969240188598633, -2.268463134765625, -1.5676860809326172, -0.8669090270996094, -0.16613388061523438, 0.5346431732177734, 1.2354202270507812, 1.936197280883789, 2.636974334716797, 3.3377513885498047, 4.0385284423828125, 4.73930549621582, 5.440082550048828, 6.140859603881836, 6.841636657714844, 7.542413711547852, 8.24319076538086, 8.943967819213867, 9.644744873046875, 10.345521926879883, 11.04629898071289, 11.747076034545898, 12.447853088378906, 13.148630142211914, 13.849407196044922, 14.55018424987793, 15.250961303710938, 15.951738357543945, 16.652515411376953, 17.35329246520996, 18.05406951904297, 18.754846572875977, 19.455623626708984, 20.156400680541992, 20.857177734375, 21.557954788208008, 22.258731842041016]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 20.0, 24.0, 24.0, 50.0, 67.0, 135.0, 213.0, 387.0, 696.0, 1410.0, 3332.0, 8569.0, 26686.0, 118018.0, 3131608.0, 794106.0, 77981.0, 19704.0, 6503.0, 2466.0, 1111.0, 503.0, 283.0, 144.0, 85.0, 46.0, 30.0, 27.0, 14.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -3.97454833984375, -3.7928466796875, -3.61114501953125, -3.429443359375, -3.24774169921875, -3.0660400390625, -2.88433837890625, -2.70263671875, -2.52093505859375, -2.3392333984375, -2.15753173828125, -1.975830078125, -1.79412841796875, -1.6124267578125, -1.43072509765625, -1.2490234375, -1.06732177734375, -0.8856201171875, -0.70391845703125, -0.522216796875, -0.34051513671875, -0.1588134765625, 0.02288818359375, 0.20458984375, 0.38629150390625, 0.5679931640625, 0.74969482421875, 0.931396484375, 1.11309814453125, 1.2947998046875, 1.47650146484375, 1.658203125, 1.83990478515625, 2.0216064453125, 2.20330810546875, 2.385009765625, 2.56671142578125, 2.7484130859375, 2.93011474609375, 3.11181640625, 3.29351806640625, 3.4752197265625, 3.65692138671875, 3.838623046875, 4.02032470703125, 4.2020263671875, 4.38372802734375, 4.5654296875, 4.74713134765625, 4.9288330078125, 5.11053466796875, 5.292236328125, 5.47393798828125, 5.6556396484375, 5.83734130859375, 6.01904296875, 6.20074462890625, 6.3824462890625, 6.56414794921875, 6.745849609375, 6.92755126953125, 7.1092529296875, 7.29095458984375, 7.47265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 5.0, 8.0, 12.0, 5.0, 18.0, 27.0, 15.0, 31.0, 42.0, 46.0, 62.0, 52.0, 56.0, 55.0, 62.0, 67.0, 51.0, 56.0, 59.0, 50.0, 49.0, 38.0, 25.0, 35.0, 13.0, 12.0, 10.0, 4.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -1.0113372802734375, -0.974822998046875, -0.9383087158203125, -0.90179443359375, -0.8652801513671875, -0.828765869140625, -0.7922515869140625, -0.7557373046875, -0.7192230224609375, -0.682708740234375, -0.6461944580078125, -0.60968017578125, -0.5731658935546875, -0.536651611328125, -0.5001373291015625, -0.463623046875, -0.4271087646484375, -0.390594482421875, -0.3540802001953125, -0.31756591796875, -0.2810516357421875, -0.244537353515625, -0.2080230712890625, -0.1715087890625, -0.1349945068359375, -0.098480224609375, -0.0619659423828125, -0.02545166015625, 0.0110626220703125, 0.047576904296875, 0.0840911865234375, 0.12060546875, 0.1571197509765625, 0.193634033203125, 0.2301483154296875, 0.26666259765625, 0.3031768798828125, 0.339691162109375, 0.3762054443359375, 0.4127197265625, 0.4492340087890625, 0.485748291015625, 0.5222625732421875, 0.55877685546875, 0.5952911376953125, 0.631805419921875, 0.6683197021484375, 0.704833984375, 0.7413482666015625, 0.777862548828125, 0.8143768310546875, 0.85089111328125, 0.8874053955078125, 0.923919677734375, 0.9604339599609375, 0.9969482421875, 1.0334625244140625, 1.069976806640625, 1.1064910888671875, 1.14300537109375, 1.1795196533203125, 1.216033935546875, 1.2525482177734375, 1.2890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 9.0, 16.0, 24.0, 30.0, 48.0, 72.0, 124.0, 211.0, 333.0, 607.0, 1049.0, 1938.0, 3647.0, 7759.0, 17973.0, 49154.0, 177594.0, 2260314.0, 1437548.0, 158003.0, 45190.0, 17102.0, 7528.0, 3657.0, 1790.0, 1022.0, 559.0, 317.0, 208.0, 151.0, 103.0, 62.0, 50.0, 19.0, 27.0, 5.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.05859375, -4.91387939453125, -4.7691650390625, -4.62445068359375, -4.479736328125, -4.33502197265625, -4.1903076171875, -4.04559326171875, -3.90087890625, -3.75616455078125, -3.6114501953125, -3.46673583984375, -3.322021484375, -3.17730712890625, -3.0325927734375, -2.88787841796875, -2.7431640625, -2.59844970703125, -2.4537353515625, -2.30902099609375, -2.164306640625, -2.01959228515625, -1.8748779296875, -1.73016357421875, -1.58544921875, -1.44073486328125, -1.2960205078125, -1.15130615234375, -1.006591796875, -0.86187744140625, -0.7171630859375, -0.57244873046875, -0.427734375, -0.28302001953125, -0.1383056640625, 0.00640869140625, 0.151123046875, 0.29583740234375, 0.4405517578125, 0.58526611328125, 0.72998046875, 0.87469482421875, 1.0194091796875, 1.16412353515625, 1.308837890625, 1.45355224609375, 1.5982666015625, 1.74298095703125, 1.8876953125, 2.03240966796875, 2.1771240234375, 2.32183837890625, 2.466552734375, 2.61126708984375, 2.7559814453125, 2.90069580078125, 3.04541015625, 3.19012451171875, 3.3348388671875, 3.47955322265625, 3.624267578125, 3.76898193359375, 3.9136962890625, 4.05841064453125, 4.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 21.0, 19.0, 25.0, 40.0, 42.0, 84.0, 129.0, 192.0, 345.0, 1015.0, 1057.0, 395.0, 193.0, 140.0, 95.0, 57.0, 33.0, 32.0, 22.0, 18.0, 12.0, 16.0, 12.0, 10.0, 3.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.060546875, -1.991973876953125, -1.92340087890625, -1.854827880859375, -1.7862548828125, -1.717681884765625, -1.64910888671875, -1.580535888671875, -1.511962890625, -1.443389892578125, -1.37481689453125, -1.306243896484375, -1.2376708984375, -1.169097900390625, -1.10052490234375, -1.031951904296875, -0.96337890625, -0.894805908203125, -0.82623291015625, -0.757659912109375, -0.6890869140625, -0.620513916015625, -0.55194091796875, -0.483367919921875, -0.414794921875, -0.346221923828125, -0.27764892578125, -0.209075927734375, -0.1405029296875, -0.071929931640625, -0.00335693359375, 0.065216064453125, 0.1337890625, 0.202362060546875, 0.27093505859375, 0.339508056640625, 0.4080810546875, 0.476654052734375, 0.54522705078125, 0.613800048828125, 0.682373046875, 0.750946044921875, 0.81951904296875, 0.888092041015625, 0.9566650390625, 1.025238037109375, 1.09381103515625, 1.162384033203125, 1.23095703125, 1.299530029296875, 1.36810302734375, 1.436676025390625, 1.5052490234375, 1.573822021484375, 1.64239501953125, 1.710968017578125, 1.779541015625, 1.848114013671875, 1.91668701171875, 1.985260009765625, 2.0538330078125, 2.122406005859375, 2.19097900390625, 2.259552001953125, 2.328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 17.0, 50.0, 87.0, 164.0, 207.0, 212.0, 127.0, 62.0, 31.0, 20.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.24348258972168, -21.3341121673584, -20.424741744995117, -19.515371322631836, -18.606000900268555, -17.696630477905273, -16.787261962890625, -15.877890586853027, -14.968520164489746, -14.059149742126465, -13.149779319763184, -12.240409851074219, -11.331039428710938, -10.421669006347656, -9.512298583984375, -8.602928161621094, -7.6935577392578125, -6.784187316894531, -5.87481689453125, -4.965446949005127, -4.056076526641846, -3.1467061042785645, -2.2373361587524414, -1.3279657363891602, -0.4185953140258789, 0.4907749891281128, 1.4001452922821045, 2.3095154762268066, 3.218885898590088, 4.128256320953369, 5.037626266479492, 5.946996688842773, 6.856365203857422, 7.765735626220703, 8.675106048583984, 9.584476470947266, 10.493846893310547, 11.403217315673828, 12.312586784362793, 13.221957206726074, 14.131327629089355, 15.040698051452637, 15.950068473815918, 16.859437942504883, 17.768808364868164, 18.678178787231445, 19.587549209594727, 20.496919631958008, 21.40629005432129, 22.31566047668457, 23.22503089904785, 24.134401321411133, 25.043771743774414, 25.953142166137695, 26.862510681152344, 27.771881103515625, 28.681251525878906, 29.590621948242188, 30.49999237060547, 31.40936279296875, 32.31873321533203, 33.22810363769531, 34.137474060058594, 35.046844482421875, 35.956214904785156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 4.0, 8.0, 15.0, 11.0, 16.0, 19.0, 25.0, 29.0, 34.0, 30.0, 36.0, 44.0, 37.0, 46.0, 45.0, 51.0, 53.0, 36.0, 39.0, 44.0, 39.0, 46.0, 35.0, 31.0, 36.0, 31.0, 26.0, 22.0, 16.0, 28.0, 14.0, 7.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203773498535156, -8.894710540771484, -8.585647583007812, -8.27658462524414, -7.967521667480469, -7.658458709716797, -7.349395751953125, -7.040332794189453, -6.731269836425781, -6.422206878662109, -6.1131439208984375, -5.804080963134766, -5.495018005371094, -5.185955047607422, -4.87689208984375, -4.567829132080078, -4.258766174316406, -3.9497032165527344, -3.6406402587890625, -3.3315773010253906, -3.0225143432617188, -2.713451385498047, -2.404388427734375, -2.095325469970703, -1.7862625122070312, -1.4771995544433594, -1.1681365966796875, -0.8590736389160156, -0.5500106811523438, -0.24094772338867188, 0.068115234375, 0.3771781921386719, 0.6862411499023438, 0.9953041076660156, 1.3043670654296875, 1.6134300231933594, 1.9224929809570312, 2.231555938720703, 2.540618896484375, 2.849681854248047, 3.1587448120117188, 3.4678077697753906, 3.7768707275390625, 4.085933685302734, 4.394996643066406, 4.704059600830078, 5.01312255859375, 5.322185516357422, 5.631248474121094, 5.940311431884766, 6.2493743896484375, 6.558437347412109, 6.867500305175781, 7.176563262939453, 7.485626220703125, 7.794689178466797, 8.103752136230469, 8.41281509399414, 8.721878051757812, 9.030941009521484, 9.340003967285156, 9.649066925048828, 9.9581298828125, 10.267192840576172, 10.576255798339844]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 19.0, 15.0, 22.0, 28.0, 44.0, 95.0, 127.0, 274.0, 420.0, 778.0, 1505.0, 3078.0, 6518.0, 15613.0, 39708.0, 118723.0, 645624.0, 139889.0, 44807.0, 17224.0, 7245.0, 3201.0, 1594.0, 850.0, 515.0, 257.0, 129.0, 92.0, 57.0, 35.0, 21.0, 21.0, 5.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.41998291015625, -6.2227783203125, -6.02557373046875, -5.828369140625, -5.63116455078125, -5.4339599609375, -5.23675537109375, -5.03955078125, -4.84234619140625, -4.6451416015625, -4.44793701171875, -4.250732421875, -4.05352783203125, -3.8563232421875, -3.65911865234375, -3.4619140625, -3.26470947265625, -3.0675048828125, -2.87030029296875, -2.673095703125, -2.47589111328125, -2.2786865234375, -2.08148193359375, -1.88427734375, -1.68707275390625, -1.4898681640625, -1.29266357421875, -1.095458984375, -0.89825439453125, -0.7010498046875, -0.50384521484375, -0.306640625, -0.10943603515625, 0.0877685546875, 0.28497314453125, 0.482177734375, 0.67938232421875, 0.8765869140625, 1.07379150390625, 1.27099609375, 1.46820068359375, 1.6654052734375, 1.86260986328125, 2.059814453125, 2.25701904296875, 2.4542236328125, 2.65142822265625, 2.8486328125, 3.04583740234375, 3.2430419921875, 3.44024658203125, 3.637451171875, 3.83465576171875, 4.0318603515625, 4.22906494140625, 4.42626953125, 4.62347412109375, 4.8206787109375, 5.01788330078125, 5.215087890625, 5.41229248046875, 5.6094970703125, 5.80670166015625, 6.00390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 8.0, 10.0, 18.0, 19.0, 19.0, 18.0, 35.0, 30.0, 39.0, 46.0, 54.0, 58.0, 52.0, 46.0, 64.0, 61.0, 50.0, 63.0, 48.0, 40.0, 32.0, 28.0, 25.0, 23.0, 19.0, 20.0, 11.0, 7.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.861358642578125, -0.82720947265625, -0.793060302734375, -0.7589111328125, -0.724761962890625, -0.69061279296875, -0.656463623046875, -0.622314453125, -0.588165283203125, -0.55401611328125, -0.519866943359375, -0.4857177734375, -0.451568603515625, -0.41741943359375, -0.383270263671875, -0.34912109375, -0.314971923828125, -0.28082275390625, -0.246673583984375, -0.2125244140625, -0.178375244140625, -0.14422607421875, -0.110076904296875, -0.075927734375, -0.041778564453125, -0.00762939453125, 0.026519775390625, 0.0606689453125, 0.094818115234375, 0.12896728515625, 0.163116455078125, 0.197265625, 0.231414794921875, 0.26556396484375, 0.299713134765625, 0.3338623046875, 0.368011474609375, 0.40216064453125, 0.436309814453125, 0.470458984375, 0.504608154296875, 0.53875732421875, 0.572906494140625, 0.6070556640625, 0.641204833984375, 0.67535400390625, 0.709503173828125, 0.74365234375, 0.777801513671875, 0.81195068359375, 0.846099853515625, 0.8802490234375, 0.914398193359375, 0.94854736328125, 0.982696533203125, 1.016845703125, 1.050994873046875, 1.08514404296875, 1.119293212890625, 1.1534423828125, 1.187591552734375, 1.22174072265625, 1.255889892578125, 1.2900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 13.0, 14.0, 18.0, 22.0, 29.0, 44.0, 57.0, 96.0, 138.0, 237.0, 409.0, 737.0, 1600.0, 4537.0, 17995.0, 91339.0, 768581.0, 128274.0, 24610.0, 5853.0, 1879.0, 798.0, 454.0, 279.0, 158.0, 99.0, 73.0, 51.0, 38.0, 31.0, 20.0, 9.0, 6.0, 10.0, 7.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1875, -7.910888671875, -7.63427734375, -7.357666015625, -7.0810546875, -6.804443359375, -6.52783203125, -6.251220703125, -5.974609375, -5.697998046875, -5.42138671875, -5.144775390625, -4.8681640625, -4.591552734375, -4.31494140625, -4.038330078125, -3.76171875, -3.485107421875, -3.20849609375, -2.931884765625, -2.6552734375, -2.378662109375, -2.10205078125, -1.825439453125, -1.548828125, -1.272216796875, -0.99560546875, -0.718994140625, -0.4423828125, -0.165771484375, 0.11083984375, 0.387451171875, 0.6640625, 0.940673828125, 1.21728515625, 1.493896484375, 1.7705078125, 2.047119140625, 2.32373046875, 2.600341796875, 2.876953125, 3.153564453125, 3.43017578125, 3.706787109375, 3.9833984375, 4.260009765625, 4.53662109375, 4.813232421875, 5.08984375, 5.366455078125, 5.64306640625, 5.919677734375, 6.1962890625, 6.472900390625, 6.74951171875, 7.026123046875, 7.302734375, 7.579345703125, 7.85595703125, 8.132568359375, 8.4091796875, 8.685791015625, 8.96240234375, 9.239013671875, 9.515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 7.0, 12.0, 10.0, 27.0, 36.0, 36.0, 51.0, 43.0, 43.0, 61.0, 61.0, 64.0, 43.0, 68.0, 48.0, 53.0, 52.0, 49.0, 41.0, 39.0, 28.0, 32.0, 17.0, 13.0, 10.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.9375, -5.767333984375, -5.59716796875, -5.427001953125, -5.2568359375, -5.086669921875, -4.91650390625, -4.746337890625, -4.576171875, -4.406005859375, -4.23583984375, -4.065673828125, -3.8955078125, -3.725341796875, -3.55517578125, -3.385009765625, -3.21484375, -3.044677734375, -2.87451171875, -2.704345703125, -2.5341796875, -2.364013671875, -2.19384765625, -2.023681640625, -1.853515625, -1.683349609375, -1.51318359375, -1.343017578125, -1.1728515625, -1.002685546875, -0.83251953125, -0.662353515625, -0.4921875, -0.322021484375, -0.15185546875, 0.018310546875, 0.1884765625, 0.358642578125, 0.52880859375, 0.698974609375, 0.869140625, 1.039306640625, 1.20947265625, 1.379638671875, 1.5498046875, 1.719970703125, 1.89013671875, 2.060302734375, 2.23046875, 2.400634765625, 2.57080078125, 2.740966796875, 2.9111328125, 3.081298828125, 3.25146484375, 3.421630859375, 3.591796875, 3.761962890625, 3.93212890625, 4.102294921875, 4.2724609375, 4.442626953125, 4.61279296875, 4.782958984375, 4.953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 20.0, 29.0, 43.0, 58.0, 112.0, 172.0, 302.0, 540.0, 1160.0, 2275.0, 5742.0, 15629.0, 46922.0, 203773.0, 631187.0, 93405.0, 29439.0, 10284.0, 3848.0, 1717.0, 853.0, 411.0, 228.0, 121.0, 71.0, 68.0, 42.0, 28.0, 16.0, 9.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.3428955078125, -3.228759765625, -3.1146240234375, -3.00048828125, -2.8863525390625, -2.772216796875, -2.6580810546875, -2.5439453125, -2.4298095703125, -2.315673828125, -2.2015380859375, -2.08740234375, -1.9732666015625, -1.859130859375, -1.7449951171875, -1.630859375, -1.5167236328125, -1.402587890625, -1.2884521484375, -1.17431640625, -1.0601806640625, -0.946044921875, -0.8319091796875, -0.7177734375, -0.6036376953125, -0.489501953125, -0.3753662109375, -0.26123046875, -0.1470947265625, -0.032958984375, 0.0811767578125, 0.1953125, 0.3094482421875, 0.423583984375, 0.5377197265625, 0.65185546875, 0.7659912109375, 0.880126953125, 0.9942626953125, 1.1083984375, 1.2225341796875, 1.336669921875, 1.4508056640625, 1.56494140625, 1.6790771484375, 1.793212890625, 1.9073486328125, 2.021484375, 2.1356201171875, 2.249755859375, 2.3638916015625, 2.47802734375, 2.5921630859375, 2.706298828125, 2.8204345703125, 2.9345703125, 3.0487060546875, 3.162841796875, 3.2769775390625, 3.39111328125, 3.5052490234375, 3.619384765625, 3.7335205078125, 3.84765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 9.0, 3.0, 5.0, 13.0, 4.0, 10.0, 8.0, 14.0, 22.0, 22.0, 32.0, 51.0, 122.0, 326.0, 148.0, 55.0, 28.0, 36.0, 17.0, 10.0, 8.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010080337524414062, -0.0009760856628417969, -0.0009441375732421875, -0.0009121894836425781, -0.0008802413940429688, -0.0008482933044433594, -0.00081634521484375, -0.0007843971252441406, -0.0007524490356445312, -0.0007205009460449219, -0.0006885528564453125, -0.0006566047668457031, -0.0006246566772460938, -0.0005927085876464844, -0.000560760498046875, -0.0005288124084472656, -0.0004968643188476562, -0.0004649162292480469, -0.0004329681396484375, -0.0004010200500488281, -0.00036907196044921875, -0.0003371238708496094, -0.00030517578125, -0.0002732276916503906, -0.00024127960205078125, -0.00020933151245117188, -0.0001773834228515625, -0.00014543533325195312, -0.00011348724365234375, -8.153915405273438e-05, -4.9591064453125e-05, -1.7642974853515625e-05, 1.430511474609375e-05, 4.6253204345703125e-05, 7.82012939453125e-05, 0.00011014938354492188, 0.00014209747314453125, 0.00017404556274414062, 0.00020599365234375, 0.00023794174194335938, 0.00026988983154296875, 0.0003018379211425781, 0.0003337860107421875, 0.0003657341003417969, 0.00039768218994140625, 0.0004296302795410156, 0.000461578369140625, 0.0004935264587402344, 0.0005254745483398438, 0.0005574226379394531, 0.0005893707275390625, 0.0006213188171386719, 0.0006532669067382812, 0.0006852149963378906, 0.0007171630859375, 0.0007491111755371094, 0.0007810592651367188, 0.0008130073547363281, 0.0008449554443359375, 0.0008769035339355469, 0.0009088516235351562, 0.0009407997131347656, 0.000972747802734375, 0.0010046958923339844, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 9.0, 7.0, 19.0, 23.0, 34.0, 62.0, 105.0, 117.0, 264.0, 560.0, 1469.0, 5220.0, 31444.0, 350213.0, 606255.0, 43164.0, 6534.0, 1666.0, 649.0, 306.0, 163.0, 89.0, 56.0, 30.0, 21.0, 16.0, 10.0, 10.0, 5.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.34246826171875, -4.1693115234375, -3.99615478515625, -3.822998046875, -3.64984130859375, -3.4766845703125, -3.30352783203125, -3.13037109375, -2.95721435546875, -2.7840576171875, -2.61090087890625, -2.437744140625, -2.26458740234375, -2.0914306640625, -1.91827392578125, -1.7451171875, -1.57196044921875, -1.3988037109375, -1.22564697265625, -1.052490234375, -0.87933349609375, -0.7061767578125, -0.53302001953125, -0.35986328125, -0.18670654296875, -0.0135498046875, 0.15960693359375, 0.332763671875, 0.50592041015625, 0.6790771484375, 0.85223388671875, 1.025390625, 1.19854736328125, 1.3717041015625, 1.54486083984375, 1.718017578125, 1.89117431640625, 2.0643310546875, 2.23748779296875, 2.41064453125, 2.58380126953125, 2.7569580078125, 2.93011474609375, 3.103271484375, 3.27642822265625, 3.4495849609375, 3.62274169921875, 3.7958984375, 3.96905517578125, 4.1422119140625, 4.31536865234375, 4.488525390625, 4.66168212890625, 4.8348388671875, 5.00799560546875, 5.18115234375, 5.35430908203125, 5.5274658203125, 5.70062255859375, 5.873779296875, 6.04693603515625, 6.2200927734375, 6.39324951171875, 6.56640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 16.0, 3.0, 7.0, 8.0, 9.0, 20.0, 14.0, 28.0, 19.0, 26.0, 41.0, 65.0, 117.0, 134.0, 108.0, 102.0, 69.0, 29.0, 26.0, 22.0, 16.0, 13.0, 21.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.509735107421875, -2.43939208984375, -2.369049072265625, -2.2987060546875, -2.228363037109375, -2.15802001953125, -2.087677001953125, -2.017333984375, -1.946990966796875, -1.87664794921875, -1.806304931640625, -1.7359619140625, -1.665618896484375, -1.59527587890625, -1.524932861328125, -1.45458984375, -1.384246826171875, -1.31390380859375, -1.243560791015625, -1.1732177734375, -1.102874755859375, -1.03253173828125, -0.962188720703125, -0.891845703125, -0.821502685546875, -0.75115966796875, -0.680816650390625, -0.6104736328125, -0.540130615234375, -0.46978759765625, -0.399444580078125, -0.3291015625, -0.258758544921875, -0.18841552734375, -0.118072509765625, -0.0477294921875, 0.022613525390625, 0.09295654296875, 0.163299560546875, 0.233642578125, 0.303985595703125, 0.37432861328125, 0.444671630859375, 0.5150146484375, 0.585357666015625, 0.65570068359375, 0.726043701171875, 0.79638671875, 0.866729736328125, 0.93707275390625, 1.007415771484375, 1.0777587890625, 1.148101806640625, 1.21844482421875, 1.288787841796875, 1.359130859375, 1.429473876953125, 1.49981689453125, 1.570159912109375, 1.6405029296875, 1.710845947265625, 1.78118896484375, 1.851531982421875, 1.921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 13.0, 32.0, 78.0, 180.0, 246.0, 265.0, 107.0, 59.0, 13.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.47672653198242, -35.871986389160156, -33.26724624633789, -30.662508010864258, -28.057769775390625, -25.45302963256836, -22.848289489746094, -20.24355125427246, -17.638811111450195, -15.034071922302246, -12.429332733154297, -9.824592590332031, -7.219853401184082, -4.615114212036133, -2.010374069213867, 0.5943641662597656, 3.1991043090820312, 5.8038434982299805, 8.40858268737793, 11.013322830200195, 13.618062019348145, 16.222801208496094, 18.82754135131836, 21.432279586791992, 24.037019729614258, 26.641759872436523, 29.246498107910156, 31.851238250732422, 34.45597839355469, 37.06071472167969, 39.66545867919922, 42.27019500732422, 44.87493133544922, 47.479671478271484, 50.08441162109375, 52.68914794921875, 55.293888092041016, 57.89862823486328, 60.50336837768555, 63.10810852050781, 65.71284484863281, 68.31758117675781, 70.92232513427734, 73.52706146240234, 76.13180541992188, 78.73654174804688, 81.34127807617188, 83.9460220336914, 86.55076599121094, 89.15550231933594, 91.76024627685547, 94.36498260498047, 96.9697265625, 99.574462890625, 102.17919921875, 104.78394317626953, 107.38867950439453, 109.99341583251953, 112.59815979003906, 115.20289611816406, 117.8076400756836, 120.4123764038086, 123.01712036132812, 125.62185668945312, 128.22659301757812]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 10.0, 16.0, 11.0, 15.0, 13.0, 19.0, 34.0, 24.0, 28.0, 35.0, 34.0, 49.0, 39.0, 49.0, 49.0, 48.0, 46.0, 45.0, 45.0, 37.0, 41.0, 40.0, 34.0, 31.0, 36.0, 24.0, 18.0, 23.0, 20.0, 13.0, 9.0, 12.0, 9.0, 3.0, 7.0, 2.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.024023056030273, -23.28664779663086, -22.549270629882812, -21.8118953704834, -21.074520111083984, -20.337142944335938, -19.599767684936523, -18.86239242553711, -18.125015258789062, -17.38763999938965, -16.6502628326416, -15.912887573242188, -15.175512313842773, -14.438136100769043, -13.700759887695312, -12.963384628295898, -12.226009368896484, -11.488633155822754, -10.75125789642334, -10.01388168334961, -9.276506423950195, -8.539130210876465, -7.801753997802734, -7.064378261566162, -6.32700252532959, -5.589626789093018, -4.852251052856445, -4.114874839782715, -3.3774991035461426, -2.6401233673095703, -1.9027471542358398, -1.1653714179992676, -0.4279975891113281, 0.3093782663345337, 1.0467541217803955, 1.7841300964355469, 2.521505832672119, 3.2588815689086914, 3.996257781982422, 4.733633518218994, 5.471009254455566, 6.208384990692139, 6.945760726928711, 7.683136940002441, 8.420513153076172, 9.157888412475586, 9.895264625549316, 10.632640838623047, 11.370016098022461, 12.107392311096191, 12.844767570495605, 13.582143783569336, 14.31951904296875, 15.05689525604248, 15.794271469116211, 16.531646728515625, 17.269023895263672, 18.006399154663086, 18.743776321411133, 19.481151580810547, 20.21852684020996, 20.955902099609375, 21.693279266357422, 22.430654525756836, 23.16802978515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 11.0, 19.0, 24.0, 29.0, 48.0, 83.0, 153.0, 297.0, 553.0, 1172.0, 2470.0, 6197.0, 17621.0, 65191.0, 641809.0, 3320005.0, 100923.0, 24117.0, 7829.0, 3075.0, 1322.0, 621.0, 327.0, 131.0, 96.0, 59.0, 26.0, 20.0, 13.0, 5.0, 7.0, 9.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.78594970703125, -6.5679931640625, -6.35003662109375, -6.132080078125, -5.91412353515625, -5.6961669921875, -5.47821044921875, -5.26025390625, -5.04229736328125, -4.8243408203125, -4.60638427734375, -4.388427734375, -4.17047119140625, -3.9525146484375, -3.73455810546875, -3.5166015625, -3.29864501953125, -3.0806884765625, -2.86273193359375, -2.644775390625, -2.42681884765625, -2.2088623046875, -1.99090576171875, -1.77294921875, -1.55499267578125, -1.3370361328125, -1.11907958984375, -0.901123046875, -0.68316650390625, -0.4652099609375, -0.24725341796875, -0.029296875, 0.18865966796875, 0.4066162109375, 0.62457275390625, 0.842529296875, 1.06048583984375, 1.2784423828125, 1.49639892578125, 1.71435546875, 1.93231201171875, 2.1502685546875, 2.36822509765625, 2.586181640625, 2.80413818359375, 3.0220947265625, 3.24005126953125, 3.4580078125, 3.67596435546875, 3.8939208984375, 4.11187744140625, 4.329833984375, 4.54779052734375, 4.7657470703125, 4.98370361328125, 5.20166015625, 5.41961669921875, 5.6375732421875, 5.85552978515625, 6.073486328125, 6.29144287109375, 6.5093994140625, 6.72735595703125, 6.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 11.0, 10.0, 15.0, 15.0, 16.0, 24.0, 29.0, 38.0, 50.0, 44.0, 55.0, 52.0, 59.0, 57.0, 73.0, 66.0, 54.0, 58.0, 44.0, 40.0, 49.0, 28.0, 30.0, 15.0, 14.0, 12.0, 11.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2109375, -1.1689910888671875, -1.127044677734375, -1.0850982666015625, -1.04315185546875, -1.0012054443359375, -0.959259033203125, -0.9173126220703125, -0.8753662109375, -0.8334197998046875, -0.791473388671875, -0.7495269775390625, -0.70758056640625, -0.6656341552734375, -0.623687744140625, -0.5817413330078125, -0.539794921875, -0.4978485107421875, -0.455902099609375, -0.4139556884765625, -0.37200927734375, -0.3300628662109375, -0.288116455078125, -0.2461700439453125, -0.2042236328125, -0.1622772216796875, -0.120330810546875, -0.0783843994140625, -0.03643798828125, 0.0055084228515625, 0.047454833984375, 0.0894012451171875, 0.13134765625, 0.1732940673828125, 0.215240478515625, 0.2571868896484375, 0.29913330078125, 0.3410797119140625, 0.383026123046875, 0.4249725341796875, 0.4669189453125, 0.5088653564453125, 0.550811767578125, 0.5927581787109375, 0.63470458984375, 0.6766510009765625, 0.718597412109375, 0.7605438232421875, 0.802490234375, 0.8444366455078125, 0.886383056640625, 0.9283294677734375, 0.97027587890625, 1.0122222900390625, 1.054168701171875, 1.0961151123046875, 1.1380615234375, 1.1800079345703125, 1.221954345703125, 1.2639007568359375, 1.30584716796875, 1.3477935791015625, 1.389739990234375, 1.4316864013671875, 1.4736328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 9.0, 8.0, 12.0, 17.0, 30.0, 62.0, 102.0, 133.0, 229.0, 414.0, 706.0, 1221.0, 2433.0, 4868.0, 11026.0, 29162.0, 97115.0, 640439.0, 3141840.0, 186708.0, 47249.0, 16565.0, 6772.0, 3305.0, 1683.0, 883.0, 523.0, 311.0, 165.0, 119.0, 68.0, 39.0, 22.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69952392578125, -5.5279541015625, -5.35638427734375, -5.184814453125, -5.01324462890625, -4.8416748046875, -4.67010498046875, -4.49853515625, -4.32696533203125, -4.1553955078125, -3.98382568359375, -3.812255859375, -3.64068603515625, -3.4691162109375, -3.29754638671875, -3.1259765625, -2.95440673828125, -2.7828369140625, -2.61126708984375, -2.439697265625, -2.26812744140625, -2.0965576171875, -1.92498779296875, -1.75341796875, -1.58184814453125, -1.4102783203125, -1.23870849609375, -1.067138671875, -0.89556884765625, -0.7239990234375, -0.55242919921875, -0.380859375, -0.20928955078125, -0.0377197265625, 0.13385009765625, 0.305419921875, 0.47698974609375, 0.6485595703125, 0.82012939453125, 0.99169921875, 1.16326904296875, 1.3348388671875, 1.50640869140625, 1.677978515625, 1.84954833984375, 2.0211181640625, 2.19268798828125, 2.3642578125, 2.53582763671875, 2.7073974609375, 2.87896728515625, 3.050537109375, 3.22210693359375, 3.3936767578125, 3.56524658203125, 3.73681640625, 3.90838623046875, 4.0799560546875, 4.25152587890625, 4.423095703125, 4.59466552734375, 4.7662353515625, 4.93780517578125, 5.109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 18.0, 13.0, 23.0, 30.0, 50.0, 74.0, 108.0, 190.0, 395.0, 1640.0, 818.0, 277.0, 129.0, 66.0, 52.0, 44.0, 30.0, 24.0, 16.0, 11.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.554412841796875, -2.47406005859375, -2.393707275390625, -2.3133544921875, -2.233001708984375, -2.15264892578125, -2.072296142578125, -1.991943359375, -1.911590576171875, -1.83123779296875, -1.750885009765625, -1.6705322265625, -1.590179443359375, -1.50982666015625, -1.429473876953125, -1.34912109375, -1.268768310546875, -1.18841552734375, -1.108062744140625, -1.0277099609375, -0.947357177734375, -0.86700439453125, -0.786651611328125, -0.706298828125, -0.625946044921875, -0.54559326171875, -0.465240478515625, -0.3848876953125, -0.304534912109375, -0.22418212890625, -0.143829345703125, -0.0634765625, 0.016876220703125, 0.09722900390625, 0.177581787109375, 0.2579345703125, 0.338287353515625, 0.41864013671875, 0.498992919921875, 0.579345703125, 0.659698486328125, 0.74005126953125, 0.820404052734375, 0.9007568359375, 0.981109619140625, 1.06146240234375, 1.141815185546875, 1.22216796875, 1.302520751953125, 1.38287353515625, 1.463226318359375, 1.5435791015625, 1.623931884765625, 1.70428466796875, 1.784637451171875, 1.864990234375, 1.945343017578125, 2.02569580078125, 2.106048583984375, 2.1864013671875, 2.266754150390625, 2.34710693359375, 2.427459716796875, 2.5078125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 21.0, 37.0, 77.0, 168.0, 224.0, 190.0, 147.0, 79.0, 27.0, 12.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.649436950683594, -27.853559494018555, -27.057682037353516, -26.261804580688477, -25.465927124023438, -24.6700496673584, -23.87417221069336, -23.078292846679688, -22.28241729736328, -21.486539840698242, -20.690662384033203, -19.894784927368164, -19.098907470703125, -18.303030014038086, -17.507152557373047, -16.711273193359375, -15.915395736694336, -15.119518280029297, -14.323640823364258, -13.527763366699219, -12.73188591003418, -11.93600845336914, -11.140130043029785, -10.344252586364746, -9.548375129699707, -8.752497673034668, -7.956620216369629, -7.160742282867432, -6.364864826202393, -5.5689873695373535, -4.773109436035156, -3.977231979370117, -3.181354522705078, -2.385477066040039, -1.589599370956421, -0.7937216758728027, 0.002155780792236328, 0.7980332374572754, 1.5939111709594727, 2.3897886276245117, 3.185666084289551, 3.98154354095459, 4.777420997619629, 5.573298931121826, 6.369176387786865, 7.165053844451904, 7.960931777954102, 8.75680923461914, 9.55268669128418, 10.348564147949219, 11.144441604614258, 11.940319061279297, 12.736196517944336, 13.532073974609375, 14.32795238494873, 15.12382984161377, 15.919707298278809, 16.715585708618164, 17.511463165283203, 18.307340621948242, 19.10321807861328, 19.89909553527832, 20.69497299194336, 21.4908504486084, 22.286727905273438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 9.0, 7.0, 9.0, 19.0, 17.0, 27.0, 17.0, 19.0, 37.0, 38.0, 38.0, 40.0, 42.0, 42.0, 52.0, 47.0, 47.0, 48.0, 50.0, 42.0, 44.0, 50.0, 23.0, 36.0, 28.0, 32.0, 23.0, 22.0, 11.0, 14.0, 19.0, 10.0, 6.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.208544731140137, -7.939805507659912, -7.6710662841796875, -7.402327060699463, -7.133587837219238, -6.864849090576172, -6.596109867095947, -6.327370643615723, -6.058631420135498, -5.789892196655273, -5.521152973175049, -5.252413749694824, -4.983675003051758, -4.714935302734375, -4.446196556091309, -4.177457332611084, -3.9087181091308594, -3.6399788856506348, -3.37123966217041, -3.1025006771087646, -2.83376145362854, -2.5650222301483154, -2.29628324508667, -2.0275440216064453, -1.7588047981262207, -1.490065574645996, -1.221326470375061, -0.9525873064994812, -0.6838481426239014, -0.41510891914367676, -0.1463698148727417, 0.12236928939819336, 0.39110851287841797, 0.6598476767539978, 0.9285868406295776, 1.1973259449005127, 1.4660651683807373, 1.734804391860962, 2.0035433769226074, 2.272282600402832, 2.5410218238830566, 2.8097610473632812, 3.078500270843506, 3.3472392559051514, 3.615978479385376, 3.8847177028656006, 4.153456687927246, 4.422195911407471, 4.690935134887695, 4.95967435836792, 5.2284135818481445, 5.497152805328369, 5.765892028808594, 6.03463077545166, 6.303369998931885, 6.572109222412109, 6.840848445892334, 7.109587669372559, 7.378326892852783, 7.647066116333008, 7.915804862976074, 8.184544563293457, 8.453283309936523, 8.722023010253906, 8.990761756896973]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 12.0, 19.0, 24.0, 30.0, 43.0, 74.0, 110.0, 164.0, 253.0, 486.0, 920.0, 1778.0, 3610.0, 7745.0, 16602.0, 35793.0, 104619.0, 578180.0, 206443.0, 49669.0, 22057.0, 10158.0, 4779.0, 2368.0, 1118.0, 608.0, 338.0, 193.0, 115.0, 89.0, 49.0, 28.0, 20.0, 15.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.468475341796875, -3.33343505859375, -3.198394775390625, -3.0633544921875, -2.928314208984375, -2.79327392578125, -2.658233642578125, -2.523193359375, -2.388153076171875, -2.25311279296875, -2.118072509765625, -1.9830322265625, -1.847991943359375, -1.71295166015625, -1.577911376953125, -1.44287109375, -1.307830810546875, -1.17279052734375, -1.037750244140625, -0.9027099609375, -0.767669677734375, -0.63262939453125, -0.497589111328125, -0.362548828125, -0.227508544921875, -0.09246826171875, 0.042572021484375, 0.1776123046875, 0.312652587890625, 0.44769287109375, 0.582733154296875, 0.7177734375, 0.852813720703125, 0.98785400390625, 1.122894287109375, 1.2579345703125, 1.392974853515625, 1.52801513671875, 1.663055419921875, 1.798095703125, 1.933135986328125, 2.06817626953125, 2.203216552734375, 2.3382568359375, 2.473297119140625, 2.60833740234375, 2.743377685546875, 2.87841796875, 3.013458251953125, 3.14849853515625, 3.283538818359375, 3.4185791015625, 3.553619384765625, 3.68865966796875, 3.823699951171875, 3.958740234375, 4.093780517578125, 4.22882080078125, 4.363861083984375, 4.4989013671875, 4.633941650390625, 4.76898193359375, 4.904022216796875, 5.0390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 8.0, 13.0, 14.0, 17.0, 15.0, 25.0, 24.0, 36.0, 40.0, 36.0, 39.0, 55.0, 43.0, 51.0, 66.0, 70.0, 53.0, 49.0, 43.0, 53.0, 45.0, 41.0, 39.0, 16.0, 28.0, 13.0, 21.0, 12.0, 1.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1874542236328125, -1.147369384765625, -1.1072845458984375, -1.06719970703125, -1.0271148681640625, -0.987030029296875, -0.9469451904296875, -0.9068603515625, -0.8667755126953125, -0.826690673828125, -0.7866058349609375, -0.74652099609375, -0.7064361572265625, -0.666351318359375, -0.6262664794921875, -0.586181640625, -0.5460968017578125, -0.506011962890625, -0.4659271240234375, -0.42584228515625, -0.3857574462890625, -0.345672607421875, -0.3055877685546875, -0.2655029296875, -0.2254180908203125, -0.185333251953125, -0.1452484130859375, -0.10516357421875, -0.0650787353515625, -0.024993896484375, 0.0150909423828125, 0.05517578125, 0.0952606201171875, 0.135345458984375, 0.1754302978515625, 0.21551513671875, 0.2555999755859375, 0.295684814453125, 0.3357696533203125, 0.3758544921875, 0.4159393310546875, 0.456024169921875, 0.4961090087890625, 0.53619384765625, 0.5762786865234375, 0.616363525390625, 0.6564483642578125, 0.696533203125, 0.7366180419921875, 0.776702880859375, 0.8167877197265625, 0.85687255859375, 0.8969573974609375, 0.937042236328125, 0.9771270751953125, 1.0172119140625, 1.0572967529296875, 1.097381591796875, 1.1374664306640625, 1.17755126953125, 1.2176361083984375, 1.257720947265625, 1.2978057861328125, 1.337890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 7.0, 14.0, 20.0, 14.0, 23.0, 40.0, 43.0, 88.0, 107.0, 209.0, 371.0, 791.0, 1934.0, 5495.0, 17180.0, 57144.0, 687099.0, 222431.0, 37457.0, 11539.0, 3769.0, 1426.0, 612.0, 287.0, 162.0, 94.0, 56.0, 44.0, 29.0, 11.0, 18.0, 13.0, 7.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.98828125, -7.7713623046875, -7.554443359375, -7.3375244140625, -7.12060546875, -6.9036865234375, -6.686767578125, -6.4698486328125, -6.2529296875, -6.0360107421875, -5.819091796875, -5.6021728515625, -5.38525390625, -5.1683349609375, -4.951416015625, -4.7344970703125, -4.517578125, -4.3006591796875, -4.083740234375, -3.8668212890625, -3.64990234375, -3.4329833984375, -3.216064453125, -2.9991455078125, -2.7822265625, -2.5653076171875, -2.348388671875, -2.1314697265625, -1.91455078125, -1.6976318359375, -1.480712890625, -1.2637939453125, -1.046875, -0.8299560546875, -0.613037109375, -0.3961181640625, -0.17919921875, 0.0377197265625, 0.254638671875, 0.4715576171875, 0.6884765625, 0.9053955078125, 1.122314453125, 1.3392333984375, 1.55615234375, 1.7730712890625, 1.989990234375, 2.2069091796875, 2.423828125, 2.6407470703125, 2.857666015625, 3.0745849609375, 3.29150390625, 3.5084228515625, 3.725341796875, 3.9422607421875, 4.1591796875, 4.3760986328125, 4.593017578125, 4.8099365234375, 5.02685546875, 5.2437744140625, 5.460693359375, 5.6776123046875, 5.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 11.0, 8.0, 14.0, 17.0, 22.0, 35.0, 36.0, 59.0, 66.0, 79.0, 84.0, 79.0, 82.0, 66.0, 62.0, 62.0, 38.0, 41.0, 42.0, 21.0, 13.0, 9.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3671875, -9.12725830078125, -8.8873291015625, -8.64739990234375, -8.407470703125, -8.16754150390625, -7.9276123046875, -7.68768310546875, -7.44775390625, -7.20782470703125, -6.9678955078125, -6.72796630859375, -6.488037109375, -6.24810791015625, -6.0081787109375, -5.76824951171875, -5.5283203125, -5.28839111328125, -5.0484619140625, -4.80853271484375, -4.568603515625, -4.32867431640625, -4.0887451171875, -3.84881591796875, -3.60888671875, -3.36895751953125, -3.1290283203125, -2.88909912109375, -2.649169921875, -2.40924072265625, -2.1693115234375, -1.92938232421875, -1.689453125, -1.44952392578125, -1.2095947265625, -0.96966552734375, -0.729736328125, -0.48980712890625, -0.2498779296875, -0.00994873046875, 0.22998046875, 0.46990966796875, 0.7098388671875, 0.94976806640625, 1.189697265625, 1.42962646484375, 1.6695556640625, 1.90948486328125, 2.1494140625, 2.38934326171875, 2.6292724609375, 2.86920166015625, 3.109130859375, 3.34906005859375, 3.5889892578125, 3.82891845703125, 4.06884765625, 4.30877685546875, 4.5487060546875, 4.78863525390625, 5.028564453125, 5.26849365234375, 5.5084228515625, 5.74835205078125, 5.98828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 8.0, 26.0, 20.0, 29.0, 45.0, 81.0, 101.0, 176.0, 255.0, 446.0, 741.0, 1320.0, 2444.0, 4942.0, 10548.0, 24764.0, 65081.0, 410216.0, 415830.0, 65408.0, 24772.0, 10598.0, 4838.0, 2552.0, 1311.0, 794.0, 415.0, 293.0, 157.0, 124.0, 66.0, 41.0, 34.0, 18.0, 20.0, 12.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.583984375, -2.510162353515625, -2.43634033203125, -2.362518310546875, -2.2886962890625, -2.214874267578125, -2.14105224609375, -2.067230224609375, -1.993408203125, -1.919586181640625, -1.84576416015625, -1.771942138671875, -1.6981201171875, -1.624298095703125, -1.55047607421875, -1.476654052734375, -1.40283203125, -1.329010009765625, -1.25518798828125, -1.181365966796875, -1.1075439453125, -1.033721923828125, -0.95989990234375, -0.886077880859375, -0.812255859375, -0.738433837890625, -0.66461181640625, -0.590789794921875, -0.5169677734375, -0.443145751953125, -0.36932373046875, -0.295501708984375, -0.2216796875, -0.147857666015625, -0.07403564453125, -0.000213623046875, 0.0736083984375, 0.147430419921875, 0.22125244140625, 0.295074462890625, 0.368896484375, 0.442718505859375, 0.51654052734375, 0.590362548828125, 0.6641845703125, 0.738006591796875, 0.81182861328125, 0.885650634765625, 0.95947265625, 1.033294677734375, 1.10711669921875, 1.180938720703125, 1.2547607421875, 1.328582763671875, 1.40240478515625, 1.476226806640625, 1.550048828125, 1.623870849609375, 1.69769287109375, 1.771514892578125, 1.8453369140625, 1.919158935546875, 1.99298095703125, 2.066802978515625, 2.140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 7.0, 6.0, 13.0, 18.0, 14.0, 23.0, 46.0, 178.0, 383.0, 132.0, 39.0, 29.0, 23.0, 16.0, 19.0, 8.0, 5.0, 7.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008817464113235474, -0.000852733850479126, -0.0008237212896347046, -0.0007947087287902832, -0.0007656961679458618, -0.0007366836071014404, -0.000707671046257019, -0.0006786584854125977, -0.0006496459245681763, -0.0006206333637237549, -0.0005916208028793335, -0.0005626082420349121, -0.0005335956811904907, -0.0005045831203460693, -0.00047557055950164795, -0.00044655799865722656, -0.0004175454378128052, -0.0003885328769683838, -0.0003595203161239624, -0.000330507755279541, -0.00030149519443511963, -0.00027248263359069824, -0.00024347007274627686, -0.00021445751190185547, -0.00018544495105743408, -0.0001564323902130127, -0.0001274198293685913, -9.840726852416992e-05, -6.939470767974854e-05, -4.038214683532715e-05, -1.1369585990905762e-05, 1.7642974853515625e-05, 4.665553569793701e-05, 7.56680965423584e-05, 0.00010468065738677979, 0.00013369321823120117, 0.00016270577907562256, 0.00019171833992004395, 0.00022073090076446533, 0.0002497434616088867, 0.0002787560224533081, 0.0003077685832977295, 0.0003367811441421509, 0.00036579370498657227, 0.00039480626583099365, 0.00042381882667541504, 0.0004528313875198364, 0.0004818439483642578, 0.0005108565092086792, 0.0005398690700531006, 0.000568881630897522, 0.0005978941917419434, 0.0006269067525863647, 0.0006559193134307861, 0.0006849318742752075, 0.0007139444351196289, 0.0007429569959640503, 0.0007719695568084717, 0.0008009821176528931, 0.0008299946784973145, 0.0008590072393417358, 0.0008880198001861572, 0.0009170323610305786, 0.000946044921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 13.0, 16.0, 33.0, 39.0, 67.0, 101.0, 174.0, 269.0, 550.0, 1517.0, 4774.0, 20925.0, 121947.0, 794208.0, 81838.0, 15820.0, 3859.0, 1226.0, 505.0, 248.0, 146.0, 105.0, 53.0, 35.0, 20.0, 24.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.56640625, -4.43743896484375, -4.3084716796875, -4.17950439453125, -4.050537109375, -3.92156982421875, -3.7926025390625, -3.66363525390625, -3.53466796875, -3.40570068359375, -3.2767333984375, -3.14776611328125, -3.018798828125, -2.88983154296875, -2.7608642578125, -2.63189697265625, -2.5029296875, -2.37396240234375, -2.2449951171875, -2.11602783203125, -1.987060546875, -1.85809326171875, -1.7291259765625, -1.60015869140625, -1.47119140625, -1.34222412109375, -1.2132568359375, -1.08428955078125, -0.955322265625, -0.82635498046875, -0.6973876953125, -0.56842041015625, -0.439453125, -0.31048583984375, -0.1815185546875, -0.05255126953125, 0.076416015625, 0.20538330078125, 0.3343505859375, 0.46331787109375, 0.59228515625, 0.72125244140625, 0.8502197265625, 0.97918701171875, 1.108154296875, 1.23712158203125, 1.3660888671875, 1.49505615234375, 1.6240234375, 1.75299072265625, 1.8819580078125, 2.01092529296875, 2.139892578125, 2.26885986328125, 2.3978271484375, 2.52679443359375, 2.65576171875, 2.78472900390625, 2.9136962890625, 3.04266357421875, 3.171630859375, 3.30059814453125, 3.4295654296875, 3.55853271484375, 3.6875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 4.0, 10.0, 14.0, 13.0, 20.0, 12.0, 24.0, 33.0, 57.0, 118.0, 145.0, 165.0, 125.0, 51.0, 32.0, 33.0, 23.0, 20.0, 15.0, 14.0, 7.0, 12.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09375, -2.019378662109375, -1.94500732421875, -1.870635986328125, -1.7962646484375, -1.721893310546875, -1.64752197265625, -1.573150634765625, -1.498779296875, -1.424407958984375, -1.35003662109375, -1.275665283203125, -1.2012939453125, -1.126922607421875, -1.05255126953125, -0.978179931640625, -0.90380859375, -0.829437255859375, -0.75506591796875, -0.680694580078125, -0.6063232421875, -0.531951904296875, -0.45758056640625, -0.383209228515625, -0.308837890625, -0.234466552734375, -0.16009521484375, -0.085723876953125, -0.0113525390625, 0.063018798828125, 0.13739013671875, 0.211761474609375, 0.2861328125, 0.360504150390625, 0.43487548828125, 0.509246826171875, 0.5836181640625, 0.657989501953125, 0.73236083984375, 0.806732177734375, 0.881103515625, 0.955474853515625, 1.02984619140625, 1.104217529296875, 1.1785888671875, 1.252960205078125, 1.32733154296875, 1.401702880859375, 1.47607421875, 1.550445556640625, 1.62481689453125, 1.699188232421875, 1.7735595703125, 1.847930908203125, 1.92230224609375, 1.996673583984375, 2.071044921875, 2.145416259765625, 2.21978759765625, 2.294158935546875, 2.3685302734375, 2.442901611328125, 2.51727294921875, 2.591644287109375, 2.666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 28.0, 25.0, 53.0, 62.0, 82.0, 88.0, 115.0, 102.0, 101.0, 82.0, 69.0, 42.0, 36.0, 22.0, 23.0, 16.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.986961364746094, -31.047964096069336, -30.108964920043945, -29.169967651367188, -28.23097038269043, -27.291973114013672, -26.35297393798828, -25.413976669311523, -24.474979400634766, -23.535982131958008, -22.596982955932617, -21.65798568725586, -20.7189884185791, -19.779991149902344, -18.840991973876953, -17.901994705200195, -16.962995529174805, -16.023998260498047, -15.085000038146973, -14.146001815795898, -13.20700454711914, -12.268006324768066, -11.329008102416992, -10.390010833740234, -9.45101261138916, -8.512014389038086, -7.573017120361328, -6.634018898010254, -5.695021152496338, -4.756023406982422, -3.8170251846313477, -2.8780274391174316, -1.9390277862548828, -1.0000299215316772, -0.06103205680847168, 0.8779659271240234, 1.8169636726379395, 2.7559614181518555, 3.6949596405029297, 4.633957386016846, 5.572955131530762, 6.511952877044678, 7.450950622558594, 8.389948844909668, 9.328947067260742, 10.2679443359375, 11.206942558288574, 12.145940780639648, 13.084938049316406, 14.02393627166748, 14.962933540344238, 15.901931762695312, 16.84092903137207, 17.779926300048828, 18.71892547607422, 19.657922744750977, 20.596920013427734, 21.535917282104492, 22.474916458129883, 23.41391372680664, 24.3529109954834, 25.291908264160156, 26.230907440185547, 27.169904708862305, 28.108903884887695]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 5.0, 10.0, 4.0, 13.0, 14.0, 15.0, 22.0, 15.0, 17.0, 28.0, 28.0, 31.0, 34.0, 35.0, 37.0, 44.0, 54.0, 50.0, 48.0, 42.0, 39.0, 40.0, 45.0, 40.0, 32.0, 42.0, 25.0, 31.0, 21.0, 19.0, 15.0, 19.0, 16.0, 12.0, 7.0, 14.0, 3.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-24.45825958251953, -23.762027740478516, -23.0657958984375, -22.369564056396484, -21.67333221435547, -20.977100372314453, -20.280868530273438, -19.584636688232422, -18.888404846191406, -18.19217300415039, -17.495941162109375, -16.79970932006836, -16.103477478027344, -15.407245635986328, -14.711012840270996, -14.01478099822998, -13.318548202514648, -12.622316360473633, -11.926084518432617, -11.229852676391602, -10.533620834350586, -9.83738899230957, -9.141156196594238, -8.444924354553223, -7.748692512512207, -7.052460670471191, -6.356228828430176, -5.659996509552002, -4.963764667510986, -4.267532825469971, -3.571300506591797, -2.8750686645507812, -2.178834915161133, -1.4826029539108276, -0.7863709926605225, -0.09013891220092773, 0.6060929298400879, 1.3023247718811035, 1.9985570907592773, 2.694788932800293, 3.3910207748413086, 4.087252616882324, 4.78348445892334, 5.479716777801514, 6.175948619842529, 6.872180461883545, 7.568412780761719, 8.264644622802734, 8.96087646484375, 9.657108306884766, 10.353340148925781, 11.049571990966797, 11.745803833007812, 12.442035675048828, 13.13826847076416, 13.834500312805176, 14.530732154846191, 15.226963996887207, 15.923195838928223, 16.619428634643555, 17.31566047668457, 18.011892318725586, 18.7081241607666, 19.404356002807617, 20.100587844848633]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 17.0, 35.0, 38.0, 68.0, 108.0, 216.0, 456.0, 991.0, 2372.0, 6111.0, 17300.0, 68537.0, 1583259.0, 2416290.0, 70520.0, 17752.0, 6003.0, 2298.0, 978.0, 440.0, 216.0, 109.0, 59.0, 28.0, 18.0, 7.0, 15.0, 8.0, 4.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75, -7.4732666015625, -7.196533203125, -6.9197998046875, -6.64306640625, -6.3663330078125, -6.089599609375, -5.8128662109375, -5.5361328125, -5.2593994140625, -4.982666015625, -4.7059326171875, -4.42919921875, -4.1524658203125, -3.875732421875, -3.5989990234375, -3.322265625, -3.0455322265625, -2.768798828125, -2.4920654296875, -2.21533203125, -1.9385986328125, -1.661865234375, -1.3851318359375, -1.1083984375, -0.8316650390625, -0.554931640625, -0.2781982421875, -0.00146484375, 0.2752685546875, 0.552001953125, 0.8287353515625, 1.10546875, 1.3822021484375, 1.658935546875, 1.9356689453125, 2.21240234375, 2.4891357421875, 2.765869140625, 3.0426025390625, 3.3193359375, 3.5960693359375, 3.872802734375, 4.1495361328125, 4.42626953125, 4.7030029296875, 4.979736328125, 5.2564697265625, 5.533203125, 5.8099365234375, 6.086669921875, 6.3634033203125, 6.64013671875, 6.9168701171875, 7.193603515625, 7.4703369140625, 7.7470703125, 8.0238037109375, 8.300537109375, 8.5772705078125, 8.85400390625, 9.1307373046875, 9.407470703125, 9.6842041015625, 9.9609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 12.0, 11.0, 14.0, 16.0, 14.0, 15.0, 28.0, 18.0, 32.0, 36.0, 47.0, 30.0, 35.0, 62.0, 59.0, 54.0, 59.0, 67.0, 46.0, 48.0, 47.0, 40.0, 33.0, 38.0, 33.0, 36.0, 10.0, 18.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2179718017578125, -1.177154541015625, -1.1363372802734375, -1.09552001953125, -1.0547027587890625, -1.013885498046875, -0.9730682373046875, -0.9322509765625, -0.8914337158203125, -0.850616455078125, -0.8097991943359375, -0.76898193359375, -0.7281646728515625, -0.687347412109375, -0.6465301513671875, -0.605712890625, -0.5648956298828125, -0.524078369140625, -0.4832611083984375, -0.44244384765625, -0.4016265869140625, -0.360809326171875, -0.3199920654296875, -0.2791748046875, -0.2383575439453125, -0.197540283203125, -0.1567230224609375, -0.11590576171875, -0.0750885009765625, -0.034271240234375, 0.0065460205078125, 0.04736328125, 0.0881805419921875, 0.128997802734375, 0.1698150634765625, 0.21063232421875, 0.2514495849609375, 0.292266845703125, 0.3330841064453125, 0.3739013671875, 0.4147186279296875, 0.455535888671875, 0.4963531494140625, 0.53717041015625, 0.5779876708984375, 0.618804931640625, 0.6596221923828125, 0.700439453125, 0.7412567138671875, 0.782073974609375, 0.8228912353515625, 0.86370849609375, 0.9045257568359375, 0.945343017578125, 0.9861602783203125, 1.0269775390625, 1.0677947998046875, 1.108612060546875, 1.1494293212890625, 1.19024658203125, 1.2310638427734375, 1.271881103515625, 1.3126983642578125, 1.353515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 13.0, 11.0, 20.0, 33.0, 50.0, 80.0, 70.0, 127.0, 171.0, 222.0, 297.0, 497.0, 815.0, 1381.0, 2636.0, 5352.0, 12195.0, 30264.0, 97024.0, 718487.0, 3109359.0, 144639.0, 40798.0, 15409.0, 6567.0, 3247.0, 1675.0, 936.0, 565.0, 388.0, 274.0, 173.0, 132.0, 93.0, 63.0, 56.0, 39.0, 35.0, 23.0, 16.0, 14.0, 13.0, 9.0, 7.0, 1.0, 3.0], "bins": [-8.140625, -7.92718505859375, -7.7137451171875, -7.50030517578125, -7.286865234375, -7.07342529296875, -6.8599853515625, -6.64654541015625, -6.43310546875, -6.21966552734375, -6.0062255859375, -5.79278564453125, -5.579345703125, -5.36590576171875, -5.1524658203125, -4.93902587890625, -4.7255859375, -4.51214599609375, -4.2987060546875, -4.08526611328125, -3.871826171875, -3.65838623046875, -3.4449462890625, -3.23150634765625, -3.01806640625, -2.80462646484375, -2.5911865234375, -2.37774658203125, -2.164306640625, -1.95086669921875, -1.7374267578125, -1.52398681640625, -1.310546875, -1.09710693359375, -0.8836669921875, -0.67022705078125, -0.456787109375, -0.24334716796875, -0.0299072265625, 0.18353271484375, 0.39697265625, 0.61041259765625, 0.8238525390625, 1.03729248046875, 1.250732421875, 1.46417236328125, 1.6776123046875, 1.89105224609375, 2.1044921875, 2.31793212890625, 2.5313720703125, 2.74481201171875, 2.958251953125, 3.17169189453125, 3.3851318359375, 3.59857177734375, 3.81201171875, 4.02545166015625, 4.2388916015625, 4.45233154296875, 4.665771484375, 4.87921142578125, 5.0926513671875, 5.30609130859375, 5.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 12.0, 12.0, 16.0, 24.0, 30.0, 46.0, 65.0, 148.0, 290.0, 1484.0, 1301.0, 275.0, 109.0, 78.0, 41.0, 47.0, 17.0, 13.0, 14.0, 11.0, 4.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57421875, -2.4622802734375, -2.350341796875, -2.2384033203125, -2.12646484375, -2.0145263671875, -1.902587890625, -1.7906494140625, -1.6787109375, -1.5667724609375, -1.454833984375, -1.3428955078125, -1.23095703125, -1.1190185546875, -1.007080078125, -0.8951416015625, -0.783203125, -0.6712646484375, -0.559326171875, -0.4473876953125, -0.33544921875, -0.2235107421875, -0.111572265625, 0.0003662109375, 0.1123046875, 0.2242431640625, 0.336181640625, 0.4481201171875, 0.56005859375, 0.6719970703125, 0.783935546875, 0.8958740234375, 1.0078125, 1.1197509765625, 1.231689453125, 1.3436279296875, 1.45556640625, 1.5675048828125, 1.679443359375, 1.7913818359375, 1.9033203125, 2.0152587890625, 2.127197265625, 2.2391357421875, 2.35107421875, 2.4630126953125, 2.574951171875, 2.6868896484375, 2.798828125, 2.9107666015625, 3.022705078125, 3.1346435546875, 3.24658203125, 3.3585205078125, 3.470458984375, 3.5823974609375, 3.6943359375, 3.8062744140625, 3.918212890625, 4.0301513671875, 4.14208984375, 4.2540283203125, 4.365966796875, 4.4779052734375, 4.58984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 33.0, 53.0, 72.0, 132.0, 157.0, 151.0, 128.0, 91.0, 52.0, 36.0, 23.0, 10.0, 11.0, 10.0, 1.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.313812255859375, -15.635957717895508, -14.958102226257324, -14.280247688293457, -13.602392196655273, -12.924537658691406, -12.246683120727539, -11.568827629089355, -10.890972137451172, -10.213117599487305, -9.535262107849121, -8.857407569885254, -8.17955207824707, -7.501697540283203, -6.823842525482178, -6.145987510681152, -5.468132972717285, -4.79027795791626, -4.112422943115234, -3.434568166732788, -2.7567131519317627, -2.0788581371307373, -1.401003360748291, -0.7231483459472656, -0.045293331146240234, 0.6325616240501404, 1.310416579246521, 1.9882714748382568, 2.6661264896392822, 3.3439815044403076, 4.021836280822754, 4.699691295623779, 5.377546310424805, 6.05540132522583, 6.7332563400268555, 7.411110877990723, 8.088966369628906, 8.766820907592773, 9.44467544555664, 10.122530937194824, 10.800386428833008, 11.478240966796875, 12.156096458435059, 12.833950996398926, 13.51180648803711, 14.189661026000977, 14.867515563964844, 15.545371055603027, 16.223224639892578, 16.901079177856445, 17.578933715820312, 18.256790161132812, 18.93464469909668, 19.612499237060547, 20.290353775024414, 20.96820831298828, 21.64606475830078, 22.32391929626465, 23.001773834228516, 23.679630279541016, 24.357484817504883, 25.03533935546875, 25.713193893432617, 26.391048431396484, 27.068904876708984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 9.0, 8.0, 9.0, 10.0, 11.0, 17.0, 20.0, 27.0, 22.0, 23.0, 40.0, 43.0, 48.0, 41.0, 46.0, 57.0, 42.0, 44.0, 70.0, 55.0, 47.0, 48.0, 49.0, 34.0, 30.0, 35.0, 21.0, 23.0, 18.0, 14.0, 12.0, 7.0, 4.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.803576469421387, -10.422284126281738, -10.04099178314209, -9.659699440002441, -9.278407096862793, -8.897113800048828, -8.51582145690918, -8.134529113769531, -7.753236770629883, -7.371944427490234, -6.990652084350586, -6.6093597412109375, -6.228066921234131, -5.846774578094482, -5.465482234954834, -5.084189414978027, -4.702897548675537, -4.321605205535889, -3.940312623977661, -3.5590202808380127, -3.177727699279785, -2.7964353561401367, -2.4151430130004883, -2.0338504314422607, -1.6525580883026123, -1.2712656259536743, -0.8899732232093811, -0.5086808204650879, -0.1273883581161499, 0.2539041042327881, 0.6351964473724365, 1.016489028930664, 1.3977813720703125, 1.7790738344192505, 2.1603662967681885, 2.541658639907837, 2.9229512214660645, 3.304243564605713, 3.6855359077453613, 4.066828727722168, 4.448121070861816, 4.829413414001465, 5.210705757141113, 5.591998100280762, 5.973290920257568, 6.354583263397217, 6.735875606536865, 7.117168426513672, 7.498460292816162, 7.8797526359558105, 8.261045455932617, 8.642337799072266, 9.023630142211914, 9.404922485351562, 9.786214828491211, 10.16750717163086, 10.548799514770508, 10.930091857910156, 11.311384201049805, 11.692676544189453, 12.073968887329102, 12.45526123046875, 12.836553573608398, 13.217846870422363, 13.599139213562012]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 17.0, 19.0, 34.0, 40.0, 72.0, 85.0, 136.0, 185.0, 334.0, 527.0, 922.0, 1864.0, 3714.0, 8368.0, 19525.0, 46241.0, 116123.0, 355675.0, 316337.0, 103347.0, 42112.0, 17620.0, 7794.0, 3513.0, 1657.0, 875.0, 507.0, 281.0, 197.0, 112.0, 66.0, 70.0, 50.0, 33.0, 28.0, 19.0, 12.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-5.08203125, -4.93231201171875, -4.7825927734375, -4.63287353515625, -4.483154296875, -4.33343505859375, -4.1837158203125, -4.03399658203125, -3.88427734375, -3.73455810546875, -3.5848388671875, -3.43511962890625, -3.285400390625, -3.13568115234375, -2.9859619140625, -2.83624267578125, -2.6865234375, -2.53680419921875, -2.3870849609375, -2.23736572265625, -2.087646484375, -1.93792724609375, -1.7882080078125, -1.63848876953125, -1.48876953125, -1.33905029296875, -1.1893310546875, -1.03961181640625, -0.889892578125, -0.74017333984375, -0.5904541015625, -0.44073486328125, -0.291015625, -0.14129638671875, 0.0084228515625, 0.15814208984375, 0.307861328125, 0.45758056640625, 0.6072998046875, 0.75701904296875, 0.90673828125, 1.05645751953125, 1.2061767578125, 1.35589599609375, 1.505615234375, 1.65533447265625, 1.8050537109375, 1.95477294921875, 2.1044921875, 2.25421142578125, 2.4039306640625, 2.55364990234375, 2.703369140625, 2.85308837890625, 3.0028076171875, 3.15252685546875, 3.30224609375, 3.45196533203125, 3.6016845703125, 3.75140380859375, 3.901123046875, 4.05084228515625, 4.2005615234375, 4.35028076171875, 4.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 18.0, 14.0, 17.0, 17.0, 17.0, 28.0, 34.0, 36.0, 35.0, 40.0, 51.0, 45.0, 60.0, 64.0, 55.0, 50.0, 63.0, 41.0, 40.0, 37.0, 39.0, 32.0, 29.0, 27.0, 20.0, 17.0, 24.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3803253173828125, -1.335845947265625, -1.2913665771484375, -1.24688720703125, -1.2024078369140625, -1.157928466796875, -1.1134490966796875, -1.0689697265625, -1.0244903564453125, -0.980010986328125, -0.9355316162109375, -0.89105224609375, -0.8465728759765625, -0.802093505859375, -0.7576141357421875, -0.713134765625, -0.6686553955078125, -0.624176025390625, -0.5796966552734375, -0.53521728515625, -0.4907379150390625, -0.446258544921875, -0.4017791748046875, -0.3572998046875, -0.3128204345703125, -0.268341064453125, -0.2238616943359375, -0.17938232421875, -0.1349029541015625, -0.090423583984375, -0.0459442138671875, -0.00146484375, 0.0430145263671875, 0.087493896484375, 0.1319732666015625, 0.17645263671875, 0.2209320068359375, 0.265411376953125, 0.3098907470703125, 0.3543701171875, 0.3988494873046875, 0.443328857421875, 0.4878082275390625, 0.53228759765625, 0.5767669677734375, 0.621246337890625, 0.6657257080078125, 0.710205078125, 0.7546844482421875, 0.799163818359375, 0.8436431884765625, 0.88812255859375, 0.9326019287109375, 0.977081298828125, 1.0215606689453125, 1.0660400390625, 1.1105194091796875, 1.154998779296875, 1.1994781494140625, 1.24395751953125, 1.2884368896484375, 1.332916259765625, 1.3773956298828125, 1.421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 14.0, 25.0, 51.0, 57.0, 77.0, 170.0, 256.0, 412.0, 764.0, 1855.0, 6301.0, 38539.0, 387533.0, 551943.0, 48835.0, 7647.0, 2010.0, 893.0, 426.0, 263.0, 159.0, 104.0, 61.0, 34.0, 28.0, 22.0, 16.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.11712646484375, -6.8084716796875, -6.49981689453125, -6.191162109375, -5.88250732421875, -5.5738525390625, -5.26519775390625, -4.95654296875, -4.64788818359375, -4.3392333984375, -4.03057861328125, -3.721923828125, -3.41326904296875, -3.1046142578125, -2.79595947265625, -2.4873046875, -2.17864990234375, -1.8699951171875, -1.56134033203125, -1.252685546875, -0.94403076171875, -0.6353759765625, -0.32672119140625, -0.01806640625, 0.29058837890625, 0.5992431640625, 0.90789794921875, 1.216552734375, 1.52520751953125, 1.8338623046875, 2.14251708984375, 2.451171875, 2.75982666015625, 3.0684814453125, 3.37713623046875, 3.685791015625, 3.99444580078125, 4.3031005859375, 4.61175537109375, 4.92041015625, 5.22906494140625, 5.5377197265625, 5.84637451171875, 6.155029296875, 6.46368408203125, 6.7723388671875, 7.08099365234375, 7.3896484375, 7.69830322265625, 8.0069580078125, 8.31561279296875, 8.624267578125, 8.93292236328125, 9.2415771484375, 9.55023193359375, 9.85888671875, 10.16754150390625, 10.4761962890625, 10.78485107421875, 11.093505859375, 11.40216064453125, 11.7108154296875, 12.01947021484375, 12.328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 7.0, 8.0, 10.0, 9.0, 15.0, 19.0, 19.0, 20.0, 25.0, 41.0, 34.0, 40.0, 38.0, 41.0, 49.0, 44.0, 39.0, 55.0, 57.0, 50.0, 46.0, 40.0, 30.0, 38.0, 27.0, 29.0, 33.0, 23.0, 28.0, 14.0, 14.0, 8.0, 3.0, 6.0, 8.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7984619140625, -5.612548828125, -5.4266357421875, -5.24072265625, -5.0548095703125, -4.868896484375, -4.6829833984375, -4.4970703125, -4.3111572265625, -4.125244140625, -3.9393310546875, -3.75341796875, -3.5675048828125, -3.381591796875, -3.1956787109375, -3.009765625, -2.8238525390625, -2.637939453125, -2.4520263671875, -2.26611328125, -2.0802001953125, -1.894287109375, -1.7083740234375, -1.5224609375, -1.3365478515625, -1.150634765625, -0.9647216796875, -0.77880859375, -0.5928955078125, -0.406982421875, -0.2210693359375, -0.03515625, 0.1507568359375, 0.336669921875, 0.5225830078125, 0.70849609375, 0.8944091796875, 1.080322265625, 1.2662353515625, 1.4521484375, 1.6380615234375, 1.823974609375, 2.0098876953125, 2.19580078125, 2.3817138671875, 2.567626953125, 2.7535400390625, 2.939453125, 3.1253662109375, 3.311279296875, 3.4971923828125, 3.68310546875, 3.8690185546875, 4.054931640625, 4.2408447265625, 4.4267578125, 4.6126708984375, 4.798583984375, 4.9844970703125, 5.17041015625, 5.3563232421875, 5.542236328125, 5.7281494140625, 5.9140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 13.0, 23.0, 22.0, 34.0, 58.0, 93.0, 175.0, 298.0, 622.0, 1246.0, 3039.0, 8145.0, 23854.0, 75957.0, 330608.0, 462081.0, 96846.0, 28849.0, 9854.0, 3695.0, 1498.0, 693.0, 337.0, 204.0, 101.0, 59.0, 43.0, 30.0, 21.0, 14.0, 8.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.015625, -3.91546630859375, -3.8153076171875, -3.71514892578125, -3.614990234375, -3.51483154296875, -3.4146728515625, -3.31451416015625, -3.21435546875, -3.11419677734375, -3.0140380859375, -2.91387939453125, -2.813720703125, -2.71356201171875, -2.6134033203125, -2.51324462890625, -2.4130859375, -2.31292724609375, -2.2127685546875, -2.11260986328125, -2.012451171875, -1.91229248046875, -1.8121337890625, -1.71197509765625, -1.61181640625, -1.51165771484375, -1.4114990234375, -1.31134033203125, -1.211181640625, -1.11102294921875, -1.0108642578125, -0.91070556640625, -0.810546875, -0.71038818359375, -0.6102294921875, -0.51007080078125, -0.409912109375, -0.30975341796875, -0.2095947265625, -0.10943603515625, -0.00927734375, 0.09088134765625, 0.1910400390625, 0.29119873046875, 0.391357421875, 0.49151611328125, 0.5916748046875, 0.69183349609375, 0.7919921875, 0.89215087890625, 0.9923095703125, 1.09246826171875, 1.192626953125, 1.29278564453125, 1.3929443359375, 1.49310302734375, 1.59326171875, 1.69342041015625, 1.7935791015625, 1.89373779296875, 1.993896484375, 2.09405517578125, 2.1942138671875, 2.29437255859375, 2.39453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 19.0, 10.0, 17.0, 27.0, 26.0, 38.0, 45.0, 55.0, 99.0, 207.0, 140.0, 62.0, 41.0, 29.0, 30.0, 25.0, 21.0, 17.0, 16.0, 11.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000835418701171875, -0.0008098036050796509, -0.0007841885089874268, -0.0007585734128952026, -0.0007329583168029785, -0.0007073432207107544, -0.0006817281246185303, -0.0006561130285263062, -0.000630497932434082, -0.0006048828363418579, -0.0005792677402496338, -0.0005536526441574097, -0.0005280375480651855, -0.0005024224519729614, -0.0004768073558807373, -0.0004511922597885132, -0.00042557716369628906, -0.00039996206760406494, -0.0003743469715118408, -0.0003487318754196167, -0.0003231167793273926, -0.00029750168323516846, -0.00027188658714294434, -0.0002462714910507202, -0.0002206563949584961, -0.00019504129886627197, -0.00016942620277404785, -0.00014381110668182373, -0.00011819601058959961, -9.258091449737549e-05, -6.696581840515137e-05, -4.1350722312927246e-05, -1.5735626220703125e-05, 9.879469871520996e-06, 3.549456596374512e-05, 6.110966205596924e-05, 8.672475814819336e-05, 0.00011233985424041748, 0.0001379549503326416, 0.00016357004642486572, 0.00018918514251708984, 0.00021480023860931396, 0.00024041533470153809, 0.0002660304307937622, 0.00029164552688598633, 0.00031726062297821045, 0.00034287571907043457, 0.0003684908151626587, 0.0003941059112548828, 0.00041972100734710693, 0.00044533610343933105, 0.0004709511995315552, 0.0004965662956237793, 0.0005221813917160034, 0.0005477964878082275, 0.0005734115839004517, 0.0005990266799926758, 0.0006246417760848999, 0.000650256872177124, 0.0006758719682693481, 0.0007014870643615723, 0.0007271021604537964, 0.0007527172565460205, 0.0007783323526382446, 0.0008039474487304688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 10.0, 18.0, 19.0, 20.0, 43.0, 51.0, 85.0, 163.0, 314.0, 560.0, 1420.0, 4589.0, 22625.0, 173400.0, 709442.0, 113809.0, 16021.0, 3655.0, 1154.0, 509.0, 241.0, 127.0, 85.0, 48.0, 34.0, 17.0, 22.0, 21.0, 10.0, 11.0, 8.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.1875, -6.0220947265625, -5.856689453125, -5.6912841796875, -5.52587890625, -5.3604736328125, -5.195068359375, -5.0296630859375, -4.8642578125, -4.6988525390625, -4.533447265625, -4.3680419921875, -4.20263671875, -4.0372314453125, -3.871826171875, -3.7064208984375, -3.541015625, -3.3756103515625, -3.210205078125, -3.0447998046875, -2.87939453125, -2.7139892578125, -2.548583984375, -2.3831787109375, -2.2177734375, -2.0523681640625, -1.886962890625, -1.7215576171875, -1.55615234375, -1.3907470703125, -1.225341796875, -1.0599365234375, -0.89453125, -0.7291259765625, -0.563720703125, -0.3983154296875, -0.23291015625, -0.0675048828125, 0.097900390625, 0.2633056640625, 0.4287109375, 0.5941162109375, 0.759521484375, 0.9249267578125, 1.09033203125, 1.2557373046875, 1.421142578125, 1.5865478515625, 1.751953125, 1.9173583984375, 2.082763671875, 2.2481689453125, 2.41357421875, 2.5789794921875, 2.744384765625, 2.9097900390625, 3.0751953125, 3.2406005859375, 3.406005859375, 3.5714111328125, 3.73681640625, 3.9022216796875, 4.067626953125, 4.2330322265625, 4.3984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 12.0, 19.0, 15.0, 31.0, 42.0, 69.0, 89.0, 118.0, 145.0, 126.0, 93.0, 70.0, 44.0, 33.0, 24.0, 10.0, 13.0, 11.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.26953125, -6.1324462890625, -5.995361328125, -5.8582763671875, -5.72119140625, -5.5841064453125, -5.447021484375, -5.3099365234375, -5.1728515625, -5.0357666015625, -4.898681640625, -4.7615966796875, -4.62451171875, -4.4874267578125, -4.350341796875, -4.2132568359375, -4.076171875, -3.9390869140625, -3.802001953125, -3.6649169921875, -3.52783203125, -3.3907470703125, -3.253662109375, -3.1165771484375, -2.9794921875, -2.8424072265625, -2.705322265625, -2.5682373046875, -2.43115234375, -2.2940673828125, -2.156982421875, -2.0198974609375, -1.8828125, -1.7457275390625, -1.608642578125, -1.4715576171875, -1.33447265625, -1.1973876953125, -1.060302734375, -0.9232177734375, -0.7861328125, -0.6490478515625, -0.511962890625, -0.3748779296875, -0.23779296875, -0.1007080078125, 0.036376953125, 0.1734619140625, 0.310546875, 0.4476318359375, 0.584716796875, 0.7218017578125, 0.85888671875, 0.9959716796875, 1.133056640625, 1.2701416015625, 1.4072265625, 1.5443115234375, 1.681396484375, 1.8184814453125, 1.95556640625, 2.0926513671875, 2.229736328125, 2.3668212890625, 2.50390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 21.0, 65.0, 181.0, 338.0, 251.0, 103.0, 24.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.445945739746094, -42.7911262512207, -39.13630676269531, -35.48148727416992, -31.82666778564453, -28.17184829711914, -24.51702880859375, -20.86220932006836, -17.20738983154297, -13.552570343017578, -9.897750854492188, -6.242931365966797, -2.5881118774414062, 1.0667076110839844, 4.721527099609375, 8.376346588134766, 12.031166076660156, 15.685985565185547, 19.340805053710938, 22.995624542236328, 26.65044403076172, 30.30526351928711, 33.9600830078125, 37.61490249633789, 41.26972198486328, 44.92454147338867, 48.57936096191406, 52.23418045043945, 55.888999938964844, 59.543819427490234, 63.198638916015625, 66.85345458984375, 70.50827026367188, 74.1630859375, 77.81790924072266, 81.47273254394531, 85.12754821777344, 88.78236389160156, 92.43718719482422, 96.09201049804688, 99.746826171875, 103.40164184570312, 107.05646514892578, 110.71128845214844, 114.36610412597656, 118.02091979980469, 121.67574310302734, 125.33056640625, 128.98538208007812, 132.64019775390625, 136.29501342773438, 139.94984436035156, 143.6046600341797, 147.2594757080078, 150.914306640625, 154.56912231445312, 158.22393798828125, 161.87875366210938, 165.5335693359375, 169.1884002685547, 172.8432159423828, 176.49803161621094, 180.15286254882812, 183.80767822265625, 187.46249389648438]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 8.0, 13.0, 13.0, 15.0, 15.0, 23.0, 20.0, 22.0, 17.0, 25.0, 36.0, 44.0, 33.0, 52.0, 35.0, 41.0, 45.0, 50.0, 43.0, 35.0, 45.0, 39.0, 44.0, 27.0, 29.0, 28.0, 27.0, 20.0, 22.0, 17.0, 18.0, 16.0, 11.0, 11.0, 6.0, 6.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.444995880126953, -28.50366973876953, -27.56234359741211, -26.621017456054688, -25.679691314697266, -24.738365173339844, -23.797039031982422, -22.855712890625, -21.914386749267578, -20.973060607910156, -20.031734466552734, -19.090408325195312, -18.14908218383789, -17.20775604248047, -16.266429901123047, -15.325104713439941, -14.383779525756836, -13.442453384399414, -12.501127243041992, -11.55980110168457, -10.618474960327148, -9.677148818969727, -8.735823631286621, -7.794497489929199, -6.853171348571777, -5.9118452072143555, -4.970519065856934, -4.02919340133667, -3.087867259979248, -2.146541118621826, -1.2052154541015625, -0.2638893127441406, 0.6774368286132812, 1.6187628507614136, 2.560088872909546, 3.5014147758483887, 4.4427409172058105, 5.384067058563232, 6.325392723083496, 7.266718864440918, 8.20804500579834, 9.149371147155762, 10.090697288513184, 11.032022476196289, 11.973348617553711, 12.914674758911133, 13.856000900268555, 14.797327041625977, 15.738653182983398, 16.67997932434082, 17.621305465698242, 18.562631607055664, 19.503957748413086, 20.445283889770508, 21.386608123779297, 22.32793426513672, 23.26926040649414, 24.210586547851562, 25.151912689208984, 26.093238830566406, 27.034564971923828, 27.97589111328125, 28.917217254638672, 29.858543395996094, 30.799869537353516]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 12.0, 21.0, 25.0, 59.0, 110.0, 221.0, 571.0, 1665.0, 6552.0, 32435.0, 398894.0, 3672063.0, 66051.0, 11341.0, 2787.0, 860.0, 294.0, 134.0, 74.0, 33.0, 27.0, 18.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7454833984375, -9.342529296875, -8.9395751953125, -8.53662109375, -8.1336669921875, -7.730712890625, -7.3277587890625, -6.9248046875, -6.5218505859375, -6.118896484375, -5.7159423828125, -5.31298828125, -4.9100341796875, -4.507080078125, -4.1041259765625, -3.701171875, -3.2982177734375, -2.895263671875, -2.4923095703125, -2.08935546875, -1.6864013671875, -1.283447265625, -0.8804931640625, -0.4775390625, -0.0745849609375, 0.328369140625, 0.7313232421875, 1.13427734375, 1.5372314453125, 1.940185546875, 2.3431396484375, 2.74609375, 3.1490478515625, 3.552001953125, 3.9549560546875, 4.35791015625, 4.7608642578125, 5.163818359375, 5.5667724609375, 5.9697265625, 6.3726806640625, 6.775634765625, 7.1785888671875, 7.58154296875, 7.9844970703125, 8.387451171875, 8.7904052734375, 9.193359375, 9.5963134765625, 9.999267578125, 10.4022216796875, 10.80517578125, 11.2081298828125, 11.611083984375, 12.0140380859375, 12.4169921875, 12.8199462890625, 13.222900390625, 13.6258544921875, 14.02880859375, 14.4317626953125, 14.834716796875, 15.2376708984375, 15.640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 5.0, 9.0, 11.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 31.0, 41.0, 41.0, 42.0, 43.0, 35.0, 48.0, 61.0, 59.0, 52.0, 46.0, 35.0, 44.0, 39.0, 36.0, 34.0, 36.0, 22.0, 13.0, 22.0, 16.0, 17.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3505859375, -1.3067779541015625, -1.262969970703125, -1.2191619873046875, -1.17535400390625, -1.1315460205078125, -1.087738037109375, -1.0439300537109375, -1.0001220703125, -0.9563140869140625, -0.912506103515625, -0.8686981201171875, -0.82489013671875, -0.7810821533203125, -0.737274169921875, -0.6934661865234375, -0.649658203125, -0.6058502197265625, -0.562042236328125, -0.5182342529296875, -0.47442626953125, -0.4306182861328125, -0.386810302734375, -0.3430023193359375, -0.2991943359375, -0.2553863525390625, -0.211578369140625, -0.1677703857421875, -0.12396240234375, -0.0801544189453125, -0.036346435546875, 0.0074615478515625, 0.05126953125, 0.0950775146484375, 0.138885498046875, 0.1826934814453125, 0.22650146484375, 0.2703094482421875, 0.314117431640625, 0.3579254150390625, 0.4017333984375, 0.4455413818359375, 0.489349365234375, 0.5331573486328125, 0.57696533203125, 0.6207733154296875, 0.664581298828125, 0.7083892822265625, 0.752197265625, 0.7960052490234375, 0.839813232421875, 0.8836212158203125, 0.92742919921875, 0.9712371826171875, 1.015045166015625, 1.0588531494140625, 1.1026611328125, 1.1464691162109375, 1.190277099609375, 1.2340850830078125, 1.27789306640625, 1.3217010498046875, 1.365509033203125, 1.4093170166015625, 1.453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 9.0, 8.0, 12.0, 12.0, 25.0, 34.0, 49.0, 65.0, 90.0, 133.0, 188.0, 284.0, 444.0, 737.0, 1215.0, 2190.0, 4384.0, 9058.0, 20804.0, 56349.0, 205633.0, 3089075.0, 633878.0, 107111.0, 34773.0, 13884.0, 6298.0, 3162.0, 1665.0, 962.0, 578.0, 367.0, 257.0, 147.0, 113.0, 78.0, 62.0, 38.0, 32.0, 19.0, 12.0, 10.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.24609375, -6.04949951171875, -5.8529052734375, -5.65631103515625, -5.459716796875, -5.26312255859375, -5.0665283203125, -4.86993408203125, -4.67333984375, -4.47674560546875, -4.2801513671875, -4.08355712890625, -3.886962890625, -3.69036865234375, -3.4937744140625, -3.29718017578125, -3.1005859375, -2.90399169921875, -2.7073974609375, -2.51080322265625, -2.314208984375, -2.11761474609375, -1.9210205078125, -1.72442626953125, -1.52783203125, -1.33123779296875, -1.1346435546875, -0.93804931640625, -0.741455078125, -0.54486083984375, -0.3482666015625, -0.15167236328125, 0.044921875, 0.24151611328125, 0.4381103515625, 0.63470458984375, 0.831298828125, 1.02789306640625, 1.2244873046875, 1.42108154296875, 1.61767578125, 1.81427001953125, 2.0108642578125, 2.20745849609375, 2.404052734375, 2.60064697265625, 2.7972412109375, 2.99383544921875, 3.1904296875, 3.38702392578125, 3.5836181640625, 3.78021240234375, 3.976806640625, 4.17340087890625, 4.3699951171875, 4.56658935546875, 4.76318359375, 4.95977783203125, 5.1563720703125, 5.35296630859375, 5.549560546875, 5.74615478515625, 5.9427490234375, 6.13934326171875, 6.3359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 14.0, 17.0, 29.0, 41.0, 58.0, 92.0, 140.0, 245.0, 736.0, 1684.0, 401.0, 189.0, 109.0, 63.0, 45.0, 42.0, 28.0, 19.0, 20.0, 12.0, 8.0, 7.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.16015625, -3.04815673828125, -2.9361572265625, -2.82415771484375, -2.712158203125, -2.60015869140625, -2.4881591796875, -2.37615966796875, -2.26416015625, -2.15216064453125, -2.0401611328125, -1.92816162109375, -1.816162109375, -1.70416259765625, -1.5921630859375, -1.48016357421875, -1.3681640625, -1.25616455078125, -1.1441650390625, -1.03216552734375, -0.920166015625, -0.80816650390625, -0.6961669921875, -0.58416748046875, -0.47216796875, -0.36016845703125, -0.2481689453125, -0.13616943359375, -0.024169921875, 0.08782958984375, 0.1998291015625, 0.31182861328125, 0.423828125, 0.53582763671875, 0.6478271484375, 0.75982666015625, 0.871826171875, 0.98382568359375, 1.0958251953125, 1.20782470703125, 1.31982421875, 1.43182373046875, 1.5438232421875, 1.65582275390625, 1.767822265625, 1.87982177734375, 1.9918212890625, 2.10382080078125, 2.2158203125, 2.32781982421875, 2.4398193359375, 2.55181884765625, 2.663818359375, 2.77581787109375, 2.8878173828125, 2.99981689453125, 3.11181640625, 3.22381591796875, 3.3358154296875, 3.44781494140625, 3.559814453125, 3.67181396484375, 3.7838134765625, 3.89581298828125, 4.0078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 11.0, 14.0, 27.0, 39.0, 46.0, 78.0, 105.0, 106.0, 130.0, 121.0, 77.0, 70.0, 62.0, 39.0, 28.0, 15.0, 7.0, 10.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.542293548583984, -11.814962387084961, -11.087631225585938, -10.360299110412598, -9.632967948913574, -8.90563678741455, -8.178304672241211, -7.4509735107421875, -6.723642349243164, -5.996311187744141, -5.268979549407959, -4.541647911071777, -3.814316749572754, -3.0869853496551514, -2.359653949737549, -1.6323223114013672, -0.9049911499023438, -0.1776597499847412, 0.5496716499328613, 1.2770030498504639, 2.0043344497680664, 2.731665849685669, 3.4589972496032715, 4.186328887939453, 4.913660049438477, 5.6409912109375, 6.368322849273682, 7.095654487609863, 7.822985649108887, 8.55031681060791, 9.27764892578125, 10.004980087280273, 10.732311248779297, 11.45964241027832, 12.186973571777344, 12.914305686950684, 13.641636848449707, 14.36896800994873, 15.09630012512207, 15.823631286621094, 16.550962448120117, 17.27829360961914, 18.005624771118164, 18.732955932617188, 19.460289001464844, 20.187620162963867, 20.91495132446289, 21.642282485961914, 22.369613647460938, 23.09694480895996, 23.824275970458984, 24.551607131958008, 25.27893829345703, 26.006271362304688, 26.73360252380371, 27.460933685302734, 28.188264846801758, 28.91559600830078, 29.642927169799805, 30.370258331298828, 31.097591400146484, 31.824922561645508, 32.55225372314453, 33.27958679199219, 34.00691604614258]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 14.0, 15.0, 18.0, 19.0, 23.0, 23.0, 36.0, 26.0, 27.0, 31.0, 31.0, 35.0, 42.0, 43.0, 48.0, 43.0, 44.0, 34.0, 40.0, 32.0, 46.0, 31.0, 29.0, 33.0, 27.0, 28.0, 18.0, 15.0, 17.0, 19.0, 16.0, 9.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.027045249938965, -10.672649383544922, -10.318252563476562, -9.96385669708252, -9.609460830688477, -9.255064010620117, -8.900668144226074, -8.546272277832031, -8.191875457763672, -7.837479114532471, -7.4830827713012695, -7.128686904907227, -6.774290561676025, -6.419894218444824, -6.065498352050781, -5.71110200881958, -5.356705665588379, -5.002309322357178, -4.647912979125977, -4.293517112731934, -3.9391207695007324, -3.5847244262695312, -3.230328321456909, -2.875932216644287, -2.521535873413086, -2.1671395301818848, -1.8127434253692627, -1.458347201347351, -1.1039509773254395, -0.7495547533035278, -0.3951585292816162, -0.04076242446899414, 0.31363487243652344, 0.6680310964584351, 1.0224273204803467, 1.3768235445022583, 1.73121976852417, 2.085616111755371, 2.440012216567993, 2.7944083213806152, 3.1488046646118164, 3.5032010078430176, 3.8575971126556396, 4.211993217468262, 4.566389560699463, 4.920785903930664, 5.275181770324707, 5.629578113555908, 5.983974456787109, 6.3383708000183105, 6.692767143249512, 7.047163009643555, 7.401559352874756, 7.755955696105957, 8.1103515625, 8.46474838256836, 8.819144248962402, 9.173540115356445, 9.527936935424805, 9.882332801818848, 10.23672866821289, 10.59112548828125, 10.945521354675293, 11.299917221069336, 11.654314041137695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 19.0, 23.0, 26.0, 68.0, 96.0, 168.0, 289.0, 615.0, 1291.0, 3147.0, 8648.0, 28011.0, 102977.0, 384054.0, 377173.0, 100549.0, 27158.0, 8557.0, 3101.0, 1288.0, 570.0, 291.0, 188.0, 94.0, 59.0, 26.0, 18.0, 10.0, 7.0, 7.0, 3.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.63739013671875, -6.4232177734375, -6.20904541015625, -5.994873046875, -5.78070068359375, -5.5665283203125, -5.35235595703125, -5.13818359375, -4.92401123046875, -4.7098388671875, -4.49566650390625, -4.281494140625, -4.06732177734375, -3.8531494140625, -3.63897705078125, -3.4248046875, -3.21063232421875, -2.9964599609375, -2.78228759765625, -2.568115234375, -2.35394287109375, -2.1397705078125, -1.92559814453125, -1.71142578125, -1.49725341796875, -1.2830810546875, -1.06890869140625, -0.854736328125, -0.64056396484375, -0.4263916015625, -0.21221923828125, 0.001953125, 0.21612548828125, 0.4302978515625, 0.64447021484375, 0.858642578125, 1.07281494140625, 1.2869873046875, 1.50115966796875, 1.71533203125, 1.92950439453125, 2.1436767578125, 2.35784912109375, 2.572021484375, 2.78619384765625, 3.0003662109375, 3.21453857421875, 3.4287109375, 3.64288330078125, 3.8570556640625, 4.07122802734375, 4.285400390625, 4.49957275390625, 4.7137451171875, 4.92791748046875, 5.14208984375, 5.35626220703125, 5.5704345703125, 5.78460693359375, 5.998779296875, 6.21295166015625, 6.4271240234375, 6.64129638671875, 6.85546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 8.0, 15.0, 17.0, 22.0, 19.0, 25.0, 28.0, 34.0, 39.0, 53.0, 43.0, 46.0, 54.0, 42.0, 49.0, 61.0, 59.0, 50.0, 38.0, 56.0, 38.0, 41.0, 27.0, 29.0, 23.0, 20.0, 18.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.638671875, -1.5885772705078125, -1.538482666015625, -1.4883880615234375, -1.43829345703125, -1.3881988525390625, -1.338104248046875, -1.2880096435546875, -1.2379150390625, -1.1878204345703125, -1.137725830078125, -1.0876312255859375, -1.03753662109375, -0.9874420166015625, -0.937347412109375, -0.8872528076171875, -0.837158203125, -0.7870635986328125, -0.736968994140625, -0.6868743896484375, -0.63677978515625, -0.5866851806640625, -0.536590576171875, -0.4864959716796875, -0.4364013671875, -0.3863067626953125, -0.336212158203125, -0.2861175537109375, -0.23602294921875, -0.1859283447265625, -0.135833740234375, -0.0857391357421875, -0.03564453125, 0.0144500732421875, 0.064544677734375, 0.1146392822265625, 0.16473388671875, 0.2148284912109375, 0.264923095703125, 0.3150177001953125, 0.3651123046875, 0.4152069091796875, 0.465301513671875, 0.5153961181640625, 0.56549072265625, 0.6155853271484375, 0.665679931640625, 0.7157745361328125, 0.765869140625, 0.8159637451171875, 0.866058349609375, 0.9161529541015625, 0.96624755859375, 1.0163421630859375, 1.066436767578125, 1.1165313720703125, 1.1666259765625, 1.2167205810546875, 1.266815185546875, 1.3169097900390625, 1.36700439453125, 1.4170989990234375, 1.467193603515625, 1.5172882080078125, 1.5673828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 7.0, 6.0, 10.0, 12.0, 13.0, 24.0, 37.0, 31.0, 80.0, 130.0, 221.0, 356.0, 660.0, 1360.0, 3668.0, 14321.0, 107283.0, 718131.0, 173607.0, 20488.0, 4614.0, 1656.0, 812.0, 417.0, 223.0, 140.0, 73.0, 61.0, 35.0, 21.0, 16.0, 9.0, 20.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -11.03271484375, -10.7138671875, -10.39501953125, -10.076171875, -9.75732421875, -9.4384765625, -9.11962890625, -8.80078125, -8.48193359375, -8.1630859375, -7.84423828125, -7.525390625, -7.20654296875, -6.8876953125, -6.56884765625, -6.25, -5.93115234375, -5.6123046875, -5.29345703125, -4.974609375, -4.65576171875, -4.3369140625, -4.01806640625, -3.69921875, -3.38037109375, -3.0615234375, -2.74267578125, -2.423828125, -2.10498046875, -1.7861328125, -1.46728515625, -1.1484375, -0.82958984375, -0.5107421875, -0.19189453125, 0.126953125, 0.44580078125, 0.7646484375, 1.08349609375, 1.40234375, 1.72119140625, 2.0400390625, 2.35888671875, 2.677734375, 2.99658203125, 3.3154296875, 3.63427734375, 3.953125, 4.27197265625, 4.5908203125, 4.90966796875, 5.228515625, 5.54736328125, 5.8662109375, 6.18505859375, 6.50390625, 6.82275390625, 7.1416015625, 7.46044921875, 7.779296875, 8.09814453125, 8.4169921875, 8.73583984375, 9.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 9.0, 19.0, 24.0, 16.0, 24.0, 24.0, 24.0, 32.0, 36.0, 36.0, 38.0, 32.0, 46.0, 47.0, 50.0, 44.0, 44.0, 37.0, 46.0, 45.0, 56.0, 31.0, 31.0, 26.0, 22.0, 26.0, 19.0, 23.0, 14.0, 9.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.23046875, -7.008544921875, -6.78662109375, -6.564697265625, -6.3427734375, -6.120849609375, -5.89892578125, -5.677001953125, -5.455078125, -5.233154296875, -5.01123046875, -4.789306640625, -4.5673828125, -4.345458984375, -4.12353515625, -3.901611328125, -3.6796875, -3.457763671875, -3.23583984375, -3.013916015625, -2.7919921875, -2.570068359375, -2.34814453125, -2.126220703125, -1.904296875, -1.682373046875, -1.46044921875, -1.238525390625, -1.0166015625, -0.794677734375, -0.57275390625, -0.350830078125, -0.12890625, 0.093017578125, 0.31494140625, 0.536865234375, 0.7587890625, 0.980712890625, 1.20263671875, 1.424560546875, 1.646484375, 1.868408203125, 2.09033203125, 2.312255859375, 2.5341796875, 2.756103515625, 2.97802734375, 3.199951171875, 3.421875, 3.643798828125, 3.86572265625, 4.087646484375, 4.3095703125, 4.531494140625, 4.75341796875, 4.975341796875, 5.197265625, 5.419189453125, 5.64111328125, 5.863037109375, 6.0849609375, 6.306884765625, 6.52880859375, 6.750732421875, 6.97265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 11.0, 12.0, 30.0, 36.0, 79.0, 103.0, 242.0, 494.0, 1150.0, 3110.0, 10778.0, 56634.0, 394649.0, 488475.0, 73377.0, 13415.0, 3506.0, 1271.0, 539.0, 281.0, 134.0, 81.0, 53.0, 22.0, 24.0, 11.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.899169921875, -4.75537109375, -4.611572265625, -4.4677734375, -4.323974609375, -4.18017578125, -4.036376953125, -3.892578125, -3.748779296875, -3.60498046875, -3.461181640625, -3.3173828125, -3.173583984375, -3.02978515625, -2.885986328125, -2.7421875, -2.598388671875, -2.45458984375, -2.310791015625, -2.1669921875, -2.023193359375, -1.87939453125, -1.735595703125, -1.591796875, -1.447998046875, -1.30419921875, -1.160400390625, -1.0166015625, -0.872802734375, -0.72900390625, -0.585205078125, -0.44140625, -0.297607421875, -0.15380859375, -0.010009765625, 0.1337890625, 0.277587890625, 0.42138671875, 0.565185546875, 0.708984375, 0.852783203125, 0.99658203125, 1.140380859375, 1.2841796875, 1.427978515625, 1.57177734375, 1.715576171875, 1.859375, 2.003173828125, 2.14697265625, 2.290771484375, 2.4345703125, 2.578369140625, 2.72216796875, 2.865966796875, 3.009765625, 3.153564453125, 3.29736328125, 3.441162109375, 3.5849609375, 3.728759765625, 3.87255859375, 4.016357421875, 4.16015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 18.0, 12.0, 24.0, 28.0, 30.0, 47.0, 61.0, 70.0, 76.0, 101.0, 100.0, 78.0, 64.0, 60.0, 38.0, 28.0, 28.0, 23.0, 21.0, 11.0, 12.0, 6.0, 3.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006122589111328125, -0.0005916431546211243, -0.000571027398109436, -0.0005504116415977478, -0.0005297958850860596, -0.0005091801285743713, -0.0004885643720626831, -0.0004679486155509949, -0.00044733285903930664, -0.0004267171025276184, -0.0004061013460159302, -0.00038548558950424194, -0.0003648698329925537, -0.0003442540764808655, -0.00032363831996917725, -0.000303022563457489, -0.0002824068069458008, -0.00026179105043411255, -0.00024117529392242432, -0.00022055953741073608, -0.00019994378089904785, -0.00017932802438735962, -0.0001587122678756714, -0.00013809651136398315, -0.00011748075485229492, -9.686499834060669e-05, -7.624924182891846e-05, -5.5633485317230225e-05, -3.501772880554199e-05, -1.440197229385376e-05, 6.213784217834473e-06, 2.6829540729522705e-05, 4.744529724121094e-05, 6.806105375289917e-05, 8.86768102645874e-05, 0.00010929256677627563, 0.00012990832328796387, 0.0001505240797996521, 0.00017113983631134033, 0.00019175559282302856, 0.0002123713493347168, 0.00023298710584640503, 0.00025360286235809326, 0.0002742186188697815, 0.0002948343753814697, 0.00031545013189315796, 0.0003360658884048462, 0.0003566816449165344, 0.00037729740142822266, 0.0003979131579399109, 0.0004185289144515991, 0.00043914467096328735, 0.0004597604274749756, 0.0004803761839866638, 0.000500991940498352, 0.0005216076970100403, 0.0005422234535217285, 0.0005628392100334167, 0.000583454966545105, 0.0006040707230567932, 0.0006246864795684814, 0.0006453022360801697, 0.0006659179925918579, 0.0006865337491035461, 0.0007071495056152344]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 16.0, 41.0, 63.0, 187.0, 493.0, 1576.0, 8214.0, 109368.0, 841762.0, 77975.0, 6720.0, 1378.0, 414.0, 178.0, 77.0, 39.0, 15.0, 9.0, 7.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5152587890625, -7.241455078125, -6.9676513671875, -6.69384765625, -6.4200439453125, -6.146240234375, -5.8724365234375, -5.5986328125, -5.3248291015625, -5.051025390625, -4.7772216796875, -4.50341796875, -4.2296142578125, -3.955810546875, -3.6820068359375, -3.408203125, -3.1343994140625, -2.860595703125, -2.5867919921875, -2.31298828125, -2.0391845703125, -1.765380859375, -1.4915771484375, -1.2177734375, -0.9439697265625, -0.670166015625, -0.3963623046875, -0.12255859375, 0.1512451171875, 0.425048828125, 0.6988525390625, 0.97265625, 1.2464599609375, 1.520263671875, 1.7940673828125, 2.06787109375, 2.3416748046875, 2.615478515625, 2.8892822265625, 3.1630859375, 3.4368896484375, 3.710693359375, 3.9844970703125, 4.25830078125, 4.5321044921875, 4.805908203125, 5.0797119140625, 5.353515625, 5.6273193359375, 5.901123046875, 6.1749267578125, 6.44873046875, 6.7225341796875, 6.996337890625, 7.2701416015625, 7.5439453125, 7.8177490234375, 8.091552734375, 8.3653564453125, 8.63916015625, 8.9129638671875, 9.186767578125, 9.4605712890625, 9.734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 8.0, 15.0, 14.0, 16.0, 25.0, 39.0, 38.0, 64.0, 66.0, 65.0, 85.0, 84.0, 45.0, 70.0, 69.0, 66.0, 31.0, 33.0, 34.0, 24.0, 20.0, 11.0, 10.0, 9.0, 2.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.931640625, -2.841827392578125, -2.75201416015625, -2.662200927734375, -2.5723876953125, -2.482574462890625, -2.39276123046875, -2.302947998046875, -2.213134765625, -2.123321533203125, -2.03350830078125, -1.943695068359375, -1.8538818359375, -1.764068603515625, -1.67425537109375, -1.584442138671875, -1.49462890625, -1.404815673828125, -1.31500244140625, -1.225189208984375, -1.1353759765625, -1.045562744140625, -0.95574951171875, -0.865936279296875, -0.776123046875, -0.686309814453125, -0.59649658203125, -0.506683349609375, -0.4168701171875, -0.327056884765625, -0.23724365234375, -0.147430419921875, -0.0576171875, 0.032196044921875, 0.12200927734375, 0.211822509765625, 0.3016357421875, 0.391448974609375, 0.48126220703125, 0.571075439453125, 0.660888671875, 0.750701904296875, 0.84051513671875, 0.930328369140625, 1.0201416015625, 1.109954833984375, 1.19976806640625, 1.289581298828125, 1.37939453125, 1.469207763671875, 1.55902099609375, 1.648834228515625, 1.7386474609375, 1.828460693359375, 1.91827392578125, 2.008087158203125, 2.097900390625, 2.187713623046875, 2.27752685546875, 2.367340087890625, 2.4571533203125, 2.546966552734375, 2.63677978515625, 2.726593017578125, 2.81640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 13.0, 12.0, 22.0, 33.0, 29.0, 49.0, 68.0, 99.0, 93.0, 132.0, 94.0, 89.0, 81.0, 54.0, 42.0, 31.0, 23.0, 5.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.91415786743164, -41.5188102722168, -40.12346267700195, -38.72811508178711, -37.33277130126953, -35.93742370605469, -34.542076110839844, -33.146728515625, -31.751380920410156, -30.356033325195312, -28.96068572998047, -27.565340042114258, -26.169992446899414, -24.77464485168457, -23.37929916381836, -21.983951568603516, -20.588603973388672, -19.193256378173828, -17.797908782958984, -16.402563095092773, -15.00721549987793, -13.611867904663086, -12.216521263122559, -10.821174621582031, -9.425827026367188, -8.030479431152344, -6.635132789611816, -5.239785671234131, -3.8444385528564453, -2.4490914344787598, -1.0537443161010742, 0.3416023254394531, 1.7369461059570312, 3.132293224334717, 4.527640342712402, 5.922987461090088, 7.318334579467773, 8.713682174682617, 10.109028816223145, 11.504375457763672, 12.899723052978516, 14.29507064819336, 15.690417289733887, 17.085763931274414, 18.481111526489258, 19.8764591217041, 21.271804809570312, 22.667152404785156, 24.0625, 25.457847595214844, 26.853195190429688, 28.2485408782959, 29.643888473510742, 31.039236068725586, 32.4345817565918, 33.82992935180664, 35.225276947021484, 36.62062454223633, 38.01597213745117, 39.411319732666016, 40.806663513183594, 42.20201110839844, 43.59735870361328, 44.992706298828125, 46.38805389404297]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 9.0, 13.0, 8.0, 12.0, 26.0, 26.0, 23.0, 41.0, 38.0, 36.0, 44.0, 40.0, 44.0, 49.0, 42.0, 48.0, 48.0, 50.0, 41.0, 44.0, 29.0, 33.0, 27.0, 35.0, 25.0, 18.0, 27.0, 18.0, 12.0, 10.0, 10.0, 9.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.061729431152344, -31.95173454284668, -30.841739654541016, -29.731746673583984, -28.62175178527832, -27.511756896972656, -26.401763916015625, -25.29176902770996, -24.181774139404297, -23.071779251098633, -21.96178436279297, -20.851791381835938, -19.741796493530273, -18.63180160522461, -17.521808624267578, -16.411813735961914, -15.30181884765625, -14.191823959350586, -13.081830024719238, -11.97183609008789, -10.861841201782227, -9.751846313476562, -8.641852378845215, -7.531857967376709, -6.421863555908203, -5.311869144439697, -4.201874732971191, -3.0918803215026855, -1.9818859100341797, -0.8718914985656738, 0.23810291290283203, 1.348097324371338, 2.4580917358398438, 3.5680861473083496, 4.6780805587768555, 5.788074970245361, 6.898069381713867, 8.008064270019531, 9.118058204650879, 10.228052139282227, 11.33804702758789, 12.448041915893555, 13.558035850524902, 14.66802978515625, 15.778024673461914, 16.888019561767578, 17.99801254272461, 19.108007431030273, 20.218002319335938, 21.3279972076416, 22.437992095947266, 23.547985076904297, 24.65797996520996, 25.767974853515625, 26.877967834472656, 27.98796272277832, 29.097957611083984, 30.20795249938965, 31.317947387695312, 32.427940368652344, 33.537933349609375, 34.64793014526367, 35.7579231262207, 36.867919921875, 37.97791290283203]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 17.0, 5.0, 6.0, 14.0, 25.0, 23.0, 43.0, 68.0, 106.0, 149.0, 233.0, 380.0, 654.0, 1084.0, 1793.0, 3522.0, 7646.0, 24925.0, 3926244.0, 196586.0, 17639.0, 6108.0, 2900.0, 1585.0, 948.0, 555.0, 344.0, 229.0, 140.0, 92.0, 64.0, 50.0, 33.0, 25.0, 15.0, 11.0, 7.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.390625, -11.081787109375, -10.77294921875, -10.464111328125, -10.1552734375, -9.846435546875, -9.53759765625, -9.228759765625, -8.919921875, -8.611083984375, -8.30224609375, -7.993408203125, -7.6845703125, -7.375732421875, -7.06689453125, -6.758056640625, -6.44921875, -6.140380859375, -5.83154296875, -5.522705078125, -5.2138671875, -4.905029296875, -4.59619140625, -4.287353515625, -3.978515625, -3.669677734375, -3.36083984375, -3.052001953125, -2.7431640625, -2.434326171875, -2.12548828125, -1.816650390625, -1.5078125, -1.198974609375, -0.89013671875, -0.581298828125, -0.2724609375, 0.036376953125, 0.34521484375, 0.654052734375, 0.962890625, 1.271728515625, 1.58056640625, 1.889404296875, 2.1982421875, 2.507080078125, 2.81591796875, 3.124755859375, 3.43359375, 3.742431640625, 4.05126953125, 4.360107421875, 4.6689453125, 4.977783203125, 5.28662109375, 5.595458984375, 5.904296875, 6.213134765625, 6.52197265625, 6.830810546875, 7.1396484375, 7.448486328125, 7.75732421875, 8.066162109375, 8.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 7.0, 7.0, 9.0, 23.0, 24.0, 24.0, 30.0, 34.0, 52.0, 43.0, 48.0, 48.0, 63.0, 69.0, 71.0, 61.0, 72.0, 59.0, 37.0, 49.0, 34.0, 32.0, 20.0, 12.0, 16.0, 12.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.8614044189453125, -1.800933837890625, -1.7404632568359375, -1.67999267578125, -1.6195220947265625, -1.559051513671875, -1.4985809326171875, -1.4381103515625, -1.3776397705078125, -1.317169189453125, -1.2566986083984375, -1.19622802734375, -1.1357574462890625, -1.075286865234375, -1.0148162841796875, -0.954345703125, -0.8938751220703125, -0.833404541015625, -0.7729339599609375, -0.71246337890625, -0.6519927978515625, -0.591522216796875, -0.5310516357421875, -0.4705810546875, -0.4101104736328125, -0.349639892578125, -0.2891693115234375, -0.22869873046875, -0.1682281494140625, -0.107757568359375, -0.0472869873046875, 0.01318359375, 0.0736541748046875, 0.134124755859375, 0.1945953369140625, 0.25506591796875, 0.3155364990234375, 0.376007080078125, 0.4364776611328125, 0.4969482421875, 0.5574188232421875, 0.617889404296875, 0.6783599853515625, 0.73883056640625, 0.7993011474609375, 0.859771728515625, 0.9202423095703125, 0.980712890625, 1.0411834716796875, 1.101654052734375, 1.1621246337890625, 1.22259521484375, 1.2830657958984375, 1.343536376953125, 1.4040069580078125, 1.4644775390625, 1.5249481201171875, 1.585418701171875, 1.6458892822265625, 1.70635986328125, 1.7668304443359375, 1.827301025390625, 1.8877716064453125, 1.9482421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 10.0, 19.0, 21.0, 36.0, 62.0, 75.0, 115.0, 179.0, 252.0, 374.0, 583.0, 945.0, 1899.0, 4773.0, 27763.0, 4080460.0, 64413.0, 6914.0, 2341.0, 1132.0, 637.0, 390.0, 269.0, 191.0, 126.0, 83.0, 66.0, 48.0, 20.0, 18.0, 9.0, 14.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.278564453125, -12.81494140625, -12.351318359375, -11.8876953125, -11.424072265625, -10.96044921875, -10.496826171875, -10.033203125, -9.569580078125, -9.10595703125, -8.642333984375, -8.1787109375, -7.715087890625, -7.25146484375, -6.787841796875, -6.32421875, -5.860595703125, -5.39697265625, -4.933349609375, -4.4697265625, -4.006103515625, -3.54248046875, -3.078857421875, -2.615234375, -2.151611328125, -1.68798828125, -1.224365234375, -0.7607421875, -0.297119140625, 0.16650390625, 0.630126953125, 1.09375, 1.557373046875, 2.02099609375, 2.484619140625, 2.9482421875, 3.411865234375, 3.87548828125, 4.339111328125, 4.802734375, 5.266357421875, 5.72998046875, 6.193603515625, 6.6572265625, 7.120849609375, 7.58447265625, 8.048095703125, 8.51171875, 8.975341796875, 9.43896484375, 9.902587890625, 10.3662109375, 10.829833984375, 11.29345703125, 11.757080078125, 12.220703125, 12.684326171875, 13.14794921875, 13.611572265625, 14.0751953125, 14.538818359375, 15.00244140625, 15.466064453125, 15.9296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 17.0, 20.0, 47.0, 156.0, 3519.0, 210.0, 47.0, 25.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.133392333984375, -2.04998779296875, -1.966583251953125, -1.8831787109375, -1.799774169921875, -1.71636962890625, -1.632965087890625, -1.549560546875, -1.466156005859375, -1.38275146484375, -1.299346923828125, -1.2159423828125, -1.132537841796875, -1.04913330078125, -0.965728759765625, -0.88232421875, -0.798919677734375, -0.71551513671875, -0.632110595703125, -0.5487060546875, -0.465301513671875, -0.38189697265625, -0.298492431640625, -0.215087890625, -0.131683349609375, -0.04827880859375, 0.035125732421875, 0.1185302734375, 0.201934814453125, 0.28533935546875, 0.368743896484375, 0.4521484375, 0.535552978515625, 0.61895751953125, 0.702362060546875, 0.7857666015625, 0.869171142578125, 0.95257568359375, 1.035980224609375, 1.119384765625, 1.202789306640625, 1.28619384765625, 1.369598388671875, 1.4530029296875, 1.536407470703125, 1.61981201171875, 1.703216552734375, 1.78662109375, 1.870025634765625, 1.95343017578125, 2.036834716796875, 2.1202392578125, 2.203643798828125, 2.28704833984375, 2.370452880859375, 2.453857421875, 2.537261962890625, 2.62066650390625, 2.704071044921875, 2.7874755859375, 2.870880126953125, 2.95428466796875, 3.037689208984375, 3.12109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 11.0, 10.0, 25.0, 26.0, 35.0, 41.0, 68.0, 84.0, 105.0, 115.0, 88.0, 99.0, 75.0, 70.0, 50.0, 28.0, 17.0, 22.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.274593353271484, -8.061896324157715, -7.849198341369629, -7.636501312255859, -7.423803806304932, -7.211106300354004, -6.998409271240234, -6.785711765289307, -6.573014259338379, -6.360316753387451, -6.147619247436523, -5.934922218322754, -5.722224712371826, -5.509527206420898, -5.296830177307129, -5.084132671356201, -4.871435165405273, -4.658737659454346, -4.446040153503418, -4.233343124389648, -4.020645618438721, -3.807948112487793, -3.5952508449554443, -3.3825535774230957, -3.169856071472168, -2.9571585655212402, -2.7444612979888916, -2.531764030456543, -2.3190665245056152, -2.1063690185546875, -1.8936717510223389, -1.6809743642807007, -1.4682765007019043, -1.2555791139602661, -1.042881727218628, -0.8301843404769897, -0.6174869537353516, -0.4047895669937134, -0.1920921802520752, 0.02060520648956299, 0.23330259323120117, 0.44599997997283936, 0.6586973667144775, 0.8713947534561157, 1.084092140197754, 1.296789526939392, 1.5094869136810303, 1.7221843004226685, 1.9348816871643066, 2.1475791931152344, 2.360276460647583, 2.5729737281799316, 2.7856712341308594, 2.998368740081787, 3.2110660076141357, 3.4237632751464844, 3.636460781097412, 3.84915828704834, 4.061855316162109, 4.274552822113037, 4.487250328063965, 4.699947834014893, 4.91264533996582, 5.12534236907959, 5.338039875030518]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 16.0, 10.0, 11.0, 20.0, 22.0, 28.0, 29.0, 22.0, 25.0, 33.0, 38.0, 27.0, 45.0, 41.0, 47.0, 41.0, 48.0, 37.0, 38.0, 44.0, 45.0, 26.0, 34.0, 41.0, 23.0, 32.0, 20.0, 27.0, 17.0, 14.0, 13.0, 17.0, 9.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.4689292907714844, -3.3560986518859863, -3.2432680130004883, -3.130437135696411, -3.017606496810913, -2.904775857925415, -2.791944980621338, -2.67911434173584, -2.566283702850342, -2.4534530639648438, -2.3406224250793457, -2.2277915477752686, -2.1149609088897705, -2.0021302700042725, -1.8892995119094849, -1.7764687538146973, -1.6636381149291992, -1.5508074760437012, -1.4379767179489136, -1.325145959854126, -1.212315320968628, -1.0994846820831299, -0.9866539239883423, -0.8738232254981995, -0.7609925270080566, -0.6481618285179138, -0.535331130027771, -0.4225004315376282, -0.30966973304748535, -0.19683903455734253, -0.08400833606719971, 0.028822362422943115, 0.14165306091308594, 0.25448375940322876, 0.3673144578933716, 0.4801451563835144, 0.5929758548736572, 0.7058065533638, 0.8186372518539429, 0.9314679503440857, 1.0442986488342285, 1.1571292877197266, 1.2699600458145142, 1.3827908039093018, 1.4956214427947998, 1.6084520816802979, 1.7212828397750854, 1.834113597869873, 1.946944236755371, 2.059774875640869, 2.172605514526367, 2.2854363918304443, 2.3982670307159424, 2.5110976696014404, 2.6239285469055176, 2.7367591857910156, 2.8495898246765137, 2.9624204635620117, 3.0752511024475098, 3.188081979751587, 3.300912618637085, 3.413743257522583, 3.52657413482666, 3.639404773712158, 3.7522354125976562]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 11.0, 9.0, 10.0, 24.0, 42.0, 67.0, 120.0, 211.0, 421.0, 797.0, 1930.0, 4705.0, 13189.0, 39208.0, 128568.0, 376640.0, 327687.0, 104684.0, 32302.0, 10640.0, 4085.0, 1642.0, 757.0, 362.0, 185.0, 100.0, 48.0, 35.0, 22.0, 14.0, 15.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.80859375, -6.6241455078125, -6.439697265625, -6.2552490234375, -6.07080078125, -5.8863525390625, -5.701904296875, -5.5174560546875, -5.3330078125, -5.1485595703125, -4.964111328125, -4.7796630859375, -4.59521484375, -4.4107666015625, -4.226318359375, -4.0418701171875, -3.857421875, -3.6729736328125, -3.488525390625, -3.3040771484375, -3.11962890625, -2.9351806640625, -2.750732421875, -2.5662841796875, -2.3818359375, -2.1973876953125, -2.012939453125, -1.8284912109375, -1.64404296875, -1.4595947265625, -1.275146484375, -1.0906982421875, -0.90625, -0.7218017578125, -0.537353515625, -0.3529052734375, -0.16845703125, 0.0159912109375, 0.200439453125, 0.3848876953125, 0.5693359375, 0.7537841796875, 0.938232421875, 1.1226806640625, 1.30712890625, 1.4915771484375, 1.676025390625, 1.8604736328125, 2.044921875, 2.2293701171875, 2.413818359375, 2.5982666015625, 2.78271484375, 2.9671630859375, 3.151611328125, 3.3360595703125, 3.5205078125, 3.7049560546875, 3.889404296875, 4.0738525390625, 4.25830078125, 4.4427490234375, 4.627197265625, 4.8116455078125, 4.99609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 7.0, 9.0, 12.0, 18.0, 19.0, 19.0, 29.0, 22.0, 32.0, 29.0, 49.0, 50.0, 43.0, 48.0, 55.0, 67.0, 51.0, 54.0, 55.0, 56.0, 50.0, 49.0, 45.0, 27.0, 29.0, 10.0, 19.0, 8.0, 5.0, 11.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.892547607421875, -1.83099365234375, -1.769439697265625, -1.7078857421875, -1.646331787109375, -1.58477783203125, -1.523223876953125, -1.461669921875, -1.400115966796875, -1.33856201171875, -1.277008056640625, -1.2154541015625, -1.153900146484375, -1.09234619140625, -1.030792236328125, -0.96923828125, -0.907684326171875, -0.84613037109375, -0.784576416015625, -0.7230224609375, -0.661468505859375, -0.59991455078125, -0.538360595703125, -0.476806640625, -0.415252685546875, -0.35369873046875, -0.292144775390625, -0.2305908203125, -0.169036865234375, -0.10748291015625, -0.045928955078125, 0.015625, 0.077178955078125, 0.13873291015625, 0.200286865234375, 0.2618408203125, 0.323394775390625, 0.38494873046875, 0.446502685546875, 0.508056640625, 0.569610595703125, 0.63116455078125, 0.692718505859375, 0.7542724609375, 0.815826416015625, 0.87738037109375, 0.938934326171875, 1.00048828125, 1.062042236328125, 1.12359619140625, 1.185150146484375, 1.2467041015625, 1.308258056640625, 1.36981201171875, 1.431365966796875, 1.492919921875, 1.554473876953125, 1.61602783203125, 1.677581787109375, 1.7391357421875, 1.800689697265625, 1.86224365234375, 1.923797607421875, 1.9853515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 9.0, 13.0, 22.0, 36.0, 51.0, 73.0, 121.0, 171.0, 249.0, 422.0, 779.0, 1379.0, 3271.0, 10537.0, 47454.0, 328767.0, 548957.0, 81912.0, 15853.0, 4462.0, 1735.0, 914.0, 497.0, 291.0, 181.0, 126.0, 92.0, 48.0, 27.0, 23.0, 12.0, 13.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.62249755859375, -7.3778076171875, -7.13311767578125, -6.888427734375, -6.64373779296875, -6.3990478515625, -6.15435791015625, -5.90966796875, -5.66497802734375, -5.4202880859375, -5.17559814453125, -4.930908203125, -4.68621826171875, -4.4415283203125, -4.19683837890625, -3.9521484375, -3.70745849609375, -3.4627685546875, -3.21807861328125, -2.973388671875, -2.72869873046875, -2.4840087890625, -2.23931884765625, -1.99462890625, -1.74993896484375, -1.5052490234375, -1.26055908203125, -1.015869140625, -0.77117919921875, -0.5264892578125, -0.28179931640625, -0.037109375, 0.20758056640625, 0.4522705078125, 0.69696044921875, 0.941650390625, 1.18634033203125, 1.4310302734375, 1.67572021484375, 1.92041015625, 2.16510009765625, 2.4097900390625, 2.65447998046875, 2.899169921875, 3.14385986328125, 3.3885498046875, 3.63323974609375, 3.8779296875, 4.12261962890625, 4.3673095703125, 4.61199951171875, 4.856689453125, 5.10137939453125, 5.3460693359375, 5.59075927734375, 5.83544921875, 6.08013916015625, 6.3248291015625, 6.56951904296875, 6.814208984375, 7.05889892578125, 7.3035888671875, 7.54827880859375, 7.79296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 9.0, 13.0, 18.0, 20.0, 16.0, 32.0, 24.0, 26.0, 24.0, 22.0, 34.0, 29.0, 40.0, 37.0, 47.0, 48.0, 31.0, 52.0, 36.0, 41.0, 41.0, 33.0, 46.0, 33.0, 23.0, 28.0, 21.0, 32.0, 21.0, 17.0, 12.0, 9.0, 8.0, 16.0, 6.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.31640625, -7.08319091796875, -6.8499755859375, -6.61676025390625, -6.383544921875, -6.15032958984375, -5.9171142578125, -5.68389892578125, -5.45068359375, -5.21746826171875, -4.9842529296875, -4.75103759765625, -4.517822265625, -4.28460693359375, -4.0513916015625, -3.81817626953125, -3.5849609375, -3.35174560546875, -3.1185302734375, -2.88531494140625, -2.652099609375, -2.41888427734375, -2.1856689453125, -1.95245361328125, -1.71923828125, -1.48602294921875, -1.2528076171875, -1.01959228515625, -0.786376953125, -0.55316162109375, -0.3199462890625, -0.08673095703125, 0.146484375, 0.37969970703125, 0.6129150390625, 0.84613037109375, 1.079345703125, 1.31256103515625, 1.5457763671875, 1.77899169921875, 2.01220703125, 2.24542236328125, 2.4786376953125, 2.71185302734375, 2.945068359375, 3.17828369140625, 3.4114990234375, 3.64471435546875, 3.8779296875, 4.11114501953125, 4.3443603515625, 4.57757568359375, 4.810791015625, 5.04400634765625, 5.2772216796875, 5.51043701171875, 5.74365234375, 5.97686767578125, 6.2100830078125, 6.44329833984375, 6.676513671875, 6.90972900390625, 7.1429443359375, 7.37615966796875, 7.609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 13.0, 21.0, 29.0, 44.0, 74.0, 134.0, 273.0, 500.0, 1060.0, 2578.0, 7634.0, 28102.0, 147204.0, 604107.0, 205183.0, 36458.0, 9393.0, 3234.0, 1274.0, 559.0, 304.0, 151.0, 84.0, 46.0, 30.0, 15.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.677734375, -3.56488037109375, -3.4520263671875, -3.33917236328125, -3.226318359375, -3.11346435546875, -3.0006103515625, -2.88775634765625, -2.77490234375, -2.66204833984375, -2.5491943359375, -2.43634033203125, -2.323486328125, -2.21063232421875, -2.0977783203125, -1.98492431640625, -1.8720703125, -1.75921630859375, -1.6463623046875, -1.53350830078125, -1.420654296875, -1.30780029296875, -1.1949462890625, -1.08209228515625, -0.96923828125, -0.85638427734375, -0.7435302734375, -0.63067626953125, -0.517822265625, -0.40496826171875, -0.2921142578125, -0.17926025390625, -0.06640625, 0.04644775390625, 0.1593017578125, 0.27215576171875, 0.385009765625, 0.49786376953125, 0.6107177734375, 0.72357177734375, 0.83642578125, 0.94927978515625, 1.0621337890625, 1.17498779296875, 1.287841796875, 1.40069580078125, 1.5135498046875, 1.62640380859375, 1.7392578125, 1.85211181640625, 1.9649658203125, 2.07781982421875, 2.190673828125, 2.30352783203125, 2.4163818359375, 2.52923583984375, 2.64208984375, 2.75494384765625, 2.8677978515625, 2.98065185546875, 3.093505859375, 3.20635986328125, 3.3192138671875, 3.43206787109375, 3.544921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 8.0, 9.0, 9.0, 12.0, 22.0, 23.0, 32.0, 45.0, 60.0, 76.0, 110.0, 113.0, 102.0, 84.0, 72.0, 49.0, 43.0, 30.0, 26.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00079345703125, -0.0007698088884353638, -0.0007461607456207275, -0.0007225126028060913, -0.0006988644599914551, -0.0006752163171768188, -0.0006515681743621826, -0.0006279200315475464, -0.0006042718887329102, -0.0005806237459182739, -0.0005569756031036377, -0.0005333274602890015, -0.0005096793174743652, -0.000486031174659729, -0.0004623830318450928, -0.00043873488903045654, -0.0004150867462158203, -0.0003914386034011841, -0.00036779046058654785, -0.0003441423177719116, -0.0003204941749572754, -0.00029684603214263916, -0.00027319788932800293, -0.0002495497465133667, -0.00022590160369873047, -0.00020225346088409424, -0.000178605318069458, -0.00015495717525482178, -0.00013130903244018555, -0.00010766088962554932, -8.401274681091309e-05, -6.0364603996276855e-05, -3.6716461181640625e-05, -1.3068318367004395e-05, 1.0579824447631836e-05, 3.4227967262268066e-05, 5.78761100769043e-05, 8.152425289154053e-05, 0.00010517239570617676, 0.000128820538520813, 0.00015246868133544922, 0.00017611682415008545, 0.00019976496696472168, 0.0002234131097793579, 0.00024706125259399414, 0.00027070939540863037, 0.0002943575382232666, 0.00031800568103790283, 0.00034165382385253906, 0.0003653019666671753, 0.0003889501094818115, 0.00041259825229644775, 0.000436246395111084, 0.0004598945379257202, 0.00048354268074035645, 0.0005071908235549927, 0.0005308389663696289, 0.0005544871091842651, 0.0005781352519989014, 0.0006017833948135376, 0.0006254315376281738, 0.0006490796804428101, 0.0006727278232574463, 0.0006963759660720825, 0.0007200241088867188]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 21.0, 34.0, 53.0, 79.0, 139.0, 282.0, 557.0, 1410.0, 4586.0, 21904.0, 240558.0, 691339.0, 73082.0, 10099.0, 2618.0, 921.0, 390.0, 180.0, 113.0, 53.0, 41.0, 18.0, 22.0, 10.0, 7.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9921875, -5.8314208984375, -5.670654296875, -5.5098876953125, -5.34912109375, -5.1883544921875, -5.027587890625, -4.8668212890625, -4.7060546875, -4.5452880859375, -4.384521484375, -4.2237548828125, -4.06298828125, -3.9022216796875, -3.741455078125, -3.5806884765625, -3.419921875, -3.2591552734375, -3.098388671875, -2.9376220703125, -2.77685546875, -2.6160888671875, -2.455322265625, -2.2945556640625, -2.1337890625, -1.9730224609375, -1.812255859375, -1.6514892578125, -1.49072265625, -1.3299560546875, -1.169189453125, -1.0084228515625, -0.84765625, -0.6868896484375, -0.526123046875, -0.3653564453125, -0.20458984375, -0.0438232421875, 0.116943359375, 0.2777099609375, 0.4384765625, 0.5992431640625, 0.760009765625, 0.9207763671875, 1.08154296875, 1.2423095703125, 1.403076171875, 1.5638427734375, 1.724609375, 1.8853759765625, 2.046142578125, 2.2069091796875, 2.36767578125, 2.5284423828125, 2.689208984375, 2.8499755859375, 3.0107421875, 3.1715087890625, 3.332275390625, 3.4930419921875, 3.65380859375, 3.8145751953125, 3.975341796875, 4.1361083984375, 4.296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 10.0, 6.0, 6.0, 13.0, 15.0, 14.0, 26.0, 20.0, 46.0, 39.0, 56.0, 56.0, 73.0, 66.0, 61.0, 75.0, 65.0, 56.0, 57.0, 36.0, 37.0, 37.0, 32.0, 18.0, 16.0, 14.0, 10.0, 6.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98095703125, -1.9013671875, -1.82177734375, -1.7421875, -1.66259765625, -1.5830078125, -1.50341796875, -1.423828125, -1.34423828125, -1.2646484375, -1.18505859375, -1.10546875, -1.02587890625, -0.9462890625, -0.86669921875, -0.787109375, -0.70751953125, -0.6279296875, -0.54833984375, -0.46875, -0.38916015625, -0.3095703125, -0.22998046875, -0.150390625, -0.07080078125, 0.0087890625, 0.08837890625, 0.16796875, 0.24755859375, 0.3271484375, 0.40673828125, 0.486328125, 0.56591796875, 0.6455078125, 0.72509765625, 0.8046875, 0.88427734375, 0.9638671875, 1.04345703125, 1.123046875, 1.20263671875, 1.2822265625, 1.36181640625, 1.44140625, 1.52099609375, 1.6005859375, 1.68017578125, 1.759765625, 1.83935546875, 1.9189453125, 1.99853515625, 2.078125, 2.15771484375, 2.2373046875, 2.31689453125, 2.396484375, 2.47607421875, 2.5556640625, 2.63525390625, 2.71484375, 2.79443359375, 2.8740234375, 2.95361328125, 3.033203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 17.0, 25.0, 42.0, 78.0, 94.0, 124.0, 147.0, 120.0, 113.0, 71.0, 66.0, 31.0, 25.0, 9.0, 9.0, 6.0, 2.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.62795639038086, -59.896305084228516, -58.16465377807617, -56.43300247192383, -54.70135498046875, -52.969703674316406, -51.23805236816406, -49.50640106201172, -47.774749755859375, -46.04309844970703, -44.31144714355469, -42.579795837402344, -40.84814453125, -39.116493225097656, -37.38484573364258, -35.653194427490234, -33.92154312133789, -32.18989181518555, -30.458240509033203, -28.726591110229492, -26.99493980407715, -25.263288497924805, -23.531639099121094, -21.79998779296875, -20.068336486816406, -18.336685180664062, -16.60503387451172, -14.873384475708008, -13.141733169555664, -11.41008186340332, -9.678431510925293, -7.946781158447266, -6.2151336669921875, -4.483482837677002, -2.7518320083618164, -1.0201811790466309, 0.7114696502685547, 2.4431209564208984, 4.174771308898926, 5.906421661376953, 7.638072967529297, 9.36972427368164, 11.101374626159668, 12.833024978637695, 14.564676284790039, 16.296327590942383, 18.027976989746094, 19.759628295898438, 21.49127960205078, 23.222930908203125, 24.95458221435547, 26.68623161315918, 28.417882919311523, 30.149534225463867, 31.881183624267578, 33.61283493041992, 35.344486236572266, 37.07613754272461, 38.80778884887695, 40.5394401550293, 42.271087646484375, 44.00273895263672, 45.73439025878906, 47.466041564941406, 49.19769287109375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 9.0, 13.0, 27.0, 18.0, 27.0, 17.0, 41.0, 47.0, 33.0, 31.0, 42.0, 50.0, 56.0, 55.0, 59.0, 49.0, 62.0, 46.0, 31.0, 28.0, 30.0, 27.0, 29.0, 28.0, 17.0, 21.0, 17.0, 11.0, 7.0, 7.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.503570556640625, -43.09716033935547, -41.69075393676758, -40.28434371948242, -38.87793731689453, -37.471527099609375, -36.06511688232422, -34.65871047973633, -33.25230026245117, -31.84589195251465, -30.439483642578125, -29.03307342529297, -27.626665115356445, -26.220256805419922, -24.8138484954834, -23.407440185546875, -22.00103187561035, -20.594623565673828, -19.188215255737305, -17.78180694580078, -16.375396728515625, -14.968988418579102, -13.562580108642578, -12.156170845031738, -10.749762535095215, -9.343354225158691, -7.936944961547852, -6.530536651611328, -5.1241278648376465, -3.717719078063965, -2.3113107681274414, -0.9049015045166016, 0.5015068054199219, 1.907915472984314, 3.314324140548706, 4.720732688903809, 6.12714147567749, 7.533550262451172, 8.939958572387695, 10.346367835998535, 11.752776145935059, 13.159184455871582, 14.565593719482422, 15.972002029418945, 17.37841033935547, 18.784820556640625, 20.191226959228516, 21.597637176513672, 23.004045486450195, 24.41045379638672, 25.816862106323242, 27.223270416259766, 28.629680633544922, 30.036088943481445, 31.44249725341797, 32.848907470703125, 34.255313873291016, 35.66172409057617, 37.06813049316406, 38.47454071044922, 39.88094711303711, 41.287357330322266, 42.693763732910156, 44.10017395019531, 45.50658416748047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 14.0, 21.0, 41.0, 56.0, 100.0, 178.0, 321.0, 716.0, 1782.0, 6294.0, 55760.0, 4103617.0, 19271.0, 3727.0, 1254.0, 526.0, 265.0, 150.0, 72.0, 39.0, 28.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.14111328125, -14.6416015625, -14.14208984375, -13.642578125, -13.14306640625, -12.6435546875, -12.14404296875, -11.64453125, -11.14501953125, -10.6455078125, -10.14599609375, -9.646484375, -9.14697265625, -8.6474609375, -8.14794921875, -7.6484375, -7.14892578125, -6.6494140625, -6.14990234375, -5.650390625, -5.15087890625, -4.6513671875, -4.15185546875, -3.65234375, -3.15283203125, -2.6533203125, -2.15380859375, -1.654296875, -1.15478515625, -0.6552734375, -0.15576171875, 0.34375, 0.84326171875, 1.3427734375, 1.84228515625, 2.341796875, 2.84130859375, 3.3408203125, 3.84033203125, 4.33984375, 4.83935546875, 5.3388671875, 5.83837890625, 6.337890625, 6.83740234375, 7.3369140625, 7.83642578125, 8.3359375, 8.83544921875, 9.3349609375, 9.83447265625, 10.333984375, 10.83349609375, 11.3330078125, 11.83251953125, 12.33203125, 12.83154296875, 13.3310546875, 13.83056640625, 14.330078125, 14.82958984375, 15.3291015625, 15.82861328125, 16.328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 8.0, 21.0, 13.0, 26.0, 32.0, 42.0, 47.0, 53.0, 26.0, 46.0, 55.0, 64.0, 61.0, 51.0, 43.0, 50.0, 50.0, 44.0, 50.0, 29.0, 27.0, 26.0, 34.0, 15.0, 19.0, 11.0, 11.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.880859375, -1.82232666015625, -1.7637939453125, -1.70526123046875, -1.646728515625, -1.58819580078125, -1.5296630859375, -1.47113037109375, -1.41259765625, -1.35406494140625, -1.2955322265625, -1.23699951171875, -1.178466796875, -1.11993408203125, -1.0614013671875, -1.00286865234375, -0.9443359375, -0.88580322265625, -0.8272705078125, -0.76873779296875, -0.710205078125, -0.65167236328125, -0.5931396484375, -0.53460693359375, -0.47607421875, -0.41754150390625, -0.3590087890625, -0.30047607421875, -0.241943359375, -0.18341064453125, -0.1248779296875, -0.06634521484375, -0.0078125, 0.05072021484375, 0.1092529296875, 0.16778564453125, 0.226318359375, 0.28485107421875, 0.3433837890625, 0.40191650390625, 0.46044921875, 0.51898193359375, 0.5775146484375, 0.63604736328125, 0.694580078125, 0.75311279296875, 0.8116455078125, 0.87017822265625, 0.9287109375, 0.98724365234375, 1.0457763671875, 1.10430908203125, 1.162841796875, 1.22137451171875, 1.2799072265625, 1.33843994140625, 1.39697265625, 1.45550537109375, 1.5140380859375, 1.57257080078125, 1.631103515625, 1.68963623046875, 1.7481689453125, 1.80670166015625, 1.865234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 10.0, 20.0, 26.0, 26.0, 44.0, 59.0, 72.0, 103.0, 122.0, 183.0, 252.0, 371.0, 577.0, 1022.0, 1742.0, 3686.0, 8743.0, 27661.0, 260649.0, 3819073.0, 46848.0, 12580.0, 4768.0, 2200.0, 1217.0, 690.0, 429.0, 314.0, 218.0, 143.0, 106.0, 72.0, 55.0, 39.0, 37.0, 19.0, 24.0, 15.0, 11.0, 6.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.26171875, -6.04705810546875, -5.8323974609375, -5.61773681640625, -5.403076171875, -5.18841552734375, -4.9737548828125, -4.75909423828125, -4.54443359375, -4.32977294921875, -4.1151123046875, -3.90045166015625, -3.685791015625, -3.47113037109375, -3.2564697265625, -3.04180908203125, -2.8271484375, -2.61248779296875, -2.3978271484375, -2.18316650390625, -1.968505859375, -1.75384521484375, -1.5391845703125, -1.32452392578125, -1.10986328125, -0.89520263671875, -0.6805419921875, -0.46588134765625, -0.251220703125, -0.03656005859375, 0.1781005859375, 0.39276123046875, 0.607421875, 0.82208251953125, 1.0367431640625, 1.25140380859375, 1.466064453125, 1.68072509765625, 1.8953857421875, 2.11004638671875, 2.32470703125, 2.53936767578125, 2.7540283203125, 2.96868896484375, 3.183349609375, 3.39801025390625, 3.6126708984375, 3.82733154296875, 4.0419921875, 4.25665283203125, 4.4713134765625, 4.68597412109375, 4.900634765625, 5.11529541015625, 5.3299560546875, 5.54461669921875, 5.75927734375, 5.97393798828125, 6.1885986328125, 6.40325927734375, 6.617919921875, 6.83258056640625, 7.0472412109375, 7.26190185546875, 7.4765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 34.0, 99.0, 364.0, 3151.0, 173.0, 60.0, 32.0, 23.0, 10.0, 10.0, 10.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.248504638671875, -1.19232177734375, -1.136138916015625, -1.0799560546875, -1.023773193359375, -0.96759033203125, -0.911407470703125, -0.855224609375, -0.799041748046875, -0.74285888671875, -0.686676025390625, -0.6304931640625, -0.574310302734375, -0.51812744140625, -0.461944580078125, -0.40576171875, -0.349578857421875, -0.29339599609375, -0.237213134765625, -0.1810302734375, -0.124847412109375, -0.06866455078125, -0.012481689453125, 0.043701171875, 0.099884033203125, 0.15606689453125, 0.212249755859375, 0.2684326171875, 0.324615478515625, 0.38079833984375, 0.436981201171875, 0.4931640625, 0.549346923828125, 0.60552978515625, 0.661712646484375, 0.7178955078125, 0.774078369140625, 0.83026123046875, 0.886444091796875, 0.942626953125, 0.998809814453125, 1.05499267578125, 1.111175537109375, 1.1673583984375, 1.223541259765625, 1.27972412109375, 1.335906982421875, 1.39208984375, 1.448272705078125, 1.50445556640625, 1.560638427734375, 1.6168212890625, 1.673004150390625, 1.72918701171875, 1.785369873046875, 1.841552734375, 1.897735595703125, 1.95391845703125, 2.010101318359375, 2.0662841796875, 2.122467041015625, 2.17864990234375, 2.234832763671875, 2.291015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 24.0, 18.0, 35.0, 62.0, 88.0, 94.0, 125.0, 121.0, 112.0, 102.0, 67.0, 53.0, 23.0, 17.0, 15.0, 18.0, 10.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.574706077575684, -8.327876091003418, -8.081045150756836, -7.83421516418457, -7.587385177612305, -7.340554714202881, -7.093724250793457, -6.846894264221191, -6.600064277648926, -6.353233814239502, -6.106403827667236, -5.8595733642578125, -5.612743377685547, -5.365912914276123, -5.119082450866699, -4.872252464294434, -4.62542200088501, -4.378591537475586, -4.13176155090332, -3.8849310874938965, -3.638101100921631, -3.391270637512207, -3.1444404125213623, -2.8976101875305176, -2.650779962539673, -2.403949737548828, -2.1571195125579834, -1.9102891683578491, -1.6634589433670044, -1.4166287183761597, -1.1697983741760254, -0.9229681491851807, -0.6761379241943359, -0.4293076694011688, -0.1824774146080017, 0.06435286998748779, 0.3111830949783325, 0.5580133199691772, 0.8048436641693115, 1.0516738891601562, 1.298504114151001, 1.5453343391418457, 1.7921645641326904, 2.038994789123535, 2.285825252532959, 2.5326552391052246, 2.7794857025146484, 3.026315927505493, 3.273146152496338, 3.5199763774871826, 3.7668066024780273, 4.013637065887451, 4.260467052459717, 4.507297515869141, 4.754127502441406, 5.00095796585083, 5.247788429260254, 5.494618892669678, 5.741448879241943, 5.988279342651367, 6.235109329223633, 6.481939792633057, 6.7287702560424805, 6.975600242614746, 7.222430229187012]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 15.0, 15.0, 16.0, 24.0, 17.0, 27.0, 35.0, 35.0, 45.0, 28.0, 37.0, 49.0, 48.0, 42.0, 42.0, 41.0, 41.0, 46.0, 41.0, 38.0, 41.0, 21.0, 34.0, 39.0, 34.0, 25.0, 22.0, 17.0, 13.0, 6.0, 7.0, 12.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.112955093383789, -3.997013568878174, -3.8810720443725586, -3.7651305198669434, -3.6491892337799072, -3.533247709274292, -3.4173061847686768, -3.3013646602630615, -3.1854231357574463, -3.069481611251831, -2.953540086746216, -2.8375988006591797, -2.7216572761535645, -2.605715751647949, -2.489774227142334, -2.3738327026367188, -2.2578911781311035, -2.1419496536254883, -2.026008129119873, -1.9100667238235474, -1.7941251993179321, -1.6781837940216064, -1.5622422695159912, -1.446300745010376, -1.3303594589233398, -1.2144179344177246, -1.098476529121399, -0.9825350046157837, -0.8665934801101685, -0.750652015209198, -0.6347105503082275, -0.5187690258026123, -0.40282750129699707, -0.2868860065937042, -0.17094452679157257, -0.05500304698944092, 0.06093844771385193, 0.17687994241714478, 0.29282140731811523, 0.40876293182373047, 0.5247043967247009, 0.6406458616256714, 0.7565873861312866, 0.8725288510322571, 0.9884703159332275, 1.1044118404388428, 1.220353364944458, 1.3362948894500732, 1.452236294746399, 1.5681778192520142, 1.6841192245483398, 1.800060749053955, 1.9160022735595703, 2.0319437980651855, 2.147885322570801, 2.263826847076416, 2.379768133163452, 2.4957096576690674, 2.6116511821746826, 2.7275924682617188, 2.843533992767334, 2.959475517272949, 3.0754170417785645, 3.1913585662841797, 3.307300090789795]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 42.0, 74.0, 119.0, 202.0, 324.0, 641.0, 1262.0, 2333.0, 4979.0, 11450.0, 29618.0, 85347.0, 245795.0, 376364.0, 186541.0, 63356.0, 22754.0, 9091.0, 4023.0, 1928.0, 962.0, 540.0, 309.0, 157.0, 88.0, 61.0, 42.0, 19.0, 21.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.1640625, -4.03924560546875, -3.9144287109375, -3.78961181640625, -3.664794921875, -3.53997802734375, -3.4151611328125, -3.29034423828125, -3.16552734375, -3.04071044921875, -2.9158935546875, -2.79107666015625, -2.666259765625, -2.54144287109375, -2.4166259765625, -2.29180908203125, -2.1669921875, -2.04217529296875, -1.9173583984375, -1.79254150390625, -1.667724609375, -1.54290771484375, -1.4180908203125, -1.29327392578125, -1.16845703125, -1.04364013671875, -0.9188232421875, -0.79400634765625, -0.669189453125, -0.54437255859375, -0.4195556640625, -0.29473876953125, -0.169921875, -0.04510498046875, 0.0797119140625, 0.20452880859375, 0.329345703125, 0.45416259765625, 0.5789794921875, 0.70379638671875, 0.82861328125, 0.95343017578125, 1.0782470703125, 1.20306396484375, 1.327880859375, 1.45269775390625, 1.5775146484375, 1.70233154296875, 1.8271484375, 1.95196533203125, 2.0767822265625, 2.20159912109375, 2.326416015625, 2.45123291015625, 2.5760498046875, 2.70086669921875, 2.82568359375, 2.95050048828125, 3.0753173828125, 3.20013427734375, 3.324951171875, 3.44976806640625, 3.5745849609375, 3.69940185546875, 3.82421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 13.0, 15.0, 20.0, 21.0, 22.0, 33.0, 39.0, 30.0, 51.0, 45.0, 41.0, 51.0, 49.0, 59.0, 47.0, 66.0, 58.0, 48.0, 49.0, 36.0, 39.0, 25.0, 35.0, 24.0, 18.0, 16.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.7986907958984375, -1.737030029296875, -1.6753692626953125, -1.61370849609375, -1.5520477294921875, -1.490386962890625, -1.4287261962890625, -1.3670654296875, -1.3054046630859375, -1.243743896484375, -1.1820831298828125, -1.12042236328125, -1.0587615966796875, -0.997100830078125, -0.9354400634765625, -0.873779296875, -0.8121185302734375, -0.750457763671875, -0.6887969970703125, -0.62713623046875, -0.5654754638671875, -0.503814697265625, -0.4421539306640625, -0.3804931640625, -0.3188323974609375, -0.257171630859375, -0.1955108642578125, -0.13385009765625, -0.0721893310546875, -0.010528564453125, 0.0511322021484375, 0.11279296875, 0.1744537353515625, 0.236114501953125, 0.2977752685546875, 0.35943603515625, 0.4210968017578125, 0.482757568359375, 0.5444183349609375, 0.6060791015625, 0.6677398681640625, 0.729400634765625, 0.7910614013671875, 0.85272216796875, 0.9143829345703125, 0.976043701171875, 1.0377044677734375, 1.099365234375, 1.1610260009765625, 1.222686767578125, 1.2843475341796875, 1.34600830078125, 1.4076690673828125, 1.469329833984375, 1.5309906005859375, 1.5926513671875, 1.6543121337890625, 1.715972900390625, 1.7776336669921875, 1.83929443359375, 1.9009552001953125, 1.962615966796875, 2.0242767333984375, 2.0859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 10.0, 12.0, 15.0, 26.0, 25.0, 35.0, 53.0, 83.0, 125.0, 209.0, 316.0, 500.0, 923.0, 2045.0, 5785.0, 27246.0, 292348.0, 642134.0, 60904.0, 9901.0, 2939.0, 1311.0, 578.0, 392.0, 225.0, 122.0, 95.0, 45.0, 51.0, 25.0, 15.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.796875, -7.56884765625, -7.3408203125, -7.11279296875, -6.884765625, -6.65673828125, -6.4287109375, -6.20068359375, -5.97265625, -5.74462890625, -5.5166015625, -5.28857421875, -5.060546875, -4.83251953125, -4.6044921875, -4.37646484375, -4.1484375, -3.92041015625, -3.6923828125, -3.46435546875, -3.236328125, -3.00830078125, -2.7802734375, -2.55224609375, -2.32421875, -2.09619140625, -1.8681640625, -1.64013671875, -1.412109375, -1.18408203125, -0.9560546875, -0.72802734375, -0.5, -0.27197265625, -0.0439453125, 0.18408203125, 0.412109375, 0.64013671875, 0.8681640625, 1.09619140625, 1.32421875, 1.55224609375, 1.7802734375, 2.00830078125, 2.236328125, 2.46435546875, 2.6923828125, 2.92041015625, 3.1484375, 3.37646484375, 3.6044921875, 3.83251953125, 4.060546875, 4.28857421875, 4.5166015625, 4.74462890625, 4.97265625, 5.20068359375, 5.4287109375, 5.65673828125, 5.884765625, 6.11279296875, 6.3408203125, 6.56884765625, 6.796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 8.0, 14.0, 14.0, 12.0, 12.0, 12.0, 27.0, 22.0, 29.0, 25.0, 29.0, 39.0, 44.0, 46.0, 39.0, 47.0, 56.0, 42.0, 61.0, 51.0, 47.0, 40.0, 44.0, 44.0, 37.0, 34.0, 27.0, 17.0, 13.0, 17.0, 7.0, 12.0, 14.0, 1.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.28948974609375, -8.0399169921875, -7.79034423828125, -7.540771484375, -7.29119873046875, -7.0416259765625, -6.79205322265625, -6.54248046875, -6.29290771484375, -6.0433349609375, -5.79376220703125, -5.544189453125, -5.29461669921875, -5.0450439453125, -4.79547119140625, -4.5458984375, -4.29632568359375, -4.0467529296875, -3.79718017578125, -3.547607421875, -3.29803466796875, -3.0484619140625, -2.79888916015625, -2.54931640625, -2.29974365234375, -2.0501708984375, -1.80059814453125, -1.551025390625, -1.30145263671875, -1.0518798828125, -0.80230712890625, -0.552734375, -0.30316162109375, -0.0535888671875, 0.19598388671875, 0.445556640625, 0.69512939453125, 0.9447021484375, 1.19427490234375, 1.44384765625, 1.69342041015625, 1.9429931640625, 2.19256591796875, 2.442138671875, 2.69171142578125, 2.9412841796875, 3.19085693359375, 3.4404296875, 3.69000244140625, 3.9395751953125, 4.18914794921875, 4.438720703125, 4.68829345703125, 4.9378662109375, 5.18743896484375, 5.43701171875, 5.68658447265625, 5.9361572265625, 6.18572998046875, 6.435302734375, 6.68487548828125, 6.9344482421875, 7.18402099609375, 7.43359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 5.0, 14.0, 31.0, 27.0, 38.0, 61.0, 81.0, 157.0, 310.0, 660.0, 1674.0, 5768.0, 31078.0, 315974.0, 615924.0, 63387.0, 9187.0, 2300.0, 900.0, 426.0, 192.0, 106.0, 61.0, 53.0, 37.0, 23.0, 14.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.80078125, -3.67047119140625, -3.5401611328125, -3.40985107421875, -3.279541015625, -3.14923095703125, -3.0189208984375, -2.88861083984375, -2.75830078125, -2.62799072265625, -2.4976806640625, -2.36737060546875, -2.237060546875, -2.10675048828125, -1.9764404296875, -1.84613037109375, -1.7158203125, -1.58551025390625, -1.4552001953125, -1.32489013671875, -1.194580078125, -1.06427001953125, -0.9339599609375, -0.80364990234375, -0.67333984375, -0.54302978515625, -0.4127197265625, -0.28240966796875, -0.152099609375, -0.02178955078125, 0.1085205078125, 0.23883056640625, 0.369140625, 0.49945068359375, 0.6297607421875, 0.76007080078125, 0.890380859375, 1.02069091796875, 1.1510009765625, 1.28131103515625, 1.41162109375, 1.54193115234375, 1.6722412109375, 1.80255126953125, 1.932861328125, 2.06317138671875, 2.1934814453125, 2.32379150390625, 2.4541015625, 2.58441162109375, 2.7147216796875, 2.84503173828125, 2.975341796875, 3.10565185546875, 3.2359619140625, 3.36627197265625, 3.49658203125, 3.62689208984375, 3.7572021484375, 3.88751220703125, 4.017822265625, 4.14813232421875, 4.2784423828125, 4.40875244140625, 4.5390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 15.0, 18.0, 26.0, 17.0, 28.0, 27.0, 53.0, 51.0, 80.0, 75.0, 89.0, 85.0, 75.0, 63.0, 56.0, 44.0, 35.0, 14.0, 25.0, 15.0, 14.0, 10.0, 10.0, 15.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005002021789550781, -0.00048532336950302124, -0.00047044456005096436, -0.00045556575059890747, -0.0004406869411468506, -0.0004258081316947937, -0.0004109293222427368, -0.00039605051279067993, -0.00038117170333862305, -0.00036629289388656616, -0.0003514140844345093, -0.0003365352749824524, -0.0003216564655303955, -0.0003067776560783386, -0.00029189884662628174, -0.00027702003717422485, -0.00026214122772216797, -0.0002472624182701111, -0.0002323836088180542, -0.00021750479936599731, -0.00020262598991394043, -0.00018774718046188354, -0.00017286837100982666, -0.00015798956155776978, -0.0001431107521057129, -0.000128231942653656, -0.00011335313320159912, -9.847432374954224e-05, -8.359551429748535e-05, -6.871670484542847e-05, -5.383789539337158e-05, -3.89590859413147e-05, -2.4080276489257812e-05, -9.201467037200928e-06, 5.677342414855957e-06, 2.0556151866912842e-05, 3.5434961318969727e-05, 5.031377077102661e-05, 6.51925802230835e-05, 8.007138967514038e-05, 9.495019912719727e-05, 0.00010982900857925415, 0.00012470781803131104, 0.00013958662748336792, 0.0001544654369354248, 0.0001693442463874817, 0.00018422305583953857, 0.00019910186529159546, 0.00021398067474365234, 0.00022885948419570923, 0.0002437382936477661, 0.000258617103099823, 0.0002734959125518799, 0.00028837472200393677, 0.00030325353145599365, 0.00031813234090805054, 0.0003330111503601074, 0.0003478899598121643, 0.0003627687692642212, 0.0003776475787162781, 0.00039252638816833496, 0.00040740519762039185, 0.00042228400707244873, 0.0004371628165245056, 0.0004520416259765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 9.0, 9.0, 15.0, 20.0, 30.0, 56.0, 84.0, 174.0, 372.0, 1201.0, 5894.0, 111012.0, 883976.0, 40511.0, 3634.0, 881.0, 325.0, 152.0, 71.0, 50.0, 25.0, 16.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.9432373046875, -6.714599609375, -6.4859619140625, -6.25732421875, -6.0286865234375, -5.800048828125, -5.5714111328125, -5.3427734375, -5.1141357421875, -4.885498046875, -4.6568603515625, -4.42822265625, -4.1995849609375, -3.970947265625, -3.7423095703125, -3.513671875, -3.2850341796875, -3.056396484375, -2.8277587890625, -2.59912109375, -2.3704833984375, -2.141845703125, -1.9132080078125, -1.6845703125, -1.4559326171875, -1.227294921875, -0.9986572265625, -0.77001953125, -0.5413818359375, -0.312744140625, -0.0841064453125, 0.14453125, 0.3731689453125, 0.601806640625, 0.8304443359375, 1.05908203125, 1.2877197265625, 1.516357421875, 1.7449951171875, 1.9736328125, 2.2022705078125, 2.430908203125, 2.6595458984375, 2.88818359375, 3.1168212890625, 3.345458984375, 3.5740966796875, 3.802734375, 4.0313720703125, 4.260009765625, 4.4886474609375, 4.71728515625, 4.9459228515625, 5.174560546875, 5.4031982421875, 5.6318359375, 5.8604736328125, 6.089111328125, 6.3177490234375, 6.54638671875, 6.7750244140625, 7.003662109375, 7.2322998046875, 7.4609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 7.0, 20.0, 27.0, 25.0, 44.0, 49.0, 54.0, 57.0, 68.0, 71.0, 71.0, 62.0, 64.0, 62.0, 65.0, 44.0, 38.0, 32.0, 28.0, 16.0, 14.0, 15.0, 8.0, 6.0, 3.0, 8.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.10546875, -2.029296875, -1.953125, -1.876953125, -1.80078125, -1.724609375, -1.6484375, -1.572265625, -1.49609375, -1.419921875, -1.34375, -1.267578125, -1.19140625, -1.115234375, -1.0390625, -0.962890625, -0.88671875, -0.810546875, -0.734375, -0.658203125, -0.58203125, -0.505859375, -0.4296875, -0.353515625, -0.27734375, -0.201171875, -0.125, -0.048828125, 0.02734375, 0.103515625, 0.1796875, 0.255859375, 0.33203125, 0.408203125, 0.484375, 0.560546875, 0.63671875, 0.712890625, 0.7890625, 0.865234375, 0.94140625, 1.017578125, 1.09375, 1.169921875, 1.24609375, 1.322265625, 1.3984375, 1.474609375, 1.55078125, 1.626953125, 1.703125, 1.779296875, 1.85546875, 1.931640625, 2.0078125, 2.083984375, 2.16015625, 2.236328125, 2.3125, 2.388671875, 2.46484375, 2.541015625, 2.6171875, 2.693359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 9.0, 14.0, 22.0, 42.0, 78.0, 112.0, 167.0, 169.0, 161.0, 95.0, 62.0, 38.0, 19.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-80.1387710571289, -78.24723815917969, -76.35569763183594, -74.46415710449219, -72.57262420654297, -70.68109130859375, -68.78955078125, -66.89801025390625, -65.00647735595703, -63.11494064331055, -61.22340393066406, -59.33186721801758, -57.440330505371094, -55.54879379272461, -53.657257080078125, -51.76572036743164, -49.874183654785156, -47.98264694213867, -46.09111022949219, -44.1995735168457, -42.30803680419922, -40.416500091552734, -38.52496337890625, -36.633426666259766, -34.74188995361328, -32.8503532409668, -30.958816528320312, -29.067279815673828, -27.175743103027344, -25.28420639038086, -23.392669677734375, -21.50113296508789, -19.609596252441406, -17.718059539794922, -15.826522827148438, -13.934986114501953, -12.043449401855469, -10.151912689208984, -8.2603759765625, -6.368839263916016, -4.477302551269531, -2.585765838623047, -0.6942291259765625, 1.1973075866699219, 3.0888442993164062, 4.980381011962891, 6.871917724609375, 8.76345443725586, 10.654991149902344, 12.546527862548828, 14.438064575195312, 16.329601287841797, 18.22113800048828, 20.112674713134766, 22.00421142578125, 23.895748138427734, 25.78728485107422, 27.678821563720703, 29.570358276367188, 31.461894989013672, 33.353431701660156, 35.24496841430664, 37.136505126953125, 39.02804183959961, 40.919578552246094]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 13.0, 25.0, 23.0, 22.0, 28.0, 37.0, 32.0, 40.0, 44.0, 51.0, 56.0, 57.0, 50.0, 44.0, 55.0, 39.0, 40.0, 31.0, 38.0, 34.0, 31.0, 23.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.078405380249023, -30.00717544555664, -28.935945510864258, -27.864715576171875, -26.79348373413086, -25.72225570678711, -24.651023864746094, -23.57979393005371, -22.508563995361328, -21.437334060668945, -20.366104125976562, -19.29487419128418, -18.223644256591797, -17.15241241455078, -16.0811824798584, -15.009952545166016, -13.938722610473633, -12.86749267578125, -11.796262741088867, -10.725031852722168, -9.653801918029785, -8.582571983337402, -7.511341571807861, -6.44011116027832, -5.3688812255859375, -4.297651290893555, -3.2264208793640137, -2.1551907062530518, -1.0839605331420898, -0.012730598449707031, 1.058499813079834, 2.129730224609375, 3.2009620666503906, 4.272192001342773, 5.3434224128723145, 6.4146528244018555, 7.485882759094238, 8.557112693786621, 9.62834358215332, 10.699573516845703, 11.770803451538086, 12.842033386230469, 13.913263320922852, 14.98449420928955, 16.05572509765625, 17.126953125, 18.198184967041016, 19.2694149017334, 20.34064483642578, 21.411874771118164, 22.483104705810547, 23.55433464050293, 24.625564575195312, 25.696796417236328, 26.76802635192871, 27.839256286621094, 28.910486221313477, 29.98171615600586, 31.052946090698242, 32.124176025390625, 33.19540786743164, 34.26663589477539, 35.337867736816406, 36.409095764160156, 37.48032760620117]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 22.0, 38.0, 88.0, 170.0, 253.0, 439.0, 833.0, 1843.0, 5771.0, 57627.0, 4110120.0, 11767.0, 2859.0, 1120.0, 564.0, 309.0, 175.0, 116.0, 61.0, 43.0, 21.0, 13.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.46044921875, -12.9833984375, -12.50634765625, -12.029296875, -11.55224609375, -11.0751953125, -10.59814453125, -10.12109375, -9.64404296875, -9.1669921875, -8.68994140625, -8.212890625, -7.73583984375, -7.2587890625, -6.78173828125, -6.3046875, -5.82763671875, -5.3505859375, -4.87353515625, -4.396484375, -3.91943359375, -3.4423828125, -2.96533203125, -2.48828125, -2.01123046875, -1.5341796875, -1.05712890625, -0.580078125, -0.10302734375, 0.3740234375, 0.85107421875, 1.328125, 1.80517578125, 2.2822265625, 2.75927734375, 3.236328125, 3.71337890625, 4.1904296875, 4.66748046875, 5.14453125, 5.62158203125, 6.0986328125, 6.57568359375, 7.052734375, 7.52978515625, 8.0068359375, 8.48388671875, 8.9609375, 9.43798828125, 9.9150390625, 10.39208984375, 10.869140625, 11.34619140625, 11.8232421875, 12.30029296875, 12.77734375, 13.25439453125, 13.7314453125, 14.20849609375, 14.685546875, 15.16259765625, 15.6396484375, 16.11669921875, 16.59375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 8.0, 17.0, 15.0, 24.0, 35.0, 32.0, 46.0, 39.0, 50.0, 41.0, 56.0, 53.0, 60.0, 62.0, 63.0, 55.0, 52.0, 49.0, 46.0, 36.0, 32.0, 18.0, 20.0, 16.0, 14.0, 13.0, 7.0, 7.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1328125, -2.066497802734375, -2.00018310546875, -1.933868408203125, -1.8675537109375, -1.801239013671875, -1.73492431640625, -1.668609619140625, -1.602294921875, -1.535980224609375, -1.46966552734375, -1.403350830078125, -1.3370361328125, -1.270721435546875, -1.20440673828125, -1.138092041015625, -1.07177734375, -1.005462646484375, -0.93914794921875, -0.872833251953125, -0.8065185546875, -0.740203857421875, -0.67388916015625, -0.607574462890625, -0.541259765625, -0.474945068359375, -0.40863037109375, -0.342315673828125, -0.2760009765625, -0.209686279296875, -0.14337158203125, -0.077056884765625, -0.0107421875, 0.055572509765625, 0.12188720703125, 0.188201904296875, 0.2545166015625, 0.320831298828125, 0.38714599609375, 0.453460693359375, 0.519775390625, 0.586090087890625, 0.65240478515625, 0.718719482421875, 0.7850341796875, 0.851348876953125, 0.91766357421875, 0.983978271484375, 1.05029296875, 1.116607666015625, 1.18292236328125, 1.249237060546875, 1.3155517578125, 1.381866455078125, 1.44818115234375, 1.514495849609375, 1.580810546875, 1.647125244140625, 1.71343994140625, 1.779754638671875, 1.8460693359375, 1.912384033203125, 1.97869873046875, 2.045013427734375, 2.111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 9.0, 10.0, 16.0, 24.0, 29.0, 34.0, 46.0, 88.0, 122.0, 176.0, 329.0, 619.0, 1123.0, 2358.0, 6967.0, 42662.0, 4081714.0, 45675.0, 7246.0, 2409.0, 1134.0, 597.0, 338.0, 189.0, 104.0, 62.0, 57.0, 40.0, 24.0, 13.0, 11.0, 10.0, 8.0, 6.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.9375, -11.6353759765625, -11.333251953125, -11.0311279296875, -10.72900390625, -10.4268798828125, -10.124755859375, -9.8226318359375, -9.5205078125, -9.2183837890625, -8.916259765625, -8.6141357421875, -8.31201171875, -8.0098876953125, -7.707763671875, -7.4056396484375, -7.103515625, -6.8013916015625, -6.499267578125, -6.1971435546875, -5.89501953125, -5.5928955078125, -5.290771484375, -4.9886474609375, -4.6865234375, -4.3843994140625, -4.082275390625, -3.7801513671875, -3.47802734375, -3.1759033203125, -2.873779296875, -2.5716552734375, -2.26953125, -1.9674072265625, -1.665283203125, -1.3631591796875, -1.06103515625, -0.7589111328125, -0.456787109375, -0.1546630859375, 0.1474609375, 0.4495849609375, 0.751708984375, 1.0538330078125, 1.35595703125, 1.6580810546875, 1.960205078125, 2.2623291015625, 2.564453125, 2.8665771484375, 3.168701171875, 3.4708251953125, 3.77294921875, 4.0750732421875, 4.377197265625, 4.6793212890625, 4.9814453125, 5.2835693359375, 5.585693359375, 5.8878173828125, 6.18994140625, 6.4920654296875, 6.794189453125, 7.0963134765625, 7.3984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 11.0, 19.0, 46.0, 161.0, 3553.0, 158.0, 39.0, 24.0, 19.0, 14.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.784088134765625, -2.71856689453125, -2.653045654296875, -2.5875244140625, -2.522003173828125, -2.45648193359375, -2.390960693359375, -2.325439453125, -2.259918212890625, -2.19439697265625, -2.128875732421875, -2.0633544921875, -1.997833251953125, -1.93231201171875, -1.866790771484375, -1.80126953125, -1.735748291015625, -1.67022705078125, -1.604705810546875, -1.5391845703125, -1.473663330078125, -1.40814208984375, -1.342620849609375, -1.277099609375, -1.211578369140625, -1.14605712890625, -1.080535888671875, -1.0150146484375, -0.949493408203125, -0.88397216796875, -0.818450927734375, -0.7529296875, -0.687408447265625, -0.62188720703125, -0.556365966796875, -0.4908447265625, -0.425323486328125, -0.35980224609375, -0.294281005859375, -0.228759765625, -0.163238525390625, -0.09771728515625, -0.032196044921875, 0.0333251953125, 0.098846435546875, 0.16436767578125, 0.229888916015625, 0.29541015625, 0.360931396484375, 0.42645263671875, 0.491973876953125, 0.5574951171875, 0.623016357421875, 0.68853759765625, 0.754058837890625, 0.819580078125, 0.885101318359375, 0.95062255859375, 1.016143798828125, 1.0816650390625, 1.147186279296875, 1.21270751953125, 1.278228759765625, 1.34375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 13.0, 28.0, 35.0, 56.0, 119.0, 153.0, 204.0, 167.0, 108.0, 52.0, 29.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.651954650878906, -7.372481346130371, -7.093008518218994, -6.813535213470459, -6.534062385559082, -6.254589080810547, -5.975115776062012, -5.695642948150635, -5.416170120239258, -5.136696815490723, -4.857223987579346, -4.5777506828308105, -4.298277854919434, -4.018804550170898, -3.7393314838409424, -3.4598584175109863, -3.180385112762451, -2.900912046432495, -2.621438980102539, -2.341965675354004, -2.062492847442627, -1.7830196619033813, -1.5035464763641357, -1.2240734100341797, -0.9446003437042236, -0.6651272773742676, -0.38565415143966675, -0.10618102550506592, 0.17329204082489014, 0.4527651071548462, 0.7322382926940918, 1.0117113590240479, 1.291184425354004, 1.57065749168396, 1.850130558013916, 2.129603862762451, 2.409076690673828, 2.6885499954223633, 2.9680230617523193, 3.2474961280822754, 3.5269691944122314, 3.8064422607421875, 4.085915565490723, 4.3653883934021, 4.644861698150635, 4.924334526062012, 5.203807830810547, 5.483281135559082, 5.762753963470459, 6.042227268218994, 6.321700096130371, 6.601173400878906, 6.880646228790283, 7.160119533538818, 7.439592361450195, 7.7190656661987305, 7.998538970947266, 8.2780122756958, 8.557485580444336, 8.836957931518555, 9.11643123626709, 9.395904541015625, 9.67537784576416, 9.954851150512695, 10.234323501586914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 3.0, 10.0, 5.0, 11.0, 9.0, 9.0, 11.0, 18.0, 21.0, 22.0, 22.0, 32.0, 27.0, 34.0, 36.0, 40.0, 40.0, 49.0, 47.0, 57.0, 47.0, 43.0, 46.0, 37.0, 43.0, 39.0, 32.0, 32.0, 28.0, 21.0, 23.0, 22.0, 18.0, 14.0, 9.0, 12.0, 3.0, 3.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-3.4852757453918457, -3.389942169189453, -3.2946088314056396, -3.199275255203247, -3.1039419174194336, -3.008608341217041, -2.9132747650146484, -2.817941188812256, -2.7226078510284424, -2.62727427482605, -2.5319409370422363, -2.4366073608398438, -2.341273784637451, -2.2459404468536377, -2.150606870651245, -2.0552735328674316, -1.959939956665039, -1.864606499671936, -1.769273042678833, -1.6739394664764404, -1.5786060094833374, -1.4832725524902344, -1.3879389762878418, -1.2926055192947388, -1.1972720623016357, -1.1019386053085327, -1.0066051483154297, -0.9112715721130371, -0.8159381151199341, -0.720604658126831, -0.6252711415290833, -0.5299376249313354, -0.4346041679382324, -0.339270681142807, -0.2439371943473816, -0.14860370755195618, -0.05327022075653076, 0.04206326603889465, 0.13739675283432007, 0.23273026943206787, 0.3280637264251709, 0.4233972132205963, 0.5187307000160217, 0.6140642166137695, 0.7093976736068726, 0.8047311305999756, 0.9000646471977234, 0.9953981637954712, 1.0907316207885742, 1.1860650777816772, 1.2813985347747803, 1.3767321109771729, 1.4720655679702759, 1.567399024963379, 1.6627326011657715, 1.7580660581588745, 1.8533995151519775, 1.9487329721450806, 2.0440664291381836, 2.139400005340576, 2.2347335815429688, 2.3300669193267822, 2.425400495529175, 2.5207338333129883, 2.616067409515381]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 7.0, 11.0, 19.0, 15.0, 26.0, 52.0, 64.0, 109.0, 160.0, 277.0, 437.0, 698.0, 1157.0, 2162.0, 3993.0, 7905.0, 17595.0, 41488.0, 104303.0, 262260.0, 338252.0, 157974.0, 61327.0, 24994.0, 11167.0, 5503.0, 2796.0, 1498.0, 848.0, 537.0, 313.0, 200.0, 138.0, 74.0, 59.0, 37.0, 28.0, 21.0, 17.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.533203125, -3.438262939453125, -3.34332275390625, -3.248382568359375, -3.1534423828125, -3.058502197265625, -2.96356201171875, -2.868621826171875, -2.773681640625, -2.678741455078125, -2.58380126953125, -2.488861083984375, -2.3939208984375, -2.298980712890625, -2.20404052734375, -2.109100341796875, -2.01416015625, -1.919219970703125, -1.82427978515625, -1.729339599609375, -1.6343994140625, -1.539459228515625, -1.44451904296875, -1.349578857421875, -1.254638671875, -1.159698486328125, -1.06475830078125, -0.969818115234375, -0.8748779296875, -0.779937744140625, -0.68499755859375, -0.590057373046875, -0.4951171875, -0.400177001953125, -0.30523681640625, -0.210296630859375, -0.1153564453125, -0.020416259765625, 0.07452392578125, 0.169464111328125, 0.264404296875, 0.359344482421875, 0.45428466796875, 0.549224853515625, 0.6441650390625, 0.739105224609375, 0.83404541015625, 0.928985595703125, 1.02392578125, 1.118865966796875, 1.21380615234375, 1.308746337890625, 1.4036865234375, 1.498626708984375, 1.59356689453125, 1.688507080078125, 1.783447265625, 1.878387451171875, 1.97332763671875, 2.068267822265625, 2.1632080078125, 2.258148193359375, 2.35308837890625, 2.448028564453125, 2.54296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 14.0, 30.0, 31.0, 22.0, 40.0, 41.0, 46.0, 46.0, 36.0, 53.0, 58.0, 55.0, 50.0, 60.0, 47.0, 51.0, 61.0, 43.0, 37.0, 27.0, 26.0, 23.0, 15.0, 12.0, 8.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.995513916015625, -1.93048095703125, -1.865447998046875, -1.8004150390625, -1.735382080078125, -1.67034912109375, -1.605316162109375, -1.540283203125, -1.475250244140625, -1.41021728515625, -1.345184326171875, -1.2801513671875, -1.215118408203125, -1.15008544921875, -1.085052490234375, -1.02001953125, -0.954986572265625, -0.88995361328125, -0.824920654296875, -0.7598876953125, -0.694854736328125, -0.62982177734375, -0.564788818359375, -0.499755859375, -0.434722900390625, -0.36968994140625, -0.304656982421875, -0.2396240234375, -0.174591064453125, -0.10955810546875, -0.044525146484375, 0.0205078125, 0.085540771484375, 0.15057373046875, 0.215606689453125, 0.2806396484375, 0.345672607421875, 0.41070556640625, 0.475738525390625, 0.540771484375, 0.605804443359375, 0.67083740234375, 0.735870361328125, 0.8009033203125, 0.865936279296875, 0.93096923828125, 0.996002197265625, 1.06103515625, 1.126068115234375, 1.19110107421875, 1.256134033203125, 1.3211669921875, 1.386199951171875, 1.45123291015625, 1.516265869140625, 1.581298828125, 1.646331787109375, 1.71136474609375, 1.776397705078125, 1.8414306640625, 1.906463623046875, 1.97149658203125, 2.036529541015625, 2.1015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 6.0, 9.0, 7.0, 13.0, 17.0, 21.0, 45.0, 49.0, 80.0, 109.0, 154.0, 248.0, 366.0, 618.0, 1088.0, 2496.0, 7560.0, 43327.0, 607667.0, 346510.0, 27804.0, 5755.0, 2106.0, 944.0, 537.0, 326.0, 214.0, 146.0, 100.0, 61.0, 49.0, 31.0, 29.0, 22.0, 18.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.46484375, -6.26214599609375, -6.0594482421875, -5.85675048828125, -5.654052734375, -5.45135498046875, -5.2486572265625, -5.04595947265625, -4.84326171875, -4.64056396484375, -4.4378662109375, -4.23516845703125, -4.032470703125, -3.82977294921875, -3.6270751953125, -3.42437744140625, -3.2216796875, -3.01898193359375, -2.8162841796875, -2.61358642578125, -2.410888671875, -2.20819091796875, -2.0054931640625, -1.80279541015625, -1.60009765625, -1.39739990234375, -1.1947021484375, -0.99200439453125, -0.789306640625, -0.58660888671875, -0.3839111328125, -0.18121337890625, 0.021484375, 0.22418212890625, 0.4268798828125, 0.62957763671875, 0.832275390625, 1.03497314453125, 1.2376708984375, 1.44036865234375, 1.64306640625, 1.84576416015625, 2.0484619140625, 2.25115966796875, 2.453857421875, 2.65655517578125, 2.8592529296875, 3.06195068359375, 3.2646484375, 3.46734619140625, 3.6700439453125, 3.87274169921875, 4.075439453125, 4.27813720703125, 4.4808349609375, 4.68353271484375, 4.88623046875, 5.08892822265625, 5.2916259765625, 5.49432373046875, 5.697021484375, 5.89971923828125, 6.1024169921875, 6.30511474609375, 6.5078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 15.0, 7.0, 5.0, 13.0, 23.0, 21.0, 13.0, 24.0, 29.0, 26.0, 24.0, 44.0, 50.0, 26.0, 43.0, 37.0, 35.0, 49.0, 47.0, 43.0, 37.0, 43.0, 38.0, 40.0, 28.0, 29.0, 20.0, 21.0, 24.0, 21.0, 17.0, 18.0, 16.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.8125, -6.61279296875, -6.4130859375, -6.21337890625, -6.013671875, -5.81396484375, -5.6142578125, -5.41455078125, -5.21484375, -5.01513671875, -4.8154296875, -4.61572265625, -4.416015625, -4.21630859375, -4.0166015625, -3.81689453125, -3.6171875, -3.41748046875, -3.2177734375, -3.01806640625, -2.818359375, -2.61865234375, -2.4189453125, -2.21923828125, -2.01953125, -1.81982421875, -1.6201171875, -1.42041015625, -1.220703125, -1.02099609375, -0.8212890625, -0.62158203125, -0.421875, -0.22216796875, -0.0224609375, 0.17724609375, 0.376953125, 0.57666015625, 0.7763671875, 0.97607421875, 1.17578125, 1.37548828125, 1.5751953125, 1.77490234375, 1.974609375, 2.17431640625, 2.3740234375, 2.57373046875, 2.7734375, 2.97314453125, 3.1728515625, 3.37255859375, 3.572265625, 3.77197265625, 3.9716796875, 4.17138671875, 4.37109375, 4.57080078125, 4.7705078125, 4.97021484375, 5.169921875, 5.36962890625, 5.5693359375, 5.76904296875, 5.96875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 10.0, 19.0, 18.0, 32.0, 45.0, 85.0, 180.0, 366.0, 1073.0, 4428.0, 42956.0, 855178.0, 133012.0, 8510.0, 1662.0, 501.0, 224.0, 94.0, 57.0, 33.0, 16.0, 18.0, 12.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640625, -4.478759765625, -4.31689453125, -4.155029296875, -3.9931640625, -3.831298828125, -3.66943359375, -3.507568359375, -3.345703125, -3.183837890625, -3.02197265625, -2.860107421875, -2.6982421875, -2.536376953125, -2.37451171875, -2.212646484375, -2.05078125, -1.888916015625, -1.72705078125, -1.565185546875, -1.4033203125, -1.241455078125, -1.07958984375, -0.917724609375, -0.755859375, -0.593994140625, -0.43212890625, -0.270263671875, -0.1083984375, 0.053466796875, 0.21533203125, 0.377197265625, 0.5390625, 0.700927734375, 0.86279296875, 1.024658203125, 1.1865234375, 1.348388671875, 1.51025390625, 1.672119140625, 1.833984375, 1.995849609375, 2.15771484375, 2.319580078125, 2.4814453125, 2.643310546875, 2.80517578125, 2.967041015625, 3.12890625, 3.290771484375, 3.45263671875, 3.614501953125, 3.7763671875, 3.938232421875, 4.10009765625, 4.261962890625, 4.423828125, 4.585693359375, 4.74755859375, 4.909423828125, 5.0712890625, 5.233154296875, 5.39501953125, 5.556884765625, 5.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 14.0, 18.0, 18.0, 31.0, 63.0, 90.0, 189.0, 185.0, 134.0, 70.0, 47.0, 36.0, 21.0, 7.0, 14.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007348060607910156, -0.0007087960839271545, -0.0006827861070632935, -0.0006567761301994324, -0.0006307661533355713, -0.0006047561764717102, -0.0005787461996078491, -0.000552736222743988, -0.000526726245880127, -0.0005007162690162659, -0.0004747062921524048, -0.0004486963152885437, -0.0004226863384246826, -0.00039667636156082153, -0.00037066638469696045, -0.00034465640783309937, -0.0003186464309692383, -0.0002926364541053772, -0.0002666264772415161, -0.00024061650037765503, -0.00021460652351379395, -0.00018859654664993286, -0.00016258656978607178, -0.0001365765929222107, -0.00011056661605834961, -8.455663919448853e-05, -5.854666233062744e-05, -3.253668546676636e-05, -6.5267086029052734e-06, 1.948326826095581e-05, 4.5493245124816895e-05, 7.150322198867798e-05, 9.751319885253906e-05, 0.00012352317571640015, 0.00014953315258026123, 0.00017554312944412231, 0.0002015531063079834, 0.00022756308317184448, 0.00025357306003570557, 0.00027958303689956665, 0.00030559301376342773, 0.0003316029906272888, 0.0003576129674911499, 0.000383622944355011, 0.00040963292121887207, 0.00043564289808273315, 0.00046165287494659424, 0.0004876628518104553, 0.0005136728286743164, 0.0005396828055381775, 0.0005656927824020386, 0.0005917027592658997, 0.0006177127361297607, 0.0006437227129936218, 0.0006697326898574829, 0.000695742666721344, 0.0007217526435852051, 0.0007477626204490662, 0.0007737725973129272, 0.0007997825741767883, 0.0008257925510406494, 0.0008518025279045105, 0.0008778125047683716, 0.0009038224816322327, 0.0009298324584960938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 20.0, 17.0, 28.0, 46.0, 79.0, 132.0, 212.0, 422.0, 840.0, 1859.0, 5178.0, 22440.0, 185323.0, 705192.0, 104737.0, 14912.0, 3952.0, 1508.0, 707.0, 386.0, 204.0, 126.0, 69.0, 37.0, 37.0, 20.0, 11.0, 12.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.842559814453125, -3.73394775390625, -3.625335693359375, -3.5167236328125, -3.408111572265625, -3.29949951171875, -3.190887451171875, -3.082275390625, -2.973663330078125, -2.86505126953125, -2.756439208984375, -2.6478271484375, -2.539215087890625, -2.43060302734375, -2.321990966796875, -2.21337890625, -2.104766845703125, -1.99615478515625, -1.887542724609375, -1.7789306640625, -1.670318603515625, -1.56170654296875, -1.453094482421875, -1.344482421875, -1.235870361328125, -1.12725830078125, -1.018646240234375, -0.9100341796875, -0.801422119140625, -0.69281005859375, -0.584197998046875, -0.4755859375, -0.366973876953125, -0.25836181640625, -0.149749755859375, -0.0411376953125, 0.067474365234375, 0.17608642578125, 0.284698486328125, 0.393310546875, 0.501922607421875, 0.61053466796875, 0.719146728515625, 0.8277587890625, 0.936370849609375, 1.04498291015625, 1.153594970703125, 1.26220703125, 1.370819091796875, 1.47943115234375, 1.588043212890625, 1.6966552734375, 1.805267333984375, 1.91387939453125, 2.022491455078125, 2.131103515625, 2.239715576171875, 2.34832763671875, 2.456939697265625, 2.5655517578125, 2.674163818359375, 2.78277587890625, 2.891387939453125, 3.0]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 24.0, 34.0, 30.0, 42.0, 44.0, 71.0, 64.0, 69.0, 96.0, 97.0, 77.0, 83.0, 59.0, 52.0, 32.0, 26.0, 17.0, 16.0, 10.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.011810302734375, -2.92987060546875, -2.847930908203125, -2.7659912109375, -2.684051513671875, -2.60211181640625, -2.520172119140625, -2.438232421875, -2.356292724609375, -2.27435302734375, -2.192413330078125, -2.1104736328125, -2.028533935546875, -1.94659423828125, -1.864654541015625, -1.78271484375, -1.700775146484375, -1.61883544921875, -1.536895751953125, -1.4549560546875, -1.373016357421875, -1.29107666015625, -1.209136962890625, -1.127197265625, -1.045257568359375, -0.96331787109375, -0.881378173828125, -0.7994384765625, -0.717498779296875, -0.63555908203125, -0.553619384765625, -0.4716796875, -0.389739990234375, -0.30780029296875, -0.225860595703125, -0.1439208984375, -0.061981201171875, 0.01995849609375, 0.101898193359375, 0.183837890625, 0.265777587890625, 0.34771728515625, 0.429656982421875, 0.5115966796875, 0.593536376953125, 0.67547607421875, 0.757415771484375, 0.83935546875, 0.921295166015625, 1.00323486328125, 1.085174560546875, 1.1671142578125, 1.249053955078125, 1.33099365234375, 1.412933349609375, 1.494873046875, 1.576812744140625, 1.65875244140625, 1.740692138671875, 1.8226318359375, 1.904571533203125, 1.98651123046875, 2.068450927734375, 2.150390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 30.0, 89.0, 178.0, 288.0, 245.0, 89.0, 39.0, 18.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.6630630493164, -92.97833251953125, -90.29359436035156, -87.6088638305664, -84.92412567138672, -82.23939514160156, -79.55465698242188, -76.86992645263672, -74.18519592285156, -71.5004653930664, -68.81572723388672, -66.13099670410156, -63.446258544921875, -60.76152801513672, -58.0767936706543, -55.392059326171875, -52.70732116699219, -50.022586822509766, -47.337852478027344, -44.65312194824219, -41.9683837890625, -39.283653259277344, -36.59891891479492, -33.9141845703125, -31.229450225830078, -28.544715881347656, -25.859981536865234, -23.175249099731445, -20.490514755249023, -17.8057804107666, -15.121047973632812, -12.43631362915039, -9.7515869140625, -7.066853046417236, -4.382119178771973, -1.6973857879638672, 0.9873485565185547, 3.6720829010009766, 6.356815338134766, 9.041549682617188, 11.72628402709961, 14.411018371582031, 17.095752716064453, 19.780485153198242, 22.465219497680664, 25.149953842163086, 27.834686279296875, 30.519420623779297, 33.20415496826172, 35.88888931274414, 38.57362365722656, 41.25835418701172, 43.943092346191406, 46.62782287597656, 49.312557220458984, 51.997291564941406, 54.68202590942383, 57.36676025390625, 60.05149459838867, 62.736228942871094, 65.42095947265625, 68.10569763183594, 70.7904281616211, 73.47515869140625, 76.15989685058594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 5.0, 11.0, 11.0, 12.0, 20.0, 29.0, 23.0, 28.0, 43.0, 47.0, 48.0, 52.0, 78.0, 75.0, 70.0, 66.0, 55.0, 51.0, 34.0, 46.0, 33.0, 37.0, 22.0, 20.0, 12.0, 18.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.164466857910156, -51.79619216918945, -50.427913665771484, -49.05963897705078, -47.69136428833008, -46.323089599609375, -44.954811096191406, -43.5865364074707, -42.21826171875, -40.8499870300293, -39.48170852661133, -38.113433837890625, -36.74515914916992, -35.37688446044922, -34.00860595703125, -32.64033126831055, -31.27205467224121, -29.903778076171875, -28.535503387451172, -27.167226791381836, -25.798952102661133, -24.430675506591797, -23.062400817871094, -21.694124221801758, -20.325847625732422, -18.957571029663086, -17.589296340942383, -16.221019744873047, -14.852745056152344, -13.484468460083008, -12.116192817687988, -10.747917175292969, -9.379642486572266, -8.011366844177246, -6.643091201782227, -5.274815082550049, -3.9065394401550293, -2.5382637977600098, -1.169987678527832, 0.1982879638671875, 1.566563606262207, 2.9348392486572266, 4.303114891052246, 5.671391010284424, 7.039666652679443, 8.407941818237305, 9.77621841430664, 11.14449405670166, 12.51276969909668, 13.8810453414917, 15.249320983886719, 16.617597579956055, 17.985872268676758, 19.354148864746094, 20.722423553466797, 22.090700149536133, 23.45897674560547, 24.827253341674805, 26.195528030395508, 27.563804626464844, 28.932079315185547, 30.300355911254883, 31.66863250732422, 33.03690719604492, 34.405181884765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 9.0, 20.0, 17.0, 29.0, 57.0, 100.0, 191.0, 347.0, 716.0, 1525.0, 3426.0, 9330.0, 38199.0, 3975536.0, 138118.0, 16995.0, 5215.0, 2245.0, 1046.0, 492.0, 300.0, 164.0, 75.0, 34.0, 34.0, 21.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.0087890625, -5.775390625, -5.5419921875, -5.30859375, -5.0751953125, -4.841796875, -4.6083984375, -4.375, -4.1416015625, -3.908203125, -3.6748046875, -3.44140625, -3.2080078125, -2.974609375, -2.7412109375, -2.5078125, -2.2744140625, -2.041015625, -1.8076171875, -1.57421875, -1.3408203125, -1.107421875, -0.8740234375, -0.640625, -0.4072265625, -0.173828125, 0.0595703125, 0.29296875, 0.5263671875, 0.759765625, 0.9931640625, 1.2265625, 1.4599609375, 1.693359375, 1.9267578125, 2.16015625, 2.3935546875, 2.626953125, 2.8603515625, 3.09375, 3.3271484375, 3.560546875, 3.7939453125, 4.02734375, 4.2607421875, 4.494140625, 4.7275390625, 4.9609375, 5.1943359375, 5.427734375, 5.6611328125, 5.89453125, 6.1279296875, 6.361328125, 6.5947265625, 6.828125, 7.0615234375, 7.294921875, 7.5283203125, 7.76171875, 7.9951171875, 8.228515625, 8.4619140625, 8.6953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 7.0, 14.0, 21.0, 18.0, 21.0, 33.0, 28.0, 40.0, 50.0, 57.0, 53.0, 67.0, 69.0, 59.0, 57.0, 64.0, 57.0, 54.0, 43.0, 32.0, 29.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.556640625, -2.487640380859375, -2.41864013671875, -2.349639892578125, -2.2806396484375, -2.211639404296875, -2.14263916015625, -2.073638916015625, -2.004638671875, -1.935638427734375, -1.86663818359375, -1.797637939453125, -1.7286376953125, -1.659637451171875, -1.59063720703125, -1.521636962890625, -1.45263671875, -1.383636474609375, -1.31463623046875, -1.245635986328125, -1.1766357421875, -1.107635498046875, -1.03863525390625, -0.969635009765625, -0.900634765625, -0.831634521484375, -0.76263427734375, -0.693634033203125, -0.6246337890625, -0.555633544921875, -0.48663330078125, -0.417633056640625, -0.3486328125, -0.279632568359375, -0.21063232421875, -0.141632080078125, -0.0726318359375, -0.003631591796875, 0.06536865234375, 0.134368896484375, 0.203369140625, 0.272369384765625, 0.34136962890625, 0.410369873046875, 0.4793701171875, 0.548370361328125, 0.61737060546875, 0.686370849609375, 0.75537109375, 0.824371337890625, 0.89337158203125, 0.962371826171875, 1.0313720703125, 1.100372314453125, 1.16937255859375, 1.238372802734375, 1.307373046875, 1.376373291015625, 1.44537353515625, 1.514373779296875, 1.5833740234375, 1.652374267578125, 1.72137451171875, 1.790374755859375, 1.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 16.0, 16.0, 34.0, 35.0, 51.0, 78.0, 115.0, 179.0, 268.0, 421.0, 707.0, 1152.0, 1934.0, 3424.0, 7092.0, 18143.0, 77336.0, 3801452.0, 230352.0, 30511.0, 10381.0, 4413.0, 2483.0, 1351.0, 896.0, 482.0, 299.0, 214.0, 137.0, 84.0, 67.0, 42.0, 19.0, 21.0, 18.0, 9.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.33837890625, -4.1923828125, -4.04638671875, -3.900390625, -3.75439453125, -3.6083984375, -3.46240234375, -3.31640625, -3.17041015625, -3.0244140625, -2.87841796875, -2.732421875, -2.58642578125, -2.4404296875, -2.29443359375, -2.1484375, -2.00244140625, -1.8564453125, -1.71044921875, -1.564453125, -1.41845703125, -1.2724609375, -1.12646484375, -0.98046875, -0.83447265625, -0.6884765625, -0.54248046875, -0.396484375, -0.25048828125, -0.1044921875, 0.04150390625, 0.1875, 0.33349609375, 0.4794921875, 0.62548828125, 0.771484375, 0.91748046875, 1.0634765625, 1.20947265625, 1.35546875, 1.50146484375, 1.6474609375, 1.79345703125, 1.939453125, 2.08544921875, 2.2314453125, 2.37744140625, 2.5234375, 2.66943359375, 2.8154296875, 2.96142578125, 3.107421875, 3.25341796875, 3.3994140625, 3.54541015625, 3.69140625, 3.83740234375, 3.9833984375, 4.12939453125, 4.275390625, 4.42138671875, 4.5673828125, 4.71337890625, 4.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 9.0, 12.0, 11.0, 20.0, 54.0, 90.0, 245.0, 2856.0, 469.0, 126.0, 57.0, 33.0, 21.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.94854736328125, -1.8756103515625, -1.80267333984375, -1.729736328125, -1.65679931640625, -1.5838623046875, -1.51092529296875, -1.43798828125, -1.36505126953125, -1.2921142578125, -1.21917724609375, -1.146240234375, -1.07330322265625, -1.0003662109375, -0.92742919921875, -0.8544921875, -0.78155517578125, -0.7086181640625, -0.63568115234375, -0.562744140625, -0.48980712890625, -0.4168701171875, -0.34393310546875, -0.27099609375, -0.19805908203125, -0.1251220703125, -0.05218505859375, 0.020751953125, 0.09368896484375, 0.1666259765625, 0.23956298828125, 0.3125, 0.38543701171875, 0.4583740234375, 0.53131103515625, 0.604248046875, 0.67718505859375, 0.7501220703125, 0.82305908203125, 0.89599609375, 0.96893310546875, 1.0418701171875, 1.11480712890625, 1.187744140625, 1.26068115234375, 1.3336181640625, 1.40655517578125, 1.4794921875, 1.55242919921875, 1.6253662109375, 1.69830322265625, 1.771240234375, 1.84417724609375, 1.9171142578125, 1.99005126953125, 2.06298828125, 2.13592529296875, 2.2088623046875, 2.28179931640625, 2.354736328125, 2.42767333984375, 2.5006103515625, 2.57354736328125, 2.646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 7.0, 6.0, 19.0, 27.0, 37.0, 58.0, 99.0, 133.0, 145.0, 161.0, 118.0, 74.0, 47.0, 23.0, 22.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.110759735107422, -9.742130279541016, -9.37350082397461, -9.004871368408203, -8.636241912841797, -8.26761245727539, -7.898983478546143, -7.530354022979736, -7.16172456741333, -6.793095111846924, -6.424465656280518, -6.0558366775512695, -5.687207221984863, -5.318577766418457, -4.949948310852051, -4.5813188552856445, -4.212689399719238, -3.844059944152832, -3.475430488586426, -3.1068012714385986, -2.7381718158721924, -2.369542360305786, -2.000913143157959, -1.6322836875915527, -1.2636542320251465, -0.895024836063385, -0.5263954401016235, -0.15776610374450684, 0.21086335182189941, 0.5794928073883057, 0.9481220245361328, 1.316751480102539, 1.685379981994629, 2.054009437561035, 2.4226388931274414, 2.7912681102752686, 3.159897565841675, 3.528527021408081, 3.897156238555908, 4.2657856941223145, 4.634415149688721, 5.003044605255127, 5.371674060821533, 5.740303039550781, 6.1089324951171875, 6.477561950683594, 6.84619140625, 7.214820861816406, 7.5834503173828125, 7.952079772949219, 8.320709228515625, 8.689338684082031, 9.057968139648438, 9.426597595214844, 9.79522705078125, 10.163856506347656, 10.532485961914062, 10.901115417480469, 11.269744873046875, 11.638374328613281, 12.007003784179688, 12.375633239746094, 12.7442626953125, 13.112892150878906, 13.481520652770996]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 5.0, 17.0, 16.0, 13.0, 22.0, 26.0, 22.0, 40.0, 23.0, 37.0, 43.0, 38.0, 47.0, 45.0, 44.0, 59.0, 50.0, 36.0, 38.0, 41.0, 29.0, 44.0, 36.0, 31.0, 30.0, 31.0, 26.0, 17.0, 15.0, 12.0, 20.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.804723262786865, -4.625757217407227, -4.44679069519043, -4.267824649810791, -4.088858604431152, -3.9098923206329346, -3.730926036834717, -3.551959991455078, -3.3729937076568604, -3.1940274238586426, -3.015061378479004, -2.836095094680786, -2.6571288108825684, -2.4781627655029297, -2.299196481704712, -2.120230197906494, -1.9412641525268555, -1.7622979879379272, -1.583331823348999, -1.4043655395507812, -1.225399374961853, -1.0464332103729248, -0.867466926574707, -0.6885007619857788, -0.5095345973968506, -0.3305684030056, -0.15160220861434937, 0.027364015579223633, 0.20633018016815186, 0.3852963447570801, 0.5642626285552979, 0.7432287931442261, 0.9221954345703125, 1.1011615991592407, 1.280127763748169, 1.4590940475463867, 1.638060212135315, 1.8170263767242432, 1.995992660522461, 2.1749587059020996, 2.3539249897003174, 2.532891273498535, 2.711857318878174, 2.8908236026763916, 3.0697898864746094, 3.248755931854248, 3.427722215652466, 3.6066884994506836, 3.7856545448303223, 3.96462082862854, 4.143587112426758, 4.3225531578063965, 4.501519203186035, 4.680485725402832, 4.859451770782471, 5.038417816162109, 5.217384338378906, 5.396350383758545, 5.575316905975342, 5.7542829513549805, 5.933248996734619, 6.112215042114258, 6.291181564331055, 6.470147609710693, 6.649113655090332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 3.0, 11.0, 17.0, 16.0, 43.0, 69.0, 120.0, 233.0, 472.0, 1169.0, 2903.0, 8065.0, 27037.0, 105325.0, 464332.0, 334662.0, 73743.0, 20001.0, 6296.0, 2265.0, 924.0, 408.0, 201.0, 89.0, 57.0, 32.0, 23.0, 10.0, 12.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.49493408203125, -4.2984619140625, -4.10198974609375, -3.905517578125, -3.70904541015625, -3.5125732421875, -3.31610107421875, -3.11962890625, -2.92315673828125, -2.7266845703125, -2.53021240234375, -2.333740234375, -2.13726806640625, -1.9407958984375, -1.74432373046875, -1.5478515625, -1.35137939453125, -1.1549072265625, -0.95843505859375, -0.761962890625, -0.56549072265625, -0.3690185546875, -0.17254638671875, 0.02392578125, 0.22039794921875, 0.4168701171875, 0.61334228515625, 0.809814453125, 1.00628662109375, 1.2027587890625, 1.39923095703125, 1.595703125, 1.79217529296875, 1.9886474609375, 2.18511962890625, 2.381591796875, 2.57806396484375, 2.7745361328125, 2.97100830078125, 3.16748046875, 3.36395263671875, 3.5604248046875, 3.75689697265625, 3.953369140625, 4.14984130859375, 4.3463134765625, 4.54278564453125, 4.7392578125, 4.93572998046875, 5.1322021484375, 5.32867431640625, 5.525146484375, 5.72161865234375, 5.9180908203125, 6.11456298828125, 6.31103515625, 6.50750732421875, 6.7039794921875, 6.90045166015625, 7.096923828125, 7.29339599609375, 7.4898681640625, 7.68634033203125, 7.8828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 14.0, 20.0, 20.0, 27.0, 21.0, 30.0, 36.0, 33.0, 49.0, 53.0, 54.0, 57.0, 55.0, 54.0, 48.0, 52.0, 54.0, 44.0, 51.0, 34.0, 43.0, 21.0, 20.0, 20.0, 16.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.15625, -2.0941314697265625, -2.032012939453125, -1.9698944091796875, -1.90777587890625, -1.8456573486328125, -1.783538818359375, -1.7214202880859375, -1.6593017578125, -1.5971832275390625, -1.535064697265625, -1.4729461669921875, -1.41082763671875, -1.3487091064453125, -1.286590576171875, -1.2244720458984375, -1.162353515625, -1.1002349853515625, -1.038116455078125, -0.9759979248046875, -0.91387939453125, -0.8517608642578125, -0.789642333984375, -0.7275238037109375, -0.6654052734375, -0.6032867431640625, -0.541168212890625, -0.4790496826171875, -0.41693115234375, -0.3548126220703125, -0.292694091796875, -0.2305755615234375, -0.16845703125, -0.1063385009765625, -0.044219970703125, 0.0178985595703125, 0.08001708984375, 0.1421356201171875, 0.204254150390625, 0.2663726806640625, 0.3284912109375, 0.3906097412109375, 0.452728271484375, 0.5148468017578125, 0.57696533203125, 0.6390838623046875, 0.701202392578125, 0.7633209228515625, 0.825439453125, 0.8875579833984375, 0.949676513671875, 1.0117950439453125, 1.07391357421875, 1.1360321044921875, 1.198150634765625, 1.2602691650390625, 1.3223876953125, 1.3845062255859375, 1.446624755859375, 1.5087432861328125, 1.57086181640625, 1.6329803466796875, 1.695098876953125, 1.7572174072265625, 1.8193359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 11.0, 21.0, 13.0, 20.0, 33.0, 29.0, 48.0, 75.0, 94.0, 137.0, 196.0, 322.0, 437.0, 707.0, 1194.0, 2467.0, 6475.0, 28654.0, 219443.0, 682245.0, 83539.0, 13957.0, 3931.0, 1795.0, 968.0, 564.0, 361.0, 228.0, 152.0, 111.0, 95.0, 58.0, 52.0, 29.0, 24.0, 20.0, 9.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.94140625, -7.7283935546875, -7.515380859375, -7.3023681640625, -7.08935546875, -6.8763427734375, -6.663330078125, -6.4503173828125, -6.2373046875, -6.0242919921875, -5.811279296875, -5.5982666015625, -5.38525390625, -5.1722412109375, -4.959228515625, -4.7462158203125, -4.533203125, -4.3201904296875, -4.107177734375, -3.8941650390625, -3.68115234375, -3.4681396484375, -3.255126953125, -3.0421142578125, -2.8291015625, -2.6160888671875, -2.403076171875, -2.1900634765625, -1.97705078125, -1.7640380859375, -1.551025390625, -1.3380126953125, -1.125, -0.9119873046875, -0.698974609375, -0.4859619140625, -0.27294921875, -0.0599365234375, 0.153076171875, 0.3660888671875, 0.5791015625, 0.7921142578125, 1.005126953125, 1.2181396484375, 1.43115234375, 1.6441650390625, 1.857177734375, 2.0701904296875, 2.283203125, 2.4962158203125, 2.709228515625, 2.9222412109375, 3.13525390625, 3.3482666015625, 3.561279296875, 3.7742919921875, 3.9873046875, 4.2003173828125, 4.413330078125, 4.6263427734375, 4.83935546875, 5.0523681640625, 5.265380859375, 5.4783935546875, 5.69140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 3.0, 10.0, 13.0, 15.0, 18.0, 17.0, 30.0, 29.0, 30.0, 45.0, 47.0, 60.0, 52.0, 48.0, 53.0, 62.0, 67.0, 50.0, 53.0, 41.0, 44.0, 36.0, 26.0, 25.0, 28.0, 22.0, 16.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.6484375, -9.403076171875, -9.15771484375, -8.912353515625, -8.6669921875, -8.421630859375, -8.17626953125, -7.930908203125, -7.685546875, -7.440185546875, -7.19482421875, -6.949462890625, -6.7041015625, -6.458740234375, -6.21337890625, -5.968017578125, -5.72265625, -5.477294921875, -5.23193359375, -4.986572265625, -4.7412109375, -4.495849609375, -4.25048828125, -4.005126953125, -3.759765625, -3.514404296875, -3.26904296875, -3.023681640625, -2.7783203125, -2.532958984375, -2.28759765625, -2.042236328125, -1.796875, -1.551513671875, -1.30615234375, -1.060791015625, -0.8154296875, -0.570068359375, -0.32470703125, -0.079345703125, 0.166015625, 0.411376953125, 0.65673828125, 0.902099609375, 1.1474609375, 1.392822265625, 1.63818359375, 1.883544921875, 2.12890625, 2.374267578125, 2.61962890625, 2.864990234375, 3.1103515625, 3.355712890625, 3.60107421875, 3.846435546875, 4.091796875, 4.337158203125, 4.58251953125, 4.827880859375, 5.0732421875, 5.318603515625, 5.56396484375, 5.809326171875, 6.0546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 7.0, 9.0, 6.0, 21.0, 23.0, 34.0, 55.0, 50.0, 79.0, 115.0, 153.0, 222.0, 332.0, 615.0, 950.0, 1782.0, 3486.0, 7622.0, 19299.0, 55593.0, 179897.0, 510079.0, 178105.0, 55123.0, 19161.0, 7785.0, 3507.0, 1797.0, 962.0, 542.0, 361.0, 200.0, 173.0, 106.0, 83.0, 48.0, 34.0, 22.0, 17.0, 16.0, 9.0, 18.0, 6.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0], "bins": [-1.6611328125, -1.610015869140625, -1.55889892578125, -1.507781982421875, -1.4566650390625, -1.405548095703125, -1.35443115234375, -1.303314208984375, -1.252197265625, -1.201080322265625, -1.14996337890625, -1.098846435546875, -1.0477294921875, -0.996612548828125, -0.94549560546875, -0.894378662109375, -0.84326171875, -0.792144775390625, -0.74102783203125, -0.689910888671875, -0.6387939453125, -0.587677001953125, -0.53656005859375, -0.485443115234375, -0.434326171875, -0.383209228515625, -0.33209228515625, -0.280975341796875, -0.2298583984375, -0.178741455078125, -0.12762451171875, -0.076507568359375, -0.025390625, 0.025726318359375, 0.07684326171875, 0.127960205078125, 0.1790771484375, 0.230194091796875, 0.28131103515625, 0.332427978515625, 0.383544921875, 0.434661865234375, 0.48577880859375, 0.536895751953125, 0.5880126953125, 0.639129638671875, 0.69024658203125, 0.741363525390625, 0.79248046875, 0.843597412109375, 0.89471435546875, 0.945831298828125, 0.9969482421875, 1.048065185546875, 1.09918212890625, 1.150299072265625, 1.201416015625, 1.252532958984375, 1.30364990234375, 1.354766845703125, 1.4058837890625, 1.457000732421875, 1.50811767578125, 1.559234619140625, 1.6103515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 11.0, 4.0, 11.0, 9.0, 27.0, 30.0, 38.0, 45.0, 60.0, 90.0, 145.0, 188.0, 110.0, 57.0, 40.0, 43.0, 18.0, 24.0, 18.0, 14.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009059906005859375, -0.0008816048502922058, -0.0008572190999984741, -0.0008328333497047424, -0.0008084475994110107, -0.000784061849117279, -0.0007596760988235474, -0.0007352903485298157, -0.000710904598236084, -0.0006865188479423523, -0.0006621330976486206, -0.0006377473473548889, -0.0006133615970611572, -0.0005889758467674255, -0.0005645900964736938, -0.0005402043461799622, -0.0005158185958862305, -0.0004914328455924988, -0.0004670470952987671, -0.0004426613450050354, -0.0004182755947113037, -0.000393889844417572, -0.00036950409412384033, -0.00034511834383010864, -0.00032073259353637695, -0.00029634684324264526, -0.0002719610929489136, -0.0002475753426551819, -0.0002231895923614502, -0.0001988038420677185, -0.00017441809177398682, -0.00015003234148025513, -0.00012564659118652344, -0.00010126084089279175, -7.687509059906006e-05, -5.248934030532837e-05, -2.810359001159668e-05, -3.7178397178649902e-06, 2.06679105758667e-05, 4.505366086959839e-05, 6.943941116333008e-05, 9.382516145706177e-05, 0.00011821091175079346, 0.00014259666204452515, 0.00016698241233825684, 0.00019136816263198853, 0.00021575391292572021, 0.0002401396632194519, 0.0002645254135131836, 0.0002889111638069153, 0.00031329691410064697, 0.00033768266439437866, 0.00036206841468811035, 0.00038645416498184204, 0.00041083991527557373, 0.0004352256655693054, 0.0004596114158630371, 0.0004839971661567688, 0.0005083829164505005, 0.0005327686667442322, 0.0005571544170379639, 0.0005815401673316956, 0.0006059259176254272, 0.0006303116679191589, 0.0006546974182128906]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 5.0, 9.0, 15.0, 21.0, 30.0, 45.0, 48.0, 65.0, 118.0, 179.0, 262.0, 437.0, 842.0, 1558.0, 3540.0, 10174.0, 40402.0, 225977.0, 602687.0, 124945.0, 24565.0, 6912.0, 2661.0, 1231.0, 709.0, 369.0, 259.0, 162.0, 107.0, 62.0, 42.0, 34.0, 20.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.272735595703125, -2.19781494140625, -2.122894287109375, -2.0479736328125, -1.973052978515625, -1.89813232421875, -1.823211669921875, -1.748291015625, -1.673370361328125, -1.59844970703125, -1.523529052734375, -1.4486083984375, -1.373687744140625, -1.29876708984375, -1.223846435546875, -1.14892578125, -1.074005126953125, -0.99908447265625, -0.924163818359375, -0.8492431640625, -0.774322509765625, -0.69940185546875, -0.624481201171875, -0.549560546875, -0.474639892578125, -0.39971923828125, -0.324798583984375, -0.2498779296875, -0.174957275390625, -0.10003662109375, -0.025115966796875, 0.0498046875, 0.124725341796875, 0.19964599609375, 0.274566650390625, 0.3494873046875, 0.424407958984375, 0.49932861328125, 0.574249267578125, 0.649169921875, 0.724090576171875, 0.79901123046875, 0.873931884765625, 0.9488525390625, 1.023773193359375, 1.09869384765625, 1.173614501953125, 1.24853515625, 1.323455810546875, 1.39837646484375, 1.473297119140625, 1.5482177734375, 1.623138427734375, 1.69805908203125, 1.772979736328125, 1.847900390625, 1.922821044921875, 1.99774169921875, 2.072662353515625, 2.1475830078125, 2.222503662109375, 2.29742431640625, 2.372344970703125, 2.447265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 8.0, 16.0, 19.0, 12.0, 26.0, 27.0, 19.0, 34.0, 41.0, 47.0, 56.0, 67.0, 84.0, 52.0, 80.0, 64.0, 56.0, 48.0, 22.0, 25.0, 26.0, 15.0, 28.0, 18.0, 15.0, 11.0, 12.0, 10.0, 3.0, 11.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61260986328125, -1.5592041015625, -1.50579833984375, -1.452392578125, -1.39898681640625, -1.3455810546875, -1.29217529296875, -1.23876953125, -1.18536376953125, -1.1319580078125, -1.07855224609375, -1.025146484375, -0.97174072265625, -0.9183349609375, -0.86492919921875, -0.8115234375, -0.75811767578125, -0.7047119140625, -0.65130615234375, -0.597900390625, -0.54449462890625, -0.4910888671875, -0.43768310546875, -0.38427734375, -0.33087158203125, -0.2774658203125, -0.22406005859375, -0.170654296875, -0.11724853515625, -0.0638427734375, -0.01043701171875, 0.04296875, 0.09637451171875, 0.1497802734375, 0.20318603515625, 0.256591796875, 0.30999755859375, 0.3634033203125, 0.41680908203125, 0.47021484375, 0.52362060546875, 0.5770263671875, 0.63043212890625, 0.683837890625, 0.73724365234375, 0.7906494140625, 0.84405517578125, 0.8974609375, 0.95086669921875, 1.0042724609375, 1.05767822265625, 1.111083984375, 1.16448974609375, 1.2178955078125, 1.27130126953125, 1.32470703125, 1.37811279296875, 1.4315185546875, 1.48492431640625, 1.538330078125, 1.59173583984375, 1.6451416015625, 1.69854736328125, 1.751953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 23.0, 82.0, 179.0, 253.0, 248.0, 117.0, 54.0, 22.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.33924865722656, -51.71582794189453, -49.0924072265625, -46.46898651123047, -43.8455696105957, -41.22214889526367, -38.59872817993164, -35.975311279296875, -33.351890563964844, -30.728469848632812, -28.105051040649414, -25.481630325317383, -22.858211517333984, -20.234790802001953, -17.611370086669922, -14.987951278686523, -12.36452865600586, -9.741108894348145, -7.1176886558532715, -4.494268417358398, -1.8708486557006836, 0.7525711059570312, 3.3759918212890625, 5.999410629272461, 8.622831344604492, 11.246251106262207, 13.869670867919922, 16.493091583251953, 19.116512298583984, 21.739931106567383, 24.363351821899414, 26.986770629882812, 29.610191345214844, 32.233612060546875, 34.857032775878906, 37.48045349121094, 40.1038703918457, 42.727291107177734, 45.350711822509766, 47.97412872314453, 50.59754943847656, 53.220970153808594, 55.844390869140625, 58.467811584472656, 61.09122848510742, 63.71464920043945, 66.33807373046875, 68.96148681640625, 71.58491516113281, 74.20833587646484, 76.83175659179688, 79.4551773071289, 82.07859802246094, 84.70201110839844, 87.325439453125, 89.9488525390625, 92.57227325439453, 95.19569396972656, 97.8191146850586, 100.44253540039062, 103.06595611572266, 105.68937683105469, 108.31278991699219, 110.93621063232422, 113.55963134765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 17.0, 50.0, 39.0, 38.0, 32.0, 44.0, 52.0, 50.0, 55.0, 39.0, 47.0, 30.0, 45.0, 39.0, 40.0, 37.0, 30.0, 22.0, 31.0, 24.0, 18.0, 15.0, 11.0, 12.0, 7.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.92465591430664, -24.99482536315918, -24.064992904663086, -23.135162353515625, -22.205331802368164, -21.275501251220703, -20.34566879272461, -19.41583824157715, -18.486007690429688, -17.556177139282227, -16.626344680786133, -15.696514129638672, -14.766683578491211, -13.836852073669434, -12.907020568847656, -11.977190017700195, -11.047358512878418, -10.11752700805664, -9.18769645690918, -8.257864952087402, -7.328034400939941, -6.398202896118164, -5.468371868133545, -4.538540840148926, -3.6087098121643066, -2.6788787841796875, -1.7490476369857788, -0.8192164897918701, 0.11061453819274902, 1.0404458045959473, 1.9702768325805664, 2.9001078605651855, 3.8299388885498047, 4.759769916534424, 5.689600944519043, 6.61943244934082, 7.549263000488281, 8.479094505310059, 9.408926010131836, 10.338756561279297, 11.268587112426758, 12.198418617248535, 13.128249168395996, 14.058080673217773, 14.987911224365234, 15.917742729187012, 16.84757423400879, 17.77740478515625, 18.707237243652344, 19.637067794799805, 20.5669002532959, 21.49673080444336, 22.42656135559082, 23.35639190673828, 24.286224365234375, 25.216054916381836, 26.145885467529297, 27.075716018676758, 28.00554847717285, 28.935379028320312, 29.865209579467773, 30.795040130615234, 31.724872589111328, 32.654701232910156, 33.58453369140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 13.0, 16.0, 27.0, 50.0, 82.0, 134.0, 218.0, 378.0, 730.0, 1398.0, 2791.0, 6263.0, 15490.0, 46147.0, 221830.0, 3062423.0, 714655.0, 81176.0, 23810.0, 9025.0, 3785.0, 1796.0, 880.0, 473.0, 279.0, 165.0, 81.0, 60.0, 39.0, 23.0, 16.0, 5.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.806640625, -3.682708740234375, -3.55877685546875, -3.434844970703125, -3.3109130859375, -3.186981201171875, -3.06304931640625, -2.939117431640625, -2.815185546875, -2.691253662109375, -2.56732177734375, -2.443389892578125, -2.3194580078125, -2.195526123046875, -2.07159423828125, -1.947662353515625, -1.82373046875, -1.699798583984375, -1.57586669921875, -1.451934814453125, -1.3280029296875, -1.204071044921875, -1.08013916015625, -0.956207275390625, -0.832275390625, -0.708343505859375, -0.58441162109375, -0.460479736328125, -0.3365478515625, -0.212615966796875, -0.08868408203125, 0.035247802734375, 0.1591796875, 0.283111572265625, 0.40704345703125, 0.530975341796875, 0.6549072265625, 0.778839111328125, 0.90277099609375, 1.026702880859375, 1.150634765625, 1.274566650390625, 1.39849853515625, 1.522430419921875, 1.6463623046875, 1.770294189453125, 1.89422607421875, 2.018157958984375, 2.14208984375, 2.266021728515625, 2.38995361328125, 2.513885498046875, 2.6378173828125, 2.761749267578125, 2.88568115234375, 3.009613037109375, 3.133544921875, 3.257476806640625, 3.38140869140625, 3.505340576171875, 3.6292724609375, 3.753204345703125, 3.87713623046875, 4.001068115234375, 4.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 2.0, 10.0, 14.0, 16.0, 11.0, 17.0, 29.0, 24.0, 37.0, 30.0, 37.0, 55.0, 46.0, 56.0, 55.0, 58.0, 49.0, 52.0, 51.0, 46.0, 47.0, 42.0, 37.0, 34.0, 37.0, 27.0, 21.0, 13.0, 12.0, 8.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.09765625, -2.0394134521484375, -1.981170654296875, -1.9229278564453125, -1.86468505859375, -1.8064422607421875, -1.748199462890625, -1.6899566650390625, -1.6317138671875, -1.5734710693359375, -1.515228271484375, -1.4569854736328125, -1.39874267578125, -1.3404998779296875, -1.282257080078125, -1.2240142822265625, -1.165771484375, -1.1075286865234375, -1.049285888671875, -0.9910430908203125, -0.93280029296875, -0.8745574951171875, -0.816314697265625, -0.7580718994140625, -0.6998291015625, -0.6415863037109375, -0.583343505859375, -0.5251007080078125, -0.46685791015625, -0.4086151123046875, -0.350372314453125, -0.2921295166015625, -0.23388671875, -0.1756439208984375, -0.117401123046875, -0.0591583251953125, -0.00091552734375, 0.0573272705078125, 0.115570068359375, 0.1738128662109375, 0.2320556640625, 0.2902984619140625, 0.348541259765625, 0.4067840576171875, 0.46502685546875, 0.5232696533203125, 0.581512451171875, 0.6397552490234375, 0.697998046875, 0.7562408447265625, 0.814483642578125, 0.8727264404296875, 0.93096923828125, 0.9892120361328125, 1.047454833984375, 1.1056976318359375, 1.1639404296875, 1.2221832275390625, 1.280426025390625, 1.3386688232421875, 1.39691162109375, 1.4551544189453125, 1.513397216796875, 1.5716400146484375, 1.6298828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 15.0, 18.0, 27.0, 27.0, 47.0, 72.0, 100.0, 161.0, 301.0, 481.0, 998.0, 2225.0, 5333.0, 14975.0, 55191.0, 409637.0, 3402055.0, 242913.0, 40631.0, 11417.0, 4124.0, 1687.0, 820.0, 417.0, 224.0, 133.0, 81.0, 51.0, 32.0, 12.0, 14.0, 22.0, 7.0, 8.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.1644287109375, -4.012451171875, -3.8604736328125, -3.70849609375, -3.5565185546875, -3.404541015625, -3.2525634765625, -3.1005859375, -2.9486083984375, -2.796630859375, -2.6446533203125, -2.49267578125, -2.3406982421875, -2.188720703125, -2.0367431640625, -1.884765625, -1.7327880859375, -1.580810546875, -1.4288330078125, -1.27685546875, -1.1248779296875, -0.972900390625, -0.8209228515625, -0.6689453125, -0.5169677734375, -0.364990234375, -0.2130126953125, -0.06103515625, 0.0909423828125, 0.242919921875, 0.3948974609375, 0.546875, 0.6988525390625, 0.850830078125, 1.0028076171875, 1.15478515625, 1.3067626953125, 1.458740234375, 1.6107177734375, 1.7626953125, 1.9146728515625, 2.066650390625, 2.2186279296875, 2.37060546875, 2.5225830078125, 2.674560546875, 2.8265380859375, 2.978515625, 3.1304931640625, 3.282470703125, 3.4344482421875, 3.58642578125, 3.7384033203125, 3.890380859375, 4.0423583984375, 4.1943359375, 4.3463134765625, 4.498291015625, 4.6502685546875, 4.80224609375, 4.9542236328125, 5.106201171875, 5.2581787109375, 5.41015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 11.0, 23.0, 23.0, 22.0, 47.0, 54.0, 94.0, 160.0, 294.0, 828.0, 1213.0, 620.0, 307.0, 144.0, 71.0, 44.0, 32.0, 14.0, 16.0, 6.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7998046875, -5.615234375, -5.4306640625, -5.24609375, -5.0615234375, -4.876953125, -4.6923828125, -4.5078125, -4.3232421875, -4.138671875, -3.9541015625, -3.76953125, -3.5849609375, -3.400390625, -3.2158203125, -3.03125, -2.8466796875, -2.662109375, -2.4775390625, -2.29296875, -2.1083984375, -1.923828125, -1.7392578125, -1.5546875, -1.3701171875, -1.185546875, -1.0009765625, -0.81640625, -0.6318359375, -0.447265625, -0.2626953125, -0.078125, 0.1064453125, 0.291015625, 0.4755859375, 0.66015625, 0.8447265625, 1.029296875, 1.2138671875, 1.3984375, 1.5830078125, 1.767578125, 1.9521484375, 2.13671875, 2.3212890625, 2.505859375, 2.6904296875, 2.875, 3.0595703125, 3.244140625, 3.4287109375, 3.61328125, 3.7978515625, 3.982421875, 4.1669921875, 4.3515625, 4.5361328125, 4.720703125, 4.9052734375, 5.08984375, 5.2744140625, 5.458984375, 5.6435546875, 5.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 0.0, 3.0, 4.0, 8.0, 6.0, 12.0, 20.0, 20.0, 42.0, 57.0, 116.0, 174.0, 215.0, 155.0, 85.0, 41.0, 16.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.24077606201172, -80.50762176513672, -78.77445983886719, -77.04130554199219, -75.30814361572266, -73.57498931884766, -71.84182739257812, -70.10867309570312, -68.3755111694336, -66.6423568725586, -64.90919494628906, -63.1760368347168, -61.44287872314453, -59.709720611572266, -57.9765625, -56.243404388427734, -54.51024627685547, -52.7770881652832, -51.04393005371094, -49.31077194213867, -47.577613830566406, -45.84445571899414, -44.111297607421875, -42.37813949584961, -40.64498519897461, -38.911827087402344, -37.17866897583008, -35.44551086425781, -33.71235275268555, -31.97919464111328, -30.246036529541016, -28.51287841796875, -26.779720306396484, -25.04656219482422, -23.313404083251953, -21.580245971679688, -19.847087860107422, -18.113929748535156, -16.38077163696289, -14.647614479064941, -12.914456367492676, -11.18129825592041, -9.448140144348145, -7.714982509613037, -5.9818243980407715, -4.248666763305664, -2.5155086517333984, -0.7823505401611328, 0.9508075714111328, 2.6839656829833984, 4.417123794555664, 6.1502814292907715, 7.883439540863037, 9.616597175598145, 11.34975528717041, 13.082913398742676, 14.816071510314941, 16.54922866821289, 18.282386779785156, 20.015544891357422, 21.748703002929688, 23.481861114501953, 25.21501922607422, 26.948177337646484, 28.68133544921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 15.0, 22.0, 22.0, 17.0, 25.0, 30.0, 24.0, 26.0, 39.0, 39.0, 31.0, 36.0, 38.0, 47.0, 38.0, 37.0, 43.0, 40.0, 33.0, 48.0, 38.0, 36.0, 38.0, 29.0, 39.0, 24.0, 24.0, 19.0, 18.0, 19.0, 6.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.709545135498047, -22.95271110534668, -22.195877075195312, -21.439043045043945, -20.682209014892578, -19.92537498474121, -19.168540954589844, -18.41170883178711, -17.65487289428711, -16.898038864135742, -16.141204833984375, -15.384370803833008, -14.62753677368164, -13.870702743530273, -13.113869667053223, -12.357035636901855, -11.600202560424805, -10.843368530273438, -10.08653450012207, -9.329700469970703, -8.572866439819336, -7.816032886505127, -7.059199333190918, -6.302365303039551, -5.545531272888184, -4.788697242736816, -4.031863212585449, -3.2750296592712402, -2.518195629119873, -1.7613615989685059, -1.0045280456542969, -0.2476940155029297, 0.5091381072998047, 1.2659720182418823, 2.02280592918396, 2.779639720916748, 3.5364737510681152, 4.293307781219482, 5.050141334533691, 5.806975364685059, 6.563809394836426, 7.320643424987793, 8.07747745513916, 8.834310531616211, 9.591144561767578, 10.347978591918945, 11.104812622070312, 11.86164665222168, 12.618480682373047, 13.375314712524414, 14.132148742675781, 14.888982772827148, 15.645816802978516, 16.402650833129883, 17.15948486328125, 17.916316986083984, 18.673152923583984, 19.42998695373535, 20.18682098388672, 20.943655014038086, 21.700489044189453, 22.45732307434082, 23.214157104492188, 23.970989227294922, 24.72782325744629]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 5.0, 18.0, 22.0, 35.0, 52.0, 85.0, 157.0, 235.0, 412.0, 721.0, 1248.0, 2263.0, 4441.0, 9073.0, 20757.0, 54174.0, 214790.0, 534412.0, 134038.0, 40176.0, 15953.0, 7209.0, 3651.0, 1978.0, 1121.0, 604.0, 347.0, 201.0, 146.0, 94.0, 45.0, 36.0, 16.0, 19.0, 14.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.82275390625, -4.6689453125, -4.51513671875, -4.361328125, -4.20751953125, -4.0537109375, -3.89990234375, -3.74609375, -3.59228515625, -3.4384765625, -3.28466796875, -3.130859375, -2.97705078125, -2.8232421875, -2.66943359375, -2.515625, -2.36181640625, -2.2080078125, -2.05419921875, -1.900390625, -1.74658203125, -1.5927734375, -1.43896484375, -1.28515625, -1.13134765625, -0.9775390625, -0.82373046875, -0.669921875, -0.51611328125, -0.3623046875, -0.20849609375, -0.0546875, 0.09912109375, 0.2529296875, 0.40673828125, 0.560546875, 0.71435546875, 0.8681640625, 1.02197265625, 1.17578125, 1.32958984375, 1.4833984375, 1.63720703125, 1.791015625, 1.94482421875, 2.0986328125, 2.25244140625, 2.40625, 2.56005859375, 2.7138671875, 2.86767578125, 3.021484375, 3.17529296875, 3.3291015625, 3.48291015625, 3.63671875, 3.79052734375, 3.9443359375, 4.09814453125, 4.251953125, 4.40576171875, 4.5595703125, 4.71337890625, 4.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 9.0, 17.0, 14.0, 19.0, 28.0, 26.0, 32.0, 30.0, 35.0, 35.0, 41.0, 43.0, 52.0, 40.0, 56.0, 55.0, 53.0, 48.0, 60.0, 39.0, 34.0, 32.0, 31.0, 29.0, 25.0, 22.0, 24.0, 16.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.172637939453125, -2.11480712890625, -2.056976318359375, -1.9991455078125, -1.941314697265625, -1.88348388671875, -1.825653076171875, -1.767822265625, -1.709991455078125, -1.65216064453125, -1.594329833984375, -1.5364990234375, -1.478668212890625, -1.42083740234375, -1.363006591796875, -1.30517578125, -1.247344970703125, -1.18951416015625, -1.131683349609375, -1.0738525390625, -1.016021728515625, -0.95819091796875, -0.900360107421875, -0.842529296875, -0.784698486328125, -0.72686767578125, -0.669036865234375, -0.6112060546875, -0.553375244140625, -0.49554443359375, -0.437713623046875, -0.3798828125, -0.322052001953125, -0.26422119140625, -0.206390380859375, -0.1485595703125, -0.090728759765625, -0.03289794921875, 0.024932861328125, 0.082763671875, 0.140594482421875, 0.19842529296875, 0.256256103515625, 0.3140869140625, 0.371917724609375, 0.42974853515625, 0.487579345703125, 0.54541015625, 0.603240966796875, 0.66107177734375, 0.718902587890625, 0.7767333984375, 0.834564208984375, 0.89239501953125, 0.950225830078125, 1.008056640625, 1.065887451171875, 1.12371826171875, 1.181549072265625, 1.2393798828125, 1.297210693359375, 1.35504150390625, 1.412872314453125, 1.470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 4.0, 9.0, 9.0, 20.0, 25.0, 39.0, 57.0, 91.0, 131.0, 209.0, 348.0, 601.0, 1139.0, 2652.0, 9504.0, 72258.0, 869258.0, 76908.0, 9888.0, 2738.0, 1208.0, 542.0, 314.0, 207.0, 131.0, 68.0, 65.0, 45.0, 19.0, 19.0, 14.0, 13.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0440673828125, -7.728759765625, -7.4134521484375, -7.09814453125, -6.7828369140625, -6.467529296875, -6.1522216796875, -5.8369140625, -5.5216064453125, -5.206298828125, -4.8909912109375, -4.57568359375, -4.2603759765625, -3.945068359375, -3.6297607421875, -3.314453125, -2.9991455078125, -2.683837890625, -2.3685302734375, -2.05322265625, -1.7379150390625, -1.422607421875, -1.1072998046875, -0.7919921875, -0.4766845703125, -0.161376953125, 0.1539306640625, 0.46923828125, 0.7845458984375, 1.099853515625, 1.4151611328125, 1.73046875, 2.0457763671875, 2.361083984375, 2.6763916015625, 2.99169921875, 3.3070068359375, 3.622314453125, 3.9376220703125, 4.2529296875, 4.5682373046875, 4.883544921875, 5.1988525390625, 5.51416015625, 5.8294677734375, 6.144775390625, 6.4600830078125, 6.775390625, 7.0906982421875, 7.406005859375, 7.7213134765625, 8.03662109375, 8.3519287109375, 8.667236328125, 8.9825439453125, 9.2978515625, 9.6131591796875, 9.928466796875, 10.2437744140625, 10.55908203125, 10.8743896484375, 11.189697265625, 11.5050048828125, 11.8203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 9.0, 6.0, 8.0, 3.0, 7.0, 9.0, 13.0, 13.0, 17.0, 25.0, 42.0, 27.0, 33.0, 40.0, 44.0, 57.0, 56.0, 57.0, 42.0, 48.0, 47.0, 55.0, 58.0, 44.0, 53.0, 37.0, 24.0, 35.0, 24.0, 19.0, 19.0, 6.0, 7.0, 4.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.89453125, -7.63128662109375, -7.3680419921875, -7.10479736328125, -6.841552734375, -6.57830810546875, -6.3150634765625, -6.05181884765625, -5.78857421875, -5.52532958984375, -5.2620849609375, -4.99884033203125, -4.735595703125, -4.47235107421875, -4.2091064453125, -3.94586181640625, -3.6826171875, -3.41937255859375, -3.1561279296875, -2.89288330078125, -2.629638671875, -2.36639404296875, -2.1031494140625, -1.83990478515625, -1.57666015625, -1.31341552734375, -1.0501708984375, -0.78692626953125, -0.523681640625, -0.26043701171875, 0.0028076171875, 0.26605224609375, 0.529296875, 0.79254150390625, 1.0557861328125, 1.31903076171875, 1.582275390625, 1.84552001953125, 2.1087646484375, 2.37200927734375, 2.63525390625, 2.89849853515625, 3.1617431640625, 3.42498779296875, 3.688232421875, 3.95147705078125, 4.2147216796875, 4.47796630859375, 4.7412109375, 5.00445556640625, 5.2677001953125, 5.53094482421875, 5.794189453125, 6.05743408203125, 6.3206787109375, 6.58392333984375, 6.84716796875, 7.11041259765625, 7.3736572265625, 7.63690185546875, 7.900146484375, 8.16339111328125, 8.4266357421875, 8.68988037109375, 8.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 16.0, 18.0, 25.0, 36.0, 51.0, 100.0, 166.0, 326.0, 588.0, 1319.0, 3443.0, 10184.0, 37700.0, 444717.0, 494895.0, 38450.0, 10274.0, 3521.0, 1364.0, 589.0, 293.0, 178.0, 99.0, 52.0, 32.0, 24.0, 19.0, 14.0, 13.0, 8.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0], "bins": [-5.20703125, -5.080047607421875, -4.95306396484375, -4.826080322265625, -4.6990966796875, -4.572113037109375, -4.44512939453125, -4.318145751953125, -4.191162109375, -4.064178466796875, -3.93719482421875, -3.810211181640625, -3.6832275390625, -3.556243896484375, -3.42926025390625, -3.302276611328125, -3.17529296875, -3.048309326171875, -2.92132568359375, -2.794342041015625, -2.6673583984375, -2.540374755859375, -2.41339111328125, -2.286407470703125, -2.159423828125, -2.032440185546875, -1.90545654296875, -1.778472900390625, -1.6514892578125, -1.524505615234375, -1.39752197265625, -1.270538330078125, -1.1435546875, -1.016571044921875, -0.88958740234375, -0.762603759765625, -0.6356201171875, -0.508636474609375, -0.38165283203125, -0.254669189453125, -0.127685546875, -0.000701904296875, 0.12628173828125, 0.253265380859375, 0.3802490234375, 0.507232666015625, 0.63421630859375, 0.761199951171875, 0.88818359375, 1.015167236328125, 1.14215087890625, 1.269134521484375, 1.3961181640625, 1.523101806640625, 1.65008544921875, 1.777069091796875, 1.904052734375, 2.031036376953125, 2.15802001953125, 2.285003662109375, 2.4119873046875, 2.538970947265625, 2.66595458984375, 2.792938232421875, 2.919921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 5.0, 6.0, 6.0, 7.0, 19.0, 17.0, 35.0, 38.0, 72.0, 198.0, 271.0, 134.0, 54.0, 27.0, 25.0, 17.0, 11.0, 5.0, 9.0, 4.0, 7.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011396408081054688, -0.0011032074689865112, -0.0010667741298675537, -0.0010303407907485962, -0.0009939074516296387, -0.0009574741125106812, -0.0009210407733917236, -0.0008846074342727661, -0.0008481740951538086, -0.0008117407560348511, -0.0007753074169158936, -0.000738874077796936, -0.0007024407386779785, -0.000666007399559021, -0.0006295740604400635, -0.000593140721321106, -0.0005567073822021484, -0.0005202740430831909, -0.0004838407039642334, -0.0004474073648452759, -0.00041097402572631836, -0.00037454068660736084, -0.0003381073474884033, -0.0003016740083694458, -0.0002652406692504883, -0.00022880733013153076, -0.00019237399101257324, -0.00015594065189361572, -0.0001195073127746582, -8.307397365570068e-05, -4.6640634536743164e-05, -1.0207295417785645e-05, 2.6226043701171875e-05, 6.26593828201294e-05, 9.909272193908691e-05, 0.00013552606105804443, 0.00017195940017700195, 0.00020839273929595947, 0.000244826078414917, 0.0002812594175338745, 0.00031769275665283203, 0.00035412609577178955, 0.00039055943489074707, 0.0004269927740097046, 0.0004634261131286621, 0.0004998594522476196, 0.0005362927913665771, 0.0005727261304855347, 0.0006091594696044922, 0.0006455928087234497, 0.0006820261478424072, 0.0007184594869613647, 0.0007548928260803223, 0.0007913261651992798, 0.0008277595043182373, 0.0008641928434371948, 0.0009006261825561523, 0.0009370595216751099, 0.0009734928607940674, 0.001009926199913025, 0.0010463595390319824, 0.00108279287815094, 0.0011192262172698975, 0.001155659556388855, 0.0011920928955078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 9.0, 8.0, 21.0, 19.0, 33.0, 45.0, 107.0, 160.0, 276.0, 534.0, 1222.0, 3217.0, 11507.0, 71179.0, 830680.0, 108069.0, 14768.0, 3920.0, 1381.0, 632.0, 300.0, 181.0, 90.0, 67.0, 41.0, 28.0, 18.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.015625, -4.86627197265625, -4.7169189453125, -4.56756591796875, -4.418212890625, -4.26885986328125, -4.1195068359375, -3.97015380859375, -3.82080078125, -3.67144775390625, -3.5220947265625, -3.37274169921875, -3.223388671875, -3.07403564453125, -2.9246826171875, -2.77532958984375, -2.6259765625, -2.47662353515625, -2.3272705078125, -2.17791748046875, -2.028564453125, -1.87921142578125, -1.7298583984375, -1.58050537109375, -1.43115234375, -1.28179931640625, -1.1324462890625, -0.98309326171875, -0.833740234375, -0.68438720703125, -0.5350341796875, -0.38568115234375, -0.236328125, -0.08697509765625, 0.0623779296875, 0.21173095703125, 0.361083984375, 0.51043701171875, 0.6597900390625, 0.80914306640625, 0.95849609375, 1.10784912109375, 1.2572021484375, 1.40655517578125, 1.555908203125, 1.70526123046875, 1.8546142578125, 2.00396728515625, 2.1533203125, 2.30267333984375, 2.4520263671875, 2.60137939453125, 2.750732421875, 2.90008544921875, 3.0494384765625, 3.19879150390625, 3.34814453125, 3.49749755859375, 3.6468505859375, 3.79620361328125, 3.945556640625, 4.09490966796875, 4.2442626953125, 4.39361572265625, 4.54296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 6.0, 7.0, 12.0, 16.0, 18.0, 26.0, 38.0, 45.0, 65.0, 97.0, 123.0, 114.0, 110.0, 81.0, 51.0, 45.0, 31.0, 29.0, 21.0, 13.0, 7.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.39666748046875, -2.2933349609375, -2.19000244140625, -2.086669921875, -1.98333740234375, -1.8800048828125, -1.77667236328125, -1.67333984375, -1.57000732421875, -1.4666748046875, -1.36334228515625, -1.260009765625, -1.15667724609375, -1.0533447265625, -0.95001220703125, -0.8466796875, -0.74334716796875, -0.6400146484375, -0.53668212890625, -0.433349609375, -0.33001708984375, -0.2266845703125, -0.12335205078125, -0.02001953125, 0.08331298828125, 0.1866455078125, 0.28997802734375, 0.393310546875, 0.49664306640625, 0.5999755859375, 0.70330810546875, 0.806640625, 0.90997314453125, 1.0133056640625, 1.11663818359375, 1.219970703125, 1.32330322265625, 1.4266357421875, 1.52996826171875, 1.63330078125, 1.73663330078125, 1.8399658203125, 1.94329833984375, 2.046630859375, 2.14996337890625, 2.2532958984375, 2.35662841796875, 2.4599609375, 2.56329345703125, 2.6666259765625, 2.76995849609375, 2.873291015625, 2.97662353515625, 3.0799560546875, 3.18328857421875, 3.28662109375, 3.38995361328125, 3.4932861328125, 3.59661865234375, 3.699951171875, 3.80328369140625, 3.9066162109375, 4.00994873046875, 4.11328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 1.0, 5.0, 5.0, 13.0, 26.0, 42.0, 83.0, 93.0, 141.0, 159.0, 139.0, 94.0, 75.0, 42.0, 32.0, 14.0, 11.0, 5.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.12789535522461, -34.59796905517578, -33.06803894042969, -31.53811264038086, -30.00818634033203, -28.47825813293457, -26.94832992553711, -25.41840362548828, -23.88847541809082, -22.35854721069336, -20.82862091064453, -19.29869270324707, -17.76876449584961, -16.23883819580078, -14.70890998840332, -13.178982734680176, -11.649055480957031, -10.119128227233887, -8.589200973510742, -7.059272766113281, -5.529345512390137, -3.999418258666992, -2.4694900512695312, -0.9395627975463867, 0.5903644561767578, 2.1202919483184814, 3.650219440460205, 5.180147171020508, 6.710074424743652, 8.240001678466797, 9.769929885864258, 11.299857139587402, 12.829784393310547, 14.359711647033691, 15.889638900756836, 17.419567108154297, 18.949493408203125, 20.479421615600586, 22.009349822998047, 23.539276123046875, 25.069204330444336, 26.599132537841797, 28.129058837890625, 29.658987045288086, 31.188915252685547, 32.718841552734375, 34.24877166748047, 35.7786979675293, 37.308624267578125, 38.83855056762695, 40.36848068237305, 41.898406982421875, 43.4283332824707, 44.95825958251953, 46.488189697265625, 48.01811599731445, 49.54804229736328, 51.07796859741211, 52.6078987121582, 54.13782501220703, 55.66775131225586, 57.19767761230469, 58.72760772705078, 60.25753402709961, 61.7874641418457]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 5.0, 9.0, 9.0, 16.0, 8.0, 18.0, 15.0, 26.0, 17.0, 15.0, 18.0, 27.0, 29.0, 26.0, 29.0, 33.0, 52.0, 42.0, 47.0, 41.0, 47.0, 49.0, 43.0, 50.0, 31.0, 35.0, 24.0, 31.0, 41.0, 22.0, 15.0, 23.0, 16.0, 16.0, 10.0, 16.0, 10.0, 8.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.409465789794922, -26.574079513549805, -25.738693237304688, -24.903305053710938, -24.06791877746582, -23.232532501220703, -22.397144317626953, -21.561758041381836, -20.72637176513672, -19.8909854888916, -19.055599212646484, -18.220211029052734, -17.384824752807617, -16.5494384765625, -15.714051246643066, -14.878664016723633, -14.043277740478516, -13.207891464233398, -12.372504234313965, -11.537117004394531, -10.701730728149414, -9.866344451904297, -9.030957221984863, -8.19556999206543, -7.3601837158203125, -6.524796962738037, -5.689410209655762, -4.854023456573486, -4.018636703491211, -3.1832499504089355, -2.34786319732666, -1.5124764442443848, -0.6770896911621094, 0.15829706192016602, 0.9936838150024414, 1.8290705680847168, 2.664457321166992, 3.4998440742492676, 4.335230827331543, 5.170617580413818, 6.006004333496094, 6.841391086578369, 7.6767778396606445, 8.512165069580078, 9.347551345825195, 10.182937622070312, 11.018324851989746, 11.85371208190918, 12.689098358154297, 13.524484634399414, 14.359871864318848, 15.195259094238281, 16.0306453704834, 16.866031646728516, 17.701419830322266, 18.536806106567383, 19.3721923828125, 20.207578659057617, 21.042964935302734, 21.878353118896484, 22.7137393951416, 23.54912567138672, 24.38451385498047, 25.219900131225586, 26.055286407470703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 10.0, 19.0, 21.0, 19.0, 36.0, 46.0, 72.0, 77.0, 130.0, 240.0, 795.0, 9504.0, 2650207.0, 1523389.0, 8351.0, 713.0, 200.0, 132.0, 76.0, 54.0, 47.0, 37.0, 20.0, 17.0, 21.0, 11.0, 6.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.2342529296875, -9.788818359375, -9.3433837890625, -8.89794921875, -8.4525146484375, -8.007080078125, -7.5616455078125, -7.1162109375, -6.6707763671875, -6.225341796875, -5.7799072265625, -5.33447265625, -4.8890380859375, -4.443603515625, -3.9981689453125, -3.552734375, -3.1072998046875, -2.661865234375, -2.2164306640625, -1.77099609375, -1.3255615234375, -0.880126953125, -0.4346923828125, 0.0107421875, 0.4561767578125, 0.901611328125, 1.3470458984375, 1.79248046875, 2.2379150390625, 2.683349609375, 3.1287841796875, 3.57421875, 4.0196533203125, 4.465087890625, 4.9105224609375, 5.35595703125, 5.8013916015625, 6.246826171875, 6.6922607421875, 7.1376953125, 7.5831298828125, 8.028564453125, 8.4739990234375, 8.91943359375, 9.3648681640625, 9.810302734375, 10.2557373046875, 10.701171875, 11.1466064453125, 11.592041015625, 12.0374755859375, 12.48291015625, 12.9283447265625, 13.373779296875, 13.8192138671875, 14.2646484375, 14.7100830078125, 15.155517578125, 15.6009521484375, 16.04638671875, 16.4918212890625, 16.937255859375, 17.3826904296875, 17.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 8.0, 15.0, 19.0, 16.0, 20.0, 22.0, 34.0, 45.0, 34.0, 42.0, 54.0, 58.0, 59.0, 76.0, 39.0, 50.0, 52.0, 58.0, 60.0, 44.0, 26.0, 31.0, 35.0, 20.0, 20.0, 17.0, 7.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.12127685546875, -2.0589599609375, -1.99664306640625, -1.934326171875, -1.87200927734375, -1.8096923828125, -1.74737548828125, -1.68505859375, -1.62274169921875, -1.5604248046875, -1.49810791015625, -1.435791015625, -1.37347412109375, -1.3111572265625, -1.24884033203125, -1.1865234375, -1.12420654296875, -1.0618896484375, -0.99957275390625, -0.937255859375, -0.87493896484375, -0.8126220703125, -0.75030517578125, -0.68798828125, -0.62567138671875, -0.5633544921875, -0.50103759765625, -0.438720703125, -0.37640380859375, -0.3140869140625, -0.25177001953125, -0.189453125, -0.12713623046875, -0.0648193359375, -0.00250244140625, 0.059814453125, 0.12213134765625, 0.1844482421875, 0.24676513671875, 0.30908203125, 0.37139892578125, 0.4337158203125, 0.49603271484375, 0.558349609375, 0.62066650390625, 0.6829833984375, 0.74530029296875, 0.8076171875, 0.86993408203125, 0.9322509765625, 0.99456787109375, 1.056884765625, 1.11920166015625, 1.1815185546875, 1.24383544921875, 1.30615234375, 1.36846923828125, 1.4307861328125, 1.49310302734375, 1.555419921875, 1.61773681640625, 1.6800537109375, 1.74237060546875, 1.8046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 19.0, 34.0, 31.0, 53.0, 92.0, 174.0, 239.0, 436.0, 855.0, 1449.0, 2980.0, 5939.0, 12725.0, 31139.0, 94880.0, 517164.0, 2870596.0, 505603.0, 94379.0, 30657.0, 12413.0, 5840.0, 2870.0, 1581.0, 848.0, 492.0, 281.0, 190.0, 104.0, 70.0, 37.0, 27.0, 20.0, 10.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.139251708984375, -3.03631591796875, -2.933380126953125, -2.8304443359375, -2.727508544921875, -2.62457275390625, -2.521636962890625, -2.418701171875, -2.315765380859375, -2.21282958984375, -2.109893798828125, -2.0069580078125, -1.904022216796875, -1.80108642578125, -1.698150634765625, -1.59521484375, -1.492279052734375, -1.38934326171875, -1.286407470703125, -1.1834716796875, -1.080535888671875, -0.97760009765625, -0.874664306640625, -0.771728515625, -0.668792724609375, -0.56585693359375, -0.462921142578125, -0.3599853515625, -0.257049560546875, -0.15411376953125, -0.051177978515625, 0.0517578125, 0.154693603515625, 0.25762939453125, 0.360565185546875, 0.4635009765625, 0.566436767578125, 0.66937255859375, 0.772308349609375, 0.875244140625, 0.978179931640625, 1.08111572265625, 1.184051513671875, 1.2869873046875, 1.389923095703125, 1.49285888671875, 1.595794677734375, 1.69873046875, 1.801666259765625, 1.90460205078125, 2.007537841796875, 2.1104736328125, 2.213409423828125, 2.31634521484375, 2.419281005859375, 2.522216796875, 2.625152587890625, 2.72808837890625, 2.831024169921875, 2.9339599609375, 3.036895751953125, 3.13983154296875, 3.242767333984375, 3.345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 11.0, 12.0, 10.0, 18.0, 15.0, 32.0, 38.0, 58.0, 74.0, 119.0, 203.0, 368.0, 654.0, 878.0, 601.0, 346.0, 219.0, 130.0, 73.0, 50.0, 36.0, 27.0, 19.0, 21.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.69921875, -3.56488037109375, -3.4305419921875, -3.29620361328125, -3.161865234375, -3.02752685546875, -2.8931884765625, -2.75885009765625, -2.62451171875, -2.49017333984375, -2.3558349609375, -2.22149658203125, -2.087158203125, -1.95281982421875, -1.8184814453125, -1.68414306640625, -1.5498046875, -1.41546630859375, -1.2811279296875, -1.14678955078125, -1.012451171875, -0.87811279296875, -0.7437744140625, -0.60943603515625, -0.47509765625, -0.34075927734375, -0.2064208984375, -0.07208251953125, 0.062255859375, 0.19659423828125, 0.3309326171875, 0.46527099609375, 0.599609375, 0.73394775390625, 0.8682861328125, 1.00262451171875, 1.136962890625, 1.27130126953125, 1.4056396484375, 1.53997802734375, 1.67431640625, 1.80865478515625, 1.9429931640625, 2.07733154296875, 2.211669921875, 2.34600830078125, 2.4803466796875, 2.61468505859375, 2.7490234375, 2.88336181640625, 3.0177001953125, 3.15203857421875, 3.286376953125, 3.42071533203125, 3.5550537109375, 3.68939208984375, 3.82373046875, 3.95806884765625, 4.0924072265625, 4.22674560546875, 4.361083984375, 4.49542236328125, 4.6297607421875, 4.76409912109375, 4.8984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 37.0, 132.0, 365.0, 326.0, 84.0, 31.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.76509094238281, -65.88572692871094, -63.006370544433594, -60.127010345458984, -57.247650146484375, -54.368289947509766, -51.488929748535156, -48.60956573486328, -45.73020935058594, -42.85084915161133, -39.97148895263672, -37.09212875366211, -34.2127685546875, -31.33340835571289, -28.45404624938965, -25.57468605041504, -22.695323944091797, -19.815963745117188, -16.936603546142578, -14.057242393493652, -11.177882194519043, -8.298521995544434, -5.419160842895508, -2.5398006439208984, 0.33955955505371094, 3.2189199924468994, 6.098280429840088, 8.977641105651855, 11.857001304626465, 14.736361503601074, 17.61572265625, 20.49508285522461, 23.37444305419922, 26.253803253173828, 29.133163452148438, 32.01252365112305, 34.891883850097656, 37.771244049072266, 40.650604248046875, 43.52996826171875, 46.409324645996094, 49.2886848449707, 52.16804504394531, 55.04740524291992, 57.92676544189453, 60.80612564086914, 63.68548583984375, 66.56484985351562, 69.4442138671875, 72.32357788085938, 75.20293426513672, 78.0822982788086, 80.96165466308594, 83.84101867675781, 86.72037506103516, 89.59973907470703, 92.47909545898438, 95.35845947265625, 98.2378158569336, 101.11717987060547, 103.99653625488281, 106.87590026855469, 109.75525665283203, 112.6346206665039, 115.51397705078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 4.0, 7.0, 7.0, 4.0, 9.0, 6.0, 15.0, 10.0, 13.0, 19.0, 24.0, 20.0, 30.0, 25.0, 30.0, 28.0, 52.0, 44.0, 28.0, 51.0, 36.0, 41.0, 46.0, 44.0, 35.0, 37.0, 46.0, 36.0, 29.0, 33.0, 17.0, 28.0, 20.0, 21.0, 19.0, 11.0, 7.0, 7.0, 9.0, 5.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.872273445129395, -15.355517387390137, -14.838761329650879, -14.322005271911621, -13.805248260498047, -13.288492202758789, -12.771736145019531, -12.254980087280273, -11.738224029541016, -11.221467971801758, -10.7047119140625, -10.187955856323242, -9.671199798583984, -9.154443740844727, -8.637686729431152, -8.120930671691895, -7.604174613952637, -7.087418556213379, -6.570662498474121, -6.053905963897705, -5.537149906158447, -5.0203938484191895, -4.503637313842773, -3.9868812561035156, -3.470125198364258, -2.953369140625, -2.436612844467163, -1.9198566675186157, -1.4031004905700684, -0.8863444328308105, -0.36958813667297363, 0.14716815948486328, 0.6639251708984375, 1.1806813478469849, 1.6974375247955322, 2.214193820953369, 2.730949878692627, 3.2477059364318848, 3.7644622325897217, 4.281218528747559, 4.797974586486816, 5.314730644226074, 5.831486701965332, 6.348243236541748, 6.864999294281006, 7.381755352020264, 7.89851188659668, 8.415267944335938, 8.932024002075195, 9.448780059814453, 9.965536117553711, 10.482292175292969, 10.999048233032227, 11.515804290771484, 12.032561302185059, 12.549317359924316, 13.066073417663574, 13.582829475402832, 14.09958553314209, 14.616341590881348, 15.133098602294922, 15.64985466003418, 16.166610717773438, 16.683366775512695, 17.200122833251953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 7.0, 9.0, 17.0, 29.0, 28.0, 44.0, 75.0, 90.0, 134.0, 217.0, 344.0, 540.0, 895.0, 1813.0, 3478.0, 7481.0, 17962.0, 48083.0, 196729.0, 561021.0, 141883.0, 39349.0, 15144.0, 6389.0, 3085.0, 1553.0, 773.0, 466.0, 274.0, 203.0, 145.0, 79.0, 67.0, 35.0, 24.0, 26.0, 16.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.386962890625, -4.24267578125, -4.098388671875, -3.9541015625, -3.809814453125, -3.66552734375, -3.521240234375, -3.376953125, -3.232666015625, -3.08837890625, -2.944091796875, -2.7998046875, -2.655517578125, -2.51123046875, -2.366943359375, -2.22265625, -2.078369140625, -1.93408203125, -1.789794921875, -1.6455078125, -1.501220703125, -1.35693359375, -1.212646484375, -1.068359375, -0.924072265625, -0.77978515625, -0.635498046875, -0.4912109375, -0.346923828125, -0.20263671875, -0.058349609375, 0.0859375, 0.230224609375, 0.37451171875, 0.518798828125, 0.6630859375, 0.807373046875, 0.95166015625, 1.095947265625, 1.240234375, 1.384521484375, 1.52880859375, 1.673095703125, 1.8173828125, 1.961669921875, 2.10595703125, 2.250244140625, 2.39453125, 2.538818359375, 2.68310546875, 2.827392578125, 2.9716796875, 3.115966796875, 3.26025390625, 3.404541015625, 3.548828125, 3.693115234375, 3.83740234375, 3.981689453125, 4.1259765625, 4.270263671875, 4.41455078125, 4.558837890625, 4.703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 10.0, 8.0, 19.0, 22.0, 15.0, 17.0, 25.0, 32.0, 32.0, 41.0, 39.0, 47.0, 47.0, 37.0, 50.0, 55.0, 41.0, 47.0, 45.0, 44.0, 33.0, 31.0, 48.0, 27.0, 27.0, 27.0, 25.0, 13.0, 17.0, 17.0, 11.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -2.0131378173828125, -1.959869384765625, -1.9066009521484375, -1.85333251953125, -1.8000640869140625, -1.746795654296875, -1.6935272216796875, -1.6402587890625, -1.5869903564453125, -1.533721923828125, -1.4804534912109375, -1.42718505859375, -1.3739166259765625, -1.320648193359375, -1.2673797607421875, -1.214111328125, -1.1608428955078125, -1.107574462890625, -1.0543060302734375, -1.00103759765625, -0.9477691650390625, -0.894500732421875, -0.8412322998046875, -0.7879638671875, -0.7346954345703125, -0.681427001953125, -0.6281585693359375, -0.57489013671875, -0.5216217041015625, -0.468353271484375, -0.4150848388671875, -0.36181640625, -0.3085479736328125, -0.255279541015625, -0.2020111083984375, -0.14874267578125, -0.0954742431640625, -0.042205810546875, 0.0110626220703125, 0.0643310546875, 0.1175994873046875, 0.170867919921875, 0.2241363525390625, 0.27740478515625, 0.3306732177734375, 0.383941650390625, 0.4372100830078125, 0.490478515625, 0.5437469482421875, 0.597015380859375, 0.6502838134765625, 0.70355224609375, 0.7568206787109375, 0.810089111328125, 0.8633575439453125, 0.9166259765625, 0.9698944091796875, 1.023162841796875, 1.0764312744140625, 1.12969970703125, 1.1829681396484375, 1.236236572265625, 1.2895050048828125, 1.3427734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 10.0, 11.0, 9.0, 15.0, 22.0, 24.0, 33.0, 40.0, 58.0, 99.0, 138.0, 224.0, 344.0, 627.0, 1287.0, 3094.0, 9175.0, 36008.0, 313049.0, 614501.0, 50560.0, 12074.0, 3764.0, 1527.0, 682.0, 421.0, 251.0, 158.0, 103.0, 80.0, 44.0, 36.0, 18.0, 7.0, 15.0, 14.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-7.73046875, -7.527587890625, -7.32470703125, -7.121826171875, -6.9189453125, -6.716064453125, -6.51318359375, -6.310302734375, -6.107421875, -5.904541015625, -5.70166015625, -5.498779296875, -5.2958984375, -5.093017578125, -4.89013671875, -4.687255859375, -4.484375, -4.281494140625, -4.07861328125, -3.875732421875, -3.6728515625, -3.469970703125, -3.26708984375, -3.064208984375, -2.861328125, -2.658447265625, -2.45556640625, -2.252685546875, -2.0498046875, -1.846923828125, -1.64404296875, -1.441162109375, -1.23828125, -1.035400390625, -0.83251953125, -0.629638671875, -0.4267578125, -0.223876953125, -0.02099609375, 0.181884765625, 0.384765625, 0.587646484375, 0.79052734375, 0.993408203125, 1.1962890625, 1.399169921875, 1.60205078125, 1.804931640625, 2.0078125, 2.210693359375, 2.41357421875, 2.616455078125, 2.8193359375, 3.022216796875, 3.22509765625, 3.427978515625, 3.630859375, 3.833740234375, 4.03662109375, 4.239501953125, 4.4423828125, 4.645263671875, 4.84814453125, 5.051025390625, 5.25390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 6.0, 15.0, 10.0, 21.0, 17.0, 28.0, 29.0, 33.0, 44.0, 60.0, 53.0, 59.0, 55.0, 61.0, 69.0, 51.0, 51.0, 51.0, 52.0, 45.0, 29.0, 34.0, 25.0, 22.0, 18.0, 15.0, 7.0, 4.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.0108642578125, -7.756103515625, -7.5013427734375, -7.24658203125, -6.9918212890625, -6.737060546875, -6.4822998046875, -6.2275390625, -5.9727783203125, -5.718017578125, -5.4632568359375, -5.20849609375, -4.9537353515625, -4.698974609375, -4.4442138671875, -4.189453125, -3.9346923828125, -3.679931640625, -3.4251708984375, -3.17041015625, -2.9156494140625, -2.660888671875, -2.4061279296875, -2.1513671875, -1.8966064453125, -1.641845703125, -1.3870849609375, -1.13232421875, -0.8775634765625, -0.622802734375, -0.3680419921875, -0.11328125, 0.1414794921875, 0.396240234375, 0.6510009765625, 0.90576171875, 1.1605224609375, 1.415283203125, 1.6700439453125, 1.9248046875, 2.1795654296875, 2.434326171875, 2.6890869140625, 2.94384765625, 3.1986083984375, 3.453369140625, 3.7081298828125, 3.962890625, 4.2176513671875, 4.472412109375, 4.7271728515625, 4.98193359375, 5.2366943359375, 5.491455078125, 5.7462158203125, 6.0009765625, 6.2557373046875, 6.510498046875, 6.7652587890625, 7.02001953125, 7.2747802734375, 7.529541015625, 7.7843017578125, 8.0390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 17.0, 21.0, 43.0, 85.0, 160.0, 381.0, 1127.0, 3974.0, 22097.0, 589497.0, 405792.0, 19839.0, 3717.0, 1054.0, 388.0, 154.0, 72.0, 42.0, 28.0, 19.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.390625, -6.2177734375, -6.044921875, -5.8720703125, -5.69921875, -5.5263671875, -5.353515625, -5.1806640625, -5.0078125, -4.8349609375, -4.662109375, -4.4892578125, -4.31640625, -4.1435546875, -3.970703125, -3.7978515625, -3.625, -3.4521484375, -3.279296875, -3.1064453125, -2.93359375, -2.7607421875, -2.587890625, -2.4150390625, -2.2421875, -2.0693359375, -1.896484375, -1.7236328125, -1.55078125, -1.3779296875, -1.205078125, -1.0322265625, -0.859375, -0.6865234375, -0.513671875, -0.3408203125, -0.16796875, 0.0048828125, 0.177734375, 0.3505859375, 0.5234375, 0.6962890625, 0.869140625, 1.0419921875, 1.21484375, 1.3876953125, 1.560546875, 1.7333984375, 1.90625, 2.0791015625, 2.251953125, 2.4248046875, 2.59765625, 2.7705078125, 2.943359375, 3.1162109375, 3.2890625, 3.4619140625, 3.634765625, 3.8076171875, 3.98046875, 4.1533203125, 4.326171875, 4.4990234375, 4.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 3.0, 10.0, 14.0, 4.0, 15.0, 13.0, 25.0, 40.0, 59.0, 97.0, 143.0, 184.0, 111.0, 69.0, 49.0, 43.0, 31.0, 14.0, 12.0, 14.0, 3.0, 5.0, 5.0, 11.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00080108642578125, -0.0007783696055412292, -0.0007556527853012085, -0.0007329359650611877, -0.000710219144821167, -0.0006875023245811462, -0.0006647855043411255, -0.0006420686841011047, -0.000619351863861084, -0.0005966350436210632, -0.0005739182233810425, -0.0005512014031410217, -0.000528484582901001, -0.0005057677626609802, -0.00048305094242095947, -0.0004603341221809387, -0.00043761730194091797, -0.0004149004817008972, -0.00039218366146087646, -0.0003694668412208557, -0.00034675002098083496, -0.0003240332007408142, -0.00030131638050079346, -0.0002785995602607727, -0.00025588274002075195, -0.0002331659197807312, -0.00021044909954071045, -0.0001877322793006897, -0.00016501545906066895, -0.0001422986388206482, -0.00011958181858062744, -9.686499834060669e-05, -7.414817810058594e-05, -5.1431357860565186e-05, -2.8714537620544434e-05, -5.997717380523682e-06, 1.671910285949707e-05, 3.943592309951782e-05, 6.215274333953857e-05, 8.486956357955933e-05, 0.00010758638381958008, 0.00013030320405960083, 0.00015302002429962158, 0.00017573684453964233, 0.00019845366477966309, 0.00022117048501968384, 0.0002438873052597046, 0.00026660412549972534, 0.0002893209457397461, 0.00031203776597976685, 0.0003347545862197876, 0.00035747140645980835, 0.0003801882266998291, 0.00040290504693984985, 0.0004256218671798706, 0.00044833868741989136, 0.0004710555076599121, 0.0004937723278999329, 0.0005164891481399536, 0.0005392059683799744, 0.0005619227886199951, 0.0005846396088600159, 0.0006073564291000366, 0.0006300732493400574, 0.0006527900695800781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 12.0, 9.0, 15.0, 34.0, 65.0, 112.0, 148.0, 268.0, 495.0, 948.0, 2083.0, 5288.0, 20155.0, 171669.0, 766134.0, 63127.0, 11299.0, 3522.0, 1484.0, 696.0, 400.0, 223.0, 138.0, 85.0, 44.0, 37.0, 19.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.46875, -3.34619140625, -3.2236328125, -3.10107421875, -2.978515625, -2.85595703125, -2.7333984375, -2.61083984375, -2.48828125, -2.36572265625, -2.2431640625, -2.12060546875, -1.998046875, -1.87548828125, -1.7529296875, -1.63037109375, -1.5078125, -1.38525390625, -1.2626953125, -1.14013671875, -1.017578125, -0.89501953125, -0.7724609375, -0.64990234375, -0.52734375, -0.40478515625, -0.2822265625, -0.15966796875, -0.037109375, 0.08544921875, 0.2080078125, 0.33056640625, 0.453125, 0.57568359375, 0.6982421875, 0.82080078125, 0.943359375, 1.06591796875, 1.1884765625, 1.31103515625, 1.43359375, 1.55615234375, 1.6787109375, 1.80126953125, 1.923828125, 2.04638671875, 2.1689453125, 2.29150390625, 2.4140625, 2.53662109375, 2.6591796875, 2.78173828125, 2.904296875, 3.02685546875, 3.1494140625, 3.27197265625, 3.39453125, 3.51708984375, 3.6396484375, 3.76220703125, 3.884765625, 4.00732421875, 4.1298828125, 4.25244140625, 4.375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 2.0, 13.0, 18.0, 15.0, 19.0, 27.0, 54.0, 75.0, 116.0, 127.0, 130.0, 105.0, 74.0, 55.0, 45.0, 23.0, 17.0, 9.0, 15.0, 10.0, 2.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.506744384765625, -2.41387939453125, -2.321014404296875, -2.2281494140625, -2.135284423828125, -2.04241943359375, -1.949554443359375, -1.856689453125, -1.763824462890625, -1.67095947265625, -1.578094482421875, -1.4852294921875, -1.392364501953125, -1.29949951171875, -1.206634521484375, -1.11376953125, -1.020904541015625, -0.92803955078125, -0.835174560546875, -0.7423095703125, -0.649444580078125, -0.55657958984375, -0.463714599609375, -0.370849609375, -0.277984619140625, -0.18511962890625, -0.092254638671875, 0.0006103515625, 0.093475341796875, 0.18634033203125, 0.279205322265625, 0.3720703125, 0.464935302734375, 0.55780029296875, 0.650665283203125, 0.7435302734375, 0.836395263671875, 0.92926025390625, 1.022125244140625, 1.114990234375, 1.207855224609375, 1.30072021484375, 1.393585205078125, 1.4864501953125, 1.579315185546875, 1.67218017578125, 1.765045166015625, 1.85791015625, 1.950775146484375, 2.04364013671875, 2.136505126953125, 2.2293701171875, 2.322235107421875, 2.41510009765625, 2.507965087890625, 2.600830078125, 2.693695068359375, 2.78656005859375, 2.879425048828125, 2.9722900390625, 3.065155029296875, 3.15802001953125, 3.250885009765625, 3.34375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 38.0, 87.0, 217.0, 337.0, 196.0, 53.0, 25.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.62693786621094, -117.05058288574219, -114.47422790527344, -111.89787292480469, -109.32151794433594, -106.74517059326172, -104.16881561279297, -101.59246063232422, -99.01610565185547, -96.43975067138672, -93.86339569091797, -91.28704071044922, -88.710693359375, -86.13433837890625, -83.5579833984375, -80.98162841796875, -78.4052734375, -75.82891845703125, -73.2525634765625, -70.67620849609375, -68.099853515625, -65.52350616455078, -62.94715118408203, -60.37079620361328, -57.79444122314453, -55.21808624267578, -52.64173126220703, -50.06538009643555, -47.4890251159668, -44.91267013549805, -42.33631896972656, -39.75996398925781, -37.183616638183594, -34.607261657714844, -32.030906677246094, -29.45455551147461, -26.87820053100586, -24.30184555053711, -21.725492477416992, -19.149139404296875, -16.572784423828125, -13.996430397033691, -11.420076370239258, -8.843722343444824, -6.267368316650391, -3.691014289855957, -1.1146602630615234, 1.4616928100585938, 4.038047790527344, 6.614401817321777, 9.190755844116211, 11.767109870910645, 14.343463897705078, 16.919818878173828, 19.496171951293945, 22.072525024414062, 24.648880004882812, 27.225234985351562, 29.80158805847168, 32.3779411315918, 34.95429611206055, 37.5306510925293, 40.10700225830078, 42.68335723876953, 45.25971221923828]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 9.0, 20.0, 21.0, 18.0, 24.0, 19.0, 20.0, 27.0, 28.0, 35.0, 38.0, 55.0, 44.0, 55.0, 68.0, 45.0, 52.0, 38.0, 42.0, 36.0, 36.0, 32.0, 27.0, 21.0, 27.0, 24.0, 18.0, 24.0, 16.0, 7.0, 15.0, 5.0, 9.0, 6.0, 6.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.12070083618164, -24.28488540649414, -23.449068069458008, -22.613252639770508, -21.777437210083008, -20.941619873046875, -20.105804443359375, -19.269989013671875, -18.434173583984375, -17.598358154296875, -16.762540817260742, -15.926725387573242, -15.090909957885742, -14.255093574523926, -13.41927719116211, -12.58346176147461, -11.747644424438477, -10.91182804107666, -10.07601261138916, -9.240196228027344, -8.404380798339844, -7.568564414978027, -6.732748031616211, -5.896932125091553, -5.0611162185668945, -4.225300312042236, -3.389484167098999, -2.5536680221557617, -1.7178521156311035, -0.8820362091064453, -0.046219825744628906, 0.7895960807800293, 1.6254119873046875, 2.4612278938293457, 3.297044038772583, 4.13286018371582, 4.9686760902404785, 5.804491996765137, 6.640308380126953, 7.476124286651611, 8.31194019317627, 9.147756576538086, 9.983572006225586, 10.819388389587402, 11.655204772949219, 12.491020202636719, 13.326836585998535, 14.162652969360352, 14.998468399047852, 15.834284782409668, 16.670101165771484, 17.505916595458984, 18.341732025146484, 19.177547454833984, 20.013364791870117, 20.849180221557617, 21.68499755859375, 22.52081298828125, 23.356630325317383, 24.192445755004883, 25.028261184692383, 25.864078521728516, 26.699893951416016, 27.535709381103516, 28.371524810791016]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 11.0, 12.0, 16.0, 17.0, 51.0, 83.0, 97.0, 175.0, 303.0, 536.0, 938.0, 1821.0, 3442.0, 7060.0, 16181.0, 39772.0, 121458.0, 586430.0, 2406296.0, 776869.0, 150948.0, 47334.0, 18301.0, 8101.0, 3846.0, 1836.0, 985.0, 560.0, 300.0, 191.0, 100.0, 71.0, 40.0, 27.0, 23.0, 15.0, 8.0, 12.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.90374755859375, -2.8172607421875, -2.73077392578125, -2.644287109375, -2.55780029296875, -2.4713134765625, -2.38482666015625, -2.29833984375, -2.21185302734375, -2.1253662109375, -2.03887939453125, -1.952392578125, -1.86590576171875, -1.7794189453125, -1.69293212890625, -1.6064453125, -1.51995849609375, -1.4334716796875, -1.34698486328125, -1.260498046875, -1.17401123046875, -1.0875244140625, -1.00103759765625, -0.91455078125, -0.82806396484375, -0.7415771484375, -0.65509033203125, -0.568603515625, -0.48211669921875, -0.3956298828125, -0.30914306640625, -0.22265625, -0.13616943359375, -0.0496826171875, 0.03680419921875, 0.123291015625, 0.20977783203125, 0.2962646484375, 0.38275146484375, 0.46923828125, 0.55572509765625, 0.6422119140625, 0.72869873046875, 0.815185546875, 0.90167236328125, 0.9881591796875, 1.07464599609375, 1.1611328125, 1.24761962890625, 1.3341064453125, 1.42059326171875, 1.507080078125, 1.59356689453125, 1.6800537109375, 1.76654052734375, 1.85302734375, 1.93951416015625, 2.0260009765625, 2.11248779296875, 2.198974609375, 2.28546142578125, 2.3719482421875, 2.45843505859375, 2.544921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 10.0, 7.0, 9.0, 18.0, 25.0, 20.0, 25.0, 27.0, 32.0, 25.0, 53.0, 39.0, 42.0, 36.0, 52.0, 52.0, 54.0, 48.0, 37.0, 45.0, 32.0, 35.0, 38.0, 36.0, 30.0, 37.0, 25.0, 19.0, 20.0, 10.0, 11.0, 16.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.8515625, -1.8030242919921875, -1.754486083984375, -1.7059478759765625, -1.65740966796875, -1.6088714599609375, -1.560333251953125, -1.5117950439453125, -1.4632568359375, -1.4147186279296875, -1.366180419921875, -1.3176422119140625, -1.26910400390625, -1.2205657958984375, -1.172027587890625, -1.1234893798828125, -1.074951171875, -1.0264129638671875, -0.977874755859375, -0.9293365478515625, -0.88079833984375, -0.8322601318359375, -0.783721923828125, -0.7351837158203125, -0.6866455078125, -0.6381072998046875, -0.589569091796875, -0.5410308837890625, -0.49249267578125, -0.4439544677734375, -0.395416259765625, -0.3468780517578125, -0.29833984375, -0.2498016357421875, -0.201263427734375, -0.1527252197265625, -0.10418701171875, -0.0556488037109375, -0.007110595703125, 0.0414276123046875, 0.0899658203125, 0.1385040283203125, 0.187042236328125, 0.2355804443359375, 0.28411865234375, 0.3326568603515625, 0.381195068359375, 0.4297332763671875, 0.478271484375, 0.5268096923828125, 0.575347900390625, 0.6238861083984375, 0.67242431640625, 0.7209625244140625, 0.769500732421875, 0.8180389404296875, 0.8665771484375, 0.9151153564453125, 0.963653564453125, 1.0121917724609375, 1.06072998046875, 1.1092681884765625, 1.157806396484375, 1.2063446044921875, 1.2548828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 12.0, 26.0, 30.0, 45.0, 83.0, 151.0, 248.0, 551.0, 973.0, 2423.0, 7166.0, 25878.0, 128970.0, 1794426.0, 2038948.0, 149610.0, 30764.0, 8512.0, 2908.0, 1212.0, 602.0, 294.0, 175.0, 95.0, 56.0, 31.0, 21.0, 20.0, 13.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.84100341796875, -4.6741943359375, -4.50738525390625, -4.340576171875, -4.17376708984375, -4.0069580078125, -3.84014892578125, -3.67333984375, -3.50653076171875, -3.3397216796875, -3.17291259765625, -3.006103515625, -2.83929443359375, -2.6724853515625, -2.50567626953125, -2.3388671875, -2.17205810546875, -2.0052490234375, -1.83843994140625, -1.671630859375, -1.50482177734375, -1.3380126953125, -1.17120361328125, -1.00439453125, -0.83758544921875, -0.6707763671875, -0.50396728515625, -0.337158203125, -0.17034912109375, -0.0035400390625, 0.16326904296875, 0.330078125, 0.49688720703125, 0.6636962890625, 0.83050537109375, 0.997314453125, 1.16412353515625, 1.3309326171875, 1.49774169921875, 1.66455078125, 1.83135986328125, 1.9981689453125, 2.16497802734375, 2.331787109375, 2.49859619140625, 2.6654052734375, 2.83221435546875, 2.9990234375, 3.16583251953125, 3.3326416015625, 3.49945068359375, 3.666259765625, 3.83306884765625, 3.9998779296875, 4.16668701171875, 4.33349609375, 4.50030517578125, 4.6671142578125, 4.83392333984375, 5.000732421875, 5.16754150390625, 5.3343505859375, 5.50115966796875, 5.66796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 15.0, 11.0, 21.0, 34.0, 42.0, 64.0, 92.0, 123.0, 223.0, 362.0, 677.0, 800.0, 530.0, 331.0, 218.0, 133.0, 101.0, 65.0, 57.0, 41.0, 18.0, 26.0, 13.0, 15.0, 7.0, 8.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.34765625, -6.17340087890625, -5.9991455078125, -5.82489013671875, -5.650634765625, -5.47637939453125, -5.3021240234375, -5.12786865234375, -4.95361328125, -4.77935791015625, -4.6051025390625, -4.43084716796875, -4.256591796875, -4.08233642578125, -3.9080810546875, -3.73382568359375, -3.5595703125, -3.38531494140625, -3.2110595703125, -3.03680419921875, -2.862548828125, -2.68829345703125, -2.5140380859375, -2.33978271484375, -2.16552734375, -1.99127197265625, -1.8170166015625, -1.64276123046875, -1.468505859375, -1.29425048828125, -1.1199951171875, -0.94573974609375, -0.771484375, -0.59722900390625, -0.4229736328125, -0.24871826171875, -0.074462890625, 0.09979248046875, 0.2740478515625, 0.44830322265625, 0.62255859375, 0.79681396484375, 0.9710693359375, 1.14532470703125, 1.319580078125, 1.49383544921875, 1.6680908203125, 1.84234619140625, 2.0166015625, 2.19085693359375, 2.3651123046875, 2.53936767578125, 2.713623046875, 2.88787841796875, 3.0621337890625, 3.23638916015625, 3.41064453125, 3.58489990234375, 3.7591552734375, 3.93341064453125, 4.107666015625, 4.28192138671875, 4.4561767578125, 4.63043212890625, 4.8046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 21.0, 45.0, 68.0, 123.0, 211.0, 190.0, 118.0, 95.0, 39.0, 27.0, 13.0, 5.0, 10.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.571048736572266, -44.5204963684082, -42.469940185546875, -40.41938781738281, -38.36883544921875, -36.31828308105469, -34.267730712890625, -32.2171745300293, -30.166622161865234, -28.116069793701172, -26.065515518188477, -24.01496124267578, -21.96440887451172, -19.913856506347656, -17.86330223083496, -15.812748908996582, -13.762195587158203, -11.711642265319824, -9.661088943481445, -7.610535621643066, -5.5599822998046875, -3.5094289779663086, -1.4588756561279297, 0.5916776657104492, 2.642230987548828, 4.692784309387207, 6.743337631225586, 8.793890953063965, 10.844444274902344, 12.894997596740723, 14.945550918579102, 16.996105194091797, 19.046661376953125, 21.097213745117188, 23.147768020629883, 25.198322296142578, 27.24887466430664, 29.299427032470703, 31.3499813079834, 33.400535583496094, 35.451087951660156, 37.50164031982422, 39.55219268798828, 41.60274887084961, 43.65330123901367, 45.703853607177734, 47.75440979003906, 49.804962158203125, 51.85551452636719, 53.90606689453125, 55.95661926269531, 58.00717544555664, 60.0577278137207, 62.108280181884766, 64.1588363647461, 66.20938873291016, 68.25994110107422, 70.31049346923828, 72.36104583740234, 74.4115982055664, 76.462158203125, 78.51271057128906, 80.56326293945312, 82.61381530761719, 84.66436767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 8.0, 16.0, 17.0, 19.0, 17.0, 21.0, 25.0, 32.0, 33.0, 41.0, 32.0, 43.0, 36.0, 49.0, 49.0, 53.0, 43.0, 40.0, 43.0, 45.0, 44.0, 45.0, 29.0, 26.0, 31.0, 27.0, 19.0, 18.0, 16.0, 7.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.193378448486328, -29.28727149963379, -28.381162643432617, -27.475055694580078, -26.568946838378906, -25.662839889526367, -24.756732940673828, -23.850624084472656, -22.944517135620117, -22.038410186767578, -21.132301330566406, -20.226194381713867, -19.320087432861328, -18.413978576660156, -17.507871627807617, -16.601764678955078, -15.695655822753906, -14.78954792022705, -13.883440017700195, -12.977333068847656, -12.0712251663208, -11.165117263793945, -10.259010314941406, -9.35290241241455, -8.446794509887695, -7.54068660736084, -6.634579181671143, -5.728471755981445, -4.82236385345459, -3.9162559509277344, -3.010148525238037, -2.10404109954834, -1.1979351043701172, -0.2918274402618408, 0.6142802238464355, 1.520387887954712, 2.4264955520629883, 3.3326034545898438, 4.238710880279541, 5.144818305969238, 6.050926208496094, 6.957034111022949, 7.8631415367126465, 8.769248962402344, 9.6753568649292, 10.581464767456055, 11.487571716308594, 12.39367961883545, 13.299787521362305, 14.20589542388916, 15.112003326416016, 16.018110275268555, 16.924217224121094, 17.830326080322266, 18.736433029174805, 19.642539978027344, 20.548648834228516, 21.454755783081055, 22.360864639282227, 23.266971588134766, 24.173080444335938, 25.079187393188477, 25.985294342041016, 26.891403198242188, 27.797510147094727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 14.0, 19.0, 36.0, 46.0, 113.0, 191.0, 495.0, 1221.0, 2994.0, 9012.0, 31260.0, 130595.0, 602408.0, 206221.0, 44887.0, 12426.0, 4033.0, 1409.0, 599.0, 275.0, 131.0, 76.0, 32.0, 20.0, 19.0, 9.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.9344482421875, -6.728271484375, -6.5220947265625, -6.31591796875, -6.1097412109375, -5.903564453125, -5.6973876953125, -5.4912109375, -5.2850341796875, -5.078857421875, -4.8726806640625, -4.66650390625, -4.4603271484375, -4.254150390625, -4.0479736328125, -3.841796875, -3.6356201171875, -3.429443359375, -3.2232666015625, -3.01708984375, -2.8109130859375, -2.604736328125, -2.3985595703125, -2.1923828125, -1.9862060546875, -1.780029296875, -1.5738525390625, -1.36767578125, -1.1614990234375, -0.955322265625, -0.7491455078125, -0.54296875, -0.3367919921875, -0.130615234375, 0.0755615234375, 0.28173828125, 0.4879150390625, 0.694091796875, 0.9002685546875, 1.1064453125, 1.3126220703125, 1.518798828125, 1.7249755859375, 1.93115234375, 2.1373291015625, 2.343505859375, 2.5496826171875, 2.755859375, 2.9620361328125, 3.168212890625, 3.3743896484375, 3.58056640625, 3.7867431640625, 3.992919921875, 4.1990966796875, 4.4052734375, 4.6114501953125, 4.817626953125, 5.0238037109375, 5.22998046875, 5.4361572265625, 5.642333984375, 5.8485107421875, 6.0546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 11.0, 19.0, 28.0, 19.0, 35.0, 39.0, 42.0, 35.0, 45.0, 46.0, 61.0, 64.0, 64.0, 67.0, 57.0, 53.0, 48.0, 41.0, 39.0, 37.0, 29.0, 28.0, 24.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 0.0, 1.0, 3.0], "bins": [-2.98828125, -2.9210205078125, -2.853759765625, -2.7864990234375, -2.71923828125, -2.6519775390625, -2.584716796875, -2.5174560546875, -2.4501953125, -2.3829345703125, -2.315673828125, -2.2484130859375, -2.18115234375, -2.1138916015625, -2.046630859375, -1.9793701171875, -1.912109375, -1.8448486328125, -1.777587890625, -1.7103271484375, -1.64306640625, -1.5758056640625, -1.508544921875, -1.4412841796875, -1.3740234375, -1.3067626953125, -1.239501953125, -1.1722412109375, -1.10498046875, -1.0377197265625, -0.970458984375, -0.9031982421875, -0.8359375, -0.7686767578125, -0.701416015625, -0.6341552734375, -0.56689453125, -0.4996337890625, -0.432373046875, -0.3651123046875, -0.2978515625, -0.2305908203125, -0.163330078125, -0.0960693359375, -0.02880859375, 0.0384521484375, 0.105712890625, 0.1729736328125, 0.240234375, 0.3074951171875, 0.374755859375, 0.4420166015625, 0.50927734375, 0.5765380859375, 0.643798828125, 0.7110595703125, 0.7783203125, 0.8455810546875, 0.912841796875, 0.9801025390625, 1.04736328125, 1.1146240234375, 1.181884765625, 1.2491455078125, 1.31640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 20.0, 20.0, 33.0, 61.0, 80.0, 136.0, 229.0, 348.0, 599.0, 1126.0, 2498.0, 6922.0, 33266.0, 647087.0, 319965.0, 25523.0, 5806.0, 2264.0, 1029.0, 576.0, 326.0, 224.0, 123.0, 70.0, 65.0, 37.0, 24.0, 10.0, 12.0, 9.0, 4.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0546875, -10.718994140625, -10.38330078125, -10.047607421875, -9.7119140625, -9.376220703125, -9.04052734375, -8.704833984375, -8.369140625, -8.033447265625, -7.69775390625, -7.362060546875, -7.0263671875, -6.690673828125, -6.35498046875, -6.019287109375, -5.68359375, -5.347900390625, -5.01220703125, -4.676513671875, -4.3408203125, -4.005126953125, -3.66943359375, -3.333740234375, -2.998046875, -2.662353515625, -2.32666015625, -1.990966796875, -1.6552734375, -1.319580078125, -0.98388671875, -0.648193359375, -0.3125, 0.023193359375, 0.35888671875, 0.694580078125, 1.0302734375, 1.365966796875, 1.70166015625, 2.037353515625, 2.373046875, 2.708740234375, 3.04443359375, 3.380126953125, 3.7158203125, 4.051513671875, 4.38720703125, 4.722900390625, 5.05859375, 5.394287109375, 5.72998046875, 6.065673828125, 6.4013671875, 6.737060546875, 7.07275390625, 7.408447265625, 7.744140625, 8.079833984375, 8.41552734375, 8.751220703125, 9.0869140625, 9.422607421875, 9.75830078125, 10.093994140625, 10.4296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 15.0, 24.0, 21.0, 21.0, 26.0, 30.0, 38.0, 40.0, 30.0, 35.0, 62.0, 42.0, 51.0, 51.0, 48.0, 57.0, 36.0, 36.0, 36.0, 38.0, 38.0, 41.0, 27.0, 15.0, 20.0, 12.0, 16.0, 8.0, 11.0, 6.0, 6.0, 8.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.078125, -7.8057861328125, -7.533447265625, -7.2611083984375, -6.98876953125, -6.7164306640625, -6.444091796875, -6.1717529296875, -5.8994140625, -5.6270751953125, -5.354736328125, -5.0823974609375, -4.81005859375, -4.5377197265625, -4.265380859375, -3.9930419921875, -3.720703125, -3.4483642578125, -3.176025390625, -2.9036865234375, -2.63134765625, -2.3590087890625, -2.086669921875, -1.8143310546875, -1.5419921875, -1.2696533203125, -0.997314453125, -0.7249755859375, -0.45263671875, -0.1802978515625, 0.092041015625, 0.3643798828125, 0.63671875, 0.9090576171875, 1.181396484375, 1.4537353515625, 1.72607421875, 1.9984130859375, 2.270751953125, 2.5430908203125, 2.8154296875, 3.0877685546875, 3.360107421875, 3.6324462890625, 3.90478515625, 4.1771240234375, 4.449462890625, 4.7218017578125, 4.994140625, 5.2664794921875, 5.538818359375, 5.8111572265625, 6.08349609375, 6.3558349609375, 6.628173828125, 6.9005126953125, 7.1728515625, 7.4451904296875, 7.717529296875, 7.9898681640625, 8.26220703125, 8.5345458984375, 8.806884765625, 9.0792236328125, 9.3515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 12.0, 14.0, 11.0, 25.0, 40.0, 51.0, 81.0, 112.0, 176.0, 293.0, 472.0, 808.0, 1557.0, 2923.0, 6744.0, 17495.0, 53191.0, 243205.0, 599157.0, 80909.0, 24213.0, 8792.0, 3836.0, 1877.0, 989.0, 567.0, 324.0, 220.0, 136.0, 95.0, 69.0, 40.0, 26.0, 22.0, 14.0, 5.0, 6.0, 10.0, 9.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.693878173828125, -2.60455322265625, -2.515228271484375, -2.4259033203125, -2.336578369140625, -2.24725341796875, -2.157928466796875, -2.068603515625, -1.979278564453125, -1.88995361328125, -1.800628662109375, -1.7113037109375, -1.621978759765625, -1.53265380859375, -1.443328857421875, -1.35400390625, -1.264678955078125, -1.17535400390625, -1.086029052734375, -0.9967041015625, -0.907379150390625, -0.81805419921875, -0.728729248046875, -0.639404296875, -0.550079345703125, -0.46075439453125, -0.371429443359375, -0.2821044921875, -0.192779541015625, -0.10345458984375, -0.014129638671875, 0.0751953125, 0.164520263671875, 0.25384521484375, 0.343170166015625, 0.4324951171875, 0.521820068359375, 0.61114501953125, 0.700469970703125, 0.789794921875, 0.879119873046875, 0.96844482421875, 1.057769775390625, 1.1470947265625, 1.236419677734375, 1.32574462890625, 1.415069580078125, 1.50439453125, 1.593719482421875, 1.68304443359375, 1.772369384765625, 1.8616943359375, 1.951019287109375, 2.04034423828125, 2.129669189453125, 2.218994140625, 2.308319091796875, 2.39764404296875, 2.486968994140625, 2.5762939453125, 2.665618896484375, 2.75494384765625, 2.844268798828125, 2.93359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 9.0, 7.0, 16.0, 17.0, 15.0, 26.0, 29.0, 44.0, 58.0, 84.0, 212.0, 145.0, 80.0, 57.0, 35.0, 33.0, 27.0, 19.0, 16.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00118255615234375, -0.001147627830505371, -0.0011126995086669922, -0.0010777711868286133, -0.0010428428649902344, -0.0010079145431518555, -0.0009729862213134766, -0.0009380578994750977, -0.0009031295776367188, -0.0008682012557983398, -0.0008332729339599609, -0.000798344612121582, -0.0007634162902832031, -0.0007284879684448242, -0.0006935596466064453, -0.0006586313247680664, -0.0006237030029296875, -0.0005887746810913086, -0.0005538463592529297, -0.0005189180374145508, -0.0004839897155761719, -0.00044906139373779297, -0.00041413307189941406, -0.00037920475006103516, -0.00034427642822265625, -0.00030934810638427734, -0.00027441978454589844, -0.00023949146270751953, -0.00020456314086914062, -0.00016963481903076172, -0.0001347064971923828, -9.97781753540039e-05, -6.4849853515625e-05, -2.9921531677246094e-05, 5.0067901611328125e-06, 3.993511199951172e-05, 7.486343383789062e-05, 0.00010979175567626953, 0.00014472007751464844, 0.00017964839935302734, 0.00021457672119140625, 0.00024950504302978516, 0.00028443336486816406, 0.00031936168670654297, 0.0003542900085449219, 0.0003892183303833008, 0.0004241466522216797, 0.0004590749740600586, 0.0004940032958984375, 0.0005289316177368164, 0.0005638599395751953, 0.0005987882614135742, 0.0006337165832519531, 0.000668644905090332, 0.0007035732269287109, 0.0007385015487670898, 0.0007734298706054688, 0.0008083581924438477, 0.0008432865142822266, 0.0008782148361206055, 0.0009131431579589844, 0.0009480714797973633, 0.0009829998016357422, 0.001017928123474121, 0.0010528564453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 17.0, 23.0, 39.0, 47.0, 63.0, 125.0, 178.0, 321.0, 570.0, 1039.0, 2117.0, 5057.0, 15002.0, 62453.0, 599093.0, 297054.0, 45394.0, 11795.0, 4085.0, 1864.0, 931.0, 488.0, 279.0, 156.0, 113.0, 78.0, 43.0, 29.0, 17.0, 9.0, 17.0, 12.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.928253173828125, -2.82330322265625, -2.718353271484375, -2.6134033203125, -2.508453369140625, -2.40350341796875, -2.298553466796875, -2.193603515625, -2.088653564453125, -1.98370361328125, -1.878753662109375, -1.7738037109375, -1.668853759765625, -1.56390380859375, -1.458953857421875, -1.35400390625, -1.249053955078125, -1.14410400390625, -1.039154052734375, -0.9342041015625, -0.829254150390625, -0.72430419921875, -0.619354248046875, -0.514404296875, -0.409454345703125, -0.30450439453125, -0.199554443359375, -0.0946044921875, 0.010345458984375, 0.11529541015625, 0.220245361328125, 0.3251953125, 0.430145263671875, 0.53509521484375, 0.640045166015625, 0.7449951171875, 0.849945068359375, 0.95489501953125, 1.059844970703125, 1.164794921875, 1.269744873046875, 1.37469482421875, 1.479644775390625, 1.5845947265625, 1.689544677734375, 1.79449462890625, 1.899444580078125, 2.00439453125, 2.109344482421875, 2.21429443359375, 2.319244384765625, 2.4241943359375, 2.529144287109375, 2.63409423828125, 2.739044189453125, 2.843994140625, 2.948944091796875, 3.05389404296875, 3.158843994140625, 3.2637939453125, 3.368743896484375, 3.47369384765625, 3.578643798828125, 3.68359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 4.0, 4.0, 14.0, 8.0, 12.0, 18.0, 16.0, 18.0, 36.0, 28.0, 20.0, 38.0, 34.0, 58.0, 53.0, 75.0, 68.0, 79.0, 62.0, 50.0, 40.0, 29.0, 24.0, 26.0, 19.0, 19.0, 15.0, 12.0, 16.0, 14.0, 13.0, 11.0, 3.0, 7.0, 6.0, 5.0, 7.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.248046875, -2.178863525390625, -2.10968017578125, -2.040496826171875, -1.9713134765625, -1.902130126953125, -1.83294677734375, -1.763763427734375, -1.694580078125, -1.625396728515625, -1.55621337890625, -1.487030029296875, -1.4178466796875, -1.348663330078125, -1.27947998046875, -1.210296630859375, -1.14111328125, -1.071929931640625, -1.00274658203125, -0.933563232421875, -0.8643798828125, -0.795196533203125, -0.72601318359375, -0.656829833984375, -0.587646484375, -0.518463134765625, -0.44927978515625, -0.380096435546875, -0.3109130859375, -0.241729736328125, -0.17254638671875, -0.103363037109375, -0.0341796875, 0.035003662109375, 0.10418701171875, 0.173370361328125, 0.2425537109375, 0.311737060546875, 0.38092041015625, 0.450103759765625, 0.519287109375, 0.588470458984375, 0.65765380859375, 0.726837158203125, 0.7960205078125, 0.865203857421875, 0.93438720703125, 1.003570556640625, 1.07275390625, 1.141937255859375, 1.21112060546875, 1.280303955078125, 1.3494873046875, 1.418670654296875, 1.48785400390625, 1.557037353515625, 1.626220703125, 1.695404052734375, 1.76458740234375, 1.833770751953125, 1.9029541015625, 1.972137451171875, 2.04132080078125, 2.110504150390625, 2.1796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 9.0, 15.0, 49.0, 114.0, 217.0, 304.0, 157.0, 75.0, 17.0, 15.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-75.54513549804688, -72.65704345703125, -69.7689437866211, -66.88085174560547, -63.99275207519531, -61.10465621948242, -58.21656036376953, -55.328468322753906, -52.44036865234375, -49.55227279663086, -46.66417694091797, -43.77608108520508, -40.88798522949219, -37.9998893737793, -35.111793518066406, -32.22370147705078, -29.33560562133789, -26.447509765625, -23.55941390991211, -20.67131805419922, -17.783222198486328, -14.895127296447754, -12.00703239440918, -9.118936538696289, -6.230840682983398, -3.342745065689087, -0.4546494483947754, 2.433445930480957, 5.321541786193848, 8.209637641906738, 11.097732543945312, 13.985828399658203, 16.873924255371094, 19.762020111083984, 22.650115966796875, 25.538211822509766, 28.426307678222656, 31.314403533935547, 34.20249938964844, 37.09059143066406, 39.97869110107422, 42.86678695678711, 45.7548828125, 48.64297866821289, 51.53107452392578, 54.41917037963867, 57.30726623535156, 60.19535827636719, 63.08345413208008, 65.97154998779297, 68.8596420288086, 71.74774169921875, 74.63583374023438, 77.52393341064453, 80.41202545166016, 83.30012512207031, 86.18821716308594, 89.07630920410156, 91.96440887451172, 94.85250091552734, 97.7406005859375, 100.62869262695312, 103.51679229736328, 106.4048843383789, 109.29298400878906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 8.0, 9.0, 9.0, 11.0, 6.0, 15.0, 17.0, 18.0, 27.0, 29.0, 27.0, 34.0, 24.0, 29.0, 33.0, 48.0, 46.0, 48.0, 65.0, 42.0, 46.0, 38.0, 36.0, 45.0, 12.0, 29.0, 23.0, 32.0, 17.0, 22.0, 15.0, 15.0, 16.0, 21.0, 8.0, 9.0, 12.0, 5.0, 6.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.49323081970215, -22.629426956176758, -21.765621185302734, -20.901817321777344, -20.038013458251953, -19.17420768737793, -18.31040382385254, -17.446598052978516, -16.582794189453125, -15.718989372253418, -14.855184555053711, -13.99138069152832, -13.127575874328613, -12.263771057128906, -11.399967193603516, -10.536162376403809, -9.672357559204102, -8.808552742004395, -7.944748401641846, -7.080944061279297, -6.21713924407959, -5.353334426879883, -4.489530086517334, -3.625725746154785, -2.761920928955078, -1.8981163501739502, -1.0343117713928223, -0.17050719261169434, 0.6932973861694336, 1.5571022033691406, 2.4209065437316895, 3.2847108840942383, 4.148517608642578, 5.012322425842285, 5.876126766204834, 6.739931106567383, 7.60373592376709, 8.467540740966797, 9.331344604492188, 10.195149421691895, 11.058954238891602, 11.922759056091309, 12.786563873291016, 13.650367736816406, 14.514172554016113, 15.37797737121582, 16.24178123474121, 17.105587005615234, 17.969390869140625, 18.833194732666016, 19.69700050354004, 20.56080436706543, 21.424610137939453, 22.288414001464844, 23.152217864990234, 24.016021728515625, 24.87982749938965, 25.74363136291504, 26.607437133789062, 27.471240997314453, 28.335044860839844, 29.198850631713867, 30.062654495239258, 30.92646026611328, 31.790264129638672]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 9.0, 19.0, 25.0, 33.0, 40.0, 55.0, 78.0, 105.0, 184.0, 301.0, 450.0, 740.0, 1422.0, 2520.0, 5222.0, 11600.0, 29860.0, 99581.0, 577906.0, 2602619.0, 688151.0, 115385.0, 33306.0, 12867.0, 5518.0, 2714.0, 1467.0, 764.0, 447.0, 271.0, 200.0, 127.0, 81.0, 52.0, 36.0, 23.0, 20.0, 14.0, 13.0, 10.0, 1.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.86328125, -2.76953125, -2.67578125, -2.58203125, -2.48828125, -2.39453125, -2.30078125, -2.20703125, -2.11328125, -2.01953125, -1.92578125, -1.83203125, -1.73828125, -1.64453125, -1.55078125, -1.45703125, -1.36328125, -1.26953125, -1.17578125, -1.08203125, -0.98828125, -0.89453125, -0.80078125, -0.70703125, -0.61328125, -0.51953125, -0.42578125, -0.33203125, -0.23828125, -0.14453125, -0.05078125, 0.04296875, 0.13671875, 0.23046875, 0.32421875, 0.41796875, 0.51171875, 0.60546875, 0.69921875, 0.79296875, 0.88671875, 0.98046875, 1.07421875, 1.16796875, 1.26171875, 1.35546875, 1.44921875, 1.54296875, 1.63671875, 1.73046875, 1.82421875, 1.91796875, 2.01171875, 2.10546875, 2.19921875, 2.29296875, 2.38671875, 2.48046875, 2.57421875, 2.66796875, 2.76171875, 2.85546875, 2.94921875, 3.04296875, 3.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 2.0, 7.0, 10.0, 9.0, 8.0, 15.0, 17.0, 17.0, 32.0, 34.0, 35.0, 36.0, 41.0, 55.0, 50.0, 65.0, 59.0, 59.0, 71.0, 46.0, 41.0, 53.0, 38.0, 46.0, 33.0, 28.0, 28.0, 18.0, 18.0, 12.0, 7.0, 8.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.865234375, -2.7971343994140625, -2.729034423828125, -2.6609344482421875, -2.59283447265625, -2.5247344970703125, -2.456634521484375, -2.3885345458984375, -2.3204345703125, -2.2523345947265625, -2.184234619140625, -2.1161346435546875, -2.04803466796875, -1.9799346923828125, -1.911834716796875, -1.8437347412109375, -1.775634765625, -1.7075347900390625, -1.639434814453125, -1.5713348388671875, -1.50323486328125, -1.4351348876953125, -1.367034912109375, -1.2989349365234375, -1.2308349609375, -1.1627349853515625, -1.094635009765625, -1.0265350341796875, -0.95843505859375, -0.8903350830078125, -0.822235107421875, -0.7541351318359375, -0.68603515625, -0.6179351806640625, -0.549835205078125, -0.4817352294921875, -0.41363525390625, -0.3455352783203125, -0.277435302734375, -0.2093353271484375, -0.1412353515625, -0.0731353759765625, -0.005035400390625, 0.0630645751953125, 0.13116455078125, 0.1992645263671875, 0.267364501953125, 0.3354644775390625, 0.403564453125, 0.4716644287109375, 0.539764404296875, 0.6078643798828125, 0.67596435546875, 0.7440643310546875, 0.812164306640625, 0.8802642822265625, 0.9483642578125, 1.0164642333984375, 1.084564208984375, 1.1526641845703125, 1.22076416015625, 1.2888641357421875, 1.356964111328125, 1.4250640869140625, 1.4931640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 11.0, 9.0, 27.0, 45.0, 65.0, 137.0, 330.0, 825.0, 2479.0, 9527.0, 55307.0, 773655.0, 3185266.0, 140944.0, 18764.0, 4325.0, 1382.0, 591.0, 258.0, 145.0, 72.0, 40.0, 28.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.72650146484375, -4.5037841796875, -4.28106689453125, -4.058349609375, -3.83563232421875, -3.6129150390625, -3.39019775390625, -3.16748046875, -2.94476318359375, -2.7220458984375, -2.49932861328125, -2.276611328125, -2.05389404296875, -1.8311767578125, -1.60845947265625, -1.3857421875, -1.16302490234375, -0.9403076171875, -0.71759033203125, -0.494873046875, -0.27215576171875, -0.0494384765625, 0.17327880859375, 0.39599609375, 0.61871337890625, 0.8414306640625, 1.06414794921875, 1.286865234375, 1.50958251953125, 1.7322998046875, 1.95501708984375, 2.177734375, 2.40045166015625, 2.6231689453125, 2.84588623046875, 3.068603515625, 3.29132080078125, 3.5140380859375, 3.73675537109375, 3.95947265625, 4.18218994140625, 4.4049072265625, 4.62762451171875, 4.850341796875, 5.07305908203125, 5.2957763671875, 5.51849365234375, 5.7412109375, 5.96392822265625, 6.1866455078125, 6.40936279296875, 6.632080078125, 6.85479736328125, 7.0775146484375, 7.30023193359375, 7.52294921875, 7.74566650390625, 7.9683837890625, 8.19110107421875, 8.413818359375, 8.63653564453125, 8.8592529296875, 9.08197021484375, 9.3046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 7.0, 4.0, 15.0, 8.0, 36.0, 41.0, 57.0, 84.0, 115.0, 201.0, 368.0, 667.0, 948.0, 652.0, 316.0, 203.0, 107.0, 73.0, 54.0, 24.0, 30.0, 19.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.2088623046875, -4.995849609375, -4.7828369140625, -4.56982421875, -4.3568115234375, -4.143798828125, -3.9307861328125, -3.7177734375, -3.5047607421875, -3.291748046875, -3.0787353515625, -2.86572265625, -2.6527099609375, -2.439697265625, -2.2266845703125, -2.013671875, -1.8006591796875, -1.587646484375, -1.3746337890625, -1.16162109375, -0.9486083984375, -0.735595703125, -0.5225830078125, -0.3095703125, -0.0965576171875, 0.116455078125, 0.3294677734375, 0.54248046875, 0.7554931640625, 0.968505859375, 1.1815185546875, 1.39453125, 1.6075439453125, 1.820556640625, 2.0335693359375, 2.24658203125, 2.4595947265625, 2.672607421875, 2.8856201171875, 3.0986328125, 3.3116455078125, 3.524658203125, 3.7376708984375, 3.95068359375, 4.1636962890625, 4.376708984375, 4.5897216796875, 4.802734375, 5.0157470703125, 5.228759765625, 5.4417724609375, 5.65478515625, 5.8677978515625, 6.080810546875, 6.2938232421875, 6.5068359375, 6.7198486328125, 6.932861328125, 7.1458740234375, 7.35888671875, 7.5718994140625, 7.784912109375, 7.9979248046875, 8.2109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 9.0, 15.0, 100.0, 282.0, 404.0, 138.0, 35.0, 13.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.06217956542969, -76.85025024414062, -72.6383285522461, -68.42640686035156, -64.2144775390625, -60.0025520324707, -55.790626525878906, -51.57870101928711, -47.36677551269531, -43.154850006103516, -38.94292449951172, -34.73099899291992, -30.519073486328125, -26.307147979736328, -22.09522247314453, -17.883296966552734, -13.671371459960938, -9.45944595336914, -5.247520446777344, -1.0355949401855469, 3.17633056640625, 7.388256072998047, 11.600181579589844, 15.81210708618164, 20.024032592773438, 24.235958099365234, 28.44788360595703, 32.65980911254883, 36.871734619140625, 41.08366012573242, 45.29558563232422, 49.507511138916016, 53.719451904296875, 57.93137741088867, 62.14330291748047, 66.355224609375, 70.56715393066406, 74.77908325195312, 78.99100494384766, 83.20292663574219, 87.41485595703125, 91.62678527832031, 95.83870697021484, 100.05062866210938, 104.26255798339844, 108.4744873046875, 112.68640899658203, 116.89833068847656, 121.11026000976562, 125.32218933105469, 129.53411865234375, 133.74603271484375, 137.9579620361328, 142.16989135742188, 146.38180541992188, 150.59373474121094, 154.8056640625, 159.01759338378906, 163.22952270507812, 167.44143676757812, 171.6533660888672, 175.86529541015625, 180.07720947265625, 184.2891387939453, 188.50106811523438]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 16.0, 12.0, 29.0, 37.0, 52.0, 37.0, 50.0, 54.0, 77.0, 92.0, 68.0, 95.0, 65.0, 69.0, 59.0, 44.0, 38.0, 23.0, 21.0, 15.0, 8.0, 4.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.531421661376953, -20.19291114807129, -18.854402542114258, -17.515892028808594, -16.177383422851562, -14.838872909545898, -13.500362396240234, -12.161852836608887, -10.823343276977539, -9.484833717346191, -8.146324157714844, -6.80781364440918, -5.469304084777832, -4.130794525146484, -2.7922840118408203, -1.4537744522094727, -0.115264892578125, 1.2232449054718018, 2.5617547035217285, 3.9002647399902344, 5.238774299621582, 6.57728385925293, 7.915794372558594, 9.254303932189941, 10.592813491821289, 11.931323051452637, 13.269832611083984, 14.608343124389648, 15.946852684020996, 17.285362243652344, 18.623872756958008, 19.962383270263672, 21.30089569091797, 22.639406204223633, 23.977914810180664, 25.316425323486328, 26.65493392944336, 27.993444442749023, 29.331954956054688, 30.67046356201172, 32.00897216796875, 33.34748077392578, 34.68599319458008, 36.02450180053711, 37.36301040649414, 38.70152282714844, 40.04003143310547, 41.3785400390625, 42.7170524597168, 44.05556106567383, 45.394073486328125, 46.732582092285156, 48.07109069824219, 49.40959930419922, 50.748111724853516, 52.08662033081055, 53.425132751464844, 54.763641357421875, 56.10215377807617, 57.4406623840332, 58.779170989990234, 60.11768341064453, 61.45619201660156, 62.794700622558594, 64.13320922851562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 30.0, 49.0, 65.0, 111.0, 211.0, 308.0, 608.0, 1142.0, 2452.0, 5553.0, 14072.0, 43485.0, 221011.0, 594097.0, 117993.0, 29059.0, 10087.0, 4151.0, 1955.0, 906.0, 462.0, 274.0, 175.0, 93.0, 54.0, 37.0, 26.0, 18.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.53955078125, -4.3603515625, -4.18115234375, -4.001953125, -3.82275390625, -3.6435546875, -3.46435546875, -3.28515625, -3.10595703125, -2.9267578125, -2.74755859375, -2.568359375, -2.38916015625, -2.2099609375, -2.03076171875, -1.8515625, -1.67236328125, -1.4931640625, -1.31396484375, -1.134765625, -0.95556640625, -0.7763671875, -0.59716796875, -0.41796875, -0.23876953125, -0.0595703125, 0.11962890625, 0.298828125, 0.47802734375, 0.6572265625, 0.83642578125, 1.015625, 1.19482421875, 1.3740234375, 1.55322265625, 1.732421875, 1.91162109375, 2.0908203125, 2.27001953125, 2.44921875, 2.62841796875, 2.8076171875, 2.98681640625, 3.166015625, 3.34521484375, 3.5244140625, 3.70361328125, 3.8828125, 4.06201171875, 4.2412109375, 4.42041015625, 4.599609375, 4.77880859375, 4.9580078125, 5.13720703125, 5.31640625, 5.49560546875, 5.6748046875, 5.85400390625, 6.033203125, 6.21240234375, 6.3916015625, 6.57080078125, 6.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 17.0, 12.0, 15.0, 18.0, 27.0, 32.0, 27.0, 36.0, 34.0, 48.0, 38.0, 59.0, 62.0, 49.0, 54.0, 64.0, 52.0, 56.0, 53.0, 38.0, 39.0, 37.0, 21.0, 18.0, 22.0, 12.0, 13.0, 8.0, 5.0, 10.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.498046875, -2.4297943115234375, -2.361541748046875, -2.2932891845703125, -2.22503662109375, -2.1567840576171875, -2.088531494140625, -2.0202789306640625, -1.9520263671875, -1.8837738037109375, -1.815521240234375, -1.7472686767578125, -1.67901611328125, -1.6107635498046875, -1.542510986328125, -1.4742584228515625, -1.406005859375, -1.3377532958984375, -1.269500732421875, -1.2012481689453125, -1.13299560546875, -1.0647430419921875, -0.996490478515625, -0.9282379150390625, -0.8599853515625, -0.7917327880859375, -0.723480224609375, -0.6552276611328125, -0.58697509765625, -0.5187225341796875, -0.450469970703125, -0.3822174072265625, -0.31396484375, -0.2457122802734375, -0.177459716796875, -0.1092071533203125, -0.04095458984375, 0.0272979736328125, 0.095550537109375, 0.1638031005859375, 0.2320556640625, 0.3003082275390625, 0.368560791015625, 0.4368133544921875, 0.50506591796875, 0.5733184814453125, 0.641571044921875, 0.7098236083984375, 0.778076171875, 0.8463287353515625, 0.914581298828125, 0.9828338623046875, 1.05108642578125, 1.1193389892578125, 1.187591552734375, 1.2558441162109375, 1.3240966796875, 1.3923492431640625, 1.460601806640625, 1.5288543701171875, 1.59710693359375, 1.6653594970703125, 1.733612060546875, 1.8018646240234375, 1.8701171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 21.0, 20.0, 28.0, 40.0, 45.0, 68.0, 120.0, 168.0, 286.0, 490.0, 892.0, 1770.0, 4364.0, 14404.0, 79786.0, 809453.0, 109615.0, 17626.0, 5092.0, 1950.0, 926.0, 477.0, 313.0, 182.0, 119.0, 69.0, 63.0, 37.0, 28.0, 18.0, 14.0, 7.0, 9.0, 7.0, 5.0, 6.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7421875, -9.47576904296875, -9.2093505859375, -8.94293212890625, -8.676513671875, -8.41009521484375, -8.1436767578125, -7.87725830078125, -7.61083984375, -7.34442138671875, -7.0780029296875, -6.81158447265625, -6.545166015625, -6.27874755859375, -6.0123291015625, -5.74591064453125, -5.4794921875, -5.21307373046875, -4.9466552734375, -4.68023681640625, -4.413818359375, -4.14739990234375, -3.8809814453125, -3.61456298828125, -3.34814453125, -3.08172607421875, -2.8153076171875, -2.54888916015625, -2.282470703125, -2.01605224609375, -1.7496337890625, -1.48321533203125, -1.216796875, -0.95037841796875, -0.6839599609375, -0.41754150390625, -0.151123046875, 0.11529541015625, 0.3817138671875, 0.64813232421875, 0.91455078125, 1.18096923828125, 1.4473876953125, 1.71380615234375, 1.980224609375, 2.24664306640625, 2.5130615234375, 2.77947998046875, 3.0458984375, 3.31231689453125, 3.5787353515625, 3.84515380859375, 4.111572265625, 4.37799072265625, 4.6444091796875, 4.91082763671875, 5.17724609375, 5.44366455078125, 5.7100830078125, 5.97650146484375, 6.242919921875, 6.50933837890625, 6.7757568359375, 7.04217529296875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 18.0, 11.0, 12.0, 16.0, 23.0, 32.0, 40.0, 44.0, 51.0, 51.0, 53.0, 56.0, 62.0, 74.0, 59.0, 58.0, 50.0, 38.0, 28.0, 39.0, 27.0, 21.0, 17.0, 13.0, 14.0, 15.0, 14.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.8934326171875, -7.607177734375, -7.3209228515625, -7.03466796875, -6.7484130859375, -6.462158203125, -6.1759033203125, -5.8896484375, -5.6033935546875, -5.317138671875, -5.0308837890625, -4.74462890625, -4.4583740234375, -4.172119140625, -3.8858642578125, -3.599609375, -3.3133544921875, -3.027099609375, -2.7408447265625, -2.45458984375, -2.1683349609375, -1.882080078125, -1.5958251953125, -1.3095703125, -1.0233154296875, -0.737060546875, -0.4508056640625, -0.16455078125, 0.1217041015625, 0.407958984375, 0.6942138671875, 0.98046875, 1.2667236328125, 1.552978515625, 1.8392333984375, 2.12548828125, 2.4117431640625, 2.697998046875, 2.9842529296875, 3.2705078125, 3.5567626953125, 3.843017578125, 4.1292724609375, 4.41552734375, 4.7017822265625, 4.988037109375, 5.2742919921875, 5.560546875, 5.8468017578125, 6.133056640625, 6.4193115234375, 6.70556640625, 6.9918212890625, 7.278076171875, 7.5643310546875, 7.8505859375, 8.1368408203125, 8.423095703125, 8.7093505859375, 8.99560546875, 9.2818603515625, 9.568115234375, 9.8543701171875, 10.140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 18.0, 28.0, 35.0, 69.0, 79.0, 161.0, 311.0, 546.0, 1159.0, 2636.0, 6806.0, 20439.0, 80486.0, 645501.0, 228415.0, 41815.0, 12162.0, 4241.0, 1797.0, 767.0, 379.0, 222.0, 148.0, 87.0, 54.0, 38.0, 27.0, 18.0, 15.0, 13.0, 13.0, 2.0, 2.0, 10.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.31451416015625, -2.2247314453125, -2.13494873046875, -2.045166015625, -1.95538330078125, -1.8656005859375, -1.77581787109375, -1.68603515625, -1.59625244140625, -1.5064697265625, -1.41668701171875, -1.326904296875, -1.23712158203125, -1.1473388671875, -1.05755615234375, -0.9677734375, -0.87799072265625, -0.7882080078125, -0.69842529296875, -0.608642578125, -0.51885986328125, -0.4290771484375, -0.33929443359375, -0.24951171875, -0.15972900390625, -0.0699462890625, 0.01983642578125, 0.109619140625, 0.19940185546875, 0.2891845703125, 0.37896728515625, 0.46875, 0.55853271484375, 0.6483154296875, 0.73809814453125, 0.827880859375, 0.91766357421875, 1.0074462890625, 1.09722900390625, 1.18701171875, 1.27679443359375, 1.3665771484375, 1.45635986328125, 1.546142578125, 1.63592529296875, 1.7257080078125, 1.81549072265625, 1.9052734375, 1.99505615234375, 2.0848388671875, 2.17462158203125, 2.264404296875, 2.35418701171875, 2.4439697265625, 2.53375244140625, 2.62353515625, 2.71331787109375, 2.8031005859375, 2.89288330078125, 2.982666015625, 3.07244873046875, 3.1622314453125, 3.25201416015625, 3.341796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 7.0, 19.0, 21.0, 24.0, 43.0, 57.0, 101.0, 134.0, 158.0, 118.0, 67.0, 55.0, 42.0, 28.0, 18.0, 21.0, 18.0, 6.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006933212280273438, -0.0006669163703918457, -0.0006405115127563477, -0.0006141066551208496, -0.0005877017974853516, -0.0005612969398498535, -0.0005348920822143555, -0.0005084872245788574, -0.0004820823669433594, -0.00045567750930786133, -0.0004292726516723633, -0.00040286779403686523, -0.0003764629364013672, -0.00035005807876586914, -0.0003236532211303711, -0.00029724836349487305, -0.000270843505859375, -0.00024443864822387695, -0.0002180337905883789, -0.00019162893295288086, -0.0001652240753173828, -0.00013881921768188477, -0.00011241436004638672, -8.600950241088867e-05, -5.9604644775390625e-05, -3.319978713989258e-05, -6.794929504394531e-06, 1.9609928131103516e-05, 4.601478576660156e-05, 7.241964340209961e-05, 9.882450103759766e-05, 0.0001252293586730957, 0.00015163421630859375, 0.0001780390739440918, 0.00020444393157958984, 0.0002308487892150879, 0.00025725364685058594, 0.000283658504486084, 0.00031006336212158203, 0.0003364682197570801, 0.0003628730773925781, 0.00038927793502807617, 0.0004156827926635742, 0.00044208765029907227, 0.0004684925079345703, 0.0004948973655700684, 0.0005213022232055664, 0.0005477070808410645, 0.0005741119384765625, 0.0006005167961120605, 0.0006269216537475586, 0.0006533265113830566, 0.0006797313690185547, 0.0007061362266540527, 0.0007325410842895508, 0.0007589459419250488, 0.0007853507995605469, 0.0008117556571960449, 0.000838160514831543, 0.000864565372467041, 0.0008909702301025391, 0.0009173750877380371, 0.0009437799453735352, 0.0009701848030090332, 0.0009965896606445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 3.0, 12.0, 14.0, 8.0, 14.0, 17.0, 27.0, 33.0, 62.0, 83.0, 121.0, 160.0, 221.0, 330.0, 567.0, 950.0, 1804.0, 3617.0, 8204.0, 21249.0, 65794.0, 289415.0, 527231.0, 84303.0, 25588.0, 9734.0, 4136.0, 1947.0, 1119.0, 623.0, 377.0, 244.0, 160.0, 95.0, 92.0, 57.0, 27.0, 29.0, 21.0, 20.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.176422119140625, -2.11065673828125, -2.044891357421875, -1.9791259765625, -1.913360595703125, -1.84759521484375, -1.781829833984375, -1.716064453125, -1.650299072265625, -1.58453369140625, -1.518768310546875, -1.4530029296875, -1.387237548828125, -1.32147216796875, -1.255706787109375, -1.18994140625, -1.124176025390625, -1.05841064453125, -0.992645263671875, -0.9268798828125, -0.861114501953125, -0.79534912109375, -0.729583740234375, -0.663818359375, -0.598052978515625, -0.53228759765625, -0.466522216796875, -0.4007568359375, -0.334991455078125, -0.26922607421875, -0.203460693359375, -0.1376953125, -0.071929931640625, -0.00616455078125, 0.059600830078125, 0.1253662109375, 0.191131591796875, 0.25689697265625, 0.322662353515625, 0.388427734375, 0.454193115234375, 0.51995849609375, 0.585723876953125, 0.6514892578125, 0.717254638671875, 0.78302001953125, 0.848785400390625, 0.91455078125, 0.980316162109375, 1.04608154296875, 1.111846923828125, 1.1776123046875, 1.243377685546875, 1.30914306640625, 1.374908447265625, 1.440673828125, 1.506439208984375, 1.57220458984375, 1.637969970703125, 1.7037353515625, 1.769500732421875, 1.83526611328125, 1.901031494140625, 1.966796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 11.0, 6.0, 15.0, 8.0, 12.0, 14.0, 20.0, 39.0, 35.0, 42.0, 64.0, 74.0, 80.0, 107.0, 105.0, 83.0, 43.0, 37.0, 41.0, 38.0, 22.0, 21.0, 11.0, 15.0, 13.0, 8.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.38739013671875, -2.3099365234375, -2.23248291015625, -2.155029296875, -2.07757568359375, -2.0001220703125, -1.92266845703125, -1.84521484375, -1.76776123046875, -1.6903076171875, -1.61285400390625, -1.535400390625, -1.45794677734375, -1.3804931640625, -1.30303955078125, -1.2255859375, -1.14813232421875, -1.0706787109375, -0.99322509765625, -0.915771484375, -0.83831787109375, -0.7608642578125, -0.68341064453125, -0.60595703125, -0.52850341796875, -0.4510498046875, -0.37359619140625, -0.296142578125, -0.21868896484375, -0.1412353515625, -0.06378173828125, 0.013671875, 0.09112548828125, 0.1685791015625, 0.24603271484375, 0.323486328125, 0.40093994140625, 0.4783935546875, 0.55584716796875, 0.63330078125, 0.71075439453125, 0.7882080078125, 0.86566162109375, 0.943115234375, 1.02056884765625, 1.0980224609375, 1.17547607421875, 1.2529296875, 1.33038330078125, 1.4078369140625, 1.48529052734375, 1.562744140625, 1.64019775390625, 1.7176513671875, 1.79510498046875, 1.87255859375, 1.95001220703125, 2.0274658203125, 2.10491943359375, 2.182373046875, 2.25982666015625, 2.3372802734375, 2.41473388671875, 2.4921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 11.0, 31.0, 63.0, 133.0, 217.0, 209.0, 133.0, 91.0, 53.0, 20.0, 7.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.09856414794922, -53.26109313964844, -51.42361831665039, -49.58614730834961, -47.74867630004883, -45.91120147705078, -44.07373046875, -42.23625946044922, -40.39878845214844, -38.561317443847656, -36.72384262084961, -34.88637161254883, -33.04890060424805, -31.211427688598633, -29.37395477294922, -27.536483764648438, -25.699010848999023, -23.86153793334961, -22.024066925048828, -20.186594009399414, -18.349123001098633, -16.51165008544922, -14.674178123474121, -12.836706161499023, -10.999234199523926, -9.161762237548828, -7.3242902755737305, -5.486817836761475, -3.649345874786377, -1.811873435974121, 0.025598526000976562, 1.8630704879760742, 3.700542449951172, 5.5380144119262695, 7.375486373901367, 9.212959289550781, 11.050430297851562, 12.887903213500977, 14.725375175476074, 16.562847137451172, 18.400318145751953, 20.237791061401367, 22.07526206970215, 23.912734985351562, 25.750205993652344, 27.587678909301758, 29.425151824951172, 31.262622833251953, 33.10009765625, 34.93756866455078, 36.77504348754883, 38.61251449584961, 40.44998550415039, 42.28746032714844, 44.12493133544922, 45.96240234375, 47.79987335205078, 49.63734436035156, 51.47481918334961, 53.31229019165039, 55.14976119995117, 56.98723602294922, 58.82470703125, 60.66217803955078, 62.49964904785156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 2.0, 19.0, 16.0, 19.0, 17.0, 14.0, 21.0, 27.0, 31.0, 29.0, 44.0, 50.0, 47.0, 77.0, 75.0, 62.0, 58.0, 76.0, 36.0, 37.0, 42.0, 27.0, 27.0, 31.0, 18.0, 13.0, 13.0, 10.0, 7.0, 10.0, 4.0, 9.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.8331413269043, -34.77885818481445, -33.72457504272461, -32.67029571533203, -31.616012573242188, -30.561729431152344, -29.5074462890625, -28.453163146972656, -27.398881912231445, -26.3445987701416, -25.29031753540039, -24.236034393310547, -23.181751251220703, -22.127470016479492, -21.07318687438965, -20.018905639648438, -18.964622497558594, -17.91033935546875, -16.85605812072754, -15.801774978637695, -14.747492790222168, -13.69321060180664, -12.638927459716797, -11.58464527130127, -10.530363082885742, -9.476080894470215, -8.421798706054688, -7.367515563964844, -6.313233375549316, -5.258951187133789, -4.2046685218811035, -3.150385856628418, -2.096101760864258, -1.0418193340301514, 0.012463092803955078, 1.0667455196380615, 2.121027946472168, 3.1753101348876953, 4.229592800140381, 5.283875465393066, 6.338157653808594, 7.392439842224121, 8.446722030639648, 9.501005172729492, 10.55528736114502, 11.609569549560547, 12.66385269165039, 13.718134880065918, 14.772417068481445, 15.826699256896973, 16.8809814453125, 17.935264587402344, 18.989547729492188, 20.0438289642334, 21.098112106323242, 22.152393341064453, 23.206676483154297, 24.26095962524414, 25.31524085998535, 26.369524002075195, 27.423805236816406, 28.47808837890625, 29.532371520996094, 30.586654663085938, 31.64093589782715]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 5.0, 5.0, 15.0, 7.0, 16.0, 22.0, 31.0, 36.0, 77.0, 103.0, 186.0, 328.0, 646.0, 1432.0, 3471.0, 9644.0, 32890.0, 186602.0, 2523138.0, 1294798.0, 104330.0, 23444.0, 7708.0, 2893.0, 1252.0, 558.0, 270.0, 149.0, 71.0, 37.0, 33.0, 28.0, 15.0, 9.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0], "bins": [-5.25, -5.12750244140625, -5.0050048828125, -4.88250732421875, -4.760009765625, -4.63751220703125, -4.5150146484375, -4.39251708984375, -4.27001953125, -4.14752197265625, -4.0250244140625, -3.90252685546875, -3.780029296875, -3.65753173828125, -3.5350341796875, -3.41253662109375, -3.2900390625, -3.16754150390625, -3.0450439453125, -2.92254638671875, -2.800048828125, -2.67755126953125, -2.5550537109375, -2.43255615234375, -2.31005859375, -2.18756103515625, -2.0650634765625, -1.94256591796875, -1.820068359375, -1.69757080078125, -1.5750732421875, -1.45257568359375, -1.330078125, -1.20758056640625, -1.0850830078125, -0.96258544921875, -0.840087890625, -0.71759033203125, -0.5950927734375, -0.47259521484375, -0.35009765625, -0.22760009765625, -0.1051025390625, 0.01739501953125, 0.139892578125, 0.26239013671875, 0.3848876953125, 0.50738525390625, 0.6298828125, 0.75238037109375, 0.8748779296875, 0.99737548828125, 1.119873046875, 1.24237060546875, 1.3648681640625, 1.48736572265625, 1.60986328125, 1.73236083984375, 1.8548583984375, 1.97735595703125, 2.099853515625, 2.22235107421875, 2.3448486328125, 2.46734619140625, 2.58984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 7.0, 16.0, 12.0, 14.0, 20.0, 21.0, 25.0, 35.0, 37.0, 52.0, 47.0, 50.0, 67.0, 62.0, 53.0, 59.0, 55.0, 51.0, 61.0, 60.0, 41.0, 33.0, 22.0, 25.0, 23.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.904144287109375, -2.83172607421875, -2.759307861328125, -2.6868896484375, -2.614471435546875, -2.54205322265625, -2.469635009765625, -2.397216796875, -2.324798583984375, -2.25238037109375, -2.179962158203125, -2.1075439453125, -2.035125732421875, -1.96270751953125, -1.890289306640625, -1.81787109375, -1.745452880859375, -1.67303466796875, -1.600616455078125, -1.5281982421875, -1.455780029296875, -1.38336181640625, -1.310943603515625, -1.238525390625, -1.166107177734375, -1.09368896484375, -1.021270751953125, -0.9488525390625, -0.876434326171875, -0.80401611328125, -0.731597900390625, -0.6591796875, -0.586761474609375, -0.51434326171875, -0.441925048828125, -0.3695068359375, -0.297088623046875, -0.22467041015625, -0.152252197265625, -0.079833984375, -0.007415771484375, 0.06500244140625, 0.137420654296875, 0.2098388671875, 0.282257080078125, 0.35467529296875, 0.427093505859375, 0.49951171875, 0.571929931640625, 0.64434814453125, 0.716766357421875, 0.7891845703125, 0.861602783203125, 0.93402099609375, 1.006439208984375, 1.078857421875, 1.151275634765625, 1.22369384765625, 1.296112060546875, 1.3685302734375, 1.440948486328125, 1.51336669921875, 1.585784912109375, 1.658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 9.0, 5.0, 5.0, 12.0, 13.0, 26.0, 33.0, 55.0, 106.0, 170.0, 346.0, 683.0, 1426.0, 3606.0, 9987.0, 32886.0, 170092.0, 2864419.0, 996518.0, 82217.0, 19958.0, 6637.0, 2547.0, 1156.0, 562.0, 304.0, 183.0, 105.0, 52.0, 44.0, 36.0, 14.0, 14.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.8037109375, -4.642578125, -4.4814453125, -4.3203125, -4.1591796875, -3.998046875, -3.8369140625, -3.67578125, -3.5146484375, -3.353515625, -3.1923828125, -3.03125, -2.8701171875, -2.708984375, -2.5478515625, -2.38671875, -2.2255859375, -2.064453125, -1.9033203125, -1.7421875, -1.5810546875, -1.419921875, -1.2587890625, -1.09765625, -0.9365234375, -0.775390625, -0.6142578125, -0.453125, -0.2919921875, -0.130859375, 0.0302734375, 0.19140625, 0.3525390625, 0.513671875, 0.6748046875, 0.8359375, 0.9970703125, 1.158203125, 1.3193359375, 1.48046875, 1.6416015625, 1.802734375, 1.9638671875, 2.125, 2.2861328125, 2.447265625, 2.6083984375, 2.76953125, 2.9306640625, 3.091796875, 3.2529296875, 3.4140625, 3.5751953125, 3.736328125, 3.8974609375, 4.05859375, 4.2197265625, 4.380859375, 4.5419921875, 4.703125, 4.8642578125, 5.025390625, 5.1865234375, 5.34765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 18.0, 16.0, 21.0, 25.0, 38.0, 57.0, 78.0, 113.0, 182.0, 365.0, 704.0, 850.0, 638.0, 385.0, 205.0, 127.0, 63.0, 43.0, 36.0, 19.0, 14.0, 18.0, 7.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.99029541015625, -3.8126220703125, -3.63494873046875, -3.457275390625, -3.27960205078125, -3.1019287109375, -2.92425537109375, -2.74658203125, -2.56890869140625, -2.3912353515625, -2.21356201171875, -2.035888671875, -1.85821533203125, -1.6805419921875, -1.50286865234375, -1.3251953125, -1.14752197265625, -0.9698486328125, -0.79217529296875, -0.614501953125, -0.43682861328125, -0.2591552734375, -0.08148193359375, 0.09619140625, 0.27386474609375, 0.4515380859375, 0.62921142578125, 0.806884765625, 0.98455810546875, 1.1622314453125, 1.33990478515625, 1.517578125, 1.69525146484375, 1.8729248046875, 2.05059814453125, 2.228271484375, 2.40594482421875, 2.5836181640625, 2.76129150390625, 2.93896484375, 3.11663818359375, 3.2943115234375, 3.47198486328125, 3.649658203125, 3.82733154296875, 4.0050048828125, 4.18267822265625, 4.3603515625, 4.53802490234375, 4.7156982421875, 4.89337158203125, 5.071044921875, 5.24871826171875, 5.4263916015625, 5.60406494140625, 5.78173828125, 5.95941162109375, 6.1370849609375, 6.31475830078125, 6.492431640625, 6.67010498046875, 6.8477783203125, 7.02545166015625, 7.203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 12.0, 23.0, 79.0, 150.0, 251.0, 245.0, 140.0, 50.0, 18.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.43997192382812, -87.19168853759766, -84.94339752197266, -82.69511413574219, -80.44683074951172, -78.19854736328125, -75.95025634765625, -73.70197296142578, -71.45368957519531, -69.20540618896484, -66.95711517333984, -64.70883178710938, -62.460548400878906, -60.21226119995117, -57.96397399902344, -55.71569061279297, -53.467403411865234, -51.2191162109375, -48.97083282470703, -46.7225456237793, -44.47426223754883, -42.225975036621094, -39.977691650390625, -37.72940444946289, -35.481117248535156, -33.23283004760742, -30.984546661376953, -28.73625946044922, -26.48797607421875, -24.239688873291016, -21.991403579711914, -19.743118286132812, -17.494834899902344, -15.246549606323242, -12.99826431274414, -10.749978065490723, -8.501692771911621, -6.2534074783325195, -4.005121231079102, -1.7568359375, 0.49144935607910156, 2.7397348880767822, 4.988020420074463, 7.236306190490723, 9.484591484069824, 11.732876777648926, 13.981163024902344, 16.229448318481445, 18.477733612060547, 20.72601890563965, 22.97430419921875, 25.222591400146484, 27.470874786376953, 29.719161987304688, 31.96744728088379, 34.21573257446289, 36.464019775390625, 38.71230697631836, 40.96059036254883, 43.20887756347656, 45.45716094970703, 47.705448150634766, 49.9537353515625, 52.20201873779297, 54.45030212402344]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 13.0, 9.0, 15.0, 21.0, 24.0, 19.0, 18.0, 19.0, 20.0, 35.0, 46.0, 30.0, 38.0, 48.0, 57.0, 53.0, 37.0, 48.0, 52.0, 34.0, 44.0, 32.0, 44.0, 21.0, 25.0, 25.0, 27.0, 27.0, 20.0, 12.0, 17.0, 16.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.417434692382812, -21.777280807495117, -21.137126922607422, -20.49697494506836, -19.856821060180664, -19.21666717529297, -18.576513290405273, -17.936359405517578, -17.296207427978516, -16.65605354309082, -16.015899658203125, -15.375746726989746, -14.735593795776367, -14.095439910888672, -13.455286026000977, -12.815133094787598, -12.174979209899902, -11.534825325012207, -10.894672393798828, -10.254518508911133, -9.614365577697754, -8.974211692810059, -8.33405876159668, -7.693904876708984, -7.053751468658447, -6.41359806060791, -5.773444652557373, -5.133291244506836, -4.493137359619141, -3.8529841899871826, -3.2128305435180664, -2.5726771354675293, -1.9325237274169922, -1.292370319366455, -0.6522167921066284, -0.012063264846801758, 0.6280901432037354, 1.2682435512542725, 1.9083971977233887, 2.548550605773926, 3.188704013824463, 3.828857421875, 4.469010829925537, 5.109164237976074, 5.7493181228637695, 6.389471054077148, 7.029624938964844, 7.669778347015381, 8.309931755065918, 8.950085639953613, 9.590238571166992, 10.230392456054688, 10.870545387268066, 11.510699272155762, 12.15085220336914, 12.791006088256836, 13.431159973144531, 14.071313858032227, 14.711466789245605, 15.3516206741333, 15.99177360534668, 16.631927490234375, 17.27208137512207, 17.912235260009766, 18.552387237548828]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 24.0, 17.0, 40.0, 46.0, 57.0, 106.0, 156.0, 239.0, 387.0, 573.0, 951.0, 1729.0, 3391.0, 7068.0, 18173.0, 64472.0, 289377.0, 467499.0, 139740.0, 33015.0, 10933.0, 4843.0, 2380.0, 1259.0, 738.0, 455.0, 294.0, 184.0, 106.0, 96.0, 62.0, 38.0, 27.0, 22.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.09173583984375, -2.9822998046875, -2.87286376953125, -2.763427734375, -2.65399169921875, -2.5445556640625, -2.43511962890625, -2.32568359375, -2.21624755859375, -2.1068115234375, -1.99737548828125, -1.887939453125, -1.77850341796875, -1.6690673828125, -1.55963134765625, -1.4501953125, -1.34075927734375, -1.2313232421875, -1.12188720703125, -1.012451171875, -0.90301513671875, -0.7935791015625, -0.68414306640625, -0.57470703125, -0.46527099609375, -0.3558349609375, -0.24639892578125, -0.136962890625, -0.02752685546875, 0.0819091796875, 0.19134521484375, 0.30078125, 0.41021728515625, 0.5196533203125, 0.62908935546875, 0.738525390625, 0.84796142578125, 0.9573974609375, 1.06683349609375, 1.17626953125, 1.28570556640625, 1.3951416015625, 1.50457763671875, 1.614013671875, 1.72344970703125, 1.8328857421875, 1.94232177734375, 2.0517578125, 2.16119384765625, 2.2706298828125, 2.38006591796875, 2.489501953125, 2.59893798828125, 2.7083740234375, 2.81781005859375, 2.92724609375, 3.03668212890625, 3.1461181640625, 3.25555419921875, 3.364990234375, 3.47442626953125, 3.5838623046875, 3.69329833984375, 3.802734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 17.0, 16.0, 21.0, 27.0, 18.0, 29.0, 46.0, 42.0, 44.0, 61.0, 50.0, 57.0, 53.0, 64.0, 66.0, 57.0, 46.0, 36.0, 36.0, 31.0, 32.0, 24.0, 21.0, 12.0, 16.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.869140625, -2.7957916259765625, -2.722442626953125, -2.6490936279296875, -2.57574462890625, -2.5023956298828125, -2.429046630859375, -2.3556976318359375, -2.2823486328125, -2.2089996337890625, -2.135650634765625, -2.0623016357421875, -1.98895263671875, -1.9156036376953125, -1.842254638671875, -1.7689056396484375, -1.695556640625, -1.6222076416015625, -1.548858642578125, -1.4755096435546875, -1.40216064453125, -1.3288116455078125, -1.255462646484375, -1.1821136474609375, -1.1087646484375, -1.0354156494140625, -0.962066650390625, -0.8887176513671875, -0.81536865234375, -0.7420196533203125, -0.668670654296875, -0.5953216552734375, -0.52197265625, -0.4486236572265625, -0.375274658203125, -0.3019256591796875, -0.22857666015625, -0.1552276611328125, -0.081878662109375, -0.0085296630859375, 0.0648193359375, 0.1381683349609375, 0.211517333984375, 0.2848663330078125, 0.35821533203125, 0.4315643310546875, 0.504913330078125, 0.5782623291015625, 0.651611328125, 0.7249603271484375, 0.798309326171875, 0.8716583251953125, 0.94500732421875, 1.0183563232421875, 1.091705322265625, 1.1650543212890625, 1.2384033203125, 1.3117523193359375, 1.385101318359375, 1.4584503173828125, 1.53179931640625, 1.6051483154296875, 1.678497314453125, 1.7518463134765625, 1.8251953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 10.0, 20.0, 25.0, 39.0, 62.0, 93.0, 128.0, 279.0, 615.0, 1414.0, 3743.0, 15811.0, 161969.0, 778769.0, 71215.0, 9423.0, 2776.0, 1057.0, 477.0, 261.0, 139.0, 73.0, 46.0, 33.0, 21.0, 13.0, 9.0, 9.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.2042236328125, -5.013916015625, -4.8236083984375, -4.63330078125, -4.4429931640625, -4.252685546875, -4.0623779296875, -3.8720703125, -3.6817626953125, -3.491455078125, -3.3011474609375, -3.11083984375, -2.9205322265625, -2.730224609375, -2.5399169921875, -2.349609375, -2.1593017578125, -1.968994140625, -1.7786865234375, -1.58837890625, -1.3980712890625, -1.207763671875, -1.0174560546875, -0.8271484375, -0.6368408203125, -0.446533203125, -0.2562255859375, -0.06591796875, 0.1243896484375, 0.314697265625, 0.5050048828125, 0.6953125, 0.8856201171875, 1.075927734375, 1.2662353515625, 1.45654296875, 1.6468505859375, 1.837158203125, 2.0274658203125, 2.2177734375, 2.4080810546875, 2.598388671875, 2.7886962890625, 2.97900390625, 3.1693115234375, 3.359619140625, 3.5499267578125, 3.740234375, 3.9305419921875, 4.120849609375, 4.3111572265625, 4.50146484375, 4.6917724609375, 4.882080078125, 5.0723876953125, 5.2626953125, 5.4530029296875, 5.643310546875, 5.8336181640625, 6.02392578125, 6.2142333984375, 6.404541015625, 6.5948486328125, 6.78515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 11.0, 15.0, 23.0, 13.0, 18.0, 19.0, 24.0, 42.0, 51.0, 37.0, 41.0, 41.0, 45.0, 50.0, 57.0, 59.0, 39.0, 51.0, 36.0, 45.0, 30.0, 25.0, 28.0, 25.0, 31.0, 24.0, 26.0, 12.0, 13.0, 17.0, 2.0, 3.0, 8.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.63671875, -7.4022216796875, -7.167724609375, -6.9332275390625, -6.69873046875, -6.4642333984375, -6.229736328125, -5.9952392578125, -5.7607421875, -5.5262451171875, -5.291748046875, -5.0572509765625, -4.82275390625, -4.5882568359375, -4.353759765625, -4.1192626953125, -3.884765625, -3.6502685546875, -3.415771484375, -3.1812744140625, -2.94677734375, -2.7122802734375, -2.477783203125, -2.2432861328125, -2.0087890625, -1.7742919921875, -1.539794921875, -1.3052978515625, -1.07080078125, -0.8363037109375, -0.601806640625, -0.3673095703125, -0.1328125, 0.1016845703125, 0.336181640625, 0.5706787109375, 0.80517578125, 1.0396728515625, 1.274169921875, 1.5086669921875, 1.7431640625, 1.9776611328125, 2.212158203125, 2.4466552734375, 2.68115234375, 2.9156494140625, 3.150146484375, 3.3846435546875, 3.619140625, 3.8536376953125, 4.088134765625, 4.3226318359375, 4.55712890625, 4.7916259765625, 5.026123046875, 5.2606201171875, 5.4951171875, 5.7296142578125, 5.964111328125, 6.1986083984375, 6.43310546875, 6.6676025390625, 6.902099609375, 7.1365966796875, 7.37109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 14.0, 13.0, 36.0, 78.0, 126.0, 246.0, 513.0, 1099.0, 2867.0, 10215.0, 48258.0, 349253.0, 563153.0, 55687.0, 11370.0, 3415.0, 1171.0, 498.0, 251.0, 112.0, 82.0, 36.0, 16.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.229400634765625, -2.16192626953125, -2.094451904296875, -2.0269775390625, -1.959503173828125, -1.89202880859375, -1.824554443359375, -1.757080078125, -1.689605712890625, -1.62213134765625, -1.554656982421875, -1.4871826171875, -1.419708251953125, -1.35223388671875, -1.284759521484375, -1.21728515625, -1.149810791015625, -1.08233642578125, -1.014862060546875, -0.9473876953125, -0.879913330078125, -0.81243896484375, -0.744964599609375, -0.677490234375, -0.610015869140625, -0.54254150390625, -0.475067138671875, -0.4075927734375, -0.340118408203125, -0.27264404296875, -0.205169677734375, -0.1376953125, -0.070220947265625, -0.00274658203125, 0.064727783203125, 0.1322021484375, 0.199676513671875, 0.26715087890625, 0.334625244140625, 0.402099609375, 0.469573974609375, 0.53704833984375, 0.604522705078125, 0.6719970703125, 0.739471435546875, 0.80694580078125, 0.874420166015625, 0.94189453125, 1.009368896484375, 1.07684326171875, 1.144317626953125, 1.2117919921875, 1.279266357421875, 1.34674072265625, 1.414215087890625, 1.481689453125, 1.549163818359375, 1.61663818359375, 1.684112548828125, 1.7515869140625, 1.819061279296875, 1.88653564453125, 1.954010009765625, 2.021484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 11.0, 5.0, 16.0, 13.0, 15.0, 29.0, 47.0, 52.0, 70.0, 111.0, 112.0, 125.0, 117.0, 81.0, 67.0, 25.0, 30.0, 16.0, 15.0, 10.0, 3.0, 6.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038123130798339844, -0.00036537274718284607, -0.0003495141863822937, -0.00033365562558174133, -0.00031779706478118896, -0.0003019385039806366, -0.00028607994318008423, -0.00027022138237953186, -0.0002543628215789795, -0.00023850426077842712, -0.00022264569997787476, -0.0002067871391773224, -0.00019092857837677002, -0.00017507001757621765, -0.00015921145677566528, -0.00014335289597511292, -0.00012749433517456055, -0.00011163577437400818, -9.577721357345581e-05, -7.991865277290344e-05, -6.406009197235107e-05, -4.8201531171798706e-05, -3.234297037124634e-05, -1.648440957069397e-05, -6.258487701416016e-07, 1.5232712030410767e-05, 3.1091272830963135e-05, 4.69498336315155e-05, 6.280839443206787e-05, 7.866695523262024e-05, 9.452551603317261e-05, 0.00011038407683372498, 0.00012624263763427734, 0.0001421011984348297, 0.00015795975923538208, 0.00017381832003593445, 0.00018967688083648682, 0.00020553544163703918, 0.00022139400243759155, 0.00023725256323814392, 0.0002531111240386963, 0.00026896968483924866, 0.000284828245639801, 0.0003006868064403534, 0.00031654536724090576, 0.00033240392804145813, 0.0003482624888420105, 0.00036412104964256287, 0.00037997961044311523, 0.0003958381712436676, 0.00041169673204421997, 0.00042755529284477234, 0.0004434138536453247, 0.0004592724144458771, 0.00047513097524642944, 0.0004909895360469818, 0.0005068480968475342, 0.0005227066576480865, 0.0005385652184486389, 0.0005544237792491913, 0.0005702823400497437, 0.000586140900850296, 0.0006019994616508484, 0.0006178580224514008, 0.0006337165832519531]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 12.0, 30.0, 45.0, 80.0, 151.0, 346.0, 1132.0, 5459.0, 60354.0, 884139.0, 87844.0, 6841.0, 1349.0, 406.0, 155.0, 99.0, 38.0, 24.0, 11.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.938812255859375, -4.80731201171875, -4.675811767578125, -4.5443115234375, -4.412811279296875, -4.28131103515625, -4.149810791015625, -4.018310546875, -3.886810302734375, -3.75531005859375, -3.623809814453125, -3.4923095703125, -3.360809326171875, -3.22930908203125, -3.097808837890625, -2.96630859375, -2.834808349609375, -2.70330810546875, -2.571807861328125, -2.4403076171875, -2.308807373046875, -2.17730712890625, -2.045806884765625, -1.914306640625, -1.782806396484375, -1.65130615234375, -1.519805908203125, -1.3883056640625, -1.256805419921875, -1.12530517578125, -0.993804931640625, -0.8623046875, -0.730804443359375, -0.59930419921875, -0.467803955078125, -0.3363037109375, -0.204803466796875, -0.07330322265625, 0.058197021484375, 0.189697265625, 0.321197509765625, 0.45269775390625, 0.584197998046875, 0.7156982421875, 0.847198486328125, 0.97869873046875, 1.110198974609375, 1.24169921875, 1.373199462890625, 1.50469970703125, 1.636199951171875, 1.7677001953125, 1.899200439453125, 2.03070068359375, 2.162200927734375, 2.293701171875, 2.425201416015625, 2.55670166015625, 2.688201904296875, 2.8197021484375, 2.951202392578125, 3.08270263671875, 3.214202880859375, 3.345703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 11.0, 7.0, 12.0, 22.0, 19.0, 38.0, 39.0, 57.0, 65.0, 84.0, 86.0, 80.0, 98.0, 87.0, 75.0, 45.0, 32.0, 33.0, 18.0, 22.0, 11.0, 12.0, 5.0, 7.0, 9.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.35791015625, -2.2958984375, -2.23388671875, -2.171875, -2.10986328125, -2.0478515625, -1.98583984375, -1.923828125, -1.86181640625, -1.7998046875, -1.73779296875, -1.67578125, -1.61376953125, -1.5517578125, -1.48974609375, -1.427734375, -1.36572265625, -1.3037109375, -1.24169921875, -1.1796875, -1.11767578125, -1.0556640625, -0.99365234375, -0.931640625, -0.86962890625, -0.8076171875, -0.74560546875, -0.68359375, -0.62158203125, -0.5595703125, -0.49755859375, -0.435546875, -0.37353515625, -0.3115234375, -0.24951171875, -0.1875, -0.12548828125, -0.0634765625, -0.00146484375, 0.060546875, 0.12255859375, 0.1845703125, 0.24658203125, 0.30859375, 0.37060546875, 0.4326171875, 0.49462890625, 0.556640625, 0.61865234375, 0.6806640625, 0.74267578125, 0.8046875, 0.86669921875, 0.9287109375, 0.99072265625, 1.052734375, 1.11474609375, 1.1767578125, 1.23876953125, 1.30078125, 1.36279296875, 1.4248046875, 1.48681640625, 1.548828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 8.0, 16.0, 19.0, 32.0, 78.0, 144.0, 247.0, 228.0, 116.0, 55.0, 24.0, 8.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.43402862548828, -44.93017578125, -43.42632293701172, -41.9224739074707, -40.41862106323242, -38.91476821899414, -37.410919189453125, -35.907066345214844, -34.40321350097656, -32.89936065673828, -31.395509719848633, -29.891658782958984, -28.387805938720703, -26.883953094482422, -25.380102157592773, -23.876251220703125, -22.372398376464844, -20.868545532226562, -19.364694595336914, -17.860843658447266, -16.356990814208984, -14.85313892364502, -13.349287033081055, -11.84543514251709, -10.341583251953125, -8.83773136138916, -7.333879470825195, -5.8300275802612305, -4.326175689697266, -2.822323799133301, -1.318471908569336, 0.1853799819946289, 1.6892318725585938, 3.1930837631225586, 4.696935653686523, 6.200787544250488, 7.704639434814453, 9.208491325378418, 10.712343215942383, 12.216195106506348, 13.720046997070312, 15.223898887634277, 16.727750778198242, 18.23160171508789, 19.735454559326172, 21.239307403564453, 22.7431583404541, 24.24700927734375, 25.75086212158203, 27.254714965820312, 28.75856590270996, 30.26241683959961, 31.76626968383789, 33.27012252807617, 34.77397155761719, 36.27782440185547, 37.78167724609375, 39.28553009033203, 40.78938293457031, 42.29323196411133, 43.79708480834961, 45.30093765258789, 46.804786682128906, 48.30863952636719, 49.81249237060547]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 4.0, 12.0, 10.0, 11.0, 17.0, 12.0, 18.0, 27.0, 16.0, 27.0, 33.0, 28.0, 39.0, 34.0, 60.0, 68.0, 80.0, 63.0, 73.0, 56.0, 42.0, 30.0, 32.0, 27.0, 20.0, 19.0, 31.0, 14.0, 10.0, 15.0, 10.0, 9.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.821874618530273, -29.876317977905273, -28.930763244628906, -27.985206604003906, -27.039649963378906, -26.094093322753906, -25.148536682128906, -24.20298194885254, -23.25742530822754, -22.31186866760254, -21.366313934326172, -20.420757293701172, -19.475200653076172, -18.529644012451172, -17.584087371826172, -16.638532638549805, -15.692975997924805, -14.747419357299805, -13.801863670349121, -12.856307983398438, -11.910751342773438, -10.965194702148438, -10.019639015197754, -9.07408332824707, -8.12852668762207, -7.1829705238342285, -6.237414360046387, -5.291858196258545, -4.346302032470703, -3.4007458686828613, -2.4551897048950195, -1.5096335411071777, -0.5640754699707031, 0.38148069381713867, 1.3270368576049805, 2.2725930213928223, 3.218149185180664, 4.163705348968506, 5.109261512756348, 6.0548176765441895, 7.000373840332031, 7.945930004119873, 8.891486167907715, 9.837041854858398, 10.782598495483398, 11.728155136108398, 12.673710823059082, 13.619266510009766, 14.564823150634766, 15.510379791259766, 16.455936431884766, 17.401491165161133, 18.347047805786133, 19.292604446411133, 20.2381591796875, 21.1837158203125, 22.1292724609375, 23.0748291015625, 24.0203857421875, 24.965940475463867, 25.911497116088867, 26.857053756713867, 27.802608489990234, 28.748165130615234, 29.693721771240234]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 16.0, 18.0, 46.0, 55.0, 97.0, 180.0, 334.0, 557.0, 1181.0, 2680.0, 6723.0, 20845.0, 100576.0, 1197512.0, 2591532.0, 220243.0, 34329.0, 9964.0, 3914.0, 1664.0, 814.0, 432.0, 211.0, 131.0, 65.0, 50.0, 29.0, 22.0, 9.0, 11.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.244293212890625, -3.13311767578125, -3.021942138671875, -2.9107666015625, -2.799591064453125, -2.68841552734375, -2.577239990234375, -2.466064453125, -2.354888916015625, -2.24371337890625, -2.132537841796875, -2.0213623046875, -1.910186767578125, -1.79901123046875, -1.687835693359375, -1.57666015625, -1.465484619140625, -1.35430908203125, -1.243133544921875, -1.1319580078125, -1.020782470703125, -0.90960693359375, -0.798431396484375, -0.687255859375, -0.576080322265625, -0.46490478515625, -0.353729248046875, -0.2425537109375, -0.131378173828125, -0.02020263671875, 0.090972900390625, 0.2021484375, 0.313323974609375, 0.42449951171875, 0.535675048828125, 0.6468505859375, 0.758026123046875, 0.86920166015625, 0.980377197265625, 1.091552734375, 1.202728271484375, 1.31390380859375, 1.425079345703125, 1.5362548828125, 1.647430419921875, 1.75860595703125, 1.869781494140625, 1.98095703125, 2.092132568359375, 2.20330810546875, 2.314483642578125, 2.4256591796875, 2.536834716796875, 2.64801025390625, 2.759185791015625, 2.870361328125, 2.981536865234375, 3.09271240234375, 3.203887939453125, 3.3150634765625, 3.426239013671875, 3.53741455078125, 3.648590087890625, 3.759765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 8.0, 10.0, 16.0, 9.0, 23.0, 21.0, 20.0, 37.0, 33.0, 46.0, 39.0, 47.0, 43.0, 47.0, 46.0, 54.0, 50.0, 47.0, 47.0, 43.0, 47.0, 50.0, 34.0, 35.0, 23.0, 18.0, 24.0, 17.0, 11.0, 15.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3984375, -2.33551025390625, -2.2725830078125, -2.20965576171875, -2.146728515625, -2.08380126953125, -2.0208740234375, -1.95794677734375, -1.89501953125, -1.83209228515625, -1.7691650390625, -1.70623779296875, -1.643310546875, -1.58038330078125, -1.5174560546875, -1.45452880859375, -1.3916015625, -1.32867431640625, -1.2657470703125, -1.20281982421875, -1.139892578125, -1.07696533203125, -1.0140380859375, -0.95111083984375, -0.88818359375, -0.82525634765625, -0.7623291015625, -0.69940185546875, -0.636474609375, -0.57354736328125, -0.5106201171875, -0.44769287109375, -0.384765625, -0.32183837890625, -0.2589111328125, -0.19598388671875, -0.133056640625, -0.07012939453125, -0.0072021484375, 0.05572509765625, 0.11865234375, 0.18157958984375, 0.2445068359375, 0.30743408203125, 0.370361328125, 0.43328857421875, 0.4962158203125, 0.55914306640625, 0.6220703125, 0.68499755859375, 0.7479248046875, 0.81085205078125, 0.873779296875, 0.93670654296875, 0.9996337890625, 1.06256103515625, 1.12548828125, 1.18841552734375, 1.2513427734375, 1.31427001953125, 1.377197265625, 1.44012451171875, 1.5030517578125, 1.56597900390625, 1.62890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 17.0, 13.0, 20.0, 29.0, 52.0, 100.0, 202.0, 512.0, 1536.0, 5289.0, 26583.0, 329817.0, 3647591.0, 159001.0, 17471.0, 3883.0, 1223.0, 463.0, 201.0, 112.0, 55.0, 29.0, 20.0, 18.0, 9.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.06951904296875, -6.8577880859375, -6.64605712890625, -6.434326171875, -6.22259521484375, -6.0108642578125, -5.79913330078125, -5.58740234375, -5.37567138671875, -5.1639404296875, -4.95220947265625, -4.740478515625, -4.52874755859375, -4.3170166015625, -4.10528564453125, -3.8935546875, -3.68182373046875, -3.4700927734375, -3.25836181640625, -3.046630859375, -2.83489990234375, -2.6231689453125, -2.41143798828125, -2.19970703125, -1.98797607421875, -1.7762451171875, -1.56451416015625, -1.352783203125, -1.14105224609375, -0.9293212890625, -0.71759033203125, -0.505859375, -0.29412841796875, -0.0823974609375, 0.12933349609375, 0.341064453125, 0.55279541015625, 0.7645263671875, 0.97625732421875, 1.18798828125, 1.39971923828125, 1.6114501953125, 1.82318115234375, 2.034912109375, 2.24664306640625, 2.4583740234375, 2.67010498046875, 2.8818359375, 3.09356689453125, 3.3052978515625, 3.51702880859375, 3.728759765625, 3.94049072265625, 4.1522216796875, 4.36395263671875, 4.57568359375, 4.78741455078125, 4.9991455078125, 5.21087646484375, 5.422607421875, 5.63433837890625, 5.8460693359375, 6.05780029296875, 6.26953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 9.0, 12.0, 6.0, 9.0, 15.0, 16.0, 25.0, 36.0, 63.0, 61.0, 97.0, 182.0, 320.0, 528.0, 822.0, 693.0, 427.0, 265.0, 159.0, 95.0, 70.0, 37.0, 26.0, 28.0, 18.0, 10.0, 9.0, 5.0, 4.0, 11.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.380615234375, -4.23388671875, -4.087158203125, -3.9404296875, -3.793701171875, -3.64697265625, -3.500244140625, -3.353515625, -3.206787109375, -3.06005859375, -2.913330078125, -2.7666015625, -2.619873046875, -2.47314453125, -2.326416015625, -2.1796875, -2.032958984375, -1.88623046875, -1.739501953125, -1.5927734375, -1.446044921875, -1.29931640625, -1.152587890625, -1.005859375, -0.859130859375, -0.71240234375, -0.565673828125, -0.4189453125, -0.272216796875, -0.12548828125, 0.021240234375, 0.16796875, 0.314697265625, 0.46142578125, 0.608154296875, 0.7548828125, 0.901611328125, 1.04833984375, 1.195068359375, 1.341796875, 1.488525390625, 1.63525390625, 1.781982421875, 1.9287109375, 2.075439453125, 2.22216796875, 2.368896484375, 2.515625, 2.662353515625, 2.80908203125, 2.955810546875, 3.1025390625, 3.249267578125, 3.39599609375, 3.542724609375, 3.689453125, 3.836181640625, 3.98291015625, 4.129638671875, 4.2763671875, 4.423095703125, 4.56982421875, 4.716552734375, 4.86328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 27.0, 56.0, 70.0, 104.0, 138.0, 125.0, 128.0, 96.0, 81.0, 44.0, 34.0, 25.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59521484375, -39.510807037353516, -38.42639923095703, -37.34198760986328, -36.2575798034668, -35.17317199707031, -34.08876037597656, -33.00435256958008, -31.919944763183594, -30.83553695678711, -29.751127243041992, -28.666717529296875, -27.58230972290039, -26.497901916503906, -25.41349220275879, -24.329082489013672, -23.244674682617188, -22.160266876220703, -21.075857162475586, -19.99144744873047, -18.907039642333984, -17.8226318359375, -16.738222122192383, -15.653813362121582, -14.569404602050781, -13.48499584197998, -12.40058708190918, -11.316178321838379, -10.231769561767578, -9.147360801696777, -8.062952041625977, -6.978543281555176, -5.894136428833008, -4.809727668762207, -3.7253189086914062, -2.6409101486206055, -1.5565013885498047, -0.4720926284790039, 0.6123161315917969, 1.6967248916625977, 2.7811336517333984, 3.865542411804199, 4.949951171875, 6.034359931945801, 7.118768692016602, 8.203177452087402, 9.287586212158203, 10.371994972229004, 11.456403732299805, 12.540812492370605, 13.625221252441406, 14.709630012512207, 15.794038772583008, 16.878448486328125, 17.96285629272461, 19.047264099121094, 20.13167381286621, 21.216083526611328, 22.300491333007812, 23.384899139404297, 24.469308853149414, 25.55371856689453, 26.638126373291016, 27.7225341796875, 28.806943893432617]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 14.0, 23.0, 18.0, 20.0, 37.0, 37.0, 35.0, 51.0, 55.0, 46.0, 55.0, 69.0, 88.0, 66.0, 63.0, 47.0, 35.0, 40.0, 34.0, 33.0, 20.0, 21.0, 20.0, 21.0, 5.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-29.58866310119629, -28.84001922607422, -28.09137535095215, -27.342731475830078, -26.59408950805664, -25.84544563293457, -25.0968017578125, -24.34815788269043, -23.59951400756836, -22.85087013244629, -22.10222625732422, -21.35358428955078, -20.60494041442871, -19.85629653930664, -19.10765266418457, -18.3590087890625, -17.610366821289062, -16.861722946166992, -16.113079071044922, -15.364436149597168, -14.615793228149414, -13.867149353027344, -13.118505477905273, -12.369861602783203, -11.62121868133545, -10.872574806213379, -10.123931884765625, -9.375288009643555, -8.626644134521484, -7.8780012130737305, -7.12935733795166, -6.380713939666748, -5.632072448730469, -4.883429050445557, -4.1347856521606445, -3.386141777038574, -2.637498378753662, -1.88885498046875, -1.1402111053466797, -0.3915677070617676, 0.35707569122314453, 1.1057192087173462, 1.8543627262115479, 2.603006362915039, 3.351649761199951, 4.100293159484863, 4.848937034606934, 5.597580432891846, 6.346223831176758, 7.09486722946167, 7.843510627746582, 8.592154502868652, 9.340797424316406, 10.089441299438477, 10.838085174560547, 11.586729049682617, 12.335371971130371, 13.084015846252441, 13.832658767700195, 14.581302642822266, 15.329946517944336, 16.078590393066406, 16.827232360839844, 17.575876235961914, 18.324520111083984]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 10.0, 14.0, 27.0, 28.0, 79.0, 94.0, 196.0, 332.0, 592.0, 1227.0, 2710.0, 7500.0, 27449.0, 171932.0, 638496.0, 159553.0, 25979.0, 7050.0, 2723.0, 1142.0, 574.0, 334.0, 205.0, 125.0, 62.0, 34.0, 27.0, 18.0, 17.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.02423095703125, -3.8922119140625, -3.76019287109375, -3.628173828125, -3.49615478515625, -3.3641357421875, -3.23211669921875, -3.10009765625, -2.96807861328125, -2.8360595703125, -2.70404052734375, -2.572021484375, -2.44000244140625, -2.3079833984375, -2.17596435546875, -2.0439453125, -1.91192626953125, -1.7799072265625, -1.64788818359375, -1.515869140625, -1.38385009765625, -1.2518310546875, -1.11981201171875, -0.98779296875, -0.85577392578125, -0.7237548828125, -0.59173583984375, -0.459716796875, -0.32769775390625, -0.1956787109375, -0.06365966796875, 0.068359375, 0.20037841796875, 0.3323974609375, 0.46441650390625, 0.596435546875, 0.72845458984375, 0.8604736328125, 0.99249267578125, 1.12451171875, 1.25653076171875, 1.3885498046875, 1.52056884765625, 1.652587890625, 1.78460693359375, 1.9166259765625, 2.04864501953125, 2.1806640625, 2.31268310546875, 2.4447021484375, 2.57672119140625, 2.708740234375, 2.84075927734375, 2.9727783203125, 3.10479736328125, 3.23681640625, 3.36883544921875, 3.5008544921875, 3.63287353515625, 3.764892578125, 3.89691162109375, 4.0289306640625, 4.16094970703125, 4.29296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 15.0, 8.0, 10.0, 12.0, 17.0, 21.0, 18.0, 22.0, 28.0, 34.0, 41.0, 46.0, 58.0, 57.0, 57.0, 50.0, 58.0, 41.0, 52.0, 54.0, 56.0, 42.0, 30.0, 33.0, 28.0, 16.0, 24.0, 20.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.158233642578125, -2.08599853515625, -2.013763427734375, -1.9415283203125, -1.869293212890625, -1.79705810546875, -1.724822998046875, -1.652587890625, -1.580352783203125, -1.50811767578125, -1.435882568359375, -1.3636474609375, -1.291412353515625, -1.21917724609375, -1.146942138671875, -1.07470703125, -1.002471923828125, -0.93023681640625, -0.858001708984375, -0.7857666015625, -0.713531494140625, -0.64129638671875, -0.569061279296875, -0.496826171875, -0.424591064453125, -0.35235595703125, -0.280120849609375, -0.2078857421875, -0.135650634765625, -0.06341552734375, 0.008819580078125, 0.0810546875, 0.153289794921875, 0.22552490234375, 0.297760009765625, 0.3699951171875, 0.442230224609375, 0.51446533203125, 0.586700439453125, 0.658935546875, 0.731170654296875, 0.80340576171875, 0.875640869140625, 0.9478759765625, 1.020111083984375, 1.09234619140625, 1.164581298828125, 1.23681640625, 1.309051513671875, 1.38128662109375, 1.453521728515625, 1.5257568359375, 1.597991943359375, 1.67022705078125, 1.742462158203125, 1.814697265625, 1.886932373046875, 1.95916748046875, 2.031402587890625, 2.1036376953125, 2.175872802734375, 2.24810791015625, 2.320343017578125, 2.392578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 4.0, 10.0, 10.0, 13.0, 19.0, 30.0, 36.0, 56.0, 79.0, 83.0, 140.0, 213.0, 334.0, 656.0, 1234.0, 2831.0, 8809.0, 43177.0, 517772.0, 417327.0, 41492.0, 8501.0, 2835.0, 1239.0, 601.0, 348.0, 207.0, 152.0, 93.0, 61.0, 50.0, 53.0, 19.0, 14.0, 13.0, 12.0, 8.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.046875, -4.906646728515625, -4.76641845703125, -4.626190185546875, -4.4859619140625, -4.345733642578125, -4.20550537109375, -4.065277099609375, -3.925048828125, -3.784820556640625, -3.64459228515625, -3.504364013671875, -3.3641357421875, -3.223907470703125, -3.08367919921875, -2.943450927734375, -2.80322265625, -2.662994384765625, -2.52276611328125, -2.382537841796875, -2.2423095703125, -2.102081298828125, -1.96185302734375, -1.821624755859375, -1.681396484375, -1.541168212890625, -1.40093994140625, -1.260711669921875, -1.1204833984375, -0.980255126953125, -0.84002685546875, -0.699798583984375, -0.5595703125, -0.419342041015625, -0.27911376953125, -0.138885498046875, 0.0013427734375, 0.141571044921875, 0.28179931640625, 0.422027587890625, 0.562255859375, 0.702484130859375, 0.84271240234375, 0.982940673828125, 1.1231689453125, 1.263397216796875, 1.40362548828125, 1.543853759765625, 1.68408203125, 1.824310302734375, 1.96453857421875, 2.104766845703125, 2.2449951171875, 2.385223388671875, 2.52545166015625, 2.665679931640625, 2.805908203125, 2.946136474609375, 3.08636474609375, 3.226593017578125, 3.3668212890625, 3.507049560546875, 3.64727783203125, 3.787506103515625, 3.927734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 15.0, 14.0, 13.0, 25.0, 26.0, 34.0, 35.0, 52.0, 53.0, 44.0, 65.0, 64.0, 52.0, 64.0, 54.0, 76.0, 49.0, 53.0, 37.0, 27.0, 23.0, 26.0, 16.0, 11.0, 9.0, 7.0, 6.0, 6.0, 6.0, 0.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8187255859375, -8.535888671875, -8.2530517578125, -7.97021484375, -7.6873779296875, -7.404541015625, -7.1217041015625, -6.8388671875, -6.5560302734375, -6.273193359375, -5.9903564453125, -5.70751953125, -5.4246826171875, -5.141845703125, -4.8590087890625, -4.576171875, -4.2933349609375, -4.010498046875, -3.7276611328125, -3.44482421875, -3.1619873046875, -2.879150390625, -2.5963134765625, -2.3134765625, -2.0306396484375, -1.747802734375, -1.4649658203125, -1.18212890625, -0.8992919921875, -0.616455078125, -0.3336181640625, -0.05078125, 0.2320556640625, 0.514892578125, 0.7977294921875, 1.08056640625, 1.3634033203125, 1.646240234375, 1.9290771484375, 2.2119140625, 2.4947509765625, 2.777587890625, 3.0604248046875, 3.34326171875, 3.6260986328125, 3.908935546875, 4.1917724609375, 4.474609375, 4.7574462890625, 5.040283203125, 5.3231201171875, 5.60595703125, 5.8887939453125, 6.171630859375, 6.4544677734375, 6.7373046875, 7.0201416015625, 7.302978515625, 7.5858154296875, 7.86865234375, 8.1514892578125, 8.434326171875, 8.7171630859375, 9.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 17.0, 24.0, 22.0, 62.0, 82.0, 129.0, 199.0, 323.0, 570.0, 1057.0, 2388.0, 5594.0, 15649.0, 58456.0, 627585.0, 271626.0, 43318.0, 12552.0, 4659.0, 1962.0, 1023.0, 493.0, 280.0, 179.0, 87.0, 56.0, 42.0, 36.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7517242431640625, -1.696807861328125, -1.6418914794921875, -1.58697509765625, -1.5320587158203125, -1.477142333984375, -1.4222259521484375, -1.3673095703125, -1.3123931884765625, -1.257476806640625, -1.2025604248046875, -1.14764404296875, -1.0927276611328125, -1.037811279296875, -0.9828948974609375, -0.927978515625, -0.8730621337890625, -0.818145751953125, -0.7632293701171875, -0.70831298828125, -0.6533966064453125, -0.598480224609375, -0.5435638427734375, -0.4886474609375, -0.4337310791015625, -0.378814697265625, -0.3238983154296875, -0.26898193359375, -0.2140655517578125, -0.159149169921875, -0.1042327880859375, -0.04931640625, 0.0055999755859375, 0.060516357421875, 0.1154327392578125, 0.17034912109375, 0.2252655029296875, 0.280181884765625, 0.3350982666015625, 0.3900146484375, 0.4449310302734375, 0.499847412109375, 0.5547637939453125, 0.60968017578125, 0.6645965576171875, 0.719512939453125, 0.7744293212890625, 0.829345703125, 0.8842620849609375, 0.939178466796875, 0.9940948486328125, 1.04901123046875, 1.1039276123046875, 1.158843994140625, 1.2137603759765625, 1.2686767578125, 1.3235931396484375, 1.378509521484375, 1.4334259033203125, 1.48834228515625, 1.5432586669921875, 1.598175048828125, 1.6530914306640625, 1.7080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 4.0, 13.0, 20.0, 32.0, 46.0, 58.0, 80.0, 122.0, 150.0, 146.0, 74.0, 67.0, 47.0, 26.0, 23.0, 16.0, 10.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005035400390625, -0.0004870593547821045, -0.000470578670501709, -0.0004540979862213135, -0.00043761730194091797, -0.00042113661766052246, -0.00040465593338012695, -0.00038817524909973145, -0.00037169456481933594, -0.00035521388053894043, -0.0003387331962585449, -0.0003222525119781494, -0.0003057718276977539, -0.0002892911434173584, -0.0002728104591369629, -0.0002563297748565674, -0.00023984909057617188, -0.00022336840629577637, -0.00020688772201538086, -0.00019040703773498535, -0.00017392635345458984, -0.00015744566917419434, -0.00014096498489379883, -0.00012448430061340332, -0.00010800361633300781, -9.15229320526123e-05, -7.50422477722168e-05, -5.856156349182129e-05, -4.208087921142578e-05, -2.5600194931030273e-05, -9.119510650634766e-06, 7.361173629760742e-06, 2.384185791015625e-05, 4.032254219055176e-05, 5.6803226470947266e-05, 7.328391075134277e-05, 8.976459503173828e-05, 0.00010624527931213379, 0.0001227259635925293, 0.0001392066478729248, 0.0001556873321533203, 0.00017216801643371582, 0.00018864870071411133, 0.00020512938499450684, 0.00022161006927490234, 0.00023809075355529785, 0.00025457143783569336, 0.00027105212211608887, 0.0002875328063964844, 0.0003040134906768799, 0.0003204941749572754, 0.0003369748592376709, 0.0003534555435180664, 0.0003699362277984619, 0.0003864169120788574, 0.00040289759635925293, 0.00041937828063964844, 0.00043585896492004395, 0.00045233964920043945, 0.00046882033348083496, 0.00048530101776123047, 0.000501781702041626, 0.0005182623863220215, 0.000534743070602417, 0.0005512237548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 6.0, 8.0, 20.0, 29.0, 51.0, 64.0, 116.0, 279.0, 622.0, 1682.0, 5975.0, 35047.0, 746901.0, 231614.0, 19796.0, 4080.0, 1262.0, 472.0, 231.0, 87.0, 51.0, 52.0, 26.0, 14.0, 20.0, 10.0, 11.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.059234619140625, -2.96612548828125, -2.873016357421875, -2.7799072265625, -2.686798095703125, -2.59368896484375, -2.500579833984375, -2.407470703125, -2.314361572265625, -2.22125244140625, -2.128143310546875, -2.0350341796875, -1.941925048828125, -1.84881591796875, -1.755706787109375, -1.66259765625, -1.569488525390625, -1.47637939453125, -1.383270263671875, -1.2901611328125, -1.197052001953125, -1.10394287109375, -1.010833740234375, -0.917724609375, -0.824615478515625, -0.73150634765625, -0.638397216796875, -0.5452880859375, -0.452178955078125, -0.35906982421875, -0.265960693359375, -0.1728515625, -0.079742431640625, 0.01336669921875, 0.106475830078125, 0.1995849609375, 0.292694091796875, 0.38580322265625, 0.478912353515625, 0.572021484375, 0.665130615234375, 0.75823974609375, 0.851348876953125, 0.9444580078125, 1.037567138671875, 1.13067626953125, 1.223785400390625, 1.31689453125, 1.410003662109375, 1.50311279296875, 1.596221923828125, 1.6893310546875, 1.782440185546875, 1.87554931640625, 1.968658447265625, 2.061767578125, 2.154876708984375, 2.24798583984375, 2.341094970703125, 2.4342041015625, 2.527313232421875, 2.62042236328125, 2.713531494140625, 2.806640625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 14.0, 21.0, 27.0, 45.0, 69.0, 114.0, 178.0, 173.0, 119.0, 69.0, 54.0, 30.0, 24.0, 15.0, 11.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-4.16015625, -4.0716552734375, -3.983154296875, -3.8946533203125, -3.80615234375, -3.7176513671875, -3.629150390625, -3.5406494140625, -3.4521484375, -3.3636474609375, -3.275146484375, -3.1866455078125, -3.09814453125, -3.0096435546875, -2.921142578125, -2.8326416015625, -2.744140625, -2.6556396484375, -2.567138671875, -2.4786376953125, -2.39013671875, -2.3016357421875, -2.213134765625, -2.1246337890625, -2.0361328125, -1.9476318359375, -1.859130859375, -1.7706298828125, -1.68212890625, -1.5936279296875, -1.505126953125, -1.4166259765625, -1.328125, -1.2396240234375, -1.151123046875, -1.0626220703125, -0.97412109375, -0.8856201171875, -0.797119140625, -0.7086181640625, -0.6201171875, -0.5316162109375, -0.443115234375, -0.3546142578125, -0.26611328125, -0.1776123046875, -0.089111328125, -0.0006103515625, 0.087890625, 0.1763916015625, 0.264892578125, 0.3533935546875, 0.44189453125, 0.5303955078125, 0.618896484375, 0.7073974609375, 0.7958984375, 0.8843994140625, 0.972900390625, 1.0614013671875, 1.14990234375, 1.2384033203125, 1.326904296875, 1.4154052734375, 1.50390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 7.0, 15.0, 26.0, 63.0, 175.0, 430.0, 187.0, 64.0, 16.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.28250122070312, -78.20263671875, -76.12277221679688, -74.04290771484375, -71.96304321289062, -69.8831787109375, -67.80331420898438, -65.72344970703125, -63.64358139038086, -61.563716888427734, -59.48385238647461, -57.403987884521484, -55.324119567871094, -53.24425506591797, -51.164390563964844, -49.08452606201172, -47.004661560058594, -44.92479705810547, -42.844932556152344, -40.76506805419922, -38.685203552246094, -36.60533905029297, -34.52547073364258, -32.44560623168945, -30.365741729736328, -28.285877227783203, -26.206012725830078, -24.12614631652832, -22.046281814575195, -19.96641731262207, -17.886550903320312, -15.806686401367188, -13.726829528808594, -11.646965026855469, -9.567099571228027, -7.487234592437744, -5.407369613647461, -3.327505111694336, -1.2476396560668945, 0.8322257995605469, 2.912090301513672, 4.991955280303955, 7.071820259094238, 9.15168571472168, 11.231550216674805, 13.31141471862793, 15.391280174255371, 17.471145629882812, 19.551010131835938, 21.630874633789062, 23.710739135742188, 25.790605545043945, 27.87047004699707, 29.950334548950195, 32.03020095825195, 34.11006546020508, 36.1899299621582, 38.26979446411133, 40.34965896606445, 42.42952346801758, 44.50939178466797, 46.589256286621094, 48.66912078857422, 50.748985290527344, 52.82884979248047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 14.0, 14.0, 10.0, 30.0, 30.0, 19.0, 24.0, 32.0, 40.0, 53.0, 62.0, 82.0, 98.0, 84.0, 57.0, 54.0, 41.0, 35.0, 30.0, 30.0, 19.0, 18.0, 17.0, 18.0, 11.0, 16.0, 7.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.24529266357422, -29.26091194152832, -28.276531219482422, -27.29214859008789, -26.307767868041992, -25.323387145996094, -24.339006423950195, -23.354625701904297, -22.370243072509766, -21.385862350463867, -20.40148162841797, -19.417098999023438, -18.43271827697754, -17.44833755493164, -16.463956832885742, -15.479575157165527, -14.495194435119629, -13.51081371307373, -12.526432037353516, -11.542051315307617, -10.557669639587402, -9.573288917541504, -8.588907241821289, -7.604526519775391, -6.620145320892334, -5.635764122009277, -4.651382923126221, -3.667001962661743, -2.6826207637786865, -1.698239803314209, -0.7138586044311523, 0.2705225944519043, 1.254903793334961, 2.2392849922180176, 3.223666191101074, 4.208046913146973, 5.1924285888671875, 6.176809310913086, 7.161190509796143, 8.1455717086792, 9.129953384399414, 10.114334106445312, 11.098715782165527, 12.083096504211426, 13.06747817993164, 14.051858901977539, 15.036239624023438, 16.02062225341797, 17.005001068115234, 17.989381790161133, 18.97376251220703, 19.958145141601562, 20.94252586364746, 21.92690658569336, 22.911287307739258, 23.895668029785156, 24.880050659179688, 25.864431381225586, 26.848812103271484, 27.833194732666016, 28.817575454711914, 29.801956176757812, 30.78633689880371, 31.77071762084961, 32.75510025024414]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 5.0, 13.0, 14.0, 15.0, 29.0, 49.0, 75.0, 136.0, 217.0, 367.0, 789.0, 1715.0, 4001.0, 11012.0, 38705.0, 256075.0, 2713143.0, 1038481.0, 95883.0, 21038.0, 6984.0, 2829.0, 1307.0, 608.0, 312.0, 184.0, 93.0, 67.0, 46.0, 24.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.03515625, -3.915679931640625, -3.79620361328125, -3.676727294921875, -3.5572509765625, -3.437774658203125, -3.31829833984375, -3.198822021484375, -3.079345703125, -2.959869384765625, -2.84039306640625, -2.720916748046875, -2.6014404296875, -2.481964111328125, -2.36248779296875, -2.243011474609375, -2.12353515625, -2.004058837890625, -1.88458251953125, -1.765106201171875, -1.6456298828125, -1.526153564453125, -1.40667724609375, -1.287200927734375, -1.167724609375, -1.048248291015625, -0.92877197265625, -0.809295654296875, -0.6898193359375, -0.570343017578125, -0.45086669921875, -0.331390380859375, -0.2119140625, -0.092437744140625, 0.02703857421875, 0.146514892578125, 0.2659912109375, 0.385467529296875, 0.50494384765625, 0.624420166015625, 0.743896484375, 0.863372802734375, 0.98284912109375, 1.102325439453125, 1.2218017578125, 1.341278076171875, 1.46075439453125, 1.580230712890625, 1.69970703125, 1.819183349609375, 1.93865966796875, 2.058135986328125, 2.1776123046875, 2.297088623046875, 2.41656494140625, 2.536041259765625, 2.655517578125, 2.774993896484375, 2.89447021484375, 3.013946533203125, 3.1334228515625, 3.252899169921875, 3.37237548828125, 3.491851806640625, 3.611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 12.0, 11.0, 13.0, 19.0, 16.0, 31.0, 23.0, 32.0, 40.0, 38.0, 44.0, 52.0, 55.0, 52.0, 64.0, 69.0, 63.0, 48.0, 44.0, 48.0, 50.0, 29.0, 27.0, 24.0, 13.0, 19.0, 15.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.939453125, -2.8662872314453125, -2.793121337890625, -2.7199554443359375, -2.64678955078125, -2.5736236572265625, -2.500457763671875, -2.4272918701171875, -2.3541259765625, -2.2809600830078125, -2.207794189453125, -2.1346282958984375, -2.06146240234375, -1.9882965087890625, -1.915130615234375, -1.8419647216796875, -1.768798828125, -1.6956329345703125, -1.622467041015625, -1.5493011474609375, -1.47613525390625, -1.4029693603515625, -1.329803466796875, -1.2566375732421875, -1.1834716796875, -1.1103057861328125, -1.037139892578125, -0.9639739990234375, -0.89080810546875, -0.8176422119140625, -0.744476318359375, -0.6713104248046875, -0.59814453125, -0.5249786376953125, -0.451812744140625, -0.3786468505859375, -0.30548095703125, -0.2323150634765625, -0.159149169921875, -0.0859832763671875, -0.0128173828125, 0.0603485107421875, 0.133514404296875, 0.2066802978515625, 0.27984619140625, 0.3530120849609375, 0.426177978515625, 0.4993438720703125, 0.572509765625, 0.6456756591796875, 0.718841552734375, 0.7920074462890625, 0.86517333984375, 0.9383392333984375, 1.011505126953125, 1.0846710205078125, 1.1578369140625, 1.2310028076171875, 1.304168701171875, 1.3773345947265625, 1.45050048828125, 1.5236663818359375, 1.596832275390625, 1.6699981689453125, 1.7431640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 19.0, 25.0, 27.0, 43.0, 59.0, 128.0, 246.0, 587.0, 1479.0, 4560.0, 18414.0, 121670.0, 3057645.0, 915305.0, 57896.0, 11114.0, 3040.0, 1072.0, 430.0, 198.0, 114.0, 61.0, 37.0, 21.0, 26.0, 13.0, 13.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.1484375, -5.97186279296875, -5.7952880859375, -5.61871337890625, -5.442138671875, -5.26556396484375, -5.0889892578125, -4.91241455078125, -4.73583984375, -4.55926513671875, -4.3826904296875, -4.20611572265625, -4.029541015625, -3.85296630859375, -3.6763916015625, -3.49981689453125, -3.3232421875, -3.14666748046875, -2.9700927734375, -2.79351806640625, -2.616943359375, -2.44036865234375, -2.2637939453125, -2.08721923828125, -1.91064453125, -1.73406982421875, -1.5574951171875, -1.38092041015625, -1.204345703125, -1.02777099609375, -0.8511962890625, -0.67462158203125, -0.498046875, -0.32147216796875, -0.1448974609375, 0.03167724609375, 0.208251953125, 0.38482666015625, 0.5614013671875, 0.73797607421875, 0.91455078125, 1.09112548828125, 1.2677001953125, 1.44427490234375, 1.620849609375, 1.79742431640625, 1.9739990234375, 2.15057373046875, 2.3271484375, 2.50372314453125, 2.6802978515625, 2.85687255859375, 3.033447265625, 3.21002197265625, 3.3865966796875, 3.56317138671875, 3.73974609375, 3.91632080078125, 4.0928955078125, 4.26947021484375, 4.446044921875, 4.62261962890625, 4.7991943359375, 4.97576904296875, 5.15234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 12.0, 9.0, 13.0, 23.0, 42.0, 51.0, 60.0, 86.0, 129.0, 222.0, 376.0, 597.0, 772.0, 580.0, 340.0, 226.0, 128.0, 97.0, 68.0, 49.0, 37.0, 33.0, 27.0, 15.0, 11.0, 6.0, 13.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.9659423828125, -3.826416015625, -3.6868896484375, -3.54736328125, -3.4078369140625, -3.268310546875, -3.1287841796875, -2.9892578125, -2.8497314453125, -2.710205078125, -2.5706787109375, -2.43115234375, -2.2916259765625, -2.152099609375, -2.0125732421875, -1.873046875, -1.7335205078125, -1.593994140625, -1.4544677734375, -1.31494140625, -1.1754150390625, -1.035888671875, -0.8963623046875, -0.7568359375, -0.6173095703125, -0.477783203125, -0.3382568359375, -0.19873046875, -0.0592041015625, 0.080322265625, 0.2198486328125, 0.359375, 0.4989013671875, 0.638427734375, 0.7779541015625, 0.91748046875, 1.0570068359375, 1.196533203125, 1.3360595703125, 1.4755859375, 1.6151123046875, 1.754638671875, 1.8941650390625, 2.03369140625, 2.1732177734375, 2.312744140625, 2.4522705078125, 2.591796875, 2.7313232421875, 2.870849609375, 3.0103759765625, 3.14990234375, 3.2894287109375, 3.428955078125, 3.5684814453125, 3.7080078125, 3.8475341796875, 3.987060546875, 4.1265869140625, 4.26611328125, 4.4056396484375, 4.545166015625, 4.6846923828125, 4.82421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 7.0, 25.0, 63.0, 162.0, 278.0, 252.0, 128.0, 54.0, 13.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.43502426147461, -17.206241607666016, -14.977458953857422, -12.748676300048828, -10.519893646240234, -8.29111099243164, -6.062328338623047, -3.833545684814453, -1.6047630310058594, 0.6240196228027344, 2.852802276611328, 5.081584930419922, 7.310367584228516, 9.53915023803711, 11.767932891845703, 13.996715545654297, 16.22549819946289, 18.454280853271484, 20.683063507080078, 22.911846160888672, 25.140628814697266, 27.36941146850586, 29.598194122314453, 31.826976776123047, 34.05575942993164, 36.284542083740234, 38.51332473754883, 40.74210739135742, 42.970890045166016, 45.19967269897461, 47.4284553527832, 49.6572380065918, 51.886016845703125, 54.11479949951172, 56.34358215332031, 58.572364807128906, 60.8011474609375, 63.029930114746094, 65.25871276855469, 67.48749542236328, 69.71627807617188, 71.94506072998047, 74.17384338378906, 76.40262603759766, 78.63140869140625, 80.86019134521484, 83.08897399902344, 85.31775665283203, 87.54653930664062, 89.77532196044922, 92.00410461425781, 94.2328872680664, 96.461669921875, 98.6904525756836, 100.91923522949219, 103.14801788330078, 105.37680053710938, 107.60558319091797, 109.83436584472656, 112.06314849853516, 114.29193115234375, 116.52071380615234, 118.74949645996094, 120.97827911376953, 123.20706176757812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 6.0, 10.0, 14.0, 10.0, 12.0, 19.0, 21.0, 14.0, 25.0, 27.0, 23.0, 23.0, 33.0, 37.0, 48.0, 39.0, 41.0, 39.0, 44.0, 43.0, 39.0, 42.0, 52.0, 45.0, 38.0, 29.0, 31.0, 31.0, 27.0, 14.0, 16.0, 14.0, 13.0, 9.0, 10.0, 11.0, 15.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.35088539123535, -17.808513641357422, -17.266143798828125, -16.723772048950195, -16.181400299072266, -15.639029502868652, -15.096658706665039, -14.55428695678711, -14.011916160583496, -13.469545364379883, -12.927173614501953, -12.38480281829834, -11.842432022094727, -11.300060272216797, -10.757689476013184, -10.21531867980957, -9.67294692993164, -9.130576133728027, -8.588204383850098, -8.045833587646484, -7.503462314605713, -6.961091041564941, -6.418720245361328, -5.876348972320557, -5.333977699279785, -4.791606426239014, -4.249235153198242, -3.706864356994629, -3.1644930839538574, -2.622121810913086, -2.0797507762908936, -1.5373797416687012, -0.9950065612792969, -0.45263540744781494, 0.08973574638366699, 0.6321069002151489, 1.1744780540466309, 1.7168493270874023, 2.2592203617095947, 2.801591396331787, 3.3439626693725586, 3.88633394241333, 4.428705215454102, 4.971076011657715, 5.513447284698486, 6.055818557739258, 6.598189353942871, 7.140560626983643, 7.682931900024414, 8.225302696228027, 8.767674446105957, 9.31004524230957, 9.8524169921875, 10.394787788391113, 10.937158584594727, 11.479530334472656, 12.02190113067627, 12.564271926879883, 13.106643676757812, 13.649014472961426, 14.191385269165039, 14.733757019042969, 15.276127815246582, 15.818498611450195, 16.360870361328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 13.0, 15.0, 34.0, 35.0, 88.0, 121.0, 172.0, 292.0, 459.0, 934.0, 1989.0, 4221.0, 10510.0, 28967.0, 96860.0, 385302.0, 376936.0, 94628.0, 28222.0, 10400.0, 4260.0, 1910.0, 952.0, 490.0, 269.0, 171.0, 94.0, 75.0, 56.0, 23.0, 24.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.33447265625, -3.2333984375, -3.13232421875, -3.03125, -2.93017578125, -2.8291015625, -2.72802734375, -2.626953125, -2.52587890625, -2.4248046875, -2.32373046875, -2.22265625, -2.12158203125, -2.0205078125, -1.91943359375, -1.818359375, -1.71728515625, -1.6162109375, -1.51513671875, -1.4140625, -1.31298828125, -1.2119140625, -1.11083984375, -1.009765625, -0.90869140625, -0.8076171875, -0.70654296875, -0.60546875, -0.50439453125, -0.4033203125, -0.30224609375, -0.201171875, -0.10009765625, 0.0009765625, 0.10205078125, 0.203125, 0.30419921875, 0.4052734375, 0.50634765625, 0.607421875, 0.70849609375, 0.8095703125, 0.91064453125, 1.01171875, 1.11279296875, 1.2138671875, 1.31494140625, 1.416015625, 1.51708984375, 1.6181640625, 1.71923828125, 1.8203125, 1.92138671875, 2.0224609375, 2.12353515625, 2.224609375, 2.32568359375, 2.4267578125, 2.52783203125, 2.62890625, 2.72998046875, 2.8310546875, 2.93212890625, 3.033203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 10.0, 10.0, 9.0, 14.0, 12.0, 16.0, 29.0, 25.0, 31.0, 29.0, 24.0, 34.0, 27.0, 31.0, 37.0, 42.0, 36.0, 55.0, 47.0, 46.0, 51.0, 32.0, 47.0, 35.0, 34.0, 31.0, 28.0, 34.0, 21.0, 19.0, 13.0, 17.0, 6.0, 9.0, 10.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.0382843017578125, -1.976959228515625, -1.9156341552734375, -1.85430908203125, -1.7929840087890625, -1.731658935546875, -1.6703338623046875, -1.6090087890625, -1.5476837158203125, -1.486358642578125, -1.4250335693359375, -1.36370849609375, -1.3023834228515625, -1.241058349609375, -1.1797332763671875, -1.118408203125, -1.0570831298828125, -0.995758056640625, -0.9344329833984375, -0.87310791015625, -0.8117828369140625, -0.750457763671875, -0.6891326904296875, -0.6278076171875, -0.5664825439453125, -0.505157470703125, -0.4438323974609375, -0.38250732421875, -0.3211822509765625, -0.259857177734375, -0.1985321044921875, -0.13720703125, -0.0758819580078125, -0.014556884765625, 0.0467681884765625, 0.10809326171875, 0.1694183349609375, 0.230743408203125, 0.2920684814453125, 0.3533935546875, 0.4147186279296875, 0.476043701171875, 0.5373687744140625, 0.59869384765625, 0.6600189208984375, 0.721343994140625, 0.7826690673828125, 0.843994140625, 0.9053192138671875, 0.966644287109375, 1.0279693603515625, 1.08929443359375, 1.1506195068359375, 1.211944580078125, 1.2732696533203125, 1.3345947265625, 1.3959197998046875, 1.457244873046875, 1.5185699462890625, 1.57989501953125, 1.6412200927734375, 1.702545166015625, 1.7638702392578125, 1.8251953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 15.0, 15.0, 16.0, 20.0, 34.0, 37.0, 43.0, 63.0, 94.0, 155.0, 254.0, 386.0, 634.0, 1092.0, 2358.0, 5917.0, 20900.0, 129893.0, 771564.0, 89035.0, 16307.0, 5061.0, 2083.0, 934.0, 518.0, 360.0, 253.0, 134.0, 111.0, 65.0, 57.0, 41.0, 22.0, 24.0, 11.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.1494140625, -3.998046875, -3.8466796875, -3.6953125, -3.5439453125, -3.392578125, -3.2412109375, -3.08984375, -2.9384765625, -2.787109375, -2.6357421875, -2.484375, -2.3330078125, -2.181640625, -2.0302734375, -1.87890625, -1.7275390625, -1.576171875, -1.4248046875, -1.2734375, -1.1220703125, -0.970703125, -0.8193359375, -0.66796875, -0.5166015625, -0.365234375, -0.2138671875, -0.0625, 0.0888671875, 0.240234375, 0.3916015625, 0.54296875, 0.6943359375, 0.845703125, 0.9970703125, 1.1484375, 1.2998046875, 1.451171875, 1.6025390625, 1.75390625, 1.9052734375, 2.056640625, 2.2080078125, 2.359375, 2.5107421875, 2.662109375, 2.8134765625, 2.96484375, 3.1162109375, 3.267578125, 3.4189453125, 3.5703125, 3.7216796875, 3.873046875, 4.0244140625, 4.17578125, 4.3271484375, 4.478515625, 4.6298828125, 4.78125, 4.9326171875, 5.083984375, 5.2353515625, 5.38671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 6.0, 6.0, 6.0, 9.0, 8.0, 25.0, 15.0, 21.0, 35.0, 33.0, 44.0, 63.0, 55.0, 56.0, 74.0, 68.0, 67.0, 68.0, 64.0, 57.0, 50.0, 31.0, 27.0, 21.0, 16.0, 24.0, 14.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.0960693359375, -8.778076171875, -8.4600830078125, -8.14208984375, -7.8240966796875, -7.506103515625, -7.1881103515625, -6.8701171875, -6.5521240234375, -6.234130859375, -5.9161376953125, -5.59814453125, -5.2801513671875, -4.962158203125, -4.6441650390625, -4.326171875, -4.0081787109375, -3.690185546875, -3.3721923828125, -3.05419921875, -2.7362060546875, -2.418212890625, -2.1002197265625, -1.7822265625, -1.4642333984375, -1.146240234375, -0.8282470703125, -0.51025390625, -0.1922607421875, 0.125732421875, 0.4437255859375, 0.76171875, 1.0797119140625, 1.397705078125, 1.7156982421875, 2.03369140625, 2.3516845703125, 2.669677734375, 2.9876708984375, 3.3056640625, 3.6236572265625, 3.941650390625, 4.2596435546875, 4.57763671875, 4.8956298828125, 5.213623046875, 5.5316162109375, 5.849609375, 6.1676025390625, 6.485595703125, 6.8035888671875, 7.12158203125, 7.4395751953125, 7.757568359375, 8.0755615234375, 8.3935546875, 8.7115478515625, 9.029541015625, 9.3475341796875, 9.66552734375, 9.9835205078125, 10.301513671875, 10.6195068359375, 10.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 12.0, 13.0, 18.0, 26.0, 60.0, 91.0, 122.0, 184.0, 285.0, 470.0, 814.0, 1447.0, 3127.0, 7910.0, 32942.0, 332038.0, 617047.0, 36446.0, 8571.0, 3200.0, 1511.0, 867.0, 497.0, 259.0, 183.0, 145.0, 83.0, 50.0, 45.0, 27.0, 18.0, 6.0, 11.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.7038726806640625, -1.648956298828125, -1.5940399169921875, -1.53912353515625, -1.4842071533203125, -1.429290771484375, -1.3743743896484375, -1.3194580078125, -1.2645416259765625, -1.209625244140625, -1.1547088623046875, -1.09979248046875, -1.0448760986328125, -0.989959716796875, -0.9350433349609375, -0.880126953125, -0.8252105712890625, -0.770294189453125, -0.7153778076171875, -0.66046142578125, -0.6055450439453125, -0.550628662109375, -0.4957122802734375, -0.4407958984375, -0.3858795166015625, -0.330963134765625, -0.2760467529296875, -0.22113037109375, -0.1662139892578125, -0.111297607421875, -0.0563812255859375, -0.00146484375, 0.0534515380859375, 0.108367919921875, 0.1632843017578125, 0.21820068359375, 0.2731170654296875, 0.328033447265625, 0.3829498291015625, 0.4378662109375, 0.4927825927734375, 0.547698974609375, 0.6026153564453125, 0.65753173828125, 0.7124481201171875, 0.767364501953125, 0.8222808837890625, 0.877197265625, 0.9321136474609375, 0.987030029296875, 1.0419464111328125, 1.09686279296875, 1.1517791748046875, 1.206695556640625, 1.2616119384765625, 1.3165283203125, 1.3714447021484375, 1.426361083984375, 1.4812774658203125, 1.53619384765625, 1.5911102294921875, 1.646026611328125, 1.7009429931640625, 1.755859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 9.0, 14.0, 17.0, 28.0, 46.0, 101.0, 153.0, 270.0, 168.0, 74.0, 44.0, 19.0, 16.0, 9.0, 6.0, 3.0, 8.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006971359252929688, -0.0006707906723022461, -0.0006444454193115234, -0.0006181001663208008, -0.0005917549133300781, -0.0005654096603393555, -0.0005390644073486328, -0.0005127191543579102, -0.0004863739013671875, -0.00046002864837646484, -0.0004336833953857422, -0.00040733814239501953, -0.0003809928894042969, -0.0003546476364135742, -0.00032830238342285156, -0.0003019571304321289, -0.00027561187744140625, -0.0002492666244506836, -0.00022292137145996094, -0.00019657611846923828, -0.00017023086547851562, -0.00014388561248779297, -0.00011754035949707031, -9.119510650634766e-05, -6.4849853515625e-05, -3.8504600524902344e-05, -1.2159347534179688e-05, 1.4185905456542969e-05, 4.0531158447265625e-05, 6.687641143798828e-05, 9.322166442871094e-05, 0.0001195669174194336, 0.00014591217041015625, 0.0001722574234008789, 0.00019860267639160156, 0.00022494792938232422, 0.0002512931823730469, 0.00027763843536376953, 0.0003039836883544922, 0.00033032894134521484, 0.0003566741943359375, 0.00038301944732666016, 0.0004093647003173828, 0.00043570995330810547, 0.0004620552062988281, 0.0004884004592895508, 0.0005147457122802734, 0.0005410909652709961, 0.0005674362182617188, 0.0005937814712524414, 0.0006201267242431641, 0.0006464719772338867, 0.0006728172302246094, 0.000699162483215332, 0.0007255077362060547, 0.0007518529891967773, 0.0007781982421875, 0.0008045434951782227, 0.0008308887481689453, 0.000857234001159668, 0.0008835792541503906, 0.0009099245071411133, 0.0009362697601318359, 0.0009626150131225586, 0.0009889602661132812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 10.0, 6.0, 10.0, 16.0, 24.0, 41.0, 63.0, 102.0, 190.0, 306.0, 615.0, 1319.0, 3072.0, 8589.0, 31210.0, 187497.0, 718816.0, 71877.0, 15744.0, 5047.0, 2010.0, 897.0, 453.0, 278.0, 112.0, 84.0, 60.0, 39.0, 23.0, 20.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.357421875, -1.3076171875, -1.2578125, -1.2080078125, -1.158203125, -1.1083984375, -1.05859375, -1.0087890625, -0.958984375, -0.9091796875, -0.859375, -0.8095703125, -0.759765625, -0.7099609375, -0.66015625, -0.6103515625, -0.560546875, -0.5107421875, -0.4609375, -0.4111328125, -0.361328125, -0.3115234375, -0.26171875, -0.2119140625, -0.162109375, -0.1123046875, -0.0625, -0.0126953125, 0.037109375, 0.0869140625, 0.13671875, 0.1865234375, 0.236328125, 0.2861328125, 0.3359375, 0.3857421875, 0.435546875, 0.4853515625, 0.53515625, 0.5849609375, 0.634765625, 0.6845703125, 0.734375, 0.7841796875, 0.833984375, 0.8837890625, 0.93359375, 0.9833984375, 1.033203125, 1.0830078125, 1.1328125, 1.1826171875, 1.232421875, 1.2822265625, 1.33203125, 1.3818359375, 1.431640625, 1.4814453125, 1.53125, 1.5810546875, 1.630859375, 1.6806640625, 1.73046875, 1.7802734375, 1.830078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 19.0, 24.0, 15.0, 48.0, 39.0, 53.0, 88.0, 117.0, 117.0, 127.0, 78.0, 55.0, 41.0, 47.0, 28.0, 27.0, 11.0, 13.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.919921875, -1.865875244140625, -1.81182861328125, -1.757781982421875, -1.7037353515625, -1.649688720703125, -1.59564208984375, -1.541595458984375, -1.487548828125, -1.433502197265625, -1.37945556640625, -1.325408935546875, -1.2713623046875, -1.217315673828125, -1.16326904296875, -1.109222412109375, -1.05517578125, -1.001129150390625, -0.94708251953125, -0.893035888671875, -0.8389892578125, -0.784942626953125, -0.73089599609375, -0.676849365234375, -0.622802734375, -0.568756103515625, -0.51470947265625, -0.460662841796875, -0.4066162109375, -0.352569580078125, -0.29852294921875, -0.244476318359375, -0.1904296875, -0.136383056640625, -0.08233642578125, -0.028289794921875, 0.0257568359375, 0.079803466796875, 0.13385009765625, 0.187896728515625, 0.241943359375, 0.295989990234375, 0.35003662109375, 0.404083251953125, 0.4581298828125, 0.512176513671875, 0.56622314453125, 0.620269775390625, 0.67431640625, 0.728363037109375, 0.78240966796875, 0.836456298828125, 0.8905029296875, 0.944549560546875, 0.99859619140625, 1.052642822265625, 1.106689453125, 1.160736083984375, 1.21478271484375, 1.268829345703125, 1.3228759765625, 1.376922607421875, 1.43096923828125, 1.485015869140625, 1.5390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 8.0, 30.0, 126.0, 594.0, 177.0, 39.0, 12.0, 9.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.8374786376953, -169.2025604248047, -165.567626953125, -161.93270874023438, -158.2977752685547, -154.66285705566406, -151.02792358398438, -147.39300537109375, -143.75808715820312, -140.1231689453125, -136.4882354736328, -132.8533172607422, -129.2183837890625, -125.58346557617188, -121.94853973388672, -118.31361389160156, -114.67868041992188, -111.04375457763672, -107.40882873535156, -103.77391052246094, -100.13898468017578, -96.50405883789062, -92.86913299560547, -89.23420715332031, -85.59928894042969, -81.96436309814453, -78.32943725585938, -74.69451904296875, -71.0595932006836, -67.42466735839844, -63.78974151611328, -60.154815673828125, -56.51988983154297, -52.88496398925781, -49.25004196166992, -45.615116119384766, -41.98019027709961, -38.34526824951172, -34.71034240722656, -31.075416564941406, -27.440492630004883, -23.80556869506836, -20.170642852783203, -16.53571891784668, -12.90079402923584, -9.265869140625, -5.630945205688477, -1.9960193634033203, 1.6389045715332031, 5.273829460144043, 8.908754348754883, 12.543678283691406, 16.178604125976562, 19.813528060913086, 23.44845199584961, 27.083377838134766, 30.71830177307129, 34.35322570800781, 37.98815155029297, 41.623077392578125, 45.257999420166016, 48.89292526245117, 52.52784729003906, 56.16277313232422, 59.797698974609375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 13.0, 7.0, 20.0, 14.0, 21.0, 24.0, 33.0, 34.0, 27.0, 28.0, 35.0, 51.0, 85.0, 96.0, 104.0, 86.0, 35.0, 33.0, 34.0, 18.0, 32.0, 19.0, 13.0, 16.0, 9.0, 15.0, 13.0, 3.0, 18.0, 7.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31207275390625, -28.33296012878418, -27.35384750366211, -26.374736785888672, -25.3956241607666, -24.41651153564453, -23.43739891052246, -22.45828628540039, -21.479175567626953, -20.500062942504883, -19.520950317382812, -18.541839599609375, -17.562726974487305, -16.583614349365234, -15.604501724243164, -14.625389099121094, -13.646276473999023, -12.667163848876953, -11.6880521774292, -10.708939552307129, -9.729827880859375, -8.750715255737305, -7.771602630615234, -6.792490482330322, -5.81337833404541, -4.834266185760498, -3.855153799057007, -2.8760414123535156, -1.8969292640686035, -0.9178171157836914, 0.061295509338378906, 1.040407657623291, 2.019519805908203, 2.9986319541931152, 3.9777443408966064, 4.956856727600098, 5.93596887588501, 6.915081024169922, 7.894193649291992, 8.873306274414062, 9.852417945861816, 10.831530570983887, 11.81064224243164, 12.789754867553711, 13.768867492675781, 14.747979164123535, 15.727091789245605, 16.70620346069336, 17.68531608581543, 18.6644287109375, 19.64354133605957, 20.62265396118164, 21.601764678955078, 22.58087730407715, 23.55998992919922, 24.53910255432129, 25.51821517944336, 26.49732780456543, 27.4764404296875, 28.455551147460938, 29.434663772583008, 30.413776397705078, 31.39288902282715, 32.37200164794922, 33.351112365722656]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 6.0, 5.0, 14.0, 23.0, 19.0, 39.0, 71.0, 101.0, 175.0, 357.0, 616.0, 1278.0, 2654.0, 6734.0, 20048.0, 74674.0, 457703.0, 2455829.0, 986113.0, 138410.0, 31940.0, 10056.0, 3806.0, 1770.0, 842.0, 428.0, 219.0, 150.0, 85.0, 41.0, 29.0, 21.0, 9.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.19921875, -6.046844482421875, -5.89447021484375, -5.742095947265625, -5.5897216796875, -5.437347412109375, -5.28497314453125, -5.132598876953125, -4.980224609375, -4.827850341796875, -4.67547607421875, -4.523101806640625, -4.3707275390625, -4.218353271484375, -4.06597900390625, -3.913604736328125, -3.76123046875, -3.608856201171875, -3.45648193359375, -3.304107666015625, -3.1517333984375, -2.999359130859375, -2.84698486328125, -2.694610595703125, -2.542236328125, -2.389862060546875, -2.23748779296875, -2.085113525390625, -1.9327392578125, -1.780364990234375, -1.62799072265625, -1.475616455078125, -1.3232421875, -1.170867919921875, -1.01849365234375, -0.866119384765625, -0.7137451171875, -0.561370849609375, -0.40899658203125, -0.256622314453125, -0.104248046875, 0.048126220703125, 0.20050048828125, 0.352874755859375, 0.5052490234375, 0.657623291015625, 0.80999755859375, 0.962371826171875, 1.11474609375, 1.267120361328125, 1.41949462890625, 1.571868896484375, 1.7242431640625, 1.876617431640625, 2.02899169921875, 2.181365966796875, 2.333740234375, 2.486114501953125, 2.63848876953125, 2.790863037109375, 2.9432373046875, 3.095611572265625, 3.24798583984375, 3.400360107421875, 3.552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 11.0, 12.0, 12.0, 15.0, 26.0, 25.0, 15.0, 28.0, 26.0, 30.0, 29.0, 32.0, 43.0, 39.0, 38.0, 41.0, 43.0, 62.0, 42.0, 50.0, 50.0, 43.0, 43.0, 45.0, 27.0, 24.0, 25.0, 9.0, 20.0, 15.0, 15.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-2.37890625, -2.315155029296875, -2.25140380859375, -2.187652587890625, -2.1239013671875, -2.060150146484375, -1.99639892578125, -1.932647705078125, -1.868896484375, -1.805145263671875, -1.74139404296875, -1.677642822265625, -1.6138916015625, -1.550140380859375, -1.48638916015625, -1.422637939453125, -1.35888671875, -1.295135498046875, -1.23138427734375, -1.167633056640625, -1.1038818359375, -1.040130615234375, -0.97637939453125, -0.912628173828125, -0.848876953125, -0.785125732421875, -0.72137451171875, -0.657623291015625, -0.5938720703125, -0.530120849609375, -0.46636962890625, -0.402618408203125, -0.3388671875, -0.275115966796875, -0.21136474609375, -0.147613525390625, -0.0838623046875, -0.020111083984375, 0.04364013671875, 0.107391357421875, 0.171142578125, 0.234893798828125, 0.29864501953125, 0.362396240234375, 0.4261474609375, 0.489898681640625, 0.55364990234375, 0.617401123046875, 0.68115234375, 0.744903564453125, 0.80865478515625, 0.872406005859375, 0.9361572265625, 0.999908447265625, 1.06365966796875, 1.127410888671875, 1.191162109375, 1.254913330078125, 1.31866455078125, 1.382415771484375, 1.4461669921875, 1.509918212890625, 1.57366943359375, 1.637420654296875, 1.701171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 15.0, 28.0, 17.0, 35.0, 49.0, 88.0, 122.0, 171.0, 317.0, 704.0, 1785.0, 7203.0, 100886.0, 3958150.0, 113907.0, 7537.0, 1754.0, 648.0, 323.0, 195.0, 122.0, 64.0, 39.0, 34.0, 20.0, 14.0, 8.0, 7.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.9920654296875, -16.499755859375, -16.0074462890625, -15.51513671875, -15.0228271484375, -14.530517578125, -14.0382080078125, -13.5458984375, -13.0535888671875, -12.561279296875, -12.0689697265625, -11.57666015625, -11.0843505859375, -10.592041015625, -10.0997314453125, -9.607421875, -9.1151123046875, -8.622802734375, -8.1304931640625, -7.63818359375, -7.1458740234375, -6.653564453125, -6.1612548828125, -5.6689453125, -5.1766357421875, -4.684326171875, -4.1920166015625, -3.69970703125, -3.2073974609375, -2.715087890625, -2.2227783203125, -1.73046875, -1.2381591796875, -0.745849609375, -0.2535400390625, 0.23876953125, 0.7310791015625, 1.223388671875, 1.7156982421875, 2.2080078125, 2.7003173828125, 3.192626953125, 3.6849365234375, 4.17724609375, 4.6695556640625, 5.161865234375, 5.6541748046875, 6.146484375, 6.6387939453125, 7.131103515625, 7.6234130859375, 8.11572265625, 8.6080322265625, 9.100341796875, 9.5926513671875, 10.0849609375, 10.5772705078125, 11.069580078125, 11.5618896484375, 12.05419921875, 12.5465087890625, 13.038818359375, 13.5311279296875, 14.0234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 5.0, 9.0, 10.0, 21.0, 23.0, 34.0, 45.0, 75.0, 88.0, 151.0, 220.0, 343.0, 528.0, 774.0, 611.0, 388.0, 250.0, 140.0, 120.0, 67.0, 52.0, 40.0, 33.0, 15.0, 11.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.671875, -9.392333984375, -9.11279296875, -8.833251953125, -8.5537109375, -8.274169921875, -7.99462890625, -7.715087890625, -7.435546875, -7.156005859375, -6.87646484375, -6.596923828125, -6.3173828125, -6.037841796875, -5.75830078125, -5.478759765625, -5.19921875, -4.919677734375, -4.64013671875, -4.360595703125, -4.0810546875, -3.801513671875, -3.52197265625, -3.242431640625, -2.962890625, -2.683349609375, -2.40380859375, -2.124267578125, -1.8447265625, -1.565185546875, -1.28564453125, -1.006103515625, -0.7265625, -0.447021484375, -0.16748046875, 0.112060546875, 0.3916015625, 0.671142578125, 0.95068359375, 1.230224609375, 1.509765625, 1.789306640625, 2.06884765625, 2.348388671875, 2.6279296875, 2.907470703125, 3.18701171875, 3.466552734375, 3.74609375, 4.025634765625, 4.30517578125, 4.584716796875, 4.8642578125, 5.143798828125, 5.42333984375, 5.702880859375, 5.982421875, 6.261962890625, 6.54150390625, 6.821044921875, 7.1005859375, 7.380126953125, 7.65966796875, 7.939208984375, 8.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 16.0, 15.0, 41.0, 64.0, 104.0, 153.0, 179.0, 163.0, 95.0, 59.0, 29.0, 25.0, 18.0, 7.0, 2.0, 8.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.10050964355469, -82.2998046875, -79.49910736083984, -76.69840240478516, -73.897705078125, -71.09700012207031, -68.29629516601562, -65.49559020996094, -62.69489288330078, -59.89419174194336, -57.09349060058594, -54.29278564453125, -51.49208450317383, -48.691383361816406, -45.89067840576172, -43.0899772644043, -40.289276123046875, -37.48857498168945, -34.68787384033203, -31.887168884277344, -29.086467742919922, -26.2857666015625, -23.485063552856445, -20.68436050415039, -17.88365936279297, -15.08295726776123, -12.282255172729492, -9.481553077697754, -6.680850982666016, -3.8801488876342773, -1.079446792602539, 1.7212562561035156, 4.521949768066406, 7.3226518630981445, 10.123353958129883, 12.924056053161621, 15.72475814819336, 18.52545928955078, 21.326162338256836, 24.12686538696289, 26.927566528320312, 29.728267669677734, 32.528968811035156, 35.329673767089844, 38.130374908447266, 40.93107604980469, 43.731781005859375, 46.5324821472168, 49.33318328857422, 52.13388442993164, 54.93458557128906, 57.73529052734375, 60.53599166870117, 63.336692810058594, 66.13739776611328, 68.93809509277344, 71.73880004882812, 74.53950500488281, 77.34020233154297, 80.14090728759766, 82.94160461425781, 85.7423095703125, 88.54301452636719, 91.34371948242188, 94.14441680908203]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 13.0, 11.0, 17.0, 17.0, 21.0, 17.0, 28.0, 28.0, 26.0, 38.0, 35.0, 43.0, 42.0, 31.0, 63.0, 54.0, 77.0, 65.0, 48.0, 35.0, 42.0, 33.0, 34.0, 29.0, 31.0, 24.0, 21.0, 15.0, 10.0, 13.0, 11.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.560752868652344, -41.1661262512207, -39.77149963378906, -38.37687301635742, -36.98224639892578, -35.587623596191406, -34.1929931640625, -32.798370361328125, -31.403743743896484, -30.009117126464844, -28.614490509033203, -27.219863891601562, -25.825239181518555, -24.430612564086914, -23.035985946655273, -21.641361236572266, -20.246732711791992, -18.85210609436035, -17.45747947692871, -16.062854766845703, -14.668228149414062, -13.273601531982422, -11.878974914550781, -10.484349250793457, -9.089722633361816, -7.695096492767334, -6.300470352172852, -4.905843734741211, -3.5112175941467285, -2.116591453552246, -0.7219648361206055, 0.6726608276367188, 2.0672874450683594, 3.461913585662842, 4.856539726257324, 6.251166343688965, 7.645792484283447, 9.04041862487793, 10.43504524230957, 11.829670906066895, 13.224297523498535, 14.618924140930176, 16.0135498046875, 17.40817642211914, 18.80280303955078, 20.197429656982422, 21.592056274414062, 22.98668098449707, 24.38130760192871, 25.77593421936035, 27.170560836791992, 28.565185546875, 29.95981216430664, 31.35443878173828, 32.74906539916992, 34.14369201660156, 35.5383186340332, 36.932945251464844, 38.327571868896484, 39.722198486328125, 41.116825103759766, 42.511451721191406, 43.90607452392578, 45.30070114135742, 46.69532775878906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 12.0, 21.0, 23.0, 47.0, 80.0, 149.0, 296.0, 627.0, 1335.0, 3488.0, 11567.0, 52423.0, 503832.0, 411947.0, 46219.0, 10639.0, 3328.0, 1276.0, 603.0, 288.0, 162.0, 84.0, 39.0, 33.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.48828125, -6.3173828125, -6.146484375, -5.9755859375, -5.8046875, -5.6337890625, -5.462890625, -5.2919921875, -5.12109375, -4.9501953125, -4.779296875, -4.6083984375, -4.4375, -4.2666015625, -4.095703125, -3.9248046875, -3.75390625, -3.5830078125, -3.412109375, -3.2412109375, -3.0703125, -2.8994140625, -2.728515625, -2.5576171875, -2.38671875, -2.2158203125, -2.044921875, -1.8740234375, -1.703125, -1.5322265625, -1.361328125, -1.1904296875, -1.01953125, -0.8486328125, -0.677734375, -0.5068359375, -0.3359375, -0.1650390625, 0.005859375, 0.1767578125, 0.34765625, 0.5185546875, 0.689453125, 0.8603515625, 1.03125, 1.2021484375, 1.373046875, 1.5439453125, 1.71484375, 1.8857421875, 2.056640625, 2.2275390625, 2.3984375, 2.5693359375, 2.740234375, 2.9111328125, 3.08203125, 3.2529296875, 3.423828125, 3.5947265625, 3.765625, 3.9365234375, 4.107421875, 4.2783203125, 4.44921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 6.0, 10.0, 6.0, 9.0, 26.0, 19.0, 20.0, 36.0, 33.0, 37.0, 37.0, 65.0, 51.0, 58.0, 54.0, 53.0, 89.0, 58.0, 58.0, 50.0, 42.0, 37.0, 33.0, 31.0, 16.0, 21.0, 9.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.49609375, -3.37030029296875, -3.2445068359375, -3.11871337890625, -2.992919921875, -2.86712646484375, -2.7413330078125, -2.61553955078125, -2.48974609375, -2.36395263671875, -2.2381591796875, -2.11236572265625, -1.986572265625, -1.86077880859375, -1.7349853515625, -1.60919189453125, -1.4833984375, -1.35760498046875, -1.2318115234375, -1.10601806640625, -0.980224609375, -0.85443115234375, -0.7286376953125, -0.60284423828125, -0.47705078125, -0.35125732421875, -0.2254638671875, -0.09967041015625, 0.026123046875, 0.15191650390625, 0.2777099609375, 0.40350341796875, 0.529296875, 0.65509033203125, 0.7808837890625, 0.90667724609375, 1.032470703125, 1.15826416015625, 1.2840576171875, 1.40985107421875, 1.53564453125, 1.66143798828125, 1.7872314453125, 1.91302490234375, 2.038818359375, 2.16461181640625, 2.2904052734375, 2.41619873046875, 2.5419921875, 2.66778564453125, 2.7935791015625, 2.91937255859375, 3.045166015625, 3.17095947265625, 3.2967529296875, 3.42254638671875, 3.54833984375, 3.67413330078125, 3.7999267578125, 3.92572021484375, 4.051513671875, 4.17730712890625, 4.3031005859375, 4.42889404296875, 4.5546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 10.0, 7.0, 21.0, 26.0, 37.0, 40.0, 71.0, 113.0, 185.0, 304.0, 533.0, 1169.0, 3408.0, 12334.0, 75402.0, 879342.0, 59583.0, 10544.0, 3002.0, 1111.0, 509.0, 272.0, 159.0, 92.0, 79.0, 61.0, 31.0, 22.0, 23.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0078125, -4.8377685546875, -4.667724609375, -4.4976806640625, -4.32763671875, -4.1575927734375, -3.987548828125, -3.8175048828125, -3.6474609375, -3.4774169921875, -3.307373046875, -3.1373291015625, -2.96728515625, -2.7972412109375, -2.627197265625, -2.4571533203125, -2.287109375, -2.1170654296875, -1.947021484375, -1.7769775390625, -1.60693359375, -1.4368896484375, -1.266845703125, -1.0968017578125, -0.9267578125, -0.7567138671875, -0.586669921875, -0.4166259765625, -0.24658203125, -0.0765380859375, 0.093505859375, 0.2635498046875, 0.43359375, 0.6036376953125, 0.773681640625, 0.9437255859375, 1.11376953125, 1.2838134765625, 1.453857421875, 1.6239013671875, 1.7939453125, 1.9639892578125, 2.134033203125, 2.3040771484375, 2.47412109375, 2.6441650390625, 2.814208984375, 2.9842529296875, 3.154296875, 3.3243408203125, 3.494384765625, 3.6644287109375, 3.83447265625, 4.0045166015625, 4.174560546875, 4.3446044921875, 4.5146484375, 4.6846923828125, 4.854736328125, 5.0247802734375, 5.19482421875, 5.3648681640625, 5.534912109375, 5.7049560546875, 5.875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 8.0, 8.0, 13.0, 14.0, 16.0, 18.0, 26.0, 31.0, 31.0, 33.0, 35.0, 55.0, 67.0, 73.0, 70.0, 67.0, 62.0, 61.0, 51.0, 41.0, 24.0, 22.0, 27.0, 9.0, 19.0, 18.0, 9.0, 6.0, 9.0, 8.0, 10.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-12.546875, -12.176513671875, -11.80615234375, -11.435791015625, -11.0654296875, -10.695068359375, -10.32470703125, -9.954345703125, -9.583984375, -9.213623046875, -8.84326171875, -8.472900390625, -8.1025390625, -7.732177734375, -7.36181640625, -6.991455078125, -6.62109375, -6.250732421875, -5.88037109375, -5.510009765625, -5.1396484375, -4.769287109375, -4.39892578125, -4.028564453125, -3.658203125, -3.287841796875, -2.91748046875, -2.547119140625, -2.1767578125, -1.806396484375, -1.43603515625, -1.065673828125, -0.6953125, -0.324951171875, 0.04541015625, 0.415771484375, 0.7861328125, 1.156494140625, 1.52685546875, 1.897216796875, 2.267578125, 2.637939453125, 3.00830078125, 3.378662109375, 3.7490234375, 4.119384765625, 4.48974609375, 4.860107421875, 5.23046875, 5.600830078125, 5.97119140625, 6.341552734375, 6.7119140625, 7.082275390625, 7.45263671875, 7.822998046875, 8.193359375, 8.563720703125, 8.93408203125, 9.304443359375, 9.6748046875, 10.045166015625, 10.41552734375, 10.785888671875, 11.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 4.0, 11.0, 12.0, 14.0, 22.0, 32.0, 31.0, 56.0, 70.0, 132.0, 197.0, 270.0, 503.0, 791.0, 1644.0, 3586.0, 8334.0, 23900.0, 105355.0, 796972.0, 74370.0, 18964.0, 7000.0, 2948.0, 1421.0, 703.0, 431.0, 256.0, 153.0, 112.0, 70.0, 49.0, 36.0, 24.0, 24.0, 14.0, 11.0, 9.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.82568359375, -0.8023605346679688, -0.7790374755859375, -0.7557144165039062, -0.732391357421875, -0.7090682983398438, -0.6857452392578125, -0.6624221801757812, -0.63909912109375, -0.6157760620117188, -0.5924530029296875, -0.5691299438476562, -0.545806884765625, -0.5224838256835938, -0.4991607666015625, -0.47583770751953125, -0.4525146484375, -0.42919158935546875, -0.4058685302734375, -0.38254547119140625, -0.359222412109375, -0.33589935302734375, -0.3125762939453125, -0.28925323486328125, -0.26593017578125, -0.24260711669921875, -0.2192840576171875, -0.19596099853515625, -0.172637939453125, -0.14931488037109375, -0.1259918212890625, -0.10266876220703125, -0.079345703125, -0.05602264404296875, -0.0326995849609375, -0.00937652587890625, 0.013946533203125, 0.03726959228515625, 0.0605926513671875, 0.08391571044921875, 0.10723876953125, 0.13056182861328125, 0.1538848876953125, 0.17720794677734375, 0.200531005859375, 0.22385406494140625, 0.2471771240234375, 0.27050018310546875, 0.2938232421875, 0.31714630126953125, 0.3404693603515625, 0.36379241943359375, 0.387115478515625, 0.41043853759765625, 0.4337615966796875, 0.45708465576171875, 0.48040771484375, 0.5037307739257812, 0.5270538330078125, 0.5503768920898438, 0.573699951171875, 0.5970230102539062, 0.6203460693359375, 0.6436691284179688, 0.6669921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 7.0, 6.0, 14.0, 25.0, 15.0, 42.0, 41.0, 48.0, 88.0, 102.0, 114.0, 109.0, 108.0, 66.0, 38.0, 40.0, 27.0, 21.0, 14.0, 15.0, 5.0, 8.0, 5.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002675056457519531, -0.0002602245658636093, -0.0002529434859752655, -0.0002456624060869217, -0.00023838132619857788, -0.00023110024631023407, -0.00022381916642189026, -0.00021653808653354645, -0.00020925700664520264, -0.00020197592675685883, -0.00019469484686851501, -0.0001874137669801712, -0.0001801326870918274, -0.00017285160720348358, -0.00016557052731513977, -0.00015828944742679596, -0.00015100836753845215, -0.00014372728765010834, -0.00013644620776176453, -0.00012916512787342072, -0.0001218840479850769, -0.0001146029680967331, -0.00010732188820838928, -0.00010004080832004547, -9.275972843170166e-05, -8.547864854335785e-05, -7.819756865501404e-05, -7.091648876667023e-05, -6.363540887832642e-05, -5.6354328989982605e-05, -4.9073249101638794e-05, -4.179216921329498e-05, -3.451108932495117e-05, -2.723000943660736e-05, -1.994892954826355e-05, -1.2667849659919739e-05, -5.386769771575928e-06, 1.8943101167678833e-06, 9.175390005111694e-06, 1.6456469893455505e-05, 2.3737549781799316e-05, 3.101862967014313e-05, 3.829970955848694e-05, 4.558078944683075e-05, 5.286186933517456e-05, 6.014294922351837e-05, 6.742402911186218e-05, 7.4705109000206e-05, 8.19861888885498e-05, 8.926726877689362e-05, 9.654834866523743e-05, 0.00010382942855358124, 0.00011111050844192505, 0.00011839158833026886, 0.00012567266821861267, 0.00013295374810695648, 0.0001402348279953003, 0.0001475159078836441, 0.00015479698777198792, 0.00016207806766033173, 0.00016935914754867554, 0.00017664022743701935, 0.00018392130732536316, 0.00019120238721370697, 0.00019848346710205078]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 16.0, 7.0, 12.0, 18.0, 26.0, 46.0, 76.0, 85.0, 128.0, 212.0, 328.0, 585.0, 991.0, 2026.0, 4190.0, 10450.0, 30537.0, 161880.0, 761164.0, 49798.0, 14657.0, 5631.0, 2503.0, 1313.0, 744.0, 403.0, 270.0, 157.0, 95.0, 65.0, 48.0, 38.0, 17.0, 14.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.86279296875, -0.8310546875, -0.79931640625, -0.767578125, -0.73583984375, -0.7041015625, -0.67236328125, -0.640625, -0.60888671875, -0.5771484375, -0.54541015625, -0.513671875, -0.48193359375, -0.4501953125, -0.41845703125, -0.38671875, -0.35498046875, -0.3232421875, -0.29150390625, -0.259765625, -0.22802734375, -0.1962890625, -0.16455078125, -0.1328125, -0.10107421875, -0.0693359375, -0.03759765625, -0.005859375, 0.02587890625, 0.0576171875, 0.08935546875, 0.12109375, 0.15283203125, 0.1845703125, 0.21630859375, 0.248046875, 0.27978515625, 0.3115234375, 0.34326171875, 0.375, 0.40673828125, 0.4384765625, 0.47021484375, 0.501953125, 0.53369140625, 0.5654296875, 0.59716796875, 0.62890625, 0.66064453125, 0.6923828125, 0.72412109375, 0.755859375, 0.78759765625, 0.8193359375, 0.85107421875, 0.8828125, 0.91455078125, 0.9462890625, 0.97802734375, 1.009765625, 1.04150390625, 1.0732421875, 1.10498046875, 1.13671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 10.0, 8.0, 9.0, 9.0, 15.0, 10.0, 9.0, 13.0, 18.0, 17.0, 23.0, 34.0, 45.0, 51.0, 65.0, 82.0, 100.0, 97.0, 89.0, 62.0, 45.0, 32.0, 24.0, 21.0, 15.0, 10.0, 13.0, 14.0, 10.0, 8.0, 11.0, 7.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.961090087890625, -0.93096923828125, -0.900848388671875, -0.8707275390625, -0.840606689453125, -0.81048583984375, -0.780364990234375, -0.750244140625, -0.720123291015625, -0.69000244140625, -0.659881591796875, -0.6297607421875, -0.599639892578125, -0.56951904296875, -0.539398193359375, -0.50927734375, -0.479156494140625, -0.44903564453125, -0.418914794921875, -0.3887939453125, -0.358673095703125, -0.32855224609375, -0.298431396484375, -0.268310546875, -0.238189697265625, -0.20806884765625, -0.177947998046875, -0.1478271484375, -0.117706298828125, -0.08758544921875, -0.057464599609375, -0.02734375, 0.002777099609375, 0.03289794921875, 0.063018798828125, 0.0931396484375, 0.123260498046875, 0.15338134765625, 0.183502197265625, 0.213623046875, 0.243743896484375, 0.27386474609375, 0.303985595703125, 0.3341064453125, 0.364227294921875, 0.39434814453125, 0.424468994140625, 0.45458984375, 0.484710693359375, 0.51483154296875, 0.544952392578125, 0.5750732421875, 0.605194091796875, 0.63531494140625, 0.665435791015625, 0.695556640625, 0.725677490234375, 0.75579833984375, 0.785919189453125, 0.8160400390625, 0.846160888671875, 0.87628173828125, 0.906402587890625, 0.9365234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 10.0, 4.0, 3.0, 9.0, 13.0, 17.0, 26.0, 46.0, 89.0, 322.0, 225.0, 96.0, 46.0, 40.0, 18.0, 16.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.705677032470703, -15.398041725158691, -14.09040641784668, -12.782772064208984, -11.475136756896973, -10.167501449584961, -8.859867095947266, -7.552231788635254, -6.244596481323242, -4.9369611740112305, -3.629326343536377, -2.3216912746429443, -1.0140562057495117, 0.2935791015625, 1.6012139320373535, 2.908848762512207, 4.216484069824219, 5.5241193771362305, 6.831754207611084, 8.139389038085938, 9.44702434539795, 10.754659652709961, 12.062294006347656, 13.369929313659668, 14.67756462097168, 15.985199928283691, 17.292835235595703, 18.6004695892334, 19.908103942871094, 21.215740203857422, 22.523374557495117, 23.831008911132812, 25.138648986816406, 26.4462833404541, 27.75391960144043, 29.061553955078125, 30.369190216064453, 31.67682456970215, 32.984458923339844, 34.29209518432617, 35.5997314453125, 36.90736770629883, 38.21500015258789, 39.52263641357422, 40.83027267456055, 42.137908935546875, 43.44554138183594, 44.753177642822266, 46.06081008911133, 47.368446350097656, 48.67607879638672, 49.98371505737305, 51.291351318359375, 52.59898376464844, 53.906620025634766, 55.214256286621094, 56.521888732910156, 57.829524993896484, 59.13715744018555, 60.444793701171875, 61.7524299621582, 63.06006622314453, 64.3676986694336, 65.67533111572266, 66.98297119140625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 7.0, 10.0, 6.0, 10.0, 6.0, 8.0, 9.0, 14.0, 27.0, 15.0, 21.0, 27.0, 41.0, 41.0, 77.0, 102.0, 128.0, 114.0, 76.0, 45.0, 19.0, 31.0, 14.0, 13.0, 14.0, 14.0, 12.0, 15.0, 12.0, 11.0, 7.0, 6.0, 7.0, 4.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.786760330200195, -30.809301376342773, -29.83184051513672, -28.854381561279297, -27.876920700073242, -26.89946174621582, -25.922000885009766, -24.944541931152344, -23.967082977294922, -22.9896240234375, -22.012163162231445, -21.034704208374023, -20.05724334716797, -19.079784393310547, -18.102325439453125, -17.12486457824707, -16.147403717041016, -15.169943809509277, -14.192483901977539, -13.215024948120117, -12.237564086914062, -11.26010513305664, -10.282645225524902, -9.305185317993164, -8.327725410461426, -7.3502655029296875, -6.372805595397949, -5.395346164703369, -4.417886257171631, -3.4404263496398926, -2.4629669189453125, -1.4855070114135742, -0.5080451965332031, 0.4694145917892456, 1.4468743801116943, 2.4243340492248535, 3.401793956756592, 4.37925386428833, 5.35671329498291, 6.334173202514648, 7.311633110046387, 8.289093017578125, 9.266552925109863, 10.244012832641602, 11.221471786499023, 12.198932647705078, 13.1763916015625, 14.153851509094238, 15.131311416625977, 16.1087703704834, 17.086231231689453, 18.063690185546875, 19.04115104675293, 20.01861000061035, 20.996070861816406, 21.973529815673828, 22.95098876953125, 23.928447723388672, 24.905908584594727, 25.88336753845215, 26.860828399658203, 27.838287353515625, 28.815746307373047, 29.7932071685791, 30.770668029785156]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 8.0, 13.0, 14.0, 19.0, 29.0, 29.0, 35.0, 32.0, 43.0, 52.0, 88.0, 220.0, 107.0, 61.0, 40.0, 36.0, 29.0, 19.0, 25.0, 15.0, 22.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.235137939453125, -3.10894775390625, -2.982757568359375, -2.8565673828125, -2.730377197265625, -2.60418701171875, -2.477996826171875, -2.351806640625, -2.225616455078125, -2.09942626953125, -1.973236083984375, -1.8470458984375, -1.720855712890625, -1.59466552734375, -1.468475341796875, -1.34228515625, -1.216094970703125, -1.08990478515625, -0.963714599609375, -0.8375244140625, -0.711334228515625, -0.58514404296875, -0.458953857421875, -0.332763671875, -0.206573486328125, -0.08038330078125, 0.045806884765625, 0.1719970703125, 0.298187255859375, 0.42437744140625, 0.550567626953125, 0.6767578125, 0.802947998046875, 0.92913818359375, 1.055328369140625, 1.1815185546875, 1.307708740234375, 1.43389892578125, 1.560089111328125, 1.686279296875, 1.812469482421875, 1.93865966796875, 2.064849853515625, 2.1910400390625, 2.317230224609375, 2.44342041015625, 2.569610595703125, 2.69580078125, 2.821990966796875, 2.94818115234375, 3.074371337890625, 3.2005615234375, 3.326751708984375, 3.45294189453125, 3.579132080078125, 3.705322265625, 3.831512451171875, 3.95770263671875, 4.083892822265625, 4.2100830078125, 4.336273193359375, 4.46246337890625, 4.588653564453125, 4.71484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 11.0, 13.0, 16.0, 37.0, 39.0, 72.0, 114.0, 248.0, 555.0, 1634.0, 5896.0, 59546.0, 8302411.0, 13253.0, 2926.0, 944.0, 384.0, 158.0, 73.0, 53.0, 41.0, 31.0, 26.0, 20.0, 8.0, 7.0, 12.0, 11.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 0.0, 1.0], "bins": [-23.040096282958984, -22.346797943115234, -21.653501510620117, -20.960203170776367, -20.266904830932617, -19.573606491088867, -18.88031005859375, -18.18701171875, -17.49371337890625, -16.8004150390625, -16.107118606567383, -15.413820266723633, -14.720521926879883, -14.02722454071045, -13.333927154541016, -12.640628814697266, -11.947331428527832, -11.254034042358398, -10.560735702514648, -9.867438316345215, -9.174139976501465, -8.480842590332031, -7.7875447273254395, -7.094246864318848, -6.400949001312256, -5.707651138305664, -5.014353275299072, -4.3210554122924805, -3.6277577877044678, -2.934459924697876, -2.2411623001098633, -1.5478644371032715, -0.8545665740966797, -0.16126877069473267, 0.5320290327072144, 1.2253267765045166, 1.9186246395111084, 2.6119225025177, 3.305220127105713, 3.9985179901123047, 4.6918158531188965, 5.385113716125488, 6.07841157913208, 6.771709442138672, 7.4650068283081055, 8.158305168151855, 8.851602554321289, 9.544900894165039, 10.238198280334473, 10.931495666503906, 11.624794006347656, 12.31809139251709, 13.01138973236084, 13.704687118530273, 14.397985458374023, 15.091282844543457, 15.78458023071289, 16.47787857055664, 17.171175003051758, 17.864473342895508, 18.557771682739258, 19.251070022583008, 19.944366455078125, 20.637664794921875, 21.330963134765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-37.35580062866211, -36.37879180908203, -35.40178298950195, -34.42477798461914, -33.44776916503906, -32.470760345458984, -31.493751525878906, -30.51674461364746, -29.539735794067383, -28.562726974487305, -27.58572006225586, -26.60871124267578, -25.631704330444336, -24.654695510864258, -23.677688598632812, -22.700679779052734, -21.723670959472656, -20.746662139892578, -19.769655227661133, -18.792646408081055, -17.81563949584961, -16.83863067626953, -15.86162281036377, -14.884614944458008, -13.907608032226562, -12.9306001663208, -11.953592300415039, -10.976583480834961, -9.9995756149292, -9.022567749023438, -8.045559883117676, -7.068551540374756, -6.091543197631836, -5.114535331726074, -4.137526988983154, -3.1605191230773926, -2.1835110187530518, -1.206502914428711, -0.22949504852294922, 0.7475132942199707, 1.7245211601257324, 2.7015292644500732, 3.678537368774414, 4.655545234680176, 5.6325531005859375, 6.609561443328857, 7.586569309234619, 8.563577651977539, 9.5405855178833, 10.517593383789062, 11.494601249694824, 12.471609115600586, 13.448617935180664, 14.425625801086426, 15.402633666992188, 16.379642486572266, 17.35664939880371, 18.33365821838379, 19.310665130615234, 20.287673950195312, 21.264680862426758, 22.241689682006836, 23.21869659423828, 24.19570541381836, 25.172714233398438]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 19.0, 16.0, 26.0, 34.0, 27.0, 45.0, 50.0, 56.0, 69.0, 65.0, 84.0, 61.0, 76.0, 54.0, 54.0, 52.0, 36.0, 37.0, 29.0, 24.0, 20.0, 12.0, 12.0, 12.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.942779541015625, -3.83477783203125, -3.726776123046875, -3.6187744140625, -3.510772705078125, -3.40277099609375, -3.294769287109375, -3.186767578125, -3.078765869140625, -2.97076416015625, -2.862762451171875, -2.7547607421875, -2.646759033203125, -2.53875732421875, -2.430755615234375, -2.32275390625, -2.214752197265625, -2.10675048828125, -1.998748779296875, -1.8907470703125, -1.782745361328125, -1.67474365234375, -1.566741943359375, -1.458740234375, -1.350738525390625, -1.24273681640625, -1.134735107421875, -1.0267333984375, -0.918731689453125, -0.81072998046875, -0.702728271484375, -0.5947265625, -0.486724853515625, -0.37872314453125, -0.270721435546875, -0.1627197265625, -0.054718017578125, 0.05328369140625, 0.161285400390625, 0.269287109375, 0.377288818359375, 0.48529052734375, 0.593292236328125, 0.7012939453125, 0.809295654296875, 0.91729736328125, 1.025299072265625, 1.13330078125, 1.241302490234375, 1.34930419921875, 1.457305908203125, 1.5653076171875, 1.673309326171875, 1.78131103515625, 1.889312744140625, 1.997314453125, 2.105316162109375, 2.21331787109375, 2.321319580078125, 2.4293212890625, 2.537322998046875, 2.64532470703125, 2.753326416015625, 2.861328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 6.0, 7.0, 19.0, 11.0, 26.0, 51.0, 77.0, 151.0, 297.0, 638.0, 1459.0, 3924.0, 11169.0, 35279.0, 114885.0, 211167.0, 98864.0, 30260.0, 9929.0, 3456.0, 1392.0, 586.0, 244.0, 142.0, 60.0, 47.0, 30.0, 21.0, 15.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.453125, -18.76904296875, -18.0849609375, -17.40087890625, -16.716796875, -16.03271484375, -15.3486328125, -14.66455078125, -13.98046875, -13.29638671875, -12.6123046875, -11.92822265625, -11.244140625, -10.56005859375, -9.8759765625, -9.19189453125, -8.5078125, -7.82373046875, -7.1396484375, -6.45556640625, -5.771484375, -5.08740234375, -4.4033203125, -3.71923828125, -3.03515625, -2.35107421875, -1.6669921875, -0.98291015625, -0.298828125, 0.38525390625, 1.0693359375, 1.75341796875, 2.4375, 3.12158203125, 3.8056640625, 4.48974609375, 5.173828125, 5.85791015625, 6.5419921875, 7.22607421875, 7.91015625, 8.59423828125, 9.2783203125, 9.96240234375, 10.646484375, 11.33056640625, 12.0146484375, 12.69873046875, 13.3828125, 14.06689453125, 14.7509765625, 15.43505859375, 16.119140625, 16.80322265625, 17.4873046875, 18.17138671875, 18.85546875, 19.53955078125, 20.2236328125, 20.90771484375, 21.591796875, 22.27587890625, 22.9599609375, 23.64404296875, 24.328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 8.0, 6.0, 11.0, 17.0, 28.0, 26.0, 37.0, 43.0, 58.0, 41.0, 60.0, 56.0, 60.0, 73.0, 63.0, 70.0, 55.0, 62.0, 34.0, 33.0, 34.0, 30.0, 22.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.452789306640625, -3.34893798828125, -3.245086669921875, -3.1412353515625, -3.037384033203125, -2.93353271484375, -2.829681396484375, -2.725830078125, -2.621978759765625, -2.51812744140625, -2.414276123046875, -2.3104248046875, -2.206573486328125, -2.10272216796875, -1.998870849609375, -1.89501953125, -1.791168212890625, -1.68731689453125, -1.583465576171875, -1.4796142578125, -1.375762939453125, -1.27191162109375, -1.168060302734375, -1.064208984375, -0.960357666015625, -0.85650634765625, -0.752655029296875, -0.6488037109375, -0.544952392578125, -0.44110107421875, -0.337249755859375, -0.2333984375, -0.129547119140625, -0.02569580078125, 0.078155517578125, 0.1820068359375, 0.285858154296875, 0.38970947265625, 0.493560791015625, 0.597412109375, 0.701263427734375, 0.80511474609375, 0.908966064453125, 1.0128173828125, 1.116668701171875, 1.22052001953125, 1.324371337890625, 1.42822265625, 1.532073974609375, 1.63592529296875, 1.739776611328125, 1.8436279296875, 1.947479248046875, 2.05133056640625, 2.155181884765625, 2.259033203125, 2.362884521484375, 2.46673583984375, 2.570587158203125, 2.6744384765625, 2.778289794921875, 2.88214111328125, 2.985992431640625, 3.08984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 7.0, 4.0, 6.0, 13.0, 17.0, 38.0, 75.0, 106.0, 96.0, 46.0, 25.0, 10.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.659618377685547, -29.742244720458984, -28.82486915588379, -27.907495498657227, -26.990121841430664, -26.07274627685547, -25.155372619628906, -24.237998962402344, -23.32062339782715, -22.403249740600586, -21.48587417602539, -20.568500518798828, -19.651126861572266, -18.73375129699707, -17.816377639770508, -16.899002075195312, -15.981629371643066, -15.064254760742188, -14.146881103515625, -13.229506492614746, -12.312131881713867, -11.394758224487305, -10.477383613586426, -9.560009002685547, -8.642635345458984, -7.725261211395264, -6.807886600494385, -5.890512466430664, -4.973137855529785, -4.0557637214660645, -3.1383895874023438, -2.221014976501465, -1.303640365600586, -0.3862660527229309, 0.5311082601547241, 1.4484825134277344, 2.365856885910034, 3.283231258392334, 4.200605392456055, 5.117980003356934, 6.035354137420654, 6.952728271484375, 7.870102882385254, 8.787477493286133, 9.704851150512695, 10.622225761413574, 11.539600372314453, 12.456974029541016, 13.374348640441895, 14.291723251342773, 15.209096908569336, 16.12647247314453, 17.043846130371094, 17.961219787597656, 18.87859344482422, 19.795969009399414, 20.713342666625977, 21.63071632385254, 22.548091888427734, 23.465465545654297, 24.38283920288086, 25.300214767456055, 26.217588424682617, 27.134963989257812, 28.052337646484375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 9.0, 2.0, 5.0, 27.0, 54.0, 132.0, 121.0, 59.0, 20.0, 8.0, 9.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.553199768066406, -24.54115104675293, -23.52910041809082, -22.517051696777344, -21.505001068115234, -20.492952346801758, -19.48090362548828, -18.468852996826172, -17.456804275512695, -16.44475555419922, -15.43270492553711, -14.420656204223633, -13.40860652923584, -12.396556854248047, -11.38450813293457, -10.372458457946777, -9.360408782958984, -8.348359107971191, -7.336309909820557, -6.324260711669922, -5.312211036682129, -4.300161361694336, -3.288112163543701, -2.2760629653930664, -1.2640132904052734, -0.25196385383605957, 0.7600855827331543, 1.7721350193023682, 2.784184455871582, 3.796234130859375, 4.80828332901001, 5.8203325271606445, 6.832378387451172, 7.844428062438965, 8.856477737426758, 9.868526458740234, 10.880576133728027, 11.89262580871582, 12.904674530029297, 13.91672420501709, 14.928773880004883, 15.940823554992676, 16.95287322998047, 17.964921951293945, 18.976970672607422, 19.98902130126953, 21.001070022583008, 22.013118743896484, 23.025169372558594, 24.03721809387207, 25.04926872253418, 26.061317443847656, 27.073368072509766, 28.085416793823242, 29.09746551513672, 30.109516143798828, 31.121564865112305, 32.13361358642578, 33.14566421508789, 34.15771484375, 35.169761657714844, 36.18181228637695, 37.19386291503906, 38.205909729003906, 39.217960357666016]}, "eval/loss": 1.85287344455719, "eval/wer": 0.9976993256644189, "eval/runtime": 896.1552, "eval/samples_per_second": 2.948, "eval/steps_per_second": 0.369, "train/train_runtime": 114528.9287, "train/train_samples_per_second": 4.984, "train/train_steps_per_second": 0.156, "train/total_flos": 0.0, "train/train_loss": 0.9826719127995244} \ No newline at end of file +{"train/loss": 0.0608, "train/learning_rate": 4.156769596199525e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 115972, "_timestamp": 1647709849, "_step": 17848, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 6.0, 15.0, 19.0, 22.0, 48.0, 65.0, 61.0, 84.0, 114.0, 110.0, 103.0, 76.0, 77.0, 49.0, 35.0, 19.0, 15.0, 16.0, 9.0, 7.0, 10.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.100801467895508, -26.244380950927734, -25.38796043395996, -24.531539916992188, -23.675119400024414, -22.81869888305664, -21.9622802734375, -21.105859756469727, -20.249439239501953, -19.39301872253418, -18.536598205566406, -17.680177688598633, -16.82375717163086, -15.967337608337402, -15.110917091369629, -14.254497528076172, -13.398076057434082, -12.541655540466309, -11.685235023498535, -10.828815460205078, -9.972394943237305, -9.115974426269531, -8.259553909301758, -7.403133869171143, -6.546713352203369, -5.690292835235596, -4.8338727951049805, -3.977452278137207, -3.1210319995880127, -2.2646117210388184, -1.408191204071045, -0.5517711639404297, 0.30464935302734375, 1.161069631576538, 2.0174899101257324, 2.873910427093506, 3.7303307056427, 4.5867509841918945, 5.443171501159668, 6.299591541290283, 7.156012058258057, 8.012432098388672, 8.868852615356445, 9.725273132324219, 10.581693649291992, 11.438114166259766, 12.294534683227539, 13.150954246520996, 14.00737476348877, 14.863795280456543, 15.720215797424316, 16.576635360717773, 17.433055877685547, 18.28947639465332, 19.145896911621094, 20.002317428588867, 20.85873794555664, 21.715158462524414, 22.571578979492188, 23.42799949645996, 24.284420013427734, 25.140838623046875, 25.99726104736328, 26.853679656982422, 27.710100173950195]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 13.0, 14.0, 18.0, 24.0, 29.0, 38.0, 54.0, 58.0, 64.0, 54.0, 61.0, 62.0, 63.0, 63.0, 54.0, 68.0, 43.0, 42.0, 37.0, 36.0, 24.0, 15.0, 15.0, 10.0, 5.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.098886489868164, -20.288461685180664, -19.478036880493164, -18.66761016845703, -17.85718536376953, -17.04676055908203, -16.23633575439453, -15.425910949707031, -14.615485191345215, -13.805060386657715, -12.994634628295898, -12.184209823608398, -11.373785018920898, -10.563359260559082, -9.752934455871582, -8.942508697509766, -8.132083892822266, -7.321658611297607, -6.511233329772949, -5.700808525085449, -4.890383243560791, -4.079957962036133, -3.269533157348633, -2.4591078758239746, -1.6486825942993164, -0.8382574319839478, -0.0278322696685791, 0.7825927734375, 1.5930180549621582, 2.4034433364868164, 3.2138681411743164, 4.024293422698975, 4.834716796875, 5.645142078399658, 6.455567359924316, 7.265992164611816, 8.076417922973633, 8.886842727661133, 9.697267532348633, 10.507692337036133, 11.31811809539795, 12.12854290008545, 12.938968658447266, 13.749393463134766, 14.559818267822266, 15.370244026184082, 16.180667877197266, 16.9910945892334, 17.8015193939209, 18.6119441986084, 19.4223690032959, 20.23279571533203, 21.04322052001953, 21.85364532470703, 22.66407012939453, 23.47449493408203, 24.28491973876953, 25.09534454345703, 25.90576934814453, 26.71619415283203, 27.526620864868164, 28.337045669555664, 29.147470474243164, 29.957895278930664, 30.768321990966797]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 8.0, 9.0, 16.0, 16.0, 30.0, 23.0, 38.0, 41.0, 47.0, 67.0, 64.0, 59.0, 52.0, 64.0, 59.0, 64.0, 69.0, 52.0, 27.0, 43.0, 26.0, 33.0, 21.0, 15.0, 14.0, 3.0, 8.0, 8.0, 5.0, 4.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.3742828369140625, -1.317901611328125, -1.2615203857421875, -1.20513916015625, -1.1487579345703125, -1.092376708984375, -1.0359954833984375, -0.9796142578125, -0.9232330322265625, -0.866851806640625, -0.8104705810546875, -0.75408935546875, -0.6977081298828125, -0.641326904296875, -0.5849456787109375, -0.528564453125, -0.4721832275390625, -0.415802001953125, -0.3594207763671875, -0.30303955078125, -0.2466583251953125, -0.190277099609375, -0.1338958740234375, -0.0775146484375, -0.0211334228515625, 0.035247802734375, 0.0916290283203125, 0.14801025390625, 0.2043914794921875, 0.260772705078125, 0.3171539306640625, 0.37353515625, 0.4299163818359375, 0.486297607421875, 0.5426788330078125, 0.59906005859375, 0.6554412841796875, 0.711822509765625, 0.7682037353515625, 0.8245849609375, 0.8809661865234375, 0.937347412109375, 0.9937286376953125, 1.05010986328125, 1.1064910888671875, 1.162872314453125, 1.2192535400390625, 1.275634765625, 1.3320159912109375, 1.388397216796875, 1.4447784423828125, 1.50115966796875, 1.5575408935546875, 1.613922119140625, 1.6703033447265625, 1.7266845703125, 1.7830657958984375, 1.839447021484375, 1.8958282470703125, 1.95220947265625, 2.0085906982421875, 2.064971923828125, 2.1213531494140625, 2.177734375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 15.0, 16.0, 30.0, 34.0, 41.0, 80.0, 131.0, 151.0, 344.0, 714.0, 1926.0, 6215.0, 26205.0, 199978.0, 3804105.0, 125763.0, 19798.0, 5179.0, 1791.0, 763.0, 362.0, 202.0, 134.0, 92.0, 56.0, 38.0, 24.0, 22.0, 17.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.3924560546875, -11.839599609375, -11.2867431640625, -10.73388671875, -10.1810302734375, -9.628173828125, -9.0753173828125, -8.5224609375, -7.9696044921875, -7.416748046875, -6.8638916015625, -6.31103515625, -5.7581787109375, -5.205322265625, -4.6524658203125, -4.099609375, -3.5467529296875, -2.993896484375, -2.4410400390625, -1.88818359375, -1.3353271484375, -0.782470703125, -0.2296142578125, 0.3232421875, 0.8760986328125, 1.428955078125, 1.9818115234375, 2.53466796875, 3.0875244140625, 3.640380859375, 4.1932373046875, 4.74609375, 5.2989501953125, 5.851806640625, 6.4046630859375, 6.95751953125, 7.5103759765625, 8.063232421875, 8.6160888671875, 9.1689453125, 9.7218017578125, 10.274658203125, 10.8275146484375, 11.38037109375, 11.9332275390625, 12.486083984375, 13.0389404296875, 13.591796875, 14.1446533203125, 14.697509765625, 15.2503662109375, 15.80322265625, 16.3560791015625, 16.908935546875, 17.4617919921875, 18.0146484375, 18.5675048828125, 19.120361328125, 19.6732177734375, 20.22607421875, 20.7789306640625, 21.331787109375, 21.8846435546875, 22.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 6.0, 15.0, 35.0, 68.0, 88.0, 197.0, 534.0, 1911.0, 663.0, 258.0, 125.0, 63.0, 40.0, 25.0, 19.0, 8.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9921875, -13.5498046875, -13.107421875, -12.6650390625, -12.22265625, -11.7802734375, -11.337890625, -10.8955078125, -10.453125, -10.0107421875, -9.568359375, -9.1259765625, -8.68359375, -8.2412109375, -7.798828125, -7.3564453125, -6.9140625, -6.4716796875, -6.029296875, -5.5869140625, -5.14453125, -4.7021484375, -4.259765625, -3.8173828125, -3.375, -2.9326171875, -2.490234375, -2.0478515625, -1.60546875, -1.1630859375, -0.720703125, -0.2783203125, 0.1640625, 0.6064453125, 1.048828125, 1.4912109375, 1.93359375, 2.3759765625, 2.818359375, 3.2607421875, 3.703125, 4.1455078125, 4.587890625, 5.0302734375, 5.47265625, 5.9150390625, 6.357421875, 6.7998046875, 7.2421875, 7.6845703125, 8.126953125, 8.5693359375, 9.01171875, 9.4541015625, 9.896484375, 10.3388671875, 10.78125, 11.2236328125, 11.666015625, 12.1083984375, 12.55078125, 12.9931640625, 13.435546875, 13.8779296875, 14.3203125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 17.0, 38.0, 40.0, 66.0, 94.0, 142.0, 256.0, 571.0, 1528.0, 5103.0, 24760.0, 246907.0, 3771734.0, 120822.0, 16099.0, 3772.0, 1178.0, 476.0, 235.0, 141.0, 101.0, 70.0, 39.0, 30.0, 21.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.58349609375, -36.3857421875, -35.18798828125, -33.990234375, -32.79248046875, -31.5947265625, -30.39697265625, -29.19921875, -28.00146484375, -26.8037109375, -25.60595703125, -24.408203125, -23.21044921875, -22.0126953125, -20.81494140625, -19.6171875, -18.41943359375, -17.2216796875, -16.02392578125, -14.826171875, -13.62841796875, -12.4306640625, -11.23291015625, -10.03515625, -8.83740234375, -7.6396484375, -6.44189453125, -5.244140625, -4.04638671875, -2.8486328125, -1.65087890625, -0.453125, 0.74462890625, 1.9423828125, 3.14013671875, 4.337890625, 5.53564453125, 6.7333984375, 7.93115234375, 9.12890625, 10.32666015625, 11.5244140625, 12.72216796875, 13.919921875, 15.11767578125, 16.3154296875, 17.51318359375, 18.7109375, 19.90869140625, 21.1064453125, 22.30419921875, 23.501953125, 24.69970703125, 25.8974609375, 27.09521484375, 28.29296875, 29.49072265625, 30.6884765625, 31.88623046875, 33.083984375, 34.28173828125, 35.4794921875, 36.67724609375, 37.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 15.0, 11.0, 16.0, 36.0, 54.0, 90.0, 97.0, 144.0, 154.0, 118.0, 78.0, 61.0, 31.0, 30.0, 27.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.96833801269531, -54.66822052001953, -53.36810302734375, -52.06798553466797, -50.76786804199219, -49.467750549316406, -48.167633056640625, -46.867515563964844, -45.56739807128906, -44.26728057861328, -42.9671630859375, -41.66704559326172, -40.36692810058594, -39.066810607910156, -37.766693115234375, -36.466575622558594, -35.16645431518555, -33.866336822509766, -32.566219329833984, -31.266101837158203, -29.965984344482422, -28.66586685180664, -27.365747451782227, -26.065629959106445, -24.765512466430664, -23.465394973754883, -22.1652774810791, -20.86515998840332, -19.565040588378906, -18.264923095703125, -16.964805603027344, -15.664688110351562, -14.364574432373047, -13.064456939697266, -11.764339447021484, -10.464221000671387, -9.164103507995605, -7.863986015319824, -6.563868045806885, -5.263750076293945, -3.963632583618164, -2.6635148525238037, -1.3633971214294434, -0.06327939033508301, 1.2368383407592773, 2.5369558334350586, 3.837073802947998, 5.1371917724609375, 6.437309265136719, 7.7374267578125, 9.037544250488281, 10.337662696838379, 11.63778018951416, 12.937897682189941, 14.238016128540039, 15.53813362121582, 16.8382511138916, 18.138368606567383, 19.438486099243164, 20.738603591918945, 22.03872299194336, 23.33884048461914, 24.638957977294922, 25.939075469970703, 27.239192962646484]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 16.0, 9.0, 18.0, 16.0, 14.0, 33.0, 21.0, 28.0, 30.0, 41.0, 50.0, 37.0, 39.0, 39.0, 40.0, 51.0, 35.0, 51.0, 41.0, 38.0, 31.0, 33.0, 35.0, 30.0, 27.0, 10.0, 18.0, 19.0, 26.0, 15.0, 12.0, 16.0, 10.0, 8.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.482481002807617, -20.81058120727539, -20.13867950439453, -19.466779708862305, -18.794879913330078, -18.12297821044922, -17.451078414916992, -16.779178619384766, -16.107276916503906, -15.435376167297363, -14.76347541809082, -14.091575622558594, -13.41967487335205, -12.747774124145508, -12.075874328613281, -11.403973579406738, -10.732072830200195, -10.060172080993652, -9.38827133178711, -8.716371536254883, -8.04447078704834, -7.372570037841797, -6.700669765472412, -6.028769493103027, -5.356868743896484, -4.684967994689941, -4.013067722320557, -3.3411672115325928, -2.669266700744629, -1.997366189956665, -1.3254656791687012, -0.6535654067993164, 0.018337249755859375, 0.6902377605438232, 1.362138271331787, 2.034038782119751, 2.705939292907715, 3.3778398036956787, 4.049740314483643, 4.721640586853027, 5.39354133605957, 6.065442085266113, 6.737342357635498, 7.409242630004883, 8.081143379211426, 8.753044128417969, 9.424943923950195, 10.096844673156738, 10.768745422363281, 11.440646171569824, 12.112546920776367, 12.784446716308594, 13.456347465515137, 14.12824821472168, 14.800148010253906, 15.47204875946045, 16.143949508666992, 16.81584930419922, 17.487751007080078, 18.159650802612305, 18.83155059814453, 19.50345230102539, 20.175352096557617, 20.847251892089844, 21.519153594970703]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 4.0, 8.0, 10.0, 14.0, 12.0, 22.0, 25.0, 30.0, 35.0, 35.0, 35.0, 40.0, 47.0, 60.0, 54.0, 61.0, 59.0, 52.0, 54.0, 56.0, 44.0, 32.0, 34.0, 38.0, 28.0, 29.0, 17.0, 14.0, 13.0, 7.0, 15.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7455596923828125, -1.691314697265625, -1.6370697021484375, -1.58282470703125, -1.5285797119140625, -1.474334716796875, -1.4200897216796875, -1.3658447265625, -1.3115997314453125, -1.257354736328125, -1.2031097412109375, -1.14886474609375, -1.0946197509765625, -1.040374755859375, -0.9861297607421875, -0.931884765625, -0.8776397705078125, -0.823394775390625, -0.7691497802734375, -0.71490478515625, -0.6606597900390625, -0.606414794921875, -0.5521697998046875, -0.4979248046875, -0.4436798095703125, -0.389434814453125, -0.3351898193359375, -0.28094482421875, -0.2266998291015625, -0.172454833984375, -0.1182098388671875, -0.06396484375, -0.0097198486328125, 0.044525146484375, 0.0987701416015625, 0.15301513671875, 0.2072601318359375, 0.261505126953125, 0.3157501220703125, 0.3699951171875, 0.4242401123046875, 0.478485107421875, 0.5327301025390625, 0.58697509765625, 0.6412200927734375, 0.695465087890625, 0.7497100830078125, 0.803955078125, 0.8582000732421875, 0.912445068359375, 0.9666900634765625, 1.02093505859375, 1.0751800537109375, 1.129425048828125, 1.1836700439453125, 1.2379150390625, 1.2921600341796875, 1.346405029296875, 1.4006500244140625, 1.45489501953125, 1.5091400146484375, 1.563385009765625, 1.6176300048828125, 1.671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 16.0, 13.0, 20.0, 20.0, 48.0, 60.0, 103.0, 149.0, 240.0, 362.0, 684.0, 1206.0, 2251.0, 4407.0, 9451.0, 22248.0, 66329.0, 679915.0, 191254.0, 40420.0, 15206.0, 6726.0, 3343.0, 1734.0, 923.0, 526.0, 301.0, 201.0, 140.0, 80.0, 45.0, 44.0, 26.0, 18.0, 15.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.43798828125, -8.1806640625, -7.92333984375, -7.666015625, -7.40869140625, -7.1513671875, -6.89404296875, -6.63671875, -6.37939453125, -6.1220703125, -5.86474609375, -5.607421875, -5.35009765625, -5.0927734375, -4.83544921875, -4.578125, -4.32080078125, -4.0634765625, -3.80615234375, -3.548828125, -3.29150390625, -3.0341796875, -2.77685546875, -2.51953125, -2.26220703125, -2.0048828125, -1.74755859375, -1.490234375, -1.23291015625, -0.9755859375, -0.71826171875, -0.4609375, -0.20361328125, 0.0537109375, 0.31103515625, 0.568359375, 0.82568359375, 1.0830078125, 1.34033203125, 1.59765625, 1.85498046875, 2.1123046875, 2.36962890625, 2.626953125, 2.88427734375, 3.1416015625, 3.39892578125, 3.65625, 3.91357421875, 4.1708984375, 4.42822265625, 4.685546875, 4.94287109375, 5.2001953125, 5.45751953125, 5.71484375, 5.97216796875, 6.2294921875, 6.48681640625, 6.744140625, 7.00146484375, 7.2587890625, 7.51611328125, 7.7734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 2.0, 10.0, 12.0, 13.0, 13.0, 18.0, 20.0, 25.0, 26.0, 36.0, 35.0, 39.0, 32.0, 45.0, 31.0, 43.0, 38.0, 39.0, 1057.0, 46.0, 44.0, 45.0, 42.0, 35.0, 32.0, 31.0, 26.0, 22.0, 19.0, 22.0, 17.0, 17.0, 9.0, 17.0, 14.0, 7.0, 10.0, 7.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.058868408203125, -1.02105712890625, -0.983245849609375, -0.9454345703125, -0.907623291015625, -0.86981201171875, -0.832000732421875, -0.794189453125, -0.756378173828125, -0.71856689453125, -0.680755615234375, -0.6429443359375, -0.605133056640625, -0.56732177734375, -0.529510498046875, -0.49169921875, -0.453887939453125, -0.41607666015625, -0.378265380859375, -0.3404541015625, -0.302642822265625, -0.26483154296875, -0.227020263671875, -0.189208984375, -0.151397705078125, -0.11358642578125, -0.075775146484375, -0.0379638671875, -0.000152587890625, 0.03765869140625, 0.075469970703125, 0.11328125, 0.151092529296875, 0.18890380859375, 0.226715087890625, 0.2645263671875, 0.302337646484375, 0.34014892578125, 0.377960205078125, 0.415771484375, 0.453582763671875, 0.49139404296875, 0.529205322265625, 0.5670166015625, 0.604827880859375, 0.64263916015625, 0.680450439453125, 0.71826171875, 0.756072998046875, 0.79388427734375, 0.831695556640625, 0.8695068359375, 0.907318115234375, 0.94512939453125, 0.982940673828125, 1.020751953125, 1.058563232421875, 1.09637451171875, 1.134185791015625, 1.1719970703125, 1.209808349609375, 1.24761962890625, 1.285430908203125, 1.3232421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 13.0, 12.0, 15.0, 22.0, 25.0, 34.0, 57.0, 75.0, 89.0, 131.0, 197.0, 290.0, 402.0, 590.0, 972.0, 1543.0, 2527.0, 4484.0, 8431.0, 19502.0, 60751.0, 1383133.0, 529715.0, 49483.0, 16652.0, 7581.0, 3949.0, 2268.0, 1377.0, 895.0, 585.0, 405.0, 263.0, 199.0, 109.0, 93.0, 60.0, 48.0, 40.0, 27.0, 19.0, 16.0, 15.0, 3.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.810546875, -2.71966552734375, -2.6287841796875, -2.53790283203125, -2.447021484375, -2.35614013671875, -2.2652587890625, -2.17437744140625, -2.08349609375, -1.99261474609375, -1.9017333984375, -1.81085205078125, -1.719970703125, -1.62908935546875, -1.5382080078125, -1.44732666015625, -1.3564453125, -1.26556396484375, -1.1746826171875, -1.08380126953125, -0.992919921875, -0.90203857421875, -0.8111572265625, -0.72027587890625, -0.62939453125, -0.53851318359375, -0.4476318359375, -0.35675048828125, -0.265869140625, -0.17498779296875, -0.0841064453125, 0.00677490234375, 0.09765625, 0.18853759765625, 0.2794189453125, 0.37030029296875, 0.461181640625, 0.55206298828125, 0.6429443359375, 0.73382568359375, 0.82470703125, 0.91558837890625, 1.0064697265625, 1.09735107421875, 1.188232421875, 1.27911376953125, 1.3699951171875, 1.46087646484375, 1.5517578125, 1.64263916015625, 1.7335205078125, 1.82440185546875, 1.915283203125, 2.00616455078125, 2.0970458984375, 2.18792724609375, 2.27880859375, 2.36968994140625, 2.4605712890625, 2.55145263671875, 2.642333984375, 2.73321533203125, 2.8240966796875, 2.91497802734375, 3.005859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 8.0, 19.0, 149.0, 709.0, 73.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.934814453125, -2.85400390625, -2.773193359375, -2.6923828125, -2.611572265625, -2.53076171875, -2.449951171875, -2.369140625, -2.288330078125, -2.20751953125, -2.126708984375, -2.0458984375, -1.965087890625, -1.88427734375, -1.803466796875, -1.72265625, -1.641845703125, -1.56103515625, -1.480224609375, -1.3994140625, -1.318603515625, -1.23779296875, -1.156982421875, -1.076171875, -0.995361328125, -0.91455078125, -0.833740234375, -0.7529296875, -0.672119140625, -0.59130859375, -0.510498046875, -0.4296875, -0.348876953125, -0.26806640625, -0.187255859375, -0.1064453125, -0.025634765625, 0.05517578125, 0.135986328125, 0.216796875, 0.297607421875, 0.37841796875, 0.459228515625, 0.5400390625, 0.620849609375, 0.70166015625, 0.782470703125, 0.86328125, 0.944091796875, 1.02490234375, 1.105712890625, 1.1865234375, 1.267333984375, 1.34814453125, 1.428955078125, 1.509765625, 1.590576171875, 1.67138671875, 1.752197265625, 1.8330078125, 1.913818359375, 1.99462890625, 2.075439453125, 2.15625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 3.0, 9.0, 12.0, 11.0, 17.0, 28.0, 87.0, 377.0, 3379.0, 1025580.0, 17285.0, 1361.0, 210.0, 74.0, 25.0, 17.0, 9.0, 9.0, 3.0, 4.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.7587890625, -36.673828125, -35.5888671875, -34.50390625, -33.4189453125, -32.333984375, -31.2490234375, -30.1640625, -29.0791015625, -27.994140625, -26.9091796875, -25.82421875, -24.7392578125, -23.654296875, -22.5693359375, -21.484375, -20.3994140625, -19.314453125, -18.2294921875, -17.14453125, -16.0595703125, -14.974609375, -13.8896484375, -12.8046875, -11.7197265625, -10.634765625, -9.5498046875, -8.46484375, -7.3798828125, -6.294921875, -5.2099609375, -4.125, -3.0400390625, -1.955078125, -0.8701171875, 0.21484375, 1.2998046875, 2.384765625, 3.4697265625, 4.5546875, 5.6396484375, 6.724609375, 7.8095703125, 8.89453125, 9.9794921875, 11.064453125, 12.1494140625, 13.234375, 14.3193359375, 15.404296875, 16.4892578125, 17.57421875, 18.6591796875, 19.744140625, 20.8291015625, 21.9140625, 22.9990234375, 24.083984375, 25.1689453125, 26.25390625, 27.3388671875, 28.423828125, 29.5087890625, 30.59375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 12.0, 65.0, 204.0, 488.0, 172.0, 41.0, 19.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.455366611480713, -7.2503156661987305, -7.045264720916748, -6.840213775634766, -6.635162830352783, -6.430111885070801, -6.225060939788818, -6.020009994506836, -5.8149590492248535, -5.609908103942871, -5.404857158660889, -5.199806213378906, -4.994755268096924, -4.789704322814941, -4.584653377532959, -4.379602432250977, -4.174551486968994, -3.9695005416870117, -3.7644495964050293, -3.559398651123047, -3.3543477058410645, -3.149296760559082, -2.9442458152770996, -2.739194869995117, -2.5341439247131348, -2.3290929794311523, -2.12404203414917, -1.9189910888671875, -1.713940143585205, -1.5088891983032227, -1.3038382530212402, -1.0987873077392578, -0.8937363624572754, -0.688685417175293, -0.48363447189331055, -0.2785835266113281, -0.0735325813293457, 0.13151836395263672, 0.33656930923461914, 0.5416202545166016, 0.746671199798584, 0.9517221450805664, 1.1567730903625488, 1.3618240356445312, 1.5668749809265137, 1.771925926208496, 1.9769768714904785, 2.182027816772461, 2.3870787620544434, 2.592129707336426, 2.797180652618408, 3.0022315979003906, 3.207282543182373, 3.4123334884643555, 3.617384433746338, 3.8224353790283203, 4.027486324310303, 4.232537269592285, 4.437588214874268, 4.64263916015625, 4.847690105438232, 5.052741050720215, 5.257791996002197, 5.46284294128418, 5.667893886566162]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 9.0, 5.0, 6.0, 15.0, 16.0, 23.0, 12.0, 25.0, 37.0, 25.0, 33.0, 27.0, 36.0, 37.0, 45.0, 40.0, 34.0, 35.0, 35.0, 34.0, 45.0, 33.0, 42.0, 38.0, 24.0, 30.0, 31.0, 23.0, 32.0, 30.0, 27.0, 16.0, 10.0, 16.0, 12.0, 12.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4209628105163574, -1.3770132064819336, -1.3330636024475098, -1.289113998413086, -1.245164394378662, -1.2012147903442383, -1.1572651863098145, -1.1133155822753906, -1.0693659782409668, -1.025416374206543, -0.9814667701721191, -0.9375171661376953, -0.8935675621032715, -0.8496179580688477, -0.8056683540344238, -0.76171875, -0.7177691459655762, -0.6738195419311523, -0.6298699378967285, -0.5859203338623047, -0.5419707298278809, -0.49802112579345703, -0.4540715217590332, -0.4101219177246094, -0.36617231369018555, -0.3222227096557617, -0.2782731056213379, -0.23432350158691406, -0.19037389755249023, -0.1464242935180664, -0.10247468948364258, -0.05852508544921875, -0.014575481414794922, 0.029374122619628906, 0.07332372665405273, 0.11727333068847656, 0.1612229347229004, 0.20517253875732422, 0.24912214279174805, 0.2930717468261719, 0.3370213508605957, 0.38097095489501953, 0.42492055892944336, 0.4688701629638672, 0.512819766998291, 0.5567693710327148, 0.6007189750671387, 0.6446685791015625, 0.6886181831359863, 0.7325677871704102, 0.776517391204834, 0.8204669952392578, 0.8644165992736816, 0.9083662033081055, 0.9523158073425293, 0.9962654113769531, 1.040215015411377, 1.0841646194458008, 1.1281142234802246, 1.1720638275146484, 1.2160134315490723, 1.259963035583496, 1.30391263961792, 1.3478622436523438, 1.3918118476867676]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 10.0, 19.0, 20.0, 17.0, 32.0, 41.0, 37.0, 45.0, 55.0, 62.0, 64.0, 74.0, 69.0, 61.0, 46.0, 50.0, 49.0, 40.0, 44.0, 34.0, 25.0, 24.0, 15.0, 12.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9296417236328125, -1.868072509765625, -1.8065032958984375, -1.74493408203125, -1.6833648681640625, -1.621795654296875, -1.5602264404296875, -1.4986572265625, -1.4370880126953125, -1.375518798828125, -1.3139495849609375, -1.25238037109375, -1.1908111572265625, -1.129241943359375, -1.0676727294921875, -1.006103515625, -0.9445343017578125, -0.882965087890625, -0.8213958740234375, -0.75982666015625, -0.6982574462890625, -0.636688232421875, -0.5751190185546875, -0.5135498046875, -0.4519805908203125, -0.390411376953125, -0.3288421630859375, -0.26727294921875, -0.2057037353515625, -0.144134521484375, -0.0825653076171875, -0.02099609375, 0.0405731201171875, 0.102142333984375, 0.1637115478515625, 0.22528076171875, 0.2868499755859375, 0.348419189453125, 0.4099884033203125, 0.4715576171875, 0.5331268310546875, 0.594696044921875, 0.6562652587890625, 0.71783447265625, 0.7794036865234375, 0.840972900390625, 0.9025421142578125, 0.964111328125, 1.0256805419921875, 1.087249755859375, 1.1488189697265625, 1.21038818359375, 1.2719573974609375, 1.333526611328125, 1.3950958251953125, 1.4566650390625, 1.5182342529296875, 1.579803466796875, 1.6413726806640625, 1.70294189453125, 1.7645111083984375, 1.826080322265625, 1.8876495361328125, 1.94921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 13.0, 26.0, 43.0, 71.0, 101.0, 159.0, 323.0, 636.0, 1258.0, 2356.0, 4870.0, 11814.0, 31549.0, 109248.0, 485832.0, 295952.0, 66730.0, 21353.0, 8443.0, 3852.0, 1804.0, 969.0, 512.0, 255.0, 156.0, 87.0, 42.0, 28.0, 17.0, 12.0, 6.0, 8.0, 6.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.55206298828125, -5.3775634765625, -5.20306396484375, -5.028564453125, -4.85406494140625, -4.6795654296875, -4.50506591796875, -4.33056640625, -4.15606689453125, -3.9815673828125, -3.80706787109375, -3.632568359375, -3.45806884765625, -3.2835693359375, -3.10906982421875, -2.9345703125, -2.76007080078125, -2.5855712890625, -2.41107177734375, -2.236572265625, -2.06207275390625, -1.8875732421875, -1.71307373046875, -1.53857421875, -1.36407470703125, -1.1895751953125, -1.01507568359375, -0.840576171875, -0.66607666015625, -0.4915771484375, -0.31707763671875, -0.142578125, 0.03192138671875, 0.2064208984375, 0.38092041015625, 0.555419921875, 0.72991943359375, 0.9044189453125, 1.07891845703125, 1.25341796875, 1.42791748046875, 1.6024169921875, 1.77691650390625, 1.951416015625, 2.12591552734375, 2.3004150390625, 2.47491455078125, 2.6494140625, 2.82391357421875, 2.9984130859375, 3.17291259765625, 3.347412109375, 3.52191162109375, 3.6964111328125, 3.87091064453125, 4.04541015625, 4.21990966796875, 4.3944091796875, 4.56890869140625, 4.743408203125, 4.91790771484375, 5.0924072265625, 5.26690673828125, 5.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 11.0, 12.0, 12.0, 16.0, 27.0, 29.0, 41.0, 51.0, 69.0, 104.0, 117.0, 249.0, 1515.0, 264.0, 134.0, 79.0, 66.0, 60.0, 43.0, 27.0, 16.0, 18.0, 19.0, 21.0, 5.0, 5.0, 8.0, 3.0, 9.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.78125, -8.547119140625, -8.31298828125, -8.078857421875, -7.8447265625, -7.610595703125, -7.37646484375, -7.142333984375, -6.908203125, -6.674072265625, -6.43994140625, -6.205810546875, -5.9716796875, -5.737548828125, -5.50341796875, -5.269287109375, -5.03515625, -4.801025390625, -4.56689453125, -4.332763671875, -4.0986328125, -3.864501953125, -3.63037109375, -3.396240234375, -3.162109375, -2.927978515625, -2.69384765625, -2.459716796875, -2.2255859375, -1.991455078125, -1.75732421875, -1.523193359375, -1.2890625, -1.054931640625, -0.82080078125, -0.586669921875, -0.3525390625, -0.118408203125, 0.11572265625, 0.349853515625, 0.583984375, 0.818115234375, 1.05224609375, 1.286376953125, 1.5205078125, 1.754638671875, 1.98876953125, 2.222900390625, 2.45703125, 2.691162109375, 2.92529296875, 3.159423828125, 3.3935546875, 3.627685546875, 3.86181640625, 4.095947265625, 4.330078125, 4.564208984375, 4.79833984375, 5.032470703125, 5.2666015625, 5.500732421875, 5.73486328125, 5.968994140625, 6.203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 12.0, 15.0, 11.0, 16.0, 24.0, 30.0, 37.0, 42.0, 86.0, 247.0, 3052.0, 528091.0, 2606748.0, 6641.0, 334.0, 81.0, 60.0, 35.0, 36.0, 21.0, 18.0, 11.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.21875, -27.177734375, -26.13671875, -25.095703125, -24.0546875, -23.013671875, -21.97265625, -20.931640625, -19.890625, -18.849609375, -17.80859375, -16.767578125, -15.7265625, -14.685546875, -13.64453125, -12.603515625, -11.5625, -10.521484375, -9.48046875, -8.439453125, -7.3984375, -6.357421875, -5.31640625, -4.275390625, -3.234375, -2.193359375, -1.15234375, -0.111328125, 0.9296875, 1.970703125, 3.01171875, 4.052734375, 5.09375, 6.134765625, 7.17578125, 8.216796875, 9.2578125, 10.298828125, 11.33984375, 12.380859375, 13.421875, 14.462890625, 15.50390625, 16.544921875, 17.5859375, 18.626953125, 19.66796875, 20.708984375, 21.75, 22.791015625, 23.83203125, 24.873046875, 25.9140625, 26.955078125, 27.99609375, 29.037109375, 30.078125, 31.119140625, 32.16015625, 33.201171875, 34.2421875, 35.283203125, 36.32421875, 37.365234375, 38.40625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 105.0, 311.0, 411.0, 143.0, 33.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.548988342285156, -15.81141471862793, -14.07384204864502, -12.33626937866211, -10.598695755004883, -8.861122131347656, -7.123549461364746, -5.385976791381836, -3.6484031677246094, -1.910830020904541, -0.17325687408447266, 1.5643162727355957, 3.301889419555664, 5.039463043212891, 6.777035713195801, 8.514608383178711, 10.252182006835938, 11.989755630493164, 13.727328300476074, 15.464900970458984, 17.20247459411621, 18.940048217773438, 20.67761993408203, 22.415193557739258, 24.152767181396484, 25.89034080505371, 27.627914428710938, 29.36548614501953, 31.103059768676758, 32.840633392333984, 34.57820510864258, 36.31578063964844, 38.05335235595703, 39.790924072265625, 41.528499603271484, 43.26607131958008, 45.00364685058594, 46.74121856689453, 48.478790283203125, 50.21636199951172, 51.95393753051758, 53.69150924682617, 55.42908477783203, 57.166656494140625, 58.90422821044922, 60.64180374145508, 62.37937545776367, 64.11695098876953, 65.85452270507812, 67.59209442138672, 69.32966613769531, 71.06724548339844, 72.80481719970703, 74.54238891601562, 76.27996063232422, 78.01753234863281, 79.75511169433594, 81.49268341064453, 83.23025512695312, 84.96783447265625, 86.70540618896484, 88.44297790527344, 90.18054962158203, 91.91812133789062, 93.65569305419922]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 2.0, 6.0, 10.0, 8.0, 17.0, 15.0, 25.0, 17.0, 22.0, 29.0, 28.0, 44.0, 30.0, 45.0, 46.0, 44.0, 45.0, 48.0, 57.0, 40.0, 38.0, 40.0, 42.0, 34.0, 29.0, 36.0, 31.0, 23.0, 19.0, 21.0, 21.0, 18.0, 16.0, 9.0, 11.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-18.908187866210938, -18.34250259399414, -17.776817321777344, -17.211132049560547, -16.64544677734375, -16.079761505126953, -15.514076232910156, -14.94839096069336, -14.382705688476562, -13.817020416259766, -13.251335144042969, -12.685649871826172, -12.119964599609375, -11.554279327392578, -10.988594055175781, -10.422908782958984, -9.857222557067871, -9.291537284851074, -8.725852012634277, -8.16016674041748, -7.594481468200684, -7.028796195983887, -6.463110446929932, -5.897425174713135, -5.331739902496338, -4.766054630279541, -4.200369358062744, -3.634683847427368, -3.0689985752105713, -2.5033133029937744, -1.9376277923583984, -1.3719425201416016, -0.8062572479248047, -0.24057191610336304, 0.3251134157180786, 0.890798807144165, 1.456484079360962, 2.022169351577759, 2.5878548622131348, 3.1535401344299316, 3.7192254066467285, 4.284910678863525, 4.850595951080322, 5.416281700134277, 5.981966972351074, 6.547652244567871, 7.113337516784668, 7.679022789001465, 8.244708061218262, 8.810393333435059, 9.376078605651855, 9.941763877868652, 10.50744915008545, 11.073134422302246, 11.63882064819336, 12.204505920410156, 12.770191192626953, 13.33587646484375, 13.901561737060547, 14.467247009277344, 15.03293228149414, 15.598617553710938, 16.164302825927734, 16.72998809814453, 17.295673370361328]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 9.0, 12.0, 16.0, 20.0, 31.0, 30.0, 36.0, 36.0, 43.0, 50.0, 51.0, 53.0, 55.0, 56.0, 49.0, 46.0, 53.0, 53.0, 36.0, 48.0, 34.0, 36.0, 23.0, 20.0, 16.0, 16.0, 17.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6923980712890625, -1.635772705078125, -1.5791473388671875, -1.52252197265625, -1.4658966064453125, -1.409271240234375, -1.3526458740234375, -1.2960205078125, -1.2393951416015625, -1.182769775390625, -1.1261444091796875, -1.06951904296875, -1.0128936767578125, -0.956268310546875, -0.8996429443359375, -0.843017578125, -0.7863922119140625, -0.729766845703125, -0.6731414794921875, -0.61651611328125, -0.5598907470703125, -0.503265380859375, -0.4466400146484375, -0.3900146484375, -0.3333892822265625, -0.276763916015625, -0.2201385498046875, -0.16351318359375, -0.1068878173828125, -0.050262451171875, 0.0063629150390625, 0.06298828125, 0.1196136474609375, 0.176239013671875, 0.2328643798828125, 0.28948974609375, 0.3461151123046875, 0.402740478515625, 0.4593658447265625, 0.5159912109375, 0.5726165771484375, 0.629241943359375, 0.6858673095703125, 0.74249267578125, 0.7991180419921875, 0.855743408203125, 0.9123687744140625, 0.968994140625, 1.0256195068359375, 1.082244873046875, 1.1388702392578125, 1.19549560546875, 1.2521209716796875, 1.308746337890625, 1.3653717041015625, 1.4219970703125, 1.4786224365234375, 1.535247802734375, 1.5918731689453125, 1.64849853515625, 1.7051239013671875, 1.761749267578125, 1.8183746337890625, 1.875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 16.0, 19.0, 23.0, 39.0, 63.0, 99.0, 161.0, 247.0, 440.0, 763.0, 1389.0, 2432.0, 4509.0, 9173.0, 19044.0, 45304.0, 142590.0, 2512468.0, 1276869.0, 108832.0, 37382.0, 16242.0, 7622.0, 3742.0, 2093.0, 1023.0, 634.0, 368.0, 247.0, 133.0, 93.0, 72.0, 32.0, 27.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.2421875, -7.98388671875, -7.7255859375, -7.46728515625, -7.208984375, -6.95068359375, -6.6923828125, -6.43408203125, -6.17578125, -5.91748046875, -5.6591796875, -5.40087890625, -5.142578125, -4.88427734375, -4.6259765625, -4.36767578125, -4.109375, -3.85107421875, -3.5927734375, -3.33447265625, -3.076171875, -2.81787109375, -2.5595703125, -2.30126953125, -2.04296875, -1.78466796875, -1.5263671875, -1.26806640625, -1.009765625, -0.75146484375, -0.4931640625, -0.23486328125, 0.0234375, 0.28173828125, 0.5400390625, 0.79833984375, 1.056640625, 1.31494140625, 1.5732421875, 1.83154296875, 2.08984375, 2.34814453125, 2.6064453125, 2.86474609375, 3.123046875, 3.38134765625, 3.6396484375, 3.89794921875, 4.15625, 4.41455078125, 4.6728515625, 4.93115234375, 5.189453125, 5.44775390625, 5.7060546875, 5.96435546875, 6.22265625, 6.48095703125, 6.7392578125, 6.99755859375, 7.255859375, 7.51416015625, 7.7724609375, 8.03076171875, 8.2890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 11.0, 17.0, 23.0, 35.0, 54.0, 47.0, 78.0, 110.0, 160.0, 243.0, 453.0, 862.0, 817.0, 435.0, 243.0, 136.0, 97.0, 68.0, 38.0, 39.0, 22.0, 15.0, 13.0, 10.0, 10.0, 8.0, 5.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.63653564453125, -8.3824462890625, -8.12835693359375, -7.874267578125, -7.62017822265625, -7.3660888671875, -7.11199951171875, -6.85791015625, -6.60382080078125, -6.3497314453125, -6.09564208984375, -5.841552734375, -5.58746337890625, -5.3333740234375, -5.07928466796875, -4.8251953125, -4.57110595703125, -4.3170166015625, -4.06292724609375, -3.808837890625, -3.55474853515625, -3.3006591796875, -3.04656982421875, -2.79248046875, -2.53839111328125, -2.2843017578125, -2.03021240234375, -1.776123046875, -1.52203369140625, -1.2679443359375, -1.01385498046875, -0.759765625, -0.50567626953125, -0.2515869140625, 0.00250244140625, 0.256591796875, 0.51068115234375, 0.7647705078125, 1.01885986328125, 1.27294921875, 1.52703857421875, 1.7811279296875, 2.03521728515625, 2.289306640625, 2.54339599609375, 2.7974853515625, 3.05157470703125, 3.3056640625, 3.55975341796875, 3.8138427734375, 4.06793212890625, 4.322021484375, 4.57611083984375, 4.8302001953125, 5.08428955078125, 5.33837890625, 5.59246826171875, 5.8465576171875, 6.10064697265625, 6.354736328125, 6.60882568359375, 6.8629150390625, 7.11700439453125, 7.37109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 6.0, 16.0, 33.0, 45.0, 83.0, 133.0, 211.0, 333.0, 617.0, 1089.0, 2109.0, 4169.0, 8404.0, 18610.0, 47134.0, 151846.0, 1340661.0, 2332577.0, 189572.0, 56206.0, 21460.0, 9447.0, 4509.0, 2160.0, 1175.0, 659.0, 404.0, 192.0, 148.0, 90.0, 45.0, 40.0, 23.0, 18.0, 18.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.39208984375, -14.9404296875, -14.48876953125, -14.037109375, -13.58544921875, -13.1337890625, -12.68212890625, -12.23046875, -11.77880859375, -11.3271484375, -10.87548828125, -10.423828125, -9.97216796875, -9.5205078125, -9.06884765625, -8.6171875, -8.16552734375, -7.7138671875, -7.26220703125, -6.810546875, -6.35888671875, -5.9072265625, -5.45556640625, -5.00390625, -4.55224609375, -4.1005859375, -3.64892578125, -3.197265625, -2.74560546875, -2.2939453125, -1.84228515625, -1.390625, -0.93896484375, -0.4873046875, -0.03564453125, 0.416015625, 0.86767578125, 1.3193359375, 1.77099609375, 2.22265625, 2.67431640625, 3.1259765625, 3.57763671875, 4.029296875, 4.48095703125, 4.9326171875, 5.38427734375, 5.8359375, 6.28759765625, 6.7392578125, 7.19091796875, 7.642578125, 8.09423828125, 8.5458984375, 8.99755859375, 9.44921875, 9.90087890625, 10.3525390625, 10.80419921875, 11.255859375, 11.70751953125, 12.1591796875, 12.61083984375, 13.0625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 17.0, 30.0, 35.0, 72.0, 139.0, 220.0, 203.0, 116.0, 72.0, 30.0, 33.0, 14.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.809171676635742, -23.043285369873047, -21.27739906311035, -19.511512756347656, -17.745624542236328, -15.97973918914795, -14.213851928710938, -12.447965621948242, -10.682079315185547, -8.916193008422852, -7.150306224822998, -5.3844194412231445, -3.618533134460449, -1.852646827697754, -0.08675956726074219, 1.6791267395019531, 3.4450130462646484, 5.210899353027344, 6.976786136627197, 8.74267292022705, 10.508559226989746, 12.274445533752441, 14.040332794189453, 15.806219100952148, 17.572105407714844, 19.33799171447754, 21.103878021240234, 22.869766235351562, 24.635650634765625, 26.401538848876953, 28.16742515563965, 29.933311462402344, 31.699195861816406, 33.465084075927734, 35.2309684753418, 36.996856689453125, 38.76274108886719, 40.528629302978516, 42.294517517089844, 44.060401916503906, 45.82628631591797, 47.5921745300293, 49.35805892944336, 51.12394714355469, 52.88983154296875, 54.65571975708008, 56.421607971191406, 58.18749237060547, 59.9533805847168, 61.719268798828125, 63.48515319824219, 65.25103759765625, 67.01692962646484, 68.7828140258789, 70.54869842529297, 72.31459045410156, 74.08047485351562, 75.84635925292969, 77.61225128173828, 79.37813568115234, 81.1440200805664, 82.90990447998047, 84.67579650878906, 86.44168090820312, 88.20756530761719]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 8.0, 13.0, 17.0, 15.0, 21.0, 16.0, 21.0, 25.0, 23.0, 26.0, 26.0, 28.0, 35.0, 42.0, 34.0, 34.0, 30.0, 32.0, 43.0, 42.0, 37.0, 24.0, 32.0, 27.0, 30.0, 22.0, 26.0, 21.0, 39.0, 20.0, 20.0, 23.0, 23.0, 20.0, 14.0, 14.0, 8.0, 10.0, 11.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.984928131103516, -18.428075790405273, -17.87122344970703, -17.31437110900879, -16.757518768310547, -16.200666427612305, -15.643814086914062, -15.08696174621582, -14.530109405517578, -13.973257064819336, -13.416404724121094, -12.859552383422852, -12.30270004272461, -11.745847702026367, -11.188995361328125, -10.632143020629883, -10.075289726257324, -9.518437385559082, -8.96158504486084, -8.404732704162598, -7.8478803634643555, -7.291028022766113, -6.734175205230713, -6.177322864532471, -5.6204705238342285, -5.063618183135986, -4.506765842437744, -3.949913263320923, -3.3930609226226807, -2.8362085819244385, -2.279356002807617, -1.722503662109375, -1.1656513214111328, -0.6087989211082458, -0.05194652080535889, 0.5049059391021729, 1.061758279800415, 1.6186106204986572, 2.1754631996154785, 2.7323155403137207, 3.289167881011963, 3.846020221710205, 4.402872562408447, 4.959725379943848, 5.51657772064209, 6.073430061340332, 6.630282402038574, 7.187134742736816, 7.743987083435059, 8.3008394241333, 8.857691764831543, 9.414544105529785, 9.971396446228027, 10.52824878692627, 11.085102081298828, 11.64195442199707, 12.198806762695312, 12.755659103393555, 13.312511444091797, 13.869363784790039, 14.426216125488281, 14.983068466186523, 15.539920806884766, 16.096773147583008, 16.65362548828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 7.0, 7.0, 9.0, 13.0, 13.0, 18.0, 20.0, 25.0, 23.0, 36.0, 28.0, 28.0, 30.0, 47.0, 49.0, 49.0, 50.0, 48.0, 59.0, 60.0, 54.0, 36.0, 38.0, 44.0, 25.0, 21.0, 25.0, 24.0, 27.0, 13.0, 15.0, 12.0, 9.0, 12.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6366424560546875, -1.584808349609375, -1.5329742431640625, -1.48114013671875, -1.4293060302734375, -1.377471923828125, -1.3256378173828125, -1.2738037109375, -1.2219696044921875, -1.170135498046875, -1.1183013916015625, -1.06646728515625, -1.0146331787109375, -0.962799072265625, -0.9109649658203125, -0.859130859375, -0.8072967529296875, -0.755462646484375, -0.7036285400390625, -0.65179443359375, -0.5999603271484375, -0.548126220703125, -0.4962921142578125, -0.4444580078125, -0.3926239013671875, -0.340789794921875, -0.2889556884765625, -0.23712158203125, -0.1852874755859375, -0.133453369140625, -0.0816192626953125, -0.02978515625, 0.0220489501953125, 0.073883056640625, 0.1257171630859375, 0.17755126953125, 0.2293853759765625, 0.281219482421875, 0.3330535888671875, 0.3848876953125, 0.4367218017578125, 0.488555908203125, 0.5403900146484375, 0.59222412109375, 0.6440582275390625, 0.695892333984375, 0.7477264404296875, 0.799560546875, 0.8513946533203125, 0.903228759765625, 0.9550628662109375, 1.00689697265625, 1.0587310791015625, 1.110565185546875, 1.1623992919921875, 1.2142333984375, 1.2660675048828125, 1.317901611328125, 1.3697357177734375, 1.42156982421875, 1.4734039306640625, 1.525238037109375, 1.5770721435546875, 1.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 7.0, 6.0, 9.0, 20.0, 22.0, 45.0, 59.0, 82.0, 120.0, 191.0, 326.0, 494.0, 722.0, 1188.0, 1899.0, 3161.0, 5391.0, 9684.0, 18303.0, 39062.0, 104645.0, 453598.0, 271888.0, 73123.0, 30123.0, 14815.0, 7935.0, 4505.0, 2621.0, 1626.0, 1074.0, 609.0, 421.0, 263.0, 157.0, 95.0, 90.0, 43.0, 29.0, 25.0, 17.0, 13.0, 15.0, 9.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-8.6640625, -8.41534423828125, -8.1666259765625, -7.91790771484375, -7.669189453125, -7.42047119140625, -7.1717529296875, -6.92303466796875, -6.67431640625, -6.42559814453125, -6.1768798828125, -5.92816162109375, -5.679443359375, -5.43072509765625, -5.1820068359375, -4.93328857421875, -4.6845703125, -4.43585205078125, -4.1871337890625, -3.93841552734375, -3.689697265625, -3.44097900390625, -3.1922607421875, -2.94354248046875, -2.69482421875, -2.44610595703125, -2.1973876953125, -1.94866943359375, -1.699951171875, -1.45123291015625, -1.2025146484375, -0.95379638671875, -0.705078125, -0.45635986328125, -0.2076416015625, 0.04107666015625, 0.289794921875, 0.53851318359375, 0.7872314453125, 1.03594970703125, 1.28466796875, 1.53338623046875, 1.7821044921875, 2.03082275390625, 2.279541015625, 2.52825927734375, 2.7769775390625, 3.02569580078125, 3.2744140625, 3.52313232421875, 3.7718505859375, 4.02056884765625, 4.269287109375, 4.51800537109375, 4.7667236328125, 5.01544189453125, 5.26416015625, 5.51287841796875, 5.7615966796875, 6.01031494140625, 6.259033203125, 6.50775146484375, 6.7564697265625, 7.00518798828125, 7.25390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 2.0, 10.0, 12.0, 8.0, 10.0, 16.0, 9.0, 20.0, 33.0, 41.0, 40.0, 41.0, 35.0, 30.0, 51.0, 50.0, 35.0, 1065.0, 46.0, 40.0, 38.0, 48.0, 47.0, 42.0, 34.0, 33.0, 29.0, 35.0, 20.0, 16.0, 21.0, 7.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2813262939453125, -1.239410400390625, -1.1974945068359375, -1.15557861328125, -1.1136627197265625, -1.071746826171875, -1.0298309326171875, -0.9879150390625, -0.9459991455078125, -0.904083251953125, -0.8621673583984375, -0.82025146484375, -0.7783355712890625, -0.736419677734375, -0.6945037841796875, -0.652587890625, -0.6106719970703125, -0.568756103515625, -0.5268402099609375, -0.48492431640625, -0.4430084228515625, -0.401092529296875, -0.3591766357421875, -0.3172607421875, -0.2753448486328125, -0.233428955078125, -0.1915130615234375, -0.14959716796875, -0.1076812744140625, -0.065765380859375, -0.0238494873046875, 0.01806640625, 0.0599822998046875, 0.101898193359375, 0.1438140869140625, 0.18572998046875, 0.2276458740234375, 0.269561767578125, 0.3114776611328125, 0.3533935546875, 0.3953094482421875, 0.437225341796875, 0.4791412353515625, 0.52105712890625, 0.5629730224609375, 0.604888916015625, 0.6468048095703125, 0.688720703125, 0.7306365966796875, 0.772552490234375, 0.8144683837890625, 0.85638427734375, 0.8983001708984375, 0.940216064453125, 0.9821319580078125, 1.0240478515625, 1.0659637451171875, 1.107879638671875, 1.1497955322265625, 1.19171142578125, 1.2336273193359375, 1.275543212890625, 1.3174591064453125, 1.359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 8.0, 16.0, 19.0, 24.0, 43.0, 49.0, 70.0, 83.0, 142.0, 213.0, 274.0, 400.0, 624.0, 880.0, 1410.0, 2124.0, 3360.0, 5928.0, 11335.0, 26321.0, 84356.0, 1206892.0, 629569.0, 73494.0, 24076.0, 10481.0, 5511.0, 3260.0, 2039.0, 1249.0, 861.0, 576.0, 403.0, 279.0, 217.0, 131.0, 98.0, 64.0, 64.0, 43.0, 34.0, 19.0, 17.0, 9.0, 17.0, 3.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.83203125, -5.64361572265625, -5.4552001953125, -5.26678466796875, -5.078369140625, -4.88995361328125, -4.7015380859375, -4.51312255859375, -4.32470703125, -4.13629150390625, -3.9478759765625, -3.75946044921875, -3.571044921875, -3.38262939453125, -3.1942138671875, -3.00579833984375, -2.8173828125, -2.62896728515625, -2.4405517578125, -2.25213623046875, -2.063720703125, -1.87530517578125, -1.6868896484375, -1.49847412109375, -1.31005859375, -1.12164306640625, -0.9332275390625, -0.74481201171875, -0.556396484375, -0.36798095703125, -0.1795654296875, 0.00885009765625, 0.197265625, 0.38568115234375, 0.5740966796875, 0.76251220703125, 0.950927734375, 1.13934326171875, 1.3277587890625, 1.51617431640625, 1.70458984375, 1.89300537109375, 2.0814208984375, 2.26983642578125, 2.458251953125, 2.64666748046875, 2.8350830078125, 3.02349853515625, 3.2119140625, 3.40032958984375, 3.5887451171875, 3.77716064453125, 3.965576171875, 4.15399169921875, 4.3424072265625, 4.53082275390625, 4.71923828125, 4.90765380859375, 5.0960693359375, 5.28448486328125, 5.472900390625, 5.66131591796875, 5.8497314453125, 6.03814697265625, 6.2265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 14.0, 49.0, 182.0, 521.0, 80.0, 27.0, 14.0, 11.0, 10.0, 7.0, 5.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.212493896484375, -3.09881591796875, -2.985137939453125, -2.8714599609375, -2.757781982421875, -2.64410400390625, -2.530426025390625, -2.416748046875, -2.303070068359375, -2.18939208984375, -2.075714111328125, -1.9620361328125, -1.848358154296875, -1.73468017578125, -1.621002197265625, -1.50732421875, -1.393646240234375, -1.27996826171875, -1.166290283203125, -1.0526123046875, -0.938934326171875, -0.82525634765625, -0.711578369140625, -0.597900390625, -0.484222412109375, -0.37054443359375, -0.256866455078125, -0.1431884765625, -0.029510498046875, 0.08416748046875, 0.197845458984375, 0.3115234375, 0.425201416015625, 0.53887939453125, 0.652557373046875, 0.7662353515625, 0.879913330078125, 0.99359130859375, 1.107269287109375, 1.220947265625, 1.334625244140625, 1.44830322265625, 1.561981201171875, 1.6756591796875, 1.789337158203125, 1.90301513671875, 2.016693115234375, 2.13037109375, 2.244049072265625, 2.35772705078125, 2.471405029296875, 2.5850830078125, 2.698760986328125, 2.81243896484375, 2.926116943359375, 3.039794921875, 3.153472900390625, 3.26715087890625, 3.380828857421875, 3.4945068359375, 3.608184814453125, 3.72186279296875, 3.835540771484375, 3.94921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 11.0, 19.0, 22.0, 37.0, 48.0, 103.0, 309.0, 1315.0, 9255.0, 1002341.0, 31241.0, 2921.0, 543.0, 171.0, 65.0, 46.0, 26.0, 20.0, 8.0, 4.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.8125, -53.23388671875, -51.6552734375, -50.07666015625, -48.498046875, -46.91943359375, -45.3408203125, -43.76220703125, -42.18359375, -40.60498046875, -39.0263671875, -37.44775390625, -35.869140625, -34.29052734375, -32.7119140625, -31.13330078125, -29.5546875, -27.97607421875, -26.3974609375, -24.81884765625, -23.240234375, -21.66162109375, -20.0830078125, -18.50439453125, -16.92578125, -15.34716796875, -13.7685546875, -12.18994140625, -10.611328125, -9.03271484375, -7.4541015625, -5.87548828125, -4.296875, -2.71826171875, -1.1396484375, 0.43896484375, 2.017578125, 3.59619140625, 5.1748046875, 6.75341796875, 8.33203125, 9.91064453125, 11.4892578125, 13.06787109375, 14.646484375, 16.22509765625, 17.8037109375, 19.38232421875, 20.9609375, 22.53955078125, 24.1181640625, 25.69677734375, 27.275390625, 28.85400390625, 30.4326171875, 32.01123046875, 33.58984375, 35.16845703125, 36.7470703125, 38.32568359375, 39.904296875, 41.48291015625, 43.0615234375, 44.64013671875, 46.21875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 8.0, 5.0, 17.0, 27.0, 16.0, 46.0, 66.0, 71.0, 139.0, 140.0, 114.0, 94.0, 57.0, 36.0, 29.0, 25.0, 14.0, 17.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6988325119018555, -2.601017475128174, -2.503202438354492, -2.4053874015808105, -2.307572364807129, -2.2097573280334473, -2.1119422912597656, -2.014127492904663, -1.9163124561309814, -1.8184974193572998, -1.7206823825836182, -1.6228673458099365, -1.5250524282455444, -1.4272373914718628, -1.3294223546981812, -1.231607437133789, -1.1337922811508179, -1.0359772443771362, -0.9381622672080994, -0.8403472304344177, -0.7425322532653809, -0.6447172164916992, -0.5469021797180176, -0.4490872025489807, -0.3512721657752991, -0.2534571588039398, -0.15564213693141937, -0.057827115058898926, 0.03998789191246033, 0.13780289888381958, 0.23561793565750122, 0.3334329128265381, 0.4312479496002197, 0.5290629863739014, 0.6268779635429382, 0.7246930003166199, 0.8225079774856567, 0.9203230142593384, 1.01813805103302, 1.115952968597412, 1.2137680053710938, 1.3115830421447754, 1.409398078918457, 1.5072131156921387, 1.6050280332565308, 1.7028430700302124, 1.800658106803894, 1.8984730243682861, 1.9962881803512573, 2.0941030979156494, 2.191918134689331, 2.2897331714630127, 2.3875482082366943, 2.485363245010376, 2.5831782817840576, 2.6809933185577393, 2.778808355331421, 2.8766233921051025, 2.974438428878784, 3.072253465652466, 3.1700685024261475, 3.26788330078125, 3.3656983375549316, 3.4635133743286133, 3.561328411102295]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 10.0, 14.0, 11.0, 13.0, 7.0, 22.0, 28.0, 21.0, 29.0, 31.0, 29.0, 45.0, 46.0, 30.0, 48.0, 40.0, 59.0, 50.0, 44.0, 45.0, 47.0, 36.0, 37.0, 36.0, 25.0, 29.0, 31.0, 28.0, 21.0, 11.0, 14.0, 12.0, 14.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5662386417388916, -2.489405632019043, -2.4125723838806152, -2.3357393741607666, -2.258906364440918, -2.1820731163024902, -2.1052401065826416, -2.028407096862793, -1.9515738487243652, -1.874740719795227, -1.7979077100753784, -1.7210745811462402, -1.644241452217102, -1.5674083232879639, -1.4905753135681152, -1.413742184638977, -1.3369091749191284, -1.2600760459899902, -1.1832430362701416, -1.1064099073410034, -1.0295767784118652, -0.9527437090873718, -0.8759106397628784, -0.7990775108337402, -0.7222444415092468, -0.6454113721847534, -0.5685782432556152, -0.4917451739311218, -0.41491207480430603, -0.33807897567749023, -0.2612459063529968, -0.18441277742385864, -0.10757970809936523, -0.030746616423130035, 0.046086475253105164, 0.12291955947875977, 0.19975265860557556, 0.27658575773239136, 0.35341882705688477, 0.43025195598602295, 0.5070850253105164, 0.5839180946350098, 0.660751223564148, 0.7375842928886414, 0.8144173622131348, 0.891250491142273, 0.9680835604667664, 1.0449166297912598, 1.121749758720398, 1.1985828876495361, 1.2754158973693848, 1.352249026298523, 1.4290821552276611, 1.5059151649475098, 1.582748293876648, 1.6595814228057861, 1.7364144325256348, 1.813247561454773, 1.8900805711746216, 1.9669137001037598, 2.0437467098236084, 2.120579957962036, 2.1974129676818848, 2.2742462158203125, 2.351079225540161]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 10.0, 4.0, 10.0, 15.0, 17.0, 13.0, 19.0, 24.0, 22.0, 27.0, 36.0, 30.0, 35.0, 46.0, 52.0, 38.0, 50.0, 58.0, 52.0, 53.0, 50.0, 42.0, 48.0, 40.0, 29.0, 23.0, 25.0, 22.0, 21.0, 12.0, 16.0, 9.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4736785888671875, -1.421966552734375, -1.3702545166015625, -1.31854248046875, -1.2668304443359375, -1.215118408203125, -1.1634063720703125, -1.1116943359375, -1.0599822998046875, -1.008270263671875, -0.9565582275390625, -0.90484619140625, -0.8531341552734375, -0.801422119140625, -0.7497100830078125, -0.697998046875, -0.6462860107421875, -0.594573974609375, -0.5428619384765625, -0.49114990234375, -0.4394378662109375, -0.387725830078125, -0.3360137939453125, -0.2843017578125, -0.2325897216796875, -0.180877685546875, -0.1291656494140625, -0.07745361328125, -0.0257415771484375, 0.025970458984375, 0.0776824951171875, 0.12939453125, 0.1811065673828125, 0.232818603515625, 0.2845306396484375, 0.33624267578125, 0.3879547119140625, 0.439666748046875, 0.4913787841796875, 0.5430908203125, 0.5948028564453125, 0.646514892578125, 0.6982269287109375, 0.74993896484375, 0.8016510009765625, 0.853363037109375, 0.9050750732421875, 0.956787109375, 1.0084991455078125, 1.060211181640625, 1.1119232177734375, 1.16363525390625, 1.2153472900390625, 1.267059326171875, 1.3187713623046875, 1.3704833984375, 1.4221954345703125, 1.473907470703125, 1.5256195068359375, 1.57733154296875, 1.6290435791015625, 1.680755615234375, 1.7324676513671875, 1.7841796875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 20.0, 21.0, 48.0, 63.0, 101.0, 146.0, 252.0, 426.0, 799.0, 1555.0, 3268.0, 7324.0, 19001.0, 64964.0, 405593.0, 440507.0, 69748.0, 20190.0, 7629.0, 3264.0, 1549.0, 864.0, 469.0, 267.0, 165.0, 108.0, 61.0, 40.0, 32.0, 11.0, 9.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9349365234375, -5.760498046875, -5.5860595703125, -5.41162109375, -5.2371826171875, -5.062744140625, -4.8883056640625, -4.7138671875, -4.5394287109375, -4.364990234375, -4.1905517578125, -4.01611328125, -3.8416748046875, -3.667236328125, -3.4927978515625, -3.318359375, -3.1439208984375, -2.969482421875, -2.7950439453125, -2.62060546875, -2.4461669921875, -2.271728515625, -2.0972900390625, -1.9228515625, -1.7484130859375, -1.573974609375, -1.3995361328125, -1.22509765625, -1.0506591796875, -0.876220703125, -0.7017822265625, -0.52734375, -0.3529052734375, -0.178466796875, -0.0040283203125, 0.17041015625, 0.3448486328125, 0.519287109375, 0.6937255859375, 0.8681640625, 1.0426025390625, 1.217041015625, 1.3914794921875, 1.56591796875, 1.7403564453125, 1.914794921875, 2.0892333984375, 2.263671875, 2.4381103515625, 2.612548828125, 2.7869873046875, 2.96142578125, 3.1358642578125, 3.310302734375, 3.4847412109375, 3.6591796875, 3.8336181640625, 4.008056640625, 4.1824951171875, 4.35693359375, 4.5313720703125, 4.705810546875, 4.8802490234375, 5.0546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 13.0, 10.0, 7.0, 14.0, 14.0, 18.0, 19.0, 23.0, 32.0, 28.0, 31.0, 32.0, 38.0, 57.0, 67.0, 78.0, 131.0, 293.0, 1410.0, 158.0, 88.0, 80.0, 60.0, 39.0, 40.0, 37.0, 37.0, 28.0, 22.0, 22.0, 21.0, 15.0, 14.0, 10.0, 12.0, 7.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.64453125, -6.45556640625, -6.2666015625, -6.07763671875, -5.888671875, -5.69970703125, -5.5107421875, -5.32177734375, -5.1328125, -4.94384765625, -4.7548828125, -4.56591796875, -4.376953125, -4.18798828125, -3.9990234375, -3.81005859375, -3.62109375, -3.43212890625, -3.2431640625, -3.05419921875, -2.865234375, -2.67626953125, -2.4873046875, -2.29833984375, -2.109375, -1.92041015625, -1.7314453125, -1.54248046875, -1.353515625, -1.16455078125, -0.9755859375, -0.78662109375, -0.59765625, -0.40869140625, -0.2197265625, -0.03076171875, 0.158203125, 0.34716796875, 0.5361328125, 0.72509765625, 0.9140625, 1.10302734375, 1.2919921875, 1.48095703125, 1.669921875, 1.85888671875, 2.0478515625, 2.23681640625, 2.42578125, 2.61474609375, 2.8037109375, 2.99267578125, 3.181640625, 3.37060546875, 3.5595703125, 3.74853515625, 3.9375, 4.12646484375, 4.3154296875, 4.50439453125, 4.693359375, 4.88232421875, 5.0712890625, 5.26025390625, 5.44921875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 5.0, 11.0, 19.0, 17.0, 23.0, 31.0, 47.0, 76.0, 105.0, 203.0, 369.0, 755.0, 1600.0, 3776.0, 9398.0, 26711.0, 104771.0, 938916.0, 1853056.0, 150674.0, 35031.0, 11654.0, 4638.0, 1823.0, 874.0, 468.0, 226.0, 148.0, 85.0, 51.0, 29.0, 26.0, 20.0, 9.0, 11.0, 9.0, 8.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.521484375, -7.25390625, -6.986328125, -6.71875, -6.451171875, -6.18359375, -5.916015625, -5.6484375, -5.380859375, -5.11328125, -4.845703125, -4.578125, -4.310546875, -4.04296875, -3.775390625, -3.5078125, -3.240234375, -2.97265625, -2.705078125, -2.4375, -2.169921875, -1.90234375, -1.634765625, -1.3671875, -1.099609375, -0.83203125, -0.564453125, -0.296875, -0.029296875, 0.23828125, 0.505859375, 0.7734375, 1.041015625, 1.30859375, 1.576171875, 1.84375, 2.111328125, 2.37890625, 2.646484375, 2.9140625, 3.181640625, 3.44921875, 3.716796875, 3.984375, 4.251953125, 4.51953125, 4.787109375, 5.0546875, 5.322265625, 5.58984375, 5.857421875, 6.125, 6.392578125, 6.66015625, 6.927734375, 7.1953125, 7.462890625, 7.73046875, 7.998046875, 8.265625, 8.533203125, 8.80078125, 9.068359375, 9.3359375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 10.0, 78.0, 349.0, 436.0, 121.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.652995109558105, -13.462892532348633, -11.272789001464844, -9.082686424255371, -6.892583847045898, -4.702481269836426, -2.5123777389526367, -0.32227516174316406, 1.8678274154663086, 4.057929992675781, 6.248033046722412, 8.438136100769043, 10.628238677978516, 12.818341255187988, 15.008444786071777, 17.19854736328125, 19.388648986816406, 21.578752517700195, 23.76885414123535, 25.95895767211914, 28.149059295654297, 30.339162826538086, 32.529266357421875, 34.71936798095703, 36.90947341918945, 39.09957504272461, 41.28968048095703, 43.47978210449219, 45.669883728027344, 47.8599853515625, 50.05009078979492, 52.24019241333008, 54.43029022216797, 56.620391845703125, 58.81049728393555, 61.0005989074707, 63.19070053100586, 65.38080596923828, 67.57090759277344, 69.7610092163086, 71.95111083984375, 74.1412124633789, 76.33131408691406, 78.52142333984375, 80.7115249633789, 82.90162658691406, 85.09172821044922, 87.28182983398438, 89.47193908691406, 91.66204071044922, 93.85214233398438, 96.04225158691406, 98.23235321044922, 100.42245483398438, 102.61255645751953, 104.80265808105469, 106.99275970458984, 109.182861328125, 111.37296295166016, 113.56306457519531, 115.753173828125, 117.94327545166016, 120.13337707519531, 122.32347869873047, 124.51358032226562]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 15.0, 11.0, 21.0, 12.0, 14.0, 19.0, 24.0, 24.0, 36.0, 36.0, 36.0, 29.0, 35.0, 46.0, 69.0, 31.0, 39.0, 43.0, 43.0, 46.0, 40.0, 45.0, 47.0, 26.0, 17.0, 32.0, 20.0, 25.0, 21.0, 9.0, 11.0, 13.0, 4.0, 10.0, 4.0, 2.0, 6.0, 7.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.92365074157715, -21.245601654052734, -20.56755256652832, -19.889503479003906, -19.21145248413086, -18.533403396606445, -17.85535430908203, -17.177305221557617, -16.499256134033203, -15.821207046508789, -15.143157005310059, -14.465107917785645, -13.787057876586914, -13.1090087890625, -12.430959701538086, -11.752910614013672, -11.074859619140625, -10.396810531616211, -9.71876049041748, -9.040711402893066, -8.362661361694336, -7.684612274169922, -7.006563186645508, -6.3285136222839355, -5.650464057922363, -4.972414493560791, -4.294364929199219, -3.6163158416748047, -2.9382662773132324, -2.26021671295166, -1.582167625427246, -0.9041180610656738, -0.22606849670410156, 0.45198094844818115, 1.1300303936004639, 1.808079719543457, 2.4861292839050293, 3.1641788482666016, 3.8422279357910156, 4.520277500152588, 5.19832706451416, 5.876376628875732, 6.554426193237305, 7.232475280761719, 7.910524845123291, 8.588574409484863, 9.266623497009277, 9.944673538208008, 10.622722625732422, 11.300771713256836, 11.978821754455566, 12.65687084197998, 13.334920883178711, 14.012969970703125, 14.691019058227539, 15.369068145751953, 16.047119140625, 16.725168228149414, 17.403217315673828, 18.081268310546875, 18.75931739807129, 19.437366485595703, 20.115415573120117, 20.79346466064453, 21.471513748168945]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 12.0, 20.0, 18.0, 24.0, 24.0, 27.0, 29.0, 38.0, 28.0, 38.0, 46.0, 52.0, 55.0, 49.0, 55.0, 60.0, 42.0, 41.0, 50.0, 47.0, 49.0, 37.0, 24.0, 18.0, 21.0, 21.0, 9.0, 14.0, 8.0, 5.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.798919677734375, -1.73944091796875, -1.679962158203125, -1.6204833984375, -1.561004638671875, -1.50152587890625, -1.442047119140625, -1.382568359375, -1.323089599609375, -1.26361083984375, -1.204132080078125, -1.1446533203125, -1.085174560546875, -1.02569580078125, -0.966217041015625, -0.90673828125, -0.847259521484375, -0.78778076171875, -0.728302001953125, -0.6688232421875, -0.609344482421875, -0.54986572265625, -0.490386962890625, -0.430908203125, -0.371429443359375, -0.31195068359375, -0.252471923828125, -0.1929931640625, -0.133514404296875, -0.07403564453125, -0.014556884765625, 0.044921875, 0.104400634765625, 0.16387939453125, 0.223358154296875, 0.2828369140625, 0.342315673828125, 0.40179443359375, 0.461273193359375, 0.520751953125, 0.580230712890625, 0.63970947265625, 0.699188232421875, 0.7586669921875, 0.818145751953125, 0.87762451171875, 0.937103271484375, 0.99658203125, 1.056060791015625, 1.11553955078125, 1.175018310546875, 1.2344970703125, 1.293975830078125, 1.35345458984375, 1.412933349609375, 1.472412109375, 1.531890869140625, 1.59136962890625, 1.650848388671875, 1.7103271484375, 1.769805908203125, 1.82928466796875, 1.888763427734375, 1.9482421875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 16.0, 23.0, 23.0, 36.0, 63.0, 129.0, 198.0, 399.0, 863.0, 2439.0, 8102.0, 31760.0, 256106.0, 3760769.0, 106491.0, 18688.0, 5237.0, 1573.0, 620.0, 285.0, 175.0, 103.0, 56.0, 40.0, 17.0, 17.0, 17.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.17431640625, -12.6923828125, -12.21044921875, -11.728515625, -11.24658203125, -10.7646484375, -10.28271484375, -9.80078125, -9.31884765625, -8.8369140625, -8.35498046875, -7.873046875, -7.39111328125, -6.9091796875, -6.42724609375, -5.9453125, -5.46337890625, -4.9814453125, -4.49951171875, -4.017578125, -3.53564453125, -3.0537109375, -2.57177734375, -2.08984375, -1.60791015625, -1.1259765625, -0.64404296875, -0.162109375, 0.31982421875, 0.8017578125, 1.28369140625, 1.765625, 2.24755859375, 2.7294921875, 3.21142578125, 3.693359375, 4.17529296875, 4.6572265625, 5.13916015625, 5.62109375, 6.10302734375, 6.5849609375, 7.06689453125, 7.548828125, 8.03076171875, 8.5126953125, 8.99462890625, 9.4765625, 9.95849609375, 10.4404296875, 10.92236328125, 11.404296875, 11.88623046875, 12.3681640625, 12.85009765625, 13.33203125, 13.81396484375, 14.2958984375, 14.77783203125, 15.259765625, 15.74169921875, 16.2236328125, 16.70556640625, 17.1875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 2.0, 14.0, 16.0, 27.0, 37.0, 43.0, 69.0, 94.0, 142.0, 290.0, 600.0, 1024.0, 822.0, 329.0, 198.0, 104.0, 75.0, 63.0, 28.0, 29.0, 18.0, 11.0, 5.0, 9.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.364013671875, -10.05615234375, -9.748291015625, -9.4404296875, -9.132568359375, -8.82470703125, -8.516845703125, -8.208984375, -7.901123046875, -7.59326171875, -7.285400390625, -6.9775390625, -6.669677734375, -6.36181640625, -6.053955078125, -5.74609375, -5.438232421875, -5.13037109375, -4.822509765625, -4.5146484375, -4.206787109375, -3.89892578125, -3.591064453125, -3.283203125, -2.975341796875, -2.66748046875, -2.359619140625, -2.0517578125, -1.743896484375, -1.43603515625, -1.128173828125, -0.8203125, -0.512451171875, -0.20458984375, 0.103271484375, 0.4111328125, 0.718994140625, 1.02685546875, 1.334716796875, 1.642578125, 1.950439453125, 2.25830078125, 2.566162109375, 2.8740234375, 3.181884765625, 3.48974609375, 3.797607421875, 4.10546875, 4.413330078125, 4.72119140625, 5.029052734375, 5.3369140625, 5.644775390625, 5.95263671875, 6.260498046875, 6.568359375, 6.876220703125, 7.18408203125, 7.491943359375, 7.7998046875, 8.107666015625, 8.41552734375, 8.723388671875, 9.03125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 4.0, 13.0, 12.0, 18.0, 18.0, 32.0, 61.0, 68.0, 129.0, 203.0, 343.0, 579.0, 1065.0, 2054.0, 4148.0, 8872.0, 21268.0, 57608.0, 197488.0, 2362900.0, 1305131.0, 151496.0, 47402.0, 18012.0, 7658.0, 3720.0, 1752.0, 931.0, 496.0, 291.0, 188.0, 105.0, 75.0, 32.0, 25.0, 15.0, 22.0, 10.0, 10.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.2838134765625, -12.880126953125, -12.4764404296875, -12.07275390625, -11.6690673828125, -11.265380859375, -10.8616943359375, -10.4580078125, -10.0543212890625, -9.650634765625, -9.2469482421875, -8.84326171875, -8.4395751953125, -8.035888671875, -7.6322021484375, -7.228515625, -6.8248291015625, -6.421142578125, -6.0174560546875, -5.61376953125, -5.2100830078125, -4.806396484375, -4.4027099609375, -3.9990234375, -3.5953369140625, -3.191650390625, -2.7879638671875, -2.38427734375, -1.9805908203125, -1.576904296875, -1.1732177734375, -0.76953125, -0.3658447265625, 0.037841796875, 0.4415283203125, 0.84521484375, 1.2489013671875, 1.652587890625, 2.0562744140625, 2.4599609375, 2.8636474609375, 3.267333984375, 3.6710205078125, 4.07470703125, 4.4783935546875, 4.882080078125, 5.2857666015625, 5.689453125, 6.0931396484375, 6.496826171875, 6.9005126953125, 7.30419921875, 7.7078857421875, 8.111572265625, 8.5152587890625, 8.9189453125, 9.3226318359375, 9.726318359375, 10.1300048828125, 10.53369140625, 10.9373779296875, 11.341064453125, 11.7447509765625, 12.1484375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 14.0, 32.0, 46.0, 63.0, 100.0, 134.0, 131.0, 141.0, 84.0, 66.0, 52.0, 36.0, 19.0, 14.0, 12.0, 10.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.166698455810547, -28.94232749938965, -27.71795654296875, -26.493587493896484, -25.269216537475586, -24.044845581054688, -22.820476531982422, -21.596105575561523, -20.371734619140625, -19.147363662719727, -17.922992706298828, -16.698623657226562, -15.474252700805664, -14.249881744384766, -13.025511741638184, -11.801141738891602, -10.576770782470703, -9.352399826049805, -8.128029823303223, -6.903659343719482, -5.679288864135742, -4.454918384552002, -3.2305479049682617, -2.0061779022216797, -0.7818069458007812, 0.442563533782959, 1.6669340133666992, 2.8913044929504395, 4.11567497253418, 5.34004545211792, 6.56441593170166, 7.788785934448242, 9.01315689086914, 10.237527847290039, 11.461897850036621, 12.686267852783203, 13.910638809204102, 15.135009765625, 16.359378814697266, 17.583749771118164, 18.808120727539062, 20.03249168395996, 21.25686264038086, 22.481231689453125, 23.705602645874023, 24.929973602294922, 26.154342651367188, 27.378713607788086, 28.603084564208984, 29.827455520629883, 31.05182647705078, 32.27619552612305, 33.50056457519531, 34.724937438964844, 35.94930648803711, 37.173675537109375, 38.398048400878906, 39.62241744995117, 40.8467903137207, 42.07115936279297, 43.2955322265625, 44.519901275634766, 45.74427032470703, 46.96864318847656, 48.19301223754883]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 6.0, 4.0, 17.0, 11.0, 19.0, 19.0, 22.0, 28.0, 21.0, 32.0, 35.0, 35.0, 38.0, 35.0, 51.0, 51.0, 46.0, 49.0, 42.0, 43.0, 43.0, 35.0, 49.0, 30.0, 37.0, 46.0, 34.0, 20.0, 22.0, 10.0, 10.0, 11.0, 11.0, 2.0, 7.0, 4.0, 5.0, 0.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.810224533081055, -19.05238151550293, -18.294538497924805, -17.536697387695312, -16.778854370117188, -16.021011352539062, -15.263168334960938, -14.505325317382812, -13.747483253479004, -12.989640235900879, -12.23179817199707, -11.473955154418945, -10.71611213684082, -9.958270072937012, -9.200427055358887, -8.442584991455078, -7.684741973876953, -6.926899433135986, -6.1690568923950195, -5.4112138748168945, -4.653371334075928, -3.895528793334961, -3.137685775756836, -2.379843235015869, -1.6220006942749023, -0.864158034324646, -0.10631537437438965, 0.6515274047851562, 1.409369945526123, 2.16721248626709, 2.925055503845215, 3.6828980445861816, 4.440740585327148, 5.198583126068115, 5.956425666809082, 6.714268684387207, 7.472111225128174, 8.22995376586914, 8.987796783447266, 9.74563980102539, 10.5034818649292, 11.261324882507324, 12.019166946411133, 12.777009963989258, 13.534852981567383, 14.292695045471191, 15.050538063049316, 15.808380126953125, 16.56622314453125, 17.324066162109375, 18.0819091796875, 18.839752197265625, 19.597593307495117, 20.355436325073242, 21.113279342651367, 21.871122360229492, 22.628963470458984, 23.38680648803711, 24.144649505615234, 24.90249252319336, 25.66033363342285, 26.418176651000977, 27.1760196685791, 27.933862686157227, 28.69170570373535]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 13.0, 6.0, 8.0, 18.0, 17.0, 24.0, 26.0, 26.0, 22.0, 30.0, 30.0, 31.0, 39.0, 43.0, 46.0, 30.0, 58.0, 49.0, 44.0, 41.0, 55.0, 41.0, 44.0, 34.0, 28.0, 28.0, 32.0, 16.0, 21.0, 17.0, 15.0, 12.0, 12.0, 9.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8505859375, -1.7976531982421875, -1.744720458984375, -1.6917877197265625, -1.63885498046875, -1.5859222412109375, -1.532989501953125, -1.4800567626953125, -1.4271240234375, -1.3741912841796875, -1.321258544921875, -1.2683258056640625, -1.21539306640625, -1.1624603271484375, -1.109527587890625, -1.0565948486328125, -1.003662109375, -0.9507293701171875, -0.897796630859375, -0.8448638916015625, -0.79193115234375, -0.7389984130859375, -0.686065673828125, -0.6331329345703125, -0.5802001953125, -0.5272674560546875, -0.474334716796875, -0.4214019775390625, -0.36846923828125, -0.3155364990234375, -0.262603759765625, -0.2096710205078125, -0.15673828125, -0.1038055419921875, -0.050872802734375, 0.0020599365234375, 0.05499267578125, 0.1079254150390625, 0.160858154296875, 0.2137908935546875, 0.2667236328125, 0.3196563720703125, 0.372589111328125, 0.4255218505859375, 0.47845458984375, 0.5313873291015625, 0.584320068359375, 0.6372528076171875, 0.690185546875, 0.7431182861328125, 0.796051025390625, 0.8489837646484375, 0.90191650390625, 0.9548492431640625, 1.007781982421875, 1.0607147216796875, 1.1136474609375, 1.1665802001953125, 1.219512939453125, 1.2724456787109375, 1.32537841796875, 1.3783111572265625, 1.431243896484375, 1.4841766357421875, 1.537109375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 3.0, 6.0, 11.0, 15.0, 29.0, 44.0, 71.0, 88.0, 150.0, 221.0, 446.0, 738.0, 1334.0, 2427.0, 4721.0, 9796.0, 21573.0, 48253.0, 117982.0, 291562.0, 318361.0, 131426.0, 53521.0, 23522.0, 11069.0, 5136.0, 2687.0, 1446.0, 809.0, 416.0, 249.0, 151.0, 87.0, 63.0, 45.0, 39.0, 17.0, 11.0, 10.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.1915283203125, -8.875244140625, -8.5589599609375, -8.24267578125, -7.9263916015625, -7.610107421875, -7.2938232421875, -6.9775390625, -6.6612548828125, -6.344970703125, -6.0286865234375, -5.71240234375, -5.3961181640625, -5.079833984375, -4.7635498046875, -4.447265625, -4.1309814453125, -3.814697265625, -3.4984130859375, -3.18212890625, -2.8658447265625, -2.549560546875, -2.2332763671875, -1.9169921875, -1.6007080078125, -1.284423828125, -0.9681396484375, -0.65185546875, -0.3355712890625, -0.019287109375, 0.2969970703125, 0.61328125, 0.9295654296875, 1.245849609375, 1.5621337890625, 1.87841796875, 2.1947021484375, 2.510986328125, 2.8272705078125, 3.1435546875, 3.4598388671875, 3.776123046875, 4.0924072265625, 4.40869140625, 4.7249755859375, 5.041259765625, 5.3575439453125, 5.673828125, 5.9901123046875, 6.306396484375, 6.6226806640625, 6.93896484375, 7.2552490234375, 7.571533203125, 7.8878173828125, 8.2041015625, 8.5203857421875, 8.836669921875, 9.1529541015625, 9.46923828125, 9.7855224609375, 10.101806640625, 10.4180908203125, 10.734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 7.0, 13.0, 15.0, 13.0, 18.0, 16.0, 17.0, 16.0, 26.0, 32.0, 29.0, 39.0, 43.0, 35.0, 34.0, 48.0, 1063.0, 47.0, 44.0, 38.0, 53.0, 46.0, 29.0, 42.0, 36.0, 33.0, 26.0, 20.0, 33.0, 13.0, 17.0, 9.0, 10.0, 6.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4404296875, -1.3959197998046875, -1.351409912109375, -1.3069000244140625, -1.26239013671875, -1.2178802490234375, -1.173370361328125, -1.1288604736328125, -1.0843505859375, -1.0398406982421875, -0.995330810546875, -0.9508209228515625, -0.90631103515625, -0.8618011474609375, -0.817291259765625, -0.7727813720703125, -0.728271484375, -0.6837615966796875, -0.639251708984375, -0.5947418212890625, -0.55023193359375, -0.5057220458984375, -0.461212158203125, -0.4167022705078125, -0.3721923828125, -0.3276824951171875, -0.283172607421875, -0.2386627197265625, -0.19415283203125, -0.1496429443359375, -0.105133056640625, -0.0606231689453125, -0.01611328125, 0.0283966064453125, 0.072906494140625, 0.1174163818359375, 0.16192626953125, 0.2064361572265625, 0.250946044921875, 0.2954559326171875, 0.3399658203125, 0.3844757080078125, 0.428985595703125, 0.4734954833984375, 0.51800537109375, 0.5625152587890625, 0.607025146484375, 0.6515350341796875, 0.696044921875, 0.7405548095703125, 0.785064697265625, 0.8295745849609375, 0.87408447265625, 0.9185943603515625, 0.963104248046875, 1.0076141357421875, 1.0521240234375, 1.0966339111328125, 1.141143798828125, 1.1856536865234375, 1.23016357421875, 1.2746734619140625, 1.319183349609375, 1.3636932373046875, 1.408203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 7.0, 35.0, 34.0, 44.0, 89.0, 114.0, 227.0, 374.0, 550.0, 1078.0, 1815.0, 3912.0, 9233.0, 30366.0, 170941.0, 1609085.0, 214818.0, 35321.0, 10293.0, 4083.0, 2018.0, 1013.0, 605.0, 398.0, 216.0, 144.0, 82.0, 74.0, 45.0, 20.0, 16.0, 12.0, 19.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.6009521484375, -12.225341796875, -11.8497314453125, -11.47412109375, -11.0985107421875, -10.722900390625, -10.3472900390625, -9.9716796875, -9.5960693359375, -9.220458984375, -8.8448486328125, -8.46923828125, -8.0936279296875, -7.718017578125, -7.3424072265625, -6.966796875, -6.5911865234375, -6.215576171875, -5.8399658203125, -5.46435546875, -5.0887451171875, -4.713134765625, -4.3375244140625, -3.9619140625, -3.5863037109375, -3.210693359375, -2.8350830078125, -2.45947265625, -2.0838623046875, -1.708251953125, -1.3326416015625, -0.95703125, -0.5814208984375, -0.205810546875, 0.1697998046875, 0.54541015625, 0.9210205078125, 1.296630859375, 1.6722412109375, 2.0478515625, 2.4234619140625, 2.799072265625, 3.1746826171875, 3.55029296875, 3.9259033203125, 4.301513671875, 4.6771240234375, 5.052734375, 5.4283447265625, 5.803955078125, 6.1795654296875, 6.55517578125, 6.9307861328125, 7.306396484375, 7.6820068359375, 8.0576171875, 8.4332275390625, 8.808837890625, 9.1844482421875, 9.56005859375, 9.9356689453125, 10.311279296875, 10.6868896484375, 11.0625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 6.0, 3.0, 8.0, 3.0, 10.0, 8.0, 9.0, 23.0, 34.0, 74.0, 94.0, 163.0, 175.0, 155.0, 77.0, 36.0, 27.0, 26.0, 13.0, 9.0, 10.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.265625, -3.16156005859375, -3.0574951171875, -2.95343017578125, -2.849365234375, -2.74530029296875, -2.6412353515625, -2.53717041015625, -2.43310546875, -2.32904052734375, -2.2249755859375, -2.12091064453125, -2.016845703125, -1.91278076171875, -1.8087158203125, -1.70465087890625, -1.6005859375, -1.49652099609375, -1.3924560546875, -1.28839111328125, -1.184326171875, -1.08026123046875, -0.9761962890625, -0.87213134765625, -0.76806640625, -0.66400146484375, -0.5599365234375, -0.45587158203125, -0.351806640625, -0.24774169921875, -0.1436767578125, -0.03961181640625, 0.064453125, 0.16851806640625, 0.2725830078125, 0.37664794921875, 0.480712890625, 0.58477783203125, 0.6888427734375, 0.79290771484375, 0.89697265625, 1.00103759765625, 1.1051025390625, 1.20916748046875, 1.313232421875, 1.41729736328125, 1.5213623046875, 1.62542724609375, 1.7294921875, 1.83355712890625, 1.9376220703125, 2.04168701171875, 2.145751953125, 2.24981689453125, 2.3538818359375, 2.45794677734375, 2.56201171875, 2.66607666015625, 2.7701416015625, 2.87420654296875, 2.978271484375, 3.08233642578125, 3.1864013671875, 3.29046630859375, 3.39453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 4.0, 8.0, 9.0, 12.0, 22.0, 18.0, 45.0, 42.0, 79.0, 154.0, 454.0, 2122.0, 19717.0, 1004554.0, 18438.0, 1969.0, 470.0, 172.0, 77.0, 44.0, 36.0, 28.0, 15.0, 7.0, 9.0, 10.0, 1.0, 4.0, 7.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -49.09716796875, -47.5380859375, -45.97900390625, -44.419921875, -42.86083984375, -41.3017578125, -39.74267578125, -38.18359375, -36.62451171875, -35.0654296875, -33.50634765625, -31.947265625, -30.38818359375, -28.8291015625, -27.27001953125, -25.7109375, -24.15185546875, -22.5927734375, -21.03369140625, -19.474609375, -17.91552734375, -16.3564453125, -14.79736328125, -13.23828125, -11.67919921875, -10.1201171875, -8.56103515625, -7.001953125, -5.44287109375, -3.8837890625, -2.32470703125, -0.765625, 0.79345703125, 2.3525390625, 3.91162109375, 5.470703125, 7.02978515625, 8.5888671875, 10.14794921875, 11.70703125, 13.26611328125, 14.8251953125, 16.38427734375, 17.943359375, 19.50244140625, 21.0615234375, 22.62060546875, 24.1796875, 25.73876953125, 27.2978515625, 28.85693359375, 30.416015625, 31.97509765625, 33.5341796875, 35.09326171875, 36.65234375, 38.21142578125, 39.7705078125, 41.32958984375, 42.888671875, 44.44775390625, 46.0068359375, 47.56591796875, 49.125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 10.0, 44.0, 99.0, 249.0, 350.0, 150.0, 63.0, 25.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.100538730621338, -6.691324710845947, -6.282110691070557, -5.872896194458008, -5.463682174682617, -5.054468154907227, -4.645254135131836, -4.236040115356445, -3.8268260955810547, -3.417612075805664, -3.0083980560302734, -2.5991837978363037, -2.189969778060913, -1.7807557582855225, -1.3715415000915527, -0.9623274803161621, -0.5531134605407715, -0.14389938116073608, 0.2653146982192993, 0.6745288372039795, 1.0837428569793701, 1.4929568767547607, 1.9021711349487305, 2.311385154724121, 2.7205991744995117, 3.1298131942749023, 3.539027214050293, 3.9482414722442627, 4.357455253601074, 4.766669273376465, 5.175883769989014, 5.585097789764404, 5.994312286376953, 6.403526306152344, 6.812740325927734, 7.221954345703125, 7.631168365478516, 8.040382385253906, 8.449596405029297, 8.858810424804688, 9.268024444580078, 9.677238464355469, 10.08645248413086, 10.49566650390625, 10.90488052368164, 11.314094543457031, 11.723308563232422, 12.132522583007812, 12.54173755645752, 12.95095157623291, 13.3601655960083, 13.769379615783691, 14.178593635559082, 14.587807655334473, 14.99702262878418, 15.40623664855957, 15.815450668334961, 16.22466468811035, 16.633878707885742, 17.043092727661133, 17.452306747436523, 17.861520767211914, 18.270734786987305, 18.679948806762695, 19.089162826538086]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 7.0, 3.0, 11.0, 10.0, 9.0, 21.0, 23.0, 23.0, 24.0, 29.0, 25.0, 35.0, 34.0, 48.0, 46.0, 46.0, 43.0, 51.0, 39.0, 53.0, 56.0, 38.0, 43.0, 41.0, 42.0, 22.0, 27.0, 26.0, 18.0, 27.0, 19.0, 15.0, 6.0, 11.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.884923934936523, -4.75705099105835, -4.629178524017334, -4.50130558013916, -4.373432636260986, -4.2455596923828125, -4.117687225341797, -3.989814281463623, -3.8619415760040283, -3.7340688705444336, -3.6061959266662598, -3.478323221206665, -3.3504505157470703, -3.2225775718688965, -3.0947048664093018, -2.966832160949707, -2.838959217071533, -2.7110865116119385, -2.5832135677337646, -2.45534086227417, -2.327467918395996, -2.1995952129364014, -2.0717225074768066, -1.9438496828079224, -1.815976858139038, -1.6881040334701538, -1.5602312088012695, -1.4323585033416748, -1.3044856786727905, -1.1766128540039062, -1.0487401485443115, -0.9208673238754272, -0.7929940223693848, -0.6651211977005005, -0.537248432636261, -0.4093756377696991, -0.2815028429031372, -0.15363001823425293, -0.025757253170013428, 0.10211551189422607, 0.22998833656311035, 0.35786113142967224, 0.48573392629623413, 0.6136066913604736, 0.7414795160293579, 0.8693523406982422, 0.9972251057624817, 1.1250978708267212, 1.2529706954956055, 1.3808435201644897, 1.508716344833374, 1.6365890502929688, 1.764461874961853, 1.8923346996307373, 2.020207405090332, 2.148080348968506, 2.2759530544281006, 2.4038257598876953, 2.531698703765869, 2.659571409225464, 2.7874441146850586, 2.9153170585632324, 3.043189764022827, 3.171062469482422, 3.2989354133605957]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 15.0, 9.0, 9.0, 8.0, 13.0, 9.0, 20.0, 24.0, 25.0, 31.0, 33.0, 31.0, 33.0, 35.0, 40.0, 34.0, 45.0, 45.0, 46.0, 40.0, 46.0, 46.0, 43.0, 37.0, 42.0, 26.0, 39.0, 23.0, 20.0, 26.0, 30.0, 17.0, 19.0, 11.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7112274169921875, -1.657806396484375, -1.6043853759765625, -1.55096435546875, -1.4975433349609375, -1.444122314453125, -1.3907012939453125, -1.3372802734375, -1.2838592529296875, -1.230438232421875, -1.1770172119140625, -1.12359619140625, -1.0701751708984375, -1.016754150390625, -0.9633331298828125, -0.909912109375, -0.8564910888671875, -0.803070068359375, -0.7496490478515625, -0.69622802734375, -0.6428070068359375, -0.589385986328125, -0.5359649658203125, -0.4825439453125, -0.4291229248046875, -0.375701904296875, -0.3222808837890625, -0.26885986328125, -0.2154388427734375, -0.162017822265625, -0.1085968017578125, -0.05517578125, -0.0017547607421875, 0.051666259765625, 0.1050872802734375, 0.15850830078125, 0.2119293212890625, 0.265350341796875, 0.3187713623046875, 0.3721923828125, 0.4256134033203125, 0.479034423828125, 0.5324554443359375, 0.58587646484375, 0.6392974853515625, 0.692718505859375, 0.7461395263671875, 0.799560546875, 0.8529815673828125, 0.906402587890625, 0.9598236083984375, 1.01324462890625, 1.0666656494140625, 1.120086669921875, 1.1735076904296875, 1.2269287109375, 1.2803497314453125, 1.333770751953125, 1.3871917724609375, 1.44061279296875, 1.4940338134765625, 1.547454833984375, 1.6008758544921875, 1.654296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 16.0, 21.0, 27.0, 51.0, 82.0, 111.0, 148.0, 195.0, 341.0, 549.0, 800.0, 1296.0, 2206.0, 4000.0, 8629.0, 32631.0, 586669.0, 369272.0, 24918.0, 7450.0, 3595.0, 2014.0, 1243.0, 735.0, 505.0, 352.0, 205.0, 138.0, 96.0, 62.0, 48.0, 36.0, 27.0, 14.0, 13.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.84765625, -6.64581298828125, -6.4439697265625, -6.24212646484375, -6.040283203125, -5.83843994140625, -5.6365966796875, -5.43475341796875, -5.23291015625, -5.03106689453125, -4.8292236328125, -4.62738037109375, -4.425537109375, -4.22369384765625, -4.0218505859375, -3.82000732421875, -3.6181640625, -3.41632080078125, -3.2144775390625, -3.01263427734375, -2.810791015625, -2.60894775390625, -2.4071044921875, -2.20526123046875, -2.00341796875, -1.80157470703125, -1.5997314453125, -1.39788818359375, -1.196044921875, -0.99420166015625, -0.7923583984375, -0.59051513671875, -0.388671875, -0.18682861328125, 0.0150146484375, 0.21685791015625, 0.418701171875, 0.62054443359375, 0.8223876953125, 1.02423095703125, 1.22607421875, 1.42791748046875, 1.6297607421875, 1.83160400390625, 2.033447265625, 2.23529052734375, 2.4371337890625, 2.63897705078125, 2.8408203125, 3.04266357421875, 3.2445068359375, 3.44635009765625, 3.648193359375, 3.85003662109375, 4.0518798828125, 4.25372314453125, 4.45556640625, 4.65740966796875, 4.8592529296875, 5.06109619140625, 5.262939453125, 5.46478271484375, 5.6666259765625, 5.86846923828125, 6.0703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 4.0, 6.0, 10.0, 15.0, 17.0, 21.0, 13.0, 19.0, 27.0, 29.0, 24.0, 47.0, 27.0, 46.0, 63.0, 73.0, 79.0, 179.0, 1620.0, 158.0, 93.0, 91.0, 62.0, 50.0, 53.0, 31.0, 29.0, 31.0, 24.0, 20.0, 15.0, 12.0, 10.0, 6.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.9140625, -7.6907958984375, -7.467529296875, -7.2442626953125, -7.02099609375, -6.7977294921875, -6.574462890625, -6.3511962890625, -6.1279296875, -5.9046630859375, -5.681396484375, -5.4581298828125, -5.23486328125, -5.0115966796875, -4.788330078125, -4.5650634765625, -4.341796875, -4.1185302734375, -3.895263671875, -3.6719970703125, -3.44873046875, -3.2254638671875, -3.002197265625, -2.7789306640625, -2.5556640625, -2.3323974609375, -2.109130859375, -1.8858642578125, -1.66259765625, -1.4393310546875, -1.216064453125, -0.9927978515625, -0.76953125, -0.5462646484375, -0.322998046875, -0.0997314453125, 0.12353515625, 0.3468017578125, 0.570068359375, 0.7933349609375, 1.0166015625, 1.2398681640625, 1.463134765625, 1.6864013671875, 1.90966796875, 2.1329345703125, 2.356201171875, 2.5794677734375, 2.802734375, 3.0260009765625, 3.249267578125, 3.4725341796875, 3.69580078125, 3.9190673828125, 4.142333984375, 4.3656005859375, 4.5888671875, 4.8121337890625, 5.035400390625, 5.2586669921875, 5.48193359375, 5.7052001953125, 5.928466796875, 6.1517333984375, 6.375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 4.0, 13.0, 24.0, 26.0, 38.0, 50.0, 109.0, 130.0, 293.0, 526.0, 1124.0, 2801.0, 8692.0, 34005.0, 351680.0, 2653148.0, 70702.0, 14561.0, 4482.0, 1711.0, 706.0, 366.0, 188.0, 103.0, 69.0, 50.0, 31.0, 24.0, 16.0, 15.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.0718994140625, -11.628173828125, -11.1844482421875, -10.74072265625, -10.2969970703125, -9.853271484375, -9.4095458984375, -8.9658203125, -8.5220947265625, -8.078369140625, -7.6346435546875, -7.19091796875, -6.7471923828125, -6.303466796875, -5.8597412109375, -5.416015625, -4.9722900390625, -4.528564453125, -4.0848388671875, -3.64111328125, -3.1973876953125, -2.753662109375, -2.3099365234375, -1.8662109375, -1.4224853515625, -0.978759765625, -0.5350341796875, -0.09130859375, 0.3524169921875, 0.796142578125, 1.2398681640625, 1.68359375, 2.1273193359375, 2.571044921875, 3.0147705078125, 3.45849609375, 3.9022216796875, 4.345947265625, 4.7896728515625, 5.2333984375, 5.6771240234375, 6.120849609375, 6.5645751953125, 7.00830078125, 7.4520263671875, 7.895751953125, 8.3394775390625, 8.783203125, 9.2269287109375, 9.670654296875, 10.1143798828125, 10.55810546875, 11.0018310546875, 11.445556640625, 11.8892822265625, 12.3330078125, 12.7767333984375, 13.220458984375, 13.6641845703125, 14.10791015625, 14.5516357421875, 14.995361328125, 15.4390869140625, 15.8828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 76.0, 378.0, 425.0, 101.0, 18.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90983581542969, -50.507896423339844, -48.10595703125, -45.704017639160156, -43.30207824707031, -40.90013885498047, -38.49819564819336, -36.096256256103516, -33.69431686401367, -31.292377471923828, -28.890438079833984, -26.488496780395508, -24.086557388305664, -21.68461799621582, -19.282676696777344, -16.8807373046875, -14.478797912597656, -12.076858520507812, -9.674918174743652, -7.27297830581665, -4.871038436889648, -2.4690990447998047, -0.06715869903564453, 2.3347816467285156, 4.736721038818359, 7.138660907745361, 9.540600776672363, 11.942541122436523, 14.344480514526367, 16.74641990661621, 19.148361206054688, 21.55030059814453, 23.952232360839844, 26.354171752929688, 28.75611114501953, 31.158052444458008, 33.55998992919922, 35.96192932128906, 38.36387252807617, 40.765811920166016, 43.16775131225586, 45.5696907043457, 47.97163009643555, 50.37356948852539, 52.7755126953125, 55.177452087402344, 57.57939147949219, 59.98133087158203, 62.383270263671875, 64.78520965576172, 67.18714904785156, 69.5890884399414, 71.99102783203125, 74.3929672241211, 76.79490661621094, 79.19685363769531, 81.59878540039062, 84.00072479248047, 86.40266418457031, 88.80460357666016, 91.20654296875, 93.60848236083984, 96.01042175292969, 98.41236877441406, 100.8143081665039]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 2.0, 5.0, 13.0, 8.0, 9.0, 22.0, 14.0, 23.0, 17.0, 29.0, 25.0, 31.0, 32.0, 41.0, 38.0, 51.0, 46.0, 41.0, 32.0, 43.0, 51.0, 41.0, 43.0, 37.0, 41.0, 29.0, 30.0, 26.0, 15.0, 26.0, 23.0, 22.0, 17.0, 18.0, 10.0, 13.0, 7.0, 10.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.594375610351562, -19.866798400878906, -19.139219284057617, -18.41164207458496, -17.684064865112305, -16.956485748291016, -16.22890853881836, -15.501331329345703, -14.77375316619873, -14.046175003051758, -13.318597793579102, -12.591019630432129, -11.863441467285156, -11.1358642578125, -10.408286094665527, -9.680707931518555, -8.953130722045898, -8.225552558898926, -7.4979753494262695, -6.770397186279297, -6.042819499969482, -5.315241813659668, -4.587663650512695, -3.860085964202881, -3.1325082778930664, -2.404930591583252, -1.6773526668548584, -0.9497747421264648, -0.2221970558166504, 0.5053806304931641, 1.2329587936401367, 1.9605364799499512, 2.688112258911133, 3.4156899452209473, 4.143267631530762, 4.870845794677734, 5.598423480987549, 6.326001167297363, 7.053579330444336, 7.78115701675415, 8.508734703063965, 9.236312866210938, 9.963890075683594, 10.691468238830566, 11.419046401977539, 12.146623611450195, 12.874201774597168, 13.60177993774414, 14.329357147216797, 15.05693531036377, 15.784512519836426, 16.5120906829834, 17.239667892456055, 17.967247009277344, 18.69482421875, 19.422401428222656, 20.149978637695312, 20.87755584716797, 21.605134963989258, 22.332712173461914, 23.06028938293457, 23.78786849975586, 24.515445709228516, 25.243022918701172, 25.97060203552246]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 6.0, 11.0, 10.0, 11.0, 9.0, 21.0, 15.0, 21.0, 34.0, 20.0, 24.0, 25.0, 34.0, 48.0, 36.0, 34.0, 43.0, 54.0, 39.0, 47.0, 43.0, 49.0, 35.0, 41.0, 29.0, 35.0, 33.0, 21.0, 24.0, 23.0, 21.0, 15.0, 14.0, 8.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.794921875, -1.7416534423828125, -1.688385009765625, -1.6351165771484375, -1.58184814453125, -1.5285797119140625, -1.475311279296875, -1.4220428466796875, -1.3687744140625, -1.3155059814453125, -1.262237548828125, -1.2089691162109375, -1.15570068359375, -1.1024322509765625, -1.049163818359375, -0.9958953857421875, -0.942626953125, -0.8893585205078125, -0.836090087890625, -0.7828216552734375, -0.72955322265625, -0.6762847900390625, -0.623016357421875, -0.5697479248046875, -0.5164794921875, -0.4632110595703125, -0.409942626953125, -0.3566741943359375, -0.30340576171875, -0.2501373291015625, -0.196868896484375, -0.1436004638671875, -0.09033203125, -0.0370635986328125, 0.016204833984375, 0.0694732666015625, 0.12274169921875, 0.1760101318359375, 0.229278564453125, 0.2825469970703125, 0.3358154296875, 0.3890838623046875, 0.442352294921875, 0.4956207275390625, 0.54888916015625, 0.6021575927734375, 0.655426025390625, 0.7086944580078125, 0.761962890625, 0.8152313232421875, 0.868499755859375, 0.9217681884765625, 0.97503662109375, 1.0283050537109375, 1.081573486328125, 1.1348419189453125, 1.1881103515625, 1.2413787841796875, 1.294647216796875, 1.3479156494140625, 1.40118408203125, 1.4544525146484375, 1.507720947265625, 1.5609893798828125, 1.6142578125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 13.0, 11.0, 21.0, 19.0, 18.0, 37.0, 43.0, 84.0, 124.0, 215.0, 304.0, 509.0, 870.0, 1611.0, 2886.0, 5368.0, 11372.0, 25495.0, 68031.0, 295125.0, 3256945.0, 400281.0, 75026.0, 27016.0, 11402.0, 5284.0, 2779.0, 1451.0, 766.0, 437.0, 250.0, 165.0, 103.0, 74.0, 30.0, 37.0, 28.0, 15.0, 14.0, 9.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.27337646484375, -7.0428466796875, -6.81231689453125, -6.581787109375, -6.35125732421875, -6.1207275390625, -5.89019775390625, -5.65966796875, -5.42913818359375, -5.1986083984375, -4.96807861328125, -4.737548828125, -4.50701904296875, -4.2764892578125, -4.04595947265625, -3.8154296875, -3.58489990234375, -3.3543701171875, -3.12384033203125, -2.893310546875, -2.66278076171875, -2.4322509765625, -2.20172119140625, -1.97119140625, -1.74066162109375, -1.5101318359375, -1.27960205078125, -1.049072265625, -0.81854248046875, -0.5880126953125, -0.35748291015625, -0.126953125, 0.10357666015625, 0.3341064453125, 0.56463623046875, 0.795166015625, 1.02569580078125, 1.2562255859375, 1.48675537109375, 1.71728515625, 1.94781494140625, 2.1783447265625, 2.40887451171875, 2.639404296875, 2.86993408203125, 3.1004638671875, 3.33099365234375, 3.5615234375, 3.79205322265625, 4.0225830078125, 4.25311279296875, 4.483642578125, 4.71417236328125, 4.9447021484375, 5.17523193359375, 5.40576171875, 5.63629150390625, 5.8668212890625, 6.09735107421875, 6.327880859375, 6.55841064453125, 6.7889404296875, 7.01947021484375, 7.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 12.0, 16.0, 18.0, 30.0, 41.0, 64.0, 60.0, 95.0, 125.0, 253.0, 458.0, 1021.0, 838.0, 362.0, 207.0, 157.0, 76.0, 69.0, 48.0, 38.0, 23.0, 18.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.78179931640625, -6.4971923828125, -6.21258544921875, -5.927978515625, -5.64337158203125, -5.3587646484375, -5.07415771484375, -4.78955078125, -4.50494384765625, -4.2203369140625, -3.93572998046875, -3.651123046875, -3.36651611328125, -3.0819091796875, -2.79730224609375, -2.5126953125, -2.22808837890625, -1.9434814453125, -1.65887451171875, -1.374267578125, -1.08966064453125, -0.8050537109375, -0.52044677734375, -0.23583984375, 0.04876708984375, 0.3333740234375, 0.61798095703125, 0.902587890625, 1.18719482421875, 1.4718017578125, 1.75640869140625, 2.041015625, 2.32562255859375, 2.6102294921875, 2.89483642578125, 3.179443359375, 3.46405029296875, 3.7486572265625, 4.03326416015625, 4.31787109375, 4.60247802734375, 4.8870849609375, 5.17169189453125, 5.456298828125, 5.74090576171875, 6.0255126953125, 6.31011962890625, 6.5947265625, 6.87933349609375, 7.1639404296875, 7.44854736328125, 7.733154296875, 8.01776123046875, 8.3023681640625, 8.58697509765625, 8.87158203125, 9.15618896484375, 9.4407958984375, 9.72540283203125, 10.010009765625, 10.29461669921875, 10.5792236328125, 10.86383056640625, 11.1484375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 11.0, 12.0, 23.0, 21.0, 26.0, 44.0, 66.0, 122.0, 193.0, 340.0, 598.0, 1199.0, 2514.0, 6167.0, 16359.0, 50694.0, 200574.0, 2786965.0, 950454.0, 123257.0, 34204.0, 11727.0, 4599.0, 1914.0, 929.0, 530.0, 257.0, 156.0, 98.0, 61.0, 51.0, 33.0, 17.0, 13.0, 10.0, 10.0, 7.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.4921875, -15.0474853515625, -14.602783203125, -14.1580810546875, -13.71337890625, -13.2686767578125, -12.823974609375, -12.3792724609375, -11.9345703125, -11.4898681640625, -11.045166015625, -10.6004638671875, -10.15576171875, -9.7110595703125, -9.266357421875, -8.8216552734375, -8.376953125, -7.9322509765625, -7.487548828125, -7.0428466796875, -6.59814453125, -6.1534423828125, -5.708740234375, -5.2640380859375, -4.8193359375, -4.3746337890625, -3.929931640625, -3.4852294921875, -3.04052734375, -2.5958251953125, -2.151123046875, -1.7064208984375, -1.26171875, -0.8170166015625, -0.372314453125, 0.0723876953125, 0.51708984375, 0.9617919921875, 1.406494140625, 1.8511962890625, 2.2958984375, 2.7406005859375, 3.185302734375, 3.6300048828125, 4.07470703125, 4.5194091796875, 4.964111328125, 5.4088134765625, 5.853515625, 6.2982177734375, 6.742919921875, 7.1876220703125, 7.63232421875, 8.0770263671875, 8.521728515625, 8.9664306640625, 9.4111328125, 9.8558349609375, 10.300537109375, 10.7452392578125, 11.18994140625, 11.6346435546875, 12.079345703125, 12.5240478515625, 12.96875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 10.0, 15.0, 19.0, 22.0, 27.0, 38.0, 70.0, 71.0, 103.0, 105.0, 102.0, 96.0, 72.0, 70.0, 36.0, 33.0, 19.0, 25.0, 14.0, 13.0, 6.0, 3.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.627105712890625, -40.634674072265625, -39.64223861694336, -38.649803161621094, -37.657371520996094, -36.664939880371094, -35.67250442504883, -34.68006896972656, -33.68763732910156, -32.69520568847656, -31.702770233154297, -30.710336685180664, -29.71790313720703, -28.7254695892334, -27.733036041259766, -26.740602493286133, -25.7481689453125, -24.755735397338867, -23.763301849365234, -22.7708683013916, -21.77843475341797, -20.786001205444336, -19.793567657470703, -18.80113410949707, -17.808700561523438, -16.816267013549805, -15.823833465576172, -14.831399917602539, -13.838966369628906, -12.846532821655273, -11.85409927368164, -10.861665725708008, -9.869230270385742, -8.87679672241211, -7.884363174438477, -6.891929626464844, -5.899496078491211, -4.907062530517578, -3.9146289825439453, -2.9221954345703125, -1.9297618865966797, -0.9373283386230469, 0.05510520935058594, 1.0475387573242188, 2.0399723052978516, 3.0324058532714844, 4.024839401245117, 5.01727294921875, 6.009706497192383, 7.002140045166016, 7.994573593139648, 8.987007141113281, 9.979440689086914, 10.971874237060547, 11.96430778503418, 12.956741333007812, 13.949174880981445, 14.941608428955078, 15.934041976928711, 16.926475524902344, 17.918909072875977, 18.91134262084961, 19.903776168823242, 20.896209716796875, 21.888643264770508]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 10.0, 10.0, 20.0, 12.0, 17.0, 28.0, 25.0, 21.0, 28.0, 28.0, 36.0, 40.0, 35.0, 36.0, 46.0, 38.0, 41.0, 49.0, 41.0, 41.0, 29.0, 41.0, 41.0, 27.0, 40.0, 15.0, 28.0, 27.0, 27.0, 15.0, 14.0, 14.0, 7.0, 10.0, 10.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.314502716064453, -21.644657135009766, -20.97481346130371, -20.304967880249023, -19.63512420654297, -18.96527862548828, -18.295434951782227, -17.62558937072754, -16.955745697021484, -16.285900115966797, -15.616056442260742, -14.946211814880371, -14.2763671875, -13.606522560119629, -12.936677932739258, -12.26683235168457, -11.5969877243042, -10.927143096923828, -10.257298469543457, -9.587453842163086, -8.917609214782715, -8.247764587402344, -7.5779194831848145, -6.908074855804443, -6.238230228424072, -5.568385601043701, -4.89854097366333, -4.228695869445801, -3.558851480484009, -2.8890068531036377, -2.2191619873046875, -1.5493173599243164, -0.8794727325439453, -0.20962804555892944, 0.4602166414260864, 1.130061388015747, 1.7999060153961182, 2.4697506427764893, 3.1395955085754395, 3.8094401359558105, 4.479284763336182, 5.149129390716553, 5.818974018096924, 6.488819122314453, 7.158663749694824, 7.828508377075195, 8.498353004455566, 9.168197631835938, 9.838042259216309, 10.50788688659668, 11.17773151397705, 11.847576141357422, 12.517420768737793, 13.187265396118164, 13.857110977172852, 14.526954650878906, 15.196800231933594, 15.866644859313965, 16.536489486694336, 17.206335067749023, 17.876178741455078, 18.546024322509766, 19.21586799621582, 19.885713577270508, 20.555557250976562]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 13.0, 19.0, 15.0, 20.0, 18.0, 27.0, 33.0, 30.0, 34.0, 35.0, 46.0, 38.0, 35.0, 60.0, 48.0, 33.0, 42.0, 51.0, 53.0, 40.0, 38.0, 26.0, 33.0, 32.0, 23.0, 24.0, 26.0, 24.0, 11.0, 12.0, 7.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.126953125, -2.0662384033203125, -2.005523681640625, -1.9448089599609375, -1.88409423828125, -1.8233795166015625, -1.762664794921875, -1.7019500732421875, -1.6412353515625, -1.5805206298828125, -1.519805908203125, -1.4590911865234375, -1.39837646484375, -1.3376617431640625, -1.276947021484375, -1.2162322998046875, -1.155517578125, -1.0948028564453125, -1.034088134765625, -0.9733734130859375, -0.91265869140625, -0.8519439697265625, -0.791229248046875, -0.7305145263671875, -0.6697998046875, -0.6090850830078125, -0.548370361328125, -0.4876556396484375, -0.42694091796875, -0.3662261962890625, -0.305511474609375, -0.2447967529296875, -0.18408203125, -0.1233673095703125, -0.062652587890625, -0.0019378662109375, 0.05877685546875, 0.1194915771484375, 0.180206298828125, 0.2409210205078125, 0.3016357421875, 0.3623504638671875, 0.423065185546875, 0.4837799072265625, 0.54449462890625, 0.6052093505859375, 0.665924072265625, 0.7266387939453125, 0.787353515625, 0.8480682373046875, 0.908782958984375, 0.9694976806640625, 1.03021240234375, 1.0909271240234375, 1.151641845703125, 1.2123565673828125, 1.2730712890625, 1.3337860107421875, 1.394500732421875, 1.4552154541015625, 1.51593017578125, 1.5766448974609375, 1.637359619140625, 1.6980743408203125, 1.7587890625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 5.0, 8.0, 14.0, 19.0, 26.0, 40.0, 75.0, 103.0, 164.0, 230.0, 325.0, 557.0, 890.0, 1386.0, 2401.0, 4185.0, 6981.0, 12640.0, 23114.0, 45474.0, 94733.0, 230778.0, 362975.0, 132082.0, 60989.0, 30189.0, 16326.0, 9055.0, 5108.0, 2979.0, 1714.0, 1074.0, 664.0, 399.0, 275.0, 196.0, 129.0, 79.0, 50.0, 36.0, 23.0, 21.0, 12.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3695068359375, -9.059326171875, -8.7491455078125, -8.43896484375, -8.1287841796875, -7.818603515625, -7.5084228515625, -7.1982421875, -6.8880615234375, -6.577880859375, -6.2677001953125, -5.95751953125, -5.6473388671875, -5.337158203125, -5.0269775390625, -4.716796875, -4.4066162109375, -4.096435546875, -3.7862548828125, -3.47607421875, -3.1658935546875, -2.855712890625, -2.5455322265625, -2.2353515625, -1.9251708984375, -1.614990234375, -1.3048095703125, -0.99462890625, -0.6844482421875, -0.374267578125, -0.0640869140625, 0.24609375, 0.5562744140625, 0.866455078125, 1.1766357421875, 1.48681640625, 1.7969970703125, 2.107177734375, 2.4173583984375, 2.7275390625, 3.0377197265625, 3.347900390625, 3.6580810546875, 3.96826171875, 4.2784423828125, 4.588623046875, 4.8988037109375, 5.208984375, 5.5191650390625, 5.829345703125, 6.1395263671875, 6.44970703125, 6.7598876953125, 7.070068359375, 7.3802490234375, 7.6904296875, 8.0006103515625, 8.310791015625, 8.6209716796875, 8.93115234375, 9.2413330078125, 9.551513671875, 9.8616943359375, 10.171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 10.0, 9.0, 11.0, 13.0, 19.0, 23.0, 30.0, 35.0, 28.0, 28.0, 31.0, 41.0, 46.0, 52.0, 51.0, 44.0, 1068.0, 46.0, 48.0, 27.0, 54.0, 29.0, 45.0, 45.0, 27.0, 26.0, 26.0, 19.0, 14.0, 10.0, 15.0, 13.0, 7.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9279937744140625, -1.865753173828125, -1.8035125732421875, -1.74127197265625, -1.6790313720703125, -1.616790771484375, -1.5545501708984375, -1.4923095703125, -1.4300689697265625, -1.367828369140625, -1.3055877685546875, -1.24334716796875, -1.1811065673828125, -1.118865966796875, -1.0566253662109375, -0.994384765625, -0.9321441650390625, -0.869903564453125, -0.8076629638671875, -0.74542236328125, -0.6831817626953125, -0.620941162109375, -0.5587005615234375, -0.4964599609375, -0.4342193603515625, -0.371978759765625, -0.3097381591796875, -0.24749755859375, -0.1852569580078125, -0.123016357421875, -0.0607757568359375, 0.00146484375, 0.0637054443359375, 0.125946044921875, 0.1881866455078125, 0.25042724609375, 0.3126678466796875, 0.374908447265625, 0.4371490478515625, 0.4993896484375, 0.5616302490234375, 0.623870849609375, 0.6861114501953125, 0.74835205078125, 0.8105926513671875, 0.872833251953125, 0.9350738525390625, 0.997314453125, 1.0595550537109375, 1.121795654296875, 1.1840362548828125, 1.24627685546875, 1.3085174560546875, 1.370758056640625, 1.4329986572265625, 1.4952392578125, 1.5574798583984375, 1.619720458984375, 1.6819610595703125, 1.74420166015625, 1.8064422607421875, 1.868682861328125, 1.9309234619140625, 1.9931640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 12.0, 9.0, 18.0, 33.0, 52.0, 83.0, 143.0, 251.0, 360.0, 687.0, 1285.0, 2331.0, 4612.0, 10008.0, 25140.0, 78515.0, 779240.0, 1062726.0, 85201.0, 25904.0, 10361.0, 4815.0, 2409.0, 1183.0, 734.0, 416.0, 251.0, 114.0, 94.0, 46.0, 31.0, 24.0, 12.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.953125, -12.5487060546875, -12.144287109375, -11.7398681640625, -11.33544921875, -10.9310302734375, -10.526611328125, -10.1221923828125, -9.7177734375, -9.3133544921875, -8.908935546875, -8.5045166015625, -8.10009765625, -7.6956787109375, -7.291259765625, -6.8868408203125, -6.482421875, -6.0780029296875, -5.673583984375, -5.2691650390625, -4.86474609375, -4.4603271484375, -4.055908203125, -3.6514892578125, -3.2470703125, -2.8426513671875, -2.438232421875, -2.0338134765625, -1.62939453125, -1.2249755859375, -0.820556640625, -0.4161376953125, -0.01171875, 0.3927001953125, 0.797119140625, 1.2015380859375, 1.60595703125, 2.0103759765625, 2.414794921875, 2.8192138671875, 3.2236328125, 3.6280517578125, 4.032470703125, 4.4368896484375, 4.84130859375, 5.2457275390625, 5.650146484375, 6.0545654296875, 6.458984375, 6.8634033203125, 7.267822265625, 7.6722412109375, 8.07666015625, 8.4810791015625, 8.885498046875, 9.2899169921875, 9.6943359375, 10.0987548828125, 10.503173828125, 10.9075927734375, 11.31201171875, 11.7164306640625, 12.120849609375, 12.5252685546875, 12.9296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 23.0, 27.0, 43.0, 65.0, 199.0, 302.0, 108.0, 65.0, 39.0, 23.0, 12.0, 11.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.54296875, -4.410369873046875, -4.27777099609375, -4.145172119140625, -4.0125732421875, -3.879974365234375, -3.74737548828125, -3.614776611328125, -3.482177734375, -3.349578857421875, -3.21697998046875, -3.084381103515625, -2.9517822265625, -2.819183349609375, -2.68658447265625, -2.553985595703125, -2.42138671875, -2.288787841796875, -2.15618896484375, -2.023590087890625, -1.8909912109375, -1.758392333984375, -1.62579345703125, -1.493194580078125, -1.360595703125, -1.227996826171875, -1.09539794921875, -0.962799072265625, -0.8302001953125, -0.697601318359375, -0.56500244140625, -0.432403564453125, -0.2998046875, -0.167205810546875, -0.03460693359375, 0.097991943359375, 0.2305908203125, 0.363189697265625, 0.49578857421875, 0.628387451171875, 0.760986328125, 0.893585205078125, 1.02618408203125, 1.158782958984375, 1.2913818359375, 1.423980712890625, 1.55657958984375, 1.689178466796875, 1.82177734375, 1.954376220703125, 2.08697509765625, 2.219573974609375, 2.3521728515625, 2.484771728515625, 2.61737060546875, 2.749969482421875, 2.882568359375, 3.015167236328125, 3.14776611328125, 3.280364990234375, 3.4129638671875, 3.545562744140625, 3.67816162109375, 3.810760498046875, 3.943359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 7.0, 16.0, 14.0, 29.0, 30.0, 42.0, 67.0, 133.0, 401.0, 1306.0, 6589.0, 203829.0, 825381.0, 8315.0, 1583.0, 409.0, 136.0, 77.0, 33.0, 31.0, 19.0, 16.0, 14.0, 9.0, 8.0, 6.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.97119140625, -47.2861328125, -45.60107421875, -43.916015625, -42.23095703125, -40.5458984375, -38.86083984375, -37.17578125, -35.49072265625, -33.8056640625, -32.12060546875, -30.435546875, -28.75048828125, -27.0654296875, -25.38037109375, -23.6953125, -22.01025390625, -20.3251953125, -18.64013671875, -16.955078125, -15.27001953125, -13.5849609375, -11.89990234375, -10.21484375, -8.52978515625, -6.8447265625, -5.15966796875, -3.474609375, -1.78955078125, -0.1044921875, 1.58056640625, 3.265625, 4.95068359375, 6.6357421875, 8.32080078125, 10.005859375, 11.69091796875, 13.3759765625, 15.06103515625, 16.74609375, 18.43115234375, 20.1162109375, 21.80126953125, 23.486328125, 25.17138671875, 26.8564453125, 28.54150390625, 30.2265625, 31.91162109375, 33.5966796875, 35.28173828125, 36.966796875, 38.65185546875, 40.3369140625, 42.02197265625, 43.70703125, 45.39208984375, 47.0771484375, 48.76220703125, 50.447265625, 52.13232421875, 53.8173828125, 55.50244140625, 57.1875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 18.0, 59.0, 165.0, 398.0, 257.0, 75.0, 19.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.732600212097168, -5.197275161743164, -4.661950588226318, -4.126626014709473, -3.5913009643554688, -3.055976152420044, -2.520651340484619, -1.9853265285491943, -1.4500017166137695, -0.9146769046783447, -0.3793520927429199, 0.15597271919250488, 0.6912975311279297, 1.2266223430633545, 1.7619471549987793, 2.297271966934204, 2.832596778869629, 3.3679215908050537, 3.9032464027404785, 4.438570976257324, 4.973896026611328, 5.509221076965332, 6.044545650482178, 6.579870223999023, 7.115195274353027, 7.650520324707031, 8.185844421386719, 8.721169471740723, 9.256494522094727, 9.79181957244873, 10.327144622802734, 10.862468719482422, 11.39779281616211, 11.933117866516113, 12.468442916870117, 13.003767013549805, 13.539092063903809, 14.074417114257812, 14.6097412109375, 15.145066261291504, 15.680391311645508, 16.215715408325195, 16.751041412353516, 17.286365509033203, 17.82168960571289, 18.35701560974121, 18.8923397064209, 19.42766571044922, 19.962989807128906, 20.498313903808594, 21.033639907836914, 21.5689640045166, 22.104290008544922, 22.63961410522461, 23.174938201904297, 23.710264205932617, 24.245588302612305, 24.780912399291992, 25.316238403320312, 25.8515625, 26.386886596679688, 26.922212600708008, 27.457536697387695, 27.992862701416016, 28.528186798095703]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 10.0, 4.0, 5.0, 9.0, 8.0, 18.0, 19.0, 22.0, 17.0, 24.0, 30.0, 32.0, 34.0, 44.0, 61.0, 46.0, 53.0, 50.0, 58.0, 49.0, 50.0, 49.0, 39.0, 36.0, 43.0, 48.0, 25.0, 20.0, 24.0, 25.0, 13.0, 14.0, 14.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4067554473876953, -2.2869205474853516, -2.167085886001587, -2.047250986099243, -1.927416205406189, -1.8075814247131348, -1.687746524810791, -1.5679117441177368, -1.4480769634246826, -1.3282421827316284, -1.2084074020385742, -1.0885725021362305, -0.9687377214431763, -0.8489029407501221, -0.7290681004524231, -0.6092332601547241, -0.4893984794616699, -0.36956366896629333, -0.24972885847091675, -0.12989404797554016, -0.010059237480163574, 0.10977554321289062, 0.2296103835105896, 0.3494452238082886, 0.4692800045013428, 0.589114785194397, 0.708949625492096, 0.8287844657897949, 0.9486192464828491, 1.0684540271759033, 1.188288927078247, 1.3081237077713013, 1.4279584884643555, 1.5477932691574097, 1.6676280498504639, 1.7874629497528076, 1.9072977304458618, 2.027132511138916, 2.1469674110412598, 2.2668023109436035, 2.386636972427368, 2.506471872329712, 2.6263065338134766, 2.7461414337158203, 2.865976333618164, 2.9858109951019287, 3.1056458950042725, 3.225480556488037, 3.345315456390381, 3.4651503562927246, 3.5849850177764893, 3.704819917678833, 3.8246545791625977, 3.9444894790649414, 4.064324378967285, 4.184159278869629, 4.303994178771973, 4.423829078674316, 4.54366397857666, 4.663498401641846, 4.7833333015441895, 4.903168201446533, 5.023003101348877, 5.142838001251221, 5.262672424316406]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 12.0, 10.0, 11.0, 17.0, 23.0, 24.0, 29.0, 25.0, 32.0, 30.0, 39.0, 57.0, 39.0, 58.0, 56.0, 46.0, 50.0, 45.0, 53.0, 41.0, 45.0, 33.0, 44.0, 27.0, 27.0, 29.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.17535400390625, -2.1085205078125, -2.04168701171875, -1.974853515625, -1.90802001953125, -1.8411865234375, -1.77435302734375, -1.70751953125, -1.64068603515625, -1.5738525390625, -1.50701904296875, -1.440185546875, -1.37335205078125, -1.3065185546875, -1.23968505859375, -1.1728515625, -1.10601806640625, -1.0391845703125, -0.97235107421875, -0.905517578125, -0.83868408203125, -0.7718505859375, -0.70501708984375, -0.63818359375, -0.57135009765625, -0.5045166015625, -0.43768310546875, -0.370849609375, -0.30401611328125, -0.2371826171875, -0.17034912109375, -0.103515625, -0.03668212890625, 0.0301513671875, 0.09698486328125, 0.163818359375, 0.23065185546875, 0.2974853515625, 0.36431884765625, 0.43115234375, 0.49798583984375, 0.5648193359375, 0.63165283203125, 0.698486328125, 0.76531982421875, 0.8321533203125, 0.89898681640625, 0.9658203125, 1.03265380859375, 1.0994873046875, 1.16632080078125, 1.233154296875, 1.29998779296875, 1.3668212890625, 1.43365478515625, 1.50048828125, 1.56732177734375, 1.6341552734375, 1.70098876953125, 1.767822265625, 1.83465576171875, 1.9014892578125, 1.96832275390625, 2.03515625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 16.0, 14.0, 20.0, 30.0, 33.0, 53.0, 89.0, 126.0, 224.0, 297.0, 479.0, 943.0, 1737.0, 3461.0, 7274.0, 18681.0, 61330.0, 308724.0, 493430.0, 104745.0, 27379.0, 10033.0, 4329.0, 2192.0, 1130.0, 657.0, 388.0, 238.0, 148.0, 96.0, 77.0, 47.0, 34.0, 21.0, 20.0, 16.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.135162353515625, -2.05938720703125, -1.983612060546875, -1.9078369140625, -1.832061767578125, -1.75628662109375, -1.680511474609375, -1.604736328125, -1.528961181640625, -1.45318603515625, -1.377410888671875, -1.3016357421875, -1.225860595703125, -1.15008544921875, -1.074310302734375, -0.99853515625, -0.922760009765625, -0.84698486328125, -0.771209716796875, -0.6954345703125, -0.619659423828125, -0.54388427734375, -0.468109130859375, -0.392333984375, -0.316558837890625, -0.24078369140625, -0.165008544921875, -0.0892333984375, -0.013458251953125, 0.06231689453125, 0.138092041015625, 0.2138671875, 0.289642333984375, 0.36541748046875, 0.441192626953125, 0.5169677734375, 0.592742919921875, 0.66851806640625, 0.744293212890625, 0.820068359375, 0.895843505859375, 0.97161865234375, 1.047393798828125, 1.1231689453125, 1.198944091796875, 1.27471923828125, 1.350494384765625, 1.42626953125, 1.502044677734375, 1.57781982421875, 1.653594970703125, 1.7293701171875, 1.805145263671875, 1.88092041015625, 1.956695556640625, 2.032470703125, 2.108245849609375, 2.18402099609375, 2.259796142578125, 2.3355712890625, 2.411346435546875, 2.48712158203125, 2.562896728515625, 2.638671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 17.0, 14.0, 11.0, 13.0, 22.0, 34.0, 35.0, 27.0, 30.0, 49.0, 37.0, 54.0, 104.0, 481.0, 1569.0, 102.0, 55.0, 53.0, 37.0, 42.0, 43.0, 29.0, 25.0, 25.0, 18.0, 21.0, 21.0, 13.0, 9.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.0390625, -7.79559326171875, -7.5521240234375, -7.30865478515625, -7.065185546875, -6.82171630859375, -6.5782470703125, -6.33477783203125, -6.09130859375, -5.84783935546875, -5.6043701171875, -5.36090087890625, -5.117431640625, -4.87396240234375, -4.6304931640625, -4.38702392578125, -4.1435546875, -3.90008544921875, -3.6566162109375, -3.41314697265625, -3.169677734375, -2.92620849609375, -2.6827392578125, -2.43927001953125, -2.19580078125, -1.95233154296875, -1.7088623046875, -1.46539306640625, -1.221923828125, -0.97845458984375, -0.7349853515625, -0.49151611328125, -0.248046875, -0.00457763671875, 0.2388916015625, 0.48236083984375, 0.725830078125, 0.96929931640625, 1.2127685546875, 1.45623779296875, 1.69970703125, 1.94317626953125, 2.1866455078125, 2.43011474609375, 2.673583984375, 2.91705322265625, 3.1605224609375, 3.40399169921875, 3.6474609375, 3.89093017578125, 4.1343994140625, 4.37786865234375, 4.621337890625, 4.86480712890625, 5.1082763671875, 5.35174560546875, 5.59521484375, 5.83868408203125, 6.0821533203125, 6.32562255859375, 6.569091796875, 6.81256103515625, 7.0560302734375, 7.29949951171875, 7.54296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 10.0, 7.0, 8.0, 19.0, 12.0, 28.0, 22.0, 41.0, 37.0, 67.0, 93.0, 169.0, 352.0, 963.0, 3785.0, 20974.0, 371483.0, 2680276.0, 56846.0, 7645.0, 1760.0, 505.0, 214.0, 96.0, 75.0, 56.0, 40.0, 28.0, 21.0, 10.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.16082763671875, -7.9075927734375, -7.65435791015625, -7.401123046875, -7.14788818359375, -6.8946533203125, -6.64141845703125, -6.38818359375, -6.13494873046875, -5.8817138671875, -5.62847900390625, -5.375244140625, -5.12200927734375, -4.8687744140625, -4.61553955078125, -4.3623046875, -4.10906982421875, -3.8558349609375, -3.60260009765625, -3.349365234375, -3.09613037109375, -2.8428955078125, -2.58966064453125, -2.33642578125, -2.08319091796875, -1.8299560546875, -1.57672119140625, -1.323486328125, -1.07025146484375, -0.8170166015625, -0.56378173828125, -0.310546875, -0.05731201171875, 0.1959228515625, 0.44915771484375, 0.702392578125, 0.95562744140625, 1.2088623046875, 1.46209716796875, 1.71533203125, 1.96856689453125, 2.2218017578125, 2.47503662109375, 2.728271484375, 2.98150634765625, 3.2347412109375, 3.48797607421875, 3.7412109375, 3.99444580078125, 4.2476806640625, 4.50091552734375, 4.754150390625, 5.00738525390625, 5.2606201171875, 5.51385498046875, 5.76708984375, 6.02032470703125, 6.2735595703125, 6.52679443359375, 6.780029296875, 7.03326416015625, 7.2864990234375, 7.53973388671875, 7.79296875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [25.0, 547.0, 427.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.352025032043457, -2.1149377822875977, 0.12214946746826172, 2.359236717224121, 4.5963239669799805, 6.83341121673584, 9.0704984664917, 11.307585716247559, 13.544672966003418, 15.781760215759277, 18.018848419189453, 20.255935668945312, 22.493022918701172, 24.73011016845703, 26.96719741821289, 29.20428466796875, 31.44137191772461, 33.67845916748047, 35.91554641723633, 38.15263366699219, 40.38972091674805, 42.626808166503906, 44.863895416259766, 47.100982666015625, 49.338069915771484, 51.575157165527344, 53.8122444152832, 56.04933166503906, 58.28641891479492, 60.52350616455078, 62.76059341430664, 64.9976806640625, 67.23477172851562, 69.47186279296875, 71.70894622802734, 73.94602966308594, 76.18312072753906, 78.42021179199219, 80.65729522705078, 82.89437866210938, 85.1314697265625, 87.36856079101562, 89.60564422607422, 91.84272766113281, 94.07981872558594, 96.31690979003906, 98.55399322509766, 100.79107666015625, 103.02816772460938, 105.2652587890625, 107.5023422241211, 109.73942565917969, 111.97651672363281, 114.21360778808594, 116.45069122314453, 118.68777465820312, 120.92486572265625, 123.16195678710938, 125.39904022216797, 127.63612365722656, 129.8732147216797, 132.1103057861328, 134.34738159179688, 136.58447265625, 138.82156372070312]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 13.0, 13.0, 18.0, 17.0, 24.0, 24.0, 34.0, 48.0, 36.0, 42.0, 48.0, 44.0, 37.0, 32.0, 34.0, 58.0, 39.0, 34.0, 23.0, 36.0, 38.0, 31.0, 34.0, 28.0, 27.0, 22.0, 17.0, 22.0, 19.0, 17.0, 9.0, 13.0, 8.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.37146759033203, -19.653667449951172, -18.935867309570312, -18.218067169189453, -17.500267028808594, -16.782468795776367, -16.064668655395508, -15.346868515014648, -14.629068374633789, -13.91126823425293, -13.19346809387207, -12.475668907165527, -11.757868766784668, -11.040068626403809, -10.322269439697266, -9.604469299316406, -8.886669158935547, -8.168869018554688, -7.451069355010986, -6.733269691467285, -6.015469551086426, -5.297669410705566, -4.579869747161865, -3.862070083618164, -3.1442699432373047, -2.4264700412750244, -1.7086701393127441, -0.9908702373504639, -0.2730703353881836, 0.4447295665740967, 1.162529468536377, 1.8803291320800781, 2.5981311798095703, 3.3159310817718506, 4.033730983734131, 4.751530647277832, 5.469330787658691, 6.187130928039551, 6.904930591583252, 7.622730255126953, 8.340530395507812, 9.058330535888672, 9.776130676269531, 10.493929862976074, 11.211730003356934, 11.929530143737793, 12.647329330444336, 13.365129470825195, 14.082929611206055, 14.800729751586914, 15.518529891967773, 16.236330032348633, 16.95412826538086, 17.67192840576172, 18.389728546142578, 19.107528686523438, 19.825328826904297, 20.543128967285156, 21.260929107666016, 21.978729248046875, 22.696529388427734, 23.41432762145996, 24.13212776184082, 24.84992790222168, 25.56772804260254]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 17.0, 11.0, 26.0, 32.0, 19.0, 30.0, 28.0, 38.0, 41.0, 32.0, 39.0, 58.0, 49.0, 34.0, 64.0, 56.0, 51.0, 43.0, 38.0, 40.0, 41.0, 32.0, 38.0, 19.0, 17.0, 13.0, 18.0, 7.0, 11.0, 9.0, 3.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.302734375, -2.2364501953125, -2.170166015625, -2.1038818359375, -2.03759765625, -1.9713134765625, -1.905029296875, -1.8387451171875, -1.7724609375, -1.7061767578125, -1.639892578125, -1.5736083984375, -1.50732421875, -1.4410400390625, -1.374755859375, -1.3084716796875, -1.2421875, -1.1759033203125, -1.109619140625, -1.0433349609375, -0.97705078125, -0.9107666015625, -0.844482421875, -0.7781982421875, -0.7119140625, -0.6456298828125, -0.579345703125, -0.5130615234375, -0.44677734375, -0.3804931640625, -0.314208984375, -0.2479248046875, -0.181640625, -0.1153564453125, -0.049072265625, 0.0172119140625, 0.08349609375, 0.1497802734375, 0.216064453125, 0.2823486328125, 0.3486328125, 0.4149169921875, 0.481201171875, 0.5474853515625, 0.61376953125, 0.6800537109375, 0.746337890625, 0.8126220703125, 0.87890625, 0.9451904296875, 1.011474609375, 1.0777587890625, 1.14404296875, 1.2103271484375, 1.276611328125, 1.3428955078125, 1.4091796875, 1.4754638671875, 1.541748046875, 1.6080322265625, 1.67431640625, 1.7406005859375, 1.806884765625, 1.8731689453125, 1.939453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 9.0, 8.0, 10.0, 18.0, 25.0, 42.0, 66.0, 99.0, 115.0, 150.0, 218.0, 335.0, 504.0, 727.0, 1181.0, 1778.0, 2761.0, 4440.0, 7495.0, 12859.0, 22770.0, 44294.0, 103832.0, 626466.0, 2775035.0, 412048.0, 88648.0, 39105.0, 20446.0, 11462.0, 6531.0, 3892.0, 2381.0, 1542.0, 932.0, 605.0, 439.0, 277.0, 225.0, 148.0, 110.0, 89.0, 42.0, 38.0, 23.0, 11.0, 15.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.87890625, -4.72357177734375, -4.5682373046875, -4.41290283203125, -4.257568359375, -4.10223388671875, -3.9468994140625, -3.79156494140625, -3.63623046875, -3.48089599609375, -3.3255615234375, -3.17022705078125, -3.014892578125, -2.85955810546875, -2.7042236328125, -2.54888916015625, -2.3935546875, -2.23822021484375, -2.0828857421875, -1.92755126953125, -1.772216796875, -1.61688232421875, -1.4615478515625, -1.30621337890625, -1.15087890625, -0.99554443359375, -0.8402099609375, -0.68487548828125, -0.529541015625, -0.37420654296875, -0.2188720703125, -0.06353759765625, 0.091796875, 0.24713134765625, 0.4024658203125, 0.55780029296875, 0.713134765625, 0.86846923828125, 1.0238037109375, 1.17913818359375, 1.33447265625, 1.48980712890625, 1.6451416015625, 1.80047607421875, 1.955810546875, 2.11114501953125, 2.2664794921875, 2.42181396484375, 2.5771484375, 2.73248291015625, 2.8878173828125, 3.04315185546875, 3.198486328125, 3.35382080078125, 3.5091552734375, 3.66448974609375, 3.81982421875, 3.97515869140625, 4.1304931640625, 4.28582763671875, 4.441162109375, 4.59649658203125, 4.7518310546875, 4.90716552734375, 5.0625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 14.0, 17.0, 34.0, 45.0, 71.0, 117.0, 173.0, 297.0, 708.0, 1141.0, 655.0, 288.0, 174.0, 100.0, 75.0, 43.0, 32.0, 19.0, 12.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2578125, -10.9488525390625, -10.639892578125, -10.3309326171875, -10.02197265625, -9.7130126953125, -9.404052734375, -9.0950927734375, -8.7861328125, -8.4771728515625, -8.168212890625, -7.8592529296875, -7.55029296875, -7.2413330078125, -6.932373046875, -6.6234130859375, -6.314453125, -6.0054931640625, -5.696533203125, -5.3875732421875, -5.07861328125, -4.7696533203125, -4.460693359375, -4.1517333984375, -3.8427734375, -3.5338134765625, -3.224853515625, -2.9158935546875, -2.60693359375, -2.2979736328125, -1.989013671875, -1.6800537109375, -1.37109375, -1.0621337890625, -0.753173828125, -0.4442138671875, -0.13525390625, 0.1737060546875, 0.482666015625, 0.7916259765625, 1.1005859375, 1.4095458984375, 1.718505859375, 2.0274658203125, 2.33642578125, 2.6453857421875, 2.954345703125, 3.2633056640625, 3.572265625, 3.8812255859375, 4.190185546875, 4.4991455078125, 4.80810546875, 5.1170654296875, 5.426025390625, 5.7349853515625, 6.0439453125, 6.3529052734375, 6.661865234375, 6.9708251953125, 7.27978515625, 7.5887451171875, 7.897705078125, 8.2066650390625, 8.515625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 12.0, 14.0, 13.0, 24.0, 36.0, 23.0, 41.0, 46.0, 72.0, 103.0, 136.0, 175.0, 263.0, 428.0, 745.0, 1329.0, 2720.0, 5510.0, 12774.0, 31928.0, 96561.0, 472135.0, 3078413.0, 357934.0, 82316.0, 28538.0, 11259.0, 5018.0, 2443.0, 1182.0, 710.0, 469.0, 223.0, 179.0, 110.0, 98.0, 60.0, 55.0, 38.0, 29.0, 27.0, 16.0, 12.0, 13.0, 5.0, 8.0, 13.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5625, -10.2154541015625, -9.868408203125, -9.5213623046875, -9.17431640625, -8.8272705078125, -8.480224609375, -8.1331787109375, -7.7861328125, -7.4390869140625, -7.092041015625, -6.7449951171875, -6.39794921875, -6.0509033203125, -5.703857421875, -5.3568115234375, -5.009765625, -4.6627197265625, -4.315673828125, -3.9686279296875, -3.62158203125, -3.2745361328125, -2.927490234375, -2.5804443359375, -2.2333984375, -1.8863525390625, -1.539306640625, -1.1922607421875, -0.84521484375, -0.4981689453125, -0.151123046875, 0.1959228515625, 0.54296875, 0.8900146484375, 1.237060546875, 1.5841064453125, 1.93115234375, 2.2781982421875, 2.625244140625, 2.9722900390625, 3.3193359375, 3.6663818359375, 4.013427734375, 4.3604736328125, 4.70751953125, 5.0545654296875, 5.401611328125, 5.7486572265625, 6.095703125, 6.4427490234375, 6.789794921875, 7.1368408203125, 7.48388671875, 7.8309326171875, 8.177978515625, 8.5250244140625, 8.8720703125, 9.2191162109375, 9.566162109375, 9.9132080078125, 10.26025390625, 10.6072998046875, 10.954345703125, 11.3013916015625, 11.6484375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 10.0, 9.0, 15.0, 24.0, 30.0, 39.0, 44.0, 94.0, 118.0, 160.0, 138.0, 104.0, 72.0, 42.0, 43.0, 26.0, 16.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.158594131469727, -16.842029571533203, -15.525463104248047, -14.208897590637207, -12.892332077026367, -11.575766563415527, -10.259201049804688, -8.942635536193848, -7.626070022583008, -6.309504508972168, -4.992938995361328, -3.6763734817504883, -2.3598079681396484, -1.0432424545288086, 0.27332305908203125, 1.589888572692871, 2.906454086303711, 4.223019599914551, 5.539585113525391, 6.8561506271362305, 8.17271614074707, 9.48928165435791, 10.80584716796875, 12.12241268157959, 13.43897819519043, 14.75554370880127, 16.07210922241211, 17.388675689697266, 18.70524024963379, 20.021804809570312, 21.33837127685547, 22.654937744140625, 23.97150421142578, 25.288070678710938, 26.60463523864746, 27.921199798583984, 29.23776626586914, 30.554332733154297, 31.87089729309082, 33.187461853027344, 34.5040283203125, 35.820594787597656, 37.13716125488281, 38.4537239074707, 39.77029037475586, 41.086856842041016, 42.403419494628906, 43.71998596191406, 45.03655242919922, 46.353118896484375, 47.66968536376953, 48.98624801635742, 50.30281448364258, 51.619380950927734, 52.935943603515625, 54.25251007080078, 55.56907653808594, 56.885643005371094, 58.20220947265625, 59.51877212524414, 60.8353385925293, 62.15190505981445, 63.468467712402344, 64.7850341796875, 66.10160064697266]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 1.0, 5.0, 6.0, 2.0, 10.0, 8.0, 7.0, 22.0, 28.0, 14.0, 22.0, 19.0, 31.0, 35.0, 39.0, 36.0, 38.0, 29.0, 29.0, 37.0, 36.0, 44.0, 49.0, 33.0, 44.0, 32.0, 37.0, 25.0, 34.0, 26.0, 29.0, 22.0, 30.0, 14.0, 12.0, 16.0, 17.0, 9.0, 10.0, 12.0, 10.0, 9.0, 6.0, 5.0, 6.0, 6.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.290016174316406, -17.674758911132812, -17.059499740600586, -16.444242477416992, -15.828984260559082, -15.213726043701172, -14.598468780517578, -13.983210563659668, -13.367952346801758, -12.752694129943848, -12.137436866760254, -11.522178649902344, -10.906920433044434, -10.291662216186523, -9.67640495300293, -9.06114673614502, -8.445889472961426, -7.830631732940674, -7.215373516082764, -6.600115776062012, -5.984857559204102, -5.36959981918335, -4.754342079162598, -4.1390838623046875, -3.5238261222839355, -2.9085681438446045, -2.2933101654052734, -1.6780524253845215, -1.0627944469451904, -0.4475364685058594, 0.16772127151489258, 0.7829794883728027, 1.3982372283935547, 2.0134952068328857, 2.628753185272217, 3.2440109252929688, 3.8592689037323, 4.474526882171631, 5.089784622192383, 5.705042839050293, 6.320300579071045, 6.935558319091797, 7.550816535949707, 8.166074752807617, 8.781332015991211, 9.396590232849121, 10.011848449707031, 10.627105712890625, 11.242363929748535, 11.857622146606445, 12.472879409790039, 13.08813762664795, 13.70339584350586, 14.318653106689453, 14.933911323547363, 15.549169540405273, 16.164426803588867, 16.77968406677246, 17.394943237304688, 18.01020050048828, 18.625457763671875, 19.2407169342041, 19.855974197387695, 20.471233367919922, 21.086490631103516]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 19.0, 17.0, 19.0, 20.0, 23.0, 21.0, 33.0, 29.0, 43.0, 38.0, 39.0, 42.0, 47.0, 48.0, 44.0, 57.0, 49.0, 36.0, 46.0, 50.0, 34.0, 29.0, 29.0, 34.0, 28.0, 21.0, 17.0, 15.0, 18.0, 14.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.6990509033203125, -1.633453369140625, -1.5678558349609375, -1.50225830078125, -1.4366607666015625, -1.371063232421875, -1.3054656982421875, -1.2398681640625, -1.1742706298828125, -1.108673095703125, -1.0430755615234375, -0.97747802734375, -0.9118804931640625, -0.846282958984375, -0.7806854248046875, -0.715087890625, -0.6494903564453125, -0.583892822265625, -0.5182952880859375, -0.45269775390625, -0.3871002197265625, -0.321502685546875, -0.2559051513671875, -0.1903076171875, -0.1247100830078125, -0.059112548828125, 0.0064849853515625, 0.07208251953125, 0.1376800537109375, 0.203277587890625, 0.2688751220703125, 0.33447265625, 0.4000701904296875, 0.465667724609375, 0.5312652587890625, 0.59686279296875, 0.6624603271484375, 0.728057861328125, 0.7936553955078125, 0.8592529296875, 0.9248504638671875, 0.990447998046875, 1.0560455322265625, 1.12164306640625, 1.1872406005859375, 1.252838134765625, 1.3184356689453125, 1.384033203125, 1.4496307373046875, 1.515228271484375, 1.5808258056640625, 1.64642333984375, 1.7120208740234375, 1.777618408203125, 1.8432159423828125, 1.9088134765625, 1.9744110107421875, 2.040008544921875, 2.1056060791015625, 2.17120361328125, 2.2368011474609375, 2.302398681640625, 2.3679962158203125, 2.43359375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 9.0, 18.0, 22.0, 32.0, 32.0, 83.0, 110.0, 175.0, 240.0, 455.0, 601.0, 1092.0, 1709.0, 3130.0, 5302.0, 9713.0, 18598.0, 37554.0, 83641.0, 210482.0, 371410.0, 167647.0, 68728.0, 31721.0, 16166.0, 8395.0, 4635.0, 2703.0, 1528.0, 965.0, 588.0, 401.0, 201.0, 150.0, 99.0, 65.0, 57.0, 20.0, 24.0, 14.0, 15.0, 4.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6484375, -8.34375, -8.0390625, -7.734375, -7.4296875, -7.125, -6.8203125, -6.515625, -6.2109375, -5.90625, -5.6015625, -5.296875, -4.9921875, -4.6875, -4.3828125, -4.078125, -3.7734375, -3.46875, -3.1640625, -2.859375, -2.5546875, -2.25, -1.9453125, -1.640625, -1.3359375, -1.03125, -0.7265625, -0.421875, -0.1171875, 0.1875, 0.4921875, 0.796875, 1.1015625, 1.40625, 1.7109375, 2.015625, 2.3203125, 2.625, 2.9296875, 3.234375, 3.5390625, 3.84375, 4.1484375, 4.453125, 4.7578125, 5.0625, 5.3671875, 5.671875, 5.9765625, 6.28125, 6.5859375, 6.890625, 7.1953125, 7.5, 7.8046875, 8.109375, 8.4140625, 8.71875, 9.0234375, 9.328125, 9.6328125, 9.9375, 10.2421875, 10.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 7.0, 8.0, 12.0, 16.0, 19.0, 24.0, 21.0, 21.0, 30.0, 35.0, 37.0, 36.0, 49.0, 50.0, 42.0, 54.0, 1076.0, 46.0, 42.0, 52.0, 47.0, 49.0, 36.0, 37.0, 28.0, 22.0, 20.0, 17.0, 20.0, 13.0, 17.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08984375, -2.025390625, -1.9609375, -1.896484375, -1.83203125, -1.767578125, -1.703125, -1.638671875, -1.57421875, -1.509765625, -1.4453125, -1.380859375, -1.31640625, -1.251953125, -1.1875, -1.123046875, -1.05859375, -0.994140625, -0.9296875, -0.865234375, -0.80078125, -0.736328125, -0.671875, -0.607421875, -0.54296875, -0.478515625, -0.4140625, -0.349609375, -0.28515625, -0.220703125, -0.15625, -0.091796875, -0.02734375, 0.037109375, 0.1015625, 0.166015625, 0.23046875, 0.294921875, 0.359375, 0.423828125, 0.48828125, 0.552734375, 0.6171875, 0.681640625, 0.74609375, 0.810546875, 0.875, 0.939453125, 1.00390625, 1.068359375, 1.1328125, 1.197265625, 1.26171875, 1.326171875, 1.390625, 1.455078125, 1.51953125, 1.583984375, 1.6484375, 1.712890625, 1.77734375, 1.841796875, 1.90625, 1.970703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 15.0, 11.0, 39.0, 30.0, 52.0, 107.0, 154.0, 280.0, 399.0, 677.0, 1158.0, 2551.0, 5547.0, 14616.0, 52972.0, 1054775.0, 886692.0, 51394.0, 14457.0, 5503.0, 2576.0, 1287.0, 691.0, 423.0, 225.0, 169.0, 107.0, 73.0, 40.0, 27.0, 14.0, 14.0, 6.0, 9.0, 1.0, 8.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.359619140625, -18.73486328125, -18.110107421875, -17.4853515625, -16.860595703125, -16.23583984375, -15.611083984375, -14.986328125, -14.361572265625, -13.73681640625, -13.112060546875, -12.4873046875, -11.862548828125, -11.23779296875, -10.613037109375, -9.98828125, -9.363525390625, -8.73876953125, -8.114013671875, -7.4892578125, -6.864501953125, -6.23974609375, -5.614990234375, -4.990234375, -4.365478515625, -3.74072265625, -3.115966796875, -2.4912109375, -1.866455078125, -1.24169921875, -0.616943359375, 0.0078125, 0.632568359375, 1.25732421875, 1.882080078125, 2.5068359375, 3.131591796875, 3.75634765625, 4.381103515625, 5.005859375, 5.630615234375, 6.25537109375, 6.880126953125, 7.5048828125, 8.129638671875, 8.75439453125, 9.379150390625, 10.00390625, 10.628662109375, 11.25341796875, 11.878173828125, 12.5029296875, 13.127685546875, 13.75244140625, 14.377197265625, 15.001953125, 15.626708984375, 16.25146484375, 16.876220703125, 17.5009765625, 18.125732421875, 18.75048828125, 19.375244140625, 20.0]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 27.0, 33.0, 66.0, 94.0, 208.0, 224.0, 114.0, 55.0, 41.0, 21.0, 15.0, 10.0, 11.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.415283203125, -4.25244140625, -4.089599609375, -3.9267578125, -3.763916015625, -3.60107421875, -3.438232421875, -3.275390625, -3.112548828125, -2.94970703125, -2.786865234375, -2.6240234375, -2.461181640625, -2.29833984375, -2.135498046875, -1.97265625, -1.809814453125, -1.64697265625, -1.484130859375, -1.3212890625, -1.158447265625, -0.99560546875, -0.832763671875, -0.669921875, -0.507080078125, -0.34423828125, -0.181396484375, -0.0185546875, 0.144287109375, 0.30712890625, 0.469970703125, 0.6328125, 0.795654296875, 0.95849609375, 1.121337890625, 1.2841796875, 1.447021484375, 1.60986328125, 1.772705078125, 1.935546875, 2.098388671875, 2.26123046875, 2.424072265625, 2.5869140625, 2.749755859375, 2.91259765625, 3.075439453125, 3.23828125, 3.401123046875, 3.56396484375, 3.726806640625, 3.8896484375, 4.052490234375, 4.21533203125, 4.378173828125, 4.541015625, 4.703857421875, 4.86669921875, 5.029541015625, 5.1923828125, 5.355224609375, 5.51806640625, 5.680908203125, 5.84375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 7.0, 8.0, 14.0, 9.0, 22.0, 37.0, 55.0, 89.0, 208.0, 703.0, 4402.0, 356710.0, 680264.0, 4748.0, 733.0, 240.0, 112.0, 57.0, 34.0, 29.0, 14.0, 14.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.8125, -84.40234375, -81.9921875, -79.58203125, -77.171875, -74.76171875, -72.3515625, -69.94140625, -67.53125, -65.12109375, -62.7109375, -60.30078125, -57.890625, -55.48046875, -53.0703125, -50.66015625, -48.25, -45.83984375, -43.4296875, -41.01953125, -38.609375, -36.19921875, -33.7890625, -31.37890625, -28.96875, -26.55859375, -24.1484375, -21.73828125, -19.328125, -16.91796875, -14.5078125, -12.09765625, -9.6875, -7.27734375, -4.8671875, -2.45703125, -0.046875, 2.36328125, 4.7734375, 7.18359375, 9.59375, 12.00390625, 14.4140625, 16.82421875, 19.234375, 21.64453125, 24.0546875, 26.46484375, 28.875, 31.28515625, 33.6953125, 36.10546875, 38.515625, 40.92578125, 43.3359375, 45.74609375, 48.15625, 50.56640625, 52.9765625, 55.38671875, 57.796875, 60.20703125, 62.6171875, 65.02734375, 67.4375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 17.0, 55.0, 133.0, 351.0, 290.0, 101.0, 35.0, 17.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.813743591308594, -8.370620727539062, -7.927497863769531, -7.484375, -7.041252613067627, -6.598129749298096, -6.1550068855285645, -5.711884498596191, -5.26876163482666, -4.825638771057129, -4.382515907287598, -3.9393932819366455, -3.4962706565856934, -3.053147792816162, -2.610024929046631, -2.1669023036956787, -1.7237792015075684, -1.2806564569473267, -0.8375336527824402, -0.3944108486175537, 0.04871189594268799, 0.4918346405029297, 0.9349575042724609, 1.378080129623413, 1.8212029933929443, 2.2643258571624756, 2.7074484825134277, 3.150571346282959, 3.5936942100524902, 4.036816596984863, 4.4799394607543945, 4.923062324523926, 5.366185188293457, 5.809308052062988, 6.2524309158325195, 6.695553779602051, 7.138676166534424, 7.581799030303955, 8.024921417236328, 8.46804428100586, 8.91116714477539, 9.354290008544922, 9.797412872314453, 10.240535736083984, 10.683658599853516, 11.126781463623047, 11.569904327392578, 12.013026237487793, 12.45615005493164, 12.899272918701172, 13.342395782470703, 13.785518646240234, 14.228641510009766, 14.671764373779297, 15.114887237548828, 15.558009147644043, 16.001131057739258, 16.44425392150879, 16.88737678527832, 17.33049964904785, 17.773622512817383, 18.216745376586914, 18.659868240356445, 19.102991104125977, 19.546113967895508]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 23.0, 21.0, 37.0, 42.0, 46.0, 58.0, 56.0, 62.0, 71.0, 71.0, 65.0, 60.0, 57.0, 61.0, 53.0, 40.0, 34.0, 23.0, 34.0, 20.0, 21.0, 15.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7889270782470703, -3.6258251667022705, -3.4627232551574707, -3.299621343612671, -3.136519432067871, -2.973417282104492, -2.8103153705596924, -2.6472134590148926, -2.4841115474700928, -2.321009635925293, -2.157907724380493, -1.9948056936264038, -1.831703782081604, -1.6686018705368042, -1.5054998397827148, -1.342397928237915, -1.1792960166931152, -1.0161941051483154, -0.8530921339988708, -0.6899901628494263, -0.5268882513046265, -0.36378633975982666, -0.20068436861038208, -0.0375823974609375, 0.1255195140838623, 0.2886214554309845, 0.4517233967781067, 0.6148253679275513, 0.7779272794723511, 0.9410291910171509, 1.1041312217712402, 1.26723313331604, 1.4303350448608398, 1.5934369564056396, 1.7565388679504395, 1.9196408987045288, 2.082742691040039, 2.245844841003418, 2.4089467525482178, 2.5720486640930176, 2.7351505756378174, 2.898252487182617, 3.061354398727417, 3.224456310272217, 3.3875584602355957, 3.5506601333618164, 3.7137622833251953, 3.876864194869995, 4.039966106414795, 4.203068256378174, 4.3661699295043945, 4.529272079467773, 4.692373752593994, 4.855475902557373, 5.018577575683594, 5.181679725646973, 5.344781875610352, 5.5078840255737305, 5.670985698699951, 5.83408784866333, 5.997189521789551, 6.16029167175293, 6.32339334487915, 6.486495494842529, 6.64959716796875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 15.0, 23.0, 33.0, 34.0, 26.0, 39.0, 43.0, 54.0, 61.0, 55.0, 54.0, 55.0, 73.0, 57.0, 49.0, 53.0, 44.0, 38.0, 35.0, 34.0, 26.0, 26.0, 15.0, 10.0, 11.0, 8.0, 5.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24273681640625, -2.1593017578125, -2.07586669921875, -1.992431640625, -1.90899658203125, -1.8255615234375, -1.74212646484375, -1.65869140625, -1.57525634765625, -1.4918212890625, -1.40838623046875, -1.324951171875, -1.24151611328125, -1.1580810546875, -1.07464599609375, -0.9912109375, -0.90777587890625, -0.8243408203125, -0.74090576171875, -0.657470703125, -0.57403564453125, -0.4906005859375, -0.40716552734375, -0.32373046875, -0.24029541015625, -0.1568603515625, -0.07342529296875, 0.010009765625, 0.09344482421875, 0.1768798828125, 0.26031494140625, 0.34375, 0.42718505859375, 0.5106201171875, 0.59405517578125, 0.677490234375, 0.76092529296875, 0.8443603515625, 0.92779541015625, 1.01123046875, 1.09466552734375, 1.1781005859375, 1.26153564453125, 1.344970703125, 1.42840576171875, 1.5118408203125, 1.59527587890625, 1.6787109375, 1.76214599609375, 1.8455810546875, 1.92901611328125, 2.012451171875, 2.09588623046875, 2.1793212890625, 2.26275634765625, 2.34619140625, 2.42962646484375, 2.5130615234375, 2.59649658203125, 2.679931640625, 2.76336669921875, 2.8468017578125, 2.93023681640625, 3.013671875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 9.0, 8.0, 13.0, 9.0, 18.0, 21.0, 43.0, 54.0, 82.0, 96.0, 154.0, 241.0, 305.0, 459.0, 737.0, 989.0, 1544.0, 2397.0, 4013.0, 6952.0, 14391.0, 58775.0, 695115.0, 214136.0, 24401.0, 9550.0, 5023.0, 3097.0, 1993.0, 1366.0, 790.0, 522.0, 348.0, 251.0, 200.0, 117.0, 87.0, 62.0, 48.0, 51.0, 22.0, 16.0, 14.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.29315185546875, -4.1488037109375, -4.00445556640625, -3.860107421875, -3.71575927734375, -3.5714111328125, -3.42706298828125, -3.28271484375, -3.13836669921875, -2.9940185546875, -2.84967041015625, -2.705322265625, -2.56097412109375, -2.4166259765625, -2.27227783203125, -2.1279296875, -1.98358154296875, -1.8392333984375, -1.69488525390625, -1.550537109375, -1.40618896484375, -1.2618408203125, -1.11749267578125, -0.97314453125, -0.82879638671875, -0.6844482421875, -0.54010009765625, -0.395751953125, -0.25140380859375, -0.1070556640625, 0.03729248046875, 0.181640625, 0.32598876953125, 0.4703369140625, 0.61468505859375, 0.759033203125, 0.90338134765625, 1.0477294921875, 1.19207763671875, 1.33642578125, 1.48077392578125, 1.6251220703125, 1.76947021484375, 1.913818359375, 2.05816650390625, 2.2025146484375, 2.34686279296875, 2.4912109375, 2.63555908203125, 2.7799072265625, 2.92425537109375, 3.068603515625, 3.21295166015625, 3.3572998046875, 3.50164794921875, 3.64599609375, 3.79034423828125, 3.9346923828125, 4.07904052734375, 4.223388671875, 4.36773681640625, 4.5120849609375, 4.65643310546875, 4.80078125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 9.0, 11.0, 11.0, 20.0, 16.0, 16.0, 33.0, 20.0, 34.0, 43.0, 30.0, 39.0, 35.0, 47.0, 46.0, 103.0, 249.0, 1549.0, 211.0, 91.0, 57.0, 43.0, 52.0, 44.0, 30.0, 28.0, 23.0, 26.0, 17.0, 10.0, 13.0, 13.0, 13.0, 12.0, 6.0, 4.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.84375, -5.6307373046875, -5.417724609375, -5.2047119140625, -4.99169921875, -4.7786865234375, -4.565673828125, -4.3526611328125, -4.1396484375, -3.9266357421875, -3.713623046875, -3.5006103515625, -3.28759765625, -3.0745849609375, -2.861572265625, -2.6485595703125, -2.435546875, -2.2225341796875, -2.009521484375, -1.7965087890625, -1.58349609375, -1.3704833984375, -1.157470703125, -0.9444580078125, -0.7314453125, -0.5184326171875, -0.305419921875, -0.0924072265625, 0.12060546875, 0.3336181640625, 0.546630859375, 0.7596435546875, 0.97265625, 1.1856689453125, 1.398681640625, 1.6116943359375, 1.82470703125, 2.0377197265625, 2.250732421875, 2.4637451171875, 2.6767578125, 2.8897705078125, 3.102783203125, 3.3157958984375, 3.52880859375, 3.7418212890625, 3.954833984375, 4.1678466796875, 4.380859375, 4.5938720703125, 4.806884765625, 5.0198974609375, 5.23291015625, 5.4459228515625, 5.658935546875, 5.8719482421875, 6.0849609375, 6.2979736328125, 6.510986328125, 6.7239990234375, 6.93701171875, 7.1500244140625, 7.363037109375, 7.5760498046875, 7.7890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 11.0, 4.0, 7.0, 10.0, 12.0, 20.0, 20.0, 26.0, 45.0, 72.0, 101.0, 159.0, 296.0, 543.0, 985.0, 1948.0, 4352.0, 12097.0, 53617.0, 2012978.0, 1000333.0, 40026.0, 10216.0, 4013.0, 1690.0, 898.0, 440.0, 264.0, 157.0, 89.0, 84.0, 46.0, 34.0, 26.0, 20.0, 14.0, 9.0, 14.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0], "bins": [-9.1953125, -8.9462890625, -8.697265625, -8.4482421875, -8.19921875, -7.9501953125, -7.701171875, -7.4521484375, -7.203125, -6.9541015625, -6.705078125, -6.4560546875, -6.20703125, -5.9580078125, -5.708984375, -5.4599609375, -5.2109375, -4.9619140625, -4.712890625, -4.4638671875, -4.21484375, -3.9658203125, -3.716796875, -3.4677734375, -3.21875, -2.9697265625, -2.720703125, -2.4716796875, -2.22265625, -1.9736328125, -1.724609375, -1.4755859375, -1.2265625, -0.9775390625, -0.728515625, -0.4794921875, -0.23046875, 0.0185546875, 0.267578125, 0.5166015625, 0.765625, 1.0146484375, 1.263671875, 1.5126953125, 1.76171875, 2.0107421875, 2.259765625, 2.5087890625, 2.7578125, 3.0068359375, 3.255859375, 3.5048828125, 3.75390625, 4.0029296875, 4.251953125, 4.5009765625, 4.75, 4.9990234375, 5.248046875, 5.4970703125, 5.74609375, 5.9951171875, 6.244140625, 6.4931640625, 6.7421875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 25.0, 156.0, 511.0, 269.0, 49.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640542030334473, -4.840981960296631, -3.041422128677368, -1.2418622970581055, 0.5576977729797363, 2.357257843017578, 4.156817436218262, 5.956377983093262, 7.755937576293945, 9.555497169494629, 11.355057716369629, 13.154617309570312, 14.954177856445312, 16.753738403320312, 18.55329704284668, 20.35285758972168, 22.152416229248047, 23.951976776123047, 25.751535415649414, 27.551095962524414, 29.350656509399414, 31.15021514892578, 32.94977569580078, 34.74933624267578, 36.54889678955078, 38.34845733642578, 40.14801788330078, 41.94757843017578, 43.747135162353516, 45.546695709228516, 47.346256256103516, 49.145816802978516, 50.945377349853516, 52.744937896728516, 54.544498443603516, 56.34405517578125, 58.14361572265625, 59.94317626953125, 61.74273681640625, 63.54229736328125, 65.34185791015625, 67.14141845703125, 68.94097900390625, 70.74053955078125, 72.54010009765625, 74.33966064453125, 76.13922119140625, 77.93878173828125, 79.73833465576172, 81.53789520263672, 83.33745574951172, 85.13701629638672, 86.93657684326172, 88.73613739013672, 90.53569030761719, 92.33525085449219, 94.13481903076172, 95.93437957763672, 97.73394012451172, 99.53350067138672, 101.33306121826172, 103.13262176513672, 104.93217468261719, 106.73173522949219, 108.53129577636719]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 9.0, 6.0, 13.0, 14.0, 19.0, 15.0, 15.0, 24.0, 42.0, 28.0, 38.0, 34.0, 35.0, 59.0, 37.0, 33.0, 38.0, 61.0, 44.0, 47.0, 48.0, 42.0, 41.0, 37.0, 28.0, 37.0, 18.0, 14.0, 17.0, 20.0, 14.0, 16.0, 10.0, 9.0, 12.0, 10.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.468992233276367, -24.713703155517578, -23.95841407775879, -23.203125, -22.447834014892578, -21.69254493713379, -20.937255859375, -20.18196678161621, -19.426677703857422, -18.671388626098633, -17.916099548339844, -17.160808563232422, -16.405519485473633, -15.650230407714844, -14.894941329956055, -14.139652252197266, -13.384361267089844, -12.629072189331055, -11.87378215789795, -11.11849308013916, -10.363203048706055, -9.607913970947266, -8.852624893188477, -8.097335815429688, -7.342045783996582, -6.586756229400635, -5.8314666748046875, -5.076177597045898, -4.320888042449951, -3.565598487854004, -2.810309410095215, -2.0550198554992676, -1.2997283935546875, -0.5444389581680298, 0.21085047721862793, 0.9661397933959961, 1.7214293479919434, 2.4767189025878906, 3.2320079803466797, 3.987297534942627, 4.742587089538574, 5.4978766441345215, 6.253166198730469, 7.008455276489258, 7.763744831085205, 8.519034385681152, 9.274323463439941, 10.029613494873047, 10.784902572631836, 11.540191650390625, 12.29548168182373, 13.05077075958252, 13.806060791015625, 14.561349868774414, 15.316638946533203, 16.071928024291992, 16.82721710205078, 17.58250617980957, 18.33779525756836, 19.09308624267578, 19.84837532043457, 20.60366439819336, 21.35895347595215, 22.114242553710938, 22.86953353881836]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 13.0, 13.0, 14.0, 19.0, 30.0, 24.0, 33.0, 40.0, 31.0, 43.0, 46.0, 59.0, 51.0, 54.0, 60.0, 42.0, 57.0, 51.0, 39.0, 35.0, 35.0, 26.0, 31.0, 39.0, 24.0, 21.0, 12.0, 10.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.016082763671875, -1.94232177734375, -1.868560791015625, -1.7947998046875, -1.721038818359375, -1.64727783203125, -1.573516845703125, -1.499755859375, -1.425994873046875, -1.35223388671875, -1.278472900390625, -1.2047119140625, -1.130950927734375, -1.05718994140625, -0.983428955078125, -0.90966796875, -0.835906982421875, -0.76214599609375, -0.688385009765625, -0.6146240234375, -0.540863037109375, -0.46710205078125, -0.393341064453125, -0.319580078125, -0.245819091796875, -0.17205810546875, -0.098297119140625, -0.0245361328125, 0.049224853515625, 0.12298583984375, 0.196746826171875, 0.2705078125, 0.344268798828125, 0.41802978515625, 0.491790771484375, 0.5655517578125, 0.639312744140625, 0.71307373046875, 0.786834716796875, 0.860595703125, 0.934356689453125, 1.00811767578125, 1.081878662109375, 1.1556396484375, 1.229400634765625, 1.30316162109375, 1.376922607421875, 1.45068359375, 1.524444580078125, 1.59820556640625, 1.671966552734375, 1.7457275390625, 1.819488525390625, 1.89324951171875, 1.967010498046875, 2.040771484375, 2.114532470703125, 2.18829345703125, 2.262054443359375, 2.3358154296875, 2.409576416015625, 2.48333740234375, 2.557098388671875, 2.630859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 4.0, 6.0, 6.0, 14.0, 13.0, 26.0, 28.0, 52.0, 56.0, 86.0, 143.0, 200.0, 298.0, 446.0, 651.0, 1080.0, 1685.0, 2792.0, 4601.0, 8269.0, 15021.0, 29550.0, 65355.0, 248620.0, 2837591.0, 795599.0, 99004.0, 39165.0, 19105.0, 10193.0, 5752.0, 3350.0, 1987.0, 1249.0, 784.0, 507.0, 301.0, 227.0, 133.0, 103.0, 72.0, 56.0, 23.0, 29.0, 16.0, 5.0, 8.0, 10.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.578125, -6.38299560546875, -6.1878662109375, -5.99273681640625, -5.797607421875, -5.60247802734375, -5.4073486328125, -5.21221923828125, -5.01708984375, -4.82196044921875, -4.6268310546875, -4.43170166015625, -4.236572265625, -4.04144287109375, -3.8463134765625, -3.65118408203125, -3.4560546875, -3.26092529296875, -3.0657958984375, -2.87066650390625, -2.675537109375, -2.48040771484375, -2.2852783203125, -2.09014892578125, -1.89501953125, -1.69989013671875, -1.5047607421875, -1.30963134765625, -1.114501953125, -0.91937255859375, -0.7242431640625, -0.52911376953125, -0.333984375, -0.13885498046875, 0.0562744140625, 0.25140380859375, 0.446533203125, 0.64166259765625, 0.8367919921875, 1.03192138671875, 1.22705078125, 1.42218017578125, 1.6173095703125, 1.81243896484375, 2.007568359375, 2.20269775390625, 2.3978271484375, 2.59295654296875, 2.7880859375, 2.98321533203125, 3.1783447265625, 3.37347412109375, 3.568603515625, 3.76373291015625, 3.9588623046875, 4.15399169921875, 4.34912109375, 4.54425048828125, 4.7393798828125, 4.93450927734375, 5.129638671875, 5.32476806640625, 5.5198974609375, 5.71502685546875, 5.91015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 6.0, 6.0, 16.0, 23.0, 23.0, 50.0, 45.0, 69.0, 74.0, 104.0, 140.0, 274.0, 533.0, 824.0, 749.0, 393.0, 226.0, 143.0, 90.0, 72.0, 47.0, 32.0, 27.0, 29.0, 18.0, 12.0, 7.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.70367431640625, -4.4659423828125, -4.22821044921875, -3.990478515625, -3.75274658203125, -3.5150146484375, -3.27728271484375, -3.03955078125, -2.80181884765625, -2.5640869140625, -2.32635498046875, -2.088623046875, -1.85089111328125, -1.6131591796875, -1.37542724609375, -1.1376953125, -0.89996337890625, -0.6622314453125, -0.42449951171875, -0.186767578125, 0.05096435546875, 0.2886962890625, 0.52642822265625, 0.76416015625, 1.00189208984375, 1.2396240234375, 1.47735595703125, 1.715087890625, 1.95281982421875, 2.1905517578125, 2.42828369140625, 2.666015625, 2.90374755859375, 3.1414794921875, 3.37921142578125, 3.616943359375, 3.85467529296875, 4.0924072265625, 4.33013916015625, 4.56787109375, 4.80560302734375, 5.0433349609375, 5.28106689453125, 5.518798828125, 5.75653076171875, 5.9942626953125, 6.23199462890625, 6.4697265625, 6.70745849609375, 6.9451904296875, 7.18292236328125, 7.420654296875, 7.65838623046875, 7.8961181640625, 8.13385009765625, 8.37158203125, 8.60931396484375, 8.8470458984375, 9.08477783203125, 9.322509765625, 9.56024169921875, 9.7979736328125, 10.03570556640625, 10.2734375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 11.0, 8.0, 16.0, 23.0, 44.0, 52.0, 115.0, 190.0, 350.0, 660.0, 1311.0, 2815.0, 6283.0, 14593.0, 37653.0, 109665.0, 537679.0, 2992207.0, 350106.0, 87024.0, 30834.0, 12482.0, 5334.0, 2438.0, 1147.0, 547.0, 295.0, 158.0, 82.0, 53.0, 37.0, 32.0, 16.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.234375, -11.915771484375, -11.59716796875, -11.278564453125, -10.9599609375, -10.641357421875, -10.32275390625, -10.004150390625, -9.685546875, -9.366943359375, -9.04833984375, -8.729736328125, -8.4111328125, -8.092529296875, -7.77392578125, -7.455322265625, -7.13671875, -6.818115234375, -6.49951171875, -6.180908203125, -5.8623046875, -5.543701171875, -5.22509765625, -4.906494140625, -4.587890625, -4.269287109375, -3.95068359375, -3.632080078125, -3.3134765625, -2.994873046875, -2.67626953125, -2.357666015625, -2.0390625, -1.720458984375, -1.40185546875, -1.083251953125, -0.7646484375, -0.446044921875, -0.12744140625, 0.191162109375, 0.509765625, 0.828369140625, 1.14697265625, 1.465576171875, 1.7841796875, 2.102783203125, 2.42138671875, 2.739990234375, 3.05859375, 3.377197265625, 3.69580078125, 4.014404296875, 4.3330078125, 4.651611328125, 4.97021484375, 5.288818359375, 5.607421875, 5.926025390625, 6.24462890625, 6.563232421875, 6.8818359375, 7.200439453125, 7.51904296875, 7.837646484375, 8.15625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 16.0, 26.0, 57.0, 93.0, 156.0, 184.0, 181.0, 126.0, 63.0, 36.0, 34.0, 15.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.126312255859375, -59.4169807434082, -57.70764923095703, -55.998313903808594, -54.28898239135742, -52.57965087890625, -50.87031936645508, -49.160987854003906, -47.45165252685547, -45.7423210144043, -44.032989501953125, -42.32365417480469, -40.614322662353516, -38.904991149902344, -37.19565963745117, -35.486328125, -33.77699661254883, -32.067665100097656, -30.35833168029785, -28.64900016784668, -26.939666748046875, -25.230335235595703, -23.52100372314453, -21.81167221069336, -20.102338790893555, -18.393007278442383, -16.683673858642578, -14.974342346191406, -13.265009880065918, -11.55567741394043, -9.846345901489258, -8.13701343536377, -6.427677154541016, -4.718344688415527, -3.0090126991271973, -1.2996807098388672, 0.4096517562866211, 2.1189842224121094, 3.8283157348632812, 5.5376482009887695, 7.246980667114258, 8.956313133239746, 10.665645599365234, 12.374977111816406, 14.084309577941895, 15.793642044067383, 17.502973556518555, 19.21230697631836, 20.92163848876953, 22.630970001220703, 24.340303421020508, 26.04963493347168, 27.758968353271484, 29.468299865722656, 31.177631378173828, 32.886962890625, 34.59629821777344, 36.30562973022461, 38.01496124267578, 39.72429656982422, 41.43362808227539, 43.14295959472656, 44.852291107177734, 46.561622619628906, 48.27095413208008]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 14.0, 11.0, 15.0, 13.0, 15.0, 20.0, 22.0, 25.0, 21.0, 34.0, 28.0, 36.0, 36.0, 42.0, 36.0, 29.0, 32.0, 44.0, 31.0, 33.0, 48.0, 43.0, 33.0, 37.0, 35.0, 34.0, 29.0, 32.0, 24.0, 27.0, 20.0, 16.0, 11.0, 17.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.841964721679688, -17.242277145385742, -16.642589569091797, -16.04290199279785, -15.44321346282959, -14.843525886535645, -14.2438383102417, -13.644149780273438, -13.044462203979492, -12.444774627685547, -11.845087051391602, -11.245399475097656, -10.645710945129395, -10.04602336883545, -9.446335792541504, -8.846647262573242, -8.246960639953613, -7.647273063659668, -7.0475850105285645, -6.447897434234619, -5.848209381103516, -5.24852180480957, -4.648834228515625, -4.0491461753845215, -3.449458599090576, -2.8497707843780518, -2.2500829696655273, -1.650395393371582, -1.0507075786590576, -0.4510197639465332, 0.1486678123474121, 0.7483558654785156, 1.348043441772461, 1.9477312564849854, 2.5474190711975098, 3.147106647491455, 3.7467944622039795, 4.346482276916504, 4.946169853210449, 5.545857906341553, 6.145545482635498, 6.745233058929443, 7.344921112060547, 7.944608688354492, 8.544296264648438, 9.143983840942383, 9.743671417236328, 10.34335994720459, 10.943047523498535, 11.54273509979248, 12.142422676086426, 12.742111206054688, 13.341798782348633, 13.941486358642578, 14.541173934936523, 15.140861511230469, 15.740549087524414, 16.34023666381836, 16.939924240112305, 17.53961181640625, 18.139299392700195, 18.73898696899414, 19.33867645263672, 19.938364028930664, 20.53805160522461]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 11.0, 9.0, 12.0, 13.0, 18.0, 22.0, 35.0, 32.0, 37.0, 39.0, 37.0, 52.0, 63.0, 63.0, 65.0, 53.0, 67.0, 51.0, 40.0, 29.0, 36.0, 35.0, 26.0, 34.0, 27.0, 15.0, 19.0, 11.0, 11.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4517822265625, -2.372314453125, -2.2928466796875, -2.21337890625, -2.1339111328125, -2.054443359375, -1.9749755859375, -1.8955078125, -1.8160400390625, -1.736572265625, -1.6571044921875, -1.57763671875, -1.4981689453125, -1.418701171875, -1.3392333984375, -1.259765625, -1.1802978515625, -1.100830078125, -1.0213623046875, -0.94189453125, -0.8624267578125, -0.782958984375, -0.7034912109375, -0.6240234375, -0.5445556640625, -0.465087890625, -0.3856201171875, -0.30615234375, -0.2266845703125, -0.147216796875, -0.0677490234375, 0.01171875, 0.0911865234375, 0.170654296875, 0.2501220703125, 0.32958984375, 0.4090576171875, 0.488525390625, 0.5679931640625, 0.6474609375, 0.7269287109375, 0.806396484375, 0.8858642578125, 0.96533203125, 1.0447998046875, 1.124267578125, 1.2037353515625, 1.283203125, 1.3626708984375, 1.442138671875, 1.5216064453125, 1.60107421875, 1.6805419921875, 1.760009765625, 1.8394775390625, 1.9189453125, 1.9984130859375, 2.077880859375, 2.1573486328125, 2.23681640625, 2.3162841796875, 2.395751953125, 2.4752197265625, 2.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 4.0, 14.0, 15.0, 31.0, 68.0, 69.0, 127.0, 213.0, 319.0, 507.0, 739.0, 1129.0, 1780.0, 2924.0, 4516.0, 7082.0, 11398.0, 18787.0, 34332.0, 68378.0, 162734.0, 415208.0, 164195.0, 69390.0, 34629.0, 19337.0, 11371.0, 6928.0, 4424.0, 2803.0, 1776.0, 1161.0, 754.0, 521.0, 326.0, 194.0, 136.0, 84.0, 56.0, 28.0, 16.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5762939453125, -10.269775390625, -9.9632568359375, -9.65673828125, -9.3502197265625, -9.043701171875, -8.7371826171875, -8.4306640625, -8.1241455078125, -7.817626953125, -7.5111083984375, -7.20458984375, -6.8980712890625, -6.591552734375, -6.2850341796875, -5.978515625, -5.6719970703125, -5.365478515625, -5.0589599609375, -4.75244140625, -4.4459228515625, -4.139404296875, -3.8328857421875, -3.5263671875, -3.2198486328125, -2.913330078125, -2.6068115234375, -2.30029296875, -1.9937744140625, -1.687255859375, -1.3807373046875, -1.07421875, -0.7677001953125, -0.461181640625, -0.1546630859375, 0.15185546875, 0.4583740234375, 0.764892578125, 1.0714111328125, 1.3779296875, 1.6844482421875, 1.990966796875, 2.2974853515625, 2.60400390625, 2.9105224609375, 3.217041015625, 3.5235595703125, 3.830078125, 4.1365966796875, 4.443115234375, 4.7496337890625, 5.05615234375, 5.3626708984375, 5.669189453125, 5.9757080078125, 6.2822265625, 6.5887451171875, 6.895263671875, 7.2017822265625, 7.50830078125, 7.8148193359375, 8.121337890625, 8.4278564453125, 8.734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 15.0, 20.0, 14.0, 15.0, 23.0, 21.0, 34.0, 37.0, 39.0, 39.0, 53.0, 46.0, 43.0, 59.0, 1061.0, 47.0, 43.0, 38.0, 34.0, 32.0, 33.0, 33.0, 27.0, 27.0, 27.0, 17.0, 22.0, 15.0, 14.0, 11.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.45703125, -2.3908233642578125, -2.324615478515625, -2.2584075927734375, -2.19219970703125, -2.1259918212890625, -2.059783935546875, -1.9935760498046875, -1.9273681640625, -1.8611602783203125, -1.794952392578125, -1.7287445068359375, -1.66253662109375, -1.5963287353515625, -1.530120849609375, -1.4639129638671875, -1.397705078125, -1.3314971923828125, -1.265289306640625, -1.1990814208984375, -1.13287353515625, -1.0666656494140625, -1.000457763671875, -0.9342498779296875, -0.8680419921875, -0.8018341064453125, -0.735626220703125, -0.6694183349609375, -0.60321044921875, -0.5370025634765625, -0.470794677734375, -0.4045867919921875, -0.33837890625, -0.2721710205078125, -0.205963134765625, -0.1397552490234375, -0.07354736328125, -0.0073394775390625, 0.058868408203125, 0.1250762939453125, 0.1912841796875, 0.2574920654296875, 0.323699951171875, 0.3899078369140625, 0.45611572265625, 0.5223236083984375, 0.588531494140625, 0.6547393798828125, 0.720947265625, 0.7871551513671875, 0.853363037109375, 0.9195709228515625, 0.98577880859375, 1.0519866943359375, 1.118194580078125, 1.1844024658203125, 1.2506103515625, 1.3168182373046875, 1.383026123046875, 1.4492340087890625, 1.51544189453125, 1.5816497802734375, 1.647857666015625, 1.7140655517578125, 1.7802734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 0.0, 10.0, 3.0, 6.0, 20.0, 30.0, 33.0, 57.0, 68.0, 103.0, 186.0, 275.0, 439.0, 763.0, 1424.0, 3173.0, 8534.0, 26684.0, 132851.0, 1727473.0, 150553.0, 28509.0, 8945.0, 3449.0, 1479.0, 801.0, 422.0, 271.0, 175.0, 127.0, 107.0, 54.0, 35.0, 13.0, 12.0, 13.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.5625, -18.921630859375, -18.28076171875, -17.639892578125, -16.9990234375, -16.358154296875, -15.71728515625, -15.076416015625, -14.435546875, -13.794677734375, -13.15380859375, -12.512939453125, -11.8720703125, -11.231201171875, -10.59033203125, -9.949462890625, -9.30859375, -8.667724609375, -8.02685546875, -7.385986328125, -6.7451171875, -6.104248046875, -5.46337890625, -4.822509765625, -4.181640625, -3.540771484375, -2.89990234375, -2.259033203125, -1.6181640625, -0.977294921875, -0.33642578125, 0.304443359375, 0.9453125, 1.586181640625, 2.22705078125, 2.867919921875, 3.5087890625, 4.149658203125, 4.79052734375, 5.431396484375, 6.072265625, 6.713134765625, 7.35400390625, 7.994873046875, 8.6357421875, 9.276611328125, 9.91748046875, 10.558349609375, 11.19921875, 11.840087890625, 12.48095703125, 13.121826171875, 13.7626953125, 14.403564453125, 15.04443359375, 15.685302734375, 16.326171875, 16.967041015625, 17.60791015625, 18.248779296875, 18.8896484375, 19.530517578125, 20.17138671875, 20.812255859375, 21.453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 19.0, 26.0, 71.0, 109.0, 287.0, 235.0, 103.0, 50.0, 26.0, 16.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.453125, -5.2578125, -5.0625, -4.8671875, -4.671875, -4.4765625, -4.28125, -4.0859375, -3.890625, -3.6953125, -3.5, -3.3046875, -3.109375, -2.9140625, -2.71875, -2.5234375, -2.328125, -2.1328125, -1.9375, -1.7421875, -1.546875, -1.3515625, -1.15625, -0.9609375, -0.765625, -0.5703125, -0.375, -0.1796875, 0.015625, 0.2109375, 0.40625, 0.6015625, 0.796875, 0.9921875, 1.1875, 1.3828125, 1.578125, 1.7734375, 1.96875, 2.1640625, 2.359375, 2.5546875, 2.75, 2.9453125, 3.140625, 3.3359375, 3.53125, 3.7265625, 3.921875, 4.1171875, 4.3125, 4.5078125, 4.703125, 4.8984375, 5.09375, 5.2890625, 5.484375, 5.6796875, 5.875, 6.0703125, 6.265625, 6.4609375, 6.65625, 6.8515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 32.0, 52.0, 113.0, 382.0, 1554.0, 20360.0, 1017587.0, 7015.0, 992.0, 237.0, 99.0, 41.0, 12.0, 10.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.625, -102.63671875, -99.6484375, -96.66015625, -93.671875, -90.68359375, -87.6953125, -84.70703125, -81.71875, -78.73046875, -75.7421875, -72.75390625, -69.765625, -66.77734375, -63.7890625, -60.80078125, -57.8125, -54.82421875, -51.8359375, -48.84765625, -45.859375, -42.87109375, -39.8828125, -36.89453125, -33.90625, -30.91796875, -27.9296875, -24.94140625, -21.953125, -18.96484375, -15.9765625, -12.98828125, -10.0, -7.01171875, -4.0234375, -1.03515625, 1.953125, 4.94140625, 7.9296875, 10.91796875, 13.90625, 16.89453125, 19.8828125, 22.87109375, 25.859375, 28.84765625, 31.8359375, 34.82421875, 37.8125, 40.80078125, 43.7890625, 46.77734375, 49.765625, 52.75390625, 55.7421875, 58.73046875, 61.71875, 64.70703125, 67.6953125, 70.68359375, 73.671875, 76.66015625, 79.6484375, 82.63671875, 85.625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 12.0, 11.0, 20.0, 45.0, 59.0, 143.0, 272.0, 235.0, 99.0, 58.0, 25.0, 15.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.849494934082031, -11.527217864990234, -11.204939842224121, -10.882662773132324, -10.560384750366211, -10.238107681274414, -9.9158296585083, -9.593552589416504, -9.27127456665039, -8.948997497558594, -8.62671947479248, -8.304442405700684, -7.98216438293457, -7.659886837005615, -7.33760929107666, -7.015332221984863, -6.693054676055908, -6.370777130126953, -6.048499584197998, -5.726222038269043, -5.403944492340088, -5.081666946411133, -4.759389877319336, -4.437111854553223, -4.114834785461426, -3.7925572395324707, -3.4702796936035156, -3.1480021476745605, -2.8257246017456055, -2.5034470558166504, -2.1811697483062744, -1.8588922023773193, -1.5366144180297852, -1.21433687210083, -0.8920593857765198, -0.5697818994522095, -0.2475043535232544, 0.07477319240570068, 0.3970506191253662, 0.7193281650543213, 1.0416057109832764, 1.3638832569122314, 1.6861608028411865, 2.0084381103515625, 2.3307156562805176, 2.6529932022094727, 2.9752707481384277, 3.297548294067383, 3.619825839996338, 3.942103385925293, 4.264380931854248, 4.586658477783203, 4.908936023712158, 5.231213569641113, 5.55349063873291, 5.875768661499023, 6.19804573059082, 6.520323276519775, 6.8426008224487305, 7.1648783683776855, 7.487155914306641, 7.809433460235596, 8.13171100616455, 8.453988075256348, 8.776266098022461]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 15.0, 11.0, 18.0, 17.0, 34.0, 31.0, 34.0, 44.0, 45.0, 38.0, 49.0, 38.0, 55.0, 58.0, 57.0, 47.0, 48.0, 57.0, 58.0, 32.0, 29.0, 36.0, 38.0, 20.0, 15.0, 12.0, 10.0, 6.0, 3.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3224947452545166, -3.1939871311187744, -3.0654797554016113, -2.936972141265869, -2.808464527130127, -2.6799569129943848, -2.5514495372772217, -2.4229419231414795, -2.2944345474243164, -2.165926933288574, -2.037419557571411, -1.908911943435669, -1.7804043292999268, -1.6518968343734741, -1.5233893394470215, -1.3948817253112793, -1.266374111175537, -1.1378666162490845, -1.0093590021133423, -0.8808515071868896, -0.7523439526557922, -0.6238363981246948, -0.4953289031982422, -0.3668213486671448, -0.23831379413604736, -0.10980625450611115, 0.018701285123825073, 0.1472088098526001, 0.2757163643836975, 0.4042239189147949, 0.5327314138412476, 0.661238968372345, 0.7897462844848633, 0.9182538390159607, 1.046761393547058, 1.1752688884735107, 1.303776502609253, 1.4322839975357056, 1.5607914924621582, 1.6892991065979004, 1.817806601524353, 1.9463140964508057, 2.074821710586548, 2.203329086303711, 2.331836700439453, 2.4603443145751953, 2.5888519287109375, 2.7173593044281006, 2.8458669185638428, 2.974374532699585, 3.102881908416748, 3.2313895225524902, 3.3598971366882324, 3.4884047508239746, 3.6169121265411377, 3.74541974067688, 3.873927116394043, 4.002434730529785, 4.130942344665527, 4.2594499588012695, 4.3879570960998535, 4.516464710235596, 4.644972324371338, 4.77347993850708, 4.901987552642822]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 13.0, 10.0, 12.0, 11.0, 17.0, 27.0, 30.0, 37.0, 46.0, 47.0, 48.0, 65.0, 67.0, 51.0, 64.0, 43.0, 66.0, 53.0, 45.0, 35.0, 32.0, 30.0, 32.0, 28.0, 18.0, 21.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.534454345703125, -2.44781494140625, -2.361175537109375, -2.2745361328125, -2.187896728515625, -2.10125732421875, -2.014617919921875, -1.927978515625, -1.841339111328125, -1.75469970703125, -1.668060302734375, -1.5814208984375, -1.494781494140625, -1.40814208984375, -1.321502685546875, -1.23486328125, -1.148223876953125, -1.06158447265625, -0.974945068359375, -0.8883056640625, -0.801666259765625, -0.71502685546875, -0.628387451171875, -0.541748046875, -0.455108642578125, -0.36846923828125, -0.281829833984375, -0.1951904296875, -0.108551025390625, -0.02191162109375, 0.064727783203125, 0.1513671875, 0.238006591796875, 0.32464599609375, 0.411285400390625, 0.4979248046875, 0.584564208984375, 0.67120361328125, 0.757843017578125, 0.844482421875, 0.931121826171875, 1.01776123046875, 1.104400634765625, 1.1910400390625, 1.277679443359375, 1.36431884765625, 1.450958251953125, 1.53759765625, 1.624237060546875, 1.71087646484375, 1.797515869140625, 1.8841552734375, 1.970794677734375, 2.05743408203125, 2.144073486328125, 2.230712890625, 2.317352294921875, 2.40399169921875, 2.490631103515625, 2.5772705078125, 2.663909912109375, 2.75054931640625, 2.837188720703125, 2.923828125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 16.0, 10.0, 31.0, 31.0, 59.0, 106.0, 153.0, 225.0, 343.0, 578.0, 930.0, 1463.0, 2509.0, 4232.0, 7539.0, 14357.0, 31507.0, 102764.0, 662201.0, 144565.0, 38060.0, 16737.0, 8533.0, 4773.0, 2604.0, 1580.0, 966.0, 596.0, 403.0, 245.0, 150.0, 91.0, 82.0, 35.0, 27.0, 20.0, 12.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.58154296875, -4.4365234375, -4.29150390625, -4.146484375, -4.00146484375, -3.8564453125, -3.71142578125, -3.56640625, -3.42138671875, -3.2763671875, -3.13134765625, -2.986328125, -2.84130859375, -2.6962890625, -2.55126953125, -2.40625, -2.26123046875, -2.1162109375, -1.97119140625, -1.826171875, -1.68115234375, -1.5361328125, -1.39111328125, -1.24609375, -1.10107421875, -0.9560546875, -0.81103515625, -0.666015625, -0.52099609375, -0.3759765625, -0.23095703125, -0.0859375, 0.05908203125, 0.2041015625, 0.34912109375, 0.494140625, 0.63916015625, 0.7841796875, 0.92919921875, 1.07421875, 1.21923828125, 1.3642578125, 1.50927734375, 1.654296875, 1.79931640625, 1.9443359375, 2.08935546875, 2.234375, 2.37939453125, 2.5244140625, 2.66943359375, 2.814453125, 2.95947265625, 3.1044921875, 3.24951171875, 3.39453125, 3.53955078125, 3.6845703125, 3.82958984375, 3.974609375, 4.11962890625, 4.2646484375, 4.40966796875, 4.5546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 6.0, 14.0, 13.0, 16.0, 26.0, 17.0, 27.0, 27.0, 36.0, 30.0, 39.0, 38.0, 63.0, 81.0, 124.0, 283.0, 1510.0, 157.0, 92.0, 82.0, 50.0, 34.0, 38.0, 39.0, 24.0, 27.0, 23.0, 14.0, 17.0, 12.0, 13.0, 7.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.37890625, -7.1424560546875, -6.906005859375, -6.6695556640625, -6.43310546875, -6.1966552734375, -5.960205078125, -5.7237548828125, -5.4873046875, -5.2508544921875, -5.014404296875, -4.7779541015625, -4.54150390625, -4.3050537109375, -4.068603515625, -3.8321533203125, -3.595703125, -3.3592529296875, -3.122802734375, -2.8863525390625, -2.64990234375, -2.4134521484375, -2.177001953125, -1.9405517578125, -1.7041015625, -1.4676513671875, -1.231201171875, -0.9947509765625, -0.75830078125, -0.5218505859375, -0.285400390625, -0.0489501953125, 0.1875, 0.4239501953125, 0.660400390625, 0.8968505859375, 1.13330078125, 1.3697509765625, 1.606201171875, 1.8426513671875, 2.0791015625, 2.3155517578125, 2.552001953125, 2.7884521484375, 3.02490234375, 3.2613525390625, 3.497802734375, 3.7342529296875, 3.970703125, 4.2071533203125, 4.443603515625, 4.6800537109375, 4.91650390625, 5.1529541015625, 5.389404296875, 5.6258544921875, 5.8623046875, 6.0987548828125, 6.335205078125, 6.5716552734375, 6.80810546875, 7.0445556640625, 7.281005859375, 7.5174560546875, 7.75390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 9.0, 15.0, 19.0, 24.0, 42.0, 50.0, 90.0, 186.0, 425.0, 1079.0, 3521.0, 17145.0, 231829.0, 2807588.0, 71138.0, 8981.0, 2133.0, 731.0, 310.0, 134.0, 68.0, 44.0, 38.0, 24.0, 20.0, 8.0, 8.0, 9.0, 6.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1787109375, -14.708984375, -14.2392578125, -13.76953125, -13.2998046875, -12.830078125, -12.3603515625, -11.890625, -11.4208984375, -10.951171875, -10.4814453125, -10.01171875, -9.5419921875, -9.072265625, -8.6025390625, -8.1328125, -7.6630859375, -7.193359375, -6.7236328125, -6.25390625, -5.7841796875, -5.314453125, -4.8447265625, -4.375, -3.9052734375, -3.435546875, -2.9658203125, -2.49609375, -2.0263671875, -1.556640625, -1.0869140625, -0.6171875, -0.1474609375, 0.322265625, 0.7919921875, 1.26171875, 1.7314453125, 2.201171875, 2.6708984375, 3.140625, 3.6103515625, 4.080078125, 4.5498046875, 5.01953125, 5.4892578125, 5.958984375, 6.4287109375, 6.8984375, 7.3681640625, 7.837890625, 8.3076171875, 8.77734375, 9.2470703125, 9.716796875, 10.1865234375, 10.65625, 11.1259765625, 11.595703125, 12.0654296875, 12.53515625, 13.0048828125, 13.474609375, 13.9443359375, 14.4140625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 28.0, 102.0, 205.0, 336.0, 230.0, 79.0, 19.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.266178131103516, -27.768829345703125, -26.271480560302734, -24.774133682250977, -23.276784896850586, -21.779436111450195, -20.282089233398438, -18.784740447998047, -17.287391662597656, -15.790042877197266, -14.292695045471191, -12.795347213745117, -11.297998428344727, -9.800649642944336, -8.303301811218262, -6.8059539794921875, -5.308605194091797, -3.8112568855285645, -2.313908576965332, -0.8165602684020996, 0.6807880401611328, 2.1781363487243652, 3.6754846572875977, 5.172832489013672, 6.6701812744140625, 8.167530059814453, 9.664877891540527, 11.162225723266602, 12.659574508666992, 14.156923294067383, 15.654271125793457, 17.15161895751953, 18.648971557617188, 20.146320343017578, 21.64366912841797, 23.141016006469727, 24.638364791870117, 26.135713577270508, 27.633060455322266, 29.130409240722656, 30.627758026123047, 32.12510681152344, 33.62245559692383, 35.11980438232422, 36.617149353027344, 38.114498138427734, 39.611846923828125, 41.109195709228516, 42.606544494628906, 44.1038932800293, 45.60124206542969, 47.09859085083008, 48.59593963623047, 50.093284606933594, 51.590633392333984, 53.087982177734375, 54.585330963134766, 56.082679748535156, 57.58002853393555, 59.07737731933594, 60.57472229003906, 62.07207107543945, 63.569419860839844, 65.0667724609375, 66.56411743164062]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 8.0, 4.0, 7.0, 12.0, 18.0, 17.0, 18.0, 22.0, 22.0, 36.0, 26.0, 38.0, 43.0, 42.0, 37.0, 41.0, 43.0, 56.0, 60.0, 47.0, 41.0, 35.0, 51.0, 49.0, 29.0, 34.0, 30.0, 25.0, 23.0, 21.0, 13.0, 18.0, 6.0, 4.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.179262161254883, -21.414167404174805, -20.649070739746094, -19.883975982666016, -19.118881225585938, -18.35378646850586, -17.58868980407715, -16.82359504699707, -16.05849838256836, -15.293402671813965, -14.528307914733887, -13.763212203979492, -12.998117446899414, -12.23302173614502, -11.467926025390625, -10.702831268310547, -9.937736511230469, -9.172640800476074, -8.407546043395996, -7.642450332641602, -6.877355098724365, -6.112259864807129, -5.347164154052734, -4.582068920135498, -3.8169736862182617, -3.0518784523010254, -2.28678297996521, -1.5216875076293945, -0.7565922737121582, 0.008502960205078125, 0.7735986709594727, 1.538693904876709, 2.3037891387939453, 3.0688843727111816, 3.833979845046997, 4.5990753173828125, 5.364170551300049, 6.129265785217285, 6.89436149597168, 7.659456729888916, 8.424551963806152, 9.189647674560547, 9.954742431640625, 10.71983814239502, 11.484933853149414, 12.250028610229492, 13.015124320983887, 13.780220031738281, 14.54531478881836, 15.310410499572754, 16.07550621032715, 16.840600967407227, 17.605695724487305, 18.370792388916016, 19.135887145996094, 19.900981903076172, 20.66607666015625, 21.431171417236328, 22.19626808166504, 22.961362838745117, 23.726457595825195, 24.491554260253906, 25.256649017333984, 26.021743774414062, 26.786840438842773]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 15.0, 12.0, 18.0, 27.0, 34.0, 35.0, 49.0, 53.0, 45.0, 64.0, 62.0, 51.0, 37.0, 76.0, 48.0, 44.0, 49.0, 37.0, 35.0, 27.0, 34.0, 20.0, 21.0, 24.0, 11.0, 11.0, 5.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.248016357421875, -2.16204833984375, -2.076080322265625, -1.9901123046875, -1.904144287109375, -1.81817626953125, -1.732208251953125, -1.646240234375, -1.560272216796875, -1.47430419921875, -1.388336181640625, -1.3023681640625, -1.216400146484375, -1.13043212890625, -1.044464111328125, -0.95849609375, -0.872528076171875, -0.78656005859375, -0.700592041015625, -0.6146240234375, -0.528656005859375, -0.44268798828125, -0.356719970703125, -0.270751953125, -0.184783935546875, -0.09881591796875, -0.012847900390625, 0.0731201171875, 0.159088134765625, 0.24505615234375, 0.331024169921875, 0.4169921875, 0.502960205078125, 0.58892822265625, 0.674896240234375, 0.7608642578125, 0.846832275390625, 0.93280029296875, 1.018768310546875, 1.104736328125, 1.190704345703125, 1.27667236328125, 1.362640380859375, 1.4486083984375, 1.534576416015625, 1.62054443359375, 1.706512451171875, 1.79248046875, 1.878448486328125, 1.96441650390625, 2.050384521484375, 2.1363525390625, 2.222320556640625, 2.30828857421875, 2.394256591796875, 2.480224609375, 2.566192626953125, 2.65216064453125, 2.738128662109375, 2.8240966796875, 2.910064697265625, 2.99603271484375, 3.082000732421875, 3.16796875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 11.0, 17.0, 17.0, 37.0, 53.0, 82.0, 124.0, 190.0, 289.0, 456.0, 689.0, 1075.0, 1680.0, 2800.0, 4438.0, 7328.0, 12669.0, 22339.0, 42740.0, 98970.0, 535661.0, 2602756.0, 648047.0, 108012.0, 44733.0, 23310.0, 13796.0, 8214.0, 4903.0, 3168.0, 2009.0, 1282.0, 776.0, 531.0, 351.0, 221.0, 158.0, 121.0, 58.0, 45.0, 32.0, 29.0, 13.0, 13.0, 13.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.27734375, -4.1220703125, -3.966796875, -3.8115234375, -3.65625, -3.5009765625, -3.345703125, -3.1904296875, -3.03515625, -2.8798828125, -2.724609375, -2.5693359375, -2.4140625, -2.2587890625, -2.103515625, -1.9482421875, -1.79296875, -1.6376953125, -1.482421875, -1.3271484375, -1.171875, -1.0166015625, -0.861328125, -0.7060546875, -0.55078125, -0.3955078125, -0.240234375, -0.0849609375, 0.0703125, 0.2255859375, 0.380859375, 0.5361328125, 0.69140625, 0.8466796875, 1.001953125, 1.1572265625, 1.3125, 1.4677734375, 1.623046875, 1.7783203125, 1.93359375, 2.0888671875, 2.244140625, 2.3994140625, 2.5546875, 2.7099609375, 2.865234375, 3.0205078125, 3.17578125, 3.3310546875, 3.486328125, 3.6416015625, 3.796875, 3.9521484375, 4.107421875, 4.2626953125, 4.41796875, 4.5732421875, 4.728515625, 4.8837890625, 5.0390625, 5.1943359375, 5.349609375, 5.5048828125, 5.66015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 16.0, 17.0, 14.0, 24.0, 35.0, 41.0, 48.0, 66.0, 78.0, 121.0, 173.0, 325.0, 501.0, 687.0, 589.0, 434.0, 211.0, 161.0, 104.0, 88.0, 71.0, 46.0, 46.0, 35.0, 25.0, 23.0, 10.0, 15.0, 11.0, 5.0, 6.0, 8.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.629150390625, -5.42626953125, -5.223388671875, -5.0205078125, -4.817626953125, -4.61474609375, -4.411865234375, -4.208984375, -4.006103515625, -3.80322265625, -3.600341796875, -3.3974609375, -3.194580078125, -2.99169921875, -2.788818359375, -2.5859375, -2.383056640625, -2.18017578125, -1.977294921875, -1.7744140625, -1.571533203125, -1.36865234375, -1.165771484375, -0.962890625, -0.760009765625, -0.55712890625, -0.354248046875, -0.1513671875, 0.051513671875, 0.25439453125, 0.457275390625, 0.66015625, 0.863037109375, 1.06591796875, 1.268798828125, 1.4716796875, 1.674560546875, 1.87744140625, 2.080322265625, 2.283203125, 2.486083984375, 2.68896484375, 2.891845703125, 3.0947265625, 3.297607421875, 3.50048828125, 3.703369140625, 3.90625, 4.109130859375, 4.31201171875, 4.514892578125, 4.7177734375, 4.920654296875, 5.12353515625, 5.326416015625, 5.529296875, 5.732177734375, 5.93505859375, 6.137939453125, 6.3408203125, 6.543701171875, 6.74658203125, 6.949462890625, 7.15234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 13.0, 11.0, 20.0, 46.0, 67.0, 77.0, 125.0, 224.0, 319.0, 571.0, 922.0, 1672.0, 2929.0, 5010.0, 9760.0, 18857.0, 40894.0, 96712.0, 311018.0, 2355993.0, 1037543.0, 182851.0, 67346.0, 29606.0, 14601.0, 7406.0, 4163.0, 2253.0, 1276.0, 784.0, 471.0, 287.0, 154.0, 109.0, 66.0, 41.0, 34.0, 18.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.453125, -7.21875, -6.984375, -6.75, -6.515625, -6.28125, -6.046875, -5.8125, -5.578125, -5.34375, -5.109375, -4.875, -4.640625, -4.40625, -4.171875, -3.9375, -3.703125, -3.46875, -3.234375, -3.0, -2.765625, -2.53125, -2.296875, -2.0625, -1.828125, -1.59375, -1.359375, -1.125, -0.890625, -0.65625, -0.421875, -0.1875, 0.046875, 0.28125, 0.515625, 0.75, 0.984375, 1.21875, 1.453125, 1.6875, 1.921875, 2.15625, 2.390625, 2.625, 2.859375, 3.09375, 3.328125, 3.5625, 3.796875, 4.03125, 4.265625, 4.5, 4.734375, 4.96875, 5.203125, 5.4375, 5.671875, 5.90625, 6.140625, 6.375, 6.609375, 6.84375, 7.078125, 7.3125, 7.546875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 10.0, 8.0, 32.0, 55.0, 127.0, 185.0, 248.0, 165.0, 102.0, 41.0, 19.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3114242553711, -92.07685089111328, -89.84226989746094, -87.60769653320312, -85.37312316894531, -83.1385498046875, -80.90396881103516, -78.66939544677734, -76.434814453125, -74.20024108886719, -71.96566009521484, -69.73108673095703, -67.49651336669922, -65.26193237304688, -63.02735900878906, -60.79278564453125, -58.55821228027344, -56.32363510131836, -54.08906173706055, -51.85448455810547, -49.619911193847656, -47.38533401489258, -45.1507568359375, -42.91618347167969, -40.68160629272461, -38.44702911376953, -36.21245574951172, -33.97787857055664, -31.743303298950195, -29.50872802734375, -27.274150848388672, -25.039575576782227, -22.804996490478516, -20.57042121887207, -18.335845947265625, -16.101268768310547, -13.866693496704102, -11.632118225097656, -9.397541999816895, -7.162965774536133, -4.9283905029296875, -2.693814754486084, -0.45923900604248047, 1.775336742401123, 4.009912490844727, 6.244487762451172, 8.479063987731934, 10.713640213012695, 12.94821548461914, 15.182790756225586, 17.41736602783203, 19.65194320678711, 21.886518478393555, 24.12109375, 26.355670928955078, 28.590246200561523, 30.82482147216797, 33.05939865112305, 35.29397201538086, 37.52854919433594, 39.76312255859375, 41.99769973754883, 44.232276916503906, 46.46685028076172, 48.7014274597168]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 7.0, 10.0, 21.0, 18.0, 23.0, 22.0, 26.0, 29.0, 30.0, 27.0, 28.0, 35.0, 36.0, 40.0, 28.0, 36.0, 39.0, 47.0, 50.0, 42.0, 40.0, 32.0, 35.0, 31.0, 35.0, 30.0, 38.0, 24.0, 18.0, 20.0, 26.0, 16.0, 8.0, 10.0, 10.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03443717956543, -20.38628578186035, -19.738136291503906, -19.089984893798828, -18.441835403442383, -17.793684005737305, -17.14553451538086, -16.49738311767578, -15.849231719970703, -15.201081275939941, -14.55293083190918, -13.904779434204102, -13.25662899017334, -12.608478546142578, -11.960328102111816, -11.312177658081055, -10.664027214050293, -10.015876770019531, -9.36772632598877, -8.719575881958008, -8.07142448425293, -7.423274040222168, -6.775123596191406, -6.126972675323486, -5.478822231292725, -4.830671787261963, -4.182520866394043, -3.5343704223632812, -2.8862197399139404, -2.2380690574645996, -1.589918613433838, -0.941767692565918, -0.29361724853515625, 0.3545333743095398, 1.0026839971542358, 1.650834560394287, 2.298985242843628, 2.9471359252929688, 3.5952863693237305, 4.24343729019165, 4.891587734222412, 5.539738178253174, 6.187889099121094, 6.8360395431518555, 7.484189987182617, 8.132341384887695, 8.78049087524414, 9.428642272949219, 10.07679271697998, 10.724943161010742, 11.373093605041504, 12.021244049072266, 12.669395446777344, 13.317545890808105, 13.965696334838867, 14.613847732543945, 15.26199722290039, 15.910147666931152, 16.558298110961914, 17.206449508666992, 17.854598999023438, 18.502750396728516, 19.150901794433594, 19.79905128479004, 20.447202682495117]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 13.0, 6.0, 13.0, 17.0, 13.0, 20.0, 20.0, 20.0, 40.0, 43.0, 36.0, 48.0, 58.0, 51.0, 55.0, 44.0, 53.0, 54.0, 47.0, 59.0, 39.0, 38.0, 23.0, 31.0, 22.0, 19.0, 21.0, 22.0, 23.0, 15.0, 10.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.123443603515625, -2.04180908203125, -1.960174560546875, -1.8785400390625, -1.796905517578125, -1.71527099609375, -1.633636474609375, -1.552001953125, -1.470367431640625, -1.38873291015625, -1.307098388671875, -1.2254638671875, -1.143829345703125, -1.06219482421875, -0.980560302734375, -0.89892578125, -0.817291259765625, -0.73565673828125, -0.654022216796875, -0.5723876953125, -0.490753173828125, -0.40911865234375, -0.327484130859375, -0.245849609375, -0.164215087890625, -0.08258056640625, -0.000946044921875, 0.0806884765625, 0.162322998046875, 0.24395751953125, 0.325592041015625, 0.4072265625, 0.488861083984375, 0.57049560546875, 0.652130126953125, 0.7337646484375, 0.815399169921875, 0.89703369140625, 0.978668212890625, 1.060302734375, 1.141937255859375, 1.22357177734375, 1.305206298828125, 1.3868408203125, 1.468475341796875, 1.55010986328125, 1.631744384765625, 1.71337890625, 1.795013427734375, 1.87664794921875, 1.958282470703125, 2.0399169921875, 2.121551513671875, 2.20318603515625, 2.284820556640625, 2.366455078125, 2.448089599609375, 2.52972412109375, 2.611358642578125, 2.6929931640625, 2.774627685546875, 2.85626220703125, 2.937896728515625, 3.01953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 9.0, 16.0, 37.0, 31.0, 55.0, 72.0, 129.0, 147.0, 192.0, 322.0, 492.0, 806.0, 1150.0, 1944.0, 3118.0, 5366.0, 9822.0, 20704.0, 55785.0, 376680.0, 463896.0, 60640.0, 22340.0, 10489.0, 5499.0, 3235.0, 1901.0, 1209.0, 747.0, 532.0, 342.0, 269.0, 175.0, 123.0, 73.0, 69.0, 29.0, 25.0, 21.0, 20.0, 13.0, 7.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.640625, -13.1865234375, -12.732421875, -12.2783203125, -11.82421875, -11.3701171875, -10.916015625, -10.4619140625, -10.0078125, -9.5537109375, -9.099609375, -8.6455078125, -8.19140625, -7.7373046875, -7.283203125, -6.8291015625, -6.375, -5.9208984375, -5.466796875, -5.0126953125, -4.55859375, -4.1044921875, -3.650390625, -3.1962890625, -2.7421875, -2.2880859375, -1.833984375, -1.3798828125, -0.92578125, -0.4716796875, -0.017578125, 0.4365234375, 0.890625, 1.3447265625, 1.798828125, 2.2529296875, 2.70703125, 3.1611328125, 3.615234375, 4.0693359375, 4.5234375, 4.9775390625, 5.431640625, 5.8857421875, 6.33984375, 6.7939453125, 7.248046875, 7.7021484375, 8.15625, 8.6103515625, 9.064453125, 9.5185546875, 9.97265625, 10.4267578125, 10.880859375, 11.3349609375, 11.7890625, 12.2431640625, 12.697265625, 13.1513671875, 13.60546875, 14.0595703125, 14.513671875, 14.9677734375, 15.421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 6.0, 15.0, 11.0, 19.0, 19.0, 25.0, 29.0, 23.0, 39.0, 41.0, 42.0, 44.0, 40.0, 63.0, 58.0, 1073.0, 45.0, 53.0, 59.0, 46.0, 41.0, 42.0, 29.0, 33.0, 24.0, 17.0, 17.0, 14.0, 8.0, 14.0, 7.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.380706787109375, -2.30633544921875, -2.231964111328125, -2.1575927734375, -2.083221435546875, -2.00885009765625, -1.934478759765625, -1.860107421875, -1.785736083984375, -1.71136474609375, -1.636993408203125, -1.5626220703125, -1.488250732421875, -1.41387939453125, -1.339508056640625, -1.26513671875, -1.190765380859375, -1.11639404296875, -1.042022705078125, -0.9676513671875, -0.893280029296875, -0.81890869140625, -0.744537353515625, -0.670166015625, -0.595794677734375, -0.52142333984375, -0.447052001953125, -0.3726806640625, -0.298309326171875, -0.22393798828125, -0.149566650390625, -0.0751953125, -0.000823974609375, 0.07354736328125, 0.147918701171875, 0.2222900390625, 0.296661376953125, 0.37103271484375, 0.445404052734375, 0.519775390625, 0.594146728515625, 0.66851806640625, 0.742889404296875, 0.8172607421875, 0.891632080078125, 0.96600341796875, 1.040374755859375, 1.11474609375, 1.189117431640625, 1.26348876953125, 1.337860107421875, 1.4122314453125, 1.486602783203125, 1.56097412109375, 1.635345458984375, 1.709716796875, 1.784088134765625, 1.85845947265625, 1.932830810546875, 2.0072021484375, 2.081573486328125, 2.15594482421875, 2.230316162109375, 2.3046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 10.0, 16.0, 24.0, 46.0, 74.0, 104.0, 148.0, 200.0, 316.0, 499.0, 739.0, 1225.0, 1936.0, 3985.0, 10746.0, 58438.0, 1918795.0, 77153.0, 12217.0, 4529.0, 2237.0, 1244.0, 731.0, 534.0, 392.0, 272.0, 149.0, 129.0, 64.0, 40.0, 25.0, 25.0, 11.0, 14.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.703125, -24.888427734375, -24.07373046875, -23.259033203125, -22.4443359375, -21.629638671875, -20.81494140625, -20.000244140625, -19.185546875, -18.370849609375, -17.55615234375, -16.741455078125, -15.9267578125, -15.112060546875, -14.29736328125, -13.482666015625, -12.66796875, -11.853271484375, -11.03857421875, -10.223876953125, -9.4091796875, -8.594482421875, -7.77978515625, -6.965087890625, -6.150390625, -5.335693359375, -4.52099609375, -3.706298828125, -2.8916015625, -2.076904296875, -1.26220703125, -0.447509765625, 0.3671875, 1.181884765625, 1.99658203125, 2.811279296875, 3.6259765625, 4.440673828125, 5.25537109375, 6.070068359375, 6.884765625, 7.699462890625, 8.51416015625, 9.328857421875, 10.1435546875, 10.958251953125, 11.77294921875, 12.587646484375, 13.40234375, 14.217041015625, 15.03173828125, 15.846435546875, 16.6611328125, 17.475830078125, 18.29052734375, 19.105224609375, 19.919921875, 20.734619140625, 21.54931640625, 22.364013671875, 23.1787109375, 23.993408203125, 24.80810546875, 25.622802734375, 26.4375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 42.0, 117.0, 425.0, 269.0, 67.0, 21.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.64306640625, -6.3955078125, -6.14794921875, -5.900390625, -5.65283203125, -5.4052734375, -5.15771484375, -4.91015625, -4.66259765625, -4.4150390625, -4.16748046875, -3.919921875, -3.67236328125, -3.4248046875, -3.17724609375, -2.9296875, -2.68212890625, -2.4345703125, -2.18701171875, -1.939453125, -1.69189453125, -1.4443359375, -1.19677734375, -0.94921875, -0.70166015625, -0.4541015625, -0.20654296875, 0.041015625, 0.28857421875, 0.5361328125, 0.78369140625, 1.03125, 1.27880859375, 1.5263671875, 1.77392578125, 2.021484375, 2.26904296875, 2.5166015625, 2.76416015625, 3.01171875, 3.25927734375, 3.5068359375, 3.75439453125, 4.001953125, 4.24951171875, 4.4970703125, 4.74462890625, 4.9921875, 5.23974609375, 5.4873046875, 5.73486328125, 5.982421875, 6.22998046875, 6.4775390625, 6.72509765625, 6.97265625, 7.22021484375, 7.4677734375, 7.71533203125, 7.962890625, 8.21044921875, 8.4580078125, 8.70556640625, 8.953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 17.0, 25.0, 33.0, 102.0, 496.0, 2862.0, 47850.0, 991885.0, 4212.0, 755.0, 152.0, 40.0, 23.0, 15.0, 11.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-140.625, -136.73046875, -132.8359375, -128.94140625, -125.046875, -121.15234375, -117.2578125, -113.36328125, -109.46875, -105.57421875, -101.6796875, -97.78515625, -93.890625, -89.99609375, -86.1015625, -82.20703125, -78.3125, -74.41796875, -70.5234375, -66.62890625, -62.734375, -58.83984375, -54.9453125, -51.05078125, -47.15625, -43.26171875, -39.3671875, -35.47265625, -31.578125, -27.68359375, -23.7890625, -19.89453125, -16.0, -12.10546875, -8.2109375, -4.31640625, -0.421875, 3.47265625, 7.3671875, 11.26171875, 15.15625, 19.05078125, 22.9453125, 26.83984375, 30.734375, 34.62890625, 38.5234375, 42.41796875, 46.3125, 50.20703125, 54.1015625, 57.99609375, 61.890625, 65.78515625, 69.6796875, 73.57421875, 77.46875, 81.36328125, 85.2578125, 89.15234375, 93.046875, 96.94140625, 100.8359375, 104.73046875, 108.625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 9.0, 13.0, 23.0, 26.0, 29.0, 54.0, 77.0, 162.0, 191.0, 126.0, 93.0, 59.0, 42.0, 15.0, 23.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.547995567321777, -8.305628776550293, -8.063262939453125, -7.820896625518799, -7.578530311584473, -7.3361639976501465, -7.09379768371582, -6.851430892944336, -6.609065055847168, -6.366698741912842, -6.124332427978516, -5.8819661140441895, -5.639599800109863, -5.397233486175537, -5.154867172241211, -4.912500381469727, -4.6701340675354, -4.427767753601074, -4.185401439666748, -3.943035125732422, -3.7006688117980957, -3.4583024978637695, -3.2159359455108643, -2.973569631576538, -2.731203317642212, -2.4888370037078857, -2.2464706897735596, -2.0041041374206543, -1.7617379426956177, -1.5193716287612915, -1.2770051956176758, -1.0346388816833496, -0.7922720909118652, -0.5499057769775391, -0.3075394034385681, -0.06517302989959717, 0.177193284034729, 0.4195595979690552, 0.6619260311126709, 0.9042923450469971, 1.1466586589813232, 1.3890249729156494, 1.6313912868499756, 1.8737577199935913, 2.116124153137207, 2.358490467071533, 2.6008567810058594, 2.8432230949401855, 3.0855894088745117, 3.327955722808838, 3.570322036743164, 3.8126883506774902, 4.055054664611816, 4.297420978546143, 4.539787292480469, 4.782154083251953, 5.024519920349121, 5.266886234283447, 5.509252548217773, 5.7516188621521, 5.993985176086426, 6.236351490020752, 6.478717803955078, 6.7210845947265625, 6.963450908660889]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 9.0, 7.0, 15.0, 10.0, 18.0, 25.0, 28.0, 25.0, 31.0, 28.0, 27.0, 27.0, 35.0, 46.0, 39.0, 39.0, 40.0, 44.0, 48.0, 43.0, 35.0, 38.0, 38.0, 33.0, 28.0, 28.0, 27.0, 17.0, 29.0, 19.0, 27.0, 17.0, 10.0, 14.0, 7.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8647117614746094, -3.7316665649414062, -3.598621368408203, -3.465576171875, -3.332530975341797, -3.1994857788085938, -3.0664408206939697, -2.9333956241607666, -2.8003504276275635, -2.6673052310943604, -2.5342600345611572, -2.401214838027954, -2.26816987991333, -2.135124683380127, -2.002079486846924, -1.8690342903137207, -1.7359890937805176, -1.6029438972473145, -1.4698987007141113, -1.3368536233901978, -1.2038084268569946, -1.0707632303237915, -0.9377180933952332, -0.8046729564666748, -0.6716277599334717, -0.5385825634002686, -0.4055374264717102, -0.27249225974082947, -0.13944709300994873, -0.0064018964767456055, 0.12664324045181274, 0.2596883773803711, 0.3927335739135742, 0.5257787704467773, 0.6588239073753357, 0.791869044303894, 0.9249142408370972, 1.0579594373703003, 1.1910045146942139, 1.324049711227417, 1.4570949077606201, 1.5901401042938232, 1.7231853008270264, 1.85623037815094, 1.989275574684143, 2.1223206520080566, 2.2553658485412598, 2.388411045074463, 2.521456241607666, 2.654501438140869, 2.7875466346740723, 2.9205918312072754, 3.0536370277404785, 3.1866822242736816, 3.3197271823883057, 3.452772378921509, 3.585817575454712, 3.718862771987915, 3.851907968521118, 3.9849531650543213, 4.117998123168945, 4.251043319702148, 4.384088516235352, 4.517133712768555, 4.650178909301758]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 10.0, 7.0, 12.0, 22.0, 19.0, 23.0, 28.0, 21.0, 33.0, 66.0, 47.0, 51.0, 53.0, 46.0, 69.0, 64.0, 55.0, 55.0, 56.0, 34.0, 39.0, 35.0, 27.0, 28.0, 22.0, 20.0, 18.0, 14.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.834686279296875, -2.73968505859375, -2.644683837890625, -2.5496826171875, -2.454681396484375, -2.35968017578125, -2.264678955078125, -2.169677734375, -2.074676513671875, -1.97967529296875, -1.884674072265625, -1.7896728515625, -1.694671630859375, -1.59967041015625, -1.504669189453125, -1.40966796875, -1.314666748046875, -1.21966552734375, -1.124664306640625, -1.0296630859375, -0.934661865234375, -0.83966064453125, -0.744659423828125, -0.649658203125, -0.554656982421875, -0.45965576171875, -0.364654541015625, -0.2696533203125, -0.174652099609375, -0.07965087890625, 0.015350341796875, 0.1103515625, 0.205352783203125, 0.30035400390625, 0.395355224609375, 0.4903564453125, 0.585357666015625, 0.68035888671875, 0.775360107421875, 0.870361328125, 0.965362548828125, 1.06036376953125, 1.155364990234375, 1.2503662109375, 1.345367431640625, 1.44036865234375, 1.535369873046875, 1.63037109375, 1.725372314453125, 1.82037353515625, 1.915374755859375, 2.0103759765625, 2.105377197265625, 2.20037841796875, 2.295379638671875, 2.390380859375, 2.485382080078125, 2.58038330078125, 2.675384521484375, 2.7703857421875, 2.865386962890625, 2.96038818359375, 3.055389404296875, 3.150390625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 25.0, 28.0, 47.0, 67.0, 115.0, 190.0, 260.0, 457.0, 706.0, 1206.0, 2049.0, 3518.0, 6397.0, 12337.0, 25738.0, 66906.0, 246401.0, 476009.0, 125749.0, 41750.0, 17990.0, 8979.0, 4929.0, 2607.0, 1598.0, 895.0, 601.0, 350.0, 235.0, 136.0, 97.0, 53.0, 42.0, 31.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.1973876953125, -3.088134765625, -2.9788818359375, -2.86962890625, -2.7603759765625, -2.651123046875, -2.5418701171875, -2.4326171875, -2.3233642578125, -2.214111328125, -2.1048583984375, -1.99560546875, -1.8863525390625, -1.777099609375, -1.6678466796875, -1.55859375, -1.4493408203125, -1.340087890625, -1.2308349609375, -1.12158203125, -1.0123291015625, -0.903076171875, -0.7938232421875, -0.6845703125, -0.5753173828125, -0.466064453125, -0.3568115234375, -0.24755859375, -0.1383056640625, -0.029052734375, 0.0802001953125, 0.189453125, 0.2987060546875, 0.407958984375, 0.5172119140625, 0.62646484375, 0.7357177734375, 0.844970703125, 0.9542236328125, 1.0634765625, 1.1727294921875, 1.281982421875, 1.3912353515625, 1.50048828125, 1.6097412109375, 1.718994140625, 1.8282470703125, 1.9375, 2.0467529296875, 2.156005859375, 2.2652587890625, 2.37451171875, 2.4837646484375, 2.593017578125, 2.7022705078125, 2.8115234375, 2.9207763671875, 3.030029296875, 3.1392822265625, 3.24853515625, 3.3577880859375, 3.467041015625, 3.5762939453125, 3.685546875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 10.0, 14.0, 7.0, 8.0, 9.0, 15.0, 19.0, 20.0, 13.0, 33.0, 24.0, 35.0, 32.0, 52.0, 56.0, 65.0, 94.0, 193.0, 1406.0, 330.0, 149.0, 81.0, 62.0, 51.0, 35.0, 35.0, 29.0, 29.0, 22.0, 23.0, 21.0, 11.0, 13.0, 11.0, 7.0, 3.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7589111328125, -6.486572265625, -6.2142333984375, -5.94189453125, -5.6695556640625, -5.397216796875, -5.1248779296875, -4.8525390625, -4.5802001953125, -4.307861328125, -4.0355224609375, -3.76318359375, -3.4908447265625, -3.218505859375, -2.9461669921875, -2.673828125, -2.4014892578125, -2.129150390625, -1.8568115234375, -1.58447265625, -1.3121337890625, -1.039794921875, -0.7674560546875, -0.4951171875, -0.2227783203125, 0.049560546875, 0.3218994140625, 0.59423828125, 0.8665771484375, 1.138916015625, 1.4112548828125, 1.68359375, 1.9559326171875, 2.228271484375, 2.5006103515625, 2.77294921875, 3.0452880859375, 3.317626953125, 3.5899658203125, 3.8623046875, 4.1346435546875, 4.406982421875, 4.6793212890625, 4.95166015625, 5.2239990234375, 5.496337890625, 5.7686767578125, 6.041015625, 6.3133544921875, 6.585693359375, 6.8580322265625, 7.13037109375, 7.4027099609375, 7.675048828125, 7.9473876953125, 8.2197265625, 8.4920654296875, 8.764404296875, 9.0367431640625, 9.30908203125, 9.5814208984375, 9.853759765625, 10.1260986328125, 10.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 14.0, 15.0, 14.0, 16.0, 18.0, 32.0, 44.0, 46.0, 61.0, 94.0, 137.0, 232.0, 461.0, 1187.0, 5278.0, 56616.0, 2670479.0, 391102.0, 15762.0, 2410.0, 680.0, 330.0, 179.0, 126.0, 91.0, 50.0, 50.0, 26.0, 25.0, 20.0, 19.0, 11.0, 15.0, 10.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-15.046875, -14.6260986328125, -14.205322265625, -13.7845458984375, -13.36376953125, -12.9429931640625, -12.522216796875, -12.1014404296875, -11.6806640625, -11.2598876953125, -10.839111328125, -10.4183349609375, -9.99755859375, -9.5767822265625, -9.156005859375, -8.7352294921875, -8.314453125, -7.8936767578125, -7.472900390625, -7.0521240234375, -6.63134765625, -6.2105712890625, -5.789794921875, -5.3690185546875, -4.9482421875, -4.5274658203125, -4.106689453125, -3.6859130859375, -3.26513671875, -2.8443603515625, -2.423583984375, -2.0028076171875, -1.58203125, -1.1612548828125, -0.740478515625, -0.3197021484375, 0.10107421875, 0.5218505859375, 0.942626953125, 1.3634033203125, 1.7841796875, 2.2049560546875, 2.625732421875, 3.0465087890625, 3.46728515625, 3.8880615234375, 4.308837890625, 4.7296142578125, 5.150390625, 5.5711669921875, 5.991943359375, 6.4127197265625, 6.83349609375, 7.2542724609375, 7.675048828125, 8.0958251953125, 8.5166015625, 8.9373779296875, 9.358154296875, 9.7789306640625, 10.19970703125, 10.6204833984375, 11.041259765625, 11.4620361328125, 11.8828125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [5.0, 445.0, 546.0, 19.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.746743202209473, -5.018730640411377, -0.29071807861328125, 4.437294960021973, 9.16530704498291, 13.893319129943848, 18.621334075927734, 23.349346160888672, 28.07735824584961, 32.80537033081055, 37.533382415771484, 42.26139831542969, 46.989410400390625, 51.71742248535156, 56.4454345703125, 61.17344665527344, 65.90145874023438, 70.62947082519531, 75.35748291015625, 80.08549499511719, 84.81350708007812, 89.54151916503906, 94.26953125, 98.99754333496094, 103.72555541992188, 108.45356750488281, 113.18157958984375, 117.90959167480469, 122.63760375976562, 127.36561584472656, 132.0936279296875, 136.82164001464844, 141.54966735839844, 146.27767944335938, 151.0056915283203, 155.73370361328125, 160.4617156982422, 165.18972778320312, 169.91773986816406, 174.645751953125, 179.37376403808594, 184.10177612304688, 188.8297882080078, 193.55780029296875, 198.2858123779297, 203.01382446289062, 207.74183654785156, 212.4698486328125, 217.1978759765625, 221.92588806152344, 226.65390014648438, 231.3819122314453, 236.10992431640625, 240.8379364013672, 245.56594848632812, 250.29396057128906, 255.02197265625, 259.75, 264.4779968261719, 269.2060241699219, 273.93402099609375, 278.66204833984375, 283.3900451660156, 288.1180725097656, 292.8460693359375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 10.0, 9.0, 14.0, 9.0, 11.0, 10.0, 13.0, 17.0, 26.0, 30.0, 29.0, 36.0, 31.0, 39.0, 41.0, 33.0, 50.0, 31.0, 32.0, 45.0, 51.0, 35.0, 49.0, 40.0, 29.0, 35.0, 25.0, 31.0, 24.0, 24.0, 31.0, 22.0, 17.0, 11.0, 13.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.77924156188965, -21.081886291503906, -20.384531021118164, -19.687175750732422, -18.989822387695312, -18.29246711730957, -17.595111846923828, -16.897756576538086, -16.200401306152344, -15.503046035766602, -14.805691719055176, -14.108336448669434, -13.410982131958008, -12.713626861572266, -12.016271591186523, -11.318916320800781, -10.621562957763672, -9.92420768737793, -9.226853370666504, -8.529498100280762, -7.832143306732178, -7.134788513183594, -6.437433242797852, -5.740078449249268, -5.042723655700684, -4.3453688621521, -3.6480138301849365, -2.9506587982177734, -2.2533040046691895, -1.5559492111206055, -0.8585939407348633, -0.1612391471862793, 0.5361175537109375, 1.233472466468811, 1.9308273792266846, 2.6281824111938477, 3.3255372047424316, 4.022891998291016, 4.720247268676758, 5.417602062225342, 6.114956855773926, 6.81231164932251, 7.509666442871094, 8.207021713256836, 8.904376983642578, 9.601731300354004, 10.299086570739746, 10.996440887451172, 11.693796157836914, 12.391151428222656, 13.088505744934082, 13.785861015319824, 14.48321533203125, 15.180570602416992, 15.877925872802734, 16.575281143188477, 17.27263641357422, 17.96999168395996, 18.667346954345703, 19.364700317382812, 20.062055587768555, 20.759410858154297, 21.45676612854004, 22.15412139892578, 22.85147476196289]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 15.0, 22.0, 15.0, 26.0, 28.0, 35.0, 30.0, 44.0, 54.0, 44.0, 45.0, 55.0, 49.0, 43.0, 58.0, 42.0, 55.0, 47.0, 41.0, 39.0, 31.0, 25.0, 28.0, 22.0, 16.0, 18.0, 19.0, 18.0, 9.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.45062255859375, -2.3621826171875, -2.27374267578125, -2.185302734375, -2.09686279296875, -2.0084228515625, -1.91998291015625, -1.83154296875, -1.74310302734375, -1.6546630859375, -1.56622314453125, -1.477783203125, -1.38934326171875, -1.3009033203125, -1.21246337890625, -1.1240234375, -1.03558349609375, -0.9471435546875, -0.85870361328125, -0.770263671875, -0.68182373046875, -0.5933837890625, -0.50494384765625, -0.41650390625, -0.32806396484375, -0.2396240234375, -0.15118408203125, -0.062744140625, 0.02569580078125, 0.1141357421875, 0.20257568359375, 0.291015625, 0.37945556640625, 0.4678955078125, 0.55633544921875, 0.644775390625, 0.73321533203125, 0.8216552734375, 0.91009521484375, 0.99853515625, 1.08697509765625, 1.1754150390625, 1.26385498046875, 1.352294921875, 1.44073486328125, 1.5291748046875, 1.61761474609375, 1.7060546875, 1.79449462890625, 1.8829345703125, 1.97137451171875, 2.059814453125, 2.14825439453125, 2.2366943359375, 2.32513427734375, 2.41357421875, 2.50201416015625, 2.5904541015625, 2.67889404296875, 2.767333984375, 2.85577392578125, 2.9442138671875, 3.03265380859375, 3.12109375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 10.0, 5.0, 7.0, 8.0, 14.0, 14.0, 33.0, 45.0, 62.0, 102.0, 172.0, 258.0, 393.0, 697.0, 1300.0, 2229.0, 4093.0, 7602.0, 14770.0, 29488.0, 68087.0, 313022.0, 2718772.0, 856636.0, 98117.0, 38020.0, 18534.0, 9578.0, 5301.0, 2836.0, 1590.0, 931.0, 547.0, 321.0, 244.0, 140.0, 94.0, 67.0, 38.0, 30.0, 16.0, 24.0, 14.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.2154541015625, -6.012939453125, -5.8104248046875, -5.60791015625, -5.4053955078125, -5.202880859375, -5.0003662109375, -4.7978515625, -4.5953369140625, -4.392822265625, -4.1903076171875, -3.98779296875, -3.7852783203125, -3.582763671875, -3.3802490234375, -3.177734375, -2.9752197265625, -2.772705078125, -2.5701904296875, -2.36767578125, -2.1651611328125, -1.962646484375, -1.7601318359375, -1.5576171875, -1.3551025390625, -1.152587890625, -0.9500732421875, -0.74755859375, -0.5450439453125, -0.342529296875, -0.1400146484375, 0.0625, 0.2650146484375, 0.467529296875, 0.6700439453125, 0.87255859375, 1.0750732421875, 1.277587890625, 1.4801025390625, 1.6826171875, 1.8851318359375, 2.087646484375, 2.2901611328125, 2.49267578125, 2.6951904296875, 2.897705078125, 3.1002197265625, 3.302734375, 3.5052490234375, 3.707763671875, 3.9102783203125, 4.11279296875, 4.3153076171875, 4.517822265625, 4.7203369140625, 4.9228515625, 5.1253662109375, 5.327880859375, 5.5303955078125, 5.73291015625, 5.9354248046875, 6.137939453125, 6.3404541015625, 6.54296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 16.0, 10.0, 21.0, 16.0, 49.0, 61.0, 74.0, 105.0, 148.0, 248.0, 491.0, 877.0, 816.0, 403.0, 208.0, 138.0, 91.0, 83.0, 58.0, 43.0, 32.0, 24.0, 16.0, 12.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.17938232421875, -5.9095458984375, -5.63970947265625, -5.369873046875, -5.10003662109375, -4.8302001953125, -4.56036376953125, -4.29052734375, -4.02069091796875, -3.7508544921875, -3.48101806640625, -3.211181640625, -2.94134521484375, -2.6715087890625, -2.40167236328125, -2.1318359375, -1.86199951171875, -1.5921630859375, -1.32232666015625, -1.052490234375, -0.78265380859375, -0.5128173828125, -0.24298095703125, 0.02685546875, 0.29669189453125, 0.5665283203125, 0.83636474609375, 1.106201171875, 1.37603759765625, 1.6458740234375, 1.91571044921875, 2.185546875, 2.45538330078125, 2.7252197265625, 2.99505615234375, 3.264892578125, 3.53472900390625, 3.8045654296875, 4.07440185546875, 4.34423828125, 4.61407470703125, 4.8839111328125, 5.15374755859375, 5.423583984375, 5.69342041015625, 5.9632568359375, 6.23309326171875, 6.5029296875, 6.77276611328125, 7.0426025390625, 7.31243896484375, 7.582275390625, 7.85211181640625, 8.1219482421875, 8.39178466796875, 8.66162109375, 8.93145751953125, 9.2012939453125, 9.47113037109375, 9.740966796875, 10.01080322265625, 10.2806396484375, 10.55047607421875, 10.8203125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 8.0, 25.0, 28.0, 56.0, 78.0, 108.0, 218.0, 492.0, 1378.0, 5216.0, 25015.0, 183040.0, 3617793.0, 315220.0, 35690.0, 6827.0, 1900.0, 572.0, 248.0, 139.0, 68.0, 49.0, 25.0, 20.0, 13.0, 12.0, 13.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.078125, -23.4700927734375, -22.862060546875, -22.2540283203125, -21.64599609375, -21.0379638671875, -20.429931640625, -19.8218994140625, -19.2138671875, -18.6058349609375, -17.997802734375, -17.3897705078125, -16.78173828125, -16.1737060546875, -15.565673828125, -14.9576416015625, -14.349609375, -13.7415771484375, -13.133544921875, -12.5255126953125, -11.91748046875, -11.3094482421875, -10.701416015625, -10.0933837890625, -9.4853515625, -8.8773193359375, -8.269287109375, -7.6612548828125, -7.05322265625, -6.4451904296875, -5.837158203125, -5.2291259765625, -4.62109375, -4.0130615234375, -3.405029296875, -2.7969970703125, -2.18896484375, -1.5809326171875, -0.972900390625, -0.3648681640625, 0.2431640625, 0.8511962890625, 1.459228515625, 2.0672607421875, 2.67529296875, 3.2833251953125, 3.891357421875, 4.4993896484375, 5.107421875, 5.7154541015625, 6.323486328125, 6.9315185546875, 7.53955078125, 8.1475830078125, 8.755615234375, 9.3636474609375, 9.9716796875, 10.5797119140625, 11.187744140625, 11.7957763671875, 12.40380859375, 13.0118408203125, 13.619873046875, 14.2279052734375, 14.8359375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 19.0, 25.0, 61.0, 87.0, 127.0, 152.0, 160.0, 102.0, 78.0, 58.0, 42.0, 31.0, 17.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-71.78440856933594, -70.34912872314453, -68.91385650634766, -67.47857666015625, -66.04330444335938, -64.60802459716797, -63.17274856567383, -61.73747253417969, -60.30219650268555, -58.866920471191406, -57.431644439697266, -55.996368408203125, -54.56108856201172, -53.12581253051758, -51.69053649902344, -50.2552604675293, -48.819984436035156, -47.384708404541016, -45.949432373046875, -44.514156341552734, -43.078880310058594, -41.64360046386719, -40.20832443237305, -38.773048400878906, -37.337772369384766, -35.902496337890625, -34.467220306396484, -33.031944274902344, -31.59666633605957, -30.16139030456543, -28.726112365722656, -27.290836334228516, -25.85555648803711, -24.42028045654297, -22.985004425048828, -21.549726486206055, -20.114450454711914, -18.679174423217773, -17.243896484375, -15.80862045288086, -14.373344421386719, -12.938068389892578, -11.502791404724121, -10.067514419555664, -8.632238388061523, -7.196961879730225, -5.761685371398926, -4.326408386230469, -2.891132354736328, -1.4558558464050293, -0.02057933807373047, 1.4146971702575684, 2.849973678588867, 4.285250186920166, 5.720526695251465, 7.155803680419922, 8.591079711914062, 10.026355743408203, 11.46163272857666, 12.896909713745117, 14.332185745239258, 15.767461776733398, 17.202739715576172, 18.638015747070312, 20.073291778564453]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 12.0, 6.0, 16.0, 14.0, 12.0, 16.0, 22.0, 25.0, 18.0, 24.0, 35.0, 35.0, 33.0, 45.0, 52.0, 38.0, 34.0, 42.0, 47.0, 46.0, 45.0, 34.0, 43.0, 38.0, 31.0, 30.0, 24.0, 20.0, 26.0, 18.0, 18.0, 15.0, 13.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.072383880615234, -20.38842010498047, -19.704458236694336, -19.02049446105957, -18.336532592773438, -17.652568817138672, -16.968605041503906, -16.284643173217773, -15.600679397583008, -14.916716575622559, -14.23275375366211, -13.548789978027344, -12.864827156066895, -12.180864334106445, -11.496901512145996, -10.812938690185547, -10.128975868225098, -9.445013046264648, -8.7610502243042, -8.07708740234375, -7.393123626708984, -6.709160804748535, -6.025197982788086, -5.3412346839904785, -4.657271862030029, -3.973308801651001, -3.2893457412719727, -2.6053829193115234, -1.9214198589324951, -1.2374567985534668, -0.5534939765930176, 0.13046932220458984, 0.8144321441650391, 1.4983952045440674, 2.1823582649230957, 2.866321086883545, 3.5502841472625732, 4.234247207641602, 4.918210029602051, 5.602173328399658, 6.286136150360107, 6.970098972320557, 7.654062271118164, 8.338025093078613, 9.021987915039062, 9.705951690673828, 10.389913558959961, 11.073877334594727, 11.757840156555176, 12.441802978515625, 13.125765800476074, 13.809728622436523, 14.493692398071289, 15.177655220031738, 15.861618041992188, 16.545581817626953, 17.229543685913086, 17.91350746154785, 18.597469329833984, 19.28143310546875, 19.965394973754883, 20.64935874938965, 21.33332061767578, 22.017284393310547, 22.701248168945312]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 9.0, 12.0, 21.0, 22.0, 33.0, 29.0, 31.0, 26.0, 41.0, 42.0, 46.0, 38.0, 50.0, 43.0, 49.0, 42.0, 36.0, 36.0, 43.0, 37.0, 39.0, 38.0, 41.0, 20.0, 20.0, 23.0, 10.0, 15.0, 13.0, 13.0, 19.0, 11.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.01641845703125, -1.9410400390625, -1.86566162109375, -1.790283203125, -1.71490478515625, -1.6395263671875, -1.56414794921875, -1.48876953125, -1.41339111328125, -1.3380126953125, -1.26263427734375, -1.187255859375, -1.11187744140625, -1.0364990234375, -0.96112060546875, -0.8857421875, -0.81036376953125, -0.7349853515625, -0.65960693359375, -0.584228515625, -0.50885009765625, -0.4334716796875, -0.35809326171875, -0.28271484375, -0.20733642578125, -0.1319580078125, -0.05657958984375, 0.018798828125, 0.09417724609375, 0.1695556640625, 0.24493408203125, 0.3203125, 0.39569091796875, 0.4710693359375, 0.54644775390625, 0.621826171875, 0.69720458984375, 0.7725830078125, 0.84796142578125, 0.92333984375, 0.99871826171875, 1.0740966796875, 1.14947509765625, 1.224853515625, 1.30023193359375, 1.3756103515625, 1.45098876953125, 1.5263671875, 1.60174560546875, 1.6771240234375, 1.75250244140625, 1.827880859375, 1.90325927734375, 1.9786376953125, 2.05401611328125, 2.12939453125, 2.20477294921875, 2.2801513671875, 2.35552978515625, 2.430908203125, 2.50628662109375, 2.5816650390625, 2.65704345703125, 2.732421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 9.0, 21.0, 34.0, 41.0, 70.0, 107.0, 125.0, 202.0, 280.0, 413.0, 605.0, 861.0, 1276.0, 1938.0, 2866.0, 4366.0, 6850.0, 10855.0, 18139.0, 31267.0, 61641.0, 279036.0, 471134.0, 70173.0, 34022.0, 19223.0, 11804.0, 7232.0, 4612.0, 3025.0, 1917.0, 1341.0, 889.0, 683.0, 427.0, 301.0, 215.0, 161.0, 105.0, 71.0, 63.0, 41.0, 29.0, 19.0, 13.0, 11.0, 7.0, 0.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.8828125, -9.5428466796875, -9.202880859375, -8.8629150390625, -8.52294921875, -8.1829833984375, -7.843017578125, -7.5030517578125, -7.1630859375, -6.8231201171875, -6.483154296875, -6.1431884765625, -5.80322265625, -5.4632568359375, -5.123291015625, -4.7833251953125, -4.443359375, -4.1033935546875, -3.763427734375, -3.4234619140625, -3.08349609375, -2.7435302734375, -2.403564453125, -2.0635986328125, -1.7236328125, -1.3836669921875, -1.043701171875, -0.7037353515625, -0.36376953125, -0.0238037109375, 0.316162109375, 0.6561279296875, 0.99609375, 1.3360595703125, 1.676025390625, 2.0159912109375, 2.35595703125, 2.6959228515625, 3.035888671875, 3.3758544921875, 3.7158203125, 4.0557861328125, 4.395751953125, 4.7357177734375, 5.07568359375, 5.4156494140625, 5.755615234375, 6.0955810546875, 6.435546875, 6.7755126953125, 7.115478515625, 7.4554443359375, 7.79541015625, 8.1353759765625, 8.475341796875, 8.8153076171875, 9.1552734375, 9.4952392578125, 9.835205078125, 10.1751708984375, 10.51513671875, 10.8551025390625, 11.195068359375, 11.5350341796875, 11.875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 13.0, 14.0, 11.0, 18.0, 11.0, 20.0, 19.0, 32.0, 41.0, 28.0, 41.0, 31.0, 48.0, 46.0, 45.0, 47.0, 1062.0, 48.0, 33.0, 30.0, 36.0, 41.0, 29.0, 33.0, 24.0, 30.0, 23.0, 19.0, 24.0, 18.0, 11.0, 8.0, 9.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.78515625, -1.7266693115234375, -1.668182373046875, -1.6096954345703125, -1.55120849609375, -1.4927215576171875, -1.434234619140625, -1.3757476806640625, -1.3172607421875, -1.2587738037109375, -1.200286865234375, -1.1417999267578125, -1.08331298828125, -1.0248260498046875, -0.966339111328125, -0.9078521728515625, -0.849365234375, -0.7908782958984375, -0.732391357421875, -0.6739044189453125, -0.61541748046875, -0.5569305419921875, -0.498443603515625, -0.4399566650390625, -0.3814697265625, -0.3229827880859375, -0.264495849609375, -0.2060089111328125, -0.14752197265625, -0.0890350341796875, -0.030548095703125, 0.0279388427734375, 0.08642578125, 0.1449127197265625, 0.203399658203125, 0.2618865966796875, 0.32037353515625, 0.3788604736328125, 0.437347412109375, 0.4958343505859375, 0.5543212890625, 0.6128082275390625, 0.671295166015625, 0.7297821044921875, 0.78826904296875, 0.8467559814453125, 0.905242919921875, 0.9637298583984375, 1.022216796875, 1.0807037353515625, 1.139190673828125, 1.1976776123046875, 1.25616455078125, 1.3146514892578125, 1.373138427734375, 1.4316253662109375, 1.4901123046875, 1.5485992431640625, 1.607086181640625, 1.6655731201171875, 1.72406005859375, 1.7825469970703125, 1.841033935546875, 1.8995208740234375, 1.9580078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 7.0, 4.0, 6.0, 14.0, 20.0, 30.0, 45.0, 54.0, 89.0, 128.0, 264.0, 375.0, 619.0, 937.0, 1589.0, 2993.0, 9093.0, 68365.0, 1954137.0, 44092.0, 7409.0, 2758.0, 1510.0, 929.0, 571.0, 346.0, 251.0, 162.0, 130.0, 67.0, 32.0, 36.0, 13.0, 15.0, 14.0, 7.0, 5.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.8359375, -37.515625, -36.1953125, -34.875, -33.5546875, -32.234375, -30.9140625, -29.59375, -28.2734375, -26.953125, -25.6328125, -24.3125, -22.9921875, -21.671875, -20.3515625, -19.03125, -17.7109375, -16.390625, -15.0703125, -13.75, -12.4296875, -11.109375, -9.7890625, -8.46875, -7.1484375, -5.828125, -4.5078125, -3.1875, -1.8671875, -0.546875, 0.7734375, 2.09375, 3.4140625, 4.734375, 6.0546875, 7.375, 8.6953125, 10.015625, 11.3359375, 12.65625, 13.9765625, 15.296875, 16.6171875, 17.9375, 19.2578125, 20.578125, 21.8984375, 23.21875, 24.5390625, 25.859375, 27.1796875, 28.5, 29.8203125, 31.140625, 32.4609375, 33.78125, 35.1015625, 36.421875, 37.7421875, 39.0625, 40.3828125, 41.703125, 43.0234375, 44.34375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 24.0, 47.0, 752.0, 76.0, 30.0, 19.0, 8.0, 10.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.828857421875, -10.42333984375, -10.017822265625, -9.6123046875, -9.206787109375, -8.80126953125, -8.395751953125, -7.990234375, -7.584716796875, -7.17919921875, -6.773681640625, -6.3681640625, -5.962646484375, -5.55712890625, -5.151611328125, -4.74609375, -4.340576171875, -3.93505859375, -3.529541015625, -3.1240234375, -2.718505859375, -2.31298828125, -1.907470703125, -1.501953125, -1.096435546875, -0.69091796875, -0.285400390625, 0.1201171875, 0.525634765625, 0.93115234375, 1.336669921875, 1.7421875, 2.147705078125, 2.55322265625, 2.958740234375, 3.3642578125, 3.769775390625, 4.17529296875, 4.580810546875, 4.986328125, 5.391845703125, 5.79736328125, 6.202880859375, 6.6083984375, 7.013916015625, 7.41943359375, 7.824951171875, 8.23046875, 8.635986328125, 9.04150390625, 9.447021484375, 9.8525390625, 10.258056640625, 10.66357421875, 11.069091796875, 11.474609375, 11.880126953125, 12.28564453125, 12.691162109375, 13.0966796875, 13.502197265625, 13.90771484375, 14.313232421875, 14.71875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 23.0, 64.0, 236.0, 1200.0, 14160.0, 1028432.0, 3671.0, 491.0, 125.0, 53.0, 22.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-244.375, -237.63671875, -230.8984375, -224.16015625, -217.421875, -210.68359375, -203.9453125, -197.20703125, -190.46875, -183.73046875, -176.9921875, -170.25390625, -163.515625, -156.77734375, -150.0390625, -143.30078125, -136.5625, -129.82421875, -123.0859375, -116.34765625, -109.609375, -102.87109375, -96.1328125, -89.39453125, -82.65625, -75.91796875, -69.1796875, -62.44140625, -55.703125, -48.96484375, -42.2265625, -35.48828125, -28.75, -22.01171875, -15.2734375, -8.53515625, -1.796875, 4.94140625, 11.6796875, 18.41796875, 25.15625, 31.89453125, 38.6328125, 45.37109375, 52.109375, 58.84765625, 65.5859375, 72.32421875, 79.0625, 85.80078125, 92.5390625, 99.27734375, 106.015625, 112.75390625, 119.4921875, 126.23046875, 132.96875, 139.70703125, 146.4453125, 153.18359375, 159.921875, 166.66015625, 173.3984375, 180.13671875, 186.875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 13.0, 16.0, 11.0, 9.0, 13.0, 16.0, 22.0, 38.0, 58.0, 63.0, 89.0, 135.0, 133.0, 78.0, 65.0, 43.0, 37.0, 40.0, 19.0, 21.0, 17.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.570699691772461, -6.352674961090088, -6.134650230407715, -5.916625499725342, -5.698600769042969, -5.480576038360596, -5.262551307678223, -5.044526100158691, -4.826501846313477, -4.6084771156311035, -4.3904523849487305, -4.172427654266357, -3.9544029235839844, -3.7363781929016113, -3.518353223800659, -3.300328493118286, -3.082303524017334, -2.864278793334961, -2.646254062652588, -2.428229331970215, -2.210204601287842, -1.9921797513961792, -1.7741549015045166, -1.5561301708221436, -1.3381054401397705, -1.1200807094573975, -0.9020559191703796, -0.6840311288833618, -0.46600639820098877, -0.24798166751861572, -0.029956817626953125, 0.18806791305541992, 0.40609264373779297, 0.624117374420166, 0.8421421647071838, 1.0601669549942017, 1.2781916856765747, 1.4962164163589478, 1.7142412662506104, 1.9322659969329834, 2.1502907276153564, 2.3683154582977295, 2.5863401889801025, 2.8043651580810547, 3.0223898887634277, 3.240414619445801, 3.458439350128174, 3.676464080810547, 3.89448881149292, 4.112513542175293, 4.330538272857666, 4.548563003540039, 4.766587734222412, 4.984612464904785, 5.202637672424316, 5.420661926269531, 5.6386871337890625, 5.8567118644714355, 6.074736595153809, 6.292761325836182, 6.510786056518555, 6.728810787200928, 6.946835517883301, 7.164860725402832, 7.382884979248047]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 6.0, 18.0, 11.0, 14.0, 18.0, 25.0, 23.0, 37.0, 28.0, 39.0, 42.0, 41.0, 40.0, 32.0, 51.0, 59.0, 50.0, 41.0, 48.0, 49.0, 39.0, 45.0, 40.0, 35.0, 26.0, 26.0, 23.0, 16.0, 18.0, 21.0, 7.0, 6.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.732614040374756, -6.518804550170898, -6.304995059967041, -6.091185569763184, -5.877376079559326, -5.663566589355469, -5.449756622314453, -5.235947132110596, -5.022137641906738, -4.808328151702881, -4.594518661499023, -4.380709171295166, -4.166899681091309, -3.953089952468872, -3.7392804622650146, -3.525470733642578, -3.3116614818573, -3.0978519916534424, -2.884042501449585, -2.6702327728271484, -2.456423282623291, -2.2426137924194336, -2.028804302215576, -1.8149946928024292, -1.6011852025985718, -1.3873757123947144, -1.1735661029815674, -0.95975661277771, -0.7459470629692078, -0.5321375131607056, -0.31832802295684814, -0.10451841354370117, 0.10929107666015625, 0.32310062646865845, 0.5369101762771606, 0.7507196664810181, 0.9645292162895203, 1.1783387660980225, 1.3921482563018799, 1.6059578657150269, 1.8197673559188843, 2.0335769653320312, 2.2473864555358887, 2.461195945739746, 2.6750054359436035, 2.888814926147461, 3.1026244163513184, 3.316434144973755, 3.5302436351776123, 3.7440531253814697, 3.957862615585327, 4.171672344207764, 4.385481834411621, 4.5992913246154785, 4.813100814819336, 5.026910305023193, 5.240719795227051, 5.454529285430908, 5.668338775634766, 5.882148265838623, 6.0959577560424805, 6.309767723083496, 6.523576736450195, 6.737386703491211, 6.951196193695068]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 13.0, 8.0, 19.0, 21.0, 22.0, 34.0, 38.0, 37.0, 32.0, 33.0, 38.0, 45.0, 59.0, 52.0, 46.0, 48.0, 51.0, 40.0, 52.0, 48.0, 36.0, 32.0, 26.0, 21.0, 23.0, 15.0, 24.0, 20.0, 14.0, 12.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.208892822265625, -2.11700439453125, -2.025115966796875, -1.9332275390625, -1.841339111328125, -1.74945068359375, -1.657562255859375, -1.565673828125, -1.473785400390625, -1.38189697265625, -1.290008544921875, -1.1981201171875, -1.106231689453125, -1.01434326171875, -0.922454833984375, -0.83056640625, -0.738677978515625, -0.64678955078125, -0.554901123046875, -0.4630126953125, -0.371124267578125, -0.27923583984375, -0.187347412109375, -0.095458984375, -0.003570556640625, 0.08831787109375, 0.180206298828125, 0.2720947265625, 0.363983154296875, 0.45587158203125, 0.547760009765625, 0.6396484375, 0.731536865234375, 0.82342529296875, 0.915313720703125, 1.0072021484375, 1.099090576171875, 1.19097900390625, 1.282867431640625, 1.374755859375, 1.466644287109375, 1.55853271484375, 1.650421142578125, 1.7423095703125, 1.834197998046875, 1.92608642578125, 2.017974853515625, 2.10986328125, 2.201751708984375, 2.29364013671875, 2.385528564453125, 2.4774169921875, 2.569305419921875, 2.66119384765625, 2.753082275390625, 2.844970703125, 2.936859130859375, 3.02874755859375, 3.120635986328125, 3.2125244140625, 3.304412841796875, 3.39630126953125, 3.488189697265625, 3.580078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 6.0, 18.0, 13.0, 32.0, 30.0, 56.0, 101.0, 132.0, 172.0, 252.0, 400.0, 597.0, 961.0, 1644.0, 2753.0, 4945.0, 9217.0, 18896.0, 42575.0, 133776.0, 597327.0, 147421.0, 45071.0, 19758.0, 9770.0, 5147.0, 2909.0, 1723.0, 1011.0, 675.0, 371.0, 258.0, 162.0, 100.0, 86.0, 59.0, 38.0, 14.0, 22.0, 10.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.05963134765625, -4.8614501953125, -4.66326904296875, -4.465087890625, -4.26690673828125, -4.0687255859375, -3.87054443359375, -3.67236328125, -3.47418212890625, -3.2760009765625, -3.07781982421875, -2.879638671875, -2.68145751953125, -2.4832763671875, -2.28509521484375, -2.0869140625, -1.88873291015625, -1.6905517578125, -1.49237060546875, -1.294189453125, -1.09600830078125, -0.8978271484375, -0.69964599609375, -0.50146484375, -0.30328369140625, -0.1051025390625, 0.09307861328125, 0.291259765625, 0.48944091796875, 0.6876220703125, 0.88580322265625, 1.083984375, 1.28216552734375, 1.4803466796875, 1.67852783203125, 1.876708984375, 2.07489013671875, 2.2730712890625, 2.47125244140625, 2.66943359375, 2.86761474609375, 3.0657958984375, 3.26397705078125, 3.462158203125, 3.66033935546875, 3.8585205078125, 4.05670166015625, 4.2548828125, 4.45306396484375, 4.6512451171875, 4.84942626953125, 5.047607421875, 5.24578857421875, 5.4439697265625, 5.64215087890625, 5.84033203125, 6.03851318359375, 6.2366943359375, 6.43487548828125, 6.633056640625, 6.83123779296875, 7.0294189453125, 7.22760009765625, 7.42578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 18.0, 33.0, 25.0, 26.0, 25.0, 31.0, 41.0, 41.0, 72.0, 71.0, 95.0, 146.0, 1424.0, 360.0, 131.0, 93.0, 70.0, 52.0, 45.0, 39.0, 35.0, 35.0, 21.0, 15.0, 16.0, 15.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.307373046875, -8.97412109375, -8.640869140625, -8.3076171875, -7.974365234375, -7.64111328125, -7.307861328125, -6.974609375, -6.641357421875, -6.30810546875, -5.974853515625, -5.6416015625, -5.308349609375, -4.97509765625, -4.641845703125, -4.30859375, -3.975341796875, -3.64208984375, -3.308837890625, -2.9755859375, -2.642333984375, -2.30908203125, -1.975830078125, -1.642578125, -1.309326171875, -0.97607421875, -0.642822265625, -0.3095703125, 0.023681640625, 0.35693359375, 0.690185546875, 1.0234375, 1.356689453125, 1.68994140625, 2.023193359375, 2.3564453125, 2.689697265625, 3.02294921875, 3.356201171875, 3.689453125, 4.022705078125, 4.35595703125, 4.689208984375, 5.0224609375, 5.355712890625, 5.68896484375, 6.022216796875, 6.35546875, 6.688720703125, 7.02197265625, 7.355224609375, 7.6884765625, 8.021728515625, 8.35498046875, 8.688232421875, 9.021484375, 9.354736328125, 9.68798828125, 10.021240234375, 10.3544921875, 10.687744140625, 11.02099609375, 11.354248046875, 11.6875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 17.0, 13.0, 11.0, 19.0, 22.0, 27.0, 32.0, 37.0, 55.0, 111.0, 156.0, 276.0, 766.0, 2423.0, 11071.0, 82469.0, 2693648.0, 322074.0, 25543.0, 4646.0, 1220.0, 427.0, 214.0, 118.0, 61.0, 41.0, 43.0, 32.0, 27.0, 20.0, 17.0, 9.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.797119140625, -16.25048828125, -15.703857421875, -15.1572265625, -14.610595703125, -14.06396484375, -13.517333984375, -12.970703125, -12.424072265625, -11.87744140625, -11.330810546875, -10.7841796875, -10.237548828125, -9.69091796875, -9.144287109375, -8.59765625, -8.051025390625, -7.50439453125, -6.957763671875, -6.4111328125, -5.864501953125, -5.31787109375, -4.771240234375, -4.224609375, -3.677978515625, -3.13134765625, -2.584716796875, -2.0380859375, -1.491455078125, -0.94482421875, -0.398193359375, 0.1484375, 0.695068359375, 1.24169921875, 1.788330078125, 2.3349609375, 2.881591796875, 3.42822265625, 3.974853515625, 4.521484375, 5.068115234375, 5.61474609375, 6.161376953125, 6.7080078125, 7.254638671875, 7.80126953125, 8.347900390625, 8.89453125, 9.441162109375, 9.98779296875, 10.534423828125, 11.0810546875, 11.627685546875, 12.17431640625, 12.720947265625, 13.267578125, 13.814208984375, 14.36083984375, 14.907470703125, 15.4541015625, 16.000732421875, 16.54736328125, 17.093994140625, 17.640625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 33.0, 93.0, 201.0, 300.0, 207.0, 122.0, 37.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96629524230957, -25.113798141479492, -23.261301040649414, -21.408803939819336, -19.556306838989258, -17.70380973815918, -15.851312637329102, -13.998815536499023, -12.146318435668945, -10.293821334838867, -8.441324234008789, -6.588827133178711, -4.736330032348633, -2.8838329315185547, -1.0313358306884766, 0.8211612701416016, 2.6736583709716797, 4.526155471801758, 6.378652572631836, 8.231149673461914, 10.083646774291992, 11.93614387512207, 13.788640975952148, 15.641138076782227, 17.493635177612305, 19.346132278442383, 21.19862937927246, 23.05112648010254, 24.903623580932617, 26.756120681762695, 28.608617782592773, 30.46111488342285, 32.31361389160156, 34.16611099243164, 36.01860809326172, 37.8711051940918, 39.723602294921875, 41.57609939575195, 43.42859649658203, 45.28109359741211, 47.13359069824219, 48.986087799072266, 50.838584899902344, 52.69108200073242, 54.5435791015625, 56.39607620239258, 58.248573303222656, 60.101070404052734, 61.95356750488281, 63.80606460571289, 65.65856170654297, 67.51106262207031, 69.36355590820312, 71.21604919433594, 73.06855010986328, 74.92105102539062, 76.77354431152344, 78.62603759765625, 80.4785385131836, 82.33103942871094, 84.18353271484375, 86.03602600097656, 87.8885269165039, 89.74102783203125, 91.59352111816406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 11.0, 16.0, 13.0, 31.0, 22.0, 18.0, 26.0, 26.0, 35.0, 36.0, 36.0, 40.0, 45.0, 37.0, 49.0, 56.0, 41.0, 31.0, 40.0, 36.0, 32.0, 35.0, 24.0, 27.0, 29.0, 20.0, 24.0, 19.0, 22.0, 13.0, 15.0, 20.0, 8.0, 7.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.59970474243164, -25.747615814208984, -24.89552879333496, -24.043439865112305, -23.19135284423828, -22.339263916015625, -21.48717498779297, -20.635087966918945, -19.78299903869629, -18.930910110473633, -18.07882308959961, -17.226734161376953, -16.37464714050293, -15.522558212280273, -14.670470237731934, -13.818382263183594, -12.966294288635254, -12.114206314086914, -11.262118339538574, -10.410030364990234, -9.557941436767578, -8.705853462219238, -7.853765487670898, -7.0016770362854, -6.1495890617370605, -5.297501087188721, -4.445412635803223, -3.593324661254883, -2.741236448287964, -1.889148235321045, -1.037060260772705, -0.18497180938720703, 0.6671161651611328, 1.5192043781280518, 2.3712925910949707, 3.2233805656433105, 4.075469017028809, 4.927556991577148, 5.779644966125488, 6.631733417510986, 7.483821392059326, 8.335909843444824, 9.187997817993164, 10.040085792541504, 10.892173767089844, 11.7442626953125, 12.596349716186523, 13.44843864440918, 14.30052661895752, 15.15261459350586, 16.004703521728516, 16.85679054260254, 17.708879470825195, 18.56096649169922, 19.413055419921875, 20.26514434814453, 21.117231369018555, 21.96932029724121, 22.821407318115234, 23.67349624633789, 24.525583267211914, 25.37767219543457, 26.229759216308594, 27.08184814453125, 27.933937072753906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 13.0, 13.0, 18.0, 28.0, 22.0, 33.0, 30.0, 23.0, 45.0, 43.0, 43.0, 45.0, 48.0, 65.0, 42.0, 37.0, 42.0, 46.0, 43.0, 47.0, 32.0, 27.0, 30.0, 25.0, 20.0, 19.0, 22.0, 17.0, 16.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.393798828125, -2.29736328125, -2.200927734375, -2.1044921875, -2.008056640625, -1.91162109375, -1.815185546875, -1.71875, -1.622314453125, -1.52587890625, -1.429443359375, -1.3330078125, -1.236572265625, -1.14013671875, -1.043701171875, -0.947265625, -0.850830078125, -0.75439453125, -0.657958984375, -0.5615234375, -0.465087890625, -0.36865234375, -0.272216796875, -0.17578125, -0.079345703125, 0.01708984375, 0.113525390625, 0.2099609375, 0.306396484375, 0.40283203125, 0.499267578125, 0.595703125, 0.692138671875, 0.78857421875, 0.885009765625, 0.9814453125, 1.077880859375, 1.17431640625, 1.270751953125, 1.3671875, 1.463623046875, 1.56005859375, 1.656494140625, 1.7529296875, 1.849365234375, 1.94580078125, 2.042236328125, 2.138671875, 2.235107421875, 2.33154296875, 2.427978515625, 2.5244140625, 2.620849609375, 2.71728515625, 2.813720703125, 2.91015625, 3.006591796875, 3.10302734375, 3.199462890625, 3.2958984375, 3.392333984375, 3.48876953125, 3.585205078125, 3.681640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 12.0, 14.0, 24.0, 18.0, 46.0, 62.0, 74.0, 154.0, 200.0, 335.0, 483.0, 776.0, 1200.0, 2117.0, 3588.0, 6547.0, 11816.0, 23213.0, 52388.0, 198159.0, 1589525.0, 1964535.0, 230896.0, 54733.0, 24184.0, 12369.0, 6673.0, 3784.0, 2243.0, 1365.0, 910.0, 570.0, 369.0, 271.0, 175.0, 126.0, 91.0, 68.0, 35.0, 36.0, 21.0, 20.0, 13.0, 9.0, 10.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.4140625, -5.2210693359375, -5.028076171875, -4.8350830078125, -4.64208984375, -4.4490966796875, -4.256103515625, -4.0631103515625, -3.8701171875, -3.6771240234375, -3.484130859375, -3.2911376953125, -3.09814453125, -2.9051513671875, -2.712158203125, -2.5191650390625, -2.326171875, -2.1331787109375, -1.940185546875, -1.7471923828125, -1.55419921875, -1.3612060546875, -1.168212890625, -0.9752197265625, -0.7822265625, -0.5892333984375, -0.396240234375, -0.2032470703125, -0.01025390625, 0.1827392578125, 0.375732421875, 0.5687255859375, 0.76171875, 0.9547119140625, 1.147705078125, 1.3406982421875, 1.53369140625, 1.7266845703125, 1.919677734375, 2.1126708984375, 2.3056640625, 2.4986572265625, 2.691650390625, 2.8846435546875, 3.07763671875, 3.2706298828125, 3.463623046875, 3.6566162109375, 3.849609375, 4.0426025390625, 4.235595703125, 4.4285888671875, 4.62158203125, 4.8145751953125, 5.007568359375, 5.2005615234375, 5.3935546875, 5.5865478515625, 5.779541015625, 5.9725341796875, 6.16552734375, 6.3585205078125, 6.551513671875, 6.7445068359375, 6.9375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 18.0, 19.0, 31.0, 39.0, 49.0, 84.0, 113.0, 172.0, 371.0, 713.0, 940.0, 643.0, 312.0, 153.0, 109.0, 82.0, 60.0, 38.0, 41.0, 12.0, 12.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3641357421875, -9.056396484375, -8.7486572265625, -8.44091796875, -8.1331787109375, -7.825439453125, -7.5177001953125, -7.2099609375, -6.9022216796875, -6.594482421875, -6.2867431640625, -5.97900390625, -5.6712646484375, -5.363525390625, -5.0557861328125, -4.748046875, -4.4403076171875, -4.132568359375, -3.8248291015625, -3.51708984375, -3.2093505859375, -2.901611328125, -2.5938720703125, -2.2861328125, -1.9783935546875, -1.670654296875, -1.3629150390625, -1.05517578125, -0.7474365234375, -0.439697265625, -0.1319580078125, 0.17578125, 0.4835205078125, 0.791259765625, 1.0989990234375, 1.40673828125, 1.7144775390625, 2.022216796875, 2.3299560546875, 2.6376953125, 2.9454345703125, 3.253173828125, 3.5609130859375, 3.86865234375, 4.1763916015625, 4.484130859375, 4.7918701171875, 5.099609375, 5.4073486328125, 5.715087890625, 6.0228271484375, 6.33056640625, 6.6383056640625, 6.946044921875, 7.2537841796875, 7.5615234375, 7.8692626953125, 8.177001953125, 8.4847412109375, 8.79248046875, 9.1002197265625, 9.407958984375, 9.7156982421875, 10.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 10.0, 32.0, 32.0, 50.0, 86.0, 174.0, 341.0, 681.0, 1664.0, 4676.0, 16562.0, 79864.0, 1387124.0, 2567562.0, 105722.0, 20632.0, 5629.0, 1860.0, 769.0, 370.0, 176.0, 104.0, 60.0, 29.0, 24.0, 8.0, 13.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.439697265625, -15.91064453125, -15.381591796875, -14.8525390625, -14.323486328125, -13.79443359375, -13.265380859375, -12.736328125, -12.207275390625, -11.67822265625, -11.149169921875, -10.6201171875, -10.091064453125, -9.56201171875, -9.032958984375, -8.50390625, -7.974853515625, -7.44580078125, -6.916748046875, -6.3876953125, -5.858642578125, -5.32958984375, -4.800537109375, -4.271484375, -3.742431640625, -3.21337890625, -2.684326171875, -2.1552734375, -1.626220703125, -1.09716796875, -0.568115234375, -0.0390625, 0.489990234375, 1.01904296875, 1.548095703125, 2.0771484375, 2.606201171875, 3.13525390625, 3.664306640625, 4.193359375, 4.722412109375, 5.25146484375, 5.780517578125, 6.3095703125, 6.838623046875, 7.36767578125, 7.896728515625, 8.42578125, 8.954833984375, 9.48388671875, 10.012939453125, 10.5419921875, 11.071044921875, 11.60009765625, 12.129150390625, 12.658203125, 13.187255859375, 13.71630859375, 14.245361328125, 14.7744140625, 15.303466796875, 15.83251953125, 16.361572265625, 16.890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 18.0, 24.0, 28.0, 41.0, 54.0, 73.0, 111.0, 142.0, 130.0, 103.0, 83.0, 70.0, 36.0, 25.0, 24.0, 18.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.594764709472656, -34.35810470581055, -33.12144088745117, -31.88477897644043, -30.648117065429688, -29.411457061767578, -28.174795150756836, -26.938133239746094, -25.70147132873535, -24.46480941772461, -23.228147506713867, -21.991485595703125, -20.754825592041016, -19.51816177368164, -18.28150177001953, -17.04483985900879, -15.808177947998047, -14.571516036987305, -13.334854125976562, -12.098193168640137, -10.861531257629395, -9.624869346618652, -8.388208389282227, -7.151546478271484, -5.914884567260742, -4.67822265625, -3.441561222076416, -2.204899549484253, -0.9682378768920898, 0.26842403411865234, 1.5050854682922363, 2.7417469024658203, 3.978412628173828, 5.21507453918457, 6.451735973358154, 7.688397407531738, 8.92505931854248, 10.161721229553223, 11.398382186889648, 12.63504409790039, 13.871706008911133, 15.108367919921875, 16.345029830932617, 17.58169174194336, 18.81835174560547, 20.055015563964844, 21.291675567626953, 22.528337478637695, 23.764999389648438, 25.00166130065918, 26.238323211669922, 27.474985122680664, 28.711647033691406, 29.948307037353516, 31.184968948364258, 32.421630859375, 33.658294677734375, 34.894954681396484, 36.13161849975586, 37.36827850341797, 38.604942321777344, 39.84160232543945, 41.07826614379883, 42.31492614746094, 43.55158615112305]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 3.0, 7.0, 13.0, 12.0, 11.0, 13.0, 19.0, 19.0, 22.0, 25.0, 31.0, 28.0, 37.0, 32.0, 25.0, 40.0, 42.0, 41.0, 42.0, 27.0, 40.0, 34.0, 41.0, 37.0, 37.0, 40.0, 35.0, 24.0, 24.0, 29.0, 12.0, 25.0, 18.0, 14.0, 16.0, 16.0, 10.0, 15.0, 8.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-22.668424606323242, -21.979143142700195, -21.28986167907715, -20.6005802154541, -19.911298751831055, -19.222017288208008, -18.532737731933594, -17.843456268310547, -17.1541748046875, -16.464893341064453, -15.775611877441406, -15.08633041381836, -14.397048950195312, -13.707767486572266, -13.018486976623535, -12.329205513000488, -11.639923095703125, -10.950641632080078, -10.261360168457031, -9.572078704833984, -8.882797241210938, -8.19351577758789, -7.50423526763916, -6.814953804016113, -6.125672340393066, -5.4363908767700195, -4.747109413146973, -4.057828426361084, -3.368546962738037, -2.6792654991149902, -1.9899845123291016, -1.3007030487060547, -0.6114234924316406, 0.0778578519821167, 0.767139196395874, 1.4564204216003418, 2.1457018852233887, 2.8349833488464355, 3.524264335632324, 4.213545799255371, 4.902827262878418, 5.592108726501465, 6.281390190124512, 6.9706711769104, 7.659952640533447, 8.349233627319336, 9.038515090942383, 9.72779655456543, 10.417078018188477, 11.106359481811523, 11.79564094543457, 12.484922409057617, 13.174203872680664, 13.863485336303711, 14.552765846252441, 15.242047309875488, 15.931328773498535, 16.620609283447266, 17.309890747070312, 17.99917221069336, 18.688453674316406, 19.377735137939453, 20.0670166015625, 20.756298065185547, 21.445579528808594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 14.0, 19.0, 21.0, 22.0, 15.0, 28.0, 26.0, 28.0, 34.0, 38.0, 29.0, 40.0, 30.0, 38.0, 40.0, 39.0, 41.0, 34.0, 35.0, 35.0, 37.0, 29.0, 35.0, 33.0, 14.0, 22.0, 20.0, 26.0, 16.0, 24.0, 19.0, 14.0, 5.0, 6.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.296875, -2.2203369140625, -2.143798828125, -2.0672607421875, -1.99072265625, -1.9141845703125, -1.837646484375, -1.7611083984375, -1.6845703125, -1.6080322265625, -1.531494140625, -1.4549560546875, -1.37841796875, -1.3018798828125, -1.225341796875, -1.1488037109375, -1.072265625, -0.9957275390625, -0.919189453125, -0.8426513671875, -0.76611328125, -0.6895751953125, -0.613037109375, -0.5364990234375, -0.4599609375, -0.3834228515625, -0.306884765625, -0.2303466796875, -0.15380859375, -0.0772705078125, -0.000732421875, 0.0758056640625, 0.15234375, 0.2288818359375, 0.305419921875, 0.3819580078125, 0.45849609375, 0.5350341796875, 0.611572265625, 0.6881103515625, 0.7646484375, 0.8411865234375, 0.917724609375, 0.9942626953125, 1.07080078125, 1.1473388671875, 1.223876953125, 1.3004150390625, 1.376953125, 1.4534912109375, 1.530029296875, 1.6065673828125, 1.68310546875, 1.7596435546875, 1.836181640625, 1.9127197265625, 1.9892578125, 2.0657958984375, 2.142333984375, 2.2188720703125, 2.29541015625, 2.3719482421875, 2.448486328125, 2.5250244140625, 2.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 12.0, 19.0, 31.0, 31.0, 40.0, 59.0, 109.0, 111.0, 171.0, 217.0, 282.0, 444.0, 591.0, 792.0, 1155.0, 1654.0, 2601.0, 4471.0, 9412.0, 25489.0, 117873.0, 722753.0, 113239.0, 24972.0, 9311.0, 4410.0, 2575.0, 1654.0, 1187.0, 764.0, 556.0, 441.0, 290.0, 235.0, 153.0, 109.0, 98.0, 76.0, 37.0, 40.0, 29.0, 18.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.19146728515625, -5.9884033203125, -5.78533935546875, -5.582275390625, -5.37921142578125, -5.1761474609375, -4.97308349609375, -4.77001953125, -4.56695556640625, -4.3638916015625, -4.16082763671875, -3.957763671875, -3.75469970703125, -3.5516357421875, -3.34857177734375, -3.1455078125, -2.94244384765625, -2.7393798828125, -2.53631591796875, -2.333251953125, -2.13018798828125, -1.9271240234375, -1.72406005859375, -1.52099609375, -1.31793212890625, -1.1148681640625, -0.91180419921875, -0.708740234375, -0.50567626953125, -0.3026123046875, -0.09954833984375, 0.103515625, 0.30657958984375, 0.5096435546875, 0.71270751953125, 0.915771484375, 1.11883544921875, 1.3218994140625, 1.52496337890625, 1.72802734375, 1.93109130859375, 2.1341552734375, 2.33721923828125, 2.540283203125, 2.74334716796875, 2.9464111328125, 3.14947509765625, 3.3525390625, 3.55560302734375, 3.7586669921875, 3.96173095703125, 4.164794921875, 4.36785888671875, 4.5709228515625, 4.77398681640625, 4.97705078125, 5.18011474609375, 5.3831787109375, 5.58624267578125, 5.789306640625, 5.99237060546875, 6.1954345703125, 6.39849853515625, 6.6015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 11.0, 7.0, 4.0, 12.0, 9.0, 9.0, 19.0, 25.0, 29.0, 26.0, 27.0, 32.0, 27.0, 39.0, 45.0, 35.0, 41.0, 40.0, 1078.0, 43.0, 38.0, 34.0, 38.0, 36.0, 43.0, 43.0, 32.0, 32.0, 21.0, 17.0, 20.0, 15.0, 19.0, 13.0, 12.0, 12.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.0850830078125, -2.011962890625, -1.9388427734375, -1.86572265625, -1.7926025390625, -1.719482421875, -1.6463623046875, -1.5732421875, -1.5001220703125, -1.427001953125, -1.3538818359375, -1.28076171875, -1.2076416015625, -1.134521484375, -1.0614013671875, -0.98828125, -0.9151611328125, -0.842041015625, -0.7689208984375, -0.69580078125, -0.6226806640625, -0.549560546875, -0.4764404296875, -0.4033203125, -0.3302001953125, -0.257080078125, -0.1839599609375, -0.11083984375, -0.0377197265625, 0.035400390625, 0.1085205078125, 0.181640625, 0.2547607421875, 0.327880859375, 0.4010009765625, 0.47412109375, 0.5472412109375, 0.620361328125, 0.6934814453125, 0.7666015625, 0.8397216796875, 0.912841796875, 0.9859619140625, 1.05908203125, 1.1322021484375, 1.205322265625, 1.2784423828125, 1.3515625, 1.4246826171875, 1.497802734375, 1.5709228515625, 1.64404296875, 1.7171630859375, 1.790283203125, 1.8634033203125, 1.9365234375, 2.0096435546875, 2.082763671875, 2.1558837890625, 2.22900390625, 2.3021240234375, 2.375244140625, 2.4483642578125, 2.521484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 9.0, 13.0, 10.0, 9.0, 19.0, 25.0, 22.0, 37.0, 31.0, 63.0, 66.0, 114.0, 120.0, 172.0, 276.0, 315.0, 457.0, 653.0, 1004.0, 1536.0, 2470.0, 4353.0, 9495.0, 32477.0, 1329657.0, 665232.0, 28540.0, 8662.0, 4153.0, 2322.0, 1489.0, 1017.0, 609.0, 444.0, 344.0, 211.0, 192.0, 120.0, 93.0, 68.0, 62.0, 34.0, 32.0, 28.0, 19.0, 18.0, 6.0, 9.0, 4.0, 4.0, 0.0, 3.0, 6.0, 5.0], "bins": [-8.3046875, -8.067138671875, -7.82958984375, -7.592041015625, -7.3544921875, -7.116943359375, -6.87939453125, -6.641845703125, -6.404296875, -6.166748046875, -5.92919921875, -5.691650390625, -5.4541015625, -5.216552734375, -4.97900390625, -4.741455078125, -4.50390625, -4.266357421875, -4.02880859375, -3.791259765625, -3.5537109375, -3.316162109375, -3.07861328125, -2.841064453125, -2.603515625, -2.365966796875, -2.12841796875, -1.890869140625, -1.6533203125, -1.415771484375, -1.17822265625, -0.940673828125, -0.703125, -0.465576171875, -0.22802734375, 0.009521484375, 0.2470703125, 0.484619140625, 0.72216796875, 0.959716796875, 1.197265625, 1.434814453125, 1.67236328125, 1.909912109375, 2.1474609375, 2.385009765625, 2.62255859375, 2.860107421875, 3.09765625, 3.335205078125, 3.57275390625, 3.810302734375, 4.0478515625, 4.285400390625, 4.52294921875, 4.760498046875, 4.998046875, 5.235595703125, 5.47314453125, 5.710693359375, 5.9482421875, 6.185791015625, 6.42333984375, 6.660888671875, 6.8984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 17.0, 19.0, 25.0, 28.0, 60.0, 184.0, 362.0, 97.0, 49.0, 30.0, 20.0, 15.0, 16.0, 13.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.38671875, -2.3244171142578125, -2.262115478515625, -2.1998138427734375, -2.13751220703125, -2.0752105712890625, -2.012908935546875, -1.9506072998046875, -1.8883056640625, -1.8260040283203125, -1.763702392578125, -1.7014007568359375, -1.63909912109375, -1.5767974853515625, -1.514495849609375, -1.4521942138671875, -1.389892578125, -1.3275909423828125, -1.265289306640625, -1.2029876708984375, -1.14068603515625, -1.0783843994140625, -1.016082763671875, -0.9537811279296875, -0.8914794921875, -0.8291778564453125, -0.766876220703125, -0.7045745849609375, -0.64227294921875, -0.5799713134765625, -0.517669677734375, -0.4553680419921875, -0.39306640625, -0.3307647705078125, -0.268463134765625, -0.2061614990234375, -0.14385986328125, -0.0815582275390625, -0.019256591796875, 0.0430450439453125, 0.1053466796875, 0.1676483154296875, 0.229949951171875, 0.2922515869140625, 0.35455322265625, 0.4168548583984375, 0.479156494140625, 0.5414581298828125, 0.603759765625, 0.6660614013671875, 0.728363037109375, 0.7906646728515625, 0.85296630859375, 0.9152679443359375, 0.977569580078125, 1.0398712158203125, 1.1021728515625, 1.1644744873046875, 1.226776123046875, 1.2890777587890625, 1.35137939453125, 1.4136810302734375, 1.475982666015625, 1.5382843017578125, 1.6005859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 3.0, 8.0, 5.0, 8.0, 18.0, 34.0, 55.0, 102.0, 292.0, 1296.0, 7571.0, 999347.0, 36042.0, 2828.0, 575.0, 153.0, 66.0, 33.0, 21.0, 17.0, 17.0, 15.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-28.71875, -27.60302734375, -26.4873046875, -25.37158203125, -24.255859375, -23.14013671875, -22.0244140625, -20.90869140625, -19.79296875, -18.67724609375, -17.5615234375, -16.44580078125, -15.330078125, -14.21435546875, -13.0986328125, -11.98291015625, -10.8671875, -9.75146484375, -8.6357421875, -7.52001953125, -6.404296875, -5.28857421875, -4.1728515625, -3.05712890625, -1.94140625, -0.82568359375, 0.2900390625, 1.40576171875, 2.521484375, 3.63720703125, 4.7529296875, 5.86865234375, 6.984375, 8.10009765625, 9.2158203125, 10.33154296875, 11.447265625, 12.56298828125, 13.6787109375, 14.79443359375, 15.91015625, 17.02587890625, 18.1416015625, 19.25732421875, 20.373046875, 21.48876953125, 22.6044921875, 23.72021484375, 24.8359375, 25.95166015625, 27.0673828125, 28.18310546875, 29.298828125, 30.41455078125, 31.5302734375, 32.64599609375, 33.76171875, 34.87744140625, 35.9931640625, 37.10888671875, 38.224609375, 39.34033203125, 40.4560546875, 41.57177734375, 42.6875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 17.0, 43.0, 228.0, 583.0, 107.0, 26.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082770347595215, -3.6443777084350586, -3.2059853076934814, -2.7675929069519043, -2.329200267791748, -1.8908076286315918, -1.4524152278900146, -1.0140228271484375, -0.5756301879882812, -0.13723766803741455, 0.30115485191345215, 0.7395473718643188, 1.1779398918151855, 1.6163325309753418, 2.054724931716919, 2.493117332458496, 2.9315099716186523, 3.3699026107788086, 3.8082950115203857, 4.246687412261963, 4.685080051422119, 5.123472690582275, 5.561864852905273, 6.00025749206543, 6.438650131225586, 6.877042770385742, 7.315435409545898, 7.7538275718688965, 8.192220687866211, 8.630613327026367, 9.069005012512207, 9.507397651672363, 9.945791244506836, 10.384183883666992, 10.822576522827148, 11.260969161987305, 11.699361801147461, 12.137754440307617, 12.576146125793457, 13.014538764953613, 13.45293140411377, 13.891324043273926, 14.329716682434082, 14.768109321594238, 15.206501007080078, 15.644893646240234, 16.08328628540039, 16.521678924560547, 16.960071563720703, 17.39846420288086, 17.836856842041016, 18.275249481201172, 18.713642120361328, 19.152034759521484, 19.59042739868164, 20.028820037841797, 20.467212677001953, 20.90560531616211, 21.343997955322266, 21.782390594482422, 22.220783233642578, 22.659175872802734, 23.09756851196289, 23.535961151123047, 23.97435188293457]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 10.0, 9.0, 10.0, 3.0, 13.0, 12.0, 21.0, 23.0, 25.0, 26.0, 25.0, 38.0, 43.0, 42.0, 43.0, 44.0, 55.0, 47.0, 55.0, 42.0, 42.0, 40.0, 44.0, 47.0, 38.0, 26.0, 25.0, 21.0, 23.0, 21.0, 19.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5552830696105957, -1.4940707683563232, -1.4328584671020508, -1.3716461658477783, -1.3104337453842163, -1.2492214441299438, -1.1880091428756714, -1.126796841621399, -1.065584421157837, -1.0043721199035645, -0.9431597590446472, -0.8819474577903748, -0.8207350969314575, -0.7595227956771851, -0.6983104944229126, -0.6370981931686401, -0.5758858919143677, -0.5146735906600952, -0.453461229801178, -0.3922489285469055, -0.33103659749031067, -0.2698242664337158, -0.20861196517944336, -0.1473996341228485, -0.08618730306625366, -0.02497497946023941, 0.03623734414577484, 0.0974496603012085, 0.15866199135780334, 0.2198743224143982, 0.28108662366867065, 0.3422989547252655, 0.40351128578186035, 0.4647236168384552, 0.52593594789505, 0.5871482491493225, 0.6483606100082397, 0.7095729112625122, 0.7707852125167847, 0.8319975137710571, 0.8932098746299744, 0.9544221758842468, 1.015634536743164, 1.0768468379974365, 1.138059139251709, 1.1992714405059814, 1.260483741760254, 1.321696162223816, 1.3829084634780884, 1.4441207647323608, 1.5053330659866333, 1.5665454864501953, 1.6277577877044678, 1.6889700889587402, 1.7501823902130127, 1.8113946914672852, 1.8726069927215576, 1.93381929397583, 1.9950315952301025, 2.056243896484375, 2.1174561977386475, 2.17866849899292, 2.2398810386657715, 2.301093339920044, 2.3623056411743164]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 9.0, 11.0, 11.0, 17.0, 14.0, 31.0, 26.0, 25.0, 39.0, 43.0, 32.0, 41.0, 42.0, 28.0, 39.0, 43.0, 48.0, 52.0, 41.0, 52.0, 37.0, 44.0, 35.0, 32.0, 24.0, 27.0, 29.0, 26.0, 14.0, 11.0, 11.0, 11.0, 9.0, 11.0, 6.0, 7.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.904296875, -2.815826416015625, -2.72735595703125, -2.638885498046875, -2.5504150390625, -2.461944580078125, -2.37347412109375, -2.285003662109375, -2.196533203125, -2.108062744140625, -2.01959228515625, -1.931121826171875, -1.8426513671875, -1.754180908203125, -1.66571044921875, -1.577239990234375, -1.48876953125, -1.400299072265625, -1.31182861328125, -1.223358154296875, -1.1348876953125, -1.046417236328125, -0.95794677734375, -0.869476318359375, -0.781005859375, -0.692535400390625, -0.60406494140625, -0.515594482421875, -0.4271240234375, -0.338653564453125, -0.25018310546875, -0.161712646484375, -0.0732421875, 0.015228271484375, 0.10369873046875, 0.192169189453125, 0.2806396484375, 0.369110107421875, 0.45758056640625, 0.546051025390625, 0.634521484375, 0.722991943359375, 0.81146240234375, 0.899932861328125, 0.9884033203125, 1.076873779296875, 1.16534423828125, 1.253814697265625, 1.34228515625, 1.430755615234375, 1.51922607421875, 1.607696533203125, 1.6961669921875, 1.784637451171875, 1.87310791015625, 1.961578369140625, 2.050048828125, 2.138519287109375, 2.22698974609375, 2.315460205078125, 2.4039306640625, 2.492401123046875, 2.58087158203125, 2.669342041015625, 2.7578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 6.0, 9.0, 7.0, 29.0, 31.0, 46.0, 65.0, 90.0, 160.0, 202.0, 320.0, 512.0, 814.0, 1188.0, 1812.0, 2901.0, 4678.0, 7652.0, 12303.0, 21298.0, 38886.0, 76964.0, 195786.0, 392694.0, 146780.0, 63315.0, 32729.0, 18351.0, 10852.0, 6478.0, 4121.0, 2569.0, 1669.0, 1129.0, 685.0, 485.0, 303.0, 213.0, 138.0, 98.0, 64.0, 46.0, 19.0, 17.0, 16.0, 11.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.47161865234375, -3.3572998046875, -3.24298095703125, -3.128662109375, -3.01434326171875, -2.9000244140625, -2.78570556640625, -2.67138671875, -2.55706787109375, -2.4427490234375, -2.32843017578125, -2.214111328125, -2.09979248046875, -1.9854736328125, -1.87115478515625, -1.7568359375, -1.64251708984375, -1.5281982421875, -1.41387939453125, -1.299560546875, -1.18524169921875, -1.0709228515625, -0.95660400390625, -0.84228515625, -0.72796630859375, -0.6136474609375, -0.49932861328125, -0.385009765625, -0.27069091796875, -0.1563720703125, -0.04205322265625, 0.072265625, 0.18658447265625, 0.3009033203125, 0.41522216796875, 0.529541015625, 0.64385986328125, 0.7581787109375, 0.87249755859375, 0.98681640625, 1.10113525390625, 1.2154541015625, 1.32977294921875, 1.444091796875, 1.55841064453125, 1.6727294921875, 1.78704833984375, 1.9013671875, 2.01568603515625, 2.1300048828125, 2.24432373046875, 2.358642578125, 2.47296142578125, 2.5872802734375, 2.70159912109375, 2.81591796875, 2.93023681640625, 3.0445556640625, 3.15887451171875, 3.273193359375, 3.38751220703125, 3.5018310546875, 3.61614990234375, 3.73046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 10.0, 16.0, 19.0, 15.0, 24.0, 27.0, 37.0, 34.0, 45.0, 49.0, 56.0, 83.0, 139.0, 251.0, 1420.0, 253.0, 136.0, 68.0, 54.0, 53.0, 50.0, 41.0, 27.0, 12.0, 24.0, 17.0, 8.0, 9.0, 6.0, 8.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-12.046875, -11.70703125, -11.3671875, -11.02734375, -10.6875, -10.34765625, -10.0078125, -9.66796875, -9.328125, -8.98828125, -8.6484375, -8.30859375, -7.96875, -7.62890625, -7.2890625, -6.94921875, -6.609375, -6.26953125, -5.9296875, -5.58984375, -5.25, -4.91015625, -4.5703125, -4.23046875, -3.890625, -3.55078125, -3.2109375, -2.87109375, -2.53125, -2.19140625, -1.8515625, -1.51171875, -1.171875, -0.83203125, -0.4921875, -0.15234375, 0.1875, 0.52734375, 0.8671875, 1.20703125, 1.546875, 1.88671875, 2.2265625, 2.56640625, 2.90625, 3.24609375, 3.5859375, 3.92578125, 4.265625, 4.60546875, 4.9453125, 5.28515625, 5.625, 5.96484375, 6.3046875, 6.64453125, 6.984375, 7.32421875, 7.6640625, 8.00390625, 8.34375, 8.68359375, 9.0234375, 9.36328125, 9.703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 22.0, 41.0, 49.0, 65.0, 89.0, 129.0, 215.0, 437.0, 1597.0, 10625.0, 221794.0, 2826820.0, 75691.0, 6014.0, 996.0, 358.0, 210.0, 120.0, 91.0, 71.0, 51.0, 32.0, 32.0, 20.0, 16.0, 13.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.189453125, -15.59765625, -15.005859375, -14.4140625, -13.822265625, -13.23046875, -12.638671875, -12.046875, -11.455078125, -10.86328125, -10.271484375, -9.6796875, -9.087890625, -8.49609375, -7.904296875, -7.3125, -6.720703125, -6.12890625, -5.537109375, -4.9453125, -4.353515625, -3.76171875, -3.169921875, -2.578125, -1.986328125, -1.39453125, -0.802734375, -0.2109375, 0.380859375, 0.97265625, 1.564453125, 2.15625, 2.748046875, 3.33984375, 3.931640625, 4.5234375, 5.115234375, 5.70703125, 6.298828125, 6.890625, 7.482421875, 8.07421875, 8.666015625, 9.2578125, 9.849609375, 10.44140625, 11.033203125, 11.625, 12.216796875, 12.80859375, 13.400390625, 13.9921875, 14.583984375, 15.17578125, 15.767578125, 16.359375, 16.951171875, 17.54296875, 18.134765625, 18.7265625, 19.318359375, 19.91015625, 20.501953125, 21.09375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [3.0, 20.0, 327.0, 597.0, 73.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.854573249816895, -9.474528312683105, -5.094483375549316, -0.7144384384155273, 3.6656064987182617, 8.04565143585205, 12.42569637298584, 16.805740356445312, 21.185787200927734, 25.565832138061523, 29.945877075195312, 34.32592010498047, 38.70596694946289, 43.08601379394531, 47.46605682373047, 51.846099853515625, 56.22614669799805, 60.60619354248047, 64.98623657226562, 69.36627960205078, 73.74632263183594, 78.12637329101562, 82.50641632080078, 86.88645935058594, 91.2665023803711, 95.64654541015625, 100.02659606933594, 104.4066390991211, 108.78668212890625, 113.1667251586914, 117.54676818847656, 121.92681884765625, 126.30685424804688, 130.68690490722656, 135.0669403076172, 139.44699096679688, 143.8270263671875, 148.2070770263672, 152.58712768554688, 156.9671630859375, 161.3472137451172, 165.72726440429688, 170.1072998046875, 174.4873504638672, 178.86740112304688, 183.2474365234375, 187.6274871826172, 192.0075225830078, 196.3875732421875, 200.7676239013672, 205.1476593017578, 209.5277099609375, 213.90774536132812, 218.2877960205078, 222.6678466796875, 227.04788208007812, 231.4279327392578, 235.8079833984375, 240.18801879882812, 244.5680694580078, 248.9481201171875, 253.32815551757812, 257.70819091796875, 262.0882568359375, 266.4682922363281]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 9.0, 12.0, 12.0, 14.0, 13.0, 12.0, 15.0, 24.0, 23.0, 34.0, 26.0, 23.0, 31.0, 32.0, 33.0, 19.0, 33.0, 37.0, 36.0, 27.0, 33.0, 24.0, 41.0, 39.0, 34.0, 36.0, 35.0, 39.0, 26.0, 24.0, 20.0, 22.0, 23.0, 18.0, 17.0, 14.0, 10.0, 13.0, 11.0, 10.0, 14.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.88700294494629, -21.217126846313477, -20.547252655029297, -19.877376556396484, -19.207500457763672, -18.53762435913086, -17.86775016784668, -17.197874069213867, -16.527999877929688, -15.858124732971191, -15.188248634338379, -14.518373489379883, -13.84849739074707, -13.178622245788574, -12.508747100830078, -11.838871002197266, -11.168994903564453, -10.499119758605957, -9.829243659973145, -9.159368515014648, -8.489492416381836, -7.81961727142334, -7.149742126464844, -6.4798665046691895, -5.809990882873535, -5.140115261077881, -4.470239639282227, -3.8003644943237305, -3.130488872528076, -2.460613250732422, -1.7907381057739258, -1.1208624839782715, -0.4509849548339844, 0.21889054775238037, 0.8887660503387451, 1.5586414337158203, 2.2285170555114746, 2.898392677307129, 3.568267822265625, 4.238143444061279, 4.908019065856934, 5.577894687652588, 6.247770309448242, 6.917645454406738, 7.587521076202393, 8.257396697998047, 8.927271842956543, 9.597146987915039, 10.267023086547852, 10.936898231506348, 11.60677433013916, 12.276649475097656, 12.946525573730469, 13.616400718688965, 14.286275863647461, 14.956151962280273, 15.62602710723877, 16.295902252197266, 16.965778350830078, 17.63565444946289, 18.30552864074707, 18.975404739379883, 19.645278930664062, 20.315155029296875, 20.985031127929688]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 16.0, 13.0, 13.0, 18.0, 24.0, 20.0, 25.0, 22.0, 33.0, 31.0, 34.0, 47.0, 37.0, 44.0, 43.0, 55.0, 53.0, 36.0, 42.0, 52.0, 39.0, 38.0, 28.0, 24.0, 36.0, 21.0, 21.0, 19.0, 18.0, 15.0, 11.0, 7.0, 10.0, 5.0, 8.0, 12.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.095703125, -3.002593994140625, -2.90948486328125, -2.816375732421875, -2.7232666015625, -2.630157470703125, -2.53704833984375, -2.443939208984375, -2.350830078125, -2.257720947265625, -2.16461181640625, -2.071502685546875, -1.9783935546875, -1.885284423828125, -1.79217529296875, -1.699066162109375, -1.60595703125, -1.512847900390625, -1.41973876953125, -1.326629638671875, -1.2335205078125, -1.140411376953125, -1.04730224609375, -0.954193115234375, -0.861083984375, -0.767974853515625, -0.67486572265625, -0.581756591796875, -0.4886474609375, -0.395538330078125, -0.30242919921875, -0.209320068359375, -0.1162109375, -0.023101806640625, 0.07000732421875, 0.163116455078125, 0.2562255859375, 0.349334716796875, 0.44244384765625, 0.535552978515625, 0.628662109375, 0.721771240234375, 0.81488037109375, 0.907989501953125, 1.0010986328125, 1.094207763671875, 1.18731689453125, 1.280426025390625, 1.37353515625, 1.466644287109375, 1.55975341796875, 1.652862548828125, 1.7459716796875, 1.839080810546875, 1.93218994140625, 2.025299072265625, 2.118408203125, 2.211517333984375, 2.30462646484375, 2.397735595703125, 2.4908447265625, 2.583953857421875, 2.67706298828125, 2.770172119140625, 2.86328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 11.0, 26.0, 32.0, 53.0, 81.0, 113.0, 147.0, 237.0, 332.0, 550.0, 867.0, 1486.0, 2600.0, 4608.0, 8473.0, 16960.0, 38347.0, 130966.0, 1106509.0, 2452063.0, 317416.0, 60328.0, 24414.0, 11817.0, 6306.0, 3623.0, 2091.0, 1292.0, 799.0, 523.0, 357.0, 234.0, 162.0, 103.0, 89.0, 65.0, 38.0, 37.0, 23.0, 17.0, 14.0, 12.0, 7.0, 9.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.4609375, -6.24725341796875, -6.0335693359375, -5.81988525390625, -5.606201171875, -5.39251708984375, -5.1788330078125, -4.96514892578125, -4.75146484375, -4.53778076171875, -4.3240966796875, -4.11041259765625, -3.896728515625, -3.68304443359375, -3.4693603515625, -3.25567626953125, -3.0419921875, -2.82830810546875, -2.6146240234375, -2.40093994140625, -2.187255859375, -1.97357177734375, -1.7598876953125, -1.54620361328125, -1.33251953125, -1.11883544921875, -0.9051513671875, -0.69146728515625, -0.477783203125, -0.26409912109375, -0.0504150390625, 0.16326904296875, 0.376953125, 0.59063720703125, 0.8043212890625, 1.01800537109375, 1.231689453125, 1.44537353515625, 1.6590576171875, 1.87274169921875, 2.08642578125, 2.30010986328125, 2.5137939453125, 2.72747802734375, 2.941162109375, 3.15484619140625, 3.3685302734375, 3.58221435546875, 3.7958984375, 4.00958251953125, 4.2232666015625, 4.43695068359375, 4.650634765625, 4.86431884765625, 5.0780029296875, 5.29168701171875, 5.50537109375, 5.71905517578125, 5.9327392578125, 6.14642333984375, 6.360107421875, 6.57379150390625, 6.7874755859375, 7.00115966796875, 7.21484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 16.0, 13.0, 14.0, 33.0, 37.0, 68.0, 73.0, 93.0, 155.0, 261.0, 467.0, 789.0, 801.0, 464.0, 225.0, 148.0, 115.0, 74.0, 55.0, 33.0, 27.0, 22.0, 12.0, 18.0, 8.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6953125, -9.41796875, -9.140625, -8.86328125, -8.5859375, -8.30859375, -8.03125, -7.75390625, -7.4765625, -7.19921875, -6.921875, -6.64453125, -6.3671875, -6.08984375, -5.8125, -5.53515625, -5.2578125, -4.98046875, -4.703125, -4.42578125, -4.1484375, -3.87109375, -3.59375, -3.31640625, -3.0390625, -2.76171875, -2.484375, -2.20703125, -1.9296875, -1.65234375, -1.375, -1.09765625, -0.8203125, -0.54296875, -0.265625, 0.01171875, 0.2890625, 0.56640625, 0.84375, 1.12109375, 1.3984375, 1.67578125, 1.953125, 2.23046875, 2.5078125, 2.78515625, 3.0625, 3.33984375, 3.6171875, 3.89453125, 4.171875, 4.44921875, 4.7265625, 5.00390625, 5.28125, 5.55859375, 5.8359375, 6.11328125, 6.390625, 6.66796875, 6.9453125, 7.22265625, 7.5, 7.77734375, 8.0546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 10.0, 24.0, 33.0, 45.0, 99.0, 129.0, 320.0, 751.0, 1812.0, 6095.0, 26018.0, 193031.0, 3549601.0, 365341.0, 38623.0, 8179.0, 2412.0, 876.0, 421.0, 184.0, 94.0, 54.0, 36.0, 20.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.01904296875, -16.4443359375, -15.86962890625, -15.294921875, -14.72021484375, -14.1455078125, -13.57080078125, -12.99609375, -12.42138671875, -11.8466796875, -11.27197265625, -10.697265625, -10.12255859375, -9.5478515625, -8.97314453125, -8.3984375, -7.82373046875, -7.2490234375, -6.67431640625, -6.099609375, -5.52490234375, -4.9501953125, -4.37548828125, -3.80078125, -3.22607421875, -2.6513671875, -2.07666015625, -1.501953125, -0.92724609375, -0.3525390625, 0.22216796875, 0.796875, 1.37158203125, 1.9462890625, 2.52099609375, 3.095703125, 3.67041015625, 4.2451171875, 4.81982421875, 5.39453125, 5.96923828125, 6.5439453125, 7.11865234375, 7.693359375, 8.26806640625, 8.8427734375, 9.41748046875, 9.9921875, 10.56689453125, 11.1416015625, 11.71630859375, 12.291015625, 12.86572265625, 13.4404296875, 14.01513671875, 14.58984375, 15.16455078125, 15.7392578125, 16.31396484375, 16.888671875, 17.46337890625, 18.0380859375, 18.61279296875, 19.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 23.0, 17.0, 35.0, 53.0, 93.0, 120.0, 140.0, 125.0, 131.0, 87.0, 48.0, 49.0, 20.0, 15.0, 11.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.46260070800781, -40.11937713623047, -38.776153564453125, -37.43292999267578, -36.08970642089844, -34.74648666381836, -33.403263092041016, -32.06003952026367, -30.716815948486328, -29.373592376708984, -28.03036880493164, -26.68714714050293, -25.343923568725586, -24.000699996948242, -22.65747833251953, -21.314254760742188, -19.971031188964844, -18.6278076171875, -17.284584045410156, -15.941362380981445, -14.598138809204102, -13.254915237426758, -11.91169261932373, -10.568470001220703, -9.22524642944336, -7.882023334503174, -6.538800239562988, -5.195577144622803, -3.852354049682617, -2.5091309547424316, -1.165907859802246, 0.17731475830078125, 1.520538330078125, 2.8637614250183105, 4.206984519958496, 5.550207614898682, 6.893430709838867, 8.236654281616211, 9.579876899719238, 10.923099517822266, 12.26632308959961, 13.609546661376953, 14.95276927947998, 16.295991897583008, 17.63921546936035, 18.982439041137695, 20.325660705566406, 21.66888427734375, 23.012107849121094, 24.355331420898438, 25.69855499267578, 27.041776657104492, 28.385000228881836, 29.72822380065918, 31.07144546508789, 32.414669036865234, 33.75789260864258, 35.10111618041992, 36.444339752197266, 37.78756332397461, 39.13078308105469, 40.47400665283203, 41.817230224609375, 43.16045379638672, 44.50367736816406]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 13.0, 9.0, 11.0, 17.0, 19.0, 23.0, 17.0, 34.0, 36.0, 35.0, 45.0, 35.0, 40.0, 39.0, 42.0, 54.0, 43.0, 42.0, 50.0, 40.0, 43.0, 38.0, 39.0, 32.0, 24.0, 18.0, 26.0, 22.0, 17.0, 21.0, 12.0, 13.0, 9.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.348052978515625, -27.520893096923828, -26.6937313079834, -25.8665714263916, -25.039409637451172, -24.212249755859375, -23.385089874267578, -22.55792808532715, -21.73076629638672, -20.903606414794922, -20.076444625854492, -19.249284744262695, -18.422122955322266, -17.59496307373047, -16.767803192138672, -15.940641403198242, -15.113481521606445, -14.286320686340332, -13.459159851074219, -12.631999969482422, -11.804838180541992, -10.977678298950195, -10.150517463684082, -9.323356628417969, -8.496195793151855, -7.669034957885742, -6.841874122619629, -6.014713764190674, -5.1875529289245605, -4.360392093658447, -3.533231735229492, -2.706070899963379, -1.8789100646972656, -1.051749348640442, -0.22458863258361816, 0.602571964263916, 1.4297327995300293, 2.2568936347961426, 3.0840539932250977, 3.911214828491211, 4.738375663757324, 5.5655364990234375, 6.392697334289551, 7.219857692718506, 8.047018051147461, 8.87417984008789, 9.701339721679688, 10.5285005569458, 11.355661392211914, 12.182822227478027, 13.00998306274414, 13.837142944335938, 14.664304733276367, 15.491464614868164, 16.318626403808594, 17.14578628540039, 17.972946166992188, 18.800106048583984, 19.627267837524414, 20.45442771911621, 21.28158950805664, 22.108749389648438, 22.935909271240234, 23.763071060180664, 24.590232849121094]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 11.0, 8.0, 20.0, 17.0, 24.0, 15.0, 21.0, 27.0, 33.0, 34.0, 38.0, 35.0, 36.0, 50.0, 41.0, 60.0, 55.0, 43.0, 41.0, 53.0, 38.0, 44.0, 39.0, 33.0, 30.0, 23.0, 18.0, 22.0, 14.0, 10.0, 16.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.79058837890625, -2.6925048828125, -2.59442138671875, -2.496337890625, -2.39825439453125, -2.3001708984375, -2.20208740234375, -2.10400390625, -2.00592041015625, -1.9078369140625, -1.80975341796875, -1.711669921875, -1.61358642578125, -1.5155029296875, -1.41741943359375, -1.3193359375, -1.22125244140625, -1.1231689453125, -1.02508544921875, -0.927001953125, -0.82891845703125, -0.7308349609375, -0.63275146484375, -0.53466796875, -0.43658447265625, -0.3385009765625, -0.24041748046875, -0.142333984375, -0.04425048828125, 0.0538330078125, 0.15191650390625, 0.25, 0.34808349609375, 0.4461669921875, 0.54425048828125, 0.642333984375, 0.74041748046875, 0.8385009765625, 0.93658447265625, 1.03466796875, 1.13275146484375, 1.2308349609375, 1.32891845703125, 1.427001953125, 1.52508544921875, 1.6231689453125, 1.72125244140625, 1.8193359375, 1.91741943359375, 2.0155029296875, 2.11358642578125, 2.211669921875, 2.30975341796875, 2.4078369140625, 2.50592041015625, 2.60400390625, 2.70208740234375, 2.8001708984375, 2.89825439453125, 2.996337890625, 3.09442138671875, 3.1925048828125, 3.29058837890625, 3.388671875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 9.0, 14.0, 13.0, 10.0, 20.0, 27.0, 43.0, 56.0, 81.0, 109.0, 120.0, 202.0, 281.0, 347.0, 509.0, 754.0, 1079.0, 1412.0, 2122.0, 3086.0, 4710.0, 7170.0, 11399.0, 19182.0, 33769.0, 70879.0, 296425.0, 417817.0, 82412.0, 37907.0, 20442.0, 12356.0, 7667.0, 5030.0, 3348.0, 2303.0, 1494.0, 1129.0, 802.0, 552.0, 403.0, 313.0, 205.0, 144.0, 107.0, 83.0, 51.0, 46.0, 35.0, 26.0, 19.0, 13.0, 11.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.203125, -4.06341552734375, -3.9237060546875, -3.78399658203125, -3.644287109375, -3.50457763671875, -3.3648681640625, -3.22515869140625, -3.08544921875, -2.94573974609375, -2.8060302734375, -2.66632080078125, -2.526611328125, -2.38690185546875, -2.2471923828125, -2.10748291015625, -1.9677734375, -1.82806396484375, -1.6883544921875, -1.54864501953125, -1.408935546875, -1.26922607421875, -1.1295166015625, -0.98980712890625, -0.85009765625, -0.71038818359375, -0.5706787109375, -0.43096923828125, -0.291259765625, -0.15155029296875, -0.0118408203125, 0.12786865234375, 0.267578125, 0.40728759765625, 0.5469970703125, 0.68670654296875, 0.826416015625, 0.96612548828125, 1.1058349609375, 1.24554443359375, 1.38525390625, 1.52496337890625, 1.6646728515625, 1.80438232421875, 1.944091796875, 2.08380126953125, 2.2235107421875, 2.36322021484375, 2.5029296875, 2.64263916015625, 2.7823486328125, 2.92205810546875, 3.061767578125, 3.20147705078125, 3.3411865234375, 3.48089599609375, 3.62060546875, 3.76031494140625, 3.9000244140625, 4.03973388671875, 4.179443359375, 4.31915283203125, 4.4588623046875, 4.59857177734375, 4.73828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 4.0, 3.0, 12.0, 19.0, 14.0, 17.0, 27.0, 23.0, 18.0, 17.0, 30.0, 44.0, 47.0, 37.0, 48.0, 52.0, 38.0, 56.0, 1067.0, 36.0, 53.0, 25.0, 42.0, 39.0, 31.0, 29.0, 24.0, 27.0, 30.0, 16.0, 14.0, 13.0, 10.0, 7.0, 13.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.333984375, -2.256988525390625, -2.17999267578125, -2.102996826171875, -2.0260009765625, -1.949005126953125, -1.87200927734375, -1.795013427734375, -1.718017578125, -1.641021728515625, -1.56402587890625, -1.487030029296875, -1.4100341796875, -1.333038330078125, -1.25604248046875, -1.179046630859375, -1.10205078125, -1.025054931640625, -0.94805908203125, -0.871063232421875, -0.7940673828125, -0.717071533203125, -0.64007568359375, -0.563079833984375, -0.486083984375, -0.409088134765625, -0.33209228515625, -0.255096435546875, -0.1781005859375, -0.101104736328125, -0.02410888671875, 0.052886962890625, 0.1298828125, 0.206878662109375, 0.28387451171875, 0.360870361328125, 0.4378662109375, 0.514862060546875, 0.59185791015625, 0.668853759765625, 0.745849609375, 0.822845458984375, 0.89984130859375, 0.976837158203125, 1.0538330078125, 1.130828857421875, 1.20782470703125, 1.284820556640625, 1.36181640625, 1.438812255859375, 1.51580810546875, 1.592803955078125, 1.6697998046875, 1.746795654296875, 1.82379150390625, 1.900787353515625, 1.977783203125, 2.054779052734375, 2.13177490234375, 2.208770751953125, 2.2857666015625, 2.362762451171875, 2.43975830078125, 2.516754150390625, 2.59375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 4.0, 5.0, 11.0, 22.0, 20.0, 38.0, 55.0, 70.0, 99.0, 161.0, 230.0, 337.0, 476.0, 754.0, 1192.0, 1908.0, 3155.0, 5493.0, 10518.0, 22086.0, 65521.0, 1396340.0, 496896.0, 50520.0, 18925.0, 9252.0, 5068.0, 2924.0, 1766.0, 1114.0, 706.0, 472.0, 283.0, 238.0, 152.0, 74.0, 81.0, 57.0, 31.0, 24.0, 20.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.546875, -5.39239501953125, -5.2379150390625, -5.08343505859375, -4.928955078125, -4.77447509765625, -4.6199951171875, -4.46551513671875, -4.31103515625, -4.15655517578125, -4.0020751953125, -3.84759521484375, -3.693115234375, -3.53863525390625, -3.3841552734375, -3.22967529296875, -3.0751953125, -2.92071533203125, -2.7662353515625, -2.61175537109375, -2.457275390625, -2.30279541015625, -2.1483154296875, -1.99383544921875, -1.83935546875, -1.68487548828125, -1.5303955078125, -1.37591552734375, -1.221435546875, -1.06695556640625, -0.9124755859375, -0.75799560546875, -0.603515625, -0.44903564453125, -0.2945556640625, -0.14007568359375, 0.014404296875, 0.16888427734375, 0.3233642578125, 0.47784423828125, 0.63232421875, 0.78680419921875, 0.9412841796875, 1.09576416015625, 1.250244140625, 1.40472412109375, 1.5592041015625, 1.71368408203125, 1.8681640625, 2.02264404296875, 2.1771240234375, 2.33160400390625, 2.486083984375, 2.64056396484375, 2.7950439453125, 2.94952392578125, 3.10400390625, 3.25848388671875, 3.4129638671875, 3.56744384765625, 3.721923828125, 3.87640380859375, 4.0308837890625, 4.18536376953125, 4.33984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 5.0, 11.0, 29.0, 93.0, 264.0, 382.0, 117.0, 41.0, 12.0, 7.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.923828125, -1.85784912109375, -1.7918701171875, -1.72589111328125, -1.659912109375, -1.59393310546875, -1.5279541015625, -1.46197509765625, -1.39599609375, -1.33001708984375, -1.2640380859375, -1.19805908203125, -1.132080078125, -1.06610107421875, -1.0001220703125, -0.93414306640625, -0.8681640625, -0.80218505859375, -0.7362060546875, -0.67022705078125, -0.604248046875, -0.53826904296875, -0.4722900390625, -0.40631103515625, -0.34033203125, -0.27435302734375, -0.2083740234375, -0.14239501953125, -0.076416015625, -0.01043701171875, 0.0555419921875, 0.12152099609375, 0.1875, 0.25347900390625, 0.3194580078125, 0.38543701171875, 0.451416015625, 0.51739501953125, 0.5833740234375, 0.64935302734375, 0.71533203125, 0.78131103515625, 0.8472900390625, 0.91326904296875, 0.979248046875, 1.04522705078125, 1.1112060546875, 1.17718505859375, 1.2431640625, 1.30914306640625, 1.3751220703125, 1.44110107421875, 1.507080078125, 1.57305908203125, 1.6390380859375, 1.70501708984375, 1.77099609375, 1.83697509765625, 1.9029541015625, 1.96893310546875, 2.034912109375, 2.10089111328125, 2.1668701171875, 2.23284912109375, 2.298828125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 11.0, 19.0, 22.0, 67.0, 288.0, 2357.0, 1013239.0, 31074.0, 1174.0, 188.0, 33.0, 18.0, 15.0, 13.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.375, -42.13037109375, -40.8857421875, -39.64111328125, -38.396484375, -37.15185546875, -35.9072265625, -34.66259765625, -33.41796875, -32.17333984375, -30.9287109375, -29.68408203125, -28.439453125, -27.19482421875, -25.9501953125, -24.70556640625, -23.4609375, -22.21630859375, -20.9716796875, -19.72705078125, -18.482421875, -17.23779296875, -15.9931640625, -14.74853515625, -13.50390625, -12.25927734375, -11.0146484375, -9.77001953125, -8.525390625, -7.28076171875, -6.0361328125, -4.79150390625, -3.546875, -2.30224609375, -1.0576171875, 0.18701171875, 1.431640625, 2.67626953125, 3.9208984375, 5.16552734375, 6.41015625, 7.65478515625, 8.8994140625, 10.14404296875, 11.388671875, 12.63330078125, 13.8779296875, 15.12255859375, 16.3671875, 17.61181640625, 18.8564453125, 20.10107421875, 21.345703125, 22.59033203125, 23.8349609375, 25.07958984375, 26.32421875, 27.56884765625, 28.8134765625, 30.05810546875, 31.302734375, 32.54736328125, 33.7919921875, 35.03662109375, 36.28125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 12.0, 20.0, 24.0, 39.0, 62.0, 140.0, 210.0, 216.0, 115.0, 52.0, 33.0, 28.0, 10.0, 7.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7362329959869385, -3.644993305206299, -3.55375337600708, -3.4625136852264404, -3.3712737560272217, -3.280034065246582, -3.1887941360473633, -3.0975544452667236, -3.006314754486084, -2.9150750637054443, -2.8238351345062256, -2.732595443725586, -2.641355514526367, -2.5501158237457275, -2.458876132965088, -2.367636203765869, -2.2763962745666504, -2.1851565837860107, -2.093916654586792, -2.0026769638061523, -1.9114370346069336, -1.820197343826294, -1.7289575338363647, -1.6377177238464355, -1.5464779138565063, -1.4552381038665771, -1.363998293876648, -1.2727584838867188, -1.181518793106079, -1.0902788639068604, -0.9990391731262207, -0.9077993631362915, -0.8165597915649414, -0.7253199815750122, -0.634080171585083, -0.5428404211997986, -0.4516006112098694, -0.3603608012199402, -0.26912105083465576, -0.17788124084472656, -0.08664143085479736, 0.004598364233970642, 0.09583815932273865, 0.18707793951034546, 0.27831774950027466, 0.36955755949020386, 0.4607973098754883, 0.5520371198654175, 0.6432769298553467, 0.7345167398452759, 0.8257565498352051, 0.9169963002204895, 1.0082361698150635, 1.0994758605957031, 1.1907156705856323, 1.2819554805755615, 1.3731952905654907, 1.46443510055542, 1.5556749105453491, 1.6469147205352783, 1.738154411315918, 1.8293943405151367, 1.9206340312957764, 2.011873722076416, 2.1031136512756348]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 12.0, 16.0, 18.0, 28.0, 13.0, 25.0, 31.0, 25.0, 38.0, 27.0, 39.0, 35.0, 41.0, 35.0, 37.0, 37.0, 37.0, 43.0, 34.0, 46.0, 45.0, 23.0, 36.0, 31.0, 20.0, 27.0, 20.0, 18.0, 18.0, 18.0, 17.0, 9.0, 3.0, 10.0, 8.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1061121225357056, -1.0673414468765259, -1.0285708904266357, -0.989800214767456, -0.9510295391082764, -0.9122588634490967, -0.8734882473945618, -0.8347176313400269, -0.7959469556808472, -0.7571762800216675, -0.7184056639671326, -0.6796350479125977, -0.640864372253418, -0.6020936965942383, -0.5633230805397034, -0.5245524644851685, -0.48578178882598877, -0.44701114296913147, -0.40824049711227417, -0.36946985125541687, -0.33069920539855957, -0.29192855954170227, -0.25315791368484497, -0.21438726782798767, -0.17561662197113037, -0.13684597611427307, -0.09807533025741577, -0.05930468440055847, -0.020534038543701172, 0.018236607313156128, 0.05700725317001343, 0.09577789902687073, 0.13454842567443848, 0.17331907153129578, 0.21208971738815308, 0.2508603632450104, 0.2896310091018677, 0.328401654958725, 0.3671723008155823, 0.4059429466724396, 0.4447135925292969, 0.4834842383861542, 0.5222548842430115, 0.5610255002975464, 0.5997961759567261, 0.6385668516159058, 0.6773374676704407, 0.7161080837249756, 0.7548787593841553, 0.793649435043335, 0.8324200510978699, 0.8711906671524048, 0.9099613428115845, 0.9487320184707642, 0.9875026345252991, 1.026273250579834, 1.0650439262390137, 1.1038146018981934, 1.142585277557373, 1.1813558340072632, 1.2201265096664429, 1.2588971853256226, 1.2976677417755127, 1.3364384174346924, 1.375209093093872]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 1.0, 6.0, 7.0, 11.0, 15.0, 21.0, 21.0, 19.0, 27.0, 27.0, 27.0, 41.0, 38.0, 34.0, 33.0, 46.0, 39.0, 36.0, 51.0, 43.0, 54.0, 48.0, 42.0, 34.0, 46.0, 30.0, 37.0, 32.0, 22.0, 15.0, 16.0, 18.0, 12.0, 5.0, 4.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -2.994903564453125, -2.89996337890625, -2.805023193359375, -2.7100830078125, -2.615142822265625, -2.52020263671875, -2.425262451171875, -2.330322265625, -2.235382080078125, -2.14044189453125, -2.045501708984375, -1.9505615234375, -1.855621337890625, -1.76068115234375, -1.665740966796875, -1.57080078125, -1.475860595703125, -1.38092041015625, -1.285980224609375, -1.1910400390625, -1.096099853515625, -1.00115966796875, -0.906219482421875, -0.811279296875, -0.716339111328125, -0.62139892578125, -0.526458740234375, -0.4315185546875, -0.336578369140625, -0.24163818359375, -0.146697998046875, -0.0517578125, 0.043182373046875, 0.13812255859375, 0.233062744140625, 0.3280029296875, 0.422943115234375, 0.51788330078125, 0.612823486328125, 0.707763671875, 0.802703857421875, 0.89764404296875, 0.992584228515625, 1.0875244140625, 1.182464599609375, 1.27740478515625, 1.372344970703125, 1.46728515625, 1.562225341796875, 1.65716552734375, 1.752105712890625, 1.8470458984375, 1.941986083984375, 2.03692626953125, 2.131866455078125, 2.226806640625, 2.321746826171875, 2.41668701171875, 2.511627197265625, 2.6065673828125, 2.701507568359375, 2.79644775390625, 2.891387939453125, 2.986328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 16.0, 13.0, 20.0, 31.0, 38.0, 56.0, 72.0, 88.0, 150.0, 195.0, 296.0, 450.0, 668.0, 1083.0, 1888.0, 3350.0, 6361.0, 13076.0, 30335.0, 88294.0, 455232.0, 324358.0, 71486.0, 25855.0, 11640.0, 5749.0, 3004.0, 1699.0, 1050.0, 615.0, 387.0, 286.0, 191.0, 147.0, 108.0, 83.0, 44.0, 32.0, 27.0, 16.0, 13.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-5.60546875, -5.440185546875, -5.27490234375, -5.109619140625, -4.9443359375, -4.779052734375, -4.61376953125, -4.448486328125, -4.283203125, -4.117919921875, -3.95263671875, -3.787353515625, -3.6220703125, -3.456787109375, -3.29150390625, -3.126220703125, -2.9609375, -2.795654296875, -2.63037109375, -2.465087890625, -2.2998046875, -2.134521484375, -1.96923828125, -1.803955078125, -1.638671875, -1.473388671875, -1.30810546875, -1.142822265625, -0.9775390625, -0.812255859375, -0.64697265625, -0.481689453125, -0.31640625, -0.151123046875, 0.01416015625, 0.179443359375, 0.3447265625, 0.510009765625, 0.67529296875, 0.840576171875, 1.005859375, 1.171142578125, 1.33642578125, 1.501708984375, 1.6669921875, 1.832275390625, 1.99755859375, 2.162841796875, 2.328125, 2.493408203125, 2.65869140625, 2.823974609375, 2.9892578125, 3.154541015625, 3.31982421875, 3.485107421875, 3.650390625, 3.815673828125, 3.98095703125, 4.146240234375, 4.3115234375, 4.476806640625, 4.64208984375, 4.807373046875, 4.97265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 3.0, 13.0, 8.0, 14.0, 13.0, 15.0, 17.0, 21.0, 22.0, 23.0, 23.0, 34.0, 42.0, 44.0, 43.0, 66.0, 77.0, 146.0, 336.0, 1393.0, 143.0, 76.0, 65.0, 43.0, 44.0, 44.0, 43.0, 40.0, 32.0, 27.0, 17.0, 15.0, 21.0, 11.0, 2.0, 10.0, 15.0, 7.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.28125, -8.98193359375, -8.6826171875, -8.38330078125, -8.083984375, -7.78466796875, -7.4853515625, -7.18603515625, -6.88671875, -6.58740234375, -6.2880859375, -5.98876953125, -5.689453125, -5.39013671875, -5.0908203125, -4.79150390625, -4.4921875, -4.19287109375, -3.8935546875, -3.59423828125, -3.294921875, -2.99560546875, -2.6962890625, -2.39697265625, -2.09765625, -1.79833984375, -1.4990234375, -1.19970703125, -0.900390625, -0.60107421875, -0.3017578125, -0.00244140625, 0.296875, 0.59619140625, 0.8955078125, 1.19482421875, 1.494140625, 1.79345703125, 2.0927734375, 2.39208984375, 2.69140625, 2.99072265625, 3.2900390625, 3.58935546875, 3.888671875, 4.18798828125, 4.4873046875, 4.78662109375, 5.0859375, 5.38525390625, 5.6845703125, 5.98388671875, 6.283203125, 6.58251953125, 6.8818359375, 7.18115234375, 7.48046875, 7.77978515625, 8.0791015625, 8.37841796875, 8.677734375, 8.97705078125, 9.2763671875, 9.57568359375, 9.875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 10.0, 16.0, 14.0, 21.0, 38.0, 30.0, 62.0, 88.0, 111.0, 185.0, 343.0, 746.0, 2014.0, 9220.0, 126202.0, 2919810.0, 76425.0, 7107.0, 1737.0, 659.0, 292.0, 175.0, 88.0, 70.0, 63.0, 42.0, 28.0, 24.0, 17.0, 13.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.15673828125, -17.4697265625, -16.78271484375, -16.095703125, -15.40869140625, -14.7216796875, -14.03466796875, -13.34765625, -12.66064453125, -11.9736328125, -11.28662109375, -10.599609375, -9.91259765625, -9.2255859375, -8.53857421875, -7.8515625, -7.16455078125, -6.4775390625, -5.79052734375, -5.103515625, -4.41650390625, -3.7294921875, -3.04248046875, -2.35546875, -1.66845703125, -0.9814453125, -0.29443359375, 0.392578125, 1.07958984375, 1.7666015625, 2.45361328125, 3.140625, 3.82763671875, 4.5146484375, 5.20166015625, 5.888671875, 6.57568359375, 7.2626953125, 7.94970703125, 8.63671875, 9.32373046875, 10.0107421875, 10.69775390625, 11.384765625, 12.07177734375, 12.7587890625, 13.44580078125, 14.1328125, 14.81982421875, 15.5068359375, 16.19384765625, 16.880859375, 17.56787109375, 18.2548828125, 18.94189453125, 19.62890625, 20.31591796875, 21.0029296875, 21.68994140625, 22.376953125, 23.06396484375, 23.7509765625, 24.43798828125, 25.125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 34.0, 769.0, 209.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.653095245361328, -17.30721664428711, -10.961339950561523, -4.6154632568359375, 1.7304153442382812, 8.0762939453125, 14.422168731689453, 20.768047332763672, 27.11392593383789, 33.45980453491211, 39.80567932128906, 46.15155792236328, 52.4974365234375, 58.84331512451172, 65.18919372558594, 71.53506469726562, 77.88095092773438, 84.2268295288086, 90.57270812988281, 96.9185791015625, 103.26446533203125, 109.61033630371094, 115.95621490478516, 122.30209350585938, 128.64796447753906, 134.99383544921875, 141.3397216796875, 147.6855926513672, 154.03147888183594, 160.37734985351562, 166.72323608398438, 173.06910705566406, 179.41497802734375, 185.76084899902344, 192.1067352294922, 198.45260620117188, 204.79849243164062, 211.1443634033203, 217.490234375, 223.83612060546875, 230.1820068359375, 236.5278778076172, 242.87376403808594, 249.21963500976562, 255.56552124023438, 261.9114074707031, 268.25726318359375, 274.6031494140625, 280.94903564453125, 287.294921875, 293.6407775878906, 299.9866638183594, 306.3325500488281, 312.6784362792969, 319.0242919921875, 325.37017822265625, 331.7160339355469, 338.0619201660156, 344.40777587890625, 350.753662109375, 357.09954833984375, 363.4454345703125, 369.7912902832031, 376.1371765136719, 382.4830627441406]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 9.0, 7.0, 12.0, 23.0, 21.0, 23.0, 25.0, 32.0, 35.0, 27.0, 35.0, 34.0, 35.0, 45.0, 50.0, 37.0, 47.0, 39.0, 40.0, 40.0, 39.0, 37.0, 27.0, 46.0, 23.0, 30.0, 30.0, 18.0, 25.0, 19.0, 16.0, 6.0, 7.0, 11.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.468902587890625, -31.489551544189453, -30.51020050048828, -29.53084945678711, -28.551498413085938, -27.572147369384766, -26.592798233032227, -25.613447189331055, -24.634096145629883, -23.65474510192871, -22.67539405822754, -21.696043014526367, -20.716693878173828, -19.737342834472656, -18.757991790771484, -17.778640747070312, -16.79928970336914, -15.819938659667969, -14.840587615966797, -13.861237525939941, -12.88188648223877, -11.902535438537598, -10.923185348510742, -9.94383430480957, -8.964483261108398, -7.985132217407227, -7.005781650543213, -6.026431083679199, -5.047080039978027, -4.0677289962768555, -3.088378429412842, -2.109027862548828, -1.129678726196289, -0.1503279209136963, 0.8290228843688965, 1.8083736896514893, 2.787724494934082, 3.767075538635254, 4.746426105499268, 5.725776672363281, 6.705127716064453, 7.684478759765625, 8.663829803466797, 9.643179893493652, 10.622530937194824, 11.601881980895996, 12.581232070922852, 13.560583114624023, 14.539934158325195, 15.519285202026367, 16.49863624572754, 17.47798728942871, 18.45733642578125, 19.436687469482422, 20.416038513183594, 21.395389556884766, 22.374740600585938, 23.35409164428711, 24.33344268798828, 25.312793731689453, 26.292144775390625, 27.271495819091797, 28.250844955444336, 29.230195999145508, 30.20954704284668]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 7.0, 10.0, 11.0, 14.0, 12.0, 21.0, 23.0, 19.0, 25.0, 21.0, 31.0, 27.0, 29.0, 35.0, 40.0, 31.0, 32.0, 38.0, 45.0, 53.0, 54.0, 39.0, 35.0, 46.0, 28.0, 36.0, 30.0, 28.0, 25.0, 26.0, 25.0, 12.0, 14.0, 14.0, 15.0, 8.0, 14.0, 12.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.91796875, -2.821807861328125, -2.72564697265625, -2.629486083984375, -2.5333251953125, -2.437164306640625, -2.34100341796875, -2.244842529296875, -2.148681640625, -2.052520751953125, -1.95635986328125, -1.860198974609375, -1.7640380859375, -1.667877197265625, -1.57171630859375, -1.475555419921875, -1.37939453125, -1.283233642578125, -1.18707275390625, -1.090911865234375, -0.9947509765625, -0.898590087890625, -0.80242919921875, -0.706268310546875, -0.610107421875, -0.513946533203125, -0.41778564453125, -0.321624755859375, -0.2254638671875, -0.129302978515625, -0.03314208984375, 0.063018798828125, 0.1591796875, 0.255340576171875, 0.35150146484375, 0.447662353515625, 0.5438232421875, 0.639984130859375, 0.73614501953125, 0.832305908203125, 0.928466796875, 1.024627685546875, 1.12078857421875, 1.216949462890625, 1.3131103515625, 1.409271240234375, 1.50543212890625, 1.601593017578125, 1.69775390625, 1.793914794921875, 1.89007568359375, 1.986236572265625, 2.0823974609375, 2.178558349609375, 2.27471923828125, 2.370880126953125, 2.467041015625, 2.563201904296875, 2.65936279296875, 2.755523681640625, 2.8516845703125, 2.947845458984375, 3.04400634765625, 3.140167236328125, 3.236328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 3.0, 7.0, 9.0, 19.0, 25.0, 50.0, 69.0, 88.0, 148.0, 236.0, 324.0, 512.0, 777.0, 1328.0, 2218.0, 3888.0, 7189.0, 13124.0, 26238.0, 61253.0, 262474.0, 1811125.0, 1664721.0, 229785.0, 55583.0, 24292.0, 12325.0, 6724.0, 3719.0, 2227.0, 1390.0, 889.0, 527.0, 331.0, 212.0, 122.0, 112.0, 74.0, 49.0, 35.0, 24.0, 17.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96484375, -5.76580810546875, -5.5667724609375, -5.36773681640625, -5.168701171875, -4.96966552734375, -4.7706298828125, -4.57159423828125, -4.37255859375, -4.17352294921875, -3.9744873046875, -3.77545166015625, -3.576416015625, -3.37738037109375, -3.1783447265625, -2.97930908203125, -2.7802734375, -2.58123779296875, -2.3822021484375, -2.18316650390625, -1.984130859375, -1.78509521484375, -1.5860595703125, -1.38702392578125, -1.18798828125, -0.98895263671875, -0.7899169921875, -0.59088134765625, -0.391845703125, -0.19281005859375, 0.0062255859375, 0.20526123046875, 0.404296875, 0.60333251953125, 0.8023681640625, 1.00140380859375, 1.200439453125, 1.39947509765625, 1.5985107421875, 1.79754638671875, 1.99658203125, 2.19561767578125, 2.3946533203125, 2.59368896484375, 2.792724609375, 2.99176025390625, 3.1907958984375, 3.38983154296875, 3.5888671875, 3.78790283203125, 3.9869384765625, 4.18597412109375, 4.385009765625, 4.58404541015625, 4.7830810546875, 4.98211669921875, 5.18115234375, 5.38018798828125, 5.5792236328125, 5.77825927734375, 5.977294921875, 6.17633056640625, 6.3753662109375, 6.57440185546875, 6.7734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 12.0, 18.0, 26.0, 24.0, 42.0, 38.0, 51.0, 57.0, 94.0, 106.0, 207.0, 360.0, 517.0, 685.0, 590.0, 375.0, 236.0, 155.0, 85.0, 86.0, 51.0, 43.0, 46.0, 31.0, 18.0, 15.0, 15.0, 16.0, 7.0, 6.0, 2.0, 10.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86138916015625, -5.6329345703125, -5.40447998046875, -5.176025390625, -4.94757080078125, -4.7191162109375, -4.49066162109375, -4.26220703125, -4.03375244140625, -3.8052978515625, -3.57684326171875, -3.348388671875, -3.11993408203125, -2.8914794921875, -2.66302490234375, -2.4345703125, -2.20611572265625, -1.9776611328125, -1.74920654296875, -1.520751953125, -1.29229736328125, -1.0638427734375, -0.83538818359375, -0.60693359375, -0.37847900390625, -0.1500244140625, 0.07843017578125, 0.306884765625, 0.53533935546875, 0.7637939453125, 0.99224853515625, 1.220703125, 1.44915771484375, 1.6776123046875, 1.90606689453125, 2.134521484375, 2.36297607421875, 2.5914306640625, 2.81988525390625, 3.04833984375, 3.27679443359375, 3.5052490234375, 3.73370361328125, 3.962158203125, 4.19061279296875, 4.4190673828125, 4.64752197265625, 4.8759765625, 5.10443115234375, 5.3328857421875, 5.56134033203125, 5.789794921875, 6.01824951171875, 6.2467041015625, 6.47515869140625, 6.70361328125, 6.93206787109375, 7.1605224609375, 7.38897705078125, 7.617431640625, 7.84588623046875, 8.0743408203125, 8.30279541015625, 8.53125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 5.0, 1.0, 11.0, 13.0, 15.0, 15.0, 21.0, 32.0, 38.0, 57.0, 73.0, 160.0, 306.0, 952.0, 4114.0, 25760.0, 339750.0, 3681674.0, 123746.0, 13763.0, 2507.0, 611.0, 232.0, 114.0, 74.0, 50.0, 37.0, 37.0, 29.0, 13.0, 11.0, 11.0, 12.0, 3.0, 8.0, 8.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0], "bins": [-27.09375, -26.3681640625, -25.642578125, -24.9169921875, -24.19140625, -23.4658203125, -22.740234375, -22.0146484375, -21.2890625, -20.5634765625, -19.837890625, -19.1123046875, -18.38671875, -17.6611328125, -16.935546875, -16.2099609375, -15.484375, -14.7587890625, -14.033203125, -13.3076171875, -12.58203125, -11.8564453125, -11.130859375, -10.4052734375, -9.6796875, -8.9541015625, -8.228515625, -7.5029296875, -6.77734375, -6.0517578125, -5.326171875, -4.6005859375, -3.875, -3.1494140625, -2.423828125, -1.6982421875, -0.97265625, -0.2470703125, 0.478515625, 1.2041015625, 1.9296875, 2.6552734375, 3.380859375, 4.1064453125, 4.83203125, 5.5576171875, 6.283203125, 7.0087890625, 7.734375, 8.4599609375, 9.185546875, 9.9111328125, 10.63671875, 11.3623046875, 12.087890625, 12.8134765625, 13.5390625, 14.2646484375, 14.990234375, 15.7158203125, 16.44140625, 17.1669921875, 17.892578125, 18.6181640625, 19.34375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 9.0, 14.0, 30.0, 72.0, 97.0, 120.0, 172.0, 179.0, 131.0, 66.0, 47.0, 22.0, 9.0, 12.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.42725372314453, -44.872169494628906, -43.31708526611328, -41.76200485229492, -40.2069206237793, -38.65183639526367, -37.09675598144531, -35.54167175292969, -33.98658752441406, -32.43150329589844, -30.876420974731445, -29.321338653564453, -27.766254425048828, -26.211170196533203, -24.65608787536621, -23.10100555419922, -21.545921325683594, -19.99083709716797, -18.435754776000977, -16.880672454833984, -15.32558822631836, -13.77050495147705, -12.215421676635742, -10.660338401794434, -9.105255126953125, -7.550171852111816, -5.995088577270508, -4.440005302429199, -2.8849220275878906, -1.329838752746582, 0.22524452209472656, 1.7803277969360352, 3.3354110717773438, 4.890494346618652, 6.445577621459961, 8.00066089630127, 9.555744171142578, 11.110827445983887, 12.665910720825195, 14.220993995666504, 15.776077270507812, 17.331161499023438, 18.88624382019043, 20.441326141357422, 21.996410369873047, 23.551494598388672, 25.106576919555664, 26.661659240722656, 28.21674346923828, 29.771827697753906, 31.3269100189209, 32.88199234008789, 34.437076568603516, 35.99216079711914, 37.5472412109375, 39.102325439453125, 40.65740966796875, 42.212493896484375, 43.767578125, 45.32265853881836, 46.877742767333984, 48.43282699584961, 49.98790740966797, 51.542991638183594, 53.09807586669922]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 7.0, 7.0, 11.0, 13.0, 12.0, 15.0, 14.0, 26.0, 26.0, 41.0, 28.0, 36.0, 27.0, 40.0, 46.0, 54.0, 48.0, 46.0, 49.0, 30.0, 43.0, 50.0, 41.0, 40.0, 32.0, 21.0, 17.0, 30.0, 24.0, 16.0, 14.0, 16.0, 15.0, 9.0, 16.0, 5.0, 9.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.067045211791992, -24.29473876953125, -23.522430419921875, -22.750123977661133, -21.97781753540039, -21.20551109313965, -20.433202743530273, -19.66089630126953, -18.88858985900879, -18.116283416748047, -17.343975067138672, -16.57166862487793, -15.799362182617188, -15.027054786682129, -14.25474739074707, -13.482440948486328, -12.71013355255127, -11.937826156616211, -11.165519714355469, -10.39321231842041, -9.620905876159668, -8.84859848022461, -8.076292037963867, -7.303984642028809, -6.531677722930908, -5.759370803833008, -4.987063884735107, -4.214756965637207, -3.4424498081207275, -2.670142889022827, -1.8978357315063477, -1.1255288124084473, -0.3532218933105469, 0.4190850853919983, 1.1913920640945435, 1.9636991024017334, 2.736006021499634, 3.508312940597534, 4.280620098114014, 5.052927017211914, 5.8252339363098145, 6.597540855407715, 7.369847774505615, 8.142154693603516, 8.914462089538574, 9.686768531799316, 10.459075927734375, 11.231382369995117, 12.003689765930176, 12.775997161865234, 13.548303604125977, 14.320611000061035, 15.092917442321777, 15.865224838256836, 16.637531280517578, 17.409839630126953, 18.182146072387695, 18.954452514648438, 19.726760864257812, 20.499067306518555, 21.271373748779297, 22.04368019104004, 22.815988540649414, 23.588294982910156, 24.3606014251709]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 5.0, 6.0, 17.0, 10.0, 15.0, 23.0, 19.0, 26.0, 30.0, 29.0, 27.0, 27.0, 54.0, 41.0, 41.0, 51.0, 45.0, 47.0, 38.0, 42.0, 51.0, 46.0, 35.0, 33.0, 20.0, 37.0, 27.0, 27.0, 16.0, 22.0, 19.0, 15.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.171875, -3.074005126953125, -2.97613525390625, -2.878265380859375, -2.7803955078125, -2.682525634765625, -2.58465576171875, -2.486785888671875, -2.388916015625, -2.291046142578125, -2.19317626953125, -2.095306396484375, -1.9974365234375, -1.899566650390625, -1.80169677734375, -1.703826904296875, -1.60595703125, -1.508087158203125, -1.41021728515625, -1.312347412109375, -1.2144775390625, -1.116607666015625, -1.01873779296875, -0.920867919921875, -0.822998046875, -0.725128173828125, -0.62725830078125, -0.529388427734375, -0.4315185546875, -0.333648681640625, -0.23577880859375, -0.137908935546875, -0.0400390625, 0.057830810546875, 0.15570068359375, 0.253570556640625, 0.3514404296875, 0.449310302734375, 0.54718017578125, 0.645050048828125, 0.742919921875, 0.840789794921875, 0.93865966796875, 1.036529541015625, 1.1343994140625, 1.232269287109375, 1.33013916015625, 1.428009033203125, 1.52587890625, 1.623748779296875, 1.72161865234375, 1.819488525390625, 1.9173583984375, 2.015228271484375, 2.11309814453125, 2.210968017578125, 2.308837890625, 2.406707763671875, 2.50457763671875, 2.602447509765625, 2.7003173828125, 2.798187255859375, 2.89605712890625, 2.993927001953125, 3.091796875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 12.0, 19.0, 17.0, 34.0, 30.0, 58.0, 48.0, 73.0, 111.0, 130.0, 176.0, 262.0, 384.0, 531.0, 732.0, 1053.0, 1446.0, 2225.0, 3469.0, 5939.0, 13468.0, 56814.0, 526579.0, 367296.0, 40773.0, 11307.0, 5430.0, 3244.0, 2006.0, 1451.0, 962.0, 630.0, 479.0, 347.0, 277.0, 203.0, 141.0, 101.0, 72.0, 53.0, 55.0, 29.0, 16.0, 11.0, 17.0, 10.0, 7.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.30078125, -4.17010498046875, -4.0394287109375, -3.90875244140625, -3.778076171875, -3.64739990234375, -3.5167236328125, -3.38604736328125, -3.25537109375, -3.12469482421875, -2.9940185546875, -2.86334228515625, -2.732666015625, -2.60198974609375, -2.4713134765625, -2.34063720703125, -2.2099609375, -2.07928466796875, -1.9486083984375, -1.81793212890625, -1.687255859375, -1.55657958984375, -1.4259033203125, -1.29522705078125, -1.16455078125, -1.03387451171875, -0.9031982421875, -0.77252197265625, -0.641845703125, -0.51116943359375, -0.3804931640625, -0.24981689453125, -0.119140625, 0.01153564453125, 0.1422119140625, 0.27288818359375, 0.403564453125, 0.53424072265625, 0.6649169921875, 0.79559326171875, 0.92626953125, 1.05694580078125, 1.1876220703125, 1.31829833984375, 1.448974609375, 1.57965087890625, 1.7103271484375, 1.84100341796875, 1.9716796875, 2.10235595703125, 2.2330322265625, 2.36370849609375, 2.494384765625, 2.62506103515625, 2.7557373046875, 2.88641357421875, 3.01708984375, 3.14776611328125, 3.2784423828125, 3.40911865234375, 3.539794921875, 3.67047119140625, 3.8011474609375, 3.93182373046875, 4.0625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 16.0, 17.0, 26.0, 20.0, 16.0, 30.0, 42.0, 37.0, 32.0, 29.0, 48.0, 26.0, 31.0, 34.0, 1067.0, 49.0, 39.0, 37.0, 41.0, 36.0, 33.0, 32.0, 29.0, 22.0, 25.0, 18.0, 19.0, 20.0, 19.0, 20.0, 6.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.1060791015625, -2.034423828125, -1.9627685546875, -1.89111328125, -1.8194580078125, -1.747802734375, -1.6761474609375, -1.6044921875, -1.5328369140625, -1.461181640625, -1.3895263671875, -1.31787109375, -1.2462158203125, -1.174560546875, -1.1029052734375, -1.03125, -0.9595947265625, -0.887939453125, -0.8162841796875, -0.74462890625, -0.6729736328125, -0.601318359375, -0.5296630859375, -0.4580078125, -0.3863525390625, -0.314697265625, -0.2430419921875, -0.17138671875, -0.0997314453125, -0.028076171875, 0.0435791015625, 0.115234375, 0.1868896484375, 0.258544921875, 0.3302001953125, 0.40185546875, 0.4735107421875, 0.545166015625, 0.6168212890625, 0.6884765625, 0.7601318359375, 0.831787109375, 0.9034423828125, 0.97509765625, 1.0467529296875, 1.118408203125, 1.1900634765625, 1.26171875, 1.3333740234375, 1.405029296875, 1.4766845703125, 1.54833984375, 1.6199951171875, 1.691650390625, 1.7633056640625, 1.8349609375, 1.9066162109375, 1.978271484375, 2.0499267578125, 2.12158203125, 2.1932373046875, 2.264892578125, 2.3365478515625, 2.408203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 7.0, 7.0, 9.0, 6.0, 19.0, 19.0, 20.0, 27.0, 48.0, 40.0, 72.0, 89.0, 109.0, 164.0, 207.0, 262.0, 363.0, 516.0, 735.0, 1191.0, 2089.0, 4056.0, 11325.0, 85587.0, 1878081.0, 89849.0, 11968.0, 4229.0, 2040.0, 1218.0, 770.0, 541.0, 382.0, 248.0, 187.0, 160.0, 112.0, 103.0, 53.0, 59.0, 43.0, 27.0, 29.0, 18.0, 18.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-3.974609375, -3.855987548828125, -3.73736572265625, -3.618743896484375, -3.5001220703125, -3.381500244140625, -3.26287841796875, -3.144256591796875, -3.025634765625, -2.907012939453125, -2.78839111328125, -2.669769287109375, -2.5511474609375, -2.432525634765625, -2.31390380859375, -2.195281982421875, -2.07666015625, -1.958038330078125, -1.83941650390625, -1.720794677734375, -1.6021728515625, -1.483551025390625, -1.36492919921875, -1.246307373046875, -1.127685546875, -1.009063720703125, -0.89044189453125, -0.771820068359375, -0.6531982421875, -0.534576416015625, -0.41595458984375, -0.297332763671875, -0.1787109375, -0.060089111328125, 0.05853271484375, 0.177154541015625, 0.2957763671875, 0.414398193359375, 0.53302001953125, 0.651641845703125, 0.770263671875, 0.888885498046875, 1.00750732421875, 1.126129150390625, 1.2447509765625, 1.363372802734375, 1.48199462890625, 1.600616455078125, 1.71923828125, 1.837860107421875, 1.95648193359375, 2.075103759765625, 2.1937255859375, 2.312347412109375, 2.43096923828125, 2.549591064453125, 2.668212890625, 2.786834716796875, 2.90545654296875, 3.024078369140625, 3.1427001953125, 3.261322021484375, 3.37994384765625, 3.498565673828125, 3.6171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 15.0, 17.0, 10.0, 32.0, 40.0, 78.0, 132.0, 155.0, 146.0, 101.0, 77.0, 49.0, 25.0, 27.0, 21.0, 7.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.45072174072265625, -0.4365997314453125, -0.42247772216796875, -0.408355712890625, -0.39423370361328125, -0.3801116943359375, -0.36598968505859375, -0.35186767578125, -0.33774566650390625, -0.3236236572265625, -0.30950164794921875, -0.295379638671875, -0.28125762939453125, -0.2671356201171875, -0.25301361083984375, -0.2388916015625, -0.22476959228515625, -0.2106475830078125, -0.19652557373046875, -0.182403564453125, -0.16828155517578125, -0.1541595458984375, -0.14003753662109375, -0.12591552734375, -0.11179351806640625, -0.0976715087890625, -0.08354949951171875, -0.069427490234375, -0.05530548095703125, -0.0411834716796875, -0.02706146240234375, -0.012939453125, 0.00118255615234375, 0.0153045654296875, 0.02942657470703125, 0.043548583984375, 0.05767059326171875, 0.0717926025390625, 0.08591461181640625, 0.10003662109375, 0.11415863037109375, 0.1282806396484375, 0.14240264892578125, 0.156524658203125, 0.17064666748046875, 0.1847686767578125, 0.19889068603515625, 0.2130126953125, 0.22713470458984375, 0.2412567138671875, 0.25537872314453125, 0.269500732421875, 0.28362274169921875, 0.2977447509765625, 0.31186676025390625, 0.32598876953125, 0.34011077880859375, 0.3542327880859375, 0.36835479736328125, 0.382476806640625, 0.39659881591796875, 0.4107208251953125, 0.42484283447265625, 0.43896484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 13.0, 30.0, 34.0, 56.0, 111.0, 378.0, 3271.0, 188902.0, 850654.0, 4317.0, 480.0, 103.0, 56.0, 36.0, 21.0, 23.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.73291015625, -8.4423828125, -8.15185546875, -7.861328125, -7.57080078125, -7.2802734375, -6.98974609375, -6.69921875, -6.40869140625, -6.1181640625, -5.82763671875, -5.537109375, -5.24658203125, -4.9560546875, -4.66552734375, -4.375, -4.08447265625, -3.7939453125, -3.50341796875, -3.212890625, -2.92236328125, -2.6318359375, -2.34130859375, -2.05078125, -1.76025390625, -1.4697265625, -1.17919921875, -0.888671875, -0.59814453125, -0.3076171875, -0.01708984375, 0.2734375, 0.56396484375, 0.8544921875, 1.14501953125, 1.435546875, 1.72607421875, 2.0166015625, 2.30712890625, 2.59765625, 2.88818359375, 3.1787109375, 3.46923828125, 3.759765625, 4.05029296875, 4.3408203125, 4.63134765625, 4.921875, 5.21240234375, 5.5029296875, 5.79345703125, 6.083984375, 6.37451171875, 6.6650390625, 6.95556640625, 7.24609375, 7.53662109375, 7.8271484375, 8.11767578125, 8.408203125, 8.69873046875, 8.9892578125, 9.27978515625, 9.5703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 6.0, 7.0, 22.0, 51.0, 93.0, 178.0, 264.0, 224.0, 85.0, 41.0, 20.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4520385265350342, -0.4051550328731537, -0.3582715392112732, -0.3113880455493927, -0.2645045518875122, -0.2176210582256317, -0.17073756456375122, -0.12385407090187073, -0.07697057723999023, -0.03008708357810974, 0.016796410083770752, 0.06367990374565125, 0.11056339740753174, 0.15744689106941223, 0.20433038473129272, 0.2512138783931732, 0.2980973720550537, 0.3449808657169342, 0.3918643593788147, 0.4387478530406952, 0.4856313467025757, 0.5325148105621338, 0.5793983340263367, 0.6262818574905396, 0.6731653213500977, 0.7200487852096558, 0.7669323086738586, 0.8138158321380615, 0.8606992959976196, 0.9075827598571777, 0.9544662833213806, 1.0013498067855835, 1.0482332706451416, 1.0951167345046997, 1.1420001983642578, 1.1888837814331055, 1.2357672452926636, 1.2826507091522217, 1.3295342922210693, 1.3764177560806274, 1.4233012199401855, 1.4701846837997437, 1.5170681476593018, 1.5639517307281494, 1.6108351945877075, 1.6577186584472656, 1.7046022415161133, 1.7514857053756714, 1.7983691692352295, 1.8452526330947876, 1.8921360969543457, 1.9390196800231934, 1.9859031438827515, 2.0327866077423096, 2.0796701908111572, 2.126553535461426, 2.1734371185302734, 2.220320701599121, 2.2672040462493896, 2.3140876293182373, 2.360970973968506, 2.4078545570373535, 2.454738140106201, 2.5016214847564697, 2.5485050678253174]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 7.0, 2.0, 4.0, 4.0, 6.0, 14.0, 12.0, 19.0, 10.0, 18.0, 19.0, 23.0, 27.0, 29.0, 39.0, 42.0, 35.0, 40.0, 43.0, 47.0, 53.0, 55.0, 38.0, 50.0, 39.0, 32.0, 36.0, 27.0, 34.0, 27.0, 32.0, 24.0, 21.0, 18.0, 25.0, 16.0, 11.0, 6.0, 9.0, 9.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432320773601532, -0.4188823699951172, -0.40544393658638, -0.3920055329799652, -0.3785671293735504, -0.36512869596481323, -0.35169029235839844, -0.33825188875198364, -0.32481348514556885, -0.31137508153915405, -0.29793664813041687, -0.2844982445240021, -0.2710598409175873, -0.2576214075088501, -0.2441830039024353, -0.2307446002960205, -0.21730618178844452, -0.20386776328086853, -0.19042935967445374, -0.17699094116687775, -0.16355253756046295, -0.15011411905288696, -0.13667571544647217, -0.12323729693889618, -0.10979888588190079, -0.0963604748249054, -0.08292206376791, -0.06948365271091461, -0.05604523792862892, -0.04260682314634323, -0.02916841208934784, -0.015730001032352448, -0.0022915899753570557, 0.01114682201296091, 0.024585234001278877, 0.03802364692091942, 0.05146205797791481, 0.0649004727602005, 0.07833888381719589, 0.09177729487419128, 0.10521570593118668, 0.11865411698818207, 0.13209253549575806, 0.14553093910217285, 0.15896935760974884, 0.17240777611732483, 0.18584617972373962, 0.19928458333015442, 0.2127230018377304, 0.2261614203453064, 0.2395998239517212, 0.253038227558136, 0.26647666096687317, 0.27991506457328796, 0.29335346817970276, 0.30679190158843994, 0.32023030519485474, 0.33366870880126953, 0.3471071422100067, 0.3605455458164215, 0.3739839494228363, 0.3874223828315735, 0.4008607864379883, 0.4142991900444031, 0.42773759365081787]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 8.0, 8.0, 14.0, 13.0, 17.0, 13.0, 21.0, 21.0, 30.0, 27.0, 34.0, 39.0, 40.0, 41.0, 41.0, 48.0, 52.0, 43.0, 36.0, 50.0, 52.0, 49.0, 38.0, 38.0, 28.0, 37.0, 25.0, 20.0, 18.0, 25.0, 18.0, 5.0, 13.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.101531982421875, -2.99993896484375, -2.898345947265625, -2.7967529296875, -2.695159912109375, -2.59356689453125, -2.491973876953125, -2.390380859375, -2.288787841796875, -2.18719482421875, -2.085601806640625, -1.9840087890625, -1.882415771484375, -1.78082275390625, -1.679229736328125, -1.57763671875, -1.476043701171875, -1.37445068359375, -1.272857666015625, -1.1712646484375, -1.069671630859375, -0.96807861328125, -0.866485595703125, -0.764892578125, -0.663299560546875, -0.56170654296875, -0.460113525390625, -0.3585205078125, -0.256927490234375, -0.15533447265625, -0.053741455078125, 0.0478515625, 0.149444580078125, 0.25103759765625, 0.352630615234375, 0.4542236328125, 0.555816650390625, 0.65740966796875, 0.759002685546875, 0.860595703125, 0.962188720703125, 1.06378173828125, 1.165374755859375, 1.2669677734375, 1.368560791015625, 1.47015380859375, 1.571746826171875, 1.67333984375, 1.774932861328125, 1.87652587890625, 1.978118896484375, 2.0797119140625, 2.181304931640625, 2.28289794921875, 2.384490966796875, 2.486083984375, 2.587677001953125, 2.68927001953125, 2.790863037109375, 2.8924560546875, 2.994049072265625, 3.09564208984375, 3.197235107421875, 3.298828125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 6.0, 9.0, 9.0, 22.0, 20.0, 41.0, 56.0, 74.0, 90.0, 175.0, 232.0, 284.0, 471.0, 591.0, 900.0, 1295.0, 1934.0, 2830.0, 4508.0, 7087.0, 11979.0, 20823.0, 39538.0, 81988.0, 205175.0, 377068.0, 149504.0, 64158.0, 32093.0, 17405.0, 10104.0, 6228.0, 3778.0, 2568.0, 1674.0, 1174.0, 835.0, 544.0, 364.0, 286.0, 177.0, 138.0, 100.0, 70.0, 56.0, 35.0, 18.0, 18.0, 8.0, 5.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.21484375, -3.112274169921875, -3.00970458984375, -2.907135009765625, -2.8045654296875, -2.701995849609375, -2.59942626953125, -2.496856689453125, -2.394287109375, -2.291717529296875, -2.18914794921875, -2.086578369140625, -1.9840087890625, -1.881439208984375, -1.77886962890625, -1.676300048828125, -1.57373046875, -1.471160888671875, -1.36859130859375, -1.266021728515625, -1.1634521484375, -1.060882568359375, -0.95831298828125, -0.855743408203125, -0.753173828125, -0.650604248046875, -0.54803466796875, -0.445465087890625, -0.3428955078125, -0.240325927734375, -0.13775634765625, -0.035186767578125, 0.0673828125, 0.169952392578125, 0.27252197265625, 0.375091552734375, 0.4776611328125, 0.580230712890625, 0.68280029296875, 0.785369873046875, 0.887939453125, 0.990509033203125, 1.09307861328125, 1.195648193359375, 1.2982177734375, 1.400787353515625, 1.50335693359375, 1.605926513671875, 1.70849609375, 1.811065673828125, 1.91363525390625, 2.016204833984375, 2.1187744140625, 2.221343994140625, 2.32391357421875, 2.426483154296875, 2.529052734375, 2.631622314453125, 2.73419189453125, 2.836761474609375, 2.9393310546875, 3.041900634765625, 3.14447021484375, 3.247039794921875, 3.349609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 11.0, 22.0, 25.0, 14.0, 34.0, 19.0, 35.0, 35.0, 51.0, 56.0, 64.0, 90.0, 184.0, 1389.0, 300.0, 160.0, 110.0, 63.0, 58.0, 50.0, 33.0, 34.0, 25.0, 26.0, 19.0, 21.0, 12.0, 21.0, 10.0, 9.0, 9.0, 9.0, 5.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.34375, -9.998291015625, -9.65283203125, -9.307373046875, -8.9619140625, -8.616455078125, -8.27099609375, -7.925537109375, -7.580078125, -7.234619140625, -6.88916015625, -6.543701171875, -6.1982421875, -5.852783203125, -5.50732421875, -5.161865234375, -4.81640625, -4.470947265625, -4.12548828125, -3.780029296875, -3.4345703125, -3.089111328125, -2.74365234375, -2.398193359375, -2.052734375, -1.707275390625, -1.36181640625, -1.016357421875, -0.6708984375, -0.325439453125, 0.02001953125, 0.365478515625, 0.7109375, 1.056396484375, 1.40185546875, 1.747314453125, 2.0927734375, 2.438232421875, 2.78369140625, 3.129150390625, 3.474609375, 3.820068359375, 4.16552734375, 4.510986328125, 4.8564453125, 5.201904296875, 5.54736328125, 5.892822265625, 6.23828125, 6.583740234375, 6.92919921875, 7.274658203125, 7.6201171875, 7.965576171875, 8.31103515625, 8.656494140625, 9.001953125, 9.347412109375, 9.69287109375, 10.038330078125, 10.3837890625, 10.729248046875, 11.07470703125, 11.420166015625, 11.765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 11.0, 10.0, 13.0, 14.0, 26.0, 10.0, 28.0, 25.0, 42.0, 60.0, 76.0, 95.0, 114.0, 181.0, 242.0, 401.0, 939.0, 2642.0, 11768.0, 119480.0, 2786104.0, 201856.0, 15923.0, 3231.0, 1040.0, 459.0, 265.0, 168.0, 121.0, 89.0, 52.0, 50.0, 39.0, 25.0, 21.0, 18.0, 13.0, 12.0, 12.0, 7.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.28125, -18.7236328125, -18.166015625, -17.6083984375, -17.05078125, -16.4931640625, -15.935546875, -15.3779296875, -14.8203125, -14.2626953125, -13.705078125, -13.1474609375, -12.58984375, -12.0322265625, -11.474609375, -10.9169921875, -10.359375, -9.8017578125, -9.244140625, -8.6865234375, -8.12890625, -7.5712890625, -7.013671875, -6.4560546875, -5.8984375, -5.3408203125, -4.783203125, -4.2255859375, -3.66796875, -3.1103515625, -2.552734375, -1.9951171875, -1.4375, -0.8798828125, -0.322265625, 0.2353515625, 0.79296875, 1.3505859375, 1.908203125, 2.4658203125, 3.0234375, 3.5810546875, 4.138671875, 4.6962890625, 5.25390625, 5.8115234375, 6.369140625, 6.9267578125, 7.484375, 8.0419921875, 8.599609375, 9.1572265625, 9.71484375, 10.2724609375, 10.830078125, 11.3876953125, 11.9453125, 12.5029296875, 13.060546875, 13.6181640625, 14.17578125, 14.7333984375, 15.291015625, 15.8486328125, 16.40625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 618.0, 393.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2069091796875, -579.0357055664062, -568.8645629882812, -558.693359375, -548.5221557617188, -538.3510131835938, -528.1798095703125, -518.0086059570312, -507.8374328613281, -497.666259765625, -487.49505615234375, -477.3238830566406, -467.1527099609375, -456.98150634765625, -446.8103332519531, -436.63916015625, -426.46795654296875, -416.2967834472656, -406.1255798339844, -395.95440673828125, -385.783203125, -375.6120300292969, -365.44085693359375, -355.2696533203125, -345.0984802246094, -334.92730712890625, -324.756103515625, -314.5849304199219, -304.41375732421875, -294.2425537109375, -284.0713806152344, -273.90020751953125, -263.72900390625, -253.5578155517578, -243.38662719726562, -233.2154541015625, -223.0442657470703, -212.87307739257812, -202.701904296875, -192.5307159423828, -182.3595428466797, -172.1883544921875, -162.01718139648438, -151.8459930419922, -141.6748046875, -131.5036163330078, -121.33243560791016, -111.1612548828125, -100.99006652832031, -90.81887817382812, -80.64769744873047, -70.47651672363281, -60.305328369140625, -50.1341438293457, -39.96295928955078, -29.791778564453125, -19.620586395263672, -9.44940185546875, 0.7217826843261719, 10.892967224121094, 21.064151763916016, 31.235336303710938, 41.40652084350586, 51.577701568603516, 61.7488899230957]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 13.0, 20.0, 14.0, 13.0, 25.0, 34.0, 22.0, 26.0, 42.0, 31.0, 32.0, 40.0, 40.0, 51.0, 44.0, 58.0, 45.0, 44.0, 45.0, 32.0, 39.0, 32.0, 21.0, 34.0, 27.0, 29.0, 21.0, 12.0, 20.0, 12.0, 10.0, 15.0, 10.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.83502769470215, -30.820438385009766, -29.805849075317383, -28.791259765625, -27.776670455932617, -26.762081146240234, -25.747493743896484, -24.73290252685547, -23.71831512451172, -22.703725814819336, -21.689136505126953, -20.67454719543457, -19.659957885742188, -18.645368576049805, -17.630779266357422, -16.616191864013672, -15.601600646972656, -14.587011337280273, -13.57242202758789, -12.557832717895508, -11.543243408203125, -10.528654098510742, -9.514065742492676, -8.499476432800293, -7.48488712310791, -6.470297813415527, -5.4557085037231445, -4.44111967086792, -3.426530361175537, -2.4119410514831543, -1.3973522186279297, -0.3827629089355469, 0.6318283081054688, 1.646417498588562, 2.6610066890716553, 3.675595760345459, 4.690185070037842, 5.704774379730225, 6.719363212585449, 7.733952522277832, 8.748541831970215, 9.763131141662598, 10.77772045135498, 11.792308807373047, 12.80689811706543, 13.821487426757812, 14.836076736450195, 15.850666046142578, 16.86525535583496, 17.879844665527344, 18.894433975219727, 19.90902328491211, 20.923612594604492, 21.938201904296875, 22.952789306640625, 23.96738052368164, 24.98196792602539, 25.996557235717773, 27.011146545410156, 28.02573585510254, 29.040325164794922, 30.054914474487305, 31.069503784179688, 32.08409118652344, 33.09868240356445]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 10.0, 9.0, 12.0, 17.0, 23.0, 28.0, 25.0, 30.0, 27.0, 42.0, 35.0, 37.0, 53.0, 47.0, 52.0, 44.0, 51.0, 57.0, 53.0, 42.0, 42.0, 34.0, 27.0, 29.0, 24.0, 29.0, 25.0, 17.0, 14.0, 9.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5625, -3.4490966796875, -3.335693359375, -3.2222900390625, -3.10888671875, -2.9954833984375, -2.882080078125, -2.7686767578125, -2.6552734375, -2.5418701171875, -2.428466796875, -2.3150634765625, -2.20166015625, -2.0882568359375, -1.974853515625, -1.8614501953125, -1.748046875, -1.6346435546875, -1.521240234375, -1.4078369140625, -1.29443359375, -1.1810302734375, -1.067626953125, -0.9542236328125, -0.8408203125, -0.7274169921875, -0.614013671875, -0.5006103515625, -0.38720703125, -0.2738037109375, -0.160400390625, -0.0469970703125, 0.06640625, 0.1798095703125, 0.293212890625, 0.4066162109375, 0.52001953125, 0.6334228515625, 0.746826171875, 0.8602294921875, 0.9736328125, 1.0870361328125, 1.200439453125, 1.3138427734375, 1.42724609375, 1.5406494140625, 1.654052734375, 1.7674560546875, 1.880859375, 1.9942626953125, 2.107666015625, 2.2210693359375, 2.33447265625, 2.4478759765625, 2.561279296875, 2.6746826171875, 2.7880859375, 2.9014892578125, 3.014892578125, 3.1282958984375, 3.24169921875, 3.3551025390625, 3.468505859375, 3.5819091796875, 3.6953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 16.0, 26.0, 45.0, 48.0, 81.0, 112.0, 212.0, 364.0, 592.0, 929.0, 1677.0, 3071.0, 5990.0, 12374.0, 27508.0, 77017.0, 537248.0, 2880165.0, 518450.0, 75922.0, 26745.0, 12218.0, 6032.0, 3118.0, 1667.0, 1033.0, 556.0, 372.0, 223.0, 141.0, 87.0, 68.0, 48.0, 24.0, 19.0, 16.0, 12.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5, -8.2384033203125, -7.976806640625, -7.7152099609375, -7.45361328125, -7.1920166015625, -6.930419921875, -6.6688232421875, -6.4072265625, -6.1456298828125, -5.884033203125, -5.6224365234375, -5.36083984375, -5.0992431640625, -4.837646484375, -4.5760498046875, -4.314453125, -4.0528564453125, -3.791259765625, -3.5296630859375, -3.26806640625, -3.0064697265625, -2.744873046875, -2.4832763671875, -2.2216796875, -1.9600830078125, -1.698486328125, -1.4368896484375, -1.17529296875, -0.9136962890625, -0.652099609375, -0.3905029296875, -0.12890625, 0.1326904296875, 0.394287109375, 0.6558837890625, 0.91748046875, 1.1790771484375, 1.440673828125, 1.7022705078125, 1.9638671875, 2.2254638671875, 2.487060546875, 2.7486572265625, 3.01025390625, 3.2718505859375, 3.533447265625, 3.7950439453125, 4.056640625, 4.3182373046875, 4.579833984375, 4.8414306640625, 5.10302734375, 5.3646240234375, 5.626220703125, 5.8878173828125, 6.1494140625, 6.4110107421875, 6.672607421875, 6.9342041015625, 7.19580078125, 7.4573974609375, 7.718994140625, 7.9805908203125, 8.2421875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 8.0, 10.0, 23.0, 27.0, 32.0, 37.0, 48.0, 98.0, 116.0, 248.0, 431.0, 764.0, 860.0, 510.0, 277.0, 160.0, 107.0, 82.0, 54.0, 38.0, 31.0, 22.0, 18.0, 18.0, 14.0, 7.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.0137939453125, -8.715087890625, -8.4163818359375, -8.11767578125, -7.8189697265625, -7.520263671875, -7.2215576171875, -6.9228515625, -6.6241455078125, -6.325439453125, -6.0267333984375, -5.72802734375, -5.4293212890625, -5.130615234375, -4.8319091796875, -4.533203125, -4.2344970703125, -3.935791015625, -3.6370849609375, -3.33837890625, -3.0396728515625, -2.740966796875, -2.4422607421875, -2.1435546875, -1.8448486328125, -1.546142578125, -1.2474365234375, -0.94873046875, -0.6500244140625, -0.351318359375, -0.0526123046875, 0.24609375, 0.5447998046875, 0.843505859375, 1.1422119140625, 1.44091796875, 1.7396240234375, 2.038330078125, 2.3370361328125, 2.6357421875, 2.9344482421875, 3.233154296875, 3.5318603515625, 3.83056640625, 4.1292724609375, 4.427978515625, 4.7266845703125, 5.025390625, 5.3240966796875, 5.622802734375, 5.9215087890625, 6.22021484375, 6.5189208984375, 6.817626953125, 7.1163330078125, 7.4150390625, 7.7137451171875, 8.012451171875, 8.3111572265625, 8.60986328125, 8.9085693359375, 9.207275390625, 9.5059814453125, 9.8046875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 17.0, 17.0, 20.0, 28.0, 30.0, 55.0, 96.0, 168.0, 377.0, 1310.0, 7880.0, 105315.0, 3889382.0, 176450.0, 10601.0, 1636.0, 444.0, 179.0, 91.0, 48.0, 40.0, 31.0, 13.0, 12.0, 7.0, 8.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.41064453125, -30.4462890625, -29.48193359375, -28.517578125, -27.55322265625, -26.5888671875, -25.62451171875, -24.66015625, -23.69580078125, -22.7314453125, -21.76708984375, -20.802734375, -19.83837890625, -18.8740234375, -17.90966796875, -16.9453125, -15.98095703125, -15.0166015625, -14.05224609375, -13.087890625, -12.12353515625, -11.1591796875, -10.19482421875, -9.23046875, -8.26611328125, -7.3017578125, -6.33740234375, -5.373046875, -4.40869140625, -3.4443359375, -2.47998046875, -1.515625, -0.55126953125, 0.4130859375, 1.37744140625, 2.341796875, 3.30615234375, 4.2705078125, 5.23486328125, 6.19921875, 7.16357421875, 8.1279296875, 9.09228515625, 10.056640625, 11.02099609375, 11.9853515625, 12.94970703125, 13.9140625, 14.87841796875, 15.8427734375, 16.80712890625, 17.771484375, 18.73583984375, 19.7001953125, 20.66455078125, 21.62890625, 22.59326171875, 23.5576171875, 24.52197265625, 25.486328125, 26.45068359375, 27.4150390625, 28.37939453125, 29.34375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 25.0, 23.0, 22.0, 47.0, 81.0, 99.0, 131.0, 110.0, 113.0, 96.0, 83.0, 50.0, 39.0, 23.0, 18.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.63386917114258, -44.47373580932617, -43.31360626220703, -42.153472900390625, -40.99333953857422, -39.83320617675781, -38.67307662963867, -37.512943267822266, -36.352813720703125, -35.19268035888672, -34.03255081176758, -32.87241744995117, -31.712284088134766, -30.552152633666992, -29.39202117919922, -28.231887817382812, -27.071754455566406, -25.911623001098633, -24.751489639282227, -23.591358184814453, -22.431224822998047, -21.271093368530273, -20.1109619140625, -18.950828552246094, -17.79069709777832, -16.630565643310547, -15.47043228149414, -14.310300827026367, -13.150168418884277, -11.990036010742188, -10.829904556274414, -9.669772148132324, -8.509637832641602, -7.349505424499512, -6.18937349319458, -5.029241561889648, -3.8691091537475586, -2.7089767456054688, -1.548844814300537, -0.38871288299560547, 0.7714195251464844, 1.9315516948699951, 3.091683864593506, 4.2518157958984375, 5.411948204040527, 6.572080612182617, 7.732212543487549, 8.89234447479248, 10.05247688293457, 11.21260929107666, 12.37274169921875, 13.532873153686523, 14.693005561828613, 15.853137969970703, 17.013269424438477, 18.17340087890625, 19.333534240722656, 20.49366569519043, 21.653799057006836, 22.81393051147461, 23.974063873291016, 25.13419532775879, 26.294326782226562, 27.45446014404297, 28.614591598510742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 1.0, 5.0, 7.0, 10.0, 12.0, 14.0, 23.0, 36.0, 19.0, 37.0, 38.0, 26.0, 41.0, 45.0, 38.0, 47.0, 31.0, 38.0, 46.0, 50.0, 37.0, 37.0, 38.0, 34.0, 39.0, 40.0, 33.0, 36.0, 24.0, 24.0, 16.0, 13.0, 12.0, 12.0, 2.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.061450958251953, -25.286300659179688, -24.51114845275879, -23.735998153686523, -22.960847854614258, -22.18569564819336, -21.410545349121094, -20.635395050048828, -19.86024284362793, -19.085092544555664, -18.309940338134766, -17.5347900390625, -16.759639739990234, -15.984487533569336, -15.20933723449707, -14.434185981750488, -13.659035682678223, -12.88388442993164, -12.108734130859375, -11.333582878112793, -10.558431625366211, -9.783281326293945, -9.008130073547363, -8.232978820800781, -7.457828044891357, -6.682677268981934, -5.907526016235352, -5.132375240325928, -4.357224464416504, -3.582073211669922, -2.806922435760498, -2.031771183013916, -1.2566204071044922, -0.48146945238113403, 0.2936815023422241, 1.0688323974609375, 1.8439834117889404, 2.6191344261169434, 3.394285202026367, 4.169436454772949, 4.944587230682373, 5.719738006591797, 6.494889259338379, 7.270040035247803, 8.045190811157227, 8.820342063903809, 9.59549331665039, 10.370643615722656, 11.145794868469238, 11.92094612121582, 12.696096420288086, 13.471247673034668, 14.24639892578125, 15.021549224853516, 15.796700477600098, 16.57185173034668, 17.347002029418945, 18.12215232849121, 18.89730453491211, 19.672454833984375, 20.44760513305664, 21.22275733947754, 21.997907638549805, 22.773059844970703, 23.54821014404297]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 6.0, 10.0, 8.0, 12.0, 22.0, 19.0, 21.0, 37.0, 28.0, 35.0, 38.0, 25.0, 36.0, 50.0, 45.0, 44.0, 38.0, 40.0, 33.0, 50.0, 45.0, 43.0, 37.0, 40.0, 33.0, 24.0, 15.0, 17.0, 24.0, 16.0, 16.0, 17.0, 15.0, 6.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84423828125, -2.7490234375, -2.65380859375, -2.55859375, -2.46337890625, -2.3681640625, -2.27294921875, -2.177734375, -2.08251953125, -1.9873046875, -1.89208984375, -1.796875, -1.70166015625, -1.6064453125, -1.51123046875, -1.416015625, -1.32080078125, -1.2255859375, -1.13037109375, -1.03515625, -0.93994140625, -0.8447265625, -0.74951171875, -0.654296875, -0.55908203125, -0.4638671875, -0.36865234375, -0.2734375, -0.17822265625, -0.0830078125, 0.01220703125, 0.107421875, 0.20263671875, 0.2978515625, 0.39306640625, 0.48828125, 0.58349609375, 0.6787109375, 0.77392578125, 0.869140625, 0.96435546875, 1.0595703125, 1.15478515625, 1.25, 1.34521484375, 1.4404296875, 1.53564453125, 1.630859375, 1.72607421875, 1.8212890625, 1.91650390625, 2.01171875, 2.10693359375, 2.2021484375, 2.29736328125, 2.392578125, 2.48779296875, 2.5830078125, 2.67822265625, 2.7734375, 2.86865234375, 2.9638671875, 3.05908203125, 3.154296875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 19.0, 25.0, 32.0, 44.0, 67.0, 92.0, 122.0, 150.0, 219.0, 342.0, 444.0, 662.0, 944.0, 1367.0, 2170.0, 3344.0, 5537.0, 9727.0, 18761.0, 43822.0, 173242.0, 586396.0, 125218.0, 36108.0, 16694.0, 8657.0, 5020.0, 3009.0, 1966.0, 1342.0, 893.0, 626.0, 382.0, 315.0, 221.0, 158.0, 111.0, 85.0, 46.0, 42.0, 32.0, 27.0, 15.0, 16.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.296875, -5.1334228515625, -4.969970703125, -4.8065185546875, -4.64306640625, -4.4796142578125, -4.316162109375, -4.1527099609375, -3.9892578125, -3.8258056640625, -3.662353515625, -3.4989013671875, -3.33544921875, -3.1719970703125, -3.008544921875, -2.8450927734375, -2.681640625, -2.5181884765625, -2.354736328125, -2.1912841796875, -2.02783203125, -1.8643798828125, -1.700927734375, -1.5374755859375, -1.3740234375, -1.2105712890625, -1.047119140625, -0.8836669921875, -0.72021484375, -0.5567626953125, -0.393310546875, -0.2298583984375, -0.06640625, 0.0970458984375, 0.260498046875, 0.4239501953125, 0.58740234375, 0.7508544921875, 0.914306640625, 1.0777587890625, 1.2412109375, 1.4046630859375, 1.568115234375, 1.7315673828125, 1.89501953125, 2.0584716796875, 2.221923828125, 2.3853759765625, 2.548828125, 2.7122802734375, 2.875732421875, 3.0391845703125, 3.20263671875, 3.3660888671875, 3.529541015625, 3.6929931640625, 3.8564453125, 4.0198974609375, 4.183349609375, 4.3468017578125, 4.51025390625, 4.6737060546875, 4.837158203125, 5.0006103515625, 5.1640625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 22.0, 24.0, 18.0, 19.0, 31.0, 28.0, 26.0, 34.0, 37.0, 31.0, 38.0, 36.0, 34.0, 36.0, 1059.0, 39.0, 47.0, 34.0, 39.0, 34.0, 39.0, 35.0, 31.0, 41.0, 20.0, 16.0, 21.0, 14.0, 14.0, 14.0, 17.0, 7.0, 6.0, 4.0, 9.0, 3.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.423828125, -2.347747802734375, -2.27166748046875, -2.195587158203125, -2.1195068359375, -2.043426513671875, -1.96734619140625, -1.891265869140625, -1.815185546875, -1.739105224609375, -1.66302490234375, -1.586944580078125, -1.5108642578125, -1.434783935546875, -1.35870361328125, -1.282623291015625, -1.20654296875, -1.130462646484375, -1.05438232421875, -0.978302001953125, -0.9022216796875, -0.826141357421875, -0.75006103515625, -0.673980712890625, -0.597900390625, -0.521820068359375, -0.44573974609375, -0.369659423828125, -0.2935791015625, -0.217498779296875, -0.14141845703125, -0.065338134765625, 0.0107421875, 0.086822509765625, 0.16290283203125, 0.238983154296875, 0.3150634765625, 0.391143798828125, 0.46722412109375, 0.543304443359375, 0.619384765625, 0.695465087890625, 0.77154541015625, 0.847625732421875, 0.9237060546875, 0.999786376953125, 1.07586669921875, 1.151947021484375, 1.22802734375, 1.304107666015625, 1.38018798828125, 1.456268310546875, 1.5323486328125, 1.608428955078125, 1.68450927734375, 1.760589599609375, 1.836669921875, 1.912750244140625, 1.98883056640625, 2.064910888671875, 2.1409912109375, 2.217071533203125, 2.29315185546875, 2.369232177734375, 2.4453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 10.0, 13.0, 28.0, 42.0, 55.0, 86.0, 131.0, 190.0, 288.0, 466.0, 678.0, 1234.0, 2022.0, 3582.0, 6827.0, 14110.0, 36540.0, 194763.0, 1674104.0, 109512.0, 27206.0, 11628.0, 5765.0, 3125.0, 1840.0, 1099.0, 617.0, 394.0, 273.0, 155.0, 125.0, 79.0, 48.0, 37.0, 20.0, 17.0, 5.0, 9.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.2830810546875, -5.109130859375, -4.9351806640625, -4.76123046875, -4.5872802734375, -4.413330078125, -4.2393798828125, -4.0654296875, -3.8914794921875, -3.717529296875, -3.5435791015625, -3.36962890625, -3.1956787109375, -3.021728515625, -2.8477783203125, -2.673828125, -2.4998779296875, -2.325927734375, -2.1519775390625, -1.97802734375, -1.8040771484375, -1.630126953125, -1.4561767578125, -1.2822265625, -1.1082763671875, -0.934326171875, -0.7603759765625, -0.58642578125, -0.4124755859375, -0.238525390625, -0.0645751953125, 0.109375, 0.2833251953125, 0.457275390625, 0.6312255859375, 0.80517578125, 0.9791259765625, 1.153076171875, 1.3270263671875, 1.5009765625, 1.6749267578125, 1.848876953125, 2.0228271484375, 2.19677734375, 2.3707275390625, 2.544677734375, 2.7186279296875, 2.892578125, 3.0665283203125, 3.240478515625, 3.4144287109375, 3.58837890625, 3.7623291015625, 3.936279296875, 4.1102294921875, 4.2841796875, 4.4581298828125, 4.632080078125, 4.8060302734375, 4.97998046875, 5.1539306640625, 5.327880859375, 5.5018310546875, 5.67578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 28.0, 33.0, 134.0, 342.0, 238.0, 93.0, 31.0, 17.0, 20.0, 9.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9052734375, -1.8489837646484375, -1.792694091796875, -1.7364044189453125, -1.68011474609375, -1.6238250732421875, -1.567535400390625, -1.5112457275390625, -1.4549560546875, -1.3986663818359375, -1.342376708984375, -1.2860870361328125, -1.22979736328125, -1.1735076904296875, -1.117218017578125, -1.0609283447265625, -1.004638671875, -0.9483489990234375, -0.892059326171875, -0.8357696533203125, -0.77947998046875, -0.7231903076171875, -0.666900634765625, -0.6106109619140625, -0.5543212890625, -0.4980316162109375, -0.441741943359375, -0.3854522705078125, -0.32916259765625, -0.2728729248046875, -0.216583251953125, -0.1602935791015625, -0.10400390625, -0.0477142333984375, 0.008575439453125, 0.0648651123046875, 0.12115478515625, 0.1774444580078125, 0.233734130859375, 0.2900238037109375, 0.3463134765625, 0.4026031494140625, 0.458892822265625, 0.5151824951171875, 0.57147216796875, 0.6277618408203125, 0.684051513671875, 0.7403411865234375, 0.796630859375, 0.8529205322265625, 0.909210205078125, 0.9654998779296875, 1.02178955078125, 1.0780792236328125, 1.134368896484375, 1.1906585693359375, 1.2469482421875, 1.3032379150390625, 1.359527587890625, 1.4158172607421875, 1.47210693359375, 1.5283966064453125, 1.584686279296875, 1.6409759521484375, 1.697265625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 5.0, 9.0, 15.0, 37.0, 65.0, 231.0, 1412.0, 41236.0, 1002252.0, 2701.0, 411.0, 77.0, 30.0, 23.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.9375, -31.84521484375, -30.7529296875, -29.66064453125, -28.568359375, -27.47607421875, -26.3837890625, -25.29150390625, -24.19921875, -23.10693359375, -22.0146484375, -20.92236328125, -19.830078125, -18.73779296875, -17.6455078125, -16.55322265625, -15.4609375, -14.36865234375, -13.2763671875, -12.18408203125, -11.091796875, -9.99951171875, -8.9072265625, -7.81494140625, -6.72265625, -5.63037109375, -4.5380859375, -3.44580078125, -2.353515625, -1.26123046875, -0.1689453125, 0.92333984375, 2.015625, 3.10791015625, 4.2001953125, 5.29248046875, 6.384765625, 7.47705078125, 8.5693359375, 9.66162109375, 10.75390625, 11.84619140625, 12.9384765625, 14.03076171875, 15.123046875, 16.21533203125, 17.3076171875, 18.39990234375, 19.4921875, 20.58447265625, 21.6767578125, 22.76904296875, 23.861328125, 24.95361328125, 26.0458984375, 27.13818359375, 28.23046875, 29.32275390625, 30.4150390625, 31.50732421875, 32.599609375, 33.69189453125, 34.7841796875, 35.87646484375, 36.96875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 31.0, 153.0, 664.0, 141.0, 19.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.514542579650879, -1.239621877670288, -0.9647012948989868, -0.6897806525230408, -0.4148600101470947, -0.1399393081665039, 0.13498127460479736, 0.40990185737609863, 0.6848225593566895, 0.9597432017326355, 1.2346638441085815, 1.5095844268798828, 1.7845051288604736, 2.0594258308410645, 2.334346294403076, 2.609266996383667, 2.884187698364258, 3.1591084003448486, 3.4340291023254395, 3.708949565887451, 3.983870267868042, 4.258790969848633, 4.5337114334106445, 4.808631896972656, 5.083552837371826, 5.358473300933838, 5.633394241333008, 5.9083147048950195, 6.183235168457031, 6.458156108856201, 6.733076572418213, 7.007997512817383, 7.282918930053711, 7.557839393615723, 7.832760334014893, 8.107681274414062, 8.382601737976074, 8.657522201538086, 8.932442665100098, 9.20736312866211, 9.482284545898438, 9.75720500946045, 10.032125473022461, 10.307046890258789, 10.5819673538208, 10.856887817382812, 11.131808280944824, 11.406728744506836, 11.681649208068848, 11.95656967163086, 12.231490135192871, 12.5064115524292, 12.781332015991211, 13.056252479553223, 13.331172943115234, 13.606093406677246, 13.881013870239258, 14.15593433380127, 14.430854797363281, 14.70577621459961, 14.980696678161621, 15.255617141723633, 15.530537605285645, 15.805458068847656, 16.080379486083984]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 12.0, 13.0, 19.0, 11.0, 23.0, 24.0, 35.0, 21.0, 25.0, 31.0, 43.0, 32.0, 38.0, 41.0, 36.0, 48.0, 39.0, 41.0, 40.0, 41.0, 30.0, 33.0, 33.0, 32.0, 28.0, 28.0, 31.0, 12.0, 19.0, 20.0, 14.0, 14.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9238834381103516, -0.8947098255157471, -0.8655362129211426, -0.8363626003265381, -0.8071890473365784, -0.7780154347419739, -0.7488418221473694, -0.7196682095527649, -0.6904945969581604, -0.6613209843635559, -0.6321473717689514, -0.6029738187789917, -0.5738002061843872, -0.5446265935897827, -0.5154529809951782, -0.48627936840057373, -0.4571057856082916, -0.42793217301368713, -0.39875859022140503, -0.36958497762680054, -0.34041136503219604, -0.31123775243759155, -0.28206416964530945, -0.25289055705070496, -0.22371695935726166, -0.19454336166381836, -0.16536974906921387, -0.13619615137577057, -0.10702254623174667, -0.07784894108772278, -0.04867534339427948, -0.019501730799674988, 0.00967186689376831, 0.038845472037792206, 0.0680190771818161, 0.0971926748752594, 0.1263662874698639, 0.1555398851633072, 0.1847134828567505, 0.21388709545135498, 0.24306069314479828, 0.2722342908382416, 0.30140790343284607, 0.3305814862251282, 0.35975509881973267, 0.38892871141433716, 0.41810232400894165, 0.44727593660354614, 0.47644951939582825, 0.5056231021881104, 0.5347967147827148, 0.5639703273773193, 0.5931439399719238, 0.6223175525665283, 0.6514911651611328, 0.6806647777557373, 0.709838330745697, 0.7390119433403015, 0.768185555934906, 0.7973591089248657, 0.8265327215194702, 0.8557063341140747, 0.8848799467086792, 0.9140535593032837, 0.9432271718978882]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 10.0, 8.0, 11.0, 14.0, 14.0, 24.0, 24.0, 29.0, 26.0, 20.0, 29.0, 46.0, 42.0, 44.0, 35.0, 47.0, 40.0, 33.0, 38.0, 34.0, 41.0, 51.0, 43.0, 39.0, 33.0, 28.0, 18.0, 17.0, 24.0, 23.0, 11.0, 12.0, 12.0, 9.0, 6.0, 14.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.744140625, -2.653533935546875, -2.56292724609375, -2.472320556640625, -2.3817138671875, -2.291107177734375, -2.20050048828125, -2.109893798828125, -2.019287109375, -1.928680419921875, -1.83807373046875, -1.747467041015625, -1.6568603515625, -1.566253662109375, -1.47564697265625, -1.385040283203125, -1.29443359375, -1.203826904296875, -1.11322021484375, -1.022613525390625, -0.9320068359375, -0.841400146484375, -0.75079345703125, -0.660186767578125, -0.569580078125, -0.478973388671875, -0.38836669921875, -0.297760009765625, -0.2071533203125, -0.116546630859375, -0.02593994140625, 0.064666748046875, 0.1552734375, 0.245880126953125, 0.33648681640625, 0.427093505859375, 0.5177001953125, 0.608306884765625, 0.69891357421875, 0.789520263671875, 0.880126953125, 0.970733642578125, 1.06134033203125, 1.151947021484375, 1.2425537109375, 1.333160400390625, 1.42376708984375, 1.514373779296875, 1.60498046875, 1.695587158203125, 1.78619384765625, 1.876800537109375, 1.9674072265625, 2.058013916015625, 2.14862060546875, 2.239227294921875, 2.329833984375, 2.420440673828125, 2.51104736328125, 2.601654052734375, 2.6922607421875, 2.782867431640625, 2.87347412109375, 2.964080810546875, 3.0546875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 21.0, 34.0, 46.0, 55.0, 97.0, 119.0, 145.0, 231.0, 329.0, 377.0, 538.0, 872.0, 1154.0, 1658.0, 2546.0, 4133.0, 7588.0, 16394.0, 46752.0, 185822.0, 553396.0, 152198.0, 40565.0, 14680.0, 7019.0, 3844.0, 2514.0, 1601.0, 1115.0, 759.0, 550.0, 365.0, 295.0, 194.0, 171.0, 108.0, 68.0, 59.0, 44.0, 33.0, 10.0, 18.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.90679931640625, -3.7784423828125, -3.65008544921875, -3.521728515625, -3.39337158203125, -3.2650146484375, -3.13665771484375, -3.00830078125, -2.87994384765625, -2.7515869140625, -2.62322998046875, -2.494873046875, -2.36651611328125, -2.2381591796875, -2.10980224609375, -1.9814453125, -1.85308837890625, -1.7247314453125, -1.59637451171875, -1.468017578125, -1.33966064453125, -1.2113037109375, -1.08294677734375, -0.95458984375, -0.82623291015625, -0.6978759765625, -0.56951904296875, -0.441162109375, -0.31280517578125, -0.1844482421875, -0.05609130859375, 0.072265625, 0.20062255859375, 0.3289794921875, 0.45733642578125, 0.585693359375, 0.71405029296875, 0.8424072265625, 0.97076416015625, 1.09912109375, 1.22747802734375, 1.3558349609375, 1.48419189453125, 1.612548828125, 1.74090576171875, 1.8692626953125, 1.99761962890625, 2.1259765625, 2.25433349609375, 2.3826904296875, 2.51104736328125, 2.639404296875, 2.76776123046875, 2.8961181640625, 3.02447509765625, 3.15283203125, 3.28118896484375, 3.4095458984375, 3.53790283203125, 3.666259765625, 3.79461669921875, 3.9229736328125, 4.05133056640625, 4.1796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 14.0, 11.0, 18.0, 19.0, 20.0, 17.0, 21.0, 25.0, 28.0, 42.0, 36.0, 44.0, 54.0, 71.0, 86.0, 188.0, 1519.0, 252.0, 113.0, 74.0, 43.0, 40.0, 36.0, 42.0, 33.0, 26.0, 17.0, 28.0, 15.0, 18.0, 18.0, 17.0, 9.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3260498046875, -9.011474609375, -8.6968994140625, -8.38232421875, -8.0677490234375, -7.753173828125, -7.4385986328125, -7.1240234375, -6.8094482421875, -6.494873046875, -6.1802978515625, -5.86572265625, -5.5511474609375, -5.236572265625, -4.9219970703125, -4.607421875, -4.2928466796875, -3.978271484375, -3.6636962890625, -3.34912109375, -3.0345458984375, -2.719970703125, -2.4053955078125, -2.0908203125, -1.7762451171875, -1.461669921875, -1.1470947265625, -0.83251953125, -0.5179443359375, -0.203369140625, 0.1112060546875, 0.42578125, 0.7403564453125, 1.054931640625, 1.3695068359375, 1.68408203125, 1.9986572265625, 2.313232421875, 2.6278076171875, 2.9423828125, 3.2569580078125, 3.571533203125, 3.8861083984375, 4.20068359375, 4.5152587890625, 4.829833984375, 5.1444091796875, 5.458984375, 5.7735595703125, 6.088134765625, 6.4027099609375, 6.71728515625, 7.0318603515625, 7.346435546875, 7.6610107421875, 7.9755859375, 8.2901611328125, 8.604736328125, 8.9193115234375, 9.23388671875, 9.5484619140625, 9.863037109375, 10.1776123046875, 10.4921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 5.0, 1.0, 4.0, 16.0, 15.0, 13.0, 21.0, 24.0, 33.0, 51.0, 59.0, 98.0, 140.0, 264.0, 452.0, 1064.0, 3451.0, 19201.0, 2195394.0, 904992.0, 15230.0, 3020.0, 996.0, 448.0, 257.0, 128.0, 84.0, 53.0, 41.0, 24.0, 32.0, 20.0, 18.0, 11.0, 11.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.862548828125, -21.17822265625, -20.493896484375, -19.8095703125, -19.125244140625, -18.44091796875, -17.756591796875, -17.072265625, -16.387939453125, -15.70361328125, -15.019287109375, -14.3349609375, -13.650634765625, -12.96630859375, -12.281982421875, -11.59765625, -10.913330078125, -10.22900390625, -9.544677734375, -8.8603515625, -8.176025390625, -7.49169921875, -6.807373046875, -6.123046875, -5.438720703125, -4.75439453125, -4.070068359375, -3.3857421875, -2.701416015625, -2.01708984375, -1.332763671875, -0.6484375, 0.035888671875, 0.72021484375, 1.404541015625, 2.0888671875, 2.773193359375, 3.45751953125, 4.141845703125, 4.826171875, 5.510498046875, 6.19482421875, 6.879150390625, 7.5634765625, 8.247802734375, 8.93212890625, 9.616455078125, 10.30078125, 10.985107421875, 11.66943359375, 12.353759765625, 13.0380859375, 13.722412109375, 14.40673828125, 15.091064453125, 15.775390625, 16.459716796875, 17.14404296875, 17.828369140625, 18.5126953125, 19.197021484375, 19.88134765625, 20.565673828125, 21.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 18.0, 144.0, 530.0, 269.0, 47.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.36990737915039, -17.147403717041016, -14.924901962280273, -12.702398300170898, -10.47989559173584, -8.257392883300781, -6.034889221191406, -3.8123865127563477, -1.589883804321289, 0.6326191425323486, 2.8551220893859863, 5.077625274658203, 7.300127983093262, 9.52263069152832, 11.745134353637695, 13.967637062072754, 16.190139770507812, 18.412643432617188, 20.63514518737793, 22.857648849487305, 25.080150604248047, 27.302654266357422, 29.525157928466797, 31.747661590576172, 33.97016143798828, 36.192665100097656, 38.41516876220703, 40.637672424316406, 42.860172271728516, 45.08267593383789, 47.305179595947266, 49.52768325805664, 51.75018310546875, 53.972686767578125, 56.1951904296875, 58.417694091796875, 60.640193939208984, 62.86269760131836, 65.085205078125, 67.30770111083984, 69.53020477294922, 71.7527084350586, 73.97521209716797, 76.19771575927734, 78.42021942138672, 80.64271545410156, 82.86521911621094, 85.08772277832031, 87.31022644042969, 89.53273010253906, 91.75523376464844, 93.97773742675781, 96.20024108886719, 98.42274475097656, 100.64524841308594, 102.86774444580078, 105.09025573730469, 107.31275939941406, 109.53526306152344, 111.75776672363281, 113.98027038574219, 116.20277404785156, 118.42527770996094, 120.64777374267578, 122.87027740478516]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 20.0, 17.0, 36.0, 32.0, 45.0, 33.0, 41.0, 43.0, 46.0, 43.0, 32.0, 35.0, 31.0, 46.0, 34.0, 42.0, 30.0, 40.0, 31.0, 29.0, 24.0, 21.0, 22.0, 18.0, 16.0, 20.0, 6.0, 8.0, 3.0, 7.0, 8.0, 10.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.262863159179688, -22.507118225097656, -21.751375198364258, -20.995630264282227, -20.239887237548828, -19.484142303466797, -18.728397369384766, -17.972652435302734, -17.216909408569336, -16.461164474487305, -15.705421447753906, -14.949676513671875, -14.19393253326416, -13.438188552856445, -12.682443618774414, -11.9266996383667, -11.170955657958984, -10.41521167755127, -9.659467697143555, -8.903722763061523, -8.147978782653809, -7.392234802246094, -6.636490345001221, -5.880745887756348, -5.125001907348633, -4.369257926940918, -3.613513469696045, -2.857769250869751, -2.102025032043457, -1.346280813217163, -0.5905365943908691, 0.1652078628540039, 0.9209537506103516, 1.6766979694366455, 2.4324421882629395, 3.1881864070892334, 3.9439306259155273, 4.699674606323242, 5.455419063568115, 6.211163520812988, 6.966907501220703, 7.722651481628418, 8.478395462036133, 9.234140396118164, 9.989884376525879, 10.745628356933594, 11.501373291015625, 12.25711727142334, 13.012861251831055, 13.76860523223877, 14.524349212646484, 15.280094146728516, 16.035839080810547, 16.791582107543945, 17.547327041625977, 18.303070068359375, 19.058815002441406, 19.814559936523438, 20.570302963256836, 21.326047897338867, 22.081790924072266, 22.837535858154297, 23.593280792236328, 24.34902572631836, 25.104768753051758]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 9.0, 8.0, 9.0, 15.0, 20.0, 30.0, 30.0, 18.0, 27.0, 41.0, 49.0, 49.0, 41.0, 36.0, 49.0, 37.0, 55.0, 49.0, 54.0, 39.0, 39.0, 38.0, 24.0, 35.0, 34.0, 21.0, 16.0, 29.0, 16.0, 16.0, 6.0, 13.0, 4.0, 5.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.56536865234375, -3.4569091796875, -3.34844970703125, -3.239990234375, -3.13153076171875, -3.0230712890625, -2.91461181640625, -2.80615234375, -2.69769287109375, -2.5892333984375, -2.48077392578125, -2.372314453125, -2.26385498046875, -2.1553955078125, -2.04693603515625, -1.9384765625, -1.83001708984375, -1.7215576171875, -1.61309814453125, -1.504638671875, -1.39617919921875, -1.2877197265625, -1.17926025390625, -1.07080078125, -0.96234130859375, -0.8538818359375, -0.74542236328125, -0.636962890625, -0.52850341796875, -0.4200439453125, -0.31158447265625, -0.203125, -0.09466552734375, 0.0137939453125, 0.12225341796875, 0.230712890625, 0.33917236328125, 0.4476318359375, 0.55609130859375, 0.66455078125, 0.77301025390625, 0.8814697265625, 0.98992919921875, 1.098388671875, 1.20684814453125, 1.3153076171875, 1.42376708984375, 1.5322265625, 1.64068603515625, 1.7491455078125, 1.85760498046875, 1.966064453125, 2.07452392578125, 2.1829833984375, 2.29144287109375, 2.39990234375, 2.50836181640625, 2.6168212890625, 2.72528076171875, 2.833740234375, 2.94219970703125, 3.0506591796875, 3.15911865234375, 3.267578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 5.0, 12.0, 14.0, 17.0, 24.0, 63.0, 60.0, 85.0, 135.0, 167.0, 301.0, 378.0, 576.0, 896.0, 1258.0, 1973.0, 3147.0, 4918.0, 8280.0, 14262.0, 27191.0, 58618.0, 190281.0, 1178063.0, 2135071.0, 395863.0, 89187.0, 36980.0, 18682.0, 10697.0, 6093.0, 3855.0, 2438.0, 1602.0, 1006.0, 699.0, 436.0, 323.0, 187.0, 131.0, 103.0, 61.0, 50.0, 28.0, 17.0, 12.0, 15.0, 5.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.21875, -6.02569580078125, -5.8326416015625, -5.63958740234375, -5.446533203125, -5.25347900390625, -5.0604248046875, -4.86737060546875, -4.67431640625, -4.48126220703125, -4.2882080078125, -4.09515380859375, -3.902099609375, -3.70904541015625, -3.5159912109375, -3.32293701171875, -3.1298828125, -2.93682861328125, -2.7437744140625, -2.55072021484375, -2.357666015625, -2.16461181640625, -1.9715576171875, -1.77850341796875, -1.58544921875, -1.39239501953125, -1.1993408203125, -1.00628662109375, -0.813232421875, -0.62017822265625, -0.4271240234375, -0.23406982421875, -0.041015625, 0.15203857421875, 0.3450927734375, 0.53814697265625, 0.731201171875, 0.92425537109375, 1.1173095703125, 1.31036376953125, 1.50341796875, 1.69647216796875, 1.8895263671875, 2.08258056640625, 2.275634765625, 2.46868896484375, 2.6617431640625, 2.85479736328125, 3.0478515625, 3.24090576171875, 3.4339599609375, 3.62701416015625, 3.820068359375, 4.01312255859375, 4.2061767578125, 4.39923095703125, 4.59228515625, 4.78533935546875, 4.9783935546875, 5.17144775390625, 5.364501953125, 5.55755615234375, 5.7506103515625, 5.94366455078125, 6.13671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 1.0, 8.0, 7.0, 5.0, 8.0, 11.0, 13.0, 12.0, 31.0, 22.0, 37.0, 43.0, 47.0, 50.0, 58.0, 67.0, 97.0, 135.0, 215.0, 341.0, 470.0, 619.0, 471.0, 355.0, 237.0, 178.0, 116.0, 84.0, 63.0, 56.0, 32.0, 40.0, 23.0, 19.0, 16.0, 17.0, 13.0, 13.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-6.87109375, -6.67791748046875, -6.4847412109375, -6.29156494140625, -6.098388671875, -5.90521240234375, -5.7120361328125, -5.51885986328125, -5.32568359375, -5.13250732421875, -4.9393310546875, -4.74615478515625, -4.552978515625, -4.35980224609375, -4.1666259765625, -3.97344970703125, -3.7802734375, -3.58709716796875, -3.3939208984375, -3.20074462890625, -3.007568359375, -2.81439208984375, -2.6212158203125, -2.42803955078125, -2.23486328125, -2.04168701171875, -1.8485107421875, -1.65533447265625, -1.462158203125, -1.26898193359375, -1.0758056640625, -0.88262939453125, -0.689453125, -0.49627685546875, -0.3031005859375, -0.10992431640625, 0.083251953125, 0.27642822265625, 0.4696044921875, 0.66278076171875, 0.85595703125, 1.04913330078125, 1.2423095703125, 1.43548583984375, 1.628662109375, 1.82183837890625, 2.0150146484375, 2.20819091796875, 2.4013671875, 2.59454345703125, 2.7877197265625, 2.98089599609375, 3.174072265625, 3.36724853515625, 3.5604248046875, 3.75360107421875, 3.94677734375, 4.13995361328125, 4.3331298828125, 4.52630615234375, 4.719482421875, 4.91265869140625, 5.1058349609375, 5.29901123046875, 5.4921875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 20.0, 10.0, 22.0, 26.0, 38.0, 46.0, 68.0, 75.0, 134.0, 230.0, 643.0, 3621.0, 34842.0, 1746019.0, 2363851.0, 39242.0, 3875.0, 701.0, 237.0, 115.0, 57.0, 55.0, 48.0, 54.0, 39.0, 33.0, 24.0, 25.0, 8.0, 12.0, 7.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.485595703125, -23.61181640625, -22.738037109375, -21.8642578125, -20.990478515625, -20.11669921875, -19.242919921875, -18.369140625, -17.495361328125, -16.62158203125, -15.747802734375, -14.8740234375, -14.000244140625, -13.12646484375, -12.252685546875, -11.37890625, -10.505126953125, -9.63134765625, -8.757568359375, -7.8837890625, -7.010009765625, -6.13623046875, -5.262451171875, -4.388671875, -3.514892578125, -2.64111328125, -1.767333984375, -0.8935546875, -0.019775390625, 0.85400390625, 1.727783203125, 2.6015625, 3.475341796875, 4.34912109375, 5.222900390625, 6.0966796875, 6.970458984375, 7.84423828125, 8.718017578125, 9.591796875, 10.465576171875, 11.33935546875, 12.213134765625, 13.0869140625, 13.960693359375, 14.83447265625, 15.708251953125, 16.58203125, 17.455810546875, 18.32958984375, 19.203369140625, 20.0771484375, 20.950927734375, 21.82470703125, 22.698486328125, 23.572265625, 24.446044921875, 25.31982421875, 26.193603515625, 27.0673828125, 27.941162109375, 28.81494140625, 29.688720703125, 30.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 7.0, 19.0, 62.0, 177.0, 303.0, 284.0, 115.0, 35.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.066129684448242, -24.87198829650879, -21.677846908569336, -18.48370361328125, -15.289563179016113, -12.09542179107666, -8.90127944946289, -5.7071380615234375, -2.5129966735839844, 0.6811449527740479, 3.87528657913208, 7.069428443908691, 10.263569831848145, 13.457711219787598, 16.651853561401367, 19.84599494934082, 23.040136337280273, 26.234277725219727, 29.42841911315918, 32.622562408447266, 35.81670379638672, 39.01084518432617, 42.204986572265625, 45.39912796020508, 48.59326934814453, 51.787410736083984, 54.98155212402344, 58.17569351196289, 61.369834899902344, 64.56398010253906, 67.75811767578125, 70.95226287841797, 74.14640045166016, 77.34054565429688, 80.53468322753906, 83.72882843017578, 86.92296600341797, 90.11711120605469, 93.31124877929688, 96.5053939819336, 99.69953155517578, 102.8936767578125, 106.08781433105469, 109.2819595336914, 112.4760971069336, 115.67024230957031, 118.8643798828125, 122.05852508544922, 125.25267028808594, 128.44680786132812, 131.64096069335938, 134.83509826660156, 138.02923583984375, 141.22337341308594, 144.4175262451172, 147.61166381835938, 150.80580139160156, 153.99993896484375, 157.194091796875, 160.3882293701172, 163.58236694335938, 166.77650451660156, 169.9706573486328, 173.164794921875, 176.3589324951172]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 11.0, 9.0, 12.0, 13.0, 14.0, 11.0, 15.0, 17.0, 20.0, 20.0, 23.0, 27.0, 26.0, 31.0, 43.0, 41.0, 34.0, 36.0, 48.0, 41.0, 45.0, 36.0, 42.0, 41.0, 35.0, 46.0, 34.0, 35.0, 20.0, 28.0, 27.0, 20.0, 19.0, 13.0, 15.0, 13.0, 5.0, 7.0, 16.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.957801818847656, -24.247831344604492, -23.537860870361328, -22.827890396118164, -22.117919921875, -21.407947540283203, -20.69797706604004, -19.988006591796875, -19.27803611755371, -18.568065643310547, -17.858095169067383, -17.14812469482422, -16.438152313232422, -15.728182792663574, -15.018211364746094, -14.30824089050293, -13.598270416259766, -12.888299942016602, -12.178329467773438, -11.468358039855957, -10.758387565612793, -10.048417091369629, -9.338445663452148, -8.628475189208984, -7.91850471496582, -7.208534240722656, -6.498563289642334, -5.788592338562012, -5.078621864318848, -4.368651390075684, -3.6586804389953613, -2.948709487915039, -2.238740921020508, -1.5287702083587646, -0.8187994956970215, -0.10882878303527832, 0.6011419296264648, 1.311112642288208, 2.021083354949951, 2.7310543060302734, 3.4410247802734375, 4.150995254516602, 4.860966205596924, 5.570937156677246, 6.28090763092041, 6.990878105163574, 7.7008490562438965, 8.410820007324219, 9.120790481567383, 9.830760955810547, 10.540731430053711, 11.250702857971191, 11.960673332214355, 12.67064380645752, 13.380615234375, 14.090585708618164, 14.800556182861328, 15.510526657104492, 16.220497131347656, 16.93046760559082, 17.640438079833984, 18.35041046142578, 19.060380935668945, 19.77035140991211, 20.480321884155273]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 13.0, 27.0, 14.0, 14.0, 12.0, 23.0, 21.0, 22.0, 26.0, 40.0, 33.0, 34.0, 42.0, 37.0, 30.0, 46.0, 44.0, 41.0, 41.0, 40.0, 41.0, 42.0, 33.0, 29.0, 30.0, 23.0, 30.0, 25.0, 22.0, 18.0, 16.0, 9.0, 6.0, 8.0, 10.0, 14.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.693359375, -2.60345458984375, -2.5135498046875, -2.42364501953125, -2.333740234375, -2.24383544921875, -2.1539306640625, -2.06402587890625, -1.97412109375, -1.88421630859375, -1.7943115234375, -1.70440673828125, -1.614501953125, -1.52459716796875, -1.4346923828125, -1.34478759765625, -1.2548828125, -1.16497802734375, -1.0750732421875, -0.98516845703125, -0.895263671875, -0.80535888671875, -0.7154541015625, -0.62554931640625, -0.53564453125, -0.44573974609375, -0.3558349609375, -0.26593017578125, -0.176025390625, -0.08612060546875, 0.0037841796875, 0.09368896484375, 0.18359375, 0.27349853515625, 0.3634033203125, 0.45330810546875, 0.543212890625, 0.63311767578125, 0.7230224609375, 0.81292724609375, 0.90283203125, 0.99273681640625, 1.0826416015625, 1.17254638671875, 1.262451171875, 1.35235595703125, 1.4422607421875, 1.53216552734375, 1.6220703125, 1.71197509765625, 1.8018798828125, 1.89178466796875, 1.981689453125, 2.07159423828125, 2.1614990234375, 2.25140380859375, 2.34130859375, 2.43121337890625, 2.5211181640625, 2.61102294921875, 2.700927734375, 2.79083251953125, 2.8807373046875, 2.97064208984375, 3.060546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 7.0, 16.0, 16.0, 29.0, 35.0, 49.0, 69.0, 84.0, 94.0, 148.0, 224.0, 277.0, 402.0, 473.0, 677.0, 920.0, 1292.0, 1865.0, 2634.0, 3950.0, 5825.0, 9487.0, 16601.0, 37772.0, 154652.0, 583999.0, 146131.0, 36349.0, 16044.0, 9245.0, 5997.0, 3892.0, 2644.0, 1860.0, 1322.0, 929.0, 632.0, 493.0, 388.0, 282.0, 198.0, 146.0, 100.0, 83.0, 54.0, 45.0, 34.0, 26.0, 19.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.28515625, -4.1490478515625, -4.012939453125, -3.8768310546875, -3.74072265625, -3.6046142578125, -3.468505859375, -3.3323974609375, -3.1962890625, -3.0601806640625, -2.924072265625, -2.7879638671875, -2.65185546875, -2.5157470703125, -2.379638671875, -2.2435302734375, -2.107421875, -1.9713134765625, -1.835205078125, -1.6990966796875, -1.56298828125, -1.4268798828125, -1.290771484375, -1.1546630859375, -1.0185546875, -0.8824462890625, -0.746337890625, -0.6102294921875, -0.47412109375, -0.3380126953125, -0.201904296875, -0.0657958984375, 0.0703125, 0.2064208984375, 0.342529296875, 0.4786376953125, 0.61474609375, 0.7508544921875, 0.886962890625, 1.0230712890625, 1.1591796875, 1.2952880859375, 1.431396484375, 1.5675048828125, 1.70361328125, 1.8397216796875, 1.975830078125, 2.1119384765625, 2.248046875, 2.3841552734375, 2.520263671875, 2.6563720703125, 2.79248046875, 2.9285888671875, 3.064697265625, 3.2008056640625, 3.3369140625, 3.4730224609375, 3.609130859375, 3.7452392578125, 3.88134765625, 4.0174560546875, 4.153564453125, 4.2896728515625, 4.42578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 8.0, 12.0, 5.0, 5.0, 15.0, 14.0, 19.0, 17.0, 24.0, 27.0, 16.0, 19.0, 33.0, 39.0, 34.0, 46.0, 41.0, 35.0, 43.0, 53.0, 1056.0, 48.0, 26.0, 38.0, 30.0, 30.0, 34.0, 27.0, 36.0, 20.0, 22.0, 24.0, 24.0, 10.0, 16.0, 19.0, 12.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.994659423828125, -1.92291259765625, -1.851165771484375, -1.7794189453125, -1.707672119140625, -1.63592529296875, -1.564178466796875, -1.492431640625, -1.420684814453125, -1.34893798828125, -1.277191162109375, -1.2054443359375, -1.133697509765625, -1.06195068359375, -0.990203857421875, -0.91845703125, -0.846710205078125, -0.77496337890625, -0.703216552734375, -0.6314697265625, -0.559722900390625, -0.48797607421875, -0.416229248046875, -0.344482421875, -0.272735595703125, -0.20098876953125, -0.129241943359375, -0.0574951171875, 0.014251708984375, 0.08599853515625, 0.157745361328125, 0.2294921875, 0.301239013671875, 0.37298583984375, 0.444732666015625, 0.5164794921875, 0.588226318359375, 0.65997314453125, 0.731719970703125, 0.803466796875, 0.875213623046875, 0.94696044921875, 1.018707275390625, 1.0904541015625, 1.162200927734375, 1.23394775390625, 1.305694580078125, 1.37744140625, 1.449188232421875, 1.52093505859375, 1.592681884765625, 1.6644287109375, 1.736175537109375, 1.80792236328125, 1.879669189453125, 1.951416015625, 2.023162841796875, 2.09490966796875, 2.166656494140625, 2.2384033203125, 2.310150146484375, 2.38189697265625, 2.453643798828125, 2.525390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 16.0, 11.0, 33.0, 48.0, 53.0, 93.0, 132.0, 176.0, 299.0, 468.0, 711.0, 1036.0, 1813.0, 3119.0, 5679.0, 11993.0, 30723.0, 148886.0, 1647846.0, 182442.0, 34334.0, 12759.0, 5995.0, 3323.0, 1860.0, 1154.0, 713.0, 430.0, 306.0, 200.0, 133.0, 83.0, 66.0, 47.0, 32.0, 27.0, 16.0, 16.0, 11.0, 1.0, 0.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.912109375, -3.784027099609375, -3.65594482421875, -3.527862548828125, -3.3997802734375, -3.271697998046875, -3.14361572265625, -3.015533447265625, -2.887451171875, -2.759368896484375, -2.63128662109375, -2.503204345703125, -2.3751220703125, -2.247039794921875, -2.11895751953125, -1.990875244140625, -1.86279296875, -1.734710693359375, -1.60662841796875, -1.478546142578125, -1.3504638671875, -1.222381591796875, -1.09429931640625, -0.966217041015625, -0.838134765625, -0.710052490234375, -0.58197021484375, -0.453887939453125, -0.3258056640625, -0.197723388671875, -0.06964111328125, 0.058441162109375, 0.1865234375, 0.314605712890625, 0.44268798828125, 0.570770263671875, 0.6988525390625, 0.826934814453125, 0.95501708984375, 1.083099365234375, 1.211181640625, 1.339263916015625, 1.46734619140625, 1.595428466796875, 1.7235107421875, 1.851593017578125, 1.97967529296875, 2.107757568359375, 2.23583984375, 2.363922119140625, 2.49200439453125, 2.620086669921875, 2.7481689453125, 2.876251220703125, 3.00433349609375, 3.132415771484375, 3.260498046875, 3.388580322265625, 3.51666259765625, 3.644744873046875, 3.7728271484375, 3.900909423828125, 4.02899169921875, 4.157073974609375, 4.28515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 17.0, 21.0, 26.0, 55.0, 120.0, 227.0, 259.0, 106.0, 39.0, 29.0, 21.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4947509765625, -1.449462890625, -1.4041748046875, -1.35888671875, -1.3135986328125, -1.268310546875, -1.2230224609375, -1.177734375, -1.1324462890625, -1.087158203125, -1.0418701171875, -0.99658203125, -0.9512939453125, -0.906005859375, -0.8607177734375, -0.8154296875, -0.7701416015625, -0.724853515625, -0.6795654296875, -0.63427734375, -0.5889892578125, -0.543701171875, -0.4984130859375, -0.453125, -0.4078369140625, -0.362548828125, -0.3172607421875, -0.27197265625, -0.2266845703125, -0.181396484375, -0.1361083984375, -0.0908203125, -0.0455322265625, -0.000244140625, 0.0450439453125, 0.09033203125, 0.1356201171875, 0.180908203125, 0.2261962890625, 0.271484375, 0.3167724609375, 0.362060546875, 0.4073486328125, 0.45263671875, 0.4979248046875, 0.543212890625, 0.5885009765625, 0.6337890625, 0.6790771484375, 0.724365234375, 0.7696533203125, 0.81494140625, 0.8602294921875, 0.905517578125, 0.9508056640625, 0.99609375, 1.0413818359375, 1.086669921875, 1.1319580078125, 1.17724609375, 1.2225341796875, 1.267822265625, 1.3131103515625, 1.3583984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 25.0, 32.0, 68.0, 122.0, 958.0, 83425.0, 961860.0, 1660.0, 192.0, 64.0, 43.0, 23.0, 13.0, 14.0, 5.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.828125, -26.9033203125, -25.978515625, -25.0537109375, -24.12890625, -23.2041015625, -22.279296875, -21.3544921875, -20.4296875, -19.5048828125, -18.580078125, -17.6552734375, -16.73046875, -15.8056640625, -14.880859375, -13.9560546875, -13.03125, -12.1064453125, -11.181640625, -10.2568359375, -9.33203125, -8.4072265625, -7.482421875, -6.5576171875, -5.6328125, -4.7080078125, -3.783203125, -2.8583984375, -1.93359375, -1.0087890625, -0.083984375, 0.8408203125, 1.765625, 2.6904296875, 3.615234375, 4.5400390625, 5.46484375, 6.3896484375, 7.314453125, 8.2392578125, 9.1640625, 10.0888671875, 11.013671875, 11.9384765625, 12.86328125, 13.7880859375, 14.712890625, 15.6376953125, 16.5625, 17.4873046875, 18.412109375, 19.3369140625, 20.26171875, 21.1865234375, 22.111328125, 23.0361328125, 23.9609375, 24.8857421875, 25.810546875, 26.7353515625, 27.66015625, 28.5849609375, 29.509765625, 30.4345703125, 31.359375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 9.0, 12.0, 13.0, 22.0, 32.0, 60.0, 84.0, 113.0, 152.0, 157.0, 129.0, 81.0, 51.0, 38.0, 24.0, 15.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.998117208480835, -1.9491727352142334, -1.9002282619476318, -1.8512837886810303, -1.8023391962051392, -1.7533947229385376, -1.704450249671936, -1.6555057764053345, -1.6065611839294434, -1.5576167106628418, -1.5086722373962402, -1.4597277641296387, -1.4107831716537476, -1.361838698387146, -1.3128942251205444, -1.2639497518539429, -1.2150052785873413, -1.1660608053207397, -1.1171163320541382, -1.068171739578247, -1.0192272663116455, -0.970282793045044, -0.9213383197784424, -0.8723938465118408, -0.8234493136405945, -0.7745048403739929, -0.7255603075027466, -0.676615834236145, -0.6276713609695435, -0.5787268280982971, -0.5297823548316956, -0.4808378517627716, -0.4318934679031372, -0.38294896483421326, -0.3340044617652893, -0.28505998849868774, -0.2361154854297638, -0.18717098236083984, -0.13822650909423828, -0.08928200602531433, -0.04033750295639038, 0.008606992661952972, 0.057551488280296326, 0.10649597644805908, 0.15544047951698303, 0.20438498258590698, 0.25332945585250854, 0.3022739589214325, 0.35121846199035645, 0.4001629650592804, 0.44910746812820435, 0.4980519413948059, 0.5469964742660522, 0.5959409475326538, 0.6448854207992554, 0.6938298940658569, 0.7427744269371033, 0.7917189002037048, 0.8406634330749512, 0.8896079063415527, 0.9385523796081543, 0.9874969124794006, 1.0364413261413574, 1.0853859186172485, 1.13433039188385]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 17.0, 16.0, 9.0, 13.0, 21.0, 22.0, 29.0, 34.0, 40.0, 38.0, 33.0, 34.0, 44.0, 39.0, 37.0, 42.0, 38.0, 45.0, 38.0, 39.0, 42.0, 30.0, 36.0, 26.0, 27.0, 25.0, 25.0, 23.0, 24.0, 20.0, 12.0, 12.0, 10.0, 3.0, 8.0, 7.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8735390901565552, -0.8446713089942932, -0.8158035278320312, -0.7869357466697693, -0.7580679655075073, -0.7292001843452454, -0.7003324031829834, -0.6714646816253662, -0.6425968408584595, -0.6137290596961975, -0.5848612785339355, -0.5559934973716736, -0.5271257162094116, -0.49825793504714966, -0.4693901836872101, -0.4405224025249481, -0.41165465116500854, -0.3827868700027466, -0.3539190888404846, -0.32505130767822266, -0.2961835265159607, -0.26731574535369873, -0.23844799399375916, -0.2095802128314972, -0.18071243166923523, -0.15184465050697327, -0.1229768767952919, -0.09410910308361053, -0.06524132192134857, -0.03637354075908661, -0.00750577449798584, 0.021362006664276123, 0.05022972822189331, 0.07909750938415527, 0.10796528309583664, 0.136833056807518, 0.16570083796977997, 0.19456861913204193, 0.2234363853931427, 0.25230416655540466, 0.2811719477176666, 0.3100397288799286, 0.33890751004219055, 0.3677752614021301, 0.3966430425643921, 0.42551082372665405, 0.454378604888916, 0.483246386051178, 0.5121141672134399, 0.5409819483757019, 0.5698497295379639, 0.5987175107002258, 0.6275852918624878, 0.6564530730247498, 0.6853208541870117, 0.7141885757446289, 0.7430564165115356, 0.7719241976737976, 0.8007919788360596, 0.8296597599983215, 0.8585275411605835, 0.8873953223228455, 0.9162631034851074, 0.9451308250427246, 0.9739986062049866]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 9.0, 11.0, 9.0, 12.0, 20.0, 18.0, 14.0, 20.0, 29.0, 26.0, 40.0, 35.0, 35.0, 35.0, 37.0, 33.0, 37.0, 36.0, 48.0, 40.0, 41.0, 45.0, 38.0, 39.0, 26.0, 21.0, 24.0, 29.0, 26.0, 22.0, 23.0, 14.0, 13.0, 15.0, 10.0, 15.0, 6.0, 13.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.701171875, -2.612457275390625, -2.52374267578125, -2.435028076171875, -2.3463134765625, -2.257598876953125, -2.16888427734375, -2.080169677734375, -1.991455078125, -1.902740478515625, -1.81402587890625, -1.725311279296875, -1.6365966796875, -1.547882080078125, -1.45916748046875, -1.370452880859375, -1.28173828125, -1.193023681640625, -1.10430908203125, -1.015594482421875, -0.9268798828125, -0.838165283203125, -0.74945068359375, -0.660736083984375, -0.572021484375, -0.483306884765625, -0.39459228515625, -0.305877685546875, -0.2171630859375, -0.128448486328125, -0.03973388671875, 0.048980712890625, 0.1376953125, 0.226409912109375, 0.31512451171875, 0.403839111328125, 0.4925537109375, 0.581268310546875, 0.66998291015625, 0.758697509765625, 0.847412109375, 0.936126708984375, 1.02484130859375, 1.113555908203125, 1.2022705078125, 1.290985107421875, 1.37969970703125, 1.468414306640625, 1.55712890625, 1.645843505859375, 1.73455810546875, 1.823272705078125, 1.9119873046875, 2.000701904296875, 2.08941650390625, 2.178131103515625, 2.266845703125, 2.355560302734375, 2.44427490234375, 2.532989501953125, 2.6217041015625, 2.710418701171875, 2.79913330078125, 2.887847900390625, 2.9765625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 13.0, 13.0, 14.0, 31.0, 31.0, 45.0, 50.0, 88.0, 110.0, 166.0, 230.0, 340.0, 570.0, 924.0, 1490.0, 2540.0, 4654.0, 8524.0, 18114.0, 52040.0, 378990.0, 479591.0, 59370.0, 19580.0, 9064.0, 4827.0, 2697.0, 1600.0, 925.0, 635.0, 391.0, 263.0, 152.0, 102.0, 100.0, 64.0, 47.0, 34.0, 29.0, 20.0, 21.0, 11.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.828125, -5.6341552734375, -5.440185546875, -5.2462158203125, -5.05224609375, -4.8582763671875, -4.664306640625, -4.4703369140625, -4.2763671875, -4.0823974609375, -3.888427734375, -3.6944580078125, -3.50048828125, -3.3065185546875, -3.112548828125, -2.9185791015625, -2.724609375, -2.5306396484375, -2.336669921875, -2.1427001953125, -1.94873046875, -1.7547607421875, -1.560791015625, -1.3668212890625, -1.1728515625, -0.9788818359375, -0.784912109375, -0.5909423828125, -0.39697265625, -0.2030029296875, -0.009033203125, 0.1849365234375, 0.37890625, 0.5728759765625, 0.766845703125, 0.9608154296875, 1.15478515625, 1.3487548828125, 1.542724609375, 1.7366943359375, 1.9306640625, 2.1246337890625, 2.318603515625, 2.5125732421875, 2.70654296875, 2.9005126953125, 3.094482421875, 3.2884521484375, 3.482421875, 3.6763916015625, 3.870361328125, 4.0643310546875, 4.25830078125, 4.4522705078125, 4.646240234375, 4.8402099609375, 5.0341796875, 5.2281494140625, 5.422119140625, 5.6160888671875, 5.81005859375, 6.0040283203125, 6.197998046875, 6.3919677734375, 6.5859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 9.0, 24.0, 20.0, 22.0, 34.0, 26.0, 23.0, 41.0, 50.0, 44.0, 77.0, 108.0, 146.0, 1509.0, 261.0, 119.0, 90.0, 74.0, 50.0, 47.0, 35.0, 37.0, 29.0, 25.0, 18.0, 19.0, 10.0, 13.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.3359375, -11.970703125, -11.60546875, -11.240234375, -10.875, -10.509765625, -10.14453125, -9.779296875, -9.4140625, -9.048828125, -8.68359375, -8.318359375, -7.953125, -7.587890625, -7.22265625, -6.857421875, -6.4921875, -6.126953125, -5.76171875, -5.396484375, -5.03125, -4.666015625, -4.30078125, -3.935546875, -3.5703125, -3.205078125, -2.83984375, -2.474609375, -2.109375, -1.744140625, -1.37890625, -1.013671875, -0.6484375, -0.283203125, 0.08203125, 0.447265625, 0.8125, 1.177734375, 1.54296875, 1.908203125, 2.2734375, 2.638671875, 3.00390625, 3.369140625, 3.734375, 4.099609375, 4.46484375, 4.830078125, 5.1953125, 5.560546875, 5.92578125, 6.291015625, 6.65625, 7.021484375, 7.38671875, 7.751953125, 8.1171875, 8.482421875, 8.84765625, 9.212890625, 9.578125, 9.943359375, 10.30859375, 10.673828125, 11.0390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 7.0, 11.0, 15.0, 8.0, 19.0, 26.0, 32.0, 38.0, 53.0, 64.0, 74.0, 125.0, 159.0, 286.0, 828.0, 5503.0, 84324.0, 2962562.0, 84260.0, 5558.0, 833.0, 266.0, 156.0, 120.0, 95.0, 52.0, 53.0, 37.0, 28.0, 25.0, 22.0, 10.0, 13.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.182861328125, -22.39697265625, -21.611083984375, -20.8251953125, -20.039306640625, -19.25341796875, -18.467529296875, -17.681640625, -16.895751953125, -16.10986328125, -15.323974609375, -14.5380859375, -13.752197265625, -12.96630859375, -12.180419921875, -11.39453125, -10.608642578125, -9.82275390625, -9.036865234375, -8.2509765625, -7.465087890625, -6.67919921875, -5.893310546875, -5.107421875, -4.321533203125, -3.53564453125, -2.749755859375, -1.9638671875, -1.177978515625, -0.39208984375, 0.393798828125, 1.1796875, 1.965576171875, 2.75146484375, 3.537353515625, 4.3232421875, 5.109130859375, 5.89501953125, 6.680908203125, 7.466796875, 8.252685546875, 9.03857421875, 9.824462890625, 10.6103515625, 11.396240234375, 12.18212890625, 12.968017578125, 13.75390625, 14.539794921875, 15.32568359375, 16.111572265625, 16.8974609375, 17.683349609375, 18.46923828125, 19.255126953125, 20.041015625, 20.826904296875, 21.61279296875, 22.398681640625, 23.1845703125, 23.970458984375, 24.75634765625, 25.542236328125, 26.328125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 35.0, 102.0, 329.0, 366.0, 138.0, 34.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.385540008544922, -27.14822769165039, -24.91091537475586, -22.673603057861328, -20.436290740966797, -18.198978424072266, -15.961664199829102, -13.72435188293457, -11.487039566040039, -9.249727249145508, -7.012414455413818, -4.775101661682129, -2.5377893447875977, -0.3004770278930664, 1.9368362426757812, 4.1741485595703125, 6.411460876464844, 8.648773193359375, 10.886085510253906, 13.123398780822754, 15.360711097717285, 17.5980224609375, 19.835336685180664, 22.072649002075195, 24.309961318969727, 26.547273635864258, 28.78458595275879, 31.021900177001953, 33.259212493896484, 35.496524810791016, 37.73383712768555, 39.97114944458008, 42.208457946777344, 44.445770263671875, 46.683082580566406, 48.92039489746094, 51.15770721435547, 53.39501953125, 55.63233184814453, 57.86964416503906, 60.106956481933594, 62.344268798828125, 64.58158111572266, 66.81889343261719, 69.05620574951172, 71.29351806640625, 73.53083038330078, 75.76814270019531, 78.00546264648438, 80.2427749633789, 82.48008728027344, 84.71739959716797, 86.9547119140625, 89.19202423095703, 91.42933654785156, 93.6666488647461, 95.90396118164062, 98.14127349853516, 100.37858581542969, 102.61589813232422, 104.85321044921875, 107.09052276611328, 109.32783508300781, 111.56514739990234, 113.80245971679688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 4.0, 6.0, 7.0, 7.0, 11.0, 14.0, 7.0, 14.0, 21.0, 18.0, 16.0, 28.0, 30.0, 24.0, 34.0, 35.0, 38.0, 44.0, 33.0, 48.0, 43.0, 47.0, 40.0, 43.0, 43.0, 33.0, 40.0, 40.0, 31.0, 41.0, 43.0, 19.0, 12.0, 16.0, 10.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.859025955200195, -28.9013614654541, -27.94369888305664, -26.986034393310547, -26.028371810913086, -25.070707321166992, -24.11304473876953, -23.155380249023438, -22.197715759277344, -21.24005126953125, -20.28238868713379, -19.324724197387695, -18.367061614990234, -17.40939712524414, -16.451732635498047, -15.494070053100586, -14.536407470703125, -13.578743934631348, -12.62108039855957, -11.663415908813477, -10.705753326416016, -9.748088836669922, -8.790425300598145, -7.832761764526367, -6.87509822845459, -5.9174346923828125, -4.959771156311035, -4.0021071434021, -3.0444436073303223, -2.086780071258545, -1.1291160583496094, -0.17145252227783203, 0.7862110137939453, 1.7438746690750122, 2.701538324356079, 3.6592020988464355, 4.616865634918213, 5.57452917098999, 6.532193183898926, 7.489856719970703, 8.44752025604248, 9.405183792114258, 10.362847328186035, 11.320510864257812, 12.278175354003906, 13.235837936401367, 14.193502426147461, 15.151165962219238, 16.108829498291016, 17.06649398803711, 18.02415657043457, 18.981821060180664, 19.939483642578125, 20.89714813232422, 21.854812622070312, 22.812475204467773, 23.770137786865234, 24.727802276611328, 25.68546485900879, 26.643129348754883, 27.600791931152344, 28.558456420898438, 29.51612091064453, 30.473783493041992, 31.431447982788086]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 7.0, 11.0, 13.0, 14.0, 17.0, 15.0, 19.0, 23.0, 27.0, 22.0, 23.0, 38.0, 34.0, 32.0, 35.0, 40.0, 32.0, 39.0, 53.0, 34.0, 43.0, 56.0, 47.0, 29.0, 21.0, 36.0, 22.0, 34.0, 27.0, 24.0, 21.0, 23.0, 13.0, 15.0, 12.0, 10.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.938720703125, -2.83642578125, -2.734130859375, -2.6318359375, -2.529541015625, -2.42724609375, -2.324951171875, -2.22265625, -2.120361328125, -2.01806640625, -1.915771484375, -1.8134765625, -1.711181640625, -1.60888671875, -1.506591796875, -1.404296875, -1.302001953125, -1.19970703125, -1.097412109375, -0.9951171875, -0.892822265625, -0.79052734375, -0.688232421875, -0.5859375, -0.483642578125, -0.38134765625, -0.279052734375, -0.1767578125, -0.074462890625, 0.02783203125, 0.130126953125, 0.232421875, 0.334716796875, 0.43701171875, 0.539306640625, 0.6416015625, 0.743896484375, 0.84619140625, 0.948486328125, 1.05078125, 1.153076171875, 1.25537109375, 1.357666015625, 1.4599609375, 1.562255859375, 1.66455078125, 1.766845703125, 1.869140625, 1.971435546875, 2.07373046875, 2.176025390625, 2.2783203125, 2.380615234375, 2.48291015625, 2.585205078125, 2.6875, 2.789794921875, 2.89208984375, 2.994384765625, 3.0966796875, 3.198974609375, 3.30126953125, 3.403564453125, 3.505859375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 6.0, 9.0, 11.0, 11.0, 15.0, 30.0, 34.0, 63.0, 83.0, 111.0, 136.0, 191.0, 298.0, 420.0, 735.0, 1224.0, 2267.0, 4365.0, 9227.0, 21311.0, 62264.0, 451353.0, 2985198.0, 542965.0, 68253.0, 23040.0, 9962.0, 4723.0, 2315.0, 1304.0, 761.0, 502.0, 311.0, 232.0, 153.0, 93.0, 74.0, 61.0, 37.0, 32.0, 30.0, 12.0, 17.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.2109375, -8.9188232421875, -8.626708984375, -8.3345947265625, -8.04248046875, -7.7503662109375, -7.458251953125, -7.1661376953125, -6.8740234375, -6.5819091796875, -6.289794921875, -5.9976806640625, -5.70556640625, -5.4134521484375, -5.121337890625, -4.8292236328125, -4.537109375, -4.2449951171875, -3.952880859375, -3.6607666015625, -3.36865234375, -3.0765380859375, -2.784423828125, -2.4923095703125, -2.2001953125, -1.9080810546875, -1.615966796875, -1.3238525390625, -1.03173828125, -0.7396240234375, -0.447509765625, -0.1553955078125, 0.13671875, 0.4288330078125, 0.720947265625, 1.0130615234375, 1.30517578125, 1.5972900390625, 1.889404296875, 2.1815185546875, 2.4736328125, 2.7657470703125, 3.057861328125, 3.3499755859375, 3.64208984375, 3.9342041015625, 4.226318359375, 4.5184326171875, 4.810546875, 5.1026611328125, 5.394775390625, 5.6868896484375, 5.97900390625, 6.2711181640625, 6.563232421875, 6.8553466796875, 7.1474609375, 7.4395751953125, 7.731689453125, 8.0238037109375, 8.31591796875, 8.6080322265625, 8.900146484375, 9.1922607421875, 9.484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 4.0, 4.0, 8.0, 13.0, 22.0, 27.0, 25.0, 26.0, 43.0, 67.0, 79.0, 81.0, 148.0, 200.0, 350.0, 557.0, 701.0, 543.0, 343.0, 241.0, 125.0, 100.0, 76.0, 64.0, 47.0, 41.0, 31.0, 18.0, 16.0, 9.0, 14.0, 9.0, 10.0, 11.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.15203857421875, -6.9251708984375, -6.69830322265625, -6.471435546875, -6.24456787109375, -6.0177001953125, -5.79083251953125, -5.56396484375, -5.33709716796875, -5.1102294921875, -4.88336181640625, -4.656494140625, -4.42962646484375, -4.2027587890625, -3.97589111328125, -3.7490234375, -3.52215576171875, -3.2952880859375, -3.06842041015625, -2.841552734375, -2.61468505859375, -2.3878173828125, -2.16094970703125, -1.93408203125, -1.70721435546875, -1.4803466796875, -1.25347900390625, -1.026611328125, -0.79974365234375, -0.5728759765625, -0.34600830078125, -0.119140625, 0.10772705078125, 0.3345947265625, 0.56146240234375, 0.788330078125, 1.01519775390625, 1.2420654296875, 1.46893310546875, 1.69580078125, 1.92266845703125, 2.1495361328125, 2.37640380859375, 2.603271484375, 2.83013916015625, 3.0570068359375, 3.28387451171875, 3.5107421875, 3.73760986328125, 3.9644775390625, 4.19134521484375, 4.418212890625, 4.64508056640625, 4.8719482421875, 5.09881591796875, 5.32568359375, 5.55255126953125, 5.7794189453125, 6.00628662109375, 6.233154296875, 6.46002197265625, 6.6868896484375, 6.91375732421875, 7.140625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 9.0, 16.0, 8.0, 21.0, 20.0, 28.0, 41.0, 50.0, 70.0, 71.0, 136.0, 256.0, 854.0, 5022.0, 82183.0, 3880748.0, 213433.0, 9246.0, 1175.0, 328.0, 144.0, 107.0, 80.0, 43.0, 35.0, 27.0, 21.0, 24.0, 23.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.90625, -29.928955078125, -28.95166015625, -27.974365234375, -26.9970703125, -26.019775390625, -25.04248046875, -24.065185546875, -23.087890625, -22.110595703125, -21.13330078125, -20.156005859375, -19.1787109375, -18.201416015625, -17.22412109375, -16.246826171875, -15.26953125, -14.292236328125, -13.31494140625, -12.337646484375, -11.3603515625, -10.383056640625, -9.40576171875, -8.428466796875, -7.451171875, -6.473876953125, -5.49658203125, -4.519287109375, -3.5419921875, -2.564697265625, -1.58740234375, -0.610107421875, 0.3671875, 1.344482421875, 2.32177734375, 3.299072265625, 4.2763671875, 5.253662109375, 6.23095703125, 7.208251953125, 8.185546875, 9.162841796875, 10.14013671875, 11.117431640625, 12.0947265625, 13.072021484375, 14.04931640625, 15.026611328125, 16.00390625, 16.981201171875, 17.95849609375, 18.935791015625, 19.9130859375, 20.890380859375, 21.86767578125, 22.844970703125, 23.822265625, 24.799560546875, 25.77685546875, 26.754150390625, 27.7314453125, 28.708740234375, 29.68603515625, 30.663330078125, 31.640625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 13.0, 21.0, 39.0, 74.0, 139.0, 213.0, 209.0, 130.0, 80.0, 40.0, 23.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62064743041992, -52.782440185546875, -50.944236755371094, -49.10602951049805, -47.267822265625, -45.42961883544922, -43.59141159057617, -41.753204345703125, -39.915000915527344, -38.0767936706543, -36.238590240478516, -34.40038299560547, -32.56217575073242, -30.723970413208008, -28.885765075683594, -27.047557830810547, -25.2093505859375, -23.371145248413086, -21.53293800354004, -19.694732666015625, -17.856525421142578, -16.018320083618164, -14.18011474609375, -12.34190845489502, -10.503702163696289, -8.665495872497559, -6.827290058135986, -4.989084243774414, -3.1508779525756836, -1.3126716613769531, 0.5255336761474609, 2.3637399673461914, 4.201946258544922, 6.040152549743652, 7.878358364105225, 9.716564178466797, 11.554770469665527, 13.392976760864258, 15.231182098388672, 17.06938934326172, 18.907594680786133, 20.745800018310547, 22.584007263183594, 24.422212600708008, 26.260417938232422, 28.09862518310547, 29.936830520629883, 31.775035858154297, 33.613243103027344, 35.45145034790039, 37.28965377807617, 39.12786102294922, 40.966068267822266, 42.80427551269531, 44.642478942871094, 46.48068618774414, 48.31889343261719, 50.157100677490234, 51.995304107666016, 53.83351135253906, 55.67171859741211, 57.509925842285156, 59.34812927246094, 61.186336517333984, 63.024539947509766]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 12.0, 10.0, 17.0, 20.0, 15.0, 24.0, 34.0, 34.0, 42.0, 27.0, 27.0, 44.0, 56.0, 37.0, 39.0, 48.0, 42.0, 37.0, 39.0, 38.0, 33.0, 30.0, 34.0, 30.0, 32.0, 25.0, 15.0, 24.0, 22.0, 19.0, 9.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.095863342285156, -21.375322341918945, -20.6547794342041, -19.93423843383789, -19.213695526123047, -18.493154525756836, -17.772613525390625, -17.05207061767578, -16.33152961730957, -15.610987663269043, -14.890445709228516, -14.169904708862305, -13.449362754821777, -12.72882080078125, -12.008279800415039, -11.287737846374512, -10.567195892333984, -9.846653938293457, -9.12611198425293, -8.405570983886719, -7.685029029846191, -6.964487075805664, -6.243945598602295, -5.523404121398926, -4.802862167358398, -4.082320213317871, -3.361778736114502, -2.6412370204925537, -1.9206953048706055, -1.2001535892486572, -0.479611873626709, 0.24092960357666016, 0.9614734649658203, 1.6820151805877686, 2.402556896209717, 3.123098611831665, 3.8436403274536133, 4.564182281494141, 5.28472375869751, 6.005265235900879, 6.725807189941406, 7.446349143981934, 8.166891098022461, 8.887432098388672, 9.6079740524292, 10.328516006469727, 11.049057006835938, 11.769598960876465, 12.490140914916992, 13.21068286895752, 13.931224822998047, 14.651765823364258, 15.372307777404785, 16.092849731445312, 16.813390731811523, 17.533931732177734, 18.254474639892578, 18.97501564025879, 19.695558547973633, 20.416099548339844, 21.136642456054688, 21.8571834564209, 22.57772445678711, 23.298267364501953, 24.018808364868164]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 4.0, 9.0, 10.0, 16.0, 14.0, 13.0, 14.0, 21.0, 22.0, 25.0, 25.0, 29.0, 33.0, 46.0, 39.0, 49.0, 36.0, 40.0, 42.0, 46.0, 26.0, 52.0, 63.0, 37.0, 35.0, 31.0, 21.0, 20.0, 24.0, 39.0, 16.0, 13.0, 25.0, 9.0, 16.0, 12.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.835906982421875, -2.73040771484375, -2.624908447265625, -2.5194091796875, -2.413909912109375, -2.30841064453125, -2.202911376953125, -2.097412109375, -1.991912841796875, -1.88641357421875, -1.780914306640625, -1.6754150390625, -1.569915771484375, -1.46441650390625, -1.358917236328125, -1.25341796875, -1.147918701171875, -1.04241943359375, -0.936920166015625, -0.8314208984375, -0.725921630859375, -0.62042236328125, -0.514923095703125, -0.409423828125, -0.303924560546875, -0.19842529296875, -0.092926025390625, 0.0125732421875, 0.118072509765625, 0.22357177734375, 0.329071044921875, 0.4345703125, 0.540069580078125, 0.64556884765625, 0.751068115234375, 0.8565673828125, 0.962066650390625, 1.06756591796875, 1.173065185546875, 1.278564453125, 1.384063720703125, 1.48956298828125, 1.595062255859375, 1.7005615234375, 1.806060791015625, 1.91156005859375, 2.017059326171875, 2.12255859375, 2.228057861328125, 2.33355712890625, 2.439056396484375, 2.5445556640625, 2.650054931640625, 2.75555419921875, 2.861053466796875, 2.966552734375, 3.072052001953125, 3.17755126953125, 3.283050537109375, 3.3885498046875, 3.494049072265625, 3.59954833984375, 3.705047607421875, 3.810546875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 20.0, 13.0, 29.0, 70.0, 156.0, 308.0, 610.0, 1424.0, 3555.0, 11157.0, 76747.0, 815142.0, 118219.0, 14017.0, 4024.0, 1623.0, 756.0, 309.0, 157.0, 87.0, 46.0, 24.0, 11.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.44921875, -4.32415771484375, -4.1990966796875, -4.07403564453125, -3.948974609375, -3.82391357421875, -3.6988525390625, -3.57379150390625, -3.44873046875, -3.32366943359375, -3.1986083984375, -3.07354736328125, -2.948486328125, -2.82342529296875, -2.6983642578125, -2.57330322265625, -2.4482421875, -2.32318115234375, -2.1981201171875, -2.07305908203125, -1.947998046875, -1.82293701171875, -1.6978759765625, -1.57281494140625, -1.44775390625, -1.32269287109375, -1.1976318359375, -1.07257080078125, -0.947509765625, -0.82244873046875, -0.6973876953125, -0.57232666015625, -0.447265625, -0.32220458984375, -0.1971435546875, -0.07208251953125, 0.052978515625, 0.17803955078125, 0.3031005859375, 0.42816162109375, 0.55322265625, 0.67828369140625, 0.8033447265625, 0.92840576171875, 1.053466796875, 1.17852783203125, 1.3035888671875, 1.42864990234375, 1.5537109375, 1.67877197265625, 1.8038330078125, 1.92889404296875, 2.053955078125, 2.17901611328125, 2.3040771484375, 2.42913818359375, 2.55419921875, 2.67926025390625, 2.8043212890625, 2.92938232421875, 3.054443359375, 3.17950439453125, 3.3045654296875, 3.42962646484375, 3.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 10.0, 9.0, 11.0, 17.0, 11.0, 16.0, 15.0, 26.0, 21.0, 24.0, 33.0, 24.0, 35.0, 38.0, 25.0, 37.0, 47.0, 1066.0, 34.0, 41.0, 46.0, 45.0, 44.0, 35.0, 31.0, 35.0, 33.0, 25.0, 34.0, 13.0, 18.0, 16.0, 22.0, 10.0, 5.0, 12.0, 7.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.44921875, -2.370208740234375, -2.29119873046875, -2.212188720703125, -2.1331787109375, -2.054168701171875, -1.97515869140625, -1.896148681640625, -1.817138671875, -1.738128662109375, -1.65911865234375, -1.580108642578125, -1.5010986328125, -1.422088623046875, -1.34307861328125, -1.264068603515625, -1.18505859375, -1.106048583984375, -1.02703857421875, -0.948028564453125, -0.8690185546875, -0.790008544921875, -0.71099853515625, -0.631988525390625, -0.552978515625, -0.473968505859375, -0.39495849609375, -0.315948486328125, -0.2369384765625, -0.157928466796875, -0.07891845703125, 9.1552734375e-05, 0.0791015625, 0.158111572265625, 0.23712158203125, 0.316131591796875, 0.3951416015625, 0.474151611328125, 0.55316162109375, 0.632171630859375, 0.711181640625, 0.790191650390625, 0.86920166015625, 0.948211669921875, 1.0272216796875, 1.106231689453125, 1.18524169921875, 1.264251708984375, 1.34326171875, 1.422271728515625, 1.50128173828125, 1.580291748046875, 1.6593017578125, 1.738311767578125, 1.81732177734375, 1.896331787109375, 1.975341796875, 2.054351806640625, 2.13336181640625, 2.212371826171875, 2.2913818359375, 2.370391845703125, 2.44940185546875, 2.528411865234375, 2.607421875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 3.0, 6.0, 5.0, 17.0, 33.0, 48.0, 56.0, 103.0, 131.0, 244.0, 379.0, 569.0, 999.0, 1877.0, 3985.0, 12042.0, 74235.0, 1792372.0, 180284.0, 18799.0, 5510.0, 2288.0, 1223.0, 754.0, 432.0, 248.0, 177.0, 102.0, 71.0, 41.0, 31.0, 20.0, 7.0, 10.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.505859375, -2.4374847412109375, -2.369110107421875, -2.3007354736328125, -2.23236083984375, -2.1639862060546875, -2.095611572265625, -2.0272369384765625, -1.9588623046875, -1.8904876708984375, -1.822113037109375, -1.7537384033203125, -1.68536376953125, -1.6169891357421875, -1.548614501953125, -1.4802398681640625, -1.411865234375, -1.3434906005859375, -1.275115966796875, -1.2067413330078125, -1.13836669921875, -1.0699920654296875, -1.001617431640625, -0.9332427978515625, -0.8648681640625, -0.7964935302734375, -0.728118896484375, -0.6597442626953125, -0.59136962890625, -0.5229949951171875, -0.454620361328125, -0.3862457275390625, -0.31787109375, -0.2494964599609375, -0.181121826171875, -0.1127471923828125, -0.04437255859375, 0.0240020751953125, 0.092376708984375, 0.1607513427734375, 0.2291259765625, 0.2975006103515625, 0.365875244140625, 0.4342498779296875, 0.50262451171875, 0.5709991455078125, 0.639373779296875, 0.7077484130859375, 0.776123046875, 0.8444976806640625, 0.912872314453125, 0.9812469482421875, 1.04962158203125, 1.1179962158203125, 1.186370849609375, 1.2547454833984375, 1.3231201171875, 1.3914947509765625, 1.459869384765625, 1.5282440185546875, 1.59661865234375, 1.6649932861328125, 1.733367919921875, 1.8017425537109375, 1.8701171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 30.0, 37.0, 77.0, 94.0, 207.0, 206.0, 137.0, 72.0, 55.0, 19.0, 25.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4054222106933594, -0.39238739013671875, -0.3793525695800781, -0.3663177490234375, -0.3532829284667969, -0.34024810791015625, -0.3272132873535156, -0.314178466796875, -0.3011436462402344, -0.28810882568359375, -0.2750740051269531, -0.2620391845703125, -0.24900436401367188, -0.23596954345703125, -0.22293472290039062, -0.20989990234375, -0.19686508178710938, -0.18383026123046875, -0.17079544067382812, -0.1577606201171875, -0.14472579956054688, -0.13169097900390625, -0.11865615844726562, -0.105621337890625, -0.09258651733398438, -0.07955169677734375, -0.06651687622070312, -0.0534820556640625, -0.040447235107421875, -0.02741241455078125, -0.014377593994140625, -0.0013427734375, 0.011692047119140625, 0.02472686767578125, 0.037761688232421875, 0.0507965087890625, 0.06383132934570312, 0.07686614990234375, 0.08990097045898438, 0.102935791015625, 0.11597061157226562, 0.12900543212890625, 0.14204025268554688, 0.1550750732421875, 0.16810989379882812, 0.18114471435546875, 0.19417953491210938, 0.20721435546875, 0.22024917602539062, 0.23328399658203125, 0.24631881713867188, 0.2593536376953125, 0.2723884582519531, 0.28542327880859375, 0.2984580993652344, 0.311492919921875, 0.3245277404785156, 0.33756256103515625, 0.3505973815917969, 0.3636322021484375, 0.3766670227050781, 0.38970184326171875, 0.4027366638183594, 0.415771484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 27.0, 36.0, 85.0, 170.0, 1145.0, 226177.0, 819212.0, 1348.0, 162.0, 67.0, 45.0, 21.0, 9.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.62060546875, -8.3427734375, -8.06494140625, -7.787109375, -7.50927734375, -7.2314453125, -6.95361328125, -6.67578125, -6.39794921875, -6.1201171875, -5.84228515625, -5.564453125, -5.28662109375, -5.0087890625, -4.73095703125, -4.453125, -4.17529296875, -3.8974609375, -3.61962890625, -3.341796875, -3.06396484375, -2.7861328125, -2.50830078125, -2.23046875, -1.95263671875, -1.6748046875, -1.39697265625, -1.119140625, -0.84130859375, -0.5634765625, -0.28564453125, -0.0078125, 0.27001953125, 0.5478515625, 0.82568359375, 1.103515625, 1.38134765625, 1.6591796875, 1.93701171875, 2.21484375, 2.49267578125, 2.7705078125, 3.04833984375, 3.326171875, 3.60400390625, 3.8818359375, 4.15966796875, 4.4375, 4.71533203125, 4.9931640625, 5.27099609375, 5.548828125, 5.82666015625, 6.1044921875, 6.38232421875, 6.66015625, 6.93798828125, 7.2158203125, 7.49365234375, 7.771484375, 8.04931640625, 8.3271484375, 8.60498046875, 8.8828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 22.0, 28.0, 23.0, 52.0, 79.0, 121.0, 136.0, 161.0, 99.0, 82.0, 54.0, 41.0, 26.0, 22.0, 14.0, 14.0, 8.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18939897418022156, -0.1777198165655136, -0.16604065895080566, -0.1543615162372589, -0.14268234372138977, -0.13100320100784302, -0.11932404339313507, -0.10764488577842712, -0.09596572816371918, -0.08428657054901123, -0.07260741293430328, -0.060928262770175934, -0.04924910515546799, -0.03756994754076004, -0.02589079737663269, -0.014211639761924744, -0.002532482147216797, 0.009146673604846, 0.020825829356908798, 0.03250498324632645, 0.04418414086103439, 0.05586329847574234, 0.06754244863986969, 0.07922160625457764, 0.09090076386928558, 0.10257992148399353, 0.11425907909870148, 0.12593823671340942, 0.13761737942695618, 0.14929655194282532, 0.16097569465637207, 0.17265485227108002, 0.18433398008346558, 0.19601313769817352, 0.20769229531288147, 0.21937143802642822, 0.23105061054229736, 0.24272975325584412, 0.25440889596939087, 0.26608806848526, 0.27776724100112915, 0.2894463837146759, 0.30112555623054504, 0.3128046989440918, 0.32448387145996094, 0.3361630141735077, 0.34784215688705444, 0.3595213294029236, 0.37120047211647034, 0.3828796148300171, 0.39455878734588623, 0.406237930059433, 0.4179171025753021, 0.4295962452888489, 0.441275417804718, 0.45295456051826477, 0.4646337032318115, 0.4763128459453583, 0.4879920184612274, 0.49967116117477417, 0.5113503336906433, 0.5230295062065125, 0.5347086191177368, 0.546387791633606, 0.5580669641494751]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 4.0, 14.0, 16.0, 18.0, 16.0, 22.0, 30.0, 17.0, 28.0, 29.0, 29.0, 31.0, 40.0, 38.0, 39.0, 39.0, 44.0, 44.0, 34.0, 37.0, 31.0, 35.0, 29.0, 28.0, 38.0, 34.0, 21.0, 21.0, 21.0, 18.0, 19.0, 14.0, 14.0, 15.0, 11.0, 7.0, 12.0, 5.0, 2.0, 1.0, 4.0, 9.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.17023152112960815, -0.16418780386447906, -0.15814407169818878, -0.1521003544330597, -0.1460566222667694, -0.14001290500164032, -0.13396918773651123, -0.12792545557022095, -0.12188173830509186, -0.11583801358938217, -0.10979428887367249, -0.1037505716085434, -0.09770684689283371, -0.09166312217712402, -0.08561940491199493, -0.07957568019628525, -0.07353195548057556, -0.06748823076486588, -0.06144450977444649, -0.0554007887840271, -0.04935706406831741, -0.04331333935260773, -0.03726961836218834, -0.03122589737176895, -0.025182172656059265, -0.019138449802994728, -0.013094726949930191, -0.007051004096865654, -0.001007281243801117, 0.00503644160926342, 0.011080164462327957, 0.017123885452747345, 0.02316761016845703, 0.02921133302152157, 0.035255055874586105, 0.04129877686500549, 0.04734250158071518, 0.053386226296424866, 0.059429947286844254, 0.06547366827726364, 0.07151739299297333, 0.07756111770868301, 0.0836048424243927, 0.08964855968952179, 0.09569228440523148, 0.10173600912094116, 0.10777972638607025, 0.11382345110177994, 0.11986717581748962, 0.1259108930826187, 0.131954625248909, 0.13799834251403809, 0.14404207468032837, 0.15008579194545746, 0.15612950921058655, 0.16217324137687683, 0.16821695864200592, 0.174260675907135, 0.1803044080734253, 0.18634812533855438, 0.19239184260368347, 0.19843557476997375, 0.20447929203510284, 0.21052300930023193, 0.21656674146652222]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 5.0, 7.0, 11.0, 10.0, 20.0, 20.0, 16.0, 22.0, 27.0, 29.0, 28.0, 34.0, 44.0, 32.0, 39.0, 40.0, 36.0, 35.0, 43.0, 43.0, 48.0, 46.0, 35.0, 33.0, 35.0, 29.0, 34.0, 30.0, 20.0, 10.0, 25.0, 21.0, 15.0, 18.0, 9.0, 8.0, 5.0, 6.0, 2.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.061492919921875, -2.96087646484375, -2.860260009765625, -2.7596435546875, -2.659027099609375, -2.55841064453125, -2.457794189453125, -2.357177734375, -2.256561279296875, -2.15594482421875, -2.055328369140625, -1.9547119140625, -1.854095458984375, -1.75347900390625, -1.652862548828125, -1.55224609375, -1.451629638671875, -1.35101318359375, -1.250396728515625, -1.1497802734375, -1.049163818359375, -0.94854736328125, -0.847930908203125, -0.747314453125, -0.646697998046875, -0.54608154296875, -0.445465087890625, -0.3448486328125, -0.244232177734375, -0.14361572265625, -0.042999267578125, 0.0576171875, 0.158233642578125, 0.25885009765625, 0.359466552734375, 0.4600830078125, 0.560699462890625, 0.66131591796875, 0.761932373046875, 0.862548828125, 0.963165283203125, 1.06378173828125, 1.164398193359375, 1.2650146484375, 1.365631103515625, 1.46624755859375, 1.566864013671875, 1.66748046875, 1.768096923828125, 1.86871337890625, 1.969329833984375, 2.0699462890625, 2.170562744140625, 2.27117919921875, 2.371795654296875, 2.472412109375, 2.573028564453125, 2.67364501953125, 2.774261474609375, 2.8748779296875, 2.975494384765625, 3.07611083984375, 3.176727294921875, 3.27734375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 11.0, 15.0, 25.0, 42.0, 59.0, 87.0, 157.0, 204.0, 301.0, 446.0, 727.0, 1149.0, 1844.0, 2985.0, 4821.0, 8380.0, 14807.0, 28000.0, 58374.0, 166206.0, 493608.0, 150768.0, 54672.0, 26346.0, 14061.0, 7995.0, 4713.0, 2917.0, 1746.0, 1043.0, 730.0, 451.0, 283.0, 202.0, 118.0, 98.0, 47.0, 31.0, 18.0, 16.0, 16.0, 13.0, 12.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.18878173828125, -5.0064697265625, -4.82415771484375, -4.641845703125, -4.45953369140625, -4.2772216796875, -4.09490966796875, -3.91259765625, -3.73028564453125, -3.5479736328125, -3.36566162109375, -3.183349609375, -3.00103759765625, -2.8187255859375, -2.63641357421875, -2.4541015625, -2.27178955078125, -2.0894775390625, -1.90716552734375, -1.724853515625, -1.54254150390625, -1.3602294921875, -1.17791748046875, -0.99560546875, -0.81329345703125, -0.6309814453125, -0.44866943359375, -0.266357421875, -0.08404541015625, 0.0982666015625, 0.28057861328125, 0.462890625, 0.64520263671875, 0.8275146484375, 1.00982666015625, 1.192138671875, 1.37445068359375, 1.5567626953125, 1.73907470703125, 1.92138671875, 2.10369873046875, 2.2860107421875, 2.46832275390625, 2.650634765625, 2.83294677734375, 3.0152587890625, 3.19757080078125, 3.3798828125, 3.56219482421875, 3.7445068359375, 3.92681884765625, 4.109130859375, 4.29144287109375, 4.4737548828125, 4.65606689453125, 4.83837890625, 5.02069091796875, 5.2030029296875, 5.38531494140625, 5.567626953125, 5.74993896484375, 5.9322509765625, 6.11456298828125, 6.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 4.0, 4.0, 4.0, 10.0, 7.0, 16.0, 17.0, 16.0, 17.0, 19.0, 29.0, 29.0, 33.0, 39.0, 45.0, 52.0, 48.0, 84.0, 131.0, 241.0, 1467.0, 196.0, 94.0, 68.0, 60.0, 38.0, 39.0, 28.0, 31.0, 27.0, 29.0, 20.0, 11.0, 11.0, 13.0, 13.0, 10.0, 9.0, 5.0, 8.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.1171875, -9.8043212890625, -9.491455078125, -9.1785888671875, -8.86572265625, -8.5528564453125, -8.239990234375, -7.9271240234375, -7.6142578125, -7.3013916015625, -6.988525390625, -6.6756591796875, -6.36279296875, -6.0499267578125, -5.737060546875, -5.4241943359375, -5.111328125, -4.7984619140625, -4.485595703125, -4.1727294921875, -3.85986328125, -3.5469970703125, -3.234130859375, -2.9212646484375, -2.6083984375, -2.2955322265625, -1.982666015625, -1.6697998046875, -1.35693359375, -1.0440673828125, -0.731201171875, -0.4183349609375, -0.10546875, 0.2073974609375, 0.520263671875, 0.8331298828125, 1.14599609375, 1.4588623046875, 1.771728515625, 2.0845947265625, 2.3974609375, 2.7103271484375, 3.023193359375, 3.3360595703125, 3.64892578125, 3.9617919921875, 4.274658203125, 4.5875244140625, 4.900390625, 5.2132568359375, 5.526123046875, 5.8389892578125, 6.15185546875, 6.4647216796875, 6.777587890625, 7.0904541015625, 7.4033203125, 7.7161865234375, 8.029052734375, 8.3419189453125, 8.65478515625, 8.9676513671875, 9.280517578125, 9.5933837890625, 9.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 10.0, 23.0, 13.0, 32.0, 36.0, 41.0, 75.0, 125.0, 184.0, 313.0, 862.0, 4628.0, 59142.0, 2921844.0, 148044.0, 7972.0, 1324.0, 381.0, 209.0, 125.0, 82.0, 70.0, 45.0, 30.0, 25.0, 14.0, 12.0, 11.0, 10.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.63818359375, -17.7763671875, -16.91455078125, -16.052734375, -15.19091796875, -14.3291015625, -13.46728515625, -12.60546875, -11.74365234375, -10.8818359375, -10.02001953125, -9.158203125, -8.29638671875, -7.4345703125, -6.57275390625, -5.7109375, -4.84912109375, -3.9873046875, -3.12548828125, -2.263671875, -1.40185546875, -0.5400390625, 0.32177734375, 1.18359375, 2.04541015625, 2.9072265625, 3.76904296875, 4.630859375, 5.49267578125, 6.3544921875, 7.21630859375, 8.078125, 8.93994140625, 9.8017578125, 10.66357421875, 11.525390625, 12.38720703125, 13.2490234375, 14.11083984375, 14.97265625, 15.83447265625, 16.6962890625, 17.55810546875, 18.419921875, 19.28173828125, 20.1435546875, 21.00537109375, 21.8671875, 22.72900390625, 23.5908203125, 24.45263671875, 25.314453125, 26.17626953125, 27.0380859375, 27.89990234375, 28.76171875, 29.62353515625, 30.4853515625, 31.34716796875, 32.208984375, 33.07080078125, 33.9326171875, 34.79443359375, 35.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 200.0, 716.0, 91.0, 0.0, 2.0], "bins": [-305.0229797363281, -299.96630859375, -294.90960693359375, -289.8529357910156, -284.7962646484375, -279.73956298828125, -274.6828918457031, -269.626220703125, -264.56951904296875, -259.5128479003906, -254.45616149902344, -249.39947509765625, -244.34278869628906, -239.28610229492188, -234.22943115234375, -229.17274475097656, -224.11605834960938, -219.0593719482422, -214.00270080566406, -208.94601440429688, -203.8893280029297, -198.8326416015625, -193.77597045898438, -188.7192840576172, -183.66261291503906, -178.60592651367188, -173.54925537109375, -168.49256896972656, -163.43588256835938, -158.3791961669922, -153.32252502441406, -148.26583862304688, -143.2091522216797, -138.1524658203125, -133.09579467773438, -128.0391082763672, -122.982421875, -117.92574310302734, -112.86906433105469, -107.8123779296875, -102.75569152832031, -97.69901275634766, -92.64232635498047, -87.58564758300781, -82.52896118164062, -77.47228240966797, -72.41560363769531, -67.35891723632812, -62.30223846435547, -57.24555587768555, -52.188873291015625, -47.13219451904297, -42.07550811767578, -37.018829345703125, -31.962146759033203, -26.90546417236328, -21.84878158569336, -16.792098999023438, -11.735417366027832, -6.678735733032227, -1.6220531463623047, 3.434629440307617, 8.491310119628906, 13.547992706298828, 18.60467529296875]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 11.0, 13.0, 11.0, 8.0, 14.0, 18.0, 18.0, 14.0, 29.0, 28.0, 30.0, 38.0, 39.0, 43.0, 52.0, 47.0, 46.0, 42.0, 48.0, 38.0, 42.0, 34.0, 42.0, 38.0, 32.0, 38.0, 31.0, 25.0, 15.0, 25.0, 20.0, 17.0, 18.0, 8.0, 6.0, 6.0, 8.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.94982147216797, -27.997146606445312, -27.04447364807129, -26.091798782348633, -25.139123916625977, -24.186450958251953, -23.233776092529297, -22.28110122680664, -21.328428268432617, -20.37575340270996, -19.423080444335938, -18.47040557861328, -17.517730712890625, -16.5650577545166, -15.612382888793945, -14.659708976745605, -13.70703411102295, -12.75436019897461, -11.801685333251953, -10.849011421203613, -9.896337509155273, -8.943662643432617, -7.990988731384277, -7.0383148193359375, -6.0856404304504395, -5.132966041564941, -4.180292129516602, -3.2276177406311035, -2.2749435901641846, -1.3222694396972656, -0.3695950508117676, 0.5830788612365723, 1.5357532501220703, 2.4884274005889893, 3.441101551055908, 4.393775939941406, 5.346449851989746, 6.299124240875244, 7.251798629760742, 8.204472541809082, 9.157146453857422, 10.109820365905762, 11.062495231628418, 12.015169143676758, 12.967843055725098, 13.920516967773438, 14.873191833496094, 15.825865745544434, 16.778541564941406, 17.731216430664062, 18.683889389038086, 19.636564254760742, 20.5892391204834, 21.541912078857422, 22.494586944580078, 23.447261810302734, 24.399934768676758, 25.352609634399414, 26.305282592773438, 27.257957458496094, 28.21063232421875, 29.163305282592773, 30.11598014831543, 31.068653106689453, 32.02132797241211]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 13.0, 7.0, 9.0, 14.0, 18.0, 21.0, 16.0, 25.0, 39.0, 43.0, 25.0, 45.0, 42.0, 37.0, 52.0, 39.0, 65.0, 50.0, 43.0, 48.0, 38.0, 40.0, 33.0, 31.0, 27.0, 26.0, 24.0, 17.0, 28.0, 17.0, 10.0, 16.0, 3.0, 7.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.2890625, -4.16485595703125, -4.0406494140625, -3.91644287109375, -3.792236328125, -3.66802978515625, -3.5438232421875, -3.41961669921875, -3.29541015625, -3.17120361328125, -3.0469970703125, -2.92279052734375, -2.798583984375, -2.67437744140625, -2.5501708984375, -2.42596435546875, -2.3017578125, -2.17755126953125, -2.0533447265625, -1.92913818359375, -1.804931640625, -1.68072509765625, -1.5565185546875, -1.43231201171875, -1.30810546875, -1.18389892578125, -1.0596923828125, -0.93548583984375, -0.811279296875, -0.68707275390625, -0.5628662109375, -0.43865966796875, -0.314453125, -0.19024658203125, -0.0660400390625, 0.05816650390625, 0.182373046875, 0.30657958984375, 0.4307861328125, 0.55499267578125, 0.67919921875, 0.80340576171875, 0.9276123046875, 1.05181884765625, 1.176025390625, 1.30023193359375, 1.4244384765625, 1.54864501953125, 1.6728515625, 1.79705810546875, 1.9212646484375, 2.04547119140625, 2.169677734375, 2.29388427734375, 2.4180908203125, 2.54229736328125, 2.66650390625, 2.79071044921875, 2.9149169921875, 3.03912353515625, 3.163330078125, 3.28753662109375, 3.4117431640625, 3.53594970703125, 3.66015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 11.0, 15.0, 16.0, 26.0, 26.0, 40.0, 65.0, 111.0, 145.0, 224.0, 346.0, 637.0, 1069.0, 1867.0, 3475.0, 6897.0, 15332.0, 39470.0, 173760.0, 1586846.0, 2057125.0, 227335.0, 45902.0, 16956.0, 7757.0, 3805.0, 2019.0, 1164.0, 678.0, 410.0, 255.0, 170.0, 100.0, 60.0, 47.0, 33.0, 24.0, 16.0, 14.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-8.8125, -8.56817626953125, -8.3238525390625, -8.07952880859375, -7.835205078125, -7.59088134765625, -7.3465576171875, -7.10223388671875, -6.85791015625, -6.61358642578125, -6.3692626953125, -6.12493896484375, -5.880615234375, -5.63629150390625, -5.3919677734375, -5.14764404296875, -4.9033203125, -4.65899658203125, -4.4146728515625, -4.17034912109375, -3.926025390625, -3.68170166015625, -3.4373779296875, -3.19305419921875, -2.94873046875, -2.70440673828125, -2.4600830078125, -2.21575927734375, -1.971435546875, -1.72711181640625, -1.4827880859375, -1.23846435546875, -0.994140625, -0.74981689453125, -0.5054931640625, -0.26116943359375, -0.016845703125, 0.22747802734375, 0.4718017578125, 0.71612548828125, 0.96044921875, 1.20477294921875, 1.4490966796875, 1.69342041015625, 1.937744140625, 2.18206787109375, 2.4263916015625, 2.67071533203125, 2.9150390625, 3.15936279296875, 3.4036865234375, 3.64801025390625, 3.892333984375, 4.13665771484375, 4.3809814453125, 4.62530517578125, 4.86962890625, 5.11395263671875, 5.3582763671875, 5.60260009765625, 5.846923828125, 6.09124755859375, 6.3355712890625, 6.57989501953125, 6.82421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 9.0, 6.0, 12.0, 14.0, 23.0, 34.0, 34.0, 39.0, 47.0, 75.0, 83.0, 139.0, 251.0, 398.0, 590.0, 774.0, 524.0, 347.0, 201.0, 123.0, 79.0, 84.0, 38.0, 31.0, 32.0, 20.0, 15.0, 11.0, 3.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.6162109375, -7.373046875, -7.1298828125, -6.88671875, -6.6435546875, -6.400390625, -6.1572265625, -5.9140625, -5.6708984375, -5.427734375, -5.1845703125, -4.94140625, -4.6982421875, -4.455078125, -4.2119140625, -3.96875, -3.7255859375, -3.482421875, -3.2392578125, -2.99609375, -2.7529296875, -2.509765625, -2.2666015625, -2.0234375, -1.7802734375, -1.537109375, -1.2939453125, -1.05078125, -0.8076171875, -0.564453125, -0.3212890625, -0.078125, 0.1650390625, 0.408203125, 0.6513671875, 0.89453125, 1.1376953125, 1.380859375, 1.6240234375, 1.8671875, 2.1103515625, 2.353515625, 2.5966796875, 2.83984375, 3.0830078125, 3.326171875, 3.5693359375, 3.8125, 4.0556640625, 4.298828125, 4.5419921875, 4.78515625, 5.0283203125, 5.271484375, 5.5146484375, 5.7578125, 6.0009765625, 6.244140625, 6.4873046875, 6.73046875, 6.9736328125, 7.216796875, 7.4599609375, 7.703125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 2.0, 10.0, 16.0, 20.0, 38.0, 17.0, 31.0, 74.0, 92.0, 100.0, 227.0, 707.0, 6785.0, 465423.0, 3699645.0, 18995.0, 1284.0, 288.0, 136.0, 82.0, 63.0, 51.0, 35.0, 33.0, 28.0, 22.0, 15.0, 9.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.53125, -39.27099609375, -38.0107421875, -36.75048828125, -35.490234375, -34.22998046875, -32.9697265625, -31.70947265625, -30.44921875, -29.18896484375, -27.9287109375, -26.66845703125, -25.408203125, -24.14794921875, -22.8876953125, -21.62744140625, -20.3671875, -19.10693359375, -17.8466796875, -16.58642578125, -15.326171875, -14.06591796875, -12.8056640625, -11.54541015625, -10.28515625, -9.02490234375, -7.7646484375, -6.50439453125, -5.244140625, -3.98388671875, -2.7236328125, -1.46337890625, -0.203125, 1.05712890625, 2.3173828125, 3.57763671875, 4.837890625, 6.09814453125, 7.3583984375, 8.61865234375, 9.87890625, 11.13916015625, 12.3994140625, 13.65966796875, 14.919921875, 16.18017578125, 17.4404296875, 18.70068359375, 19.9609375, 21.22119140625, 22.4814453125, 23.74169921875, 25.001953125, 26.26220703125, 27.5224609375, 28.78271484375, 30.04296875, 31.30322265625, 32.5634765625, 33.82373046875, 35.083984375, 36.34423828125, 37.6044921875, 38.86474609375, 40.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 17.0, 17.0, 56.0, 83.0, 131.0, 173.0, 182.0, 145.0, 101.0, 53.0, 24.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.73108673095703, -54.26681137084961, -52.80253982543945, -51.33826446533203, -49.873992919921875, -48.40971755981445, -46.94544219970703, -45.481170654296875, -44.01689910888672, -42.5526237487793, -41.08835220336914, -39.62407684326172, -38.15980529785156, -36.69552993774414, -35.23125457763672, -33.76698303222656, -32.30270767211914, -30.83843421936035, -29.374160766601562, -27.90988540649414, -26.445613861083984, -24.981338500976562, -23.517065048217773, -22.052791595458984, -20.588518142700195, -19.124244689941406, -17.659971237182617, -16.195697784423828, -14.731423377990723, -13.267149925231934, -11.802875518798828, -10.338602066040039, -8.874324798583984, -7.410051345825195, -5.945777416229248, -4.481503486633301, -3.0172300338745117, -1.5529565811157227, -0.08868217468261719, 1.3755912780761719, 2.839864730834961, 4.30413818359375, 5.768412113189697, 7.2326860427856445, 8.696959495544434, 10.161232948303223, 11.625507354736328, 13.089780807495117, 14.554054260253906, 16.018327713012695, 17.482601165771484, 18.946876525878906, 20.411148071289062, 21.875423431396484, 23.339696884155273, 24.803970336914062, 26.26824378967285, 27.73251724243164, 29.19679069519043, 30.66106414794922, 32.12533950805664, 33.5896110534668, 35.05388641357422, 36.518157958984375, 37.9824333190918]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 5.0, 8.0, 20.0, 11.0, 19.0, 15.0, 17.0, 18.0, 32.0, 46.0, 41.0, 41.0, 34.0, 36.0, 37.0, 54.0, 42.0, 46.0, 40.0, 42.0, 43.0, 40.0, 32.0, 39.0, 26.0, 25.0, 21.0, 30.0, 14.0, 20.0, 19.0, 7.0, 20.0, 15.0, 6.0, 5.0, 9.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.172319412231445, -21.4759464263916, -20.77957534790039, -20.083202362060547, -19.386831283569336, -18.690458297729492, -17.99408721923828, -17.297714233398438, -16.601341247558594, -15.904969215393066, -15.208597183227539, -14.512224197387695, -13.815853118896484, -13.11948013305664, -12.423108100891113, -11.726736068725586, -11.030364990234375, -10.333992958068848, -9.63762092590332, -8.941247940063477, -8.244876861572266, -7.54850435256958, -6.8521318435668945, -6.155759811401367, -5.45938777923584, -4.7630157470703125, -4.066643714904785, -3.3702712059020996, -2.6738991737365723, -1.977527141571045, -1.2811546325683594, -0.584782600402832, 0.11159133911132812, 0.807963490486145, 1.504335641860962, 2.2007079124450684, 2.8970799446105957, 3.593451976776123, 4.289824485778809, 4.986196517944336, 5.682568550109863, 6.378940582275391, 7.075312614440918, 7.7716851234436035, 8.468057632446289, 9.1644287109375, 9.860801696777344, 10.557173728942871, 11.253545761108398, 11.949917793273926, 12.646289825439453, 13.342662811279297, 14.039033889770508, 14.735406875610352, 15.431778907775879, 16.128150939941406, 16.82452392578125, 17.520896911621094, 18.217267990112305, 18.91364097595215, 19.61001205444336, 20.306385040283203, 21.002758026123047, 21.699129104614258, 22.39550018310547]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 17.0, 6.0, 18.0, 16.0, 16.0, 28.0, 31.0, 33.0, 31.0, 34.0, 40.0, 39.0, 35.0, 39.0, 54.0, 39.0, 42.0, 36.0, 58.0, 38.0, 48.0, 33.0, 39.0, 28.0, 23.0, 28.0, 20.0, 18.0, 14.0, 11.0, 12.0, 7.0, 12.0, 6.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.23089599609375, -3.1180419921875, -3.00518798828125, -2.892333984375, -2.77947998046875, -2.6666259765625, -2.55377197265625, -2.44091796875, -2.32806396484375, -2.2152099609375, -2.10235595703125, -1.989501953125, -1.87664794921875, -1.7637939453125, -1.65093994140625, -1.5380859375, -1.42523193359375, -1.3123779296875, -1.19952392578125, -1.086669921875, -0.97381591796875, -0.8609619140625, -0.74810791015625, -0.63525390625, -0.52239990234375, -0.4095458984375, -0.29669189453125, -0.183837890625, -0.07098388671875, 0.0418701171875, 0.15472412109375, 0.267578125, 0.38043212890625, 0.4932861328125, 0.60614013671875, 0.718994140625, 0.83184814453125, 0.9447021484375, 1.05755615234375, 1.17041015625, 1.28326416015625, 1.3961181640625, 1.50897216796875, 1.621826171875, 1.73468017578125, 1.8475341796875, 1.96038818359375, 2.0732421875, 2.18609619140625, 2.2989501953125, 2.41180419921875, 2.524658203125, 2.63751220703125, 2.7503662109375, 2.86322021484375, 2.97607421875, 3.08892822265625, 3.2017822265625, 3.31463623046875, 3.427490234375, 3.54034423828125, 3.6531982421875, 3.76605224609375, 3.87890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 13.0, 13.0, 33.0, 47.0, 107.0, 213.0, 442.0, 950.0, 2286.0, 6374.0, 27335.0, 222177.0, 690795.0, 77704.0, 13288.0, 3932.0, 1534.0, 697.0, 303.0, 154.0, 68.0, 37.0, 23.0, 13.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.55487060546875, -4.4417724609375, -4.32867431640625, -4.215576171875, -4.10247802734375, -3.9893798828125, -3.87628173828125, -3.76318359375, -3.65008544921875, -3.5369873046875, -3.42388916015625, -3.310791015625, -3.19769287109375, -3.0845947265625, -2.97149658203125, -2.8583984375, -2.74530029296875, -2.6322021484375, -2.51910400390625, -2.406005859375, -2.29290771484375, -2.1798095703125, -2.06671142578125, -1.95361328125, -1.84051513671875, -1.7274169921875, -1.61431884765625, -1.501220703125, -1.38812255859375, -1.2750244140625, -1.16192626953125, -1.048828125, -0.93572998046875, -0.8226318359375, -0.70953369140625, -0.596435546875, -0.48333740234375, -0.3702392578125, -0.25714111328125, -0.14404296875, -0.03094482421875, 0.0821533203125, 0.19525146484375, 0.308349609375, 0.42144775390625, 0.5345458984375, 0.64764404296875, 0.7607421875, 0.87384033203125, 0.9869384765625, 1.10003662109375, 1.213134765625, 1.32623291015625, 1.4393310546875, 1.55242919921875, 1.66552734375, 1.77862548828125, 1.8917236328125, 2.00482177734375, 2.117919921875, 2.23101806640625, 2.3441162109375, 2.45721435546875, 2.5703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 10.0, 17.0, 9.0, 12.0, 12.0, 16.0, 29.0, 22.0, 26.0, 28.0, 28.0, 26.0, 40.0, 44.0, 36.0, 49.0, 35.0, 31.0, 1063.0, 44.0, 32.0, 33.0, 37.0, 33.0, 27.0, 31.0, 29.0, 27.0, 21.0, 31.0, 20.0, 12.0, 14.0, 19.0, 10.0, 4.0, 3.0, 9.0, 9.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.720703125, -2.641082763671875, -2.56146240234375, -2.481842041015625, -2.4022216796875, -2.322601318359375, -2.24298095703125, -2.163360595703125, -2.083740234375, -2.004119873046875, -1.92449951171875, -1.844879150390625, -1.7652587890625, -1.685638427734375, -1.60601806640625, -1.526397705078125, -1.44677734375, -1.367156982421875, -1.28753662109375, -1.207916259765625, -1.1282958984375, -1.048675537109375, -0.96905517578125, -0.889434814453125, -0.809814453125, -0.730194091796875, -0.65057373046875, -0.570953369140625, -0.4913330078125, -0.411712646484375, -0.33209228515625, -0.252471923828125, -0.1728515625, -0.093231201171875, -0.01361083984375, 0.066009521484375, 0.1456298828125, 0.225250244140625, 0.30487060546875, 0.384490966796875, 0.464111328125, 0.543731689453125, 0.62335205078125, 0.702972412109375, 0.7825927734375, 0.862213134765625, 0.94183349609375, 1.021453857421875, 1.10107421875, 1.180694580078125, 1.26031494140625, 1.339935302734375, 1.4195556640625, 1.499176025390625, 1.57879638671875, 1.658416748046875, 1.738037109375, 1.817657470703125, 1.89727783203125, 1.976898193359375, 2.0565185546875, 2.136138916015625, 2.21575927734375, 2.295379638671875, 2.375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 12.0, 11.0, 13.0, 17.0, 32.0, 55.0, 62.0, 81.0, 107.0, 160.0, 261.0, 394.0, 611.0, 938.0, 1681.0, 2806.0, 5719.0, 12732.0, 36895.0, 166233.0, 1503100.0, 283130.0, 50761.0, 16300.0, 6913.0, 3321.0, 1746.0, 1034.0, 676.0, 437.0, 287.0, 199.0, 124.0, 77.0, 51.0, 42.0, 28.0, 16.0, 12.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5556640625, -1.5093994140625, -1.463134765625, -1.4168701171875, -1.37060546875, -1.3243408203125, -1.278076171875, -1.2318115234375, -1.185546875, -1.1392822265625, -1.093017578125, -1.0467529296875, -1.00048828125, -0.9542236328125, -0.907958984375, -0.8616943359375, -0.8154296875, -0.7691650390625, -0.722900390625, -0.6766357421875, -0.63037109375, -0.5841064453125, -0.537841796875, -0.4915771484375, -0.4453125, -0.3990478515625, -0.352783203125, -0.3065185546875, -0.26025390625, -0.2139892578125, -0.167724609375, -0.1214599609375, -0.0751953125, -0.0289306640625, 0.017333984375, 0.0635986328125, 0.10986328125, 0.1561279296875, 0.202392578125, 0.2486572265625, 0.294921875, 0.3411865234375, 0.387451171875, 0.4337158203125, 0.47998046875, 0.5262451171875, 0.572509765625, 0.6187744140625, 0.6650390625, 0.7113037109375, 0.757568359375, 0.8038330078125, 0.85009765625, 0.8963623046875, 0.942626953125, 0.9888916015625, 1.03515625, 1.0814208984375, 1.127685546875, 1.1739501953125, 1.22021484375, 1.2664794921875, 1.312744140625, 1.3590087890625, 1.4052734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 8.0, 7.0, 3.0, 13.0, 7.0, 13.0, 15.0, 31.0, 78.0, 171.0, 311.0, 147.0, 71.0, 28.0, 25.0, 17.0, 12.0, 7.0, 3.0, 10.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5035934448242188, -0.4852142333984375, -0.46683502197265625, -0.448455810546875, -0.43007659912109375, -0.4116973876953125, -0.39331817626953125, -0.37493896484375, -0.35655975341796875, -0.3381805419921875, -0.31980133056640625, -0.301422119140625, -0.28304290771484375, -0.2646636962890625, -0.24628448486328125, -0.2279052734375, -0.20952606201171875, -0.1911468505859375, -0.17276763916015625, -0.154388427734375, -0.13600921630859375, -0.1176300048828125, -0.09925079345703125, -0.08087158203125, -0.06249237060546875, -0.0441131591796875, -0.02573394775390625, -0.007354736328125, 0.01102447509765625, 0.0294036865234375, 0.04778289794921875, 0.066162109375, 0.08454132080078125, 0.1029205322265625, 0.12129974365234375, 0.139678955078125, 0.15805816650390625, 0.1764373779296875, 0.19481658935546875, 0.21319580078125, 0.23157501220703125, 0.2499542236328125, 0.26833343505859375, 0.286712646484375, 0.30509185791015625, 0.3234710693359375, 0.34185028076171875, 0.3602294921875, 0.37860870361328125, 0.3969879150390625, 0.41536712646484375, 0.433746337890625, 0.45212554931640625, 0.4705047607421875, 0.48888397216796875, 0.50726318359375, 0.5256423950195312, 0.5440216064453125, 0.5624008178710938, 0.580780029296875, 0.5991592407226562, 0.6175384521484375, 0.6359176635742188, 0.654296875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 6.0, 20.0, 24.0, 40.0, 71.0, 183.0, 2126.0, 992771.0, 52037.0, 941.0, 128.0, 65.0, 32.0, 21.0, 16.0, 8.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.921875, -13.5225830078125, -13.123291015625, -12.7239990234375, -12.32470703125, -11.9254150390625, -11.526123046875, -11.1268310546875, -10.7275390625, -10.3282470703125, -9.928955078125, -9.5296630859375, -9.13037109375, -8.7310791015625, -8.331787109375, -7.9324951171875, -7.533203125, -7.1339111328125, -6.734619140625, -6.3353271484375, -5.93603515625, -5.5367431640625, -5.137451171875, -4.7381591796875, -4.3388671875, -3.9395751953125, -3.540283203125, -3.1409912109375, -2.74169921875, -2.3424072265625, -1.943115234375, -1.5438232421875, -1.14453125, -0.7452392578125, -0.345947265625, 0.0533447265625, 0.45263671875, 0.8519287109375, 1.251220703125, 1.6505126953125, 2.0498046875, 2.4490966796875, 2.848388671875, 3.2476806640625, 3.64697265625, 4.0462646484375, 4.445556640625, 4.8448486328125, 5.244140625, 5.6434326171875, 6.042724609375, 6.4420166015625, 6.84130859375, 7.2406005859375, 7.639892578125, 8.0391845703125, 8.4384765625, 8.8377685546875, 9.237060546875, 9.6363525390625, 10.03564453125, 10.4349365234375, 10.834228515625, 11.2335205078125, 11.6328125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 6.0, 3.0, 10.0, 23.0, 26.0, 63.0, 93.0, 157.0, 172.0, 169.0, 117.0, 66.0, 31.0, 30.0, 13.0, 10.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41232261061668396, -0.38766157627105713, -0.3630005717277527, -0.33833953738212585, -0.313678503036499, -0.2890174984931946, -0.26435646414756775, -0.2396954447031021, -0.21503442525863647, -0.19037340581417084, -0.1657123863697052, -0.14105135202407837, -0.11639033257961273, -0.0917293131351471, -0.06706827878952026, -0.042407259345054626, -0.01774623990058899, 0.006914783269166946, 0.03157580643892288, 0.056236833333969116, 0.08089785277843475, 0.10555887222290039, 0.13021990656852722, 0.15488092601299286, 0.1795419454574585, 0.20420296490192413, 0.22886398434638977, 0.2535250186920166, 0.27818602323532104, 0.3028470575809479, 0.3275080919265747, 0.35216909646987915, 0.3768301010131836, 0.4014911353588104, 0.42615213990211487, 0.4508131742477417, 0.47547417879104614, 0.5001351833343506, 0.5247962474822998, 0.5494572520256042, 0.5741182565689087, 0.5987792611122131, 0.6234403252601624, 0.6481013298034668, 0.6727623343467712, 0.6974233388900757, 0.7220844030380249, 0.7467454075813293, 0.7714064717292786, 0.796067476272583, 0.8207285404205322, 0.8453895449638367, 0.8700505495071411, 0.8947116136550903, 0.9193726181983948, 0.9440336227416992, 0.9686946868896484, 0.9933556914329529, 1.0180166959762573, 1.0426777601242065, 1.0673388242721558, 1.0919997692108154, 1.1166608333587646, 1.1413218975067139, 1.1659828424453735]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 4.0, 9.0, 6.0, 14.0, 11.0, 16.0, 15.0, 22.0, 29.0, 19.0, 32.0, 35.0, 26.0, 28.0, 35.0, 46.0, 39.0, 41.0, 36.0, 40.0, 41.0, 35.0, 41.0, 28.0, 44.0, 41.0, 36.0, 30.0, 21.0, 28.0, 19.0, 16.0, 20.0, 19.0, 14.0, 9.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.3948132395744324, -0.383027046918869, -0.37124085426330566, -0.3594546616077423, -0.34766846895217896, -0.3358822464942932, -0.32409605383872986, -0.3123098611831665, -0.30052366852760315, -0.2887374758720398, -0.27695128321647644, -0.2651650905609131, -0.25337886810302734, -0.24159269034862518, -0.22980648279190063, -0.21802029013633728, -0.20623409748077393, -0.19444790482521057, -0.18266171216964722, -0.17087550461292267, -0.15908931195735931, -0.14730311930179596, -0.1355169117450714, -0.12373071908950806, -0.1119445264339447, -0.10015833377838135, -0.0883721336722374, -0.07658593356609344, -0.06479974091053009, -0.05301354452967644, -0.041227348148822784, -0.029441148042678833, -0.01765495538711548, -0.0058687590062618256, 0.005917437374591827, 0.01770363375544548, 0.029489830136299133, 0.041276026517152786, 0.05306222289800644, 0.06484842300415039, 0.07663461565971375, 0.0884208083152771, 0.10020700842142105, 0.111993208527565, 0.12377940118312836, 0.1355655938386917, 0.14735180139541626, 0.15913799405097961, 0.17092418670654297, 0.18271037936210632, 0.19449657201766968, 0.20628277957439423, 0.21806897222995758, 0.22985516488552094, 0.24164137244224548, 0.25342756509780884, 0.2652137577533722, 0.27699995040893555, 0.2887861430644989, 0.30057233572006226, 0.312358558177948, 0.32414475083351135, 0.3359309434890747, 0.34771713614463806, 0.3595033288002014]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 14.0, 11.0, 11.0, 17.0, 20.0, 19.0, 25.0, 25.0, 24.0, 26.0, 28.0, 38.0, 35.0, 28.0, 41.0, 30.0, 51.0, 44.0, 42.0, 45.0, 29.0, 45.0, 34.0, 30.0, 47.0, 31.0, 25.0, 26.0, 14.0, 20.0, 20.0, 10.0, 10.0, 11.0, 10.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.98828125, -2.88323974609375, -2.7781982421875, -2.67315673828125, -2.568115234375, -2.46307373046875, -2.3580322265625, -2.25299072265625, -2.14794921875, -2.04290771484375, -1.9378662109375, -1.83282470703125, -1.727783203125, -1.62274169921875, -1.5177001953125, -1.41265869140625, -1.3076171875, -1.20257568359375, -1.0975341796875, -0.99249267578125, -0.887451171875, -0.78240966796875, -0.6773681640625, -0.57232666015625, -0.46728515625, -0.36224365234375, -0.2572021484375, -0.15216064453125, -0.047119140625, 0.05792236328125, 0.1629638671875, 0.26800537109375, 0.373046875, 0.47808837890625, 0.5831298828125, 0.68817138671875, 0.793212890625, 0.89825439453125, 1.0032958984375, 1.10833740234375, 1.21337890625, 1.31842041015625, 1.4234619140625, 1.52850341796875, 1.633544921875, 1.73858642578125, 1.8436279296875, 1.94866943359375, 2.0537109375, 2.15875244140625, 2.2637939453125, 2.36883544921875, 2.473876953125, 2.57891845703125, 2.6839599609375, 2.78900146484375, 2.89404296875, 2.99908447265625, 3.1041259765625, 3.20916748046875, 3.314208984375, 3.41925048828125, 3.5242919921875, 3.62933349609375, 3.734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 10.0, 22.0, 27.0, 31.0, 58.0, 85.0, 107.0, 172.0, 279.0, 407.0, 611.0, 1036.0, 1718.0, 3095.0, 5687.0, 11369.0, 26765.0, 77764.0, 433051.0, 368740.0, 69230.0, 24608.0, 10827.0, 5469.0, 2932.0, 1718.0, 964.0, 629.0, 370.0, 254.0, 162.0, 112.0, 70.0, 61.0, 31.0, 21.0, 20.0, 10.0, 4.0, 8.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.8046875, -5.64324951171875, -5.4818115234375, -5.32037353515625, -5.158935546875, -4.99749755859375, -4.8360595703125, -4.67462158203125, -4.51318359375, -4.35174560546875, -4.1903076171875, -4.02886962890625, -3.867431640625, -3.70599365234375, -3.5445556640625, -3.38311767578125, -3.2216796875, -3.06024169921875, -2.8988037109375, -2.73736572265625, -2.575927734375, -2.41448974609375, -2.2530517578125, -2.09161376953125, -1.93017578125, -1.76873779296875, -1.6072998046875, -1.44586181640625, -1.284423828125, -1.12298583984375, -0.9615478515625, -0.80010986328125, -0.638671875, -0.47723388671875, -0.3157958984375, -0.15435791015625, 0.007080078125, 0.16851806640625, 0.3299560546875, 0.49139404296875, 0.65283203125, 0.81427001953125, 0.9757080078125, 1.13714599609375, 1.298583984375, 1.46002197265625, 1.6214599609375, 1.78289794921875, 1.9443359375, 2.10577392578125, 2.2672119140625, 2.42864990234375, 2.590087890625, 2.75152587890625, 2.9129638671875, 3.07440185546875, 3.23583984375, 3.39727783203125, 3.5587158203125, 3.72015380859375, 3.881591796875, 4.04302978515625, 4.2044677734375, 4.36590576171875, 4.52734375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 8.0, 14.0, 11.0, 10.0, 17.0, 21.0, 26.0, 31.0, 39.0, 39.0, 39.0, 39.0, 46.0, 63.0, 93.0, 236.0, 1624.0, 208.0, 100.0, 58.0, 47.0, 39.0, 43.0, 32.0, 34.0, 20.0, 22.0, 19.0, 16.0, 9.0, 14.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -10.9981689453125, -10.582275390625, -10.1663818359375, -9.75048828125, -9.3345947265625, -8.918701171875, -8.5028076171875, -8.0869140625, -7.6710205078125, -7.255126953125, -6.8392333984375, -6.42333984375, -6.0074462890625, -5.591552734375, -5.1756591796875, -4.759765625, -4.3438720703125, -3.927978515625, -3.5120849609375, -3.09619140625, -2.6802978515625, -2.264404296875, -1.8485107421875, -1.4326171875, -1.0167236328125, -0.600830078125, -0.1849365234375, 0.23095703125, 0.6468505859375, 1.062744140625, 1.4786376953125, 1.89453125, 2.3104248046875, 2.726318359375, 3.1422119140625, 3.55810546875, 3.9739990234375, 4.389892578125, 4.8057861328125, 5.2216796875, 5.6375732421875, 6.053466796875, 6.4693603515625, 6.88525390625, 7.3011474609375, 7.717041015625, 8.1329345703125, 8.548828125, 8.9647216796875, 9.380615234375, 9.7965087890625, 10.21240234375, 10.6282958984375, 11.044189453125, 11.4600830078125, 11.8759765625, 12.2918701171875, 12.707763671875, 13.1236572265625, 13.53955078125, 13.9554443359375, 14.371337890625, 14.7872314453125, 15.203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 11.0, 24.0, 20.0, 22.0, 22.0, 33.0, 49.0, 79.0, 102.0, 179.0, 493.0, 1866.0, 12365.0, 568579.0, 2538229.0, 19847.0, 2492.0, 607.0, 200.0, 111.0, 76.0, 56.0, 48.0, 36.0, 30.0, 24.0, 17.0, 12.0, 18.0, 7.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.779052734375, -26.96435546875, -26.149658203125, -25.3349609375, -24.520263671875, -23.70556640625, -22.890869140625, -22.076171875, -21.261474609375, -20.44677734375, -19.632080078125, -18.8173828125, -18.002685546875, -17.18798828125, -16.373291015625, -15.55859375, -14.743896484375, -13.92919921875, -13.114501953125, -12.2998046875, -11.485107421875, -10.67041015625, -9.855712890625, -9.041015625, -8.226318359375, -7.41162109375, -6.596923828125, -5.7822265625, -4.967529296875, -4.15283203125, -3.338134765625, -2.5234375, -1.708740234375, -0.89404296875, -0.079345703125, 0.7353515625, 1.550048828125, 2.36474609375, 3.179443359375, 3.994140625, 4.808837890625, 5.62353515625, 6.438232421875, 7.2529296875, 8.067626953125, 8.88232421875, 9.697021484375, 10.51171875, 11.326416015625, 12.14111328125, 12.955810546875, 13.7705078125, 14.585205078125, 15.39990234375, 16.214599609375, 17.029296875, 17.843994140625, 18.65869140625, 19.473388671875, 20.2880859375, 21.102783203125, 21.91748046875, 22.732177734375, 23.546875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [3.0, 8.0, 17.0, 51.0, 139.0, 240.0, 267.0, 175.0, 66.0, 34.0, 15.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.217764377593994, -6.045231819152832, -4.872698783874512, -3.7001659870147705, -2.5276331901550293, -1.355100154876709, -0.18256759643554688, 0.9899649620056152, 2.1624979972839355, 3.3350307941436768, 4.507563591003418, 5.680096626281738, 6.8526291847229, 8.025161743164062, 9.197694778442383, 10.370227813720703, 11.542760848999023, 12.715293884277344, 13.887826919555664, 15.060359001159668, 16.232891082763672, 17.405426025390625, 18.577957153320312, 19.750490188598633, 20.923023223876953, 22.095556259155273, 23.268089294433594, 24.440622329711914, 25.613155364990234, 26.785686492919922, 27.958219528198242, 29.130752563476562, 30.30328369140625, 31.47581672668457, 32.64834976196289, 33.82088088989258, 34.99341583251953, 36.16594696044922, 37.33848190307617, 38.51101303100586, 39.68354797363281, 40.8560791015625, 42.02861404418945, 43.20114517211914, 44.373680114746094, 45.54621124267578, 46.718746185302734, 47.89127731323242, 49.06380844116211, 50.2363395690918, 51.40887451171875, 52.58140563964844, 53.75394058227539, 54.92647171020508, 56.09900665283203, 57.27153778076172, 58.444068908691406, 59.616600036621094, 60.78913497924805, 61.961666107177734, 63.13420104980469, 64.30673217773438, 65.47926330566406, 66.65179443359375, 67.82433319091797]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 9.0, 6.0, 6.0, 8.0, 11.0, 10.0, 18.0, 18.0, 15.0, 21.0, 27.0, 36.0, 28.0, 26.0, 33.0, 36.0, 36.0, 40.0, 40.0, 38.0, 54.0, 37.0, 56.0, 31.0, 38.0, 31.0, 39.0, 25.0, 28.0, 25.0, 22.0, 32.0, 24.0, 12.0, 20.0, 10.0, 5.0, 7.0, 10.0, 11.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-39.971099853515625, -38.82118606567383, -37.67127227783203, -36.5213623046875, -35.3714485168457, -34.221534729003906, -33.07162094116211, -31.921707153320312, -30.77179527282715, -29.62188148498535, -28.471969604492188, -27.32205581665039, -26.172142028808594, -25.02223014831543, -23.872316360473633, -22.72240447998047, -21.572490692138672, -20.422576904296875, -19.27266502380371, -18.122751235961914, -16.97283935546875, -15.822925567626953, -14.673011779785156, -13.523098945617676, -12.373186111450195, -11.223273277282715, -10.073360443115234, -8.923446655273438, -7.773533821105957, -6.623620986938477, -5.473707675933838, -4.323794364929199, -3.173877716064453, -2.0239646434783936, -0.874051570892334, 0.2758615016937256, 1.4257745742797852, 2.5756874084472656, 3.7256007194519043, 4.875514030456543, 6.025426864624023, 7.175339698791504, 8.325252532958984, 9.475166320800781, 10.625079154968262, 11.774991989135742, 12.924905776977539, 14.07481861114502, 15.2247314453125, 16.374645233154297, 17.52455711364746, 18.674470901489258, 19.824382781982422, 20.97429656982422, 22.124210357666016, 23.274124145507812, 24.424036026000977, 25.573949813842773, 26.723861694335938, 27.873775482177734, 29.02368927001953, 30.173601150512695, 31.323514938354492, 32.473426818847656, 33.62334060668945]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 13.0, 8.0, 14.0, 20.0, 24.0, 17.0, 20.0, 25.0, 33.0, 34.0, 28.0, 38.0, 37.0, 30.0, 40.0, 36.0, 41.0, 40.0, 42.0, 45.0, 45.0, 40.0, 39.0, 32.0, 31.0, 28.0, 36.0, 26.0, 13.0, 15.0, 19.0, 14.0, 10.0, 7.0, 11.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.71484375, -3.595703125, -3.4765625, -3.357421875, -3.23828125, -3.119140625, -3.0, -2.880859375, -2.76171875, -2.642578125, -2.5234375, -2.404296875, -2.28515625, -2.166015625, -2.046875, -1.927734375, -1.80859375, -1.689453125, -1.5703125, -1.451171875, -1.33203125, -1.212890625, -1.09375, -0.974609375, -0.85546875, -0.736328125, -0.6171875, -0.498046875, -0.37890625, -0.259765625, -0.140625, -0.021484375, 0.09765625, 0.216796875, 0.3359375, 0.455078125, 0.57421875, 0.693359375, 0.8125, 0.931640625, 1.05078125, 1.169921875, 1.2890625, 1.408203125, 1.52734375, 1.646484375, 1.765625, 1.884765625, 2.00390625, 2.123046875, 2.2421875, 2.361328125, 2.48046875, 2.599609375, 2.71875, 2.837890625, 2.95703125, 3.076171875, 3.1953125, 3.314453125, 3.43359375, 3.552734375, 3.671875, 3.791015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 7.0, 12.0, 18.0, 30.0, 36.0, 58.0, 96.0, 149.0, 232.0, 347.0, 512.0, 887.0, 1247.0, 1871.0, 2994.0, 4831.0, 7747.0, 13456.0, 24074.0, 50770.0, 138139.0, 514330.0, 1583751.0, 1286502.0, 368674.0, 102099.0, 40680.0, 20229.0, 11446.0, 6858.0, 4240.0, 2727.0, 1823.0, 1136.0, 769.0, 505.0, 313.0, 222.0, 146.0, 85.0, 69.0, 62.0, 28.0, 14.0, 13.0, 11.0, 4.0, 8.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.90625, -4.7523193359375, -4.598388671875, -4.4444580078125, -4.29052734375, -4.1365966796875, -3.982666015625, -3.8287353515625, -3.6748046875, -3.5208740234375, -3.366943359375, -3.2130126953125, -3.05908203125, -2.9051513671875, -2.751220703125, -2.5972900390625, -2.443359375, -2.2894287109375, -2.135498046875, -1.9815673828125, -1.82763671875, -1.6737060546875, -1.519775390625, -1.3658447265625, -1.2119140625, -1.0579833984375, -0.904052734375, -0.7501220703125, -0.59619140625, -0.4422607421875, -0.288330078125, -0.1343994140625, 0.01953125, 0.1734619140625, 0.327392578125, 0.4813232421875, 0.63525390625, 0.7891845703125, 0.943115234375, 1.0970458984375, 1.2509765625, 1.4049072265625, 1.558837890625, 1.7127685546875, 1.86669921875, 2.0206298828125, 2.174560546875, 2.3284912109375, 2.482421875, 2.6363525390625, 2.790283203125, 2.9442138671875, 3.09814453125, 3.2520751953125, 3.406005859375, 3.5599365234375, 3.7138671875, 3.8677978515625, 4.021728515625, 4.1756591796875, 4.32958984375, 4.4835205078125, 4.637451171875, 4.7913818359375, 4.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 11.0, 12.0, 19.0, 25.0, 35.0, 50.0, 53.0, 80.0, 97.0, 165.0, 232.0, 387.0, 594.0, 698.0, 533.0, 365.0, 206.0, 143.0, 102.0, 77.0, 40.0, 37.0, 31.0, 20.0, 15.0, 8.0, 6.0, 3.0, 4.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3580322265625, -8.083251953125, -7.8084716796875, -7.53369140625, -7.2589111328125, -6.984130859375, -6.7093505859375, -6.4345703125, -6.1597900390625, -5.885009765625, -5.6102294921875, -5.33544921875, -5.0606689453125, -4.785888671875, -4.5111083984375, -4.236328125, -3.9615478515625, -3.686767578125, -3.4119873046875, -3.13720703125, -2.8624267578125, -2.587646484375, -2.3128662109375, -2.0380859375, -1.7633056640625, -1.488525390625, -1.2137451171875, -0.93896484375, -0.6641845703125, -0.389404296875, -0.1146240234375, 0.16015625, 0.4349365234375, 0.709716796875, 0.9844970703125, 1.25927734375, 1.5340576171875, 1.808837890625, 2.0836181640625, 2.3583984375, 2.6331787109375, 2.907958984375, 3.1827392578125, 3.45751953125, 3.7322998046875, 4.007080078125, 4.2818603515625, 4.556640625, 4.8314208984375, 5.106201171875, 5.3809814453125, 5.65576171875, 5.9305419921875, 6.205322265625, 6.4801025390625, 6.7548828125, 7.0296630859375, 7.304443359375, 7.5792236328125, 7.85400390625, 8.1287841796875, 8.403564453125, 8.6783447265625, 8.953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 4.0, 2.0, 11.0, 9.0, 19.0, 29.0, 38.0, 34.0, 83.0, 123.0, 229.0, 478.0, 1680.0, 13166.0, 797864.0, 3349702.0, 26944.0, 2529.0, 631.0, 265.0, 131.0, 88.0, 55.0, 53.0, 26.0, 24.0, 18.0, 15.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.396484375, -31.35546875, -30.314453125, -29.2734375, -28.232421875, -27.19140625, -26.150390625, -25.109375, -24.068359375, -23.02734375, -21.986328125, -20.9453125, -19.904296875, -18.86328125, -17.822265625, -16.78125, -15.740234375, -14.69921875, -13.658203125, -12.6171875, -11.576171875, -10.53515625, -9.494140625, -8.453125, -7.412109375, -6.37109375, -5.330078125, -4.2890625, -3.248046875, -2.20703125, -1.166015625, -0.125, 0.916015625, 1.95703125, 2.998046875, 4.0390625, 5.080078125, 6.12109375, 7.162109375, 8.203125, 9.244140625, 10.28515625, 11.326171875, 12.3671875, 13.408203125, 14.44921875, 15.490234375, 16.53125, 17.572265625, 18.61328125, 19.654296875, 20.6953125, 21.736328125, 22.77734375, 23.818359375, 24.859375, 25.900390625, 26.94140625, 27.982421875, 29.0234375, 30.064453125, 31.10546875, 32.146484375, 33.1875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 18.0, 80.0, 230.0, 373.0, 238.0, 44.0, 21.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.60581970214844, -123.48200225830078, -120.3581771850586, -117.23435974121094, -114.11053466796875, -110.9867172241211, -107.86289978027344, -104.73907470703125, -101.61524963378906, -98.4914321899414, -95.36760711669922, -92.24378967285156, -89.11996459960938, -85.99614715576172, -82.87232971191406, -79.74850463867188, -76.62468719482422, -73.50086975097656, -70.37704467773438, -67.25322723388672, -64.12940216064453, -61.005584716796875, -57.88176345825195, -54.75794219970703, -51.63412094116211, -48.51029968261719, -45.386478424072266, -42.262657165527344, -39.13883972167969, -36.0150146484375, -32.891197204589844, -29.767375946044922, -26.64354705810547, -23.519725799560547, -20.395904541015625, -17.272085189819336, -14.148263931274414, -11.024442672729492, -7.900623321533203, -4.776802062988281, -1.6529808044433594, 1.4708399772644043, 4.594660758972168, 7.718481063842773, 10.842302322387695, 13.966123580932617, 17.089942932128906, 20.213764190673828, 23.33758544921875, 26.461406707763672, 29.585227966308594, 32.70904541015625, 35.83287048339844, 38.956687927246094, 42.080509185791016, 45.20433044433594, 48.32815170288086, 51.45197296142578, 54.5757942199707, 57.699615478515625, 60.82343292236328, 63.94725799560547, 67.07107543945312, 70.19490051269531, 73.31871795654297]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 1.0, 8.0, 7.0, 19.0, 14.0, 17.0, 23.0, 19.0, 34.0, 19.0, 32.0, 25.0, 39.0, 43.0, 33.0, 42.0, 43.0, 33.0, 45.0, 45.0, 49.0, 43.0, 53.0, 40.0, 34.0, 29.0, 23.0, 29.0, 24.0, 21.0, 17.0, 19.0, 8.0, 8.0, 7.0, 7.0, 4.0, 6.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.01807403564453, -20.24705696105957, -19.476041793823242, -18.70502471923828, -17.934009552001953, -17.162992477416992, -16.39197540283203, -15.620959281921387, -14.849943161010742, -14.078927040100098, -13.307910919189453, -12.536893844604492, -11.765877723693848, -10.994861602783203, -10.223844528198242, -9.452828407287598, -8.681812286376953, -7.910796165466309, -7.139779567718506, -6.368762969970703, -5.597746849060059, -4.826730728149414, -4.055714130401611, -3.2846975326538086, -2.513681411743164, -1.7426650524139404, -0.9716486930847168, -0.20063233375549316, 0.5703840255737305, 1.341400384902954, 2.1124167442321777, 2.8834333419799805, 3.654449462890625, 4.4254655838012695, 5.196482181549072, 5.967498779296875, 6.7385149002075195, 7.509531021118164, 8.280548095703125, 9.05156421661377, 9.822580337524414, 10.593596458435059, 11.364612579345703, 12.135629653930664, 12.906645774841309, 13.677661895751953, 14.448678970336914, 15.219695091247559, 15.990711212158203, 16.761728286743164, 17.532743453979492, 18.303760528564453, 19.07477569580078, 19.845792770385742, 20.616809844970703, 21.38782501220703, 22.158842086791992, 22.929859161376953, 23.70087432861328, 24.471891403198242, 25.242908477783203, 26.01392364501953, 26.784940719604492, 27.555957794189453, 28.32697296142578]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 15.0, 14.0, 9.0, 27.0, 23.0, 24.0, 28.0, 24.0, 18.0, 39.0, 43.0, 41.0, 30.0, 36.0, 49.0, 52.0, 50.0, 44.0, 47.0, 35.0, 43.0, 34.0, 34.0, 26.0, 20.0, 25.0, 21.0, 18.0, 25.0, 15.0, 17.0, 14.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.666748046875, -3.55224609375, -3.437744140625, -3.3232421875, -3.208740234375, -3.09423828125, -2.979736328125, -2.865234375, -2.750732421875, -2.63623046875, -2.521728515625, -2.4072265625, -2.292724609375, -2.17822265625, -2.063720703125, -1.94921875, -1.834716796875, -1.72021484375, -1.605712890625, -1.4912109375, -1.376708984375, -1.26220703125, -1.147705078125, -1.033203125, -0.918701171875, -0.80419921875, -0.689697265625, -0.5751953125, -0.460693359375, -0.34619140625, -0.231689453125, -0.1171875, -0.002685546875, 0.11181640625, 0.226318359375, 0.3408203125, 0.455322265625, 0.56982421875, 0.684326171875, 0.798828125, 0.913330078125, 1.02783203125, 1.142333984375, 1.2568359375, 1.371337890625, 1.48583984375, 1.600341796875, 1.71484375, 1.829345703125, 1.94384765625, 2.058349609375, 2.1728515625, 2.287353515625, 2.40185546875, 2.516357421875, 2.630859375, 2.745361328125, 2.85986328125, 2.974365234375, 3.0888671875, 3.203369140625, 3.31787109375, 3.432373046875, 3.546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 12.0, 24.0, 36.0, 42.0, 45.0, 82.0, 137.0, 273.0, 338.0, 591.0, 1079.0, 2083.0, 4417.0, 10657.0, 31108.0, 147097.0, 640125.0, 157377.0, 32733.0, 10800.0, 4573.0, 2128.0, 1121.0, 634.0, 362.0, 234.0, 137.0, 86.0, 73.0, 41.0, 31.0, 21.0, 12.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.200408935546875, -3.10198974609375, -3.003570556640625, -2.9051513671875, -2.806732177734375, -2.70831298828125, -2.609893798828125, -2.511474609375, -2.413055419921875, -2.31463623046875, -2.216217041015625, -2.1177978515625, -2.019378662109375, -1.92095947265625, -1.822540283203125, -1.72412109375, -1.625701904296875, -1.52728271484375, -1.428863525390625, -1.3304443359375, -1.232025146484375, -1.13360595703125, -1.035186767578125, -0.936767578125, -0.838348388671875, -0.73992919921875, -0.641510009765625, -0.5430908203125, -0.444671630859375, -0.34625244140625, -0.247833251953125, -0.1494140625, -0.050994873046875, 0.04742431640625, 0.145843505859375, 0.2442626953125, 0.342681884765625, 0.44110107421875, 0.539520263671875, 0.637939453125, 0.736358642578125, 0.83477783203125, 0.933197021484375, 1.0316162109375, 1.130035400390625, 1.22845458984375, 1.326873779296875, 1.42529296875, 1.523712158203125, 1.62213134765625, 1.720550537109375, 1.8189697265625, 1.917388916015625, 2.01580810546875, 2.114227294921875, 2.212646484375, 2.311065673828125, 2.40948486328125, 2.507904052734375, 2.6063232421875, 2.704742431640625, 2.80316162109375, 2.901580810546875, 3.0]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 11.0, 10.0, 16.0, 13.0, 20.0, 17.0, 25.0, 21.0, 22.0, 30.0, 33.0, 24.0, 27.0, 44.0, 34.0, 39.0, 1058.0, 46.0, 54.0, 33.0, 36.0, 35.0, 39.0, 36.0, 45.0, 37.0, 25.0, 21.0, 23.0, 17.0, 24.0, 15.0, 11.0, 10.0, 10.0, 7.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.111602783203125, -2.02984619140625, -1.948089599609375, -1.8663330078125, -1.784576416015625, -1.70281982421875, -1.621063232421875, -1.539306640625, -1.457550048828125, -1.37579345703125, -1.294036865234375, -1.2122802734375, -1.130523681640625, -1.04876708984375, -0.967010498046875, -0.88525390625, -0.803497314453125, -0.72174072265625, -0.639984130859375, -0.5582275390625, -0.476470947265625, -0.39471435546875, -0.312957763671875, -0.231201171875, -0.149444580078125, -0.06768798828125, 0.014068603515625, 0.0958251953125, 0.177581787109375, 0.25933837890625, 0.341094970703125, 0.4228515625, 0.504608154296875, 0.58636474609375, 0.668121337890625, 0.7498779296875, 0.831634521484375, 0.91339111328125, 0.995147705078125, 1.076904296875, 1.158660888671875, 1.24041748046875, 1.322174072265625, 1.4039306640625, 1.485687255859375, 1.56744384765625, 1.649200439453125, 1.73095703125, 1.812713623046875, 1.89447021484375, 1.976226806640625, 2.0579833984375, 2.139739990234375, 2.22149658203125, 2.303253173828125, 2.385009765625, 2.466766357421875, 2.54852294921875, 2.630279541015625, 2.7120361328125, 2.793792724609375, 2.87554931640625, 2.957305908203125, 3.0390625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 18.0, 16.0, 27.0, 36.0, 52.0, 52.0, 84.0, 141.0, 234.0, 335.0, 525.0, 901.0, 1542.0, 2788.0, 5153.0, 10731.0, 26888.0, 103292.0, 1543672.0, 320409.0, 47713.0, 16172.0, 7414.0, 3759.0, 2083.0, 1150.0, 700.0, 413.0, 258.0, 186.0, 113.0, 86.0, 47.0, 51.0, 29.0, 11.0, 18.0, 6.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.948394775390625, -1.88702392578125, -1.825653076171875, -1.7642822265625, -1.702911376953125, -1.64154052734375, -1.580169677734375, -1.518798828125, -1.457427978515625, -1.39605712890625, -1.334686279296875, -1.2733154296875, -1.211944580078125, -1.15057373046875, -1.089202880859375, -1.02783203125, -0.966461181640625, -0.90509033203125, -0.843719482421875, -0.7823486328125, -0.720977783203125, -0.65960693359375, -0.598236083984375, -0.536865234375, -0.475494384765625, -0.41412353515625, -0.352752685546875, -0.2913818359375, -0.230010986328125, -0.16864013671875, -0.107269287109375, -0.0458984375, 0.015472412109375, 0.07684326171875, 0.138214111328125, 0.1995849609375, 0.260955810546875, 0.32232666015625, 0.383697509765625, 0.445068359375, 0.506439208984375, 0.56781005859375, 0.629180908203125, 0.6905517578125, 0.751922607421875, 0.81329345703125, 0.874664306640625, 0.93603515625, 0.997406005859375, 1.05877685546875, 1.120147705078125, 1.1815185546875, 1.242889404296875, 1.30426025390625, 1.365631103515625, 1.427001953125, 1.488372802734375, 1.54974365234375, 1.611114501953125, 1.6724853515625, 1.733856201171875, 1.79522705078125, 1.856597900390625, 1.91796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 7.0, 4.0, 14.0, 20.0, 47.0, 99.0, 277.0, 276.0, 117.0, 36.0, 23.0, 15.0, 12.0, 5.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.662109375, -0.6426773071289062, -0.6232452392578125, -0.6038131713867188, -0.584381103515625, -0.5649490356445312, -0.5455169677734375, -0.5260848999023438, -0.50665283203125, -0.48722076416015625, -0.4677886962890625, -0.44835662841796875, -0.428924560546875, -0.40949249267578125, -0.3900604248046875, -0.37062835693359375, -0.3511962890625, -0.33176422119140625, -0.3123321533203125, -0.29290008544921875, -0.273468017578125, -0.25403594970703125, -0.2346038818359375, -0.21517181396484375, -0.19573974609375, -0.17630767822265625, -0.1568756103515625, -0.13744354248046875, -0.118011474609375, -0.09857940673828125, -0.0791473388671875, -0.05971527099609375, -0.040283203125, -0.02085113525390625, -0.0014190673828125, 0.01801300048828125, 0.037445068359375, 0.05687713623046875, 0.0763092041015625, 0.09574127197265625, 0.11517333984375, 0.13460540771484375, 0.1540374755859375, 0.17346954345703125, 0.192901611328125, 0.21233367919921875, 0.2317657470703125, 0.25119781494140625, 0.2706298828125, 0.29006195068359375, 0.3094940185546875, 0.32892608642578125, 0.348358154296875, 0.36779022216796875, 0.3872222900390625, 0.40665435791015625, 0.42608642578125, 0.44551849365234375, 0.4649505615234375, 0.48438262939453125, 0.503814697265625, 0.5232467651367188, 0.5426788330078125, 0.5621109008789062, 0.58154296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 2.0, 8.0, 13.0, 10.0, 24.0, 31.0, 44.0, 143.0, 639.0, 3580.0, 875802.0, 164320.0, 3118.0, 567.0, 105.0, 44.0, 25.0, 18.0, 8.0, 6.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.03125, -10.6630859375, -10.294921875, -9.9267578125, -9.55859375, -9.1904296875, -8.822265625, -8.4541015625, -8.0859375, -7.7177734375, -7.349609375, -6.9814453125, -6.61328125, -6.2451171875, -5.876953125, -5.5087890625, -5.140625, -4.7724609375, -4.404296875, -4.0361328125, -3.66796875, -3.2998046875, -2.931640625, -2.5634765625, -2.1953125, -1.8271484375, -1.458984375, -1.0908203125, -0.72265625, -0.3544921875, 0.013671875, 0.3818359375, 0.75, 1.1181640625, 1.486328125, 1.8544921875, 2.22265625, 2.5908203125, 2.958984375, 3.3271484375, 3.6953125, 4.0634765625, 4.431640625, 4.7998046875, 5.16796875, 5.5361328125, 5.904296875, 6.2724609375, 6.640625, 7.0087890625, 7.376953125, 7.7451171875, 8.11328125, 8.4814453125, 8.849609375, 9.2177734375, 9.5859375, 9.9541015625, 10.322265625, 10.6904296875, 11.05859375, 11.4267578125, 11.794921875, 12.1630859375, 12.53125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 10.0, 13.0, 15.0, 39.0, 52.0, 111.0, 211.0, 257.0, 144.0, 61.0, 44.0, 24.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6177295446395874, -0.5797190070152283, -0.5417084693908691, -0.50369793176651, -0.4656873941421509, -0.42767685651779175, -0.3896663188934326, -0.3516557812690735, -0.31364524364471436, -0.2756347060203552, -0.2376241683959961, -0.19961363077163696, -0.16160309314727783, -0.1235925555229187, -0.08558201789855957, -0.04757148027420044, -0.009560942649841309, 0.028449594974517822, 0.06646013259887695, 0.10447067022323608, 0.14248120784759521, 0.18049174547195435, 0.21850228309631348, 0.2565128207206726, 0.29452335834503174, 0.33253389596939087, 0.37054443359375, 0.40855497121810913, 0.44656550884246826, 0.4845760464668274, 0.5225865840911865, 0.5605971217155457, 0.5986077785491943, 0.6366183161735535, 0.6746288537979126, 0.7126393914222717, 0.7506499290466309, 0.78866046667099, 0.8266710042953491, 0.8646815419197083, 0.9026920795440674, 0.9407026171684265, 0.9787131547927856, 1.0167236328125, 1.054734230041504, 1.0927448272705078, 1.1307553052902222, 1.1687657833099365, 1.2067763805389404, 1.2447869777679443, 1.2827974557876587, 1.320807933807373, 1.358818531036377, 1.3968291282653809, 1.4348396062850952, 1.4728500843048096, 1.5108606815338135, 1.5488712787628174, 1.5868817567825317, 1.624892234802246, 1.66290283203125, 1.700913429260254, 1.7389239072799683, 1.7769343852996826, 1.8149449825286865]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 8.0, 8.0, 8.0, 12.0, 19.0, 19.0, 24.0, 19.0, 20.0, 23.0, 16.0, 31.0, 40.0, 30.0, 35.0, 35.0, 33.0, 41.0, 36.0, 38.0, 35.0, 37.0, 39.0, 37.0, 33.0, 30.0, 28.0, 24.0, 28.0, 15.0, 17.0, 26.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 8.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35305070877075195, -0.3404378592967987, -0.32782498002052307, -0.3152121305465698, -0.3025992512702942, -0.28998640179634094, -0.2773735225200653, -0.26476067304611206, -0.2521477937698364, -0.23953492939472198, -0.22692206501960754, -0.2143092006444931, -0.20169633626937866, -0.18908348679542542, -0.17647060751914978, -0.16385775804519653, -0.1512448936700821, -0.13863202929496765, -0.1260191649198532, -0.11340630054473877, -0.10079343616962433, -0.08818057924509048, -0.07556771486997604, -0.0629548504948616, -0.05034198611974716, -0.03772912174463272, -0.02511625923216343, -0.012503396719694138, 0.00010946765542030334, 0.012722328305244446, 0.025335192680358887, 0.03794805705547333, 0.05056092143058777, 0.06317378580570221, 0.07578665018081665, 0.08839951455593109, 0.10101237893104553, 0.11362523585557938, 0.12623810768127441, 0.13885095715522766, 0.1514638364315033, 0.16407670080661774, 0.17668956518173218, 0.18930242955684662, 0.20191529393196106, 0.2145281434059143, 0.22714102268218994, 0.2397538721561432, 0.25236672163009644, 0.2649795711040497, 0.2775924503803253, 0.29020529985427856, 0.3028181791305542, 0.31543102860450745, 0.3280439078807831, 0.34065675735473633, 0.35326963663101196, 0.3658824861049652, 0.37849536538124084, 0.3911082148551941, 0.4037210941314697, 0.416333943605423, 0.4289468228816986, 0.44155967235565186, 0.4541725516319275]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 10.0, 19.0, 11.0, 22.0, 20.0, 18.0, 25.0, 18.0, 30.0, 31.0, 32.0, 39.0, 38.0, 43.0, 30.0, 44.0, 37.0, 40.0, 47.0, 45.0, 52.0, 46.0, 34.0, 21.0, 25.0, 26.0, 16.0, 30.0, 24.0, 18.0, 14.0, 12.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.541015625, -3.43310546875, -3.3251953125, -3.21728515625, -3.109375, -3.00146484375, -2.8935546875, -2.78564453125, -2.677734375, -2.56982421875, -2.4619140625, -2.35400390625, -2.24609375, -2.13818359375, -2.0302734375, -1.92236328125, -1.814453125, -1.70654296875, -1.5986328125, -1.49072265625, -1.3828125, -1.27490234375, -1.1669921875, -1.05908203125, -0.951171875, -0.84326171875, -0.7353515625, -0.62744140625, -0.51953125, -0.41162109375, -0.3037109375, -0.19580078125, -0.087890625, 0.02001953125, 0.1279296875, 0.23583984375, 0.34375, 0.45166015625, 0.5595703125, 0.66748046875, 0.775390625, 0.88330078125, 0.9912109375, 1.09912109375, 1.20703125, 1.31494140625, 1.4228515625, 1.53076171875, 1.638671875, 1.74658203125, 1.8544921875, 1.96240234375, 2.0703125, 2.17822265625, 2.2861328125, 2.39404296875, 2.501953125, 2.60986328125, 2.7177734375, 2.82568359375, 2.93359375, 3.04150390625, 3.1494140625, 3.25732421875, 3.365234375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 7.0, 11.0, 27.0, 34.0, 55.0, 84.0, 159.0, 205.0, 320.0, 483.0, 753.0, 1251.0, 2051.0, 3504.0, 5985.0, 10574.0, 20265.0, 45513.0, 140850.0, 456701.0, 235080.0, 66329.0, 26841.0, 13250.0, 7390.0, 4140.0, 2566.0, 1489.0, 954.0, 587.0, 354.0, 250.0, 150.0, 90.0, 67.0, 46.0, 43.0, 27.0, 9.0, 15.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.94921875, -5.7672119140625, -5.585205078125, -5.4031982421875, -5.22119140625, -5.0391845703125, -4.857177734375, -4.6751708984375, -4.4931640625, -4.3111572265625, -4.129150390625, -3.9471435546875, -3.76513671875, -3.5831298828125, -3.401123046875, -3.2191162109375, -3.037109375, -2.8551025390625, -2.673095703125, -2.4910888671875, -2.30908203125, -2.1270751953125, -1.945068359375, -1.7630615234375, -1.5810546875, -1.3990478515625, -1.217041015625, -1.0350341796875, -0.85302734375, -0.6710205078125, -0.489013671875, -0.3070068359375, -0.125, 0.0570068359375, 0.239013671875, 0.4210205078125, 0.60302734375, 0.7850341796875, 0.967041015625, 1.1490478515625, 1.3310546875, 1.5130615234375, 1.695068359375, 1.8770751953125, 2.05908203125, 2.2410888671875, 2.423095703125, 2.6051025390625, 2.787109375, 2.9691162109375, 3.151123046875, 3.3331298828125, 3.51513671875, 3.6971435546875, 3.879150390625, 4.0611572265625, 4.2431640625, 4.4251708984375, 4.607177734375, 4.7891845703125, 4.97119140625, 5.1531982421875, 5.335205078125, 5.5172119140625, 5.69921875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 12.0, 14.0, 30.0, 34.0, 35.0, 37.0, 36.0, 63.0, 52.0, 67.0, 88.0, 227.0, 1577.0, 248.0, 89.0, 63.0, 63.0, 49.0, 41.0, 35.0, 30.0, 25.0, 17.0, 23.0, 12.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8851318359375, -11.418701171875, -10.9522705078125, -10.48583984375, -10.0194091796875, -9.552978515625, -9.0865478515625, -8.6201171875, -8.1536865234375, -7.687255859375, -7.2208251953125, -6.75439453125, -6.2879638671875, -5.821533203125, -5.3551025390625, -4.888671875, -4.4222412109375, -3.955810546875, -3.4893798828125, -3.02294921875, -2.5565185546875, -2.090087890625, -1.6236572265625, -1.1572265625, -0.6907958984375, -0.224365234375, 0.2420654296875, 0.70849609375, 1.1749267578125, 1.641357421875, 2.1077880859375, 2.57421875, 3.0406494140625, 3.507080078125, 3.9735107421875, 4.43994140625, 4.9063720703125, 5.372802734375, 5.8392333984375, 6.3056640625, 6.7720947265625, 7.238525390625, 7.7049560546875, 8.17138671875, 8.6378173828125, 9.104248046875, 9.5706787109375, 10.037109375, 10.5035400390625, 10.969970703125, 11.4364013671875, 11.90283203125, 12.3692626953125, 12.835693359375, 13.3021240234375, 13.7685546875, 14.2349853515625, 14.701416015625, 15.1678466796875, 15.63427734375, 16.1007080078125, 16.567138671875, 17.0335693359375, 17.5]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 20.0, 28.0, 28.0, 42.0, 73.0, 86.0, 139.0, 263.0, 542.0, 1650.0, 6831.0, 48085.0, 2506483.0, 550360.0, 24668.0, 4179.0, 1086.0, 448.0, 197.0, 139.0, 87.0, 74.0, 51.0, 27.0, 18.0, 22.0, 9.0, 9.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.03125, -22.40625, -21.78125, -21.15625, -20.53125, -19.90625, -19.28125, -18.65625, -18.03125, -17.40625, -16.78125, -16.15625, -15.53125, -14.90625, -14.28125, -13.65625, -13.03125, -12.40625, -11.78125, -11.15625, -10.53125, -9.90625, -9.28125, -8.65625, -8.03125, -7.40625, -6.78125, -6.15625, -5.53125, -4.90625, -4.28125, -3.65625, -3.03125, -2.40625, -1.78125, -1.15625, -0.53125, 0.09375, 0.71875, 1.34375, 1.96875, 2.59375, 3.21875, 3.84375, 4.46875, 5.09375, 5.71875, 6.34375, 6.96875, 7.59375, 8.21875, 8.84375, 9.46875, 10.09375, 10.71875, 11.34375, 11.96875, 12.59375, 13.21875, 13.84375, 14.46875, 15.09375, 15.71875, 16.34375, 16.96875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 15.0, 59.0, 185.0, 314.0, 251.0, 106.0, 50.0, 14.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46574020385742, -60.84966278076172, -59.23358154296875, -57.61750411987305, -56.00142288208008, -54.385345458984375, -52.769264221191406, -51.1531867980957, -49.537105560302734, -47.92102813720703, -46.30494689941406, -44.68886947631836, -43.07278823852539, -41.45671081542969, -39.84062957763672, -38.224552154541016, -36.60847473144531, -34.99239730834961, -33.37631607055664, -31.760236740112305, -30.14415740966797, -28.528079986572266, -26.911998748779297, -25.295921325683594, -23.679840087890625, -22.06376075744629, -20.447681427001953, -18.831602096557617, -17.21552276611328, -15.599444389343262, -13.983365058898926, -12.36728572845459, -10.751205444335938, -9.135126113891602, -7.519046783447266, -5.902967929840088, -4.286888599395752, -2.670809745788574, -1.0547304153442383, 0.5613489151000977, 2.1774282455444336, 3.7935075759887695, 5.4095869064331055, 7.025665760040283, 8.641744613647461, 10.257823944091797, 11.873903274536133, 13.489982604980469, 15.106061935424805, 16.72214126586914, 18.338220596313477, 19.954299926757812, 21.57037925720215, 23.186458587646484, 24.802536010742188, 26.418617248535156, 28.03469467163086, 29.650774002075195, 31.26685333251953, 32.882930755615234, 34.4990119934082, 36.115089416503906, 37.731170654296875, 39.34724807739258, 40.96332931518555]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 6.0, 10.0, 8.0, 14.0, 11.0, 20.0, 15.0, 11.0, 13.0, 23.0, 23.0, 15.0, 25.0, 30.0, 28.0, 40.0, 37.0, 32.0, 41.0, 46.0, 39.0, 34.0, 34.0, 28.0, 33.0, 34.0, 24.0, 40.0, 29.0, 36.0, 17.0, 29.0, 15.0, 28.0, 22.0, 14.0, 18.0, 12.0, 16.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-30.805992126464844, -29.864938735961914, -28.923887252807617, -27.982833862304688, -27.04178237915039, -26.10072898864746, -25.159677505493164, -24.218624114990234, -23.277572631835938, -22.336519241333008, -21.39546775817871, -20.45441436767578, -19.513362884521484, -18.572309494018555, -17.631258010864258, -16.690204620361328, -15.749152183532715, -14.808099746704102, -13.867047309875488, -12.925994873046875, -11.984942436218262, -11.043889999389648, -10.102836608886719, -9.161785125732422, -8.220731735229492, -7.279679298400879, -6.338626861572266, -5.397574424743652, -4.456521987915039, -3.5154690742492676, -2.5744166374206543, -1.633364200592041, -0.6923122406005859, 0.24874025583267212, 1.1897927522659302, 2.130845308303833, 3.0718977451324463, 4.012950420379639, 4.954002857208252, 5.895055294036865, 6.8361077308654785, 7.777160167694092, 8.718213081359863, 9.659265518188477, 10.60031795501709, 11.541370391845703, 12.482422828674316, 13.42347526550293, 14.364527702331543, 15.305580139160156, 16.246633529663086, 17.187685012817383, 18.128738403320312, 19.06978988647461, 20.01084327697754, 20.951894760131836, 21.892948150634766, 22.834001541137695, 23.775053024291992, 24.716106414794922, 25.65715789794922, 26.59821128845215, 27.539262771606445, 28.480316162109375, 29.421367645263672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 10.0, 6.0, 8.0, 9.0, 11.0, 14.0, 15.0, 15.0, 18.0, 26.0, 29.0, 20.0, 31.0, 20.0, 37.0, 34.0, 45.0, 43.0, 51.0, 49.0, 50.0, 39.0, 37.0, 35.0, 43.0, 39.0, 27.0, 33.0, 29.0, 27.0, 26.0, 16.0, 22.0, 11.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.822265625, -3.706298828125, -3.59033203125, -3.474365234375, -3.3583984375, -3.242431640625, -3.12646484375, -3.010498046875, -2.89453125, -2.778564453125, -2.66259765625, -2.546630859375, -2.4306640625, -2.314697265625, -2.19873046875, -2.082763671875, -1.966796875, -1.850830078125, -1.73486328125, -1.618896484375, -1.5029296875, -1.386962890625, -1.27099609375, -1.155029296875, -1.0390625, -0.923095703125, -0.80712890625, -0.691162109375, -0.5751953125, -0.459228515625, -0.34326171875, -0.227294921875, -0.111328125, 0.004638671875, 0.12060546875, 0.236572265625, 0.3525390625, 0.468505859375, 0.58447265625, 0.700439453125, 0.81640625, 0.932373046875, 1.04833984375, 1.164306640625, 1.2802734375, 1.396240234375, 1.51220703125, 1.628173828125, 1.744140625, 1.860107421875, 1.97607421875, 2.092041015625, 2.2080078125, 2.323974609375, 2.43994140625, 2.555908203125, 2.671875, 2.787841796875, 2.90380859375, 3.019775390625, 3.1357421875, 3.251708984375, 3.36767578125, 3.483642578125, 3.599609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 12.0, 12.0, 21.0, 39.0, 50.0, 72.0, 96.0, 122.0, 206.0, 304.0, 416.0, 626.0, 1091.0, 1907.0, 3450.0, 7515.0, 16705.0, 43227.0, 177252.0, 1437154.0, 2130138.0, 280435.0, 55451.0, 19836.0, 8627.0, 3962.0, 2136.0, 1225.0, 726.0, 469.0, 291.0, 194.0, 148.0, 120.0, 62.0, 46.0, 36.0, 30.0, 14.0, 10.0, 9.0, 11.0, 11.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.3936767578125, -6.166259765625, -5.9388427734375, -5.71142578125, -5.4840087890625, -5.256591796875, -5.0291748046875, -4.8017578125, -4.5743408203125, -4.346923828125, -4.1195068359375, -3.89208984375, -3.6646728515625, -3.437255859375, -3.2098388671875, -2.982421875, -2.7550048828125, -2.527587890625, -2.3001708984375, -2.07275390625, -1.8453369140625, -1.617919921875, -1.3905029296875, -1.1630859375, -0.9356689453125, -0.708251953125, -0.4808349609375, -0.25341796875, -0.0260009765625, 0.201416015625, 0.4288330078125, 0.65625, 0.8836669921875, 1.111083984375, 1.3385009765625, 1.56591796875, 1.7933349609375, 2.020751953125, 2.2481689453125, 2.4755859375, 2.7030029296875, 2.930419921875, 3.1578369140625, 3.38525390625, 3.6126708984375, 3.840087890625, 4.0675048828125, 4.294921875, 4.5223388671875, 4.749755859375, 4.9771728515625, 5.20458984375, 5.4320068359375, 5.659423828125, 5.8868408203125, 6.1142578125, 6.3416748046875, 6.569091796875, 6.7965087890625, 7.02392578125, 7.2513427734375, 7.478759765625, 7.7061767578125, 7.93359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 11.0, 7.0, 7.0, 12.0, 9.0, 19.0, 24.0, 29.0, 25.0, 42.0, 58.0, 90.0, 90.0, 106.0, 163.0, 221.0, 410.0, 564.0, 614.0, 476.0, 290.0, 218.0, 156.0, 106.0, 71.0, 55.0, 46.0, 43.0, 23.0, 24.0, 11.0, 10.0, 7.0, 5.0, 3.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.84765625, -7.64752197265625, -7.4473876953125, -7.24725341796875, -7.047119140625, -6.84698486328125, -6.6468505859375, -6.44671630859375, -6.24658203125, -6.04644775390625, -5.8463134765625, -5.64617919921875, -5.446044921875, -5.24591064453125, -5.0457763671875, -4.84564208984375, -4.6455078125, -4.44537353515625, -4.2452392578125, -4.04510498046875, -3.844970703125, -3.64483642578125, -3.4447021484375, -3.24456787109375, -3.04443359375, -2.84429931640625, -2.6441650390625, -2.44403076171875, -2.243896484375, -2.04376220703125, -1.8436279296875, -1.64349365234375, -1.443359375, -1.24322509765625, -1.0430908203125, -0.84295654296875, -0.642822265625, -0.44268798828125, -0.2425537109375, -0.04241943359375, 0.15771484375, 0.35784912109375, 0.5579833984375, 0.75811767578125, 0.958251953125, 1.15838623046875, 1.3585205078125, 1.55865478515625, 1.7587890625, 1.95892333984375, 2.1590576171875, 2.35919189453125, 2.559326171875, 2.75946044921875, 2.9595947265625, 3.15972900390625, 3.35986328125, 3.55999755859375, 3.7601318359375, 3.96026611328125, 4.160400390625, 4.36053466796875, 4.5606689453125, 4.76080322265625, 4.9609375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 9.0, 12.0, 17.0, 24.0, 37.0, 50.0, 66.0, 113.0, 130.0, 249.0, 523.0, 2178.0, 15399.0, 269974.0, 3772044.0, 121885.0, 9031.0, 1373.0, 425.0, 207.0, 142.0, 108.0, 58.0, 49.0, 32.0, 27.0, 23.0, 17.0, 13.0, 8.0, 4.0, 12.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.236572265625, -17.48876953125, -16.740966796875, -15.9931640625, -15.245361328125, -14.49755859375, -13.749755859375, -13.001953125, -12.254150390625, -11.50634765625, -10.758544921875, -10.0107421875, -9.262939453125, -8.51513671875, -7.767333984375, -7.01953125, -6.271728515625, -5.52392578125, -4.776123046875, -4.0283203125, -3.280517578125, -2.53271484375, -1.784912109375, -1.037109375, -0.289306640625, 0.45849609375, 1.206298828125, 1.9541015625, 2.701904296875, 3.44970703125, 4.197509765625, 4.9453125, 5.693115234375, 6.44091796875, 7.188720703125, 7.9365234375, 8.684326171875, 9.43212890625, 10.179931640625, 10.927734375, 11.675537109375, 12.42333984375, 13.171142578125, 13.9189453125, 14.666748046875, 15.41455078125, 16.162353515625, 16.91015625, 17.657958984375, 18.40576171875, 19.153564453125, 19.9013671875, 20.649169921875, 21.39697265625, 22.144775390625, 22.892578125, 23.640380859375, 24.38818359375, 25.135986328125, 25.8837890625, 26.631591796875, 27.37939453125, 28.127197265625, 28.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 32.0, 97.0, 250.0, 348.0, 201.0, 66.0, 11.0, 6.0], "bins": [-150.67547607421875, -148.13961791992188, -145.603759765625, -143.0679168701172, -140.5320587158203, -137.99620056152344, -135.46034240722656, -132.9244842529297, -130.38864135742188, -127.852783203125, -125.31693267822266, -122.78107452392578, -120.24522399902344, -117.70936584472656, -115.17350769042969, -112.63765716552734, -110.10179138183594, -107.56593322753906, -105.03008270263672, -102.49422454833984, -99.9583740234375, -97.42251586914062, -94.88665771484375, -92.3508071899414, -89.81495666503906, -87.27909851074219, -84.74324798583984, -82.20738983154297, -79.67153930664062, -77.13568115234375, -74.59982299804688, -72.06397247314453, -69.52810668945312, -66.99224853515625, -64.4563980102539, -61.92053985595703, -59.38468551635742, -56.84883117675781, -54.3129768371582, -51.777122497558594, -49.24127197265625, -46.70541763305664, -44.16956329345703, -41.633705139160156, -39.09785079956055, -36.56199645996094, -34.02614212036133, -31.490285873413086, -28.954429626464844, -26.418575286865234, -23.882719039916992, -21.346864700317383, -18.81100845336914, -16.27515411376953, -13.739299774169922, -11.20344352722168, -8.66758918762207, -6.1317338943481445, -3.595879077911377, -1.0600242614746094, 1.4758310317993164, 4.011686325073242, 6.547540664672852, 9.083396911621094, 11.619251251220703]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 7.0, 5.0, 11.0, 13.0, 22.0, 19.0, 29.0, 30.0, 22.0, 31.0, 44.0, 43.0, 33.0, 38.0, 42.0, 44.0, 38.0, 31.0, 50.0, 47.0, 38.0, 45.0, 40.0, 27.0, 34.0, 25.0, 33.0, 21.0, 25.0, 19.0, 26.0, 12.0, 14.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.054899215698242, -26.296161651611328, -25.537424087524414, -24.7786865234375, -24.019948959350586, -23.261211395263672, -22.502471923828125, -21.74373435974121, -20.984996795654297, -20.226259231567383, -19.46752166748047, -18.708784103393555, -17.95004653930664, -17.191307067871094, -16.432571411132812, -15.673831939697266, -14.915095329284668, -14.156357765197754, -13.39762020111084, -12.63888168334961, -11.880144119262695, -11.121406555175781, -10.362668991088867, -9.603931427001953, -8.845193862915039, -8.086456298828125, -7.327718257904053, -6.568980693817139, -5.810242652893066, -5.051505088806152, -4.292767524719238, -3.534029483795166, -2.7752914428710938, -2.0165536403656006, -1.257815957069397, -0.49907827377319336, 0.2596595287322998, 1.018397331237793, 1.777134895324707, 2.5358729362487793, 3.2946105003356934, 4.053348064422607, 4.81208610534668, 5.570823669433594, 6.329561233520508, 7.08829927444458, 7.847036838531494, 8.605774879455566, 9.36451244354248, 10.123250007629395, 10.881987571716309, 11.640726089477539, 12.399463653564453, 13.158201217651367, 13.916938781738281, 14.675676345825195, 15.43441390991211, 16.193151473999023, 16.951889038085938, 17.71062660217285, 18.469364166259766, 19.228103637695312, 19.986839294433594, 20.74557876586914, 21.504316329956055]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 2.0, 6.0, 4.0, 13.0, 14.0, 11.0, 11.0, 17.0, 20.0, 20.0, 35.0, 25.0, 18.0, 34.0, 27.0, 42.0, 35.0, 47.0, 35.0, 58.0, 48.0, 38.0, 43.0, 43.0, 43.0, 31.0, 35.0, 32.0, 35.0, 23.0, 25.0, 23.0, 21.0, 15.0, 9.0, 7.0, 7.0, 8.0, 4.0, 5.0, 6.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.453125, -3.338043212890625, -3.22296142578125, -3.107879638671875, -2.9927978515625, -2.877716064453125, -2.76263427734375, -2.647552490234375, -2.532470703125, -2.417388916015625, -2.30230712890625, -2.187225341796875, -2.0721435546875, -1.957061767578125, -1.84197998046875, -1.726898193359375, -1.61181640625, -1.496734619140625, -1.38165283203125, -1.266571044921875, -1.1514892578125, -1.036407470703125, -0.92132568359375, -0.806243896484375, -0.691162109375, -0.576080322265625, -0.46099853515625, -0.345916748046875, -0.2308349609375, -0.115753173828125, -0.00067138671875, 0.114410400390625, 0.2294921875, 0.344573974609375, 0.45965576171875, 0.574737548828125, 0.6898193359375, 0.804901123046875, 0.91998291015625, 1.035064697265625, 1.150146484375, 1.265228271484375, 1.38031005859375, 1.495391845703125, 1.6104736328125, 1.725555419921875, 1.84063720703125, 1.955718994140625, 2.07080078125, 2.185882568359375, 2.30096435546875, 2.416046142578125, 2.5311279296875, 2.646209716796875, 2.76129150390625, 2.876373291015625, 2.991455078125, 3.106536865234375, 3.22161865234375, 3.336700439453125, 3.4517822265625, 3.566864013671875, 3.68194580078125, 3.797027587890625, 3.912109375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 16.0, 24.0, 28.0, 42.0, 56.0, 61.0, 101.0, 128.0, 204.0, 262.0, 306.0, 483.0, 659.0, 959.0, 1494.0, 2259.0, 4016.0, 9393.0, 41793.0, 493535.0, 435727.0, 37489.0, 8716.0, 3872.0, 2259.0, 1336.0, 967.0, 653.0, 469.0, 312.0, 250.0, 170.0, 127.0, 96.0, 60.0, 59.0, 42.0, 36.0, 22.0, 16.0, 14.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.58984375, -2.5062255859375, -2.422607421875, -2.3389892578125, -2.25537109375, -2.1717529296875, -2.088134765625, -2.0045166015625, -1.9208984375, -1.8372802734375, -1.753662109375, -1.6700439453125, -1.58642578125, -1.5028076171875, -1.419189453125, -1.3355712890625, -1.251953125, -1.1683349609375, -1.084716796875, -1.0010986328125, -0.91748046875, -0.8338623046875, -0.750244140625, -0.6666259765625, -0.5830078125, -0.4993896484375, -0.415771484375, -0.3321533203125, -0.24853515625, -0.1649169921875, -0.081298828125, 0.0023193359375, 0.0859375, 0.1695556640625, 0.253173828125, 0.3367919921875, 0.42041015625, 0.5040283203125, 0.587646484375, 0.6712646484375, 0.7548828125, 0.8385009765625, 0.922119140625, 1.0057373046875, 1.08935546875, 1.1729736328125, 1.256591796875, 1.3402099609375, 1.423828125, 1.5074462890625, 1.591064453125, 1.6746826171875, 1.75830078125, 1.8419189453125, 1.925537109375, 2.0091552734375, 2.0927734375, 2.1763916015625, 2.260009765625, 2.3436279296875, 2.42724609375, 2.5108642578125, 2.594482421875, 2.6781005859375, 2.76171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 11.0, 4.0, 13.0, 12.0, 14.0, 16.0, 16.0, 29.0, 25.0, 21.0, 40.0, 35.0, 19.0, 41.0, 49.0, 43.0, 43.0, 43.0, 1069.0, 50.0, 35.0, 43.0, 32.0, 45.0, 35.0, 41.0, 23.0, 33.0, 22.0, 23.0, 18.0, 15.0, 18.0, 14.0, 7.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.090667724609375, -2.99774169921875, -2.904815673828125, -2.8118896484375, -2.718963623046875, -2.62603759765625, -2.533111572265625, -2.440185546875, -2.347259521484375, -2.25433349609375, -2.161407470703125, -2.0684814453125, -1.975555419921875, -1.88262939453125, -1.789703369140625, -1.69677734375, -1.603851318359375, -1.51092529296875, -1.417999267578125, -1.3250732421875, -1.232147216796875, -1.13922119140625, -1.046295166015625, -0.953369140625, -0.860443115234375, -0.76751708984375, -0.674591064453125, -0.5816650390625, -0.488739013671875, -0.39581298828125, -0.302886962890625, -0.2099609375, -0.117034912109375, -0.02410888671875, 0.068817138671875, 0.1617431640625, 0.254669189453125, 0.34759521484375, 0.440521240234375, 0.533447265625, 0.626373291015625, 0.71929931640625, 0.812225341796875, 0.9051513671875, 0.998077392578125, 1.09100341796875, 1.183929443359375, 1.27685546875, 1.369781494140625, 1.46270751953125, 1.555633544921875, 1.6485595703125, 1.741485595703125, 1.83441162109375, 1.927337646484375, 2.020263671875, 2.113189697265625, 2.20611572265625, 2.299041748046875, 2.3919677734375, 2.484893798828125, 2.57781982421875, 2.670745849609375, 2.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 6.0, 5.0, 5.0, 11.0, 11.0, 13.0, 14.0, 26.0, 38.0, 42.0, 67.0, 92.0, 150.0, 136.0, 228.0, 331.0, 567.0, 938.0, 1635.0, 3623.0, 12454.0, 162782.0, 1847369.0, 52739.0, 7625.0, 2724.0, 1342.0, 751.0, 409.0, 270.0, 200.0, 127.0, 94.0, 87.0, 49.0, 46.0, 26.0, 22.0, 18.0, 7.0, 11.0, 6.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-2.658203125, -2.580780029296875, -2.50335693359375, -2.425933837890625, -2.3485107421875, -2.271087646484375, -2.19366455078125, -2.116241455078125, -2.038818359375, -1.961395263671875, -1.88397216796875, -1.806549072265625, -1.7291259765625, -1.651702880859375, -1.57427978515625, -1.496856689453125, -1.41943359375, -1.342010498046875, -1.26458740234375, -1.187164306640625, -1.1097412109375, -1.032318115234375, -0.95489501953125, -0.877471923828125, -0.800048828125, -0.722625732421875, -0.64520263671875, -0.567779541015625, -0.4903564453125, -0.412933349609375, -0.33551025390625, -0.258087158203125, -0.1806640625, -0.103240966796875, -0.02581787109375, 0.051605224609375, 0.1290283203125, 0.206451416015625, 0.28387451171875, 0.361297607421875, 0.438720703125, 0.516143798828125, 0.59356689453125, 0.670989990234375, 0.7484130859375, 0.825836181640625, 0.90325927734375, 0.980682373046875, 1.05810546875, 1.135528564453125, 1.21295166015625, 1.290374755859375, 1.3677978515625, 1.445220947265625, 1.52264404296875, 1.600067138671875, 1.677490234375, 1.754913330078125, 1.83233642578125, 1.909759521484375, 1.9871826171875, 2.064605712890625, 2.14202880859375, 2.219451904296875, 2.296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 11.0, 34.0, 51.0, 125.0, 224.0, 244.0, 135.0, 66.0, 27.0, 14.0, 18.0, 9.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.34619140625, -0.33469390869140625, -0.3231964111328125, -0.31169891357421875, -0.300201416015625, -0.28870391845703125, -0.2772064208984375, -0.26570892333984375, -0.25421142578125, -0.24271392822265625, -0.2312164306640625, -0.21971893310546875, -0.208221435546875, -0.19672393798828125, -0.1852264404296875, -0.17372894287109375, -0.1622314453125, -0.15073394775390625, -0.1392364501953125, -0.12773895263671875, -0.116241455078125, -0.10474395751953125, -0.0932464599609375, -0.08174896240234375, -0.07025146484375, -0.05875396728515625, -0.0472564697265625, -0.03575897216796875, -0.024261474609375, -0.01276397705078125, -0.0012664794921875, 0.01023101806640625, 0.021728515625, 0.03322601318359375, 0.0447235107421875, 0.05622100830078125, 0.067718505859375, 0.07921600341796875, 0.0907135009765625, 0.10221099853515625, 0.11370849609375, 0.12520599365234375, 0.1367034912109375, 0.14820098876953125, 0.159698486328125, 0.17119598388671875, 0.1826934814453125, 0.19419097900390625, 0.2056884765625, 0.21718597412109375, 0.2286834716796875, 0.24018096923828125, 0.251678466796875, 0.26317596435546875, 0.2746734619140625, 0.28617095947265625, 0.29766845703125, 0.30916595458984375, 0.3206634521484375, 0.33216094970703125, 0.343658447265625, 0.35515594482421875, 0.3666534423828125, 0.37815093994140625, 0.3896484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 21.0, 12.0, 29.0, 39.0, 92.0, 264.0, 2707.0, 1031748.0, 12615.0, 712.0, 125.0, 62.0, 43.0, 22.0, 7.0, 9.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.10400390625, -7.8564453125, -7.60888671875, -7.361328125, -7.11376953125, -6.8662109375, -6.61865234375, -6.37109375, -6.12353515625, -5.8759765625, -5.62841796875, -5.380859375, -5.13330078125, -4.8857421875, -4.63818359375, -4.390625, -4.14306640625, -3.8955078125, -3.64794921875, -3.400390625, -3.15283203125, -2.9052734375, -2.65771484375, -2.41015625, -2.16259765625, -1.9150390625, -1.66748046875, -1.419921875, -1.17236328125, -0.9248046875, -0.67724609375, -0.4296875, -0.18212890625, 0.0654296875, 0.31298828125, 0.560546875, 0.80810546875, 1.0556640625, 1.30322265625, 1.55078125, 1.79833984375, 2.0458984375, 2.29345703125, 2.541015625, 2.78857421875, 3.0361328125, 3.28369140625, 3.53125, 3.77880859375, 4.0263671875, 4.27392578125, 4.521484375, 4.76904296875, 5.0166015625, 5.26416015625, 5.51171875, 5.75927734375, 6.0068359375, 6.25439453125, 6.501953125, 6.74951171875, 6.9970703125, 7.24462890625, 7.4921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 26.0, 227.0, 667.0, 76.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296105146408081, -3.2330474853515625, -3.169989824295044, -3.1069321632385254, -3.043874502182007, -2.9808168411254883, -2.9177591800689697, -2.854701519012451, -2.7916440963745117, -2.728586435317993, -2.6655287742614746, -2.602471113204956, -2.5394134521484375, -2.476355791091919, -2.4132981300354004, -2.350240707397461, -2.2871828079223633, -2.2241251468658447, -2.161067485809326, -2.0980098247528076, -2.034952163696289, -1.9718945026397705, -1.9088369607925415, -1.845779299736023, -1.7827216386795044, -1.7196639776229858, -1.6566063165664673, -1.5935486555099487, -1.5304911136627197, -1.4674334526062012, -1.4043757915496826, -1.341318130493164, -1.2782602310180664, -1.2152025699615479, -1.1521449089050293, -1.0890872478485107, -1.0260295867919922, -0.9629719853401184, -0.8999143838882446, -0.8368567228317261, -0.7737990617752075, -0.710741400718689, -0.6476837396621704, -0.5846261382102966, -0.5215684771537781, -0.4585108160972595, -0.39545318484306335, -0.3323955535888672, -0.26933789253234863, -0.20628024637699127, -0.1432226002216339, -0.08016495406627655, -0.01710730791091919, 0.045950353145599365, 0.10900798439979553, 0.1720656156539917, 0.23512327671051025, 0.2981809377670288, 0.361238569021225, 0.42429620027542114, 0.4873538613319397, 0.5504115223884583, 0.613469123840332, 0.6765267848968506, 0.7395844459533691]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 13.0, 15.0, 10.0, 16.0, 15.0, 23.0, 27.0, 26.0, 21.0, 30.0, 32.0, 37.0, 42.0, 34.0, 42.0, 53.0, 47.0, 33.0, 38.0, 37.0, 51.0, 41.0, 34.0, 33.0, 26.0, 34.0, 24.0, 22.0, 28.0, 17.0, 8.0, 18.0, 14.0, 4.0, 8.0, 4.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2493683099746704, -0.2419174164533615, -0.2344665229320526, -0.2270156294107437, -0.21956473588943481, -0.21211384236812592, -0.20466294884681702, -0.19721205532550812, -0.18976116180419922, -0.18231026828289032, -0.17485937476158142, -0.16740848124027252, -0.15995758771896362, -0.15250669419765472, -0.14505580067634583, -0.13760490715503693, -0.13015401363372803, -0.12270312011241913, -0.11525222659111023, -0.10780133306980133, -0.10035043954849243, -0.09289954602718353, -0.08544865250587463, -0.07799775898456573, -0.07054686546325684, -0.06309597194194794, -0.05564507842063904, -0.04819418489933014, -0.04074329137802124, -0.03329239785671234, -0.025841504335403442, -0.018390610814094543, -0.010939717292785645, -0.0034888237714767456, 0.003962069749832153, 0.011412963271141052, 0.01886385679244995, 0.02631475031375885, 0.03376564383506775, 0.04121653735637665, 0.04866743087768555, 0.056118324398994446, 0.06356921792030334, 0.07102011144161224, 0.07847100496292114, 0.08592189848423004, 0.09337279200553894, 0.10082368552684784, 0.10827457904815674, 0.11572547256946564, 0.12317636609077454, 0.13062725961208344, 0.13807815313339233, 0.14552904665470123, 0.15297994017601013, 0.16043083369731903, 0.16788172721862793, 0.17533262073993683, 0.18278351426124573, 0.19023440778255463, 0.19768530130386353, 0.20513619482517242, 0.21258708834648132, 0.22003798186779022, 0.22748887538909912]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 7.0, 8.0, 7.0, 7.0, 13.0, 14.0, 19.0, 15.0, 24.0, 26.0, 21.0, 33.0, 35.0, 31.0, 40.0, 56.0, 42.0, 38.0, 55.0, 60.0, 49.0, 50.0, 28.0, 40.0, 35.0, 33.0, 35.0, 23.0, 29.0, 25.0, 19.0, 14.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.425628662109375, -3.30242919921875, -3.179229736328125, -3.0560302734375, -2.932830810546875, -2.80963134765625, -2.686431884765625, -2.563232421875, -2.440032958984375, -2.31683349609375, -2.193634033203125, -2.0704345703125, -1.947235107421875, -1.82403564453125, -1.700836181640625, -1.57763671875, -1.454437255859375, -1.33123779296875, -1.208038330078125, -1.0848388671875, -0.961639404296875, -0.83843994140625, -0.715240478515625, -0.592041015625, -0.468841552734375, -0.34564208984375, -0.222442626953125, -0.0992431640625, 0.023956298828125, 0.14715576171875, 0.270355224609375, 0.3935546875, 0.516754150390625, 0.63995361328125, 0.763153076171875, 0.8863525390625, 1.009552001953125, 1.13275146484375, 1.255950927734375, 1.379150390625, 1.502349853515625, 1.62554931640625, 1.748748779296875, 1.8719482421875, 1.995147705078125, 2.11834716796875, 2.241546630859375, 2.36474609375, 2.487945556640625, 2.61114501953125, 2.734344482421875, 2.8575439453125, 2.980743408203125, 3.10394287109375, 3.227142333984375, 3.350341796875, 3.473541259765625, 3.59674072265625, 3.719940185546875, 3.8431396484375, 3.966339111328125, 4.08953857421875, 4.212738037109375, 4.3359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 14.0, 28.0, 23.0, 33.0, 51.0, 80.0, 105.0, 137.0, 203.0, 306.0, 430.0, 727.0, 1139.0, 1860.0, 3549.0, 7405.0, 16719.0, 45549.0, 183530.0, 558476.0, 156305.0, 41319.0, 15442.0, 6774.0, 3371.0, 1843.0, 1037.0, 680.0, 435.0, 281.0, 205.0, 150.0, 93.0, 66.0, 51.0, 33.0, 24.0, 16.0, 16.0, 7.0, 10.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.31561279296875, -5.1351318359375, -4.95465087890625, -4.774169921875, -4.59368896484375, -4.4132080078125, -4.23272705078125, -4.05224609375, -3.87176513671875, -3.6912841796875, -3.51080322265625, -3.330322265625, -3.14984130859375, -2.9693603515625, -2.78887939453125, -2.6083984375, -2.42791748046875, -2.2474365234375, -2.06695556640625, -1.886474609375, -1.70599365234375, -1.5255126953125, -1.34503173828125, -1.16455078125, -0.98406982421875, -0.8035888671875, -0.62310791015625, -0.442626953125, -0.26214599609375, -0.0816650390625, 0.09881591796875, 0.279296875, 0.45977783203125, 0.6402587890625, 0.82073974609375, 1.001220703125, 1.18170166015625, 1.3621826171875, 1.54266357421875, 1.72314453125, 1.90362548828125, 2.0841064453125, 2.26458740234375, 2.445068359375, 2.62554931640625, 2.8060302734375, 2.98651123046875, 3.1669921875, 3.34747314453125, 3.5279541015625, 3.70843505859375, 3.888916015625, 4.06939697265625, 4.2498779296875, 4.43035888671875, 4.61083984375, 4.79132080078125, 4.9718017578125, 5.15228271484375, 5.332763671875, 5.51324462890625, 5.6937255859375, 5.87420654296875, 6.0546875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 12.0, 13.0, 8.0, 17.0, 17.0, 20.0, 29.0, 24.0, 36.0, 27.0, 31.0, 44.0, 49.0, 54.0, 66.0, 165.0, 1464.0, 367.0, 124.0, 52.0, 69.0, 51.0, 35.0, 29.0, 38.0, 28.0, 22.0, 16.0, 10.0, 18.0, 12.0, 12.0, 15.0, 6.0, 8.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.26220703125, -9.9072265625, -9.55224609375, -9.197265625, -8.84228515625, -8.4873046875, -8.13232421875, -7.77734375, -7.42236328125, -7.0673828125, -6.71240234375, -6.357421875, -6.00244140625, -5.6474609375, -5.29248046875, -4.9375, -4.58251953125, -4.2275390625, -3.87255859375, -3.517578125, -3.16259765625, -2.8076171875, -2.45263671875, -2.09765625, -1.74267578125, -1.3876953125, -1.03271484375, -0.677734375, -0.32275390625, 0.0322265625, 0.38720703125, 0.7421875, 1.09716796875, 1.4521484375, 1.80712890625, 2.162109375, 2.51708984375, 2.8720703125, 3.22705078125, 3.58203125, 3.93701171875, 4.2919921875, 4.64697265625, 5.001953125, 5.35693359375, 5.7119140625, 6.06689453125, 6.421875, 6.77685546875, 7.1318359375, 7.48681640625, 7.841796875, 8.19677734375, 8.5517578125, 8.90673828125, 9.26171875, 9.61669921875, 9.9716796875, 10.32666015625, 10.681640625, 11.03662109375, 11.3916015625, 11.74658203125, 12.1015625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 10.0, 9.0, 15.0, 22.0, 23.0, 15.0, 26.0, 28.0, 41.0, 66.0, 82.0, 120.0, 164.0, 298.0, 664.0, 2009.0, 10694.0, 137560.0, 2882449.0, 99004.0, 9033.0, 1810.0, 603.0, 280.0, 190.0, 94.0, 93.0, 60.0, 47.0, 45.0, 21.0, 29.0, 13.0, 18.0, 17.0, 11.0, 7.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.890625, -17.371337890625, -16.85205078125, -16.332763671875, -15.8134765625, -15.294189453125, -14.77490234375, -14.255615234375, -13.736328125, -13.217041015625, -12.69775390625, -12.178466796875, -11.6591796875, -11.139892578125, -10.62060546875, -10.101318359375, -9.58203125, -9.062744140625, -8.54345703125, -8.024169921875, -7.5048828125, -6.985595703125, -6.46630859375, -5.947021484375, -5.427734375, -4.908447265625, -4.38916015625, -3.869873046875, -3.3505859375, -2.831298828125, -2.31201171875, -1.792724609375, -1.2734375, -0.754150390625, -0.23486328125, 0.284423828125, 0.8037109375, 1.322998046875, 1.84228515625, 2.361572265625, 2.880859375, 3.400146484375, 3.91943359375, 4.438720703125, 4.9580078125, 5.477294921875, 5.99658203125, 6.515869140625, 7.03515625, 7.554443359375, 8.07373046875, 8.593017578125, 9.1123046875, 9.631591796875, 10.15087890625, 10.670166015625, 11.189453125, 11.708740234375, 12.22802734375, 12.747314453125, 13.2666015625, 13.785888671875, 14.30517578125, 14.824462890625, 15.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 11.0, 300.0, 674.0, 30.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.324481010437012, -9.159858703613281, -4.995236396789551, -0.8306140899658203, 3.33400821685791, 7.498631477355957, 11.663252830505371, 15.827874183654785, 19.992496490478516, 24.157119750976562, 28.321741104125977, 32.48636245727539, 36.65098571777344, 40.815608978271484, 44.98023223876953, 49.14485168457031, 53.30947494506836, 57.474098205566406, 61.63871765136719, 65.8033447265625, 69.96796417236328, 74.13258361816406, 78.29721069335938, 82.46183013916016, 86.62645721435547, 90.79107666015625, 94.95570373535156, 99.12032318115234, 103.28494262695312, 107.44956970214844, 111.61418914794922, 115.77880859375, 119.94343566894531, 124.1080551147461, 128.27267456054688, 132.4373016357422, 136.6019287109375, 140.76654052734375, 144.93116760253906, 149.09579467773438, 153.26040649414062, 157.42503356933594, 161.5896453857422, 165.7542724609375, 169.9188995361328, 174.08352661132812, 178.24813842773438, 182.4127655029297, 186.577392578125, 190.7420196533203, 194.90663146972656, 199.07125854492188, 203.2358856201172, 207.4005126953125, 211.56512451171875, 215.72975158691406, 219.89437866210938, 224.0590057373047, 228.22361755371094, 232.38824462890625, 236.55287170410156, 240.71749877929688, 244.88211059570312, 249.04673767089844, 253.2113494873047]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 3.0, 10.0, 6.0, 7.0, 7.0, 14.0, 8.0, 15.0, 22.0, 34.0, 25.0, 33.0, 37.0, 26.0, 35.0, 43.0, 52.0, 43.0, 45.0, 40.0, 44.0, 47.0, 22.0, 42.0, 24.0, 37.0, 31.0, 32.0, 30.0, 28.0, 30.0, 23.0, 23.0, 16.0, 17.0, 8.0, 7.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.405521392822266, -29.41016960144043, -28.414817810058594, -27.41946792602539, -26.424116134643555, -25.42876434326172, -24.433412551879883, -23.438060760498047, -22.442710876464844, -21.447359085083008, -20.452007293701172, -19.45665740966797, -18.461305618286133, -17.465953826904297, -16.47060203552246, -15.475250244140625, -14.479898452758789, -13.484546661376953, -12.489195823669434, -11.493844032287598, -10.498493194580078, -9.503141403198242, -8.507789611816406, -7.5124382972717285, -6.517086982727051, -5.521735668182373, -4.526384353637695, -3.5310325622558594, -2.5356812477111816, -1.540329933166504, -0.544978141784668, 0.45037317276000977, 1.4457244873046875, 2.4410758018493652, 3.436427354812622, 4.431778907775879, 5.427130222320557, 6.422481536865234, 7.41783332824707, 8.413185119628906, 9.408535957336426, 10.403887748718262, 11.399238586425781, 12.394590377807617, 13.389942169189453, 14.385293006896973, 15.380644798278809, 16.375995635986328, 17.371347427368164, 18.36669921875, 19.362051010131836, 20.357402801513672, 21.352752685546875, 22.34810447692871, 23.343456268310547, 24.338808059692383, 25.33415985107422, 26.329511642456055, 27.32486343383789, 28.320213317871094, 29.31556510925293, 30.310916900634766, 31.3062686920166, 32.30162048339844, 33.29697036743164]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 6.0, 14.0, 10.0, 8.0, 8.0, 19.0, 16.0, 18.0, 15.0, 22.0, 25.0, 30.0, 40.0, 28.0, 40.0, 41.0, 45.0, 37.0, 44.0, 49.0, 32.0, 49.0, 31.0, 47.0, 37.0, 24.0, 16.0, 29.0, 37.0, 23.0, 26.0, 23.0, 11.0, 25.0, 10.0, 6.0, 7.0, 11.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.298828125, -3.183013916015625, -3.06719970703125, -2.951385498046875, -2.8355712890625, -2.719757080078125, -2.60394287109375, -2.488128662109375, -2.372314453125, -2.256500244140625, -2.14068603515625, -2.024871826171875, -1.9090576171875, -1.793243408203125, -1.67742919921875, -1.561614990234375, -1.44580078125, -1.329986572265625, -1.21417236328125, -1.098358154296875, -0.9825439453125, -0.866729736328125, -0.75091552734375, -0.635101318359375, -0.519287109375, -0.403472900390625, -0.28765869140625, -0.171844482421875, -0.0560302734375, 0.059783935546875, 0.17559814453125, 0.291412353515625, 0.4072265625, 0.523040771484375, 0.63885498046875, 0.754669189453125, 0.8704833984375, 0.986297607421875, 1.10211181640625, 1.217926025390625, 1.333740234375, 1.449554443359375, 1.56536865234375, 1.681182861328125, 1.7969970703125, 1.912811279296875, 2.02862548828125, 2.144439697265625, 2.26025390625, 2.376068115234375, 2.49188232421875, 2.607696533203125, 2.7235107421875, 2.839324951171875, 2.95513916015625, 3.070953369140625, 3.186767578125, 3.302581787109375, 3.41839599609375, 3.534210205078125, 3.6500244140625, 3.765838623046875, 3.88165283203125, 3.997467041015625, 4.11328125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 22.0, 18.0, 43.0, 60.0, 74.0, 124.0, 181.0, 276.0, 509.0, 759.0, 1196.0, 2065.0, 3902.0, 7297.0, 14377.0, 35169.0, 123656.0, 695213.0, 2307131.0, 797066.0, 133994.0, 37574.0, 15421.0, 7815.0, 4077.0, 2378.0, 1401.0, 885.0, 548.0, 341.0, 211.0, 154.0, 117.0, 68.0, 42.0, 37.0, 13.0, 21.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.05181884765625, -4.8614501953125, -4.67108154296875, -4.480712890625, -4.29034423828125, -4.0999755859375, -3.90960693359375, -3.71923828125, -3.52886962890625, -3.3385009765625, -3.14813232421875, -2.957763671875, -2.76739501953125, -2.5770263671875, -2.38665771484375, -2.1962890625, -2.00592041015625, -1.8155517578125, -1.62518310546875, -1.434814453125, -1.24444580078125, -1.0540771484375, -0.86370849609375, -0.67333984375, -0.48297119140625, -0.2926025390625, -0.10223388671875, 0.088134765625, 0.27850341796875, 0.4688720703125, 0.65924072265625, 0.849609375, 1.03997802734375, 1.2303466796875, 1.42071533203125, 1.611083984375, 1.80145263671875, 1.9918212890625, 2.18218994140625, 2.37255859375, 2.56292724609375, 2.7532958984375, 2.94366455078125, 3.134033203125, 3.32440185546875, 3.5147705078125, 3.70513916015625, 3.8955078125, 4.08587646484375, 4.2762451171875, 4.46661376953125, 4.656982421875, 4.84735107421875, 5.0377197265625, 5.22808837890625, 5.41845703125, 5.60882568359375, 5.7991943359375, 5.98956298828125, 6.179931640625, 6.37030029296875, 6.5606689453125, 6.75103759765625, 6.94140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 8.0, 4.0, 7.0, 12.0, 15.0, 23.0, 28.0, 28.0, 51.0, 53.0, 99.0, 120.0, 161.0, 248.0, 434.0, 619.0, 669.0, 509.0, 314.0, 198.0, 117.0, 86.0, 71.0, 36.0, 49.0, 29.0, 11.0, 16.0, 18.0, 11.0, 6.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.50384521484375, -5.2850341796875, -5.06622314453125, -4.847412109375, -4.62860107421875, -4.4097900390625, -4.19097900390625, -3.97216796875, -3.75335693359375, -3.5345458984375, -3.31573486328125, -3.096923828125, -2.87811279296875, -2.6593017578125, -2.44049072265625, -2.2216796875, -2.00286865234375, -1.7840576171875, -1.56524658203125, -1.346435546875, -1.12762451171875, -0.9088134765625, -0.69000244140625, -0.47119140625, -0.25238037109375, -0.0335693359375, 0.18524169921875, 0.404052734375, 0.62286376953125, 0.8416748046875, 1.06048583984375, 1.279296875, 1.49810791015625, 1.7169189453125, 1.93572998046875, 2.154541015625, 2.37335205078125, 2.5921630859375, 2.81097412109375, 3.02978515625, 3.24859619140625, 3.4674072265625, 3.68621826171875, 3.905029296875, 4.12384033203125, 4.3426513671875, 4.56146240234375, 4.7802734375, 4.99908447265625, 5.2178955078125, 5.43670654296875, 5.655517578125, 5.87432861328125, 6.0931396484375, 6.31195068359375, 6.53076171875, 6.74957275390625, 6.9683837890625, 7.18719482421875, 7.406005859375, 7.62481689453125, 7.8436279296875, 8.06243896484375, 8.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 14.0, 19.0, 21.0, 29.0, 38.0, 83.0, 88.0, 133.0, 257.0, 625.0, 2119.0, 11889.0, 140730.0, 3681257.0, 331721.0, 20339.0, 3182.0, 866.0, 318.0, 182.0, 103.0, 67.0, 46.0, 41.0, 25.0, 20.0, 12.0, 10.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.859375, -23.24169921875, -22.6240234375, -22.00634765625, -21.388671875, -20.77099609375, -20.1533203125, -19.53564453125, -18.91796875, -18.30029296875, -17.6826171875, -17.06494140625, -16.447265625, -15.82958984375, -15.2119140625, -14.59423828125, -13.9765625, -13.35888671875, -12.7412109375, -12.12353515625, -11.505859375, -10.88818359375, -10.2705078125, -9.65283203125, -9.03515625, -8.41748046875, -7.7998046875, -7.18212890625, -6.564453125, -5.94677734375, -5.3291015625, -4.71142578125, -4.09375, -3.47607421875, -2.8583984375, -2.24072265625, -1.623046875, -1.00537109375, -0.3876953125, 0.22998046875, 0.84765625, 1.46533203125, 2.0830078125, 2.70068359375, 3.318359375, 3.93603515625, 4.5537109375, 5.17138671875, 5.7890625, 6.40673828125, 7.0244140625, 7.64208984375, 8.259765625, 8.87744140625, 9.4951171875, 10.11279296875, 10.73046875, 11.34814453125, 11.9658203125, 12.58349609375, 13.201171875, 13.81884765625, 14.4365234375, 15.05419921875, 15.671875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 37.0, 91.0, 166.0, 242.0, 235.0, 120.0, 71.0, 26.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.61666488647461, -52.90502166748047, -51.19337463378906, -49.48173141479492, -47.770084381103516, -46.058441162109375, -44.34679412841797, -42.63515090942383, -40.92350387573242, -39.21186065673828, -37.500213623046875, -35.788570404052734, -34.07692337036133, -32.36528015136719, -30.65363311767578, -28.94198989868164, -27.230344772338867, -25.518699645996094, -23.80705451965332, -22.095409393310547, -20.383764266967773, -18.672119140625, -16.96047592163086, -15.24882984161377, -13.537184715270996, -11.825539588928223, -10.11389446258545, -8.402250289916992, -6.6906046867370605, -4.978960037231445, -3.267314910888672, -1.5556697845458984, 0.155975341796875, 1.8676203489303589, 3.5792653560638428, 5.290910243988037, 7.0025553703308105, 8.714200019836426, 10.4258451461792, 12.137490272521973, 13.849135398864746, 15.56078052520752, 17.272424697875977, 18.98406982421875, 20.695714950561523, 22.407360076904297, 24.11900520324707, 25.830650329589844, 27.542295455932617, 29.25394058227539, 30.965585708618164, 32.67723083496094, 34.38887405395508, 36.100521087646484, 37.812164306640625, 39.52381134033203, 41.23545455932617, 42.94709777832031, 44.65874481201172, 46.37038803100586, 48.082035064697266, 49.793678283691406, 51.50532531738281, 53.21696853637695, 54.92861557006836]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 2.0, 5.0, 6.0, 12.0, 9.0, 11.0, 18.0, 19.0, 19.0, 22.0, 31.0, 30.0, 30.0, 32.0, 44.0, 41.0, 51.0, 38.0, 45.0, 55.0, 39.0, 41.0, 40.0, 44.0, 30.0, 44.0, 42.0, 29.0, 31.0, 31.0, 21.0, 14.0, 16.0, 11.0, 8.0, 7.0, 8.0, 2.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.89798927307129, -25.143157958984375, -24.388328552246094, -23.63349723815918, -22.878665924072266, -22.123836517333984, -21.36900520324707, -20.614173889160156, -19.859344482421875, -19.10451316833496, -18.34968376159668, -17.594852447509766, -16.840023040771484, -16.08519172668457, -15.330360412597656, -14.575530052185059, -13.820699691772461, -13.065869331359863, -12.311038970947266, -11.556207656860352, -10.801377296447754, -10.046546936035156, -9.291715621948242, -8.536885261535645, -7.782054901123047, -7.027224540710449, -6.272393703460693, -5.5175628662109375, -4.76273250579834, -4.007902145385742, -3.2530713081359863, -2.4982404708862305, -1.743408203125, -0.9885776042938232, -0.23374700546264648, 0.5210835933685303, 1.275914192199707, 2.030744791030884, 2.7855753898620605, 3.5404062271118164, 4.295236587524414, 5.050066947937012, 5.804897785186768, 6.559728622436523, 7.314558982849121, 8.069389343261719, 8.824220657348633, 9.57905101776123, 10.333881378173828, 11.088711738586426, 11.843542098999023, 12.598373413085938, 13.353203773498535, 14.108034133911133, 14.862865447998047, 15.617695808410645, 16.372526168823242, 17.127357482910156, 17.882186889648438, 18.63701820373535, 19.391849517822266, 20.146678924560547, 20.90151023864746, 21.656341552734375, 22.411170959472656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 4.0, 10.0, 10.0, 4.0, 8.0, 15.0, 10.0, 14.0, 26.0, 26.0, 28.0, 23.0, 23.0, 26.0, 50.0, 39.0, 35.0, 34.0, 32.0, 40.0, 31.0, 44.0, 44.0, 42.0, 39.0, 45.0, 34.0, 36.0, 28.0, 29.0, 25.0, 21.0, 14.0, 18.0, 9.0, 12.0, 10.0, 13.0, 7.0, 12.0, 2.0, 4.0, 4.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.318359375, -3.210540771484375, -3.10272216796875, -2.994903564453125, -2.8870849609375, -2.779266357421875, -2.67144775390625, -2.563629150390625, -2.455810546875, -2.347991943359375, -2.24017333984375, -2.132354736328125, -2.0245361328125, -1.916717529296875, -1.80889892578125, -1.701080322265625, -1.59326171875, -1.485443115234375, -1.37762451171875, -1.269805908203125, -1.1619873046875, -1.054168701171875, -0.94635009765625, -0.838531494140625, -0.730712890625, -0.622894287109375, -0.51507568359375, -0.407257080078125, -0.2994384765625, -0.191619873046875, -0.08380126953125, 0.024017333984375, 0.1318359375, 0.239654541015625, 0.34747314453125, 0.455291748046875, 0.5631103515625, 0.670928955078125, 0.77874755859375, 0.886566162109375, 0.994384765625, 1.102203369140625, 1.21002197265625, 1.317840576171875, 1.4256591796875, 1.533477783203125, 1.64129638671875, 1.749114990234375, 1.85693359375, 1.964752197265625, 2.07257080078125, 2.180389404296875, 2.2882080078125, 2.396026611328125, 2.50384521484375, 2.611663818359375, 2.719482421875, 2.827301025390625, 2.93511962890625, 3.042938232421875, 3.1507568359375, 3.258575439453125, 3.36639404296875, 3.474212646484375, 3.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 10.0, 12.0, 10.0, 21.0, 21.0, 26.0, 46.0, 56.0, 74.0, 101.0, 138.0, 187.0, 272.0, 395.0, 556.0, 863.0, 1339.0, 1961.0, 3167.0, 5679.0, 10921.0, 26002.0, 325245.0, 610730.0, 32172.0, 12172.0, 6365.0, 3625.0, 2056.0, 1323.0, 930.0, 568.0, 444.0, 314.0, 204.0, 149.0, 122.0, 92.0, 47.0, 29.0, 36.0, 18.0, 20.0, 7.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6015625, -4.466552734375, -4.33154296875, -4.196533203125, -4.0615234375, -3.926513671875, -3.79150390625, -3.656494140625, -3.521484375, -3.386474609375, -3.25146484375, -3.116455078125, -2.9814453125, -2.846435546875, -2.71142578125, -2.576416015625, -2.44140625, -2.306396484375, -2.17138671875, -2.036376953125, -1.9013671875, -1.766357421875, -1.63134765625, -1.496337890625, -1.361328125, -1.226318359375, -1.09130859375, -0.956298828125, -0.8212890625, -0.686279296875, -0.55126953125, -0.416259765625, -0.28125, -0.146240234375, -0.01123046875, 0.123779296875, 0.2587890625, 0.393798828125, 0.52880859375, 0.663818359375, 0.798828125, 0.933837890625, 1.06884765625, 1.203857421875, 1.3388671875, 1.473876953125, 1.60888671875, 1.743896484375, 1.87890625, 2.013916015625, 2.14892578125, 2.283935546875, 2.4189453125, 2.553955078125, 2.68896484375, 2.823974609375, 2.958984375, 3.093994140625, 3.22900390625, 3.364013671875, 3.4990234375, 3.634033203125, 3.76904296875, 3.904052734375, 4.0390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 11.0, 5.0, 11.0, 10.0, 17.0, 12.0, 17.0, 15.0, 21.0, 25.0, 23.0, 34.0, 40.0, 33.0, 37.0, 27.0, 41.0, 49.0, 41.0, 44.0, 1068.0, 41.0, 45.0, 41.0, 36.0, 36.0, 34.0, 23.0, 18.0, 15.0, 21.0, 24.0, 14.0, 17.0, 13.0, 14.0, 8.0, 4.0, 10.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.365234375, -2.287109375, -2.208984375, -2.130859375, -2.052734375, -1.974609375, -1.896484375, -1.818359375, -1.740234375, -1.662109375, -1.583984375, -1.505859375, -1.427734375, -1.349609375, -1.271484375, -1.193359375, -1.115234375, -1.037109375, -0.958984375, -0.880859375, -0.802734375, -0.724609375, -0.646484375, -0.568359375, -0.490234375, -0.412109375, -0.333984375, -0.255859375, -0.177734375, -0.099609375, -0.021484375, 0.056640625, 0.134765625, 0.212890625, 0.291015625, 0.369140625, 0.447265625, 0.525390625, 0.603515625, 0.681640625, 0.759765625, 0.837890625, 0.916015625, 0.994140625, 1.072265625, 1.150390625, 1.228515625, 1.306640625, 1.384765625, 1.462890625, 1.541015625, 1.619140625, 1.697265625, 1.775390625, 1.853515625, 1.931640625, 2.009765625, 2.087890625, 2.166015625, 2.244140625, 2.322265625, 2.400390625, 2.478515625, 2.556640625, 2.634765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 14.0, 7.0, 10.0, 24.0, 22.0, 23.0, 41.0, 53.0, 68.0, 84.0, 105.0, 147.0, 191.0, 282.0, 418.0, 560.0, 866.0, 1394.0, 2218.0, 3776.0, 6980.0, 16241.0, 58201.0, 1621715.0, 325566.0, 32290.0, 11571.0, 5611.0, 2983.0, 1883.0, 1165.0, 724.0, 514.0, 355.0, 250.0, 188.0, 131.0, 107.0, 76.0, 55.0, 45.0, 34.0, 28.0, 16.0, 13.0, 14.0, 14.0, 15.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.0078125, -1.9447021484375, -1.881591796875, -1.8184814453125, -1.75537109375, -1.6922607421875, -1.629150390625, -1.5660400390625, -1.5029296875, -1.4398193359375, -1.376708984375, -1.3135986328125, -1.25048828125, -1.1873779296875, -1.124267578125, -1.0611572265625, -0.998046875, -0.9349365234375, -0.871826171875, -0.8087158203125, -0.74560546875, -0.6824951171875, -0.619384765625, -0.5562744140625, -0.4931640625, -0.4300537109375, -0.366943359375, -0.3038330078125, -0.24072265625, -0.1776123046875, -0.114501953125, -0.0513916015625, 0.01171875, 0.0748291015625, 0.137939453125, 0.2010498046875, 0.26416015625, 0.3272705078125, 0.390380859375, 0.4534912109375, 0.5166015625, 0.5797119140625, 0.642822265625, 0.7059326171875, 0.76904296875, 0.8321533203125, 0.895263671875, 0.9583740234375, 1.021484375, 1.0845947265625, 1.147705078125, 1.2108154296875, 1.27392578125, 1.3370361328125, 1.400146484375, 1.4632568359375, 1.5263671875, 1.5894775390625, 1.652587890625, 1.7156982421875, 1.77880859375, 1.8419189453125, 1.905029296875, 1.9681396484375, 2.03125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 12.0, 20.0, 16.0, 54.0, 188.0, 469.0, 84.0, 41.0, 18.0, 16.0, 9.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.485107421875, -0.4709625244140625, -0.456817626953125, -0.4426727294921875, -0.42852783203125, -0.4143829345703125, -0.400238037109375, -0.3860931396484375, -0.3719482421875, -0.3578033447265625, -0.343658447265625, -0.3295135498046875, -0.31536865234375, -0.3012237548828125, -0.287078857421875, -0.2729339599609375, -0.2587890625, -0.2446441650390625, -0.230499267578125, -0.2163543701171875, -0.20220947265625, -0.1880645751953125, -0.173919677734375, -0.1597747802734375, -0.1456298828125, -0.1314849853515625, -0.117340087890625, -0.1031951904296875, -0.08905029296875, -0.0749053955078125, -0.060760498046875, -0.0466156005859375, -0.032470703125, -0.0183258056640625, -0.004180908203125, 0.0099639892578125, 0.02410888671875, 0.0382537841796875, 0.052398681640625, 0.0665435791015625, 0.0806884765625, 0.0948333740234375, 0.108978271484375, 0.1231231689453125, 0.13726806640625, 0.1514129638671875, 0.165557861328125, 0.1797027587890625, 0.19384765625, 0.2079925537109375, 0.222137451171875, 0.2362823486328125, 0.25042724609375, 0.2645721435546875, 0.278717041015625, 0.2928619384765625, 0.3070068359375, 0.3211517333984375, 0.335296630859375, 0.3494415283203125, 0.36358642578125, 0.3777313232421875, 0.391876220703125, 0.4060211181640625, 0.420166015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 20.0, 36.0, 52.0, 121.0, 746.0, 41394.0, 1004242.0, 1498.0, 172.0, 63.0, 56.0, 25.0, 24.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 1.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-9.9765625, -9.6453857421875, -9.314208984375, -8.9830322265625, -8.65185546875, -8.3206787109375, -7.989501953125, -7.6583251953125, -7.3271484375, -6.9959716796875, -6.664794921875, -6.3336181640625, -6.00244140625, -5.6712646484375, -5.340087890625, -5.0089111328125, -4.677734375, -4.3465576171875, -4.015380859375, -3.6842041015625, -3.35302734375, -3.0218505859375, -2.690673828125, -2.3594970703125, -2.0283203125, -1.6971435546875, -1.365966796875, -1.0347900390625, -0.70361328125, -0.3724365234375, -0.041259765625, 0.2899169921875, 0.62109375, 0.9522705078125, 1.283447265625, 1.6146240234375, 1.94580078125, 2.2769775390625, 2.608154296875, 2.9393310546875, 3.2705078125, 3.6016845703125, 3.932861328125, 4.2640380859375, 4.59521484375, 4.9263916015625, 5.257568359375, 5.5887451171875, 5.919921875, 6.2510986328125, 6.582275390625, 6.9134521484375, 7.24462890625, 7.5758056640625, 7.906982421875, 8.2381591796875, 8.5693359375, 8.9005126953125, 9.231689453125, 9.5628662109375, 9.89404296875, 10.2252197265625, 10.556396484375, 10.8875732421875, 11.21875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 25.0, 60.0, 208.0, 361.0, 210.0, 84.0, 28.0, 15.0, 14.0, 4.0], "bins": [-1.8845131397247314, -1.8517507314682007, -1.81898832321167, -1.7862260341644287, -1.753463625907898, -1.7207012176513672, -1.6879388093948364, -1.6551764011383057, -1.6224141120910645, -1.5896517038345337, -1.556889295578003, -1.5241270065307617, -1.491364598274231, -1.4586021900177002, -1.4258397817611694, -1.3930773735046387, -1.3603150844573975, -1.3275526762008667, -1.294790267944336, -1.2620279788970947, -1.229265570640564, -1.1965031623840332, -1.1637407541275024, -1.1309783458709717, -1.098215937614441, -1.0654535293579102, -1.0326911211013794, -0.9999287724494934, -0.9671664237976074, -0.9344040155410767, -0.9016416072845459, -0.8688792586326599, -0.8361169099807739, -0.8033545017242432, -0.7705921530723572, -0.7378297448158264, -0.7050673961639404, -0.6723049879074097, -0.6395425796508789, -0.6067802309989929, -0.5740178823471069, -0.5412554740905762, -0.5084931254386902, -0.4757307171821594, -0.44296836853027344, -0.4102059602737427, -0.3774435818195343, -0.3446812033653259, -0.31191879510879517, -0.2791564166545868, -0.24639403820037842, -0.21363164484500885, -0.18086926639080048, -0.1481068879365921, -0.11534449458122253, -0.08258211612701416, -0.04981975257396698, -0.017057370394468307, 0.015705011785030365, 0.048467397689819336, 0.08122977614402771, 0.11399215459823608, 0.14675454795360565, 0.17951692640781403, 0.2122793048620224]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 14.0, 1.0, 16.0, 11.0, 16.0, 24.0, 17.0, 23.0, 28.0, 23.0, 23.0, 31.0, 37.0, 32.0, 29.0, 39.0, 28.0, 36.0, 28.0, 30.0, 45.0, 43.0, 42.0, 36.0, 29.0, 30.0, 28.0, 25.0, 24.0, 21.0, 22.0, 21.0, 17.0, 13.0, 11.0, 13.0, 13.0, 9.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.29606109857559204, -0.2868116796016693, -0.2775622308254242, -0.26831281185150146, -0.25906336307525635, -0.24981392920017242, -0.2405644953250885, -0.23131507635116577, -0.22206562757492065, -0.21281619369983673, -0.2035667598247528, -0.19431732594966888, -0.18506789207458496, -0.17581845819950104, -0.16656902432441711, -0.15731960535049438, -0.14807017147541046, -0.13882073760032654, -0.12957130372524261, -0.12032186985015869, -0.11107243597507477, -0.10182300209999084, -0.09257357567548752, -0.0833241418004036, -0.07407470792531967, -0.06482527405023575, -0.055575840175151825, -0.0463264100253582, -0.03707697615027428, -0.027827542275190353, -0.01857811212539673, -0.009328678250312805, -7.924437522888184e-05, 0.009170188568532467, 0.018419621512293816, 0.02766905352473259, 0.03691848739981651, 0.046167921274900436, 0.05541735142469406, 0.06466678529977798, 0.07391621917486191, 0.08316565304994583, 0.09241508692502975, 0.10166451334953308, 0.110913947224617, 0.12016338109970093, 0.12941281497478485, 0.13866224884986877, 0.1479116827249527, 0.15716111660003662, 0.16641055047512054, 0.17565998435020447, 0.1849094182252884, 0.19415885210037231, 0.20340827107429504, 0.21265771985054016, 0.2219071388244629, 0.23115657269954681, 0.24040600657463074, 0.24965544044971466, 0.2589048743247986, 0.2681542932987213, 0.27740374207496643, 0.28665316104888916, 0.2959026098251343]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 12.0, 9.0, 6.0, 14.0, 7.0, 23.0, 21.0, 21.0, 24.0, 36.0, 20.0, 24.0, 39.0, 31.0, 38.0, 39.0, 36.0, 36.0, 38.0, 48.0, 40.0, 41.0, 35.0, 39.0, 43.0, 23.0, 29.0, 22.0, 23.0, 29.0, 19.0, 13.0, 14.0, 12.0, 15.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.453125, -3.34478759765625, -3.2364501953125, -3.12811279296875, -3.019775390625, -2.91143798828125, -2.8031005859375, -2.69476318359375, -2.58642578125, -2.47808837890625, -2.3697509765625, -2.26141357421875, -2.153076171875, -2.04473876953125, -1.9364013671875, -1.82806396484375, -1.7197265625, -1.61138916015625, -1.5030517578125, -1.39471435546875, -1.286376953125, -1.17803955078125, -1.0697021484375, -0.96136474609375, -0.85302734375, -0.74468994140625, -0.6363525390625, -0.52801513671875, -0.419677734375, -0.31134033203125, -0.2030029296875, -0.09466552734375, 0.013671875, 0.12200927734375, 0.2303466796875, 0.33868408203125, 0.447021484375, 0.55535888671875, 0.6636962890625, 0.77203369140625, 0.88037109375, 0.98870849609375, 1.0970458984375, 1.20538330078125, 1.313720703125, 1.42205810546875, 1.5303955078125, 1.63873291015625, 1.7470703125, 1.85540771484375, 1.9637451171875, 2.07208251953125, 2.180419921875, 2.28875732421875, 2.3970947265625, 2.50543212890625, 2.61376953125, 2.72210693359375, 2.8304443359375, 2.93878173828125, 3.047119140625, 3.15545654296875, 3.2637939453125, 3.37213134765625, 3.48046875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 10.0, 14.0, 11.0, 25.0, 29.0, 32.0, 54.0, 84.0, 125.0, 196.0, 353.0, 525.0, 837.0, 1493.0, 2437.0, 4392.0, 8184.0, 15934.0, 35915.0, 147168.0, 659841.0, 108590.0, 31004.0, 14077.0, 7207.0, 4005.0, 2367.0, 1430.0, 810.0, 488.0, 317.0, 197.0, 124.0, 78.0, 59.0, 43.0, 24.0, 11.0, 7.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.60546875, -7.384521484375, -7.16357421875, -6.942626953125, -6.7216796875, -6.500732421875, -6.27978515625, -6.058837890625, -5.837890625, -5.616943359375, -5.39599609375, -5.175048828125, -4.9541015625, -4.733154296875, -4.51220703125, -4.291259765625, -4.0703125, -3.849365234375, -3.62841796875, -3.407470703125, -3.1865234375, -2.965576171875, -2.74462890625, -2.523681640625, -2.302734375, -2.081787109375, -1.86083984375, -1.639892578125, -1.4189453125, -1.197998046875, -0.97705078125, -0.756103515625, -0.53515625, -0.314208984375, -0.09326171875, 0.127685546875, 0.3486328125, 0.569580078125, 0.79052734375, 1.011474609375, 1.232421875, 1.453369140625, 1.67431640625, 1.895263671875, 2.1162109375, 2.337158203125, 2.55810546875, 2.779052734375, 3.0, 3.220947265625, 3.44189453125, 3.662841796875, 3.8837890625, 4.104736328125, 4.32568359375, 4.546630859375, 4.767578125, 4.988525390625, 5.20947265625, 5.430419921875, 5.6513671875, 5.872314453125, 6.09326171875, 6.314208984375, 6.53515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 7.0, 9.0, 10.0, 16.0, 15.0, 14.0, 29.0, 25.0, 27.0, 27.0, 36.0, 42.0, 51.0, 52.0, 88.0, 111.0, 257.0, 1569.0, 170.0, 67.0, 59.0, 59.0, 41.0, 29.0, 37.0, 19.0, 23.0, 34.0, 25.0, 14.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0390625, -10.6748046875, -10.310546875, -9.9462890625, -9.58203125, -9.2177734375, -8.853515625, -8.4892578125, -8.125, -7.7607421875, -7.396484375, -7.0322265625, -6.66796875, -6.3037109375, -5.939453125, -5.5751953125, -5.2109375, -4.8466796875, -4.482421875, -4.1181640625, -3.75390625, -3.3896484375, -3.025390625, -2.6611328125, -2.296875, -1.9326171875, -1.568359375, -1.2041015625, -0.83984375, -0.4755859375, -0.111328125, 0.2529296875, 0.6171875, 0.9814453125, 1.345703125, 1.7099609375, 2.07421875, 2.4384765625, 2.802734375, 3.1669921875, 3.53125, 3.8955078125, 4.259765625, 4.6240234375, 4.98828125, 5.3525390625, 5.716796875, 6.0810546875, 6.4453125, 6.8095703125, 7.173828125, 7.5380859375, 7.90234375, 8.2666015625, 8.630859375, 8.9951171875, 9.359375, 9.7236328125, 10.087890625, 10.4521484375, 10.81640625, 11.1806640625, 11.544921875, 11.9091796875, 12.2734375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 7.0, 9.0, 17.0, 17.0, 32.0, 37.0, 51.0, 86.0, 92.0, 186.0, 372.0, 929.0, 3016.0, 15479.0, 233159.0, 2831181.0, 51387.0, 6663.0, 1592.0, 619.0, 268.0, 140.0, 76.0, 84.0, 43.0, 45.0, 27.0, 17.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.468017578125, -17.85791015625, -17.247802734375, -16.6376953125, -16.027587890625, -15.41748046875, -14.807373046875, -14.197265625, -13.587158203125, -12.97705078125, -12.366943359375, -11.7568359375, -11.146728515625, -10.53662109375, -9.926513671875, -9.31640625, -8.706298828125, -8.09619140625, -7.486083984375, -6.8759765625, -6.265869140625, -5.65576171875, -5.045654296875, -4.435546875, -3.825439453125, -3.21533203125, -2.605224609375, -1.9951171875, -1.385009765625, -0.77490234375, -0.164794921875, 0.4453125, 1.055419921875, 1.66552734375, 2.275634765625, 2.8857421875, 3.495849609375, 4.10595703125, 4.716064453125, 5.326171875, 5.936279296875, 6.54638671875, 7.156494140625, 7.7666015625, 8.376708984375, 8.98681640625, 9.596923828125, 10.20703125, 10.817138671875, 11.42724609375, 12.037353515625, 12.6474609375, 13.257568359375, 13.86767578125, 14.477783203125, 15.087890625, 15.697998046875, 16.30810546875, 16.918212890625, 17.5283203125, 18.138427734375, 18.74853515625, 19.358642578125, 19.96875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 21.0, 30.0, 116.0, 254.0, 277.0, 195.0, 74.0, 32.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.020174026489258, -14.71348762512207, -13.406801223754883, -12.100114822387695, -10.793428421020508, -9.48674201965332, -8.180055618286133, -6.873369216918945, -5.566682815551758, -4.25999641418457, -2.953310012817383, -1.6466236114501953, -0.3399372100830078, 0.9667491912841797, 2.273435592651367, 3.5801219940185547, 4.886808395385742, 6.19349479675293, 7.500181198120117, 8.806867599487305, 10.113554000854492, 11.42024040222168, 12.726926803588867, 14.033613204956055, 15.340299606323242, 16.64698600769043, 17.953672409057617, 19.260358810424805, 20.567045211791992, 21.87373161315918, 23.180418014526367, 24.487104415893555, 25.793792724609375, 27.100479125976562, 28.40716552734375, 29.713851928710938, 31.020538330078125, 32.32722473144531, 33.6339111328125, 34.94059753417969, 36.247283935546875, 37.55397033691406, 38.86065673828125, 40.16734313964844, 41.474029541015625, 42.78071594238281, 44.08740234375, 45.39408874511719, 46.700775146484375, 48.00746154785156, 49.31414794921875, 50.62083435058594, 51.927520751953125, 53.23420715332031, 54.5408935546875, 55.84757995605469, 57.154266357421875, 58.46095275878906, 59.76763916015625, 61.07432556152344, 62.381011962890625, 63.68769836425781, 64.994384765625, 66.30107116699219, 67.60775756835938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 4.0, 9.0, 4.0, 8.0, 12.0, 15.0, 26.0, 27.0, 18.0, 29.0, 35.0, 32.0, 29.0, 37.0, 46.0, 48.0, 48.0, 38.0, 43.0, 44.0, 46.0, 41.0, 38.0, 43.0, 28.0, 39.0, 25.0, 23.0, 26.0, 17.0, 18.0, 19.0, 13.0, 15.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.587955474853516, -35.603729248046875, -34.619503021240234, -33.635276794433594, -32.65105056762695, -31.666824340820312, -30.682598114013672, -29.6983699798584, -28.714143753051758, -27.729917526245117, -26.745691299438477, -25.761465072631836, -24.777238845825195, -23.793010711669922, -22.80878448486328, -21.82455825805664, -20.84033203125, -19.85610580444336, -18.87187957763672, -17.887653350830078, -16.903427124023438, -15.91919994354248, -14.93497371673584, -13.950746536254883, -12.966522216796875, -11.982295989990234, -10.998069763183594, -10.013843536376953, -9.029616355895996, -8.045390129089355, -7.061163902282715, -6.076937198638916, -5.092710494995117, -4.108484268188477, -3.1242575645446777, -2.140031337738037, -1.1558048725128174, -0.17157840728759766, 0.812647819519043, 1.7968745231628418, 2.7811007499694824, 3.765327215194702, 4.749553680419922, 5.7337799072265625, 6.718006134033203, 7.702232837677002, 8.686458587646484, 9.670685768127441, 10.654911994934082, 11.639138221740723, 12.623364448547363, 13.60759162902832, 14.591817855834961, 15.576044082641602, 16.560270309448242, 17.544496536254883, 18.528722763061523, 19.512948989868164, 20.497175216674805, 21.481401443481445, 22.465627670288086, 23.44985580444336, 24.43408203125, 25.41830825805664, 26.40253448486328]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 7.0, 11.0, 12.0, 12.0, 17.0, 18.0, 13.0, 14.0, 20.0, 29.0, 25.0, 29.0, 29.0, 26.0, 34.0, 43.0, 42.0, 31.0, 42.0, 41.0, 50.0, 30.0, 45.0, 39.0, 41.0, 32.0, 28.0, 30.0, 33.0, 21.0, 26.0, 12.0, 15.0, 17.0, 10.0, 17.0, 8.0, 5.0, 8.0, 6.0, 8.0, 4.0, 3.0, 10.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.478515625, -3.365692138671875, -3.25286865234375, -3.140045166015625, -3.0272216796875, -2.914398193359375, -2.80157470703125, -2.688751220703125, -2.575927734375, -2.463104248046875, -2.35028076171875, -2.237457275390625, -2.1246337890625, -2.011810302734375, -1.89898681640625, -1.786163330078125, -1.67333984375, -1.560516357421875, -1.44769287109375, -1.334869384765625, -1.2220458984375, -1.109222412109375, -0.99639892578125, -0.883575439453125, -0.770751953125, -0.657928466796875, -0.54510498046875, -0.432281494140625, -0.3194580078125, -0.206634521484375, -0.09381103515625, 0.019012451171875, 0.1318359375, 0.244659423828125, 0.35748291015625, 0.470306396484375, 0.5831298828125, 0.695953369140625, 0.80877685546875, 0.921600341796875, 1.034423828125, 1.147247314453125, 1.26007080078125, 1.372894287109375, 1.4857177734375, 1.598541259765625, 1.71136474609375, 1.824188232421875, 1.93701171875, 2.049835205078125, 2.16265869140625, 2.275482177734375, 2.3883056640625, 2.501129150390625, 2.61395263671875, 2.726776123046875, 2.839599609375, 2.952423095703125, 3.06524658203125, 3.178070068359375, 3.2908935546875, 3.403717041015625, 3.51654052734375, 3.629364013671875, 3.7421875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 6.0, 18.0, 18.0, 27.0, 40.0, 48.0, 85.0, 136.0, 221.0, 366.0, 600.0, 1083.0, 1885.0, 3800.0, 7936.0, 17823.0, 48403.0, 232222.0, 1652444.0, 1876167.0, 261764.0, 52319.0, 18795.0, 8609.0, 4223.0, 2252.0, 1187.0, 670.0, 409.0, 263.0, 174.0, 88.0, 67.0, 43.0, 23.0, 17.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.4761962890625, -6.253173828125, -6.0301513671875, -5.80712890625, -5.5841064453125, -5.361083984375, -5.1380615234375, -4.9150390625, -4.6920166015625, -4.468994140625, -4.2459716796875, -4.02294921875, -3.7999267578125, -3.576904296875, -3.3538818359375, -3.130859375, -2.9078369140625, -2.684814453125, -2.4617919921875, -2.23876953125, -2.0157470703125, -1.792724609375, -1.5697021484375, -1.3466796875, -1.1236572265625, -0.900634765625, -0.6776123046875, -0.45458984375, -0.2315673828125, -0.008544921875, 0.2144775390625, 0.4375, 0.6605224609375, 0.883544921875, 1.1065673828125, 1.32958984375, 1.5526123046875, 1.775634765625, 1.9986572265625, 2.2216796875, 2.4447021484375, 2.667724609375, 2.8907470703125, 3.11376953125, 3.3367919921875, 3.559814453125, 3.7828369140625, 4.005859375, 4.2288818359375, 4.451904296875, 4.6749267578125, 4.89794921875, 5.1209716796875, 5.343994140625, 5.5670166015625, 5.7900390625, 6.0130615234375, 6.236083984375, 6.4591064453125, 6.68212890625, 6.9051513671875, 7.128173828125, 7.3511962890625, 7.57421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 8.0, 5.0, 12.0, 20.0, 17.0, 29.0, 36.0, 52.0, 94.0, 118.0, 157.0, 324.0, 531.0, 765.0, 686.0, 430.0, 257.0, 159.0, 110.0, 67.0, 46.0, 42.0, 27.0, 19.0, 18.0, 10.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.65234375, -7.39569091796875, -7.1390380859375, -6.88238525390625, -6.625732421875, -6.36907958984375, -6.1124267578125, -5.85577392578125, -5.59912109375, -5.34246826171875, -5.0858154296875, -4.82916259765625, -4.572509765625, -4.31585693359375, -4.0592041015625, -3.80255126953125, -3.5458984375, -3.28924560546875, -3.0325927734375, -2.77593994140625, -2.519287109375, -2.26263427734375, -2.0059814453125, -1.74932861328125, -1.49267578125, -1.23602294921875, -0.9793701171875, -0.72271728515625, -0.466064453125, -0.20941162109375, 0.0472412109375, 0.30389404296875, 0.560546875, 0.81719970703125, 1.0738525390625, 1.33050537109375, 1.587158203125, 1.84381103515625, 2.1004638671875, 2.35711669921875, 2.61376953125, 2.87042236328125, 3.1270751953125, 3.38372802734375, 3.640380859375, 3.89703369140625, 4.1536865234375, 4.41033935546875, 4.6669921875, 4.92364501953125, 5.1802978515625, 5.43695068359375, 5.693603515625, 5.95025634765625, 6.2069091796875, 6.46356201171875, 6.72021484375, 6.97686767578125, 7.2335205078125, 7.49017333984375, 7.746826171875, 8.00347900390625, 8.2601318359375, 8.51678466796875, 8.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 60.0, 82.0, 141.0, 278.0, 622.0, 2339.0, 17320.0, 564935.0, 3549130.0, 52812.0, 4631.0, 979.0, 366.0, 193.0, 94.0, 58.0, 34.0, 18.0, 27.0, 13.0, 6.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.390625, -25.618896484375, -24.84716796875, -24.075439453125, -23.3037109375, -22.531982421875, -21.76025390625, -20.988525390625, -20.216796875, -19.445068359375, -18.67333984375, -17.901611328125, -17.1298828125, -16.358154296875, -15.58642578125, -14.814697265625, -14.04296875, -13.271240234375, -12.49951171875, -11.727783203125, -10.9560546875, -10.184326171875, -9.41259765625, -8.640869140625, -7.869140625, -7.097412109375, -6.32568359375, -5.553955078125, -4.7822265625, -4.010498046875, -3.23876953125, -2.467041015625, -1.6953125, -0.923583984375, -0.15185546875, 0.619873046875, 1.3916015625, 2.163330078125, 2.93505859375, 3.706787109375, 4.478515625, 5.250244140625, 6.02197265625, 6.793701171875, 7.5654296875, 8.337158203125, 9.10888671875, 9.880615234375, 10.65234375, 11.424072265625, 12.19580078125, 12.967529296875, 13.7392578125, 14.510986328125, 15.28271484375, 16.054443359375, 16.826171875, 17.597900390625, 18.36962890625, 19.141357421875, 19.9130859375, 20.684814453125, 21.45654296875, 22.228271484375, 23.0]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 59.0, 278.0, 515.0, 128.0, 23.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-216.75743103027344, -212.90518188476562, -209.0529327392578, -205.20069885253906, -201.34844970703125, -197.49620056152344, -193.64395141601562, -189.79171752929688, -185.93946838378906, -182.08721923828125, -178.23497009277344, -174.3827362060547, -170.53048706054688, -166.67823791503906, -162.82598876953125, -158.9737548828125, -155.1215057373047, -151.26925659179688, -147.41700744628906, -143.5647735595703, -139.7125244140625, -135.8602752685547, -132.00802612304688, -128.15579223632812, -124.30353546142578, -120.45128631591797, -116.59904479980469, -112.74679565429688, -108.8945541381836, -105.04230499267578, -101.1900634765625, -97.33781433105469, -93.48558044433594, -89.63333129882812, -85.78108978271484, -81.92884063720703, -78.07659912109375, -74.22434997558594, -70.37210845947266, -66.51985931396484, -62.66761016845703, -58.815364837646484, -54.96311950683594, -51.11087417602539, -47.258628845214844, -43.40637969970703, -39.55413818359375, -35.70188903808594, -31.849647521972656, -27.99740219116211, -24.145156860351562, -20.292911529541016, -16.44066619873047, -12.588418960571289, -8.736173629760742, -4.883928298950195, -1.0316829681396484, 2.8205626010894775, 6.6728081703186035, 10.525053977966309, 14.377299308776855, 18.22954559326172, 22.081790924072266, 25.934036254882812, 29.78628158569336]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 10.0, 14.0, 6.0, 22.0, 18.0, 20.0, 35.0, 28.0, 38.0, 37.0, 40.0, 38.0, 42.0, 42.0, 45.0, 48.0, 53.0, 44.0, 36.0, 44.0, 42.0, 29.0, 40.0, 23.0, 26.0, 26.0, 21.0, 22.0, 21.0, 19.0, 9.0, 6.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.454151153564453, -22.71558380126953, -21.977014541625977, -21.238447189331055, -20.4998779296875, -19.761310577392578, -19.022743225097656, -18.284175872802734, -17.54560661315918, -16.807039260864258, -16.068470001220703, -15.329902648925781, -14.591334342956543, -13.852766036987305, -13.114198684692383, -12.375630378723145, -11.637062072753906, -10.898493766784668, -10.15992546081543, -9.421358108520508, -8.68278980255127, -7.944221496582031, -7.205653667449951, -6.467085838317871, -5.728517532348633, -4.9899492263793945, -4.2513813972473145, -3.5128133296966553, -2.774245262145996, -2.035677194595337, -1.2971091270446777, -0.5585412979125977, 0.18002891540527344, 0.9185969829559326, 1.6571650505065918, 2.395733118057251, 3.13430118560791, 3.8728692531585693, 4.6114373207092285, 5.350005149841309, 6.088573455810547, 6.827141761779785, 7.565709590911865, 8.304277420043945, 9.042845726013184, 9.781414031982422, 10.519981384277344, 11.258549690246582, 11.99711799621582, 12.735686302185059, 13.474254608154297, 14.212821960449219, 14.951390266418457, 15.689958572387695, 16.428525924682617, 17.167095184326172, 17.905662536621094, 18.644229888916016, 19.38279914855957, 20.121366500854492, 20.859935760498047, 21.59850311279297, 22.33707046508789, 23.075637817382812, 23.814207077026367]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 9.0, 10.0, 16.0, 22.0, 14.0, 28.0, 28.0, 27.0, 31.0, 42.0, 36.0, 42.0, 47.0, 45.0, 44.0, 49.0, 41.0, 42.0, 47.0, 40.0, 43.0, 29.0, 31.0, 31.0, 38.0, 28.0, 16.0, 15.0, 16.0, 16.0, 12.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.15234375, -4.02862548828125, -3.9049072265625, -3.78118896484375, -3.657470703125, -3.53375244140625, -3.4100341796875, -3.28631591796875, -3.16259765625, -3.03887939453125, -2.9151611328125, -2.79144287109375, -2.667724609375, -2.54400634765625, -2.4202880859375, -2.29656982421875, -2.1728515625, -2.04913330078125, -1.9254150390625, -1.80169677734375, -1.677978515625, -1.55426025390625, -1.4305419921875, -1.30682373046875, -1.18310546875, -1.05938720703125, -0.9356689453125, -0.81195068359375, -0.688232421875, -0.56451416015625, -0.4407958984375, -0.31707763671875, -0.193359375, -0.06964111328125, 0.0540771484375, 0.17779541015625, 0.301513671875, 0.42523193359375, 0.5489501953125, 0.67266845703125, 0.79638671875, 0.92010498046875, 1.0438232421875, 1.16754150390625, 1.291259765625, 1.41497802734375, 1.5386962890625, 1.66241455078125, 1.7861328125, 1.90985107421875, 2.0335693359375, 2.15728759765625, 2.281005859375, 2.40472412109375, 2.5284423828125, 2.65216064453125, 2.77587890625, 2.89959716796875, 3.0233154296875, 3.14703369140625, 3.270751953125, 3.39447021484375, 3.5181884765625, 3.64190673828125, 3.765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 12.0, 28.0, 37.0, 47.0, 58.0, 101.0, 150.0, 175.0, 236.0, 333.0, 456.0, 658.0, 962.0, 1445.0, 2505.0, 5621.0, 45421.0, 927898.0, 49286.0, 5743.0, 2502.0, 1529.0, 997.0, 656.0, 488.0, 371.0, 224.0, 181.0, 130.0, 99.0, 66.0, 40.0, 33.0, 19.0, 15.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.5400390625, -4.400390625, -4.2607421875, -4.12109375, -3.9814453125, -3.841796875, -3.7021484375, -3.5625, -3.4228515625, -3.283203125, -3.1435546875, -3.00390625, -2.8642578125, -2.724609375, -2.5849609375, -2.4453125, -2.3056640625, -2.166015625, -2.0263671875, -1.88671875, -1.7470703125, -1.607421875, -1.4677734375, -1.328125, -1.1884765625, -1.048828125, -0.9091796875, -0.76953125, -0.6298828125, -0.490234375, -0.3505859375, -0.2109375, -0.0712890625, 0.068359375, 0.2080078125, 0.34765625, 0.4873046875, 0.626953125, 0.7666015625, 0.90625, 1.0458984375, 1.185546875, 1.3251953125, 1.46484375, 1.6044921875, 1.744140625, 1.8837890625, 2.0234375, 2.1630859375, 2.302734375, 2.4423828125, 2.58203125, 2.7216796875, 2.861328125, 3.0009765625, 3.140625, 3.2802734375, 3.419921875, 3.5595703125, 3.69921875, 3.8388671875, 3.978515625, 4.1181640625, 4.2578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 1.0, 12.0, 14.0, 17.0, 10.0, 10.0, 11.0, 18.0, 26.0, 27.0, 17.0, 32.0, 32.0, 43.0, 41.0, 37.0, 31.0, 52.0, 1058.0, 49.0, 42.0, 41.0, 30.0, 35.0, 39.0, 26.0, 36.0, 33.0, 36.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 9.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.66796875, -2.588836669921875, -2.50970458984375, -2.430572509765625, -2.3514404296875, -2.272308349609375, -2.19317626953125, -2.114044189453125, -2.034912109375, -1.955780029296875, -1.87664794921875, -1.797515869140625, -1.7183837890625, -1.639251708984375, -1.56011962890625, -1.480987548828125, -1.40185546875, -1.322723388671875, -1.24359130859375, -1.164459228515625, -1.0853271484375, -1.006195068359375, -0.92706298828125, -0.847930908203125, -0.768798828125, -0.689666748046875, -0.61053466796875, -0.531402587890625, -0.4522705078125, -0.373138427734375, -0.29400634765625, -0.214874267578125, -0.1357421875, -0.056610107421875, 0.02252197265625, 0.101654052734375, 0.1807861328125, 0.259918212890625, 0.33905029296875, 0.418182373046875, 0.497314453125, 0.576446533203125, 0.65557861328125, 0.734710693359375, 0.8138427734375, 0.892974853515625, 0.97210693359375, 1.051239013671875, 1.13037109375, 1.209503173828125, 1.28863525390625, 1.367767333984375, 1.4468994140625, 1.526031494140625, 1.60516357421875, 1.684295654296875, 1.763427734375, 1.842559814453125, 1.92169189453125, 2.000823974609375, 2.0799560546875, 2.159088134765625, 2.23822021484375, 2.317352294921875, 2.396484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 5.0, 9.0, 6.0, 13.0, 19.0, 39.0, 48.0, 63.0, 81.0, 137.0, 185.0, 257.0, 390.0, 578.0, 797.0, 1393.0, 2353.0, 5039.0, 18022.0, 406766.0, 1620585.0, 27345.0, 5955.0, 2713.0, 1430.0, 944.0, 568.0, 416.0, 287.0, 198.0, 163.0, 104.0, 64.0, 42.0, 35.0, 23.0, 20.0, 12.0, 11.0, 6.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.13671875, -2.0758514404296875, -2.014984130859375, -1.9541168212890625, -1.89324951171875, -1.8323822021484375, -1.771514892578125, -1.7106475830078125, -1.6497802734375, -1.5889129638671875, -1.528045654296875, -1.4671783447265625, -1.40631103515625, -1.3454437255859375, -1.284576416015625, -1.2237091064453125, -1.162841796875, -1.1019744873046875, -1.041107177734375, -0.9802398681640625, -0.91937255859375, -0.8585052490234375, -0.797637939453125, -0.7367706298828125, -0.6759033203125, -0.6150360107421875, -0.554168701171875, -0.4933013916015625, -0.43243408203125, -0.3715667724609375, -0.310699462890625, -0.2498321533203125, -0.18896484375, -0.1280975341796875, -0.067230224609375, -0.0063629150390625, 0.05450439453125, 0.1153717041015625, 0.176239013671875, 0.2371063232421875, 0.2979736328125, 0.3588409423828125, 0.419708251953125, 0.4805755615234375, 0.54144287109375, 0.6023101806640625, 0.663177490234375, 0.7240447998046875, 0.784912109375, 0.8457794189453125, 0.906646728515625, 0.9675140380859375, 1.02838134765625, 1.0892486572265625, 1.150115966796875, 1.2109832763671875, 1.2718505859375, 1.3327178955078125, 1.393585205078125, 1.4544525146484375, 1.51531982421875, 1.5761871337890625, 1.637054443359375, 1.6979217529296875, 1.7587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 6.0, 9.0, 18.0, 18.0, 8.0, 20.0, 26.0, 31.0, 48.0, 100.0, 206.0, 168.0, 95.0, 63.0, 43.0, 28.0, 21.0, 14.0, 14.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09587287902832031, -0.09305191040039062, -0.09023094177246094, -0.08740997314453125, -0.08458900451660156, -0.08176803588867188, -0.07894706726074219, -0.0761260986328125, -0.07330513000488281, -0.07048416137695312, -0.06766319274902344, -0.06484222412109375, -0.06202125549316406, -0.059200286865234375, -0.05637931823730469, -0.053558349609375, -0.05073738098144531, -0.047916412353515625, -0.04509544372558594, -0.04227447509765625, -0.03945350646972656, -0.036632537841796875, -0.03381156921386719, -0.0309906005859375, -0.028169631958007812, -0.025348663330078125, -0.022527694702148438, -0.01970672607421875, -0.016885757446289062, -0.014064788818359375, -0.011243820190429688, -0.0084228515625, -0.0056018829345703125, -0.002780914306640625, 4.00543212890625e-05, 0.00286102294921875, 0.0056819915771484375, 0.008502960205078125, 0.011323928833007812, 0.0141448974609375, 0.016965866088867188, 0.019786834716796875, 0.022607803344726562, 0.02542877197265625, 0.028249740600585938, 0.031070709228515625, 0.03389167785644531, 0.036712646484375, 0.03953361511230469, 0.042354583740234375, 0.04517555236816406, 0.04799652099609375, 0.05081748962402344, 0.053638458251953125, 0.05645942687988281, 0.0592803955078125, 0.06210136413574219, 0.06492233276367188, 0.06774330139160156, 0.07056427001953125, 0.07338523864746094, 0.07620620727539062, 0.07902717590332031, 0.08184814453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 14.0, 18.0, 38.0, 49.0, 104.0, 221.0, 1116.0, 1040445.0, 5819.0, 336.0, 124.0, 62.0, 41.0, 26.0, 13.0, 19.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.962249755859375, -1.89129638671875, -1.820343017578125, -1.7493896484375, -1.678436279296875, -1.60748291015625, -1.536529541015625, -1.465576171875, -1.394622802734375, -1.32366943359375, -1.252716064453125, -1.1817626953125, -1.110809326171875, -1.03985595703125, -0.968902587890625, -0.89794921875, -0.826995849609375, -0.75604248046875, -0.685089111328125, -0.6141357421875, -0.543182373046875, -0.47222900390625, -0.401275634765625, -0.330322265625, -0.259368896484375, -0.18841552734375, -0.117462158203125, -0.0465087890625, 0.024444580078125, 0.09539794921875, 0.166351318359375, 0.2373046875, 0.308258056640625, 0.37921142578125, 0.450164794921875, 0.5211181640625, 0.592071533203125, 0.66302490234375, 0.733978271484375, 0.804931640625, 0.875885009765625, 0.94683837890625, 1.017791748046875, 1.0887451171875, 1.159698486328125, 1.23065185546875, 1.301605224609375, 1.37255859375, 1.443511962890625, 1.51446533203125, 1.585418701171875, 1.6563720703125, 1.727325439453125, 1.79827880859375, 1.869232177734375, 1.940185546875, 2.011138916015625, 2.08209228515625, 2.153045654296875, 2.2239990234375, 2.294952392578125, 2.36590576171875, 2.436859130859375, 2.5078125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 6.0, 34.0, 92.0, 325.0, 385.0, 135.0, 28.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06273401528596878, -0.05401284620165825, -0.04529167711734772, -0.036570508033037186, -0.027849338948726654, -0.019128169864416122, -0.01040700078010559, -0.0016858316957950592, 0.007035337388515472, 0.015756506472826004, 0.024477675557136536, 0.03319884464144707, 0.0419200137257576, 0.05064118281006813, 0.05936235189437866, 0.06808352470397949, 0.07680469006299973, 0.08552585542201996, 0.09424702823162079, 0.10296820104122162, 0.11168936640024185, 0.12041053175926208, 0.12913170456886292, 0.13785287737846375, 0.14657405018806458, 0.1552952229976654, 0.16401639580726624, 0.17273755371570587, 0.1814587265253067, 0.19017989933490753, 0.19890105724334717, 0.207622230052948, 0.21634337306022644, 0.22506454586982727, 0.2337857186794281, 0.24250687658786774, 0.2512280344963074, 0.2599492073059082, 0.26867038011550903, 0.27739155292510986, 0.2861127257347107, 0.2948338985443115, 0.30355507135391235, 0.3122762441635132, 0.320997416973114, 0.32971855998039246, 0.3384397327899933, 0.3471609055995941, 0.35588207840919495, 0.3646032512187958, 0.3733244240283966, 0.38204559683799744, 0.3907667398452759, 0.3994879126548767, 0.40820908546447754, 0.41693025827407837, 0.4256514310836792, 0.43437260389328003, 0.44309377670288086, 0.4518149495124817, 0.4605361223220825, 0.46925726532936096, 0.4779784381389618, 0.4866996109485626, 0.49542078375816345]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 11.0, 13.0, 3.0, 13.0, 15.0, 25.0, 11.0, 25.0, 21.0, 33.0, 38.0, 36.0, 39.0, 43.0, 54.0, 33.0, 53.0, 49.0, 47.0, 47.0, 34.0, 37.0, 31.0, 42.0, 34.0, 30.0, 27.0, 23.0, 18.0, 27.0, 16.0, 11.0, 10.0, 8.0, 9.0, 9.0, 9.0, 10.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07050657272338867, -0.06814620643854141, -0.06578584015369415, -0.06342548131942749, -0.06106511503458023, -0.05870474874973297, -0.05634438619017601, -0.05398402363061905, -0.05162365734577179, -0.04926329106092453, -0.04690292850136757, -0.04454256594181061, -0.04218219965696335, -0.03982183337211609, -0.03746147081255913, -0.03510110825300217, -0.03274074196815491, -0.030380377545952797, -0.028020013123750687, -0.025659648701548576, -0.023299284279346466, -0.020938919857144356, -0.018578555434942245, -0.016218191012740135, -0.013857826590538025, -0.011497462168335915, -0.009137097746133804, -0.006776733323931694, -0.004416368901729584, -0.0020560044795274734, 0.00030435994267463684, 0.002664724364876747, 0.005025088787078857, 0.007385453209280968, 0.009745817631483078, 0.012106182053685188, 0.014466546475887299, 0.01682691089808941, 0.01918727532029152, 0.02154763974249363, 0.02390800416469574, 0.02626836858689785, 0.02862873300909996, 0.03098909743130207, 0.03334946185350418, 0.03570982813835144, 0.0380701906979084, 0.04043055325746536, 0.04279091954231262, 0.04515128582715988, 0.04751164838671684, 0.049872010946273804, 0.05223237723112106, 0.05459274351596832, 0.056953106075525284, 0.059313468635082245, 0.061673834919929504, 0.06403420120477676, 0.06639456748962402, 0.06875492632389069, 0.07111529260873795, 0.0734756588935852, 0.07583601772785187, 0.07819638401269913, 0.08055675029754639]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 14.0, 13.0, 12.0, 23.0, 33.0, 22.0, 25.0, 36.0, 30.0, 43.0, 42.0, 39.0, 40.0, 45.0, 34.0, 39.0, 33.0, 44.0, 52.0, 46.0, 38.0, 40.0, 26.0, 27.0, 26.0, 37.0, 20.0, 20.0, 20.0, 10.0, 6.0, 13.0, 10.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.830535888671875, -3.70989990234375, -3.589263916015625, -3.4686279296875, -3.347991943359375, -3.22735595703125, -3.106719970703125, -2.986083984375, -2.865447998046875, -2.74481201171875, -2.624176025390625, -2.5035400390625, -2.382904052734375, -2.26226806640625, -2.141632080078125, -2.02099609375, -1.900360107421875, -1.77972412109375, -1.659088134765625, -1.5384521484375, -1.417816162109375, -1.29718017578125, -1.176544189453125, -1.055908203125, -0.935272216796875, -0.81463623046875, -0.694000244140625, -0.5733642578125, -0.452728271484375, -0.33209228515625, -0.211456298828125, -0.0908203125, 0.029815673828125, 0.15045166015625, 0.271087646484375, 0.3917236328125, 0.512359619140625, 0.63299560546875, 0.753631591796875, 0.874267578125, 0.994903564453125, 1.11553955078125, 1.236175537109375, 1.3568115234375, 1.477447509765625, 1.59808349609375, 1.718719482421875, 1.83935546875, 1.959991455078125, 2.08062744140625, 2.201263427734375, 2.3218994140625, 2.442535400390625, 2.56317138671875, 2.683807373046875, 2.804443359375, 2.925079345703125, 3.04571533203125, 3.166351318359375, 3.2869873046875, 3.407623291015625, 3.52825927734375, 3.648895263671875, 3.76953125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 8.0, 10.0, 14.0, 22.0, 15.0, 36.0, 51.0, 98.0, 182.0, 263.0, 467.0, 814.0, 1392.0, 2553.0, 4555.0, 8625.0, 16743.0, 33556.0, 70581.0, 170923.0, 386490.0, 196624.0, 78662.0, 36677.0, 18382.0, 9366.0, 5042.0, 2701.0, 1507.0, 922.0, 495.0, 293.0, 161.0, 114.0, 70.0, 36.0, 29.0, 19.0, 13.0, 14.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.65234375, -6.45416259765625, -6.2559814453125, -6.05780029296875, -5.859619140625, -5.66143798828125, -5.4632568359375, -5.26507568359375, -5.06689453125, -4.86871337890625, -4.6705322265625, -4.47235107421875, -4.274169921875, -4.07598876953125, -3.8778076171875, -3.67962646484375, -3.4814453125, -3.28326416015625, -3.0850830078125, -2.88690185546875, -2.688720703125, -2.49053955078125, -2.2923583984375, -2.09417724609375, -1.89599609375, -1.69781494140625, -1.4996337890625, -1.30145263671875, -1.103271484375, -0.90509033203125, -0.7069091796875, -0.50872802734375, -0.310546875, -0.11236572265625, 0.0858154296875, 0.28399658203125, 0.482177734375, 0.68035888671875, 0.8785400390625, 1.07672119140625, 1.27490234375, 1.47308349609375, 1.6712646484375, 1.86944580078125, 2.067626953125, 2.26580810546875, 2.4639892578125, 2.66217041015625, 2.8603515625, 3.05853271484375, 3.2567138671875, 3.45489501953125, 3.653076171875, 3.85125732421875, 4.0494384765625, 4.24761962890625, 4.44580078125, 4.64398193359375, 4.8421630859375, 5.04034423828125, 5.238525390625, 5.43670654296875, 5.6348876953125, 5.83306884765625, 6.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 8.0, 11.0, 17.0, 13.0, 19.0, 17.0, 23.0, 31.0, 24.0, 33.0, 45.0, 46.0, 48.0, 56.0, 90.0, 104.0, 169.0, 1367.0, 245.0, 144.0, 91.0, 44.0, 43.0, 36.0, 35.0, 40.0, 25.0, 24.0, 25.0, 23.0, 27.0, 15.0, 19.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 7.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.43505859375, -9.1279296875, -8.82080078125, -8.513671875, -8.20654296875, -7.8994140625, -7.59228515625, -7.28515625, -6.97802734375, -6.6708984375, -6.36376953125, -6.056640625, -5.74951171875, -5.4423828125, -5.13525390625, -4.828125, -4.52099609375, -4.2138671875, -3.90673828125, -3.599609375, -3.29248046875, -2.9853515625, -2.67822265625, -2.37109375, -2.06396484375, -1.7568359375, -1.44970703125, -1.142578125, -0.83544921875, -0.5283203125, -0.22119140625, 0.0859375, 0.39306640625, 0.7001953125, 1.00732421875, 1.314453125, 1.62158203125, 1.9287109375, 2.23583984375, 2.54296875, 2.85009765625, 3.1572265625, 3.46435546875, 3.771484375, 4.07861328125, 4.3857421875, 4.69287109375, 5.0, 5.30712890625, 5.6142578125, 5.92138671875, 6.228515625, 6.53564453125, 6.8427734375, 7.14990234375, 7.45703125, 7.76416015625, 8.0712890625, 8.37841796875, 8.685546875, 8.99267578125, 9.2998046875, 9.60693359375, 9.9140625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 15.0, 9.0, 19.0, 15.0, 36.0, 32.0, 69.0, 112.0, 187.0, 376.0, 701.0, 1793.0, 4835.0, 18409.0, 118770.0, 2476881.0, 465775.0, 43428.0, 9224.0, 2744.0, 1123.0, 513.0, 267.0, 143.0, 71.0, 44.0, 29.0, 22.0, 20.0, 8.0, 7.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.234375, -13.721435546875, -13.20849609375, -12.695556640625, -12.1826171875, -11.669677734375, -11.15673828125, -10.643798828125, -10.130859375, -9.617919921875, -9.10498046875, -8.592041015625, -8.0791015625, -7.566162109375, -7.05322265625, -6.540283203125, -6.02734375, -5.514404296875, -5.00146484375, -4.488525390625, -3.9755859375, -3.462646484375, -2.94970703125, -2.436767578125, -1.923828125, -1.410888671875, -0.89794921875, -0.385009765625, 0.1279296875, 0.640869140625, 1.15380859375, 1.666748046875, 2.1796875, 2.692626953125, 3.20556640625, 3.718505859375, 4.2314453125, 4.744384765625, 5.25732421875, 5.770263671875, 6.283203125, 6.796142578125, 7.30908203125, 7.822021484375, 8.3349609375, 8.847900390625, 9.36083984375, 9.873779296875, 10.38671875, 10.899658203125, 11.41259765625, 11.925537109375, 12.4384765625, 12.951416015625, 13.46435546875, 13.977294921875, 14.490234375, 15.003173828125, 15.51611328125, 16.029052734375, 16.5419921875, 17.054931640625, 17.56787109375, 18.080810546875, 18.59375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 17.0, 205.0, 531.0, 226.0, 30.0, 5.0, 1.0], "bins": [-228.764404296875, -224.92250061035156, -221.08059692382812, -217.23870849609375, -213.3968048095703, -209.55490112304688, -205.71299743652344, -201.87110900878906, -198.02920532226562, -194.1873016357422, -190.34539794921875, -186.50350952148438, -182.66160583496094, -178.8197021484375, -174.97779846191406, -171.1359100341797, -167.29400634765625, -163.4521026611328, -159.61019897460938, -155.768310546875, -151.92640686035156, -148.08450317382812, -144.2425994873047, -140.4007110595703, -136.55880737304688, -132.71690368652344, -128.875, -125.0331039428711, -121.19120788574219, -117.34930419921875, -113.50740814208984, -109.6655044555664, -105.82360076904297, -101.98169708251953, -98.13980102539062, -94.29789733886719, -90.45600128173828, -86.61409759521484, -82.77220153808594, -78.9302978515625, -75.08839416503906, -71.24649047851562, -67.40459442138672, -63.56269454956055, -59.720794677734375, -55.87889099121094, -52.03699493408203, -48.195091247558594, -44.35319519042969, -40.511295318603516, -36.669395446777344, -32.82749557495117, -28.985595703125, -25.143693923950195, -21.301794052124023, -17.45989418029785, -13.617996215820312, -9.77609634399414, -5.9341959953308105, -2.0922956466674805, 1.7496042251586914, 5.59150505065918, 9.433404922485352, 13.275304794311523, 17.117204666137695]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 14.0, 22.0, 15.0, 20.0, 13.0, 28.0, 26.0, 24.0, 35.0, 43.0, 39.0, 40.0, 43.0, 44.0, 37.0, 43.0, 43.0, 42.0, 40.0, 33.0, 31.0, 31.0, 28.0, 37.0, 17.0, 23.0, 30.0, 22.0, 14.0, 21.0, 12.0, 9.0, 11.0, 8.0, 7.0, 5.0, 10.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.797935485839844, -23.97972297668457, -23.161510467529297, -22.343297958374023, -21.52508544921875, -20.706871032714844, -19.888660430908203, -19.070446014404297, -18.252233505249023, -17.43402099609375, -16.615808486938477, -15.797595977783203, -14.979382514953613, -14.16117000579834, -13.342957496643066, -12.524744033813477, -11.70653247833252, -10.888319969177246, -10.070107460021973, -9.251893997192383, -8.43368148803711, -7.615468978881836, -6.7972564697265625, -5.979043483734131, -5.160830974578857, -4.342618465423584, -3.5244054794311523, -2.706192970275879, -1.8879802227020264, -1.0697674751281738, -0.2515549659729004, 0.5666580200195312, 1.3848705291748047, 2.2030832767486572, 3.0212960243225098, 3.839508533477783, 4.657721519470215, 5.475934028625488, 6.294146537780762, 7.112359523773193, 7.930572032928467, 8.748785018920898, 9.566997528076172, 10.385210037231445, 11.203422546386719, 12.021635055541992, 12.839847564697266, 13.658061027526855, 14.476273536682129, 15.294486045837402, 16.112699508666992, 16.930912017822266, 17.74912452697754, 18.567337036132812, 19.385549545288086, 20.20376205444336, 21.021974563598633, 21.840187072753906, 22.65839958190918, 23.476612091064453, 24.294824600219727, 25.113037109375, 25.931251525878906, 26.74946403503418, 27.567676544189453]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 5.0, 9.0, 12.0, 18.0, 12.0, 22.0, 14.0, 29.0, 19.0, 18.0, 33.0, 27.0, 25.0, 28.0, 28.0, 34.0, 33.0, 52.0, 42.0, 43.0, 38.0, 40.0, 44.0, 43.0, 32.0, 32.0, 27.0, 24.0, 32.0, 19.0, 21.0, 17.0, 8.0, 13.0, 18.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-3.341796875, -3.23211669921875, -3.1224365234375, -3.01275634765625, -2.903076171875, -2.79339599609375, -2.6837158203125, -2.57403564453125, -2.46435546875, -2.35467529296875, -2.2449951171875, -2.13531494140625, -2.025634765625, -1.91595458984375, -1.8062744140625, -1.69659423828125, -1.5869140625, -1.47723388671875, -1.3675537109375, -1.25787353515625, -1.148193359375, -1.03851318359375, -0.9288330078125, -0.81915283203125, -0.70947265625, -0.59979248046875, -0.4901123046875, -0.38043212890625, -0.270751953125, -0.16107177734375, -0.0513916015625, 0.05828857421875, 0.16796875, 0.27764892578125, 0.3873291015625, 0.49700927734375, 0.606689453125, 0.71636962890625, 0.8260498046875, 0.93572998046875, 1.04541015625, 1.15509033203125, 1.2647705078125, 1.37445068359375, 1.484130859375, 1.59381103515625, 1.7034912109375, 1.81317138671875, 1.9228515625, 2.03253173828125, 2.1422119140625, 2.25189208984375, 2.361572265625, 2.47125244140625, 2.5809326171875, 2.69061279296875, 2.80029296875, 2.90997314453125, 3.0196533203125, 3.12933349609375, 3.239013671875, 3.34869384765625, 3.4583740234375, 3.56805419921875, 3.677734375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 7.0, 13.0, 15.0, 16.0, 17.0, 25.0, 22.0, 32.0, 41.0, 35.0, 54.0, 55.0, 90.0, 167.0, 326.0, 948.0, 4247.0, 34799.0, 3086677.0, 1042467.0, 19597.0, 3026.0, 742.0, 278.0, 141.0, 85.0, 54.0, 34.0, 50.0, 30.0, 24.0, 20.0, 25.0, 18.0, 10.0, 12.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 2.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.635498046875, -20.91162109375, -20.187744140625, -19.4638671875, -18.739990234375, -18.01611328125, -17.292236328125, -16.568359375, -15.844482421875, -15.12060546875, -14.396728515625, -13.6728515625, -12.948974609375, -12.22509765625, -11.501220703125, -10.77734375, -10.053466796875, -9.32958984375, -8.605712890625, -7.8818359375, -7.157958984375, -6.43408203125, -5.710205078125, -4.986328125, -4.262451171875, -3.53857421875, -2.814697265625, -2.0908203125, -1.366943359375, -0.64306640625, 0.080810546875, 0.8046875, 1.528564453125, 2.25244140625, 2.976318359375, 3.7001953125, 4.424072265625, 5.14794921875, 5.871826171875, 6.595703125, 7.319580078125, 8.04345703125, 8.767333984375, 9.4912109375, 10.215087890625, 10.93896484375, 11.662841796875, 12.38671875, 13.110595703125, 13.83447265625, 14.558349609375, 15.2822265625, 16.006103515625, 16.72998046875, 17.453857421875, 18.177734375, 18.901611328125, 19.62548828125, 20.349365234375, 21.0732421875, 21.797119140625, 22.52099609375, 23.244873046875, 23.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 12.0, 8.0, 19.0, 18.0, 26.0, 31.0, 29.0, 58.0, 66.0, 88.0, 124.0, 202.0, 262.0, 442.0, 581.0, 607.0, 467.0, 271.0, 209.0, 130.0, 100.0, 74.0, 42.0, 48.0, 24.0, 27.0, 18.0, 9.0, 22.0, 10.0, 9.0, 8.0, 4.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.2452392578125, -4.052978515625, -3.8607177734375, -3.66845703125, -3.4761962890625, -3.283935546875, -3.0916748046875, -2.8994140625, -2.7071533203125, -2.514892578125, -2.3226318359375, -2.13037109375, -1.9381103515625, -1.745849609375, -1.5535888671875, -1.361328125, -1.1690673828125, -0.976806640625, -0.7845458984375, -0.59228515625, -0.4000244140625, -0.207763671875, -0.0155029296875, 0.1767578125, 0.3690185546875, 0.561279296875, 0.7535400390625, 0.94580078125, 1.1380615234375, 1.330322265625, 1.5225830078125, 1.71484375, 1.9071044921875, 2.099365234375, 2.2916259765625, 2.48388671875, 2.6761474609375, 2.868408203125, 3.0606689453125, 3.2529296875, 3.4451904296875, 3.637451171875, 3.8297119140625, 4.02197265625, 4.2142333984375, 4.406494140625, 4.5987548828125, 4.791015625, 4.9832763671875, 5.175537109375, 5.3677978515625, 5.56005859375, 5.7523193359375, 5.944580078125, 6.1368408203125, 6.3291015625, 6.5213623046875, 6.713623046875, 6.9058837890625, 7.09814453125, 7.2904052734375, 7.482666015625, 7.6749267578125, 7.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 4.0, 12.0, 13.0, 10.0, 16.0, 26.0, 24.0, 31.0, 37.0, 86.0, 120.0, 223.0, 715.0, 4107.0, 48352.0, 2920003.0, 1185259.0, 30887.0, 3116.0, 617.0, 238.0, 119.0, 58.0, 42.0, 34.0, 20.0, 16.0, 12.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.517333984375, -19.83154296875, -19.145751953125, -18.4599609375, -17.774169921875, -17.08837890625, -16.402587890625, -15.716796875, -15.031005859375, -14.34521484375, -13.659423828125, -12.9736328125, -12.287841796875, -11.60205078125, -10.916259765625, -10.23046875, -9.544677734375, -8.85888671875, -8.173095703125, -7.4873046875, -6.801513671875, -6.11572265625, -5.429931640625, -4.744140625, -4.058349609375, -3.37255859375, -2.686767578125, -2.0009765625, -1.315185546875, -0.62939453125, 0.056396484375, 0.7421875, 1.427978515625, 2.11376953125, 2.799560546875, 3.4853515625, 4.171142578125, 4.85693359375, 5.542724609375, 6.228515625, 6.914306640625, 7.60009765625, 8.285888671875, 8.9716796875, 9.657470703125, 10.34326171875, 11.029052734375, 11.71484375, 12.400634765625, 13.08642578125, 13.772216796875, 14.4580078125, 15.143798828125, 15.82958984375, 16.515380859375, 17.201171875, 17.886962890625, 18.57275390625, 19.258544921875, 19.9443359375, 20.630126953125, 21.31591796875, 22.001708984375, 22.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 17.0, 39.0, 81.0, 181.0, 249.0, 234.0, 123.0, 50.0, 24.0, 12.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.815486907958984, -53.194007873535156, -51.572532653808594, -49.951053619384766, -48.32957458496094, -46.708099365234375, -45.08662033081055, -43.46514129638672, -41.843666076660156, -40.22218704223633, -38.600711822509766, -36.97923278808594, -35.35775375366211, -33.73627471923828, -32.11479949951172, -30.49332046508789, -28.871841430664062, -27.250364303588867, -25.62888526916504, -24.007408142089844, -22.385929107666016, -20.76445198059082, -19.142974853515625, -17.521495819091797, -15.900018692016602, -14.27854061126709, -12.657062530517578, -11.035585403442383, -9.414107322692871, -7.792629241943359, -6.171152114868164, -4.549674034118652, -2.928192138671875, -1.3067142963409424, 0.31476354598999023, 1.9362411499023438, 3.5577192306518555, 5.179197311401367, 6.8006744384765625, 8.422152519226074, 10.043630599975586, 11.665108680725098, 13.28658676147461, 14.908063888549805, 16.529541015625, 18.151020050048828, 19.772497177124023, 21.39397430419922, 23.015453338623047, 24.636930465698242, 26.25840950012207, 27.879886627197266, 29.501365661621094, 31.12284278869629, 32.744319915771484, 34.36579895019531, 35.987274169921875, 37.6087532043457, 39.230228424072266, 40.851707458496094, 42.47318649291992, 44.09466552734375, 45.71614074707031, 47.33761978149414, 48.95909881591797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 8.0, 5.0, 5.0, 7.0, 10.0, 8.0, 15.0, 19.0, 12.0, 15.0, 18.0, 15.0, 18.0, 22.0, 31.0, 28.0, 24.0, 31.0, 27.0, 33.0, 43.0, 25.0, 23.0, 30.0, 47.0, 39.0, 26.0, 47.0, 33.0, 17.0, 44.0, 28.0, 34.0, 31.0, 17.0, 15.0, 20.0, 13.0, 15.0, 19.0, 7.0, 9.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.015356063842773, -16.481029510498047, -15.94670295715332, -15.412375450134277, -14.87804889678955, -14.343722343444824, -13.809394836425781, -13.275068283081055, -12.740741729736328, -12.206415176391602, -11.672088623046875, -11.137761116027832, -10.603434562683105, -10.069108009338379, -9.534780502319336, -9.00045394897461, -8.466127395629883, -7.931800842285156, -7.3974738121032715, -6.863146781921387, -6.32882022857666, -5.794493675231934, -5.260166645050049, -4.725839614868164, -4.1915130615234375, -3.657186269760132, -3.122859477996826, -2.5885326862335205, -2.054205894470215, -1.5198791027069092, -0.9855523109436035, -0.45122551918029785, 0.08310317993164062, 0.6174299716949463, 1.151756763458252, 1.6860835552215576, 2.2204103469848633, 2.754737138748169, 3.2890639305114746, 3.8233907222747803, 4.357717514038086, 4.8920440673828125, 5.426371097564697, 5.960698127746582, 6.495024681091309, 7.029351234436035, 7.56367826461792, 8.098005294799805, 8.632331848144531, 9.166658401489258, 9.700984954833984, 10.235312461853027, 10.769639015197754, 11.30396556854248, 11.838293075561523, 12.37261962890625, 12.906946182250977, 13.441272735595703, 13.97559928894043, 14.509926795959473, 15.0442533493042, 15.578579902648926, 16.11290740966797, 16.647233963012695, 17.181560516357422]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 10.0, 17.0, 13.0, 22.0, 15.0, 17.0, 19.0, 25.0, 27.0, 23.0, 30.0, 40.0, 34.0, 38.0, 40.0, 39.0, 52.0, 42.0, 51.0, 36.0, 35.0, 39.0, 30.0, 31.0, 37.0, 26.0, 27.0, 23.0, 22.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.326690673828125, -3.21002197265625, -3.093353271484375, -2.9766845703125, -2.860015869140625, -2.74334716796875, -2.626678466796875, -2.510009765625, -2.393341064453125, -2.27667236328125, -2.160003662109375, -2.0433349609375, -1.926666259765625, -1.80999755859375, -1.693328857421875, -1.57666015625, -1.459991455078125, -1.34332275390625, -1.226654052734375, -1.1099853515625, -0.993316650390625, -0.87664794921875, -0.759979248046875, -0.643310546875, -0.526641845703125, -0.40997314453125, -0.293304443359375, -0.1766357421875, -0.059967041015625, 0.05670166015625, 0.173370361328125, 0.2900390625, 0.406707763671875, 0.52337646484375, 0.640045166015625, 0.7567138671875, 0.873382568359375, 0.99005126953125, 1.106719970703125, 1.223388671875, 1.340057373046875, 1.45672607421875, 1.573394775390625, 1.6900634765625, 1.806732177734375, 1.92340087890625, 2.040069580078125, 2.15673828125, 2.273406982421875, 2.39007568359375, 2.506744384765625, 2.6234130859375, 2.740081787109375, 2.85675048828125, 2.973419189453125, 3.090087890625, 3.206756591796875, 3.32342529296875, 3.440093994140625, 3.5567626953125, 3.673431396484375, 3.79010009765625, 3.906768798828125, 4.0234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 12.0, 22.0, 24.0, 46.0, 66.0, 92.0, 125.0, 225.0, 312.0, 451.0, 798.0, 1211.0, 2059.0, 3612.0, 6373.0, 12117.0, 23867.0, 48701.0, 105548.0, 228162.0, 297256.0, 167144.0, 75469.0, 35508.0, 17512.0, 9451.0, 4994.0, 2934.0, 1648.0, 990.0, 647.0, 401.0, 233.0, 199.0, 102.0, 75.0, 47.0, 41.0, 29.0, 10.0, 12.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62841796875, -0.6089553833007812, -0.5894927978515625, -0.5700302124023438, -0.550567626953125, -0.5311050415039062, -0.5116424560546875, -0.49217987060546875, -0.47271728515625, -0.45325469970703125, -0.4337921142578125, -0.41432952880859375, -0.394866943359375, -0.37540435791015625, -0.3559417724609375, -0.33647918701171875, -0.3170166015625, -0.29755401611328125, -0.2780914306640625, -0.25862884521484375, -0.239166259765625, -0.21970367431640625, -0.2002410888671875, -0.18077850341796875, -0.16131591796875, -0.14185333251953125, -0.1223907470703125, -0.10292816162109375, -0.083465576171875, -0.06400299072265625, -0.0445404052734375, -0.02507781982421875, -0.005615234375, 0.01384735107421875, 0.0333099365234375, 0.05277252197265625, 0.072235107421875, 0.09169769287109375, 0.1111602783203125, 0.13062286376953125, 0.15008544921875, 0.16954803466796875, 0.1890106201171875, 0.20847320556640625, 0.227935791015625, 0.24739837646484375, 0.2668609619140625, 0.28632354736328125, 0.3057861328125, 0.32524871826171875, 0.3447113037109375, 0.36417388916015625, 0.383636474609375, 0.40309906005859375, 0.4225616455078125, 0.44202423095703125, 0.46148681640625, 0.48094940185546875, 0.5004119873046875, 0.5198745727539062, 0.539337158203125, 0.5587997436523438, 0.5782623291015625, 0.5977249145507812, 0.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 9.0, 5.0, 9.0, 8.0, 14.0, 12.0, 18.0, 17.0, 18.0, 26.0, 30.0, 26.0, 28.0, 35.0, 26.0, 30.0, 45.0, 40.0, 35.0, 43.0, 1068.0, 37.0, 40.0, 44.0, 22.0, 33.0, 34.0, 26.0, 30.0, 31.0, 25.0, 20.0, 21.0, 20.0, 16.0, 14.0, 13.0, 7.0, 9.0, 7.0, 5.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.349609375, -2.27178955078125, -2.1939697265625, -2.11614990234375, -2.038330078125, -1.96051025390625, -1.8826904296875, -1.80487060546875, -1.72705078125, -1.64923095703125, -1.5714111328125, -1.49359130859375, -1.415771484375, -1.33795166015625, -1.2601318359375, -1.18231201171875, -1.1044921875, -1.02667236328125, -0.9488525390625, -0.87103271484375, -0.793212890625, -0.71539306640625, -0.6375732421875, -0.55975341796875, -0.48193359375, -0.40411376953125, -0.3262939453125, -0.24847412109375, -0.170654296875, -0.09283447265625, -0.0150146484375, 0.06280517578125, 0.140625, 0.21844482421875, 0.2962646484375, 0.37408447265625, 0.451904296875, 0.52972412109375, 0.6075439453125, 0.68536376953125, 0.76318359375, 0.84100341796875, 0.9188232421875, 0.99664306640625, 1.074462890625, 1.15228271484375, 1.2301025390625, 1.30792236328125, 1.3857421875, 1.46356201171875, 1.5413818359375, 1.61920166015625, 1.697021484375, 1.77484130859375, 1.8526611328125, 1.93048095703125, 2.00830078125, 2.08612060546875, 2.1639404296875, 2.24176025390625, 2.319580078125, 2.39739990234375, 2.4752197265625, 2.55303955078125, 2.630859375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 14.0, 10.0, 22.0, 52.0, 68.0, 94.0, 150.0, 263.0, 460.0, 875.0, 1841.0, 4058.0, 10031.0, 27741.0, 88276.0, 369074.0, 1330679.0, 182731.0, 51305.0, 17344.0, 6428.0, 2728.0, 1279.0, 659.0, 347.0, 220.0, 115.0, 78.0, 42.0, 28.0, 21.0, 25.0, 15.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.646484375, -0.62762451171875, -0.6087646484375, -0.58990478515625, -0.571044921875, -0.55218505859375, -0.5333251953125, -0.51446533203125, -0.49560546875, -0.47674560546875, -0.4578857421875, -0.43902587890625, -0.420166015625, -0.40130615234375, -0.3824462890625, -0.36358642578125, -0.3447265625, -0.32586669921875, -0.3070068359375, -0.28814697265625, -0.269287109375, -0.25042724609375, -0.2315673828125, -0.21270751953125, -0.19384765625, -0.17498779296875, -0.1561279296875, -0.13726806640625, -0.118408203125, -0.09954833984375, -0.0806884765625, -0.06182861328125, -0.04296875, -0.02410888671875, -0.0052490234375, 0.01361083984375, 0.032470703125, 0.05133056640625, 0.0701904296875, 0.08905029296875, 0.10791015625, 0.12677001953125, 0.1456298828125, 0.16448974609375, 0.183349609375, 0.20220947265625, 0.2210693359375, 0.23992919921875, 0.2587890625, 0.27764892578125, 0.2965087890625, 0.31536865234375, 0.334228515625, 0.35308837890625, 0.3719482421875, 0.39080810546875, 0.40966796875, 0.42852783203125, 0.4473876953125, 0.46624755859375, 0.485107421875, 0.50396728515625, 0.5228271484375, 0.54168701171875, 0.560546875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 13.0, 18.0, 21.0, 27.0, 29.0, 48.0, 72.0, 131.0, 155.0, 140.0, 87.0, 67.0, 33.0, 22.0, 25.0, 14.0, 14.0, 8.0, 15.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10052490234375, -0.09778881072998047, -0.09505271911621094, -0.0923166275024414, -0.08958053588867188, -0.08684444427490234, -0.08410835266113281, -0.08137226104736328, -0.07863616943359375, -0.07590007781982422, -0.07316398620605469, -0.07042789459228516, -0.06769180297851562, -0.0649557113647461, -0.06221961975097656, -0.05948352813720703, -0.0567474365234375, -0.05401134490966797, -0.05127525329589844, -0.048539161682128906, -0.045803070068359375, -0.043066978454589844, -0.04033088684082031, -0.03759479522705078, -0.03485870361328125, -0.03212261199951172, -0.029386520385742188, -0.026650428771972656, -0.023914337158203125, -0.021178245544433594, -0.018442153930664062, -0.01570606231689453, -0.012969970703125, -0.010233879089355469, -0.0074977874755859375, -0.004761695861816406, -0.002025604248046875, 0.0007104873657226562, 0.0034465789794921875, 0.006182670593261719, 0.00891876220703125, 0.011654853820800781, 0.014390945434570312, 0.017127037048339844, 0.019863128662109375, 0.022599220275878906, 0.025335311889648438, 0.02807140350341797, 0.0308074951171875, 0.03354358673095703, 0.03627967834472656, 0.039015769958496094, 0.041751861572265625, 0.044487953186035156, 0.04722404479980469, 0.04996013641357422, 0.05269622802734375, 0.05543231964111328, 0.05816841125488281, 0.060904502868652344, 0.06364059448242188, 0.0663766860961914, 0.06911277770996094, 0.07184886932373047, 0.0745849609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 4.0, 5.0, 8.0, 6.0, 15.0, 16.0, 31.0, 38.0, 68.0, 108.0, 196.0, 487.0, 10561.0, 1032639.0, 3488.0, 399.0, 183.0, 87.0, 65.0, 39.0, 29.0, 21.0, 14.0, 3.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.6268157958984375, -1.565155029296875, -1.5034942626953125, -1.44183349609375, -1.3801727294921875, -1.318511962890625, -1.2568511962890625, -1.1951904296875, -1.1335296630859375, -1.071868896484375, -1.0102081298828125, -0.94854736328125, -0.8868865966796875, -0.825225830078125, -0.7635650634765625, -0.701904296875, -0.6402435302734375, -0.578582763671875, -0.5169219970703125, -0.45526123046875, -0.3936004638671875, -0.331939697265625, -0.2702789306640625, -0.2086181640625, -0.1469573974609375, -0.085296630859375, -0.0236358642578125, 0.03802490234375, 0.0996856689453125, 0.161346435546875, 0.2230072021484375, 0.28466796875, 0.3463287353515625, 0.407989501953125, 0.4696502685546875, 0.53131103515625, 0.5929718017578125, 0.654632568359375, 0.7162933349609375, 0.7779541015625, 0.8396148681640625, 0.901275634765625, 0.9629364013671875, 1.02459716796875, 1.0862579345703125, 1.147918701171875, 1.2095794677734375, 1.271240234375, 1.3329010009765625, 1.394561767578125, 1.4562225341796875, 1.51788330078125, 1.5795440673828125, 1.641204833984375, 1.7028656005859375, 1.7645263671875, 1.8261871337890625, 1.887847900390625, 1.9495086669921875, 2.01116943359375, 2.0728302001953125, 2.134490966796875, 2.1961517333984375, 2.2578125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 18.0, 50.0, 127.0, 292.0, 307.0, 139.0, 39.0, 20.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19680680334568024, -0.18978610634803772, -0.1827654093503952, -0.17574471235275269, -0.16872401535511017, -0.16170331835746765, -0.15468262135982513, -0.14766192436218262, -0.1406412273645401, -0.13362053036689758, -0.12659983336925507, -0.11957913637161255, -0.11255843937397003, -0.10553774237632751, -0.098517045378685, -0.09149634838104248, -0.08447565138339996, -0.07745495438575745, -0.07043425738811493, -0.06341356039047241, -0.056392863392829895, -0.04937216639518738, -0.04235146939754486, -0.035330772399902344, -0.028310075402259827, -0.02128937840461731, -0.014268681406974792, -0.007247984409332275, -0.0002272874116897583, 0.006793409585952759, 0.013814106583595276, 0.020834803581237793, 0.027855515480041504, 0.03487621247768402, 0.04189690947532654, 0.048917606472969055, 0.05593830347061157, 0.06295900046825409, 0.0699796974658966, 0.07700039446353912, 0.08402109146118164, 0.09104178845882416, 0.09806248545646667, 0.10508318245410919, 0.11210387945175171, 0.11912457644939423, 0.12614527344703674, 0.13316597044467926, 0.14018666744232178, 0.1472073644399643, 0.1542280614376068, 0.16124875843524933, 0.16826945543289185, 0.17529015243053436, 0.18231084942817688, 0.1893315464258194, 0.19635224342346191, 0.20337294042110443, 0.21039363741874695, 0.21741433441638947, 0.22443503141403198, 0.2314557284116745, 0.23847642540931702, 0.24549712240695953, 0.25251781940460205]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 8.0, 4.0, 14.0, 13.0, 15.0, 19.0, 17.0, 22.0, 27.0, 35.0, 19.0, 16.0, 34.0, 28.0, 39.0, 36.0, 49.0, 29.0, 40.0, 42.0, 43.0, 32.0, 36.0, 32.0, 35.0, 25.0, 30.0, 34.0, 36.0, 38.0, 21.0, 20.0, 9.0, 16.0, 6.0, 17.0, 8.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.05887115001678467, -0.05697086825966835, -0.05507058650255203, -0.053170304745435715, -0.0512700229883194, -0.04936974123120308, -0.04746945947408676, -0.045569177716970444, -0.043668895959854126, -0.04176861420273781, -0.03986833244562149, -0.03796805068850517, -0.036067768931388855, -0.03416748717427254, -0.03226720541715622, -0.0303669236600399, -0.028466641902923584, -0.026566360145807266, -0.02466607838869095, -0.02276579663157463, -0.020865514874458313, -0.018965233117341995, -0.017064951360225677, -0.01516466960310936, -0.013264387845993042, -0.011364106088876724, -0.009463824331760406, -0.007563542574644089, -0.005663260817527771, -0.0037629790604114532, -0.0018626973032951355, 3.758445382118225e-05, 0.0019378662109375, 0.0038381479680538177, 0.0057384297251701355, 0.007638711482286453, 0.009538993239402771, 0.011439274996519089, 0.013339556753635406, 0.015239838510751724, 0.017140120267868042, 0.01904040202498436, 0.020940683782100677, 0.022840965539216995, 0.024741247296333313, 0.02664152905344963, 0.02854181081056595, 0.030442092567682266, 0.032342374324798584, 0.0342426560819149, 0.03614293783903122, 0.03804321959614754, 0.039943501353263855, 0.04184378311038017, 0.04374406486749649, 0.04564434662461281, 0.047544628381729126, 0.049444910138845444, 0.05134519189596176, 0.05324547365307808, 0.0551457554101944, 0.057046037167310715, 0.05894631892442703, 0.06084660068154335, 0.06274688243865967]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 10.0, 10.0, 13.0, 13.0, 15.0, 12.0, 19.0, 28.0, 27.0, 29.0, 25.0, 28.0, 36.0, 40.0, 31.0, 38.0, 53.0, 33.0, 41.0, 36.0, 46.0, 35.0, 40.0, 50.0, 26.0, 28.0, 32.0, 24.0, 21.0, 16.0, 10.0, 17.0, 10.0, 15.0, 9.0, 13.0, 10.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.46484375, -3.351806640625, -3.23876953125, -3.125732421875, -3.0126953125, -2.899658203125, -2.78662109375, -2.673583984375, -2.560546875, -2.447509765625, -2.33447265625, -2.221435546875, -2.1083984375, -1.995361328125, -1.88232421875, -1.769287109375, -1.65625, -1.543212890625, -1.43017578125, -1.317138671875, -1.2041015625, -1.091064453125, -0.97802734375, -0.864990234375, -0.751953125, -0.638916015625, -0.52587890625, -0.412841796875, -0.2998046875, -0.186767578125, -0.07373046875, 0.039306640625, 0.15234375, 0.265380859375, 0.37841796875, 0.491455078125, 0.6044921875, 0.717529296875, 0.83056640625, 0.943603515625, 1.056640625, 1.169677734375, 1.28271484375, 1.395751953125, 1.5087890625, 1.621826171875, 1.73486328125, 1.847900390625, 1.9609375, 2.073974609375, 2.18701171875, 2.300048828125, 2.4130859375, 2.526123046875, 2.63916015625, 2.752197265625, 2.865234375, 2.978271484375, 3.09130859375, 3.204345703125, 3.3173828125, 3.430419921875, 3.54345703125, 3.656494140625, 3.76953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 13.0, 7.0, 22.0, 33.0, 34.0, 46.0, 75.0, 95.0, 143.0, 218.0, 318.0, 459.0, 633.0, 1098.0, 1560.0, 2568.0, 4209.0, 7114.0, 12260.0, 21829.0, 41952.0, 86594.0, 197439.0, 337472.0, 170293.0, 76044.0, 37525.0, 19880.0, 11169.0, 6599.0, 3872.0, 2507.0, 1562.0, 941.0, 663.0, 437.0, 277.0, 200.0, 123.0, 67.0, 71.0, 45.0, 33.0, 15.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.70550537109375, -4.5399169921875, -4.37432861328125, -4.208740234375, -4.04315185546875, -3.8775634765625, -3.71197509765625, -3.54638671875, -3.38079833984375, -3.2152099609375, -3.04962158203125, -2.884033203125, -2.71844482421875, -2.5528564453125, -2.38726806640625, -2.2216796875, -2.05609130859375, -1.8905029296875, -1.72491455078125, -1.559326171875, -1.39373779296875, -1.2281494140625, -1.06256103515625, -0.89697265625, -0.73138427734375, -0.5657958984375, -0.40020751953125, -0.234619140625, -0.06903076171875, 0.0965576171875, 0.26214599609375, 0.427734375, 0.59332275390625, 0.7589111328125, 0.92449951171875, 1.090087890625, 1.25567626953125, 1.4212646484375, 1.58685302734375, 1.75244140625, 1.91802978515625, 2.0836181640625, 2.24920654296875, 2.414794921875, 2.58038330078125, 2.7459716796875, 2.91156005859375, 3.0771484375, 3.24273681640625, 3.4083251953125, 3.57391357421875, 3.739501953125, 3.90509033203125, 4.0706787109375, 4.23626708984375, 4.40185546875, 4.56744384765625, 4.7330322265625, 4.89862060546875, 5.064208984375, 5.22979736328125, 5.3953857421875, 5.56097412109375, 5.7265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 1.0, 6.0, 6.0, 7.0, 16.0, 16.0, 17.0, 21.0, 16.0, 27.0, 31.0, 31.0, 45.0, 31.0, 70.0, 82.0, 113.0, 182.0, 1390.0, 291.0, 133.0, 87.0, 66.0, 41.0, 40.0, 39.0, 29.0, 28.0, 31.0, 22.0, 21.0, 17.0, 15.0, 13.0, 19.0, 11.0, 5.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.03125, -9.70556640625, -9.3798828125, -9.05419921875, -8.728515625, -8.40283203125, -8.0771484375, -7.75146484375, -7.42578125, -7.10009765625, -6.7744140625, -6.44873046875, -6.123046875, -5.79736328125, -5.4716796875, -5.14599609375, -4.8203125, -4.49462890625, -4.1689453125, -3.84326171875, -3.517578125, -3.19189453125, -2.8662109375, -2.54052734375, -2.21484375, -1.88916015625, -1.5634765625, -1.23779296875, -0.912109375, -0.58642578125, -0.2607421875, 0.06494140625, 0.390625, 0.71630859375, 1.0419921875, 1.36767578125, 1.693359375, 2.01904296875, 2.3447265625, 2.67041015625, 2.99609375, 3.32177734375, 3.6474609375, 3.97314453125, 4.298828125, 4.62451171875, 4.9501953125, 5.27587890625, 5.6015625, 5.92724609375, 6.2529296875, 6.57861328125, 6.904296875, 7.22998046875, 7.5556640625, 7.88134765625, 8.20703125, 8.53271484375, 8.8583984375, 9.18408203125, 9.509765625, 9.83544921875, 10.1611328125, 10.48681640625, 10.8125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 12.0, 9.0, 13.0, 13.0, 20.0, 22.0, 38.0, 49.0, 81.0, 91.0, 161.0, 260.0, 500.0, 1167.0, 3992.0, 20739.0, 246759.0, 2732080.0, 120657.0, 13908.0, 3068.0, 959.0, 449.0, 224.0, 144.0, 80.0, 67.0, 36.0, 26.0, 23.0, 16.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.50537109375, -15.9794921875, -15.45361328125, -14.927734375, -14.40185546875, -13.8759765625, -13.35009765625, -12.82421875, -12.29833984375, -11.7724609375, -11.24658203125, -10.720703125, -10.19482421875, -9.6689453125, -9.14306640625, -8.6171875, -8.09130859375, -7.5654296875, -7.03955078125, -6.513671875, -5.98779296875, -5.4619140625, -4.93603515625, -4.41015625, -3.88427734375, -3.3583984375, -2.83251953125, -2.306640625, -1.78076171875, -1.2548828125, -0.72900390625, -0.203125, 0.32275390625, 0.8486328125, 1.37451171875, 1.900390625, 2.42626953125, 2.9521484375, 3.47802734375, 4.00390625, 4.52978515625, 5.0556640625, 5.58154296875, 6.107421875, 6.63330078125, 7.1591796875, 7.68505859375, 8.2109375, 8.73681640625, 9.2626953125, 9.78857421875, 10.314453125, 10.84033203125, 11.3662109375, 11.89208984375, 12.41796875, 12.94384765625, 13.4697265625, 13.99560546875, 14.521484375, 15.04736328125, 15.5732421875, 16.09912109375, 16.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 24.0, 99.0, 332.0, 364.0, 153.0, 32.0, 12.0], "bins": [-138.59930419921875, -136.29335021972656, -133.98741149902344, -131.68145751953125, -129.37551879882812, -127.06956481933594, -124.76361846923828, -122.45767211914062, -120.15171813964844, -117.84577178955078, -115.53982543945312, -113.23387145996094, -110.92792510986328, -108.62197875976562, -106.31603240966797, -104.01008605957031, -101.70413970947266, -99.398193359375, -97.09224700927734, -94.78629302978516, -92.4803466796875, -90.17440032958984, -87.86845397949219, -85.56250762939453, -83.25656127929688, -80.95061492919922, -78.64466857910156, -76.33871459960938, -74.03276824951172, -71.72682189941406, -69.4208755493164, -67.11492919921875, -64.8089828491211, -62.50303649902344, -60.197086334228516, -57.89113998413086, -55.58518981933594, -53.27924346923828, -50.973297119140625, -48.66735076904297, -46.36140060424805, -44.05545425415039, -41.74950408935547, -39.44355773925781, -37.137611389160156, -34.831661224365234, -32.52571487426758, -30.21976661682129, -27.913818359375, -25.60787010192871, -23.301921844482422, -20.995975494384766, -18.690027236938477, -16.384078979492188, -14.078131675720215, -11.772184371948242, -9.466236114501953, -7.160288333892822, -4.854340553283691, -2.5483927726745605, -0.2424449920654297, 2.0635032653808594, 4.369450569152832, 6.675397872924805, 8.981346130371094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 9.0, 10.0, 10.0, 14.0, 13.0, 15.0, 23.0, 27.0, 34.0, 34.0, 28.0, 29.0, 21.0, 26.0, 31.0, 49.0, 59.0, 51.0, 41.0, 41.0, 50.0, 44.0, 23.0, 23.0, 41.0, 30.0, 30.0, 32.0, 16.0, 22.0, 11.0, 17.0, 9.0, 9.0, 14.0, 17.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.878116607666016, -23.134761810302734, -22.39140510559082, -21.64805030822754, -20.904693603515625, -20.161338806152344, -19.417984008789062, -18.67462921142578, -17.931272506713867, -17.187917709350586, -16.444561004638672, -15.70120620727539, -14.957850456237793, -14.214494705200195, -13.471139907836914, -12.727784156799316, -11.984428405761719, -11.241072654724121, -10.497716903686523, -9.754362106323242, -9.011006355285645, -8.267650604248047, -7.524295330047607, -6.780940055847168, -6.03758430480957, -5.294228553771973, -4.550873279571533, -3.8075177669525146, -3.064162254333496, -2.3208067417144775, -1.577451229095459, -0.8340959548950195, -0.09074020385742188, 0.6526153087615967, 1.3959708213806152, 2.139326333999634, 2.8826818466186523, 3.626037359237671, 4.3693928718566895, 5.112748146057129, 5.856103897094727, 6.599459648132324, 7.342814922332764, 8.086170196533203, 8.8295259475708, 9.572881698608398, 10.31623649597168, 11.059592247009277, 11.802947998046875, 12.546303749084473, 13.28965950012207, 14.033014297485352, 14.77637004852295, 15.519725799560547, 16.263080596923828, 17.00643539428711, 17.749792098999023, 18.493146896362305, 19.23650360107422, 19.9798583984375, 20.72321319580078, 21.466569900512695, 22.209924697875977, 22.95328140258789, 23.696636199951172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 3.0, 2.0, 8.0, 9.0, 12.0, 10.0, 11.0, 16.0, 18.0, 12.0, 19.0, 26.0, 34.0, 23.0, 27.0, 49.0, 38.0, 40.0, 37.0, 43.0, 45.0, 36.0, 40.0, 40.0, 38.0, 37.0, 32.0, 24.0, 34.0, 31.0, 25.0, 23.0, 24.0, 11.0, 14.0, 16.0, 19.0, 9.0, 9.0, 4.0, 8.0, 8.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.46484375, -3.351715087890625, -3.23858642578125, -3.125457763671875, -3.0123291015625, -2.899200439453125, -2.78607177734375, -2.672943115234375, -2.559814453125, -2.446685791015625, -2.33355712890625, -2.220428466796875, -2.1072998046875, -1.994171142578125, -1.88104248046875, -1.767913818359375, -1.65478515625, -1.541656494140625, -1.42852783203125, -1.315399169921875, -1.2022705078125, -1.089141845703125, -0.97601318359375, -0.862884521484375, -0.749755859375, -0.636627197265625, -0.52349853515625, -0.410369873046875, -0.2972412109375, -0.184112548828125, -0.07098388671875, 0.042144775390625, 0.1552734375, 0.268402099609375, 0.38153076171875, 0.494659423828125, 0.6077880859375, 0.720916748046875, 0.83404541015625, 0.947174072265625, 1.060302734375, 1.173431396484375, 1.28656005859375, 1.399688720703125, 1.5128173828125, 1.625946044921875, 1.73907470703125, 1.852203369140625, 1.96533203125, 2.078460693359375, 2.19158935546875, 2.304718017578125, 2.4178466796875, 2.530975341796875, 2.64410400390625, 2.757232666015625, 2.870361328125, 2.983489990234375, 3.09661865234375, 3.209747314453125, 3.3228759765625, 3.436004638671875, 3.54913330078125, 3.662261962890625, 3.775390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 7.0, 4.0, 5.0, 11.0, 7.0, 27.0, 32.0, 32.0, 32.0, 44.0, 71.0, 91.0, 130.0, 150.0, 233.0, 374.0, 769.0, 6690.0, 3621492.0, 558804.0, 3548.0, 612.0, 307.0, 206.0, 142.0, 106.0, 87.0, 63.0, 32.0, 30.0, 30.0, 31.0, 23.0, 7.0, 3.0, 5.0, 6.0, 8.0, 4.0, 5.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.9375, -37.634765625, -36.33203125, -35.029296875, -33.7265625, -32.423828125, -31.12109375, -29.818359375, -28.515625, -27.212890625, -25.91015625, -24.607421875, -23.3046875, -22.001953125, -20.69921875, -19.396484375, -18.09375, -16.791015625, -15.48828125, -14.185546875, -12.8828125, -11.580078125, -10.27734375, -8.974609375, -7.671875, -6.369140625, -5.06640625, -3.763671875, -2.4609375, -1.158203125, 0.14453125, 1.447265625, 2.75, 4.052734375, 5.35546875, 6.658203125, 7.9609375, 9.263671875, 10.56640625, 11.869140625, 13.171875, 14.474609375, 15.77734375, 17.080078125, 18.3828125, 19.685546875, 20.98828125, 22.291015625, 23.59375, 24.896484375, 26.19921875, 27.501953125, 28.8046875, 30.107421875, 31.41015625, 32.712890625, 34.015625, 35.318359375, 36.62109375, 37.923828125, 39.2265625, 40.529296875, 41.83203125, 43.134765625, 44.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 14.0, 14.0, 26.0, 35.0, 38.0, 62.0, 81.0, 104.0, 171.0, 287.0, 493.0, 719.0, 724.0, 453.0, 263.0, 162.0, 91.0, 68.0, 56.0, 32.0, 45.0, 27.0, 23.0, 13.0, 10.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.125, -6.91534423828125, -6.7056884765625, -6.49603271484375, -6.286376953125, -6.07672119140625, -5.8670654296875, -5.65740966796875, -5.44775390625, -5.23809814453125, -5.0284423828125, -4.81878662109375, -4.609130859375, -4.39947509765625, -4.1898193359375, -3.98016357421875, -3.7705078125, -3.56085205078125, -3.3511962890625, -3.14154052734375, -2.931884765625, -2.72222900390625, -2.5125732421875, -2.30291748046875, -2.09326171875, -1.88360595703125, -1.6739501953125, -1.46429443359375, -1.254638671875, -1.04498291015625, -0.8353271484375, -0.62567138671875, -0.416015625, -0.20635986328125, 0.0032958984375, 0.21295166015625, 0.422607421875, 0.63226318359375, 0.8419189453125, 1.05157470703125, 1.26123046875, 1.47088623046875, 1.6805419921875, 1.89019775390625, 2.099853515625, 2.30950927734375, 2.5191650390625, 2.72882080078125, 2.9384765625, 3.14813232421875, 3.3577880859375, 3.56744384765625, 3.777099609375, 3.98675537109375, 4.1964111328125, 4.40606689453125, 4.61572265625, 4.82537841796875, 5.0350341796875, 5.24468994140625, 5.454345703125, 5.66400146484375, 5.8736572265625, 6.08331298828125, 6.29296875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 4.0, 6.0, 17.0, 14.0, 23.0, 20.0, 38.0, 55.0, 91.0, 131.0, 339.0, 1219.0, 13591.0, 704841.0, 3438725.0, 32247.0, 2040.0, 428.0, 169.0, 99.0, 63.0, 40.0, 19.0, 12.0, 9.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53125, -23.767822265625, -23.00439453125, -22.240966796875, -21.4775390625, -20.714111328125, -19.95068359375, -19.187255859375, -18.423828125, -17.660400390625, -16.89697265625, -16.133544921875, -15.3701171875, -14.606689453125, -13.84326171875, -13.079833984375, -12.31640625, -11.552978515625, -10.78955078125, -10.026123046875, -9.2626953125, -8.499267578125, -7.73583984375, -6.972412109375, -6.208984375, -5.445556640625, -4.68212890625, -3.918701171875, -3.1552734375, -2.391845703125, -1.62841796875, -0.864990234375, -0.1015625, 0.661865234375, 1.42529296875, 2.188720703125, 2.9521484375, 3.715576171875, 4.47900390625, 5.242431640625, 6.005859375, 6.769287109375, 7.53271484375, 8.296142578125, 9.0595703125, 9.822998046875, 10.58642578125, 11.349853515625, 12.11328125, 12.876708984375, 13.64013671875, 14.403564453125, 15.1669921875, 15.930419921875, 16.69384765625, 17.457275390625, 18.220703125, 18.984130859375, 19.74755859375, 20.510986328125, 21.2744140625, 22.037841796875, 22.80126953125, 23.564697265625, 24.328125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 19.0, 9.0, 28.0, 28.0, 44.0, 63.0, 86.0, 110.0, 109.0, 105.0, 109.0, 82.0, 76.0, 51.0, 30.0, 14.0, 11.0, 16.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.738236427307129, -9.052277565002441, -8.36631965637207, -7.680360794067383, -6.994401931762695, -6.308443546295166, -5.622485160827637, -4.936526298522949, -4.25056791305542, -3.5646092891693115, -2.878650665283203, -2.192692279815674, -1.5067336559295654, -0.820775032043457, -0.13481664657592773, 0.5511422157287598, 1.237100601196289, 1.9230592250823975, 2.609017848968506, 3.294976234436035, 3.9809348583221436, 4.666893482208252, 5.352851867675781, 6.038810729980469, 6.724769115447998, 7.410727500915527, 8.096686363220215, 8.782644271850586, 9.468603134155273, 10.154561996459961, 10.840520858764648, 11.526479721069336, 12.212438583374023, 12.898397445678711, 13.584355354309082, 14.27031421661377, 14.956273078918457, 15.642230987548828, 16.328189849853516, 17.014148712158203, 17.70010757446289, 18.386066436767578, 19.072025299072266, 19.757984161376953, 20.443941116333008, 21.129899978637695, 21.815858840942383, 22.50181770324707, 23.187774658203125, 23.873733520507812, 24.5596923828125, 25.245651245117188, 25.931608200073242, 26.61756706237793, 27.303525924682617, 27.989484786987305, 28.675443649291992, 29.36140251159668, 30.047361373901367, 30.733318328857422, 31.41927719116211, 32.1052360534668, 32.791194915771484, 33.47715377807617, 34.16311264038086]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 1.0, 4.0, 7.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 19.0, 27.0, 12.0, 22.0, 21.0, 34.0, 33.0, 36.0, 26.0, 41.0, 39.0, 32.0, 42.0, 52.0, 40.0, 42.0, 35.0, 52.0, 40.0, 38.0, 29.0, 31.0, 28.0, 20.0, 28.0, 14.0, 13.0, 20.0, 12.0, 11.0, 10.0, 9.0, 0.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.44189453125, -17.84846305847168, -17.255033493041992, -16.661602020263672, -16.06817054748535, -15.474740028381348, -14.881309509277344, -14.287878036499023, -13.694446563720703, -13.1010160446167, -12.507584571838379, -11.914154052734375, -11.320722579956055, -10.72729206085205, -10.133861541748047, -9.540430068969727, -8.946999549865723, -8.353569030761719, -7.760137557983398, -7.1667070388793945, -6.573275566101074, -5.97984504699707, -5.386414051055908, -4.792983055114746, -4.199552059173584, -3.606121063232422, -3.0126900672912598, -2.4192593097686768, -1.8258283138275146, -1.2323973178863525, -0.6389665603637695, -0.04553556442260742, 0.5478954315185547, 1.1413264274597168, 1.7347573041915894, 2.328188180923462, 2.921619176864624, 3.515050172805786, 4.108480930328369, 4.701911926269531, 5.295342922210693, 5.8887739181518555, 6.482204914093018, 7.07563591003418, 7.669066429138184, 8.262497901916504, 8.855928421020508, 9.449359893798828, 10.042790412902832, 10.636220932006836, 11.229652404785156, 11.82308292388916, 12.41651439666748, 13.009944915771484, 13.603376388549805, 14.196806907653809, 14.790237426757812, 15.383667945861816, 15.977099418640137, 16.57052993774414, 17.16396141052246, 17.75739288330078, 18.35082244873047, 18.94425392150879, 19.53768539428711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 8.0, 8.0, 14.0, 11.0, 19.0, 12.0, 12.0, 26.0, 39.0, 26.0, 35.0, 32.0, 36.0, 46.0, 37.0, 37.0, 39.0, 49.0, 46.0, 52.0, 31.0, 39.0, 49.0, 34.0, 17.0, 29.0, 22.0, 13.0, 24.0, 26.0, 24.0, 12.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.677734375, -3.562835693359375, -3.44793701171875, -3.333038330078125, -3.2181396484375, -3.103240966796875, -2.98834228515625, -2.873443603515625, -2.758544921875, -2.643646240234375, -2.52874755859375, -2.413848876953125, -2.2989501953125, -2.184051513671875, -2.06915283203125, -1.954254150390625, -1.83935546875, -1.724456787109375, -1.60955810546875, -1.494659423828125, -1.3797607421875, -1.264862060546875, -1.14996337890625, -1.035064697265625, -0.920166015625, -0.805267333984375, -0.69036865234375, -0.575469970703125, -0.4605712890625, -0.345672607421875, -0.23077392578125, -0.115875244140625, -0.0009765625, 0.113922119140625, 0.22882080078125, 0.343719482421875, 0.4586181640625, 0.573516845703125, 0.68841552734375, 0.803314208984375, 0.918212890625, 1.033111572265625, 1.14801025390625, 1.262908935546875, 1.3778076171875, 1.492706298828125, 1.60760498046875, 1.722503662109375, 1.83740234375, 1.952301025390625, 2.06719970703125, 2.182098388671875, 2.2969970703125, 2.411895751953125, 2.52679443359375, 2.641693115234375, 2.756591796875, 2.871490478515625, 2.98638916015625, 3.101287841796875, 3.2161865234375, 3.331085205078125, 3.44598388671875, 3.560882568359375, 3.67578125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 12.0, 18.0, 24.0, 41.0, 66.0, 101.0, 137.0, 196.0, 282.0, 381.0, 573.0, 779.0, 1272.0, 1838.0, 2791.0, 4243.0, 6749.0, 11006.0, 18316.0, 32160.0, 60418.0, 124574.0, 250718.0, 256991.0, 128787.0, 62636.0, 33417.0, 18827.0, 11238.0, 6883.0, 4372.0, 2860.0, 1832.0, 1287.0, 868.0, 547.0, 437.0, 257.0, 195.0, 136.0, 99.0, 67.0, 46.0, 26.0, 21.0, 13.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.966796875, -0.9375228881835938, -0.9082489013671875, -0.8789749145507812, -0.849700927734375, -0.8204269409179688, -0.7911529541015625, -0.7618789672851562, -0.73260498046875, -0.7033309936523438, -0.6740570068359375, -0.6447830200195312, -0.615509033203125, -0.5862350463867188, -0.5569610595703125, -0.5276870727539062, -0.4984130859375, -0.46913909912109375, -0.4398651123046875, -0.41059112548828125, -0.381317138671875, -0.35204315185546875, -0.3227691650390625, -0.29349517822265625, -0.26422119140625, -0.23494720458984375, -0.2056732177734375, -0.17639923095703125, -0.147125244140625, -0.11785125732421875, -0.0885772705078125, -0.05930328369140625, -0.030029296875, -0.00075531005859375, 0.0285186767578125, 0.05779266357421875, 0.087066650390625, 0.11634063720703125, 0.1456146240234375, 0.17488861083984375, 0.20416259765625, 0.23343658447265625, 0.2627105712890625, 0.29198455810546875, 0.321258544921875, 0.35053253173828125, 0.3798065185546875, 0.40908050537109375, 0.4383544921875, 0.46762847900390625, 0.4969024658203125, 0.5261764526367188, 0.555450439453125, 0.5847244262695312, 0.6139984130859375, 0.6432723999023438, 0.67254638671875, 0.7018203735351562, 0.7310943603515625, 0.7603683471679688, 0.789642333984375, 0.8189163208007812, 0.8481903076171875, 0.8774642944335938, 0.90673828125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 6.0, 8.0, 7.0, 13.0, 14.0, 13.0, 13.0, 23.0, 17.0, 28.0, 29.0, 29.0, 29.0, 38.0, 29.0, 45.0, 45.0, 33.0, 47.0, 1061.0, 34.0, 46.0, 48.0, 47.0, 39.0, 32.0, 36.0, 29.0, 30.0, 25.0, 19.0, 19.0, 14.0, 9.0, 12.0, 9.0, 11.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.88543701171875, -2.7982177734375, -2.71099853515625, -2.623779296875, -2.53656005859375, -2.4493408203125, -2.36212158203125, -2.27490234375, -2.18768310546875, -2.1004638671875, -2.01324462890625, -1.926025390625, -1.83880615234375, -1.7515869140625, -1.66436767578125, -1.5771484375, -1.48992919921875, -1.4027099609375, -1.31549072265625, -1.228271484375, -1.14105224609375, -1.0538330078125, -0.96661376953125, -0.87939453125, -0.79217529296875, -0.7049560546875, -0.61773681640625, -0.530517578125, -0.44329833984375, -0.3560791015625, -0.26885986328125, -0.181640625, -0.09442138671875, -0.0072021484375, 0.08001708984375, 0.167236328125, 0.25445556640625, 0.3416748046875, 0.42889404296875, 0.51611328125, 0.60333251953125, 0.6905517578125, 0.77777099609375, 0.864990234375, 0.95220947265625, 1.0394287109375, 1.12664794921875, 1.2138671875, 1.30108642578125, 1.3883056640625, 1.47552490234375, 1.562744140625, 1.64996337890625, 1.7371826171875, 1.82440185546875, 1.91162109375, 1.99884033203125, 2.0860595703125, 2.17327880859375, 2.260498046875, 2.34771728515625, 2.4349365234375, 2.52215576171875, 2.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 11.0, 17.0, 21.0, 39.0, 61.0, 85.0, 150.0, 269.0, 471.0, 893.0, 1734.0, 3808.0, 9192.0, 27240.0, 119766.0, 1428486.0, 417500.0, 58950.0, 16754.0, 6204.0, 2605.0, 1274.0, 654.0, 348.0, 211.0, 131.0, 89.0, 44.0, 36.0, 34.0, 12.0, 13.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4755859375, -1.4276580810546875, -1.379730224609375, -1.3318023681640625, -1.28387451171875, -1.2359466552734375, -1.188018798828125, -1.1400909423828125, -1.0921630859375, -1.0442352294921875, -0.996307373046875, -0.9483795166015625, -0.90045166015625, -0.8525238037109375, -0.804595947265625, -0.7566680908203125, -0.708740234375, -0.6608123779296875, -0.612884521484375, -0.5649566650390625, -0.51702880859375, -0.4691009521484375, -0.421173095703125, -0.3732452392578125, -0.3253173828125, -0.2773895263671875, -0.229461669921875, -0.1815338134765625, -0.13360595703125, -0.0856781005859375, -0.037750244140625, 0.0101776123046875, 0.05810546875, 0.1060333251953125, 0.153961181640625, 0.2018890380859375, 0.24981689453125, 0.2977447509765625, 0.345672607421875, 0.3936004638671875, 0.4415283203125, 0.4894561767578125, 0.537384033203125, 0.5853118896484375, 0.63323974609375, 0.6811676025390625, 0.729095458984375, 0.7770233154296875, 0.824951171875, 0.8728790283203125, 0.920806884765625, 0.9687347412109375, 1.01666259765625, 1.0645904541015625, 1.112518310546875, 1.1604461669921875, 1.2083740234375, 1.2563018798828125, 1.304229736328125, 1.3521575927734375, 1.40008544921875, 1.4480133056640625, 1.495941162109375, 1.5438690185546875, 1.591796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 8.0, 7.0, 12.0, 14.0, 21.0, 28.0, 41.0, 69.0, 131.0, 148.0, 182.0, 115.0, 76.0, 46.0, 25.0, 17.0, 14.0, 14.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3879966735839844, -0.37584686279296875, -0.3636970520019531, -0.3515472412109375, -0.3393974304199219, -0.32724761962890625, -0.3150978088378906, -0.302947998046875, -0.2907981872558594, -0.27864837646484375, -0.2664985656738281, -0.2543487548828125, -0.24219894409179688, -0.23004913330078125, -0.21789932250976562, -0.20574951171875, -0.19359970092773438, -0.18144989013671875, -0.16930007934570312, -0.1571502685546875, -0.14500045776367188, -0.13285064697265625, -0.12070083618164062, -0.108551025390625, -0.09640121459960938, -0.08425140380859375, -0.07210159301757812, -0.0599517822265625, -0.047801971435546875, -0.03565216064453125, -0.023502349853515625, -0.0113525390625, 0.000797271728515625, 0.01294708251953125, 0.025096893310546875, 0.0372467041015625, 0.049396514892578125, 0.06154632568359375, 0.07369613647460938, 0.085845947265625, 0.09799575805664062, 0.11014556884765625, 0.12229537963867188, 0.1344451904296875, 0.14659500122070312, 0.15874481201171875, 0.17089462280273438, 0.18304443359375, 0.19519424438476562, 0.20734405517578125, 0.21949386596679688, 0.2316436767578125, 0.24379348754882812, 0.25594329833984375, 0.2680931091308594, 0.280242919921875, 0.2923927307128906, 0.30454254150390625, 0.3166923522949219, 0.3288421630859375, 0.3409919738769531, 0.35314178466796875, 0.3652915954589844, 0.37744140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 21.0, 29.0, 54.0, 93.0, 200.0, 492.0, 11757.0, 1033877.0, 1393.0, 274.0, 120.0, 70.0, 40.0, 30.0, 16.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.857666015625, -7.59814453125, -7.338623046875, -7.0791015625, -6.819580078125, -6.56005859375, -6.300537109375, -6.041015625, -5.781494140625, -5.52197265625, -5.262451171875, -5.0029296875, -4.743408203125, -4.48388671875, -4.224365234375, -3.96484375, -3.705322265625, -3.44580078125, -3.186279296875, -2.9267578125, -2.667236328125, -2.40771484375, -2.148193359375, -1.888671875, -1.629150390625, -1.36962890625, -1.110107421875, -0.8505859375, -0.591064453125, -0.33154296875, -0.072021484375, 0.1875, 0.447021484375, 0.70654296875, 0.966064453125, 1.2255859375, 1.485107421875, 1.74462890625, 2.004150390625, 2.263671875, 2.523193359375, 2.78271484375, 3.042236328125, 3.3017578125, 3.561279296875, 3.82080078125, 4.080322265625, 4.33984375, 4.599365234375, 4.85888671875, 5.118408203125, 5.3779296875, 5.637451171875, 5.89697265625, 6.156494140625, 6.416015625, 6.675537109375, 6.93505859375, 7.194580078125, 7.4541015625, 7.713623046875, 7.97314453125, 8.232666015625, 8.4921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 40.0, 258.0, 540.0, 130.0, 19.0, 13.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423232913017273, -1.3887617588043213, -1.35429048538208, -1.3198192119598389, -1.2853480577468872, -1.2508769035339355, -1.2164056301116943, -1.1819343566894531, -1.1474632024765015, -1.1129920482635498, -1.0785207748413086, -1.0440495014190674, -1.0095783472061157, -0.9751071333885193, -0.9406359195709229, -0.9061647057533264, -0.87169349193573, -0.8372222781181335, -0.8027510643005371, -0.7682798504829407, -0.7338086366653442, -0.6993374228477478, -0.6648662090301514, -0.6303949952125549, -0.5959237813949585, -0.5614525675773621, -0.5269813537597656, -0.4925101399421692, -0.45803892612457275, -0.4235677123069763, -0.3890964984893799, -0.35462528467178345, -0.3201541304588318, -0.28568291664123535, -0.2512117028236389, -0.21674048900604248, -0.18226927518844604, -0.1477980613708496, -0.11332684755325317, -0.07885563373565674, -0.0443844199180603, -0.009913206100463867, 0.02455800771713257, 0.059029221534729004, 0.09350043535232544, 0.12797164916992188, 0.1624428629875183, 0.19691407680511475, 0.23138529062271118, 0.2658565044403076, 0.30032771825790405, 0.3347989320755005, 0.3692701458930969, 0.40374135971069336, 0.4382125735282898, 0.47268378734588623, 0.5071550011634827, 0.5416262149810791, 0.5760974287986755, 0.610568642616272, 0.6450398564338684, 0.6795110702514648, 0.7139822840690613, 0.7484534978866577, 0.7829247117042542]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 10.0, 9.0, 15.0, 13.0, 16.0, 13.0, 21.0, 26.0, 36.0, 24.0, 37.0, 45.0, 36.0, 42.0, 39.0, 34.0, 45.0, 31.0, 36.0, 41.0, 40.0, 48.0, 23.0, 35.0, 30.0, 24.0, 43.0, 25.0, 29.0, 17.0, 12.0, 12.0, 13.0, 9.0, 13.0, 8.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2747429609298706, -0.26545190811157227, -0.2561608552932739, -0.24686981737613678, -0.23757877945899963, -0.2282877266407013, -0.21899667382240295, -0.2097056359052658, -0.20041459798812866, -0.19112354516983032, -0.18183250725269318, -0.17254145443439484, -0.1632504165172577, -0.15395936369895935, -0.144668310880661, -0.13537727296352386, -0.12608622014522552, -0.11679517477750778, -0.10750412940979004, -0.0982130765914917, -0.08892203867435455, -0.07963098585605621, -0.07033994048833847, -0.06104889512062073, -0.051757849752902985, -0.04246680438518524, -0.0331757590174675, -0.023884709924459457, -0.014593664556741714, -0.0053026191890239716, 0.00398842990398407, 0.013279475271701813, 0.022570520639419556, 0.0318615660071373, 0.04115261137485504, 0.05044366046786308, 0.059734705835580826, 0.06902575492858887, 0.07831680029630661, 0.08760784566402435, 0.0968988910317421, 0.10618993639945984, 0.11548098176717758, 0.12477202713489532, 0.13406307995319366, 0.1433541178703308, 0.15264517068862915, 0.1619362235069275, 0.17122726142406464, 0.18051831424236298, 0.18980935215950012, 0.19910040497779846, 0.2083914428949356, 0.21768249571323395, 0.2269735336303711, 0.23626458644866943, 0.24555563926696777, 0.2548466920852661, 0.26413774490356445, 0.2734287679195404, 0.28271982073783875, 0.2920108735561371, 0.3013019263744354, 0.3105929493904114, 0.3198840022087097]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 11.0, 14.0, 12.0, 25.0, 26.0, 23.0, 30.0, 30.0, 25.0, 38.0, 33.0, 54.0, 58.0, 44.0, 46.0, 57.0, 34.0, 53.0, 47.0, 31.0, 35.0, 25.0, 25.0, 27.0, 25.0, 19.0, 21.0, 18.0, 27.0, 10.0, 14.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.609466552734375, -3.48651123046875, -3.363555908203125, -3.2406005859375, -3.117645263671875, -2.99468994140625, -2.871734619140625, -2.748779296875, -2.625823974609375, -2.50286865234375, -2.379913330078125, -2.2569580078125, -2.134002685546875, -2.01104736328125, -1.888092041015625, -1.76513671875, -1.642181396484375, -1.51922607421875, -1.396270751953125, -1.2733154296875, -1.150360107421875, -1.02740478515625, -0.904449462890625, -0.781494140625, -0.658538818359375, -0.53558349609375, -0.412628173828125, -0.2896728515625, -0.166717529296875, -0.04376220703125, 0.079193115234375, 0.2021484375, 0.325103759765625, 0.44805908203125, 0.571014404296875, 0.6939697265625, 0.816925048828125, 0.93988037109375, 1.062835693359375, 1.185791015625, 1.308746337890625, 1.43170166015625, 1.554656982421875, 1.6776123046875, 1.800567626953125, 1.92352294921875, 2.046478271484375, 2.16943359375, 2.292388916015625, 2.41534423828125, 2.538299560546875, 2.6612548828125, 2.784210205078125, 2.90716552734375, 3.030120849609375, 3.153076171875, 3.276031494140625, 3.39898681640625, 3.521942138671875, 3.6448974609375, 3.767852783203125, 3.89080810546875, 4.013763427734375, 4.13671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 13.0, 28.0, 24.0, 35.0, 79.0, 75.0, 106.0, 198.0, 315.0, 430.0, 624.0, 1073.0, 1685.0, 2820.0, 4806.0, 8945.0, 16816.0, 33790.0, 73748.0, 181310.0, 365130.0, 199208.0, 80284.0, 36727.0, 17801.0, 9546.0, 5093.0, 2958.0, 1736.0, 1059.0, 704.0, 418.0, 297.0, 194.0, 137.0, 86.0, 67.0, 50.0, 36.0, 27.0, 13.0, 13.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7890625, -4.63726806640625, -4.4854736328125, -4.33367919921875, -4.181884765625, -4.03009033203125, -3.8782958984375, -3.72650146484375, -3.57470703125, -3.42291259765625, -3.2711181640625, -3.11932373046875, -2.967529296875, -2.81573486328125, -2.6639404296875, -2.51214599609375, -2.3603515625, -2.20855712890625, -2.0567626953125, -1.90496826171875, -1.753173828125, -1.60137939453125, -1.4495849609375, -1.29779052734375, -1.14599609375, -0.99420166015625, -0.8424072265625, -0.69061279296875, -0.538818359375, -0.38702392578125, -0.2352294921875, -0.08343505859375, 0.068359375, 0.22015380859375, 0.3719482421875, 0.52374267578125, 0.675537109375, 0.82733154296875, 0.9791259765625, 1.13092041015625, 1.28271484375, 1.43450927734375, 1.5863037109375, 1.73809814453125, 1.889892578125, 2.04168701171875, 2.1934814453125, 2.34527587890625, 2.4970703125, 2.64886474609375, 2.8006591796875, 2.95245361328125, 3.104248046875, 3.25604248046875, 3.4078369140625, 3.55963134765625, 3.71142578125, 3.86322021484375, 4.0150146484375, 4.16680908203125, 4.318603515625, 4.47039794921875, 4.6221923828125, 4.77398681640625, 4.92578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 8.0, 7.0, 10.0, 11.0, 14.0, 22.0, 28.0, 26.0, 33.0, 20.0, 28.0, 40.0, 53.0, 65.0, 91.0, 194.0, 1412.0, 341.0, 168.0, 84.0, 56.0, 50.0, 47.0, 25.0, 38.0, 31.0, 23.0, 20.0, 14.0, 23.0, 19.0, 8.0, 9.0, 8.0, 7.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-11.8515625, -11.5390625, -11.2265625, -10.9140625, -10.6015625, -10.2890625, -9.9765625, -9.6640625, -9.3515625, -9.0390625, -8.7265625, -8.4140625, -8.1015625, -7.7890625, -7.4765625, -7.1640625, -6.8515625, -6.5390625, -6.2265625, -5.9140625, -5.6015625, -5.2890625, -4.9765625, -4.6640625, -4.3515625, -4.0390625, -3.7265625, -3.4140625, -3.1015625, -2.7890625, -2.4765625, -2.1640625, -1.8515625, -1.5390625, -1.2265625, -0.9140625, -0.6015625, -0.2890625, 0.0234375, 0.3359375, 0.6484375, 0.9609375, 1.2734375, 1.5859375, 1.8984375, 2.2109375, 2.5234375, 2.8359375, 3.1484375, 3.4609375, 3.7734375, 4.0859375, 4.3984375, 4.7109375, 5.0234375, 5.3359375, 5.6484375, 5.9609375, 6.2734375, 6.5859375, 6.8984375, 7.2109375, 7.5234375, 7.8359375, 8.1484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 6.0, 7.0, 17.0, 14.0, 20.0, 24.0, 35.0, 39.0, 41.0, 61.0, 96.0, 145.0, 236.0, 360.0, 626.0, 1828.0, 18223.0, 2969360.0, 147951.0, 4268.0, 983.0, 470.0, 257.0, 181.0, 126.0, 71.0, 47.0, 38.0, 31.0, 17.0, 20.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0], "bins": [-25.890625, -25.145263671875, -24.39990234375, -23.654541015625, -22.9091796875, -22.163818359375, -21.41845703125, -20.673095703125, -19.927734375, -19.182373046875, -18.43701171875, -17.691650390625, -16.9462890625, -16.200927734375, -15.45556640625, -14.710205078125, -13.96484375, -13.219482421875, -12.47412109375, -11.728759765625, -10.9833984375, -10.238037109375, -9.49267578125, -8.747314453125, -8.001953125, -7.256591796875, -6.51123046875, -5.765869140625, -5.0205078125, -4.275146484375, -3.52978515625, -2.784423828125, -2.0390625, -1.293701171875, -0.54833984375, 0.197021484375, 0.9423828125, 1.687744140625, 2.43310546875, 3.178466796875, 3.923828125, 4.669189453125, 5.41455078125, 6.159912109375, 6.9052734375, 7.650634765625, 8.39599609375, 9.141357421875, 9.88671875, 10.632080078125, 11.37744140625, 12.122802734375, 12.8681640625, 13.613525390625, 14.35888671875, 15.104248046875, 15.849609375, 16.594970703125, 17.34033203125, 18.085693359375, 18.8310546875, 19.576416015625, 20.32177734375, 21.067138671875, 21.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 17.0, 125.0, 341.0, 372.0, 129.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.57786560058594, -113.2703628540039, -110.96285247802734, -108.65534973144531, -106.34784698486328, -104.04034423828125, -101.73283386230469, -99.42533111572266, -97.11782836914062, -94.8103256225586, -92.50281524658203, -90.1953125, -87.88780975341797, -85.58030700683594, -83.27279663085938, -80.96529388427734, -78.65778350830078, -76.35028076171875, -74.04277038574219, -71.73526763916016, -69.42776489257812, -67.12025451660156, -64.81275177001953, -62.5052490234375, -60.1977424621582, -57.890235900878906, -55.582733154296875, -53.27522659301758, -50.96772003173828, -48.66021728515625, -46.35271072387695, -44.045204162597656, -41.737701416015625, -39.43019485473633, -37.1226921081543, -34.815185546875, -32.50768280029297, -30.200176239013672, -27.892669677734375, -25.58516502380371, -23.277660369873047, -20.970155715942383, -18.66265106201172, -16.355144500732422, -14.047639846801758, -11.740135192871094, -9.432629585266113, -7.125123977661133, -4.817619323730469, -2.5101141929626465, -0.20260906219482422, 2.104896068572998, 4.41240119934082, 6.719905853271484, 9.027411460876465, 11.334917068481445, 13.64242172241211, 15.949926376342773, 18.257431030273438, 20.564937591552734, 22.8724422454834, 25.179946899414062, 27.48745346069336, 29.794958114624023, 32.10246276855469]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 3.0, 7.0, 7.0, 10.0, 8.0, 18.0, 9.0, 20.0, 15.0, 29.0, 24.0, 30.0, 37.0, 34.0, 38.0, 36.0, 50.0, 46.0, 47.0, 45.0, 36.0, 49.0, 46.0, 39.0, 38.0, 32.0, 21.0, 26.0, 28.0, 23.0, 26.0, 20.0, 26.0, 10.0, 21.0, 10.0, 11.0, 4.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.476526260375977, -25.670103073120117, -24.863679885864258, -24.057254791259766, -23.250831604003906, -22.444408416748047, -21.637985229492188, -20.831562042236328, -20.02513885498047, -19.21871566772461, -18.41229248046875, -17.60586929321289, -16.7994441986084, -15.993021011352539, -15.18659782409668, -14.38017463684082, -13.573750495910645, -12.767327308654785, -11.96090316772461, -11.15447998046875, -10.34805679321289, -9.541633605957031, -8.735209465026855, -7.928786277770996, -7.1223626136779785, -6.315938949584961, -5.509515762329102, -4.703092098236084, -3.8966686725616455, -3.090245246887207, -2.2838215827941895, -1.47739839553833, -0.6709747314453125, 0.13544875383377075, 0.941872239112854, 1.748295783996582, 2.5547192096710205, 3.361142635345459, 4.167566299438477, 4.973989486694336, 5.7804131507873535, 6.586836814880371, 7.3932600021362305, 8.199684143066406, 9.006107330322266, 9.812530517578125, 10.618953704833984, 11.425376892089844, 12.23180103302002, 13.038224220275879, 13.844648361206055, 14.651071548461914, 15.457494735717773, 16.263917922973633, 17.070343017578125, 17.876766204833984, 18.683189392089844, 19.489612579345703, 20.296035766601562, 21.102458953857422, 21.908884048461914, 22.715307235717773, 23.521730422973633, 24.328153610229492, 25.13457679748535]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 12.0, 13.0, 15.0, 17.0, 21.0, 31.0, 24.0, 35.0, 38.0, 47.0, 34.0, 45.0, 57.0, 43.0, 56.0, 54.0, 39.0, 46.0, 44.0, 36.0, 41.0, 35.0, 30.0, 29.0, 22.0, 24.0, 21.0, 12.0, 20.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.13739013671875, -4.0013427734375, -3.86529541015625, -3.729248046875, -3.59320068359375, -3.4571533203125, -3.32110595703125, -3.18505859375, -3.04901123046875, -2.9129638671875, -2.77691650390625, -2.640869140625, -2.50482177734375, -2.3687744140625, -2.23272705078125, -2.0966796875, -1.96063232421875, -1.8245849609375, -1.68853759765625, -1.552490234375, -1.41644287109375, -1.2803955078125, -1.14434814453125, -1.00830078125, -0.87225341796875, -0.7362060546875, -0.60015869140625, -0.464111328125, -0.32806396484375, -0.1920166015625, -0.05596923828125, 0.080078125, 0.21612548828125, 0.3521728515625, 0.48822021484375, 0.624267578125, 0.76031494140625, 0.8963623046875, 1.03240966796875, 1.16845703125, 1.30450439453125, 1.4405517578125, 1.57659912109375, 1.712646484375, 1.84869384765625, 1.9847412109375, 2.12078857421875, 2.2568359375, 2.39288330078125, 2.5289306640625, 2.66497802734375, 2.801025390625, 2.93707275390625, 3.0731201171875, 3.20916748046875, 3.34521484375, 3.48126220703125, 3.6173095703125, 3.75335693359375, 3.889404296875, 4.02545166015625, 4.1614990234375, 4.29754638671875, 4.43359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 5.0, 3.0, 2.0, 10.0, 15.0, 24.0, 22.0, 29.0, 52.0, 63.0, 89.0, 117.0, 162.0, 235.0, 302.0, 466.0, 638.0, 898.0, 1370.0, 2175.0, 3787.0, 6985.0, 14283.0, 35694.0, 115746.0, 430163.0, 1408792.0, 1530492.0, 458715.0, 115234.0, 34971.0, 14786.0, 7065.0, 3946.0, 2294.0, 1475.0, 935.0, 635.0, 485.0, 296.0, 191.0, 169.0, 128.0, 100.0, 70.0, 51.0, 37.0, 19.0, 22.0, 11.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0], "bins": [-4.83203125, -4.69000244140625, -4.5479736328125, -4.40594482421875, -4.263916015625, -4.12188720703125, -3.9798583984375, -3.83782958984375, -3.69580078125, -3.55377197265625, -3.4117431640625, -3.26971435546875, -3.127685546875, -2.98565673828125, -2.8436279296875, -2.70159912109375, -2.5595703125, -2.41754150390625, -2.2755126953125, -2.13348388671875, -1.991455078125, -1.84942626953125, -1.7073974609375, -1.56536865234375, -1.42333984375, -1.28131103515625, -1.1392822265625, -0.99725341796875, -0.855224609375, -0.71319580078125, -0.5711669921875, -0.42913818359375, -0.287109375, -0.14508056640625, -0.0030517578125, 0.13897705078125, 0.281005859375, 0.42303466796875, 0.5650634765625, 0.70709228515625, 0.84912109375, 0.99114990234375, 1.1331787109375, 1.27520751953125, 1.417236328125, 1.55926513671875, 1.7012939453125, 1.84332275390625, 1.9853515625, 2.12738037109375, 2.2694091796875, 2.41143798828125, 2.553466796875, 2.69549560546875, 2.8375244140625, 2.97955322265625, 3.12158203125, 3.26361083984375, 3.4056396484375, 3.54766845703125, 3.689697265625, 3.83172607421875, 3.9737548828125, 4.11578369140625, 4.2578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 15.0, 8.0, 9.0, 26.0, 22.0, 37.0, 30.0, 52.0, 87.0, 110.0, 103.0, 140.0, 195.0, 301.0, 467.0, 562.0, 523.0, 381.0, 244.0, 180.0, 122.0, 88.0, 79.0, 65.0, 53.0, 41.0, 35.0, 27.0, 11.0, 22.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.8863525390625, -6.682861328125, -6.4793701171875, -6.27587890625, -6.0723876953125, -5.868896484375, -5.6654052734375, -5.4619140625, -5.2584228515625, -5.054931640625, -4.8514404296875, -4.64794921875, -4.4444580078125, -4.240966796875, -4.0374755859375, -3.833984375, -3.6304931640625, -3.427001953125, -3.2235107421875, -3.02001953125, -2.8165283203125, -2.613037109375, -2.4095458984375, -2.2060546875, -2.0025634765625, -1.799072265625, -1.5955810546875, -1.39208984375, -1.1885986328125, -0.985107421875, -0.7816162109375, -0.578125, -0.3746337890625, -0.171142578125, 0.0323486328125, 0.23583984375, 0.4393310546875, 0.642822265625, 0.8463134765625, 1.0498046875, 1.2532958984375, 1.456787109375, 1.6602783203125, 1.86376953125, 2.0672607421875, 2.270751953125, 2.4742431640625, 2.677734375, 2.8812255859375, 3.084716796875, 3.2882080078125, 3.49169921875, 3.6951904296875, 3.898681640625, 4.1021728515625, 4.3056640625, 4.5091552734375, 4.712646484375, 4.9161376953125, 5.11962890625, 5.3231201171875, 5.526611328125, 5.7301025390625, 5.93359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 10.0, 8.0, 18.0, 21.0, 17.0, 28.0, 31.0, 62.0, 83.0, 127.0, 208.0, 288.0, 480.0, 782.0, 1301.0, 2523.0, 5991.0, 18329.0, 78661.0, 446471.0, 2885271.0, 615516.0, 101235.0, 23016.0, 7131.0, 2901.0, 1496.0, 833.0, 515.0, 322.0, 197.0, 130.0, 102.0, 56.0, 32.0, 27.0, 19.0, 13.0, 10.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1875, -6.9268798828125, -6.666259765625, -6.4056396484375, -6.14501953125, -5.8843994140625, -5.623779296875, -5.3631591796875, -5.1025390625, -4.8419189453125, -4.581298828125, -4.3206787109375, -4.06005859375, -3.7994384765625, -3.538818359375, -3.2781982421875, -3.017578125, -2.7569580078125, -2.496337890625, -2.2357177734375, -1.97509765625, -1.7144775390625, -1.453857421875, -1.1932373046875, -0.9326171875, -0.6719970703125, -0.411376953125, -0.1507568359375, 0.10986328125, 0.3704833984375, 0.631103515625, 0.8917236328125, 1.15234375, 1.4129638671875, 1.673583984375, 1.9342041015625, 2.19482421875, 2.4554443359375, 2.716064453125, 2.9766845703125, 3.2373046875, 3.4979248046875, 3.758544921875, 4.0191650390625, 4.27978515625, 4.5404052734375, 4.801025390625, 5.0616455078125, 5.322265625, 5.5828857421875, 5.843505859375, 6.1041259765625, 6.36474609375, 6.6253662109375, 6.885986328125, 7.1466064453125, 7.4072265625, 7.6678466796875, 7.928466796875, 8.1890869140625, 8.44970703125, 8.7103271484375, 8.970947265625, 9.2315673828125, 9.4921875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 19.0, 222.0, 553.0, 196.0, 17.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.85098266601562, -154.71749877929688, -150.58399963378906, -146.4505157470703, -142.31703186035156, -138.1835479736328, -134.050048828125, -129.91656494140625, -125.7830810546875, -121.64958953857422, -117.51610565185547, -113.38261413574219, -109.24913024902344, -105.11563873291016, -100.98214721679688, -96.84866333007812, -92.71517181396484, -88.58168029785156, -84.44819641113281, -80.31470489501953, -76.18122100830078, -72.0477294921875, -67.91424560546875, -63.78075408935547, -59.64726638793945, -55.51377868652344, -51.38029098510742, -47.246803283691406, -43.113311767578125, -38.979827880859375, -34.846336364746094, -30.712848663330078, -26.579360961914062, -22.445873260498047, -18.31238555908203, -14.178895950317383, -10.045408248901367, -5.911920547485352, -1.7784309387207031, 2.3550567626953125, 6.488544464111328, 10.622032165527344, 14.755520820617676, 18.889009475708008, 23.022497177124023, 27.15598487854004, 31.289474487304688, 35.4229621887207, 39.55644989013672, 43.689937591552734, 47.82342529296875, 51.95691680908203, 56.09040069580078, 60.22389221191406, 64.35737609863281, 68.4908676147461, 72.62435913085938, 76.75785064697266, 80.8913345336914, 85.02482604980469, 89.15830993652344, 93.29180145263672, 97.42529296875, 101.55877685546875, 105.6922607421875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 3.0, 3.0, 7.0, 11.0, 14.0, 7.0, 11.0, 21.0, 20.0, 21.0, 20.0, 25.0, 30.0, 32.0, 33.0, 35.0, 38.0, 28.0, 40.0, 40.0, 30.0, 44.0, 41.0, 46.0, 42.0, 56.0, 38.0, 39.0, 31.0, 25.0, 33.0, 14.0, 18.0, 18.0, 18.0, 14.0, 11.0, 12.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.935544967651367, -23.193965911865234, -22.45238494873047, -21.710805892944336, -20.96922492980957, -20.227645874023438, -19.486064910888672, -18.74448585510254, -18.002906799316406, -17.261327743530273, -16.519746780395508, -15.778167724609375, -15.036587715148926, -14.295007705688477, -13.553427696228027, -12.811847686767578, -12.070267677307129, -11.32868766784668, -10.58710765838623, -9.845527648925781, -9.103948593139648, -8.3623685836792, -7.62078857421875, -6.879209041595459, -6.13762903213501, -5.3960490226745605, -4.6544694900512695, -3.9128894805908203, -3.17130970954895, -2.42972993850708, -1.6881499290466309, -0.9465703964233398, -0.20499038696289062, 0.5365894436836243, 1.2781692743301392, 2.019749164581299, 2.761328935623169, 3.502908706665039, 4.244488716125488, 4.986068248748779, 5.7276482582092285, 6.469228267669678, 7.210807800292969, 7.952387809753418, 8.693967819213867, 9.435546875, 10.177127838134766, 10.918706893920898, 11.660286903381348, 12.401866912841797, 13.143446922302246, 13.885026931762695, 14.626605987548828, 15.368185997009277, 16.109766006469727, 16.85134506225586, 17.592926025390625, 18.334505081176758, 19.076086044311523, 19.817665100097656, 20.559246063232422, 21.300825119018555, 22.042404174804688, 22.783985137939453, 23.525564193725586]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 16.0, 19.0, 19.0, 15.0, 22.0, 30.0, 34.0, 23.0, 36.0, 37.0, 29.0, 36.0, 38.0, 40.0, 37.0, 37.0, 32.0, 33.0, 39.0, 40.0, 37.0, 29.0, 36.0, 28.0, 18.0, 28.0, 21.0, 19.0, 20.0, 19.0, 12.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0], "bins": [-2.810546875, -2.7255859375, -2.640625, -2.5556640625, -2.470703125, -2.3857421875, -2.30078125, -2.2158203125, -2.130859375, -2.0458984375, -1.9609375, -1.8759765625, -1.791015625, -1.7060546875, -1.62109375, -1.5361328125, -1.451171875, -1.3662109375, -1.28125, -1.1962890625, -1.111328125, -1.0263671875, -0.94140625, -0.8564453125, -0.771484375, -0.6865234375, -0.6015625, -0.5166015625, -0.431640625, -0.3466796875, -0.26171875, -0.1767578125, -0.091796875, -0.0068359375, 0.078125, 0.1630859375, 0.248046875, 0.3330078125, 0.41796875, 0.5029296875, 0.587890625, 0.6728515625, 0.7578125, 0.8427734375, 0.927734375, 1.0126953125, 1.09765625, 1.1826171875, 1.267578125, 1.3525390625, 1.4375, 1.5224609375, 1.607421875, 1.6923828125, 1.77734375, 1.8623046875, 1.947265625, 2.0322265625, 2.1171875, 2.2021484375, 2.287109375, 2.3720703125, 2.45703125, 2.5419921875, 2.626953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 31.0, 41.0, 50.0, 77.0, 115.0, 171.0, 252.0, 372.0, 554.0, 818.0, 1189.0, 1943.0, 3036.0, 4958.0, 7892.0, 12653.0, 21952.0, 37743.0, 65510.0, 113168.0, 185345.0, 220414.0, 152409.0, 90633.0, 52283.0, 29595.0, 17629.0, 10443.0, 6301.0, 3779.0, 2466.0, 1550.0, 1000.0, 686.0, 469.0, 310.0, 224.0, 134.0, 113.0, 75.0, 41.0, 31.0, 27.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.378662109375, -0.36728668212890625, -0.3559112548828125, -0.34453582763671875, -0.333160400390625, -0.32178497314453125, -0.3104095458984375, -0.29903411865234375, -0.28765869140625, -0.27628326416015625, -0.2649078369140625, -0.25353240966796875, -0.242156982421875, -0.23078155517578125, -0.2194061279296875, -0.20803070068359375, -0.1966552734375, -0.18527984619140625, -0.1739044189453125, -0.16252899169921875, -0.151153564453125, -0.13977813720703125, -0.1284027099609375, -0.11702728271484375, -0.10565185546875, -0.09427642822265625, -0.0829010009765625, -0.07152557373046875, -0.060150146484375, -0.04877471923828125, -0.0373992919921875, -0.02602386474609375, -0.0146484375, -0.00327301025390625, 0.0081024169921875, 0.01947784423828125, 0.030853271484375, 0.04222869873046875, 0.0536041259765625, 0.06497955322265625, 0.07635498046875, 0.08773040771484375, 0.0991058349609375, 0.11048126220703125, 0.121856689453125, 0.13323211669921875, 0.1446075439453125, 0.15598297119140625, 0.1673583984375, 0.17873382568359375, 0.1901092529296875, 0.20148468017578125, 0.212860107421875, 0.22423553466796875, 0.2356109619140625, 0.24698638916015625, 0.25836181640625, 0.26973724365234375, 0.2811126708984375, 0.29248809814453125, 0.303863525390625, 0.31523895263671875, 0.3266143798828125, 0.33798980712890625, 0.349365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 4.0, 9.0, 7.0, 15.0, 8.0, 15.0, 23.0, 14.0, 16.0, 24.0, 31.0, 31.0, 37.0, 37.0, 38.0, 38.0, 28.0, 33.0, 39.0, 45.0, 1069.0, 35.0, 43.0, 37.0, 40.0, 26.0, 37.0, 24.0, 40.0, 23.0, 22.0, 22.0, 23.0, 19.0, 10.0, 13.0, 10.0, 6.0, 2.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.14959716796875, -2.0784912109375, -2.00738525390625, -1.936279296875, -1.86517333984375, -1.7940673828125, -1.72296142578125, -1.65185546875, -1.58074951171875, -1.5096435546875, -1.43853759765625, -1.367431640625, -1.29632568359375, -1.2252197265625, -1.15411376953125, -1.0830078125, -1.01190185546875, -0.9407958984375, -0.86968994140625, -0.798583984375, -0.72747802734375, -0.6563720703125, -0.58526611328125, -0.51416015625, -0.44305419921875, -0.3719482421875, -0.30084228515625, -0.229736328125, -0.15863037109375, -0.0875244140625, -0.01641845703125, 0.0546875, 0.12579345703125, 0.1968994140625, 0.26800537109375, 0.339111328125, 0.41021728515625, 0.4813232421875, 0.55242919921875, 0.62353515625, 0.69464111328125, 0.7657470703125, 0.83685302734375, 0.907958984375, 0.97906494140625, 1.0501708984375, 1.12127685546875, 1.1923828125, 1.26348876953125, 1.3345947265625, 1.40570068359375, 1.476806640625, 1.54791259765625, 1.6190185546875, 1.69012451171875, 1.76123046875, 1.83233642578125, 1.9034423828125, 1.97454833984375, 2.045654296875, 2.11676025390625, 2.1878662109375, 2.25897216796875, 2.330078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 16.0, 25.0, 49.0, 67.0, 121.0, 176.0, 342.0, 706.0, 1634.0, 4252.0, 12901.0, 50466.0, 248536.0, 1489727.0, 222880.0, 46285.0, 12175.0, 3798.0, 1490.0, 653.0, 345.0, 197.0, 105.0, 55.0, 34.0, 17.0, 14.0, 16.0, 13.0, 2.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6912612915039062, -0.6706085205078125, -0.6499557495117188, -0.629302978515625, -0.6086502075195312, -0.5879974365234375, -0.5673446655273438, -0.54669189453125, -0.5260391235351562, -0.5053863525390625, -0.48473358154296875, -0.464080810546875, -0.44342803955078125, -0.4227752685546875, -0.40212249755859375, -0.3814697265625, -0.36081695556640625, -0.3401641845703125, -0.31951141357421875, -0.298858642578125, -0.27820587158203125, -0.2575531005859375, -0.23690032958984375, -0.21624755859375, -0.19559478759765625, -0.1749420166015625, -0.15428924560546875, -0.133636474609375, -0.11298370361328125, -0.0923309326171875, -0.07167816162109375, -0.051025390625, -0.03037261962890625, -0.0097198486328125, 0.01093292236328125, 0.031585693359375, 0.05223846435546875, 0.0728912353515625, 0.09354400634765625, 0.11419677734375, 0.13484954833984375, 0.1555023193359375, 0.17615509033203125, 0.196807861328125, 0.21746063232421875, 0.2381134033203125, 0.25876617431640625, 0.2794189453125, 0.30007171630859375, 0.3207244873046875, 0.34137725830078125, 0.362030029296875, 0.38268280029296875, 0.4033355712890625, 0.42398834228515625, 0.44464111328125, 0.46529388427734375, 0.4859466552734375, 0.5065994262695312, 0.527252197265625, 0.5479049682617188, 0.5685577392578125, 0.5892105102539062, 0.60986328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 10.0, 17.0, 18.0, 24.0, 27.0, 62.0, 61.0, 88.0, 133.0, 139.0, 132.0, 68.0, 41.0, 26.0, 29.0, 14.0, 13.0, 10.0, 9.0, 6.0, 14.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.090576171875, -0.0881357192993164, -0.08569526672363281, -0.08325481414794922, -0.08081436157226562, -0.07837390899658203, -0.07593345642089844, -0.07349300384521484, -0.07105255126953125, -0.06861209869384766, -0.06617164611816406, -0.06373119354248047, -0.061290740966796875, -0.05885028839111328, -0.05640983581542969, -0.053969383239746094, -0.0515289306640625, -0.049088478088378906, -0.04664802551269531, -0.04420757293701172, -0.041767120361328125, -0.03932666778564453, -0.03688621520996094, -0.034445762634277344, -0.03200531005859375, -0.029564857482910156, -0.027124404907226562, -0.02468395233154297, -0.022243499755859375, -0.01980304718017578, -0.017362594604492188, -0.014922142028808594, -0.012481689453125, -0.010041236877441406, -0.0076007843017578125, -0.005160331726074219, -0.002719879150390625, -0.00027942657470703125, 0.0021610260009765625, 0.004601478576660156, 0.00704193115234375, 0.009482383728027344, 0.011922836303710938, 0.014363288879394531, 0.016803741455078125, 0.01924419403076172, 0.021684646606445312, 0.024125099182128906, 0.0265655517578125, 0.029006004333496094, 0.03144645690917969, 0.03388690948486328, 0.036327362060546875, 0.03876781463623047, 0.04120826721191406, 0.043648719787597656, 0.04608917236328125, 0.048529624938964844, 0.05097007751464844, 0.05341053009033203, 0.055850982666015625, 0.05829143524169922, 0.06073188781738281, 0.0631723403930664, 0.06561279296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 4.0, 7.0, 13.0, 10.0, 18.0, 35.0, 27.0, 32.0, 61.0, 83.0, 171.0, 317.0, 1021.0, 1026617.0, 18845.0, 568.0, 267.0, 123.0, 92.0, 54.0, 42.0, 30.0, 20.0, 17.0, 13.0, 6.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.646484375, -1.593017578125, -1.53955078125, -1.486083984375, -1.4326171875, -1.379150390625, -1.32568359375, -1.272216796875, -1.21875, -1.165283203125, -1.11181640625, -1.058349609375, -1.0048828125, -0.951416015625, -0.89794921875, -0.844482421875, -0.791015625, -0.737548828125, -0.68408203125, -0.630615234375, -0.5771484375, -0.523681640625, -0.47021484375, -0.416748046875, -0.36328125, -0.309814453125, -0.25634765625, -0.202880859375, -0.1494140625, -0.095947265625, -0.04248046875, 0.010986328125, 0.064453125, 0.117919921875, 0.17138671875, 0.224853515625, 0.2783203125, 0.331787109375, 0.38525390625, 0.438720703125, 0.4921875, 0.545654296875, 0.59912109375, 0.652587890625, 0.7060546875, 0.759521484375, 0.81298828125, 0.866455078125, 0.919921875, 0.973388671875, 1.02685546875, 1.080322265625, 1.1337890625, 1.187255859375, 1.24072265625, 1.294189453125, 1.34765625, 1.401123046875, 1.45458984375, 1.508056640625, 1.5615234375, 1.614990234375, 1.66845703125, 1.721923828125, 1.775390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 67.0, 617.0, 297.0, 27.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23715998232364655, -0.22576290369033813, -0.21436583995819092, -0.2029687613248825, -0.1915716826915741, -0.18017460405826569, -0.16877752542495728, -0.15738046169281006, -0.14598338305950165, -0.13458630442619324, -0.12318923324346542, -0.11179216206073761, -0.1003950834274292, -0.08899800479412079, -0.07760093361139297, -0.06620386242866516, -0.05480678379535675, -0.04340970888733864, -0.032012633979320526, -0.020615559071302414, -0.009218484163284302, 0.0021785907447338104, 0.013575665652751923, 0.024972736835479736, 0.03636981546878815, 0.04776689037680626, 0.05916396528482437, 0.07056103646755219, 0.0819581151008606, 0.093355193734169, 0.10475226491689682, 0.11614933609962463, 0.12754639983177185, 0.13894347846508026, 0.15034055709838867, 0.1617376208305359, 0.1731346994638443, 0.1845317780971527, 0.19592884182929993, 0.20732592046260834, 0.21872299909591675, 0.23012007772922516, 0.24151715636253357, 0.2529142200946808, 0.2643113136291504, 0.2757083773612976, 0.2871054410934448, 0.29850250482559204, 0.30989959836006165, 0.32129666209220886, 0.33269375562667847, 0.3440908193588257, 0.3554878830909729, 0.3668849766254425, 0.3782820403575897, 0.3896791338920593, 0.40107619762420654, 0.41247326135635376, 0.42387035489082336, 0.4352674186229706, 0.4466645121574402, 0.4580615758895874, 0.4694586396217346, 0.48085570335388184, 0.49225279688835144]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 13.0, 8.0, 9.0, 20.0, 13.0, 18.0, 23.0, 20.0, 38.0, 33.0, 44.0, 31.0, 42.0, 37.0, 44.0, 47.0, 50.0, 46.0, 36.0, 55.0, 48.0, 44.0, 38.0, 27.0, 35.0, 31.0, 22.0, 23.0, 28.0, 19.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05618172883987427, -0.05404782295227051, -0.051913920789957047, -0.049780018627643585, -0.047646112740039825, -0.045512206852436066, -0.043378304690122604, -0.04124440252780914, -0.03911049664020538, -0.036976590752601624, -0.03484268859028816, -0.0327087864279747, -0.03057488054037094, -0.02844097651541233, -0.02630707249045372, -0.02417316846549511, -0.0220392644405365, -0.01990536041557789, -0.017771456390619278, -0.015637552365660667, -0.013503648340702057, -0.011369744315743446, -0.009235840290784836, -0.007101936265826225, -0.004968032240867615, -0.002834128215909004, -0.0007002241909503937, 0.0014336798340082169, 0.0035675838589668274, 0.005701487883925438, 0.007835391908884048, 0.009969295933842659, 0.01210319995880127, 0.01423710398375988, 0.01637100800871849, 0.0185049120336771, 0.02063881605863571, 0.022772720083594322, 0.024906624108552933, 0.027040528133511543, 0.029174432158470154, 0.031308338046073914, 0.033442240208387375, 0.035576142370700836, 0.037710048258304596, 0.039843954145908356, 0.04197785630822182, 0.04411175847053528, 0.04624566435813904, 0.0483795702457428, 0.05051347240805626, 0.05264737457036972, 0.05478128045797348, 0.05691518634557724, 0.0590490885078907, 0.06118299067020416, 0.06331689655780792, 0.06545080244541168, 0.06758470833301544, 0.0697186067700386, 0.07185251265764236, 0.07398641854524612, 0.07612031698226929, 0.07825422286987305, 0.0803881287574768]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 0.0, 4.0, 1.0, 8.0, 9.0, 6.0, 11.0, 12.0, 18.0, 13.0, 21.0, 26.0, 33.0, 24.0, 31.0, 34.0, 41.0, 33.0, 43.0, 36.0, 46.0, 36.0, 49.0, 42.0, 30.0, 41.0, 40.0, 34.0, 37.0, 21.0, 29.0, 35.0, 23.0, 13.0, 27.0, 23.0, 18.0, 12.0, 9.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0], "bins": [-3.279296875, -3.18701171875, -3.0947265625, -3.00244140625, -2.91015625, -2.81787109375, -2.7255859375, -2.63330078125, -2.541015625, -2.44873046875, -2.3564453125, -2.26416015625, -2.171875, -2.07958984375, -1.9873046875, -1.89501953125, -1.802734375, -1.71044921875, -1.6181640625, -1.52587890625, -1.43359375, -1.34130859375, -1.2490234375, -1.15673828125, -1.064453125, -0.97216796875, -0.8798828125, -0.78759765625, -0.6953125, -0.60302734375, -0.5107421875, -0.41845703125, -0.326171875, -0.23388671875, -0.1416015625, -0.04931640625, 0.04296875, 0.13525390625, 0.2275390625, 0.31982421875, 0.412109375, 0.50439453125, 0.5966796875, 0.68896484375, 0.78125, 0.87353515625, 0.9658203125, 1.05810546875, 1.150390625, 1.24267578125, 1.3349609375, 1.42724609375, 1.51953125, 1.61181640625, 1.7041015625, 1.79638671875, 1.888671875, 1.98095703125, 2.0732421875, 2.16552734375, 2.2578125, 2.35009765625, 2.4423828125, 2.53466796875, 2.626953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 13.0, 15.0, 18.0, 32.0, 48.0, 65.0, 83.0, 122.0, 173.0, 267.0, 435.0, 698.0, 1106.0, 1843.0, 3475.0, 6632.0, 13107.0, 28071.0, 70064.0, 247232.0, 464830.0, 125851.0, 44263.0, 19315.0, 9263.0, 4871.0, 2616.0, 1538.0, 909.0, 524.0, 316.0, 238.0, 148.0, 107.0, 60.0, 58.0, 45.0, 24.0, 19.0, 13.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.6671142578125, -4.517822265625, -4.3685302734375, -4.21923828125, -4.0699462890625, -3.920654296875, -3.7713623046875, -3.6220703125, -3.4727783203125, -3.323486328125, -3.1741943359375, -3.02490234375, -2.8756103515625, -2.726318359375, -2.5770263671875, -2.427734375, -2.2784423828125, -2.129150390625, -1.9798583984375, -1.83056640625, -1.6812744140625, -1.531982421875, -1.3826904296875, -1.2333984375, -1.0841064453125, -0.934814453125, -0.7855224609375, -0.63623046875, -0.4869384765625, -0.337646484375, -0.1883544921875, -0.0390625, 0.1102294921875, 0.259521484375, 0.4088134765625, 0.55810546875, 0.7073974609375, 0.856689453125, 1.0059814453125, 1.1552734375, 1.3045654296875, 1.453857421875, 1.6031494140625, 1.75244140625, 1.9017333984375, 2.051025390625, 2.2003173828125, 2.349609375, 2.4989013671875, 2.648193359375, 2.7974853515625, 2.94677734375, 3.0960693359375, 3.245361328125, 3.3946533203125, 3.5439453125, 3.6932373046875, 3.842529296875, 3.9918212890625, 4.14111328125, 4.2904052734375, 4.439697265625, 4.5889892578125, 4.73828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 7.0, 3.0, 7.0, 12.0, 11.0, 13.0, 22.0, 25.0, 33.0, 34.0, 32.0, 46.0, 57.0, 44.0, 87.0, 158.0, 370.0, 1473.0, 151.0, 108.0, 60.0, 39.0, 28.0, 37.0, 32.0, 23.0, 21.0, 18.0, 12.0, 14.0, 14.0, 13.0, 10.0, 7.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.18896484375, -6.9326171875, -6.67626953125, -6.419921875, -6.16357421875, -5.9072265625, -5.65087890625, -5.39453125, -5.13818359375, -4.8818359375, -4.62548828125, -4.369140625, -4.11279296875, -3.8564453125, -3.60009765625, -3.34375, -3.08740234375, -2.8310546875, -2.57470703125, -2.318359375, -2.06201171875, -1.8056640625, -1.54931640625, -1.29296875, -1.03662109375, -0.7802734375, -0.52392578125, -0.267578125, -0.01123046875, 0.2451171875, 0.50146484375, 0.7578125, 1.01416015625, 1.2705078125, 1.52685546875, 1.783203125, 2.03955078125, 2.2958984375, 2.55224609375, 2.80859375, 3.06494140625, 3.3212890625, 3.57763671875, 3.833984375, 4.09033203125, 4.3466796875, 4.60302734375, 4.859375, 5.11572265625, 5.3720703125, 5.62841796875, 5.884765625, 6.14111328125, 6.3974609375, 6.65380859375, 6.91015625, 7.16650390625, 7.4228515625, 7.67919921875, 7.935546875, 8.19189453125, 8.4482421875, 8.70458984375, 8.9609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 12.0, 12.0, 9.0, 10.0, 11.0, 20.0, 34.0, 30.0, 61.0, 87.0, 121.0, 217.0, 293.0, 497.0, 1095.0, 9267.0, 2981498.0, 147223.0, 3147.0, 802.0, 429.0, 247.0, 158.0, 109.0, 86.0, 62.0, 37.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.46875, -21.783935546875, -21.09912109375, -20.414306640625, -19.7294921875, -19.044677734375, -18.35986328125, -17.675048828125, -16.990234375, -16.305419921875, -15.62060546875, -14.935791015625, -14.2509765625, -13.566162109375, -12.88134765625, -12.196533203125, -11.51171875, -10.826904296875, -10.14208984375, -9.457275390625, -8.7724609375, -8.087646484375, -7.40283203125, -6.718017578125, -6.033203125, -5.348388671875, -4.66357421875, -3.978759765625, -3.2939453125, -2.609130859375, -1.92431640625, -1.239501953125, -0.5546875, 0.130126953125, 0.81494140625, 1.499755859375, 2.1845703125, 2.869384765625, 3.55419921875, 4.239013671875, 4.923828125, 5.608642578125, 6.29345703125, 6.978271484375, 7.6630859375, 8.347900390625, 9.03271484375, 9.717529296875, 10.40234375, 11.087158203125, 11.77197265625, 12.456787109375, 13.1416015625, 13.826416015625, 14.51123046875, 15.196044921875, 15.880859375, 16.565673828125, 17.25048828125, 17.935302734375, 18.6201171875, 19.304931640625, 19.98974609375, 20.674560546875, 21.359375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 15.0, 34.0, 103.0, 142.0, 205.0, 192.0, 130.0, 88.0, 44.0, 18.0, 12.0, 3.0, 4.0], "bins": [-57.1346435546875, -56.117767333984375, -55.10089111328125, -54.08401107788086, -53.067134857177734, -52.05025863647461, -51.033382415771484, -50.01650619506836, -48.99962615966797, -47.982749938964844, -46.96587371826172, -45.94899368286133, -44.9321174621582, -43.91524124145508, -42.89836502075195, -41.88148880004883, -40.8646125793457, -39.84773635864258, -38.83086013793945, -37.81398010253906, -36.79710388183594, -35.78022766113281, -34.76335144042969, -33.74647521972656, -32.72959899902344, -31.712722778320312, -30.695844650268555, -29.67896842956543, -28.662090301513672, -27.645214080810547, -26.628337860107422, -25.611461639404297, -24.59458351135254, -23.577707290649414, -22.560829162597656, -21.54395294189453, -20.527076721191406, -19.51019859313965, -18.493322372436523, -17.476444244384766, -16.45956802368164, -15.4426908493042, -14.425813674926758, -13.408937454223633, -12.392060279846191, -11.37518310546875, -10.358306884765625, -9.341429710388184, -8.324552536010742, -7.307675361633301, -6.290798664093018, -5.273921966552734, -4.257044792175293, -3.2401676177978516, -2.2232909202575684, -1.2064142227172852, -0.18953657150268555, 0.8273403644561768, 1.844217300415039, 2.8610942363739014, 3.8779711723327637, 4.894848346710205, 5.911725044250488, 6.9286017417907715, 7.945478916168213]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 13.0, 14.0, 15.0, 19.0, 13.0, 24.0, 29.0, 26.0, 28.0, 24.0, 28.0, 37.0, 46.0, 36.0, 52.0, 39.0, 37.0, 37.0, 47.0, 41.0, 28.0, 38.0, 39.0, 34.0, 29.0, 26.0, 31.0, 19.0, 15.0, 19.0, 13.0, 17.0, 13.0, 5.0, 10.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.634201049804688, -22.898351669311523, -22.16250228881836, -21.426652908325195, -20.69080352783203, -19.9549560546875, -19.219104766845703, -18.483257293701172, -17.747407913208008, -17.011558532714844, -16.27570915222168, -15.539859771728516, -14.804011344909668, -14.068161964416504, -13.33231258392334, -12.596464157104492, -11.860613822937012, -11.124764442443848, -10.388915061950684, -9.653066635131836, -8.917217254638672, -8.181367874145508, -7.445518493652344, -6.709669589996338, -5.973820209503174, -5.23797082901001, -4.502121925354004, -3.76627254486084, -3.030423402786255, -2.29457426071167, -1.5587248802185059, -0.8228759765625, -0.08702659606933594, 0.6488226056098938, 1.3846718072891235, 2.120521068572998, 2.856370210647583, 3.592219352722168, 4.328068733215332, 5.063917636871338, 5.799767017364502, 6.535616397857666, 7.271465301513672, 8.007314682006836, 8.7431640625, 9.479013442993164, 10.214862823486328, 10.950711250305176, 11.68656063079834, 12.422410011291504, 13.158259391784668, 13.894107818603516, 14.62995719909668, 15.365806579589844, 16.101655960083008, 16.837505340576172, 17.573354721069336, 18.3092041015625, 19.045053482055664, 19.780902862548828, 20.516752243041992, 21.252601623535156, 21.988449096679688, 22.72429847717285, 23.460147857666016]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 14.0, 17.0, 17.0, 12.0, 17.0, 21.0, 25.0, 21.0, 33.0, 44.0, 42.0, 45.0, 40.0, 46.0, 55.0, 46.0, 47.0, 46.0, 50.0, 42.0, 37.0, 27.0, 36.0, 22.0, 26.0, 26.0, 18.0, 19.0, 12.0, 13.0, 20.0, 12.0, 10.0, 10.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20172119140625, -3.0909423828125, -2.98016357421875, -2.869384765625, -2.75860595703125, -2.6478271484375, -2.53704833984375, -2.42626953125, -2.31549072265625, -2.2047119140625, -2.09393310546875, -1.983154296875, -1.87237548828125, -1.7615966796875, -1.65081787109375, -1.5400390625, -1.42926025390625, -1.3184814453125, -1.20770263671875, -1.096923828125, -0.98614501953125, -0.8753662109375, -0.76458740234375, -0.65380859375, -0.54302978515625, -0.4322509765625, -0.32147216796875, -0.210693359375, -0.09991455078125, 0.0108642578125, 0.12164306640625, 0.232421875, 0.34320068359375, 0.4539794921875, 0.56475830078125, 0.675537109375, 0.78631591796875, 0.8970947265625, 1.00787353515625, 1.11865234375, 1.22943115234375, 1.3402099609375, 1.45098876953125, 1.561767578125, 1.67254638671875, 1.7833251953125, 1.89410400390625, 2.0048828125, 2.11566162109375, 2.2264404296875, 2.33721923828125, 2.447998046875, 2.55877685546875, 2.6695556640625, 2.78033447265625, 2.89111328125, 3.00189208984375, 3.1126708984375, 3.22344970703125, 3.334228515625, 3.44500732421875, 3.5557861328125, 3.66656494140625, 3.77734375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 11.0, 26.0, 26.0, 47.0, 53.0, 74.0, 117.0, 166.0, 315.0, 534.0, 1082.0, 2276.0, 5476.0, 19693.0, 511298.0, 3447242.0, 183814.0, 13588.0, 4378.0, 1870.0, 873.0, 465.0, 293.0, 166.0, 104.0, 72.0, 61.0, 36.0, 28.0, 17.0, 12.0, 12.0, 4.0, 16.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.15625, -12.8043212890625, -12.452392578125, -12.1004638671875, -11.74853515625, -11.3966064453125, -11.044677734375, -10.6927490234375, -10.3408203125, -9.9888916015625, -9.636962890625, -9.2850341796875, -8.93310546875, -8.5811767578125, -8.229248046875, -7.8773193359375, -7.525390625, -7.1734619140625, -6.821533203125, -6.4696044921875, -6.11767578125, -5.7657470703125, -5.413818359375, -5.0618896484375, -4.7099609375, -4.3580322265625, -4.006103515625, -3.6541748046875, -3.30224609375, -2.9503173828125, -2.598388671875, -2.2464599609375, -1.89453125, -1.5426025390625, -1.190673828125, -0.8387451171875, -0.48681640625, -0.1348876953125, 0.217041015625, 0.5689697265625, 0.9208984375, 1.2728271484375, 1.624755859375, 1.9766845703125, 2.32861328125, 2.6805419921875, 3.032470703125, 3.3843994140625, 3.736328125, 4.0882568359375, 4.440185546875, 4.7921142578125, 5.14404296875, 5.4959716796875, 5.847900390625, 6.1998291015625, 6.5517578125, 6.9036865234375, 7.255615234375, 7.6075439453125, 7.95947265625, 8.3114013671875, 8.663330078125, 9.0152587890625, 9.3671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 11.0, 12.0, 13.0, 25.0, 24.0, 58.0, 61.0, 77.0, 85.0, 123.0, 142.0, 208.0, 273.0, 392.0, 447.0, 487.0, 386.0, 319.0, 222.0, 171.0, 132.0, 93.0, 81.0, 62.0, 46.0, 35.0, 23.0, 13.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.06787109375, -3.9130859375, -3.75830078125, -3.603515625, -3.44873046875, -3.2939453125, -3.13916015625, -2.984375, -2.82958984375, -2.6748046875, -2.52001953125, -2.365234375, -2.21044921875, -2.0556640625, -1.90087890625, -1.74609375, -1.59130859375, -1.4365234375, -1.28173828125, -1.126953125, -0.97216796875, -0.8173828125, -0.66259765625, -0.5078125, -0.35302734375, -0.1982421875, -0.04345703125, 0.111328125, 0.26611328125, 0.4208984375, 0.57568359375, 0.73046875, 0.88525390625, 1.0400390625, 1.19482421875, 1.349609375, 1.50439453125, 1.6591796875, 1.81396484375, 1.96875, 2.12353515625, 2.2783203125, 2.43310546875, 2.587890625, 2.74267578125, 2.8974609375, 3.05224609375, 3.20703125, 3.36181640625, 3.5166015625, 3.67138671875, 3.826171875, 3.98095703125, 4.1357421875, 4.29052734375, 4.4453125, 4.60009765625, 4.7548828125, 4.90966796875, 5.064453125, 5.21923828125, 5.3740234375, 5.52880859375, 5.68359375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 12.0, 7.0, 22.0, 28.0, 48.0, 61.0, 85.0, 154.0, 246.0, 496.0, 1003.0, 2605.0, 9259.0, 86348.0, 3019085.0, 1025990.0, 38825.0, 5963.0, 1979.0, 918.0, 411.0, 266.0, 161.0, 88.0, 70.0, 42.0, 29.0, 22.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9140625, -12.5728759765625, -12.231689453125, -11.8905029296875, -11.54931640625, -11.2081298828125, -10.866943359375, -10.5257568359375, -10.1845703125, -9.8433837890625, -9.502197265625, -9.1610107421875, -8.81982421875, -8.4786376953125, -8.137451171875, -7.7962646484375, -7.455078125, -7.1138916015625, -6.772705078125, -6.4315185546875, -6.09033203125, -5.7491455078125, -5.407958984375, -5.0667724609375, -4.7255859375, -4.3843994140625, -4.043212890625, -3.7020263671875, -3.36083984375, -3.0196533203125, -2.678466796875, -2.3372802734375, -1.99609375, -1.6549072265625, -1.313720703125, -0.9725341796875, -0.63134765625, -0.2901611328125, 0.051025390625, 0.3922119140625, 0.7333984375, 1.0745849609375, 1.415771484375, 1.7569580078125, 2.09814453125, 2.4393310546875, 2.780517578125, 3.1217041015625, 3.462890625, 3.8040771484375, 4.145263671875, 4.4864501953125, 4.82763671875, 5.1688232421875, 5.510009765625, 5.8511962890625, 6.1923828125, 6.5335693359375, 6.874755859375, 7.2159423828125, 7.55712890625, 7.8983154296875, 8.239501953125, 8.5806884765625, 8.921875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 53.0, 312.0, 465.0, 137.0, 33.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.54766082763672, -120.54611206054688, -117.5445556640625, -114.54300689697266, -111.54145812988281, -108.53990173339844, -105.5383529663086, -102.53680419921875, -99.53524780273438, -96.53369903564453, -93.53214263916016, -90.53059387207031, -87.52904510498047, -84.5274887084961, -81.52593994140625, -78.52438354492188, -75.52284240722656, -72.52129364013672, -69.51973724365234, -66.5181884765625, -63.51663589477539, -60.51508331298828, -57.51353454589844, -54.51198196411133, -51.51042938232422, -48.50887680053711, -45.507328033447266, -42.505775451660156, -39.50422286987305, -36.50267028808594, -33.501121520996094, -30.499568939208984, -27.498016357421875, -24.4964656829834, -21.49491310119629, -18.493362426757812, -15.49181079864502, -12.490259170532227, -9.48870849609375, -6.487155914306641, -3.485605239868164, -0.4840538501739502, 2.5174975395202637, 5.519048690795898, 8.520600318908691, 11.522151947021484, 14.523702621459961, 17.52525520324707, 20.526805877685547, 23.528356552124023, 26.529909133911133, 29.53145980834961, 32.53301239013672, 35.53456115722656, 38.53611373901367, 41.53766632080078, 44.539215087890625, 47.540767669677734, 50.54231643676758, 53.54386901855469, 56.5454216003418, 59.546974182128906, 62.54852294921875, 65.55007934570312, 68.55162811279297]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 7.0, 15.0, 6.0, 11.0, 10.0, 17.0, 16.0, 21.0, 21.0, 34.0, 15.0, 35.0, 27.0, 28.0, 37.0, 37.0, 30.0, 39.0, 35.0, 29.0, 48.0, 43.0, 35.0, 41.0, 39.0, 30.0, 28.0, 36.0, 30.0, 25.0, 25.0, 24.0, 14.0, 15.0, 12.0, 15.0, 11.0, 12.0, 6.0, 10.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-21.14389419555664, -20.527685165405273, -19.911476135253906, -19.295265197753906, -18.67905616760254, -18.062847137451172, -17.446636199951172, -16.830427169799805, -16.214218139648438, -15.59800910949707, -14.981799125671387, -14.365589141845703, -13.749380111694336, -13.133171081542969, -12.516961097717285, -11.900751113891602, -11.284542083740234, -10.668333053588867, -10.052123069763184, -9.4359130859375, -8.819704055786133, -8.203495025634766, -7.587285041809082, -6.971075534820557, -6.354866027832031, -5.738656520843506, -5.1224470138549805, -4.506237506866455, -3.8900279998779297, -3.2738184928894043, -2.657608985900879, -2.0413994789123535, -1.4251899719238281, -0.8089804649353027, -0.19277095794677734, 0.42343854904174805, 1.0396480560302734, 1.6558575630187988, 2.272067070007324, 2.8882765769958496, 3.504486083984375, 4.1206955909729, 4.736905097961426, 5.353114604949951, 5.969324111938477, 6.585533618927002, 7.201743125915527, 7.817952632904053, 8.434162139892578, 9.050371170043945, 9.666581153869629, 10.282791137695312, 10.89900016784668, 11.515209197998047, 12.13141918182373, 12.747629165649414, 13.363838195800781, 13.980047225952148, 14.596257209777832, 15.212467193603516, 15.828676223754883, 16.44488525390625, 17.06109619140625, 17.677305221557617, 18.293514251708984]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 5.0, 8.0, 13.0, 17.0, 18.0, 23.0, 23.0, 32.0, 38.0, 28.0, 33.0, 49.0, 59.0, 43.0, 59.0, 57.0, 50.0, 54.0, 50.0, 45.0, 39.0, 38.0, 48.0, 24.0, 29.0, 23.0, 18.0, 19.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.099884033203125, -2.99859619140625, -2.897308349609375, -2.7960205078125, -2.694732666015625, -2.59344482421875, -2.492156982421875, -2.390869140625, -2.289581298828125, -2.18829345703125, -2.087005615234375, -1.9857177734375, -1.884429931640625, -1.78314208984375, -1.681854248046875, -1.58056640625, -1.479278564453125, -1.37799072265625, -1.276702880859375, -1.1754150390625, -1.074127197265625, -0.97283935546875, -0.871551513671875, -0.770263671875, -0.668975830078125, -0.56768798828125, -0.466400146484375, -0.3651123046875, -0.263824462890625, -0.16253662109375, -0.061248779296875, 0.0400390625, 0.141326904296875, 0.24261474609375, 0.343902587890625, 0.4451904296875, 0.546478271484375, 0.64776611328125, 0.749053955078125, 0.850341796875, 0.951629638671875, 1.05291748046875, 1.154205322265625, 1.2554931640625, 1.356781005859375, 1.45806884765625, 1.559356689453125, 1.66064453125, 1.761932373046875, 1.86322021484375, 1.964508056640625, 2.0657958984375, 2.167083740234375, 2.26837158203125, 2.369659423828125, 2.470947265625, 2.572235107421875, 2.67352294921875, 2.774810791015625, 2.8760986328125, 2.977386474609375, 3.07867431640625, 3.179962158203125, 3.28125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 10.0, 5.0, 8.0, 17.0, 11.0, 27.0, 60.0, 84.0, 116.0, 192.0, 277.0, 411.0, 639.0, 1125.0, 1806.0, 3001.0, 5433.0, 9860.0, 19505.0, 43727.0, 122384.0, 402828.0, 284987.0, 84734.0, 32958.0, 15175.0, 8073.0, 4439.0, 2553.0, 1571.0, 910.0, 554.0, 399.0, 247.0, 148.0, 90.0, 63.0, 35.0, 34.0, 13.0, 19.0, 7.0, 9.0, 9.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7116470336914062, -0.6869659423828125, -0.6622848510742188, -0.637603759765625, -0.6129226684570312, -0.5882415771484375, -0.5635604858398438, -0.53887939453125, -0.5141983032226562, -0.4895172119140625, -0.46483612060546875, -0.440155029296875, -0.41547393798828125, -0.3907928466796875, -0.36611175537109375, -0.3414306640625, -0.31674957275390625, -0.2920684814453125, -0.26738739013671875, -0.242706298828125, -0.21802520751953125, -0.1933441162109375, -0.16866302490234375, -0.14398193359375, -0.11930084228515625, -0.0946197509765625, -0.06993865966796875, -0.045257568359375, -0.02057647705078125, 0.0041046142578125, 0.02878570556640625, 0.053466796875, 0.07814788818359375, 0.1028289794921875, 0.12751007080078125, 0.152191162109375, 0.17687225341796875, 0.2015533447265625, 0.22623443603515625, 0.25091552734375, 0.27559661865234375, 0.3002777099609375, 0.32495880126953125, 0.349639892578125, 0.37432098388671875, 0.3990020751953125, 0.42368316650390625, 0.4483642578125, 0.47304534912109375, 0.4977264404296875, 0.5224075317382812, 0.547088623046875, 0.5717697143554688, 0.5964508056640625, 0.6211318969726562, 0.64581298828125, 0.6704940795898438, 0.6951751708984375, 0.7198562622070312, 0.744537353515625, 0.7692184448242188, 0.7938995361328125, 0.8185806274414062, 0.84326171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 18.0, 16.0, 17.0, 16.0, 12.0, 12.0, 19.0, 31.0, 33.0, 44.0, 51.0, 30.0, 41.0, 39.0, 52.0, 49.0, 1070.0, 38.0, 50.0, 47.0, 31.0, 38.0, 36.0, 32.0, 29.0, 30.0, 22.0, 27.0, 18.0, 7.0, 17.0, 11.0, 6.0, 6.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.33984375, -2.2772064208984375, -2.214569091796875, -2.1519317626953125, -2.08929443359375, -2.0266571044921875, -1.964019775390625, -1.9013824462890625, -1.8387451171875, -1.7761077880859375, -1.713470458984375, -1.6508331298828125, -1.58819580078125, -1.5255584716796875, -1.462921142578125, -1.4002838134765625, -1.337646484375, -1.2750091552734375, -1.212371826171875, -1.1497344970703125, -1.08709716796875, -1.0244598388671875, -0.961822509765625, -0.8991851806640625, -0.8365478515625, -0.7739105224609375, -0.711273193359375, -0.6486358642578125, -0.58599853515625, -0.5233612060546875, -0.460723876953125, -0.3980865478515625, -0.33544921875, -0.2728118896484375, -0.210174560546875, -0.1475372314453125, -0.08489990234375, -0.0222625732421875, 0.040374755859375, 0.1030120849609375, 0.1656494140625, 0.2282867431640625, 0.290924072265625, 0.3535614013671875, 0.41619873046875, 0.4788360595703125, 0.541473388671875, 0.6041107177734375, 0.666748046875, 0.7293853759765625, 0.792022705078125, 0.8546600341796875, 0.91729736328125, 0.9799346923828125, 1.042572021484375, 1.1052093505859375, 1.1678466796875, 1.2304840087890625, 1.293121337890625, 1.3557586669921875, 1.41839599609375, 1.4810333251953125, 1.543670654296875, 1.6063079833984375, 1.6689453125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 13.0, 9.0, 22.0, 33.0, 47.0, 69.0, 107.0, 144.0, 198.0, 283.0, 424.0, 630.0, 983.0, 1711.0, 3000.0, 5655.0, 12262.0, 30611.0, 100832.0, 623720.0, 1128978.0, 122917.0, 35879.0, 13728.0, 6422.0, 3326.0, 1815.0, 1153.0, 738.0, 429.0, 294.0, 203.0, 159.0, 76.0, 62.0, 43.0, 37.0, 28.0, 25.0, 13.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5236740112304688, -0.5068206787109375, -0.48996734619140625, -0.473114013671875, -0.45626068115234375, -0.4394073486328125, -0.42255401611328125, -0.40570068359375, -0.38884735107421875, -0.3719940185546875, -0.35514068603515625, -0.338287353515625, -0.32143402099609375, -0.3045806884765625, -0.28772735595703125, -0.2708740234375, -0.25402069091796875, -0.2371673583984375, -0.22031402587890625, -0.203460693359375, -0.18660736083984375, -0.1697540283203125, -0.15290069580078125, -0.13604736328125, -0.11919403076171875, -0.1023406982421875, -0.08548736572265625, -0.068634033203125, -0.05178070068359375, -0.0349273681640625, -0.01807403564453125, -0.001220703125, 0.01563262939453125, 0.0324859619140625, 0.04933929443359375, 0.066192626953125, 0.08304595947265625, 0.0998992919921875, 0.11675262451171875, 0.13360595703125, 0.15045928955078125, 0.1673126220703125, 0.18416595458984375, 0.201019287109375, 0.21787261962890625, 0.2347259521484375, 0.25157928466796875, 0.2684326171875, 0.28528594970703125, 0.3021392822265625, 0.31899261474609375, 0.335845947265625, 0.35269927978515625, 0.3695526123046875, 0.38640594482421875, 0.40325927734375, 0.42011260986328125, 0.4369659423828125, 0.45381927490234375, 0.470672607421875, 0.48752593994140625, 0.5043792724609375, 0.5212326049804688, 0.5380859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 15.0, 16.0, 15.0, 10.0, 22.0, 21.0, 37.0, 41.0, 90.0, 161.0, 186.0, 139.0, 55.0, 30.0, 21.0, 27.0, 18.0, 15.0, 16.0, 10.0, 8.0, 7.0, 1.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08339881896972656, -0.08110427856445312, -0.07880973815917969, -0.07651519775390625, -0.07422065734863281, -0.07192611694335938, -0.06963157653808594, -0.0673370361328125, -0.06504249572753906, -0.06274795532226562, -0.06045341491699219, -0.05815887451171875, -0.05586433410644531, -0.053569793701171875, -0.05127525329589844, -0.048980712890625, -0.04668617248535156, -0.044391632080078125, -0.04209709167480469, -0.03980255126953125, -0.03750801086425781, -0.035213470458984375, -0.03291893005371094, -0.0306243896484375, -0.028329849243164062, -0.026035308837890625, -0.023740768432617188, -0.02144622802734375, -0.019151687622070312, -0.016857147216796875, -0.014562606811523438, -0.01226806640625, -0.009973526000976562, -0.007678985595703125, -0.0053844451904296875, -0.00308990478515625, -0.0007953643798828125, 0.001499176025390625, 0.0037937164306640625, 0.0060882568359375, 0.008382797241210938, 0.010677337646484375, 0.012971878051757812, 0.01526641845703125, 0.017560958862304688, 0.019855499267578125, 0.022150039672851562, 0.024444580078125, 0.026739120483398438, 0.029033660888671875, 0.03132820129394531, 0.03362274169921875, 0.03591728210449219, 0.038211822509765625, 0.04050636291503906, 0.0428009033203125, 0.04509544372558594, 0.047389984130859375, 0.04968452453613281, 0.05197906494140625, 0.05427360534667969, 0.056568145751953125, 0.05886268615722656, 0.0611572265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 6.0, 11.0, 8.0, 14.0, 26.0, 26.0, 29.0, 48.0, 55.0, 74.0, 126.0, 212.0, 422.0, 2074.0, 1021993.0, 21895.0, 692.0, 274.0, 184.0, 86.0, 56.0, 48.0, 44.0, 40.0, 21.0, 17.0, 13.0, 12.0, 7.0, 7.0, 4.0, 6.0, 8.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1769256591796875, -1.131195068359375, -1.0854644775390625, -1.03973388671875, -0.9940032958984375, -0.948272705078125, -0.9025421142578125, -0.8568115234375, -0.8110809326171875, -0.765350341796875, -0.7196197509765625, -0.67388916015625, -0.6281585693359375, -0.582427978515625, -0.5366973876953125, -0.490966796875, -0.4452362060546875, -0.399505615234375, -0.3537750244140625, -0.30804443359375, -0.2623138427734375, -0.216583251953125, -0.1708526611328125, -0.1251220703125, -0.0793914794921875, -0.033660888671875, 0.0120697021484375, 0.05780029296875, 0.1035308837890625, 0.149261474609375, 0.1949920654296875, 0.24072265625, 0.2864532470703125, 0.332183837890625, 0.3779144287109375, 0.42364501953125, 0.4693756103515625, 0.515106201171875, 0.5608367919921875, 0.6065673828125, 0.6522979736328125, 0.698028564453125, 0.7437591552734375, 0.78948974609375, 0.8352203369140625, 0.880950927734375, 0.9266815185546875, 0.972412109375, 1.0181427001953125, 1.063873291015625, 1.1096038818359375, 1.15533447265625, 1.2010650634765625, 1.246795654296875, 1.2925262451171875, 1.3382568359375, 1.3839874267578125, 1.429718017578125, 1.4754486083984375, 1.52117919921875, 1.5669097900390625, 1.612640380859375, 1.6583709716796875, 1.7041015625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 48.0, 716.0, 239.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27755460143089294, -0.2641831934452057, -0.25081175565719604, -0.2374403476715088, -0.22406893968582153, -0.21069751679897308, -0.19732609391212463, -0.18395468592643738, -0.17058326303958893, -0.15721184015274048, -0.14384043216705322, -0.13046900928020477, -0.11709759384393692, -0.10372617840766907, -0.09035475552082062, -0.07698334008455276, -0.06361192464828491, -0.05024050921201706, -0.03686909005045891, -0.023497670888900757, -0.010126255452632904, 0.0032451599836349487, 0.0166165828704834, 0.02998799830675125, 0.043359413743019104, 0.05673082917928696, 0.07010224461555481, 0.08347366750240326, 0.09684508293867111, 0.11021649837493896, 0.12358792126178741, 0.13695934414863586, 0.15033072233200073, 0.16370214521884918, 0.17707355320453644, 0.1904449760913849, 0.20381638407707214, 0.2171878069639206, 0.23055922985076904, 0.2439306378364563, 0.25730204582214355, 0.2706734538078308, 0.28404489159584045, 0.2974162995815277, 0.31078770756721497, 0.3241591453552246, 0.33753055334091187, 0.3509019613265991, 0.36427339911460876, 0.377644807100296, 0.39101624488830566, 0.4043876528739929, 0.4177590608596802, 0.43113046884536743, 0.4445019066333771, 0.45787331461906433, 0.471244752407074, 0.48461616039276123, 0.4979875981807709, 0.5113589763641357, 0.5247304439544678, 0.538101851940155, 0.5514732599258423, 0.5648446679115295, 0.5782160758972168]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 11.0, 24.0, 19.0, 19.0, 25.0, 28.0, 31.0, 34.0, 32.0, 34.0, 38.0, 41.0, 39.0, 60.0, 45.0, 47.0, 48.0, 41.0, 37.0, 34.0, 44.0, 28.0, 29.0, 21.0, 20.0, 25.0, 20.0, 13.0, 13.0, 15.0, 16.0, 8.0, 4.0, 10.0, 6.0, 7.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-0.09314745664596558, -0.09059496223926544, -0.0880424752831459, -0.08548998087644577, -0.08293749392032623, -0.0803849995136261, -0.07783250510692596, -0.07528001070022583, -0.07272752374410629, -0.07017502933740616, -0.06762254238128662, -0.06507004797458649, -0.06251755356788635, -0.059965066611766815, -0.05741257220506668, -0.054860081523656845, -0.05230759084224701, -0.04975510016083717, -0.04720260947942734, -0.0446501150727272, -0.04209762439131737, -0.03954513370990753, -0.0369926393032074, -0.03444014862179756, -0.031887657940387726, -0.02933516725897789, -0.026782674714922905, -0.02423018217086792, -0.021677691489458084, -0.01912520080804825, -0.016572708263993263, -0.014020215719938278, -0.011467725038528442, -0.008915233425796032, -0.0063627418130636215, -0.003810250200331211, -0.0012577585875988007, 0.0012947330251336098, 0.00384722463786602, 0.006399717181921005, 0.008952207863330841, 0.011504699476063251, 0.014057191088795662, 0.016609683632850647, 0.019162174314260483, 0.02171466499567032, 0.024267157539725304, 0.02681965008378029, 0.029372140765190125, 0.03192463144659996, 0.034477122128009796, 0.03702961653470993, 0.039582107216119766, 0.0421345978975296, 0.044687092304229736, 0.04723958298563957, 0.04979207366704941, 0.052344564348459244, 0.05489705502986908, 0.057449549436569214, 0.06000204011797905, 0.06255453079938889, 0.06510702520608902, 0.06765951216220856, 0.07021200656890869]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 11.0, 8.0, 15.0, 17.0, 14.0, 17.0, 30.0, 21.0, 27.0, 32.0, 38.0, 42.0, 38.0, 51.0, 50.0, 60.0, 56.0, 53.0, 53.0, 39.0, 48.0, 39.0, 45.0, 39.0, 27.0, 25.0, 23.0, 15.0, 12.0, 15.0, 10.0, 11.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.443359375, -3.34259033203125, -3.2418212890625, -3.14105224609375, -3.040283203125, -2.93951416015625, -2.8387451171875, -2.73797607421875, -2.63720703125, -2.53643798828125, -2.4356689453125, -2.33489990234375, -2.234130859375, -2.13336181640625, -2.0325927734375, -1.93182373046875, -1.8310546875, -1.73028564453125, -1.6295166015625, -1.52874755859375, -1.427978515625, -1.32720947265625, -1.2264404296875, -1.12567138671875, -1.02490234375, -0.92413330078125, -0.8233642578125, -0.72259521484375, -0.621826171875, -0.52105712890625, -0.4202880859375, -0.31951904296875, -0.21875, -0.11798095703125, -0.0172119140625, 0.08355712890625, 0.184326171875, 0.28509521484375, 0.3858642578125, 0.48663330078125, 0.58740234375, 0.68817138671875, 0.7889404296875, 0.88970947265625, 0.990478515625, 1.09124755859375, 1.1920166015625, 1.29278564453125, 1.3935546875, 1.49432373046875, 1.5950927734375, 1.69586181640625, 1.796630859375, 1.89739990234375, 1.9981689453125, 2.09893798828125, 2.19970703125, 2.30047607421875, 2.4012451171875, 2.50201416015625, 2.602783203125, 2.70355224609375, 2.8043212890625, 2.90509033203125, 3.005859375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 9.0, 6.0, 8.0, 14.0, 18.0, 33.0, 41.0, 69.0, 78.0, 95.0, 167.0, 250.0, 374.0, 569.0, 905.0, 1574.0, 2725.0, 5337.0, 11255.0, 27577.0, 83778.0, 291965.0, 411097.0, 137682.0, 41363.0, 15774.0, 7082.0, 3625.0, 1993.0, 1104.0, 688.0, 433.0, 253.0, 182.0, 134.0, 85.0, 64.0, 34.0, 33.0, 27.0, 19.0, 6.0, 13.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.056640625, -2.967254638671875, -2.87786865234375, -2.788482666015625, -2.6990966796875, -2.609710693359375, -2.52032470703125, -2.430938720703125, -2.341552734375, -2.252166748046875, -2.16278076171875, -2.073394775390625, -1.9840087890625, -1.894622802734375, -1.80523681640625, -1.715850830078125, -1.62646484375, -1.537078857421875, -1.44769287109375, -1.358306884765625, -1.2689208984375, -1.179534912109375, -1.09014892578125, -1.000762939453125, -0.911376953125, -0.821990966796875, -0.73260498046875, -0.643218994140625, -0.5538330078125, -0.464447021484375, -0.37506103515625, -0.285675048828125, -0.1962890625, -0.106903076171875, -0.01751708984375, 0.071868896484375, 0.1612548828125, 0.250640869140625, 0.34002685546875, 0.429412841796875, 0.518798828125, 0.608184814453125, 0.69757080078125, 0.786956787109375, 0.8763427734375, 0.965728759765625, 1.05511474609375, 1.144500732421875, 1.23388671875, 1.323272705078125, 1.41265869140625, 1.502044677734375, 1.5914306640625, 1.680816650390625, 1.77020263671875, 1.859588623046875, 1.948974609375, 2.038360595703125, 2.12774658203125, 2.217132568359375, 2.3065185546875, 2.395904541015625, 2.48529052734375, 2.574676513671875, 2.6640625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 12.0, 17.0, 19.0, 18.0, 23.0, 22.0, 25.0, 35.0, 30.0, 50.0, 70.0, 65.0, 151.0, 342.0, 1516.0, 173.0, 88.0, 59.0, 47.0, 44.0, 38.0, 31.0, 25.0, 30.0, 20.0, 17.0, 20.0, 8.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.81170654296875, -7.5609130859375, -7.31011962890625, -7.059326171875, -6.80853271484375, -6.5577392578125, -6.30694580078125, -6.05615234375, -5.80535888671875, -5.5545654296875, -5.30377197265625, -5.052978515625, -4.80218505859375, -4.5513916015625, -4.30059814453125, -4.0498046875, -3.79901123046875, -3.5482177734375, -3.29742431640625, -3.046630859375, -2.79583740234375, -2.5450439453125, -2.29425048828125, -2.04345703125, -1.79266357421875, -1.5418701171875, -1.29107666015625, -1.040283203125, -0.78948974609375, -0.5386962890625, -0.28790283203125, -0.037109375, 0.21368408203125, 0.4644775390625, 0.71527099609375, 0.966064453125, 1.21685791015625, 1.4676513671875, 1.71844482421875, 1.96923828125, 2.22003173828125, 2.4708251953125, 2.72161865234375, 2.972412109375, 3.22320556640625, 3.4739990234375, 3.72479248046875, 3.9755859375, 4.22637939453125, 4.4771728515625, 4.72796630859375, 4.978759765625, 5.22955322265625, 5.4803466796875, 5.73114013671875, 5.98193359375, 6.23272705078125, 6.4835205078125, 6.73431396484375, 6.985107421875, 7.23590087890625, 7.4866943359375, 7.73748779296875, 7.98828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 7.0, 8.0, 9.0, 14.0, 17.0, 33.0, 32.0, 33.0, 61.0, 83.0, 95.0, 192.0, 281.0, 517.0, 1243.0, 49335.0, 3087497.0, 4384.0, 786.0, 393.0, 213.0, 133.0, 96.0, 60.0, 39.0, 36.0, 31.0, 20.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.671142578125, -16.17041015625, -15.669677734375, -15.1689453125, -14.668212890625, -14.16748046875, -13.666748046875, -13.166015625, -12.665283203125, -12.16455078125, -11.663818359375, -11.1630859375, -10.662353515625, -10.16162109375, -9.660888671875, -9.16015625, -8.659423828125, -8.15869140625, -7.657958984375, -7.1572265625, -6.656494140625, -6.15576171875, -5.655029296875, -5.154296875, -4.653564453125, -4.15283203125, -3.652099609375, -3.1513671875, -2.650634765625, -2.14990234375, -1.649169921875, -1.1484375, -0.647705078125, -0.14697265625, 0.353759765625, 0.8544921875, 1.355224609375, 1.85595703125, 2.356689453125, 2.857421875, 3.358154296875, 3.85888671875, 4.359619140625, 4.8603515625, 5.361083984375, 5.86181640625, 6.362548828125, 6.86328125, 7.364013671875, 7.86474609375, 8.365478515625, 8.8662109375, 9.366943359375, 9.86767578125, 10.368408203125, 10.869140625, 11.369873046875, 11.87060546875, 12.371337890625, 12.8720703125, 13.372802734375, 13.87353515625, 14.374267578125, 14.875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 88.0, 791.0, 132.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.147857666015625, -21.607765197753906, -19.06767463684082, -16.5275821685791, -13.9874906539917, -11.447399139404297, -8.907306671142578, -6.367216110229492, -3.8271236419677734, -1.287031888961792, 1.2530598640441895, 3.79315185546875, 6.333243370056152, 8.873334884643555, 11.413427352905273, 13.95351791381836, 16.493610382080078, 19.033702850341797, 21.573793411254883, 24.1138858795166, 26.653976440429688, 29.194068908691406, 31.734161376953125, 34.274253845214844, 36.81434631347656, 39.35443878173828, 41.89453125, 44.43462371826172, 46.97471237182617, 49.51480484008789, 52.05489730834961, 54.59498596191406, 57.13507843017578, 59.6751708984375, 62.21526336669922, 64.75535583496094, 67.29544830322266, 69.83554077148438, 72.37562561035156, 74.91571807861328, 77.455810546875, 79.99590301513672, 82.53599548339844, 85.07608795166016, 87.61618041992188, 90.15626525878906, 92.69636535644531, 95.2364501953125, 97.77655029296875, 100.31664276123047, 102.85673522949219, 105.3968276977539, 107.93692016601562, 110.47700500488281, 113.01710510253906, 115.55718994140625, 118.09728240966797, 120.63737487792969, 123.1774673461914, 125.71755981445312, 128.2576446533203, 130.79774475097656, 133.33782958984375, 135.8779296875, 138.4180145263672]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 5.0, 3.0, 5.0, 21.0, 10.0, 7.0, 16.0, 32.0, 20.0, 24.0, 34.0, 34.0, 40.0, 41.0, 44.0, 57.0, 45.0, 48.0, 32.0, 56.0, 46.0, 42.0, 42.0, 42.0, 37.0, 39.0, 31.0, 22.0, 22.0, 21.0, 15.0, 13.0, 9.0, 9.0, 7.0, 4.0, 8.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.396127700805664, -14.830148696899414, -14.264169692993164, -13.698189735412598, -13.132210731506348, -12.566231727600098, -12.000251770019531, -11.434272766113281, -10.868293762207031, -10.302314758300781, -9.736335754394531, -9.170355796813965, -8.604376792907715, -8.038397789001465, -7.472418308258057, -6.906438827514648, -6.340459823608398, -5.774480819702148, -5.20850133895874, -4.642521858215332, -4.076542854309082, -3.510563611984253, -2.944584369659424, -2.3786051273345947, -1.8126258850097656, -1.2466466426849365, -0.6806674003601074, -0.11468815803527832, 0.4512910842895508, 1.0172703266143799, 1.583249568939209, 2.149228811264038, 2.7152099609375, 3.281189203262329, 3.847168445587158, 4.413147926330566, 4.979126930236816, 5.545105934143066, 6.111085414886475, 6.677064895629883, 7.243043899536133, 7.809022903442383, 8.375001907348633, 8.9409818649292, 9.50696086883545, 10.0729398727417, 10.638919830322266, 11.204898834228516, 11.770877838134766, 12.336856842041016, 12.902835845947266, 13.468815803527832, 14.034794807434082, 14.600773811340332, 15.166753768920898, 15.732732772827148, 16.2987117767334, 16.86469078063965, 17.4306697845459, 17.99664878845215, 18.56262969970703, 19.12860870361328, 19.69458770751953, 20.26056671142578, 20.82654571533203]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 18.0, 15.0, 14.0, 20.0, 22.0, 30.0, 31.0, 46.0, 37.0, 35.0, 34.0, 53.0, 51.0, 47.0, 36.0, 31.0, 52.0, 34.0, 34.0, 47.0, 39.0, 36.0, 28.0, 30.0, 28.0, 19.0, 19.0, 13.0, 12.0, 15.0, 12.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.12890625, -3.03179931640625, -2.9346923828125, -2.83758544921875, -2.740478515625, -2.64337158203125, -2.5462646484375, -2.44915771484375, -2.35205078125, -2.25494384765625, -2.1578369140625, -2.06072998046875, -1.963623046875, -1.86651611328125, -1.7694091796875, -1.67230224609375, -1.5751953125, -1.47808837890625, -1.3809814453125, -1.28387451171875, -1.186767578125, -1.08966064453125, -0.9925537109375, -0.89544677734375, -0.79833984375, -0.70123291015625, -0.6041259765625, -0.50701904296875, -0.409912109375, -0.31280517578125, -0.2156982421875, -0.11859130859375, -0.021484375, 0.07562255859375, 0.1727294921875, 0.26983642578125, 0.366943359375, 0.46405029296875, 0.5611572265625, 0.65826416015625, 0.75537109375, 0.85247802734375, 0.9495849609375, 1.04669189453125, 1.143798828125, 1.24090576171875, 1.3380126953125, 1.43511962890625, 1.5322265625, 1.62933349609375, 1.7264404296875, 1.82354736328125, 1.920654296875, 2.01776123046875, 2.1148681640625, 2.21197509765625, 2.30908203125, 2.40618896484375, 2.5032958984375, 2.60040283203125, 2.697509765625, 2.79461669921875, 2.8917236328125, 2.98883056640625, 3.0859375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 5.0, 7.0, 19.0, 22.0, 26.0, 40.0, 50.0, 74.0, 98.0, 113.0, 173.0, 213.0, 292.0, 366.0, 518.0, 841.0, 1391.0, 3111.0, 8229.0, 33605.0, 969166.0, 3073720.0, 79142.0, 13253.0, 4460.0, 1955.0, 1020.0, 658.0, 450.0, 332.0, 235.0, 165.0, 139.0, 100.0, 60.0, 65.0, 39.0, 35.0, 24.0, 14.0, 9.0, 14.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.375, -13.928466796875, -13.48193359375, -13.035400390625, -12.5888671875, -12.142333984375, -11.69580078125, -11.249267578125, -10.802734375, -10.356201171875, -9.90966796875, -9.463134765625, -9.0166015625, -8.570068359375, -8.12353515625, -7.677001953125, -7.23046875, -6.783935546875, -6.33740234375, -5.890869140625, -5.4443359375, -4.997802734375, -4.55126953125, -4.104736328125, -3.658203125, -3.211669921875, -2.76513671875, -2.318603515625, -1.8720703125, -1.425537109375, -0.97900390625, -0.532470703125, -0.0859375, 0.360595703125, 0.80712890625, 1.253662109375, 1.7001953125, 2.146728515625, 2.59326171875, 3.039794921875, 3.486328125, 3.932861328125, 4.37939453125, 4.825927734375, 5.2724609375, 5.718994140625, 6.16552734375, 6.612060546875, 7.05859375, 7.505126953125, 7.95166015625, 8.398193359375, 8.8447265625, 9.291259765625, 9.73779296875, 10.184326171875, 10.630859375, 11.077392578125, 11.52392578125, 11.970458984375, 12.4169921875, 12.863525390625, 13.31005859375, 13.756591796875, 14.203125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 9.0, 11.0, 21.0, 13.0, 31.0, 46.0, 74.0, 143.0, 195.0, 335.0, 581.0, 730.0, 683.0, 442.0, 286.0, 160.0, 112.0, 59.0, 41.0, 31.0, 23.0, 16.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.08966064453125, -5.8629150390625, -5.63616943359375, -5.409423828125, -5.18267822265625, -4.9559326171875, -4.72918701171875, -4.50244140625, -4.27569580078125, -4.0489501953125, -3.82220458984375, -3.595458984375, -3.36871337890625, -3.1419677734375, -2.91522216796875, -2.6884765625, -2.46173095703125, -2.2349853515625, -2.00823974609375, -1.781494140625, -1.55474853515625, -1.3280029296875, -1.10125732421875, -0.87451171875, -0.64776611328125, -0.4210205078125, -0.19427490234375, 0.032470703125, 0.25921630859375, 0.4859619140625, 0.71270751953125, 0.939453125, 1.16619873046875, 1.3929443359375, 1.61968994140625, 1.846435546875, 2.07318115234375, 2.2999267578125, 2.52667236328125, 2.75341796875, 2.98016357421875, 3.2069091796875, 3.43365478515625, 3.660400390625, 3.88714599609375, 4.1138916015625, 4.34063720703125, 4.5673828125, 4.79412841796875, 5.0208740234375, 5.24761962890625, 5.474365234375, 5.70111083984375, 5.9278564453125, 6.15460205078125, 6.38134765625, 6.60809326171875, 6.8348388671875, 7.06158447265625, 7.288330078125, 7.51507568359375, 7.7418212890625, 7.96856689453125, 8.1953125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 26.0, 34.0, 97.0, 227.0, 639.0, 2397.0, 12262.0, 136039.0, 3671862.0, 345138.0, 20665.0, 3483.0, 886.0, 284.0, 121.0, 59.0, 16.0, 12.0, 5.0, 4.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.3397216796875, -13.937255859375, -13.5347900390625, -13.13232421875, -12.7298583984375, -12.327392578125, -11.9249267578125, -11.5224609375, -11.1199951171875, -10.717529296875, -10.3150634765625, -9.91259765625, -9.5101318359375, -9.107666015625, -8.7052001953125, -8.302734375, -7.9002685546875, -7.497802734375, -7.0953369140625, -6.69287109375, -6.2904052734375, -5.887939453125, -5.4854736328125, -5.0830078125, -4.6805419921875, -4.278076171875, -3.8756103515625, -3.47314453125, -3.0706787109375, -2.668212890625, -2.2657470703125, -1.86328125, -1.4608154296875, -1.058349609375, -0.6558837890625, -0.25341796875, 0.1490478515625, 0.551513671875, 0.9539794921875, 1.3564453125, 1.7589111328125, 2.161376953125, 2.5638427734375, 2.96630859375, 3.3687744140625, 3.771240234375, 4.1737060546875, 4.576171875, 4.9786376953125, 5.381103515625, 5.7835693359375, 6.18603515625, 6.5885009765625, 6.990966796875, 7.3934326171875, 7.7958984375, 8.1983642578125, 8.600830078125, 9.0032958984375, 9.40576171875, 9.8082275390625, 10.210693359375, 10.6131591796875, 11.015625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 3.0, 14.0, 20.0, 41.0, 64.0, 88.0, 95.0, 96.0, 124.0, 106.0, 105.0, 82.0, 48.0, 29.0, 33.0, 14.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.936784744262695, -19.583702087402344, -18.230619430541992, -16.87753677368164, -15.524456024169922, -14.17137336730957, -12.818290710449219, -11.465209007263184, -10.112126350402832, -8.75904369354248, -7.405961990356445, -6.052879333496094, -4.6997971534729, -3.346714973449707, -1.9936323165893555, -0.6405506134033203, 0.7125320434570312, 2.0656142234802246, 3.418696641921997, 4.7717790603637695, 6.124861240386963, 7.477943420410156, 8.831026077270508, 10.184107780456543, 11.537190437316895, 12.890273094177246, 14.243354797363281, 15.596437454223633, 16.949520111083984, 18.302600860595703, 19.655685424804688, 21.008766174316406, 22.36185073852539, 23.714933395385742, 25.068016052246094, 26.421096801757812, 27.774179458618164, 29.127262115478516, 30.480344772338867, 31.83342742919922, 33.18650817871094, 34.539588928222656, 35.89267349243164, 37.24575424194336, 38.598838806152344, 39.95191955566406, 41.30500030517578, 42.658084869384766, 44.01116943359375, 45.36425018310547, 46.71733474731445, 48.07041549682617, 49.423500061035156, 50.776580810546875, 52.129661560058594, 53.48274612426758, 54.8358268737793, 56.188907623291016, 57.5419921875, 58.89507293701172, 60.2481575012207, 61.60123825073242, 62.954322814941406, 64.30740356445312, 65.66048431396484]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 11.0, 12.0, 16.0, 17.0, 13.0, 26.0, 16.0, 27.0, 31.0, 34.0, 37.0, 47.0, 41.0, 44.0, 43.0, 43.0, 55.0, 34.0, 48.0, 33.0, 34.0, 40.0, 29.0, 31.0, 37.0, 34.0, 22.0, 16.0, 23.0, 10.0, 10.0, 12.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.79792594909668, -19.13520050048828, -18.47247314453125, -17.80974578857422, -17.14702033996582, -16.484294891357422, -15.82156753540039, -15.158841133117676, -14.496114730834961, -13.833388328552246, -13.170661926269531, -12.507935523986816, -11.845209121704102, -11.182482719421387, -10.519756317138672, -9.857029914855957, -9.194303512573242, -8.531577110290527, -7.8688507080078125, -7.206124305725098, -6.543397903442383, -5.880671501159668, -5.217945098876953, -4.555218696594238, -3.8924922943115234, -3.2297658920288086, -2.5670394897460938, -1.904313087463379, -1.241586685180664, -0.5788602828979492, 0.08386611938476562, 0.7465925216674805, 1.4093189239501953, 2.07204532623291, 2.734771728515625, 3.39749813079834, 4.060224533081055, 4.7229509353637695, 5.385677337646484, 6.048403739929199, 6.711130142211914, 7.373856544494629, 8.036582946777344, 8.699309349060059, 9.362035751342773, 10.024762153625488, 10.687488555908203, 11.350214958190918, 12.012941360473633, 12.675667762756348, 13.338394165039062, 14.001120567321777, 14.663846969604492, 15.326573371887207, 15.989299774169922, 16.652027130126953, 17.31475257873535, 17.97747802734375, 18.64020538330078, 19.302932739257812, 19.96565818786621, 20.62838363647461, 21.29111099243164, 21.953838348388672, 22.61656379699707]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 10.0, 22.0, 20.0, 20.0, 25.0, 26.0, 34.0, 40.0, 29.0, 41.0, 43.0, 51.0, 49.0, 60.0, 56.0, 58.0, 48.0, 43.0, 33.0, 43.0, 33.0, 34.0, 27.0, 21.0, 20.0, 15.0, 18.0, 13.0, 8.0, 9.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.81884765625, -45.2001953125, -43.58154296875, -41.962890625, -40.34423828125, -38.7255859375, -37.10693359375, -35.48828125, -33.86962890625, -32.2509765625, -30.63232421875, -29.013671875, -27.39501953125, -25.7763671875, -24.15771484375, -22.5390625, -20.92041015625, -19.3017578125, -17.68310546875, -16.064453125, -14.44580078125, -12.8271484375, -11.20849609375, -9.58984375, -7.97119140625, -6.3525390625, -4.73388671875, -3.115234375, -1.49658203125, 0.1220703125, 1.74072265625, 3.359375, 4.97802734375, 6.5966796875, 8.21533203125, 9.833984375, 11.45263671875, 13.0712890625, 14.68994140625, 16.30859375, 17.92724609375, 19.5458984375, 21.16455078125, 22.783203125, 24.40185546875, 26.0205078125, 27.63916015625, 29.2578125, 30.87646484375, 32.4951171875, 34.11376953125, 35.732421875, 37.35107421875, 38.9697265625, 40.58837890625, 42.20703125, 43.82568359375, 45.4443359375, 47.06298828125, 48.681640625, 50.30029296875, 51.9189453125, 53.53759765625, 55.15625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 24.0, 32.0, 53.0, 65.0, 103.0, 131.0, 215.0, 332.0, 467.0, 612.0, 926.0, 1371.0, 2107.0, 3306.0, 5035.0, 7847.0, 12210.0, 19513.0, 31071.0, 49947.0, 80042.0, 127820.0, 189079.0, 185208.0, 123221.0, 76773.0, 48549.0, 30078.0, 18694.0, 11881.0, 7554.0, 4762.0, 3141.0, 2128.0, 1383.0, 927.0, 613.0, 410.0, 270.0, 186.0, 149.0, 92.0, 60.0, 46.0, 33.0, 25.0, 15.0, 15.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.409027099609375, -1.36199951171875, -1.314971923828125, -1.2679443359375, -1.220916748046875, -1.17388916015625, -1.126861572265625, -1.079833984375, -1.032806396484375, -0.98577880859375, -0.938751220703125, -0.8917236328125, -0.844696044921875, -0.79766845703125, -0.750640869140625, -0.70361328125, -0.656585693359375, -0.60955810546875, -0.562530517578125, -0.5155029296875, -0.468475341796875, -0.42144775390625, -0.374420166015625, -0.327392578125, -0.280364990234375, -0.23333740234375, -0.186309814453125, -0.1392822265625, -0.092254638671875, -0.04522705078125, 0.001800537109375, 0.048828125, 0.095855712890625, 0.14288330078125, 0.189910888671875, 0.2369384765625, 0.283966064453125, 0.33099365234375, 0.378021240234375, 0.425048828125, 0.472076416015625, 0.51910400390625, 0.566131591796875, 0.6131591796875, 0.660186767578125, 0.70721435546875, 0.754241943359375, 0.80126953125, 0.848297119140625, 0.89532470703125, 0.942352294921875, 0.9893798828125, 1.036407470703125, 1.08343505859375, 1.130462646484375, 1.177490234375, 1.224517822265625, 1.27154541015625, 1.318572998046875, 1.3656005859375, 1.412628173828125, 1.45965576171875, 1.506683349609375, 1.5537109375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 10.0, 13.0, 12.0, 23.0, 16.0, 27.0, 18.0, 24.0, 30.0, 42.0, 40.0, 38.0, 46.0, 36.0, 46.0, 40.0, 1062.0, 46.0, 37.0, 36.0, 37.0, 37.0, 42.0, 26.0, 31.0, 31.0, 22.0, 23.0, 27.0, 15.0, 14.0, 12.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-29.078125, -28.218505859375, -27.35888671875, -26.499267578125, -25.6396484375, -24.780029296875, -23.92041015625, -23.060791015625, -22.201171875, -21.341552734375, -20.48193359375, -19.622314453125, -18.7626953125, -17.903076171875, -17.04345703125, -16.183837890625, -15.32421875, -14.464599609375, -13.60498046875, -12.745361328125, -11.8857421875, -11.026123046875, -10.16650390625, -9.306884765625, -8.447265625, -7.587646484375, -6.72802734375, -5.868408203125, -5.0087890625, -4.149169921875, -3.28955078125, -2.429931640625, -1.5703125, -0.710693359375, 0.14892578125, 1.008544921875, 1.8681640625, 2.727783203125, 3.58740234375, 4.447021484375, 5.306640625, 6.166259765625, 7.02587890625, 7.885498046875, 8.7451171875, 9.604736328125, 10.46435546875, 11.323974609375, 12.18359375, 13.043212890625, 13.90283203125, 14.762451171875, 15.6220703125, 16.481689453125, 17.34130859375, 18.200927734375, 19.060546875, 19.920166015625, 20.77978515625, 21.639404296875, 22.4990234375, 23.358642578125, 24.21826171875, 25.077880859375, 25.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 17.0, 31.0, 41.0, 72.0, 111.0, 174.0, 271.0, 362.0, 574.0, 896.0, 1350.0, 2141.0, 3227.0, 4941.0, 7400.0, 11538.0, 17318.0, 26223.0, 40243.0, 60883.0, 92070.0, 140712.0, 1173072.0, 199507.0, 106519.0, 70916.0, 46974.0, 30595.0, 20261.0, 13395.0, 8761.0, 5805.0, 3790.0, 2330.0, 1548.0, 1067.0, 695.0, 438.0, 304.0, 184.0, 122.0, 70.0, 57.0, 43.0, 20.0, 12.0, 15.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.220703125, -1.1795806884765625, -1.138458251953125, -1.0973358154296875, -1.05621337890625, -1.0150909423828125, -0.973968505859375, -0.9328460693359375, -0.8917236328125, -0.8506011962890625, -0.809478759765625, -0.7683563232421875, -0.72723388671875, -0.6861114501953125, -0.644989013671875, -0.6038665771484375, -0.562744140625, -0.5216217041015625, -0.480499267578125, -0.4393768310546875, -0.39825439453125, -0.3571319580078125, -0.316009521484375, -0.2748870849609375, -0.2337646484375, -0.1926422119140625, -0.151519775390625, -0.1103973388671875, -0.06927490234375, -0.0281524658203125, 0.012969970703125, 0.0540924072265625, 0.09521484375, 0.1363372802734375, 0.177459716796875, 0.2185821533203125, 0.25970458984375, 0.3008270263671875, 0.341949462890625, 0.3830718994140625, 0.4241943359375, 0.4653167724609375, 0.506439208984375, 0.5475616455078125, 0.58868408203125, 0.6298065185546875, 0.670928955078125, 0.7120513916015625, 0.753173828125, 0.7942962646484375, 0.835418701171875, 0.8765411376953125, 0.91766357421875, 0.9587860107421875, 0.999908447265625, 1.0410308837890625, 1.0821533203125, 1.1232757568359375, 1.164398193359375, 1.2055206298828125, 1.24664306640625, 1.2877655029296875, 1.328887939453125, 1.3700103759765625, 1.4111328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 13.0, 10.0, 8.0, 18.0, 12.0, 16.0, 19.0, 19.0, 25.0, 34.0, 27.0, 49.0, 51.0, 42.0, 64.0, 54.0, 50.0, 62.0, 55.0, 48.0, 43.0, 40.0, 30.0, 25.0, 22.0, 26.0, 12.0, 14.0, 13.0, 13.0, 12.0, 10.0, 5.0, 10.0, 6.0, 3.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.027862548828125, -0.027006864547729492, -0.026151180267333984, -0.025295495986938477, -0.02443981170654297, -0.02358412742614746, -0.022728443145751953, -0.021872758865356445, -0.021017074584960938, -0.02016139030456543, -0.019305706024169922, -0.018450021743774414, -0.017594337463378906, -0.0167386531829834, -0.01588296890258789, -0.015027284622192383, -0.014171600341796875, -0.013315916061401367, -0.01246023178100586, -0.011604547500610352, -0.010748863220214844, -0.009893178939819336, -0.009037494659423828, -0.00818181037902832, -0.0073261260986328125, -0.006470441818237305, -0.005614757537841797, -0.004759073257446289, -0.0039033889770507812, -0.0030477046966552734, -0.0021920204162597656, -0.0013363361358642578, -0.00048065185546875, 0.0003750324249267578, 0.0012307167053222656, 0.0020864009857177734, 0.0029420852661132812, 0.003797769546508789, 0.004653453826904297, 0.005509138107299805, 0.0063648223876953125, 0.00722050666809082, 0.008076190948486328, 0.008931875228881836, 0.009787559509277344, 0.010643243789672852, 0.01149892807006836, 0.012354612350463867, 0.013210296630859375, 0.014065980911254883, 0.01492166519165039, 0.0157773494720459, 0.016633033752441406, 0.017488718032836914, 0.018344402313232422, 0.01920008659362793, 0.020055770874023438, 0.020911455154418945, 0.021767139434814453, 0.02262282371520996, 0.02347850799560547, 0.024334192276000977, 0.025189876556396484, 0.026045560836791992, 0.0269012451171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 11.0, 18.0, 29.0, 41.0, 67.0, 78.0, 133.0, 160.0, 286.0, 484.0, 819.0, 1410.0, 2950.0, 6612.0, 16926.0, 52741.0, 200815.0, 475048.0, 205228.0, 54140.0, 17193.0, 6655.0, 3048.0, 1468.0, 818.0, 468.0, 298.0, 182.0, 121.0, 97.0, 48.0, 37.0, 29.0, 25.0, 18.0, 10.0, 7.0, 5.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1968212127685547, -0.19015121459960938, -0.18348121643066406, -0.17681121826171875, -0.17014122009277344, -0.16347122192382812, -0.1568012237548828, -0.1501312255859375, -0.1434612274169922, -0.13679122924804688, -0.13012123107910156, -0.12345123291015625, -0.11678123474121094, -0.11011123657226562, -0.10344123840332031, -0.096771240234375, -0.09010124206542969, -0.08343124389648438, -0.07676124572753906, -0.07009124755859375, -0.06342124938964844, -0.056751251220703125, -0.05008125305175781, -0.0434112548828125, -0.03674125671386719, -0.030071258544921875, -0.023401260375976562, -0.01673126220703125, -0.010061264038085938, -0.003391265869140625, 0.0032787322998046875, 0.00994873046875, 0.016618728637695312, 0.023288726806640625, 0.029958724975585938, 0.03662872314453125, 0.04329872131347656, 0.049968719482421875, 0.05663871765136719, 0.0633087158203125, 0.06997871398925781, 0.07664871215820312, 0.08331871032714844, 0.08998870849609375, 0.09665870666503906, 0.10332870483398438, 0.10999870300292969, 0.116668701171875, 0.12333869934082031, 0.13000869750976562, 0.13667869567871094, 0.14334869384765625, 0.15001869201660156, 0.15668869018554688, 0.1633586883544922, 0.1700286865234375, 0.1766986846923828, 0.18336868286132812, 0.19003868103027344, 0.19670867919921875, 0.20337867736816406, 0.21004867553710938, 0.2167186737060547, 0.223388671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 19.0, 47.0, 81.0, 168.0, 253.0, 201.0, 94.0, 56.0, 31.0, 18.0, 9.0, 9.0, 8.0, 0.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073527030646801, -0.0676354467868805, -0.061743855476379395, -0.055852267891168594, -0.049960680305957794, -0.044069092720746994, -0.038177505135536194, -0.032285917550325394, -0.026394329965114594, -0.020502742379903793, -0.014611154794692993, -0.008719567209482193, -0.002827979624271393, 0.0030636079609394073, 0.008955195546150208, 0.014846783131361008, 0.020738370716571808, 0.026629958301782608, 0.03252154588699341, 0.03841313347220421, 0.04430472105741501, 0.05019630864262581, 0.05608789622783661, 0.06197948381304741, 0.06787107139825821, 0.07376265525817871, 0.07965424656867981, 0.08554583787918091, 0.09143742173910141, 0.09732900559902191, 0.10322059690952301, 0.10911218822002411, 0.11500376462936401, 0.12089535593986511, 0.1267869472503662, 0.13267852365970612, 0.13857011497020721, 0.1444617062807083, 0.15035328269004822, 0.15624487400054932, 0.16213646531105042, 0.1680280566215515, 0.1739196479320526, 0.17981122434139252, 0.18570281565189362, 0.19159440696239471, 0.19748598337173462, 0.20337757468223572, 0.20926916599273682, 0.21516075730323792, 0.221052348613739, 0.22694392502307892, 0.23283551633358002, 0.23872710764408112, 0.24461868405342102, 0.2505102753639221, 0.2564018666744232, 0.2622934579849243, 0.2681850492954254, 0.2740766406059265, 0.2799682021141052, 0.2858597934246063, 0.2917513847351074, 0.2976429760456085, 0.3035345673561096]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 6.0, 8.0, 19.0, 17.0, 17.0, 20.0, 13.0, 28.0, 28.0, 33.0, 27.0, 32.0, 41.0, 32.0, 30.0, 41.0, 31.0, 37.0, 35.0, 50.0, 45.0, 39.0, 30.0, 33.0, 36.0, 28.0, 22.0, 27.0, 18.0, 22.0, 16.0, 21.0, 17.0, 15.0, 8.0, 12.0, 5.0, 14.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04460030794143677, -0.0431242436170578, -0.041648175567388535, -0.04017210751771927, -0.0386960431933403, -0.037219978868961334, -0.03574391081929207, -0.0342678427696228, -0.032791778445243835, -0.03131571412086487, -0.029839646071195602, -0.028363579884171486, -0.02688751369714737, -0.025411447510123253, -0.023935381323099136, -0.02245931513607502, -0.020983248949050903, -0.019507182762026787, -0.01803111657500267, -0.016555050387978554, -0.015078984200954437, -0.01360291801393032, -0.012126851826906204, -0.010650785639882088, -0.009174719452857971, -0.007698653265833855, -0.006222587078809738, -0.004746520891785622, -0.003270454704761505, -0.0017943885177373886, -0.0003183223307132721, 0.0011577438563108444, 0.002633810043334961, 0.0041098762303590775, 0.005585942417383194, 0.0070620086044073105, 0.008538074791431427, 0.010014140978455544, 0.01149020716547966, 0.012966273352503777, 0.014442339539527893, 0.01591840572655201, 0.017394471913576126, 0.018870538100600243, 0.02034660428762436, 0.021822670474648476, 0.023298736661672592, 0.02477480284869671, 0.026250869035720825, 0.02772693522274494, 0.029203001409769058, 0.030679067596793175, 0.03215513378381729, 0.03363119810819626, 0.035107266157865524, 0.03658333420753479, 0.03805939853191376, 0.039535462856292725, 0.04101153090596199, 0.042487598955631256, 0.04396366328001022, 0.04543972760438919, 0.046915795654058456, 0.04839186370372772, 0.04986792802810669]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 10.0, 12.0, 14.0, 9.0, 10.0, 19.0, 23.0, 21.0, 25.0, 30.0, 39.0, 46.0, 41.0, 48.0, 37.0, 48.0, 53.0, 57.0, 45.0, 51.0, 42.0, 36.0, 43.0, 40.0, 32.0, 26.0, 23.0, 29.0, 16.0, 15.0, 7.0, 11.0, 10.0, 10.0, 2.0, 1.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.71875, -46.12744140625, -44.5361328125, -42.94482421875, -41.353515625, -39.76220703125, -38.1708984375, -36.57958984375, -34.98828125, -33.39697265625, -31.8056640625, -30.21435546875, -28.623046875, -27.03173828125, -25.4404296875, -23.84912109375, -22.2578125, -20.66650390625, -19.0751953125, -17.48388671875, -15.892578125, -14.30126953125, -12.7099609375, -11.11865234375, -9.52734375, -7.93603515625, -6.3447265625, -4.75341796875, -3.162109375, -1.57080078125, 0.0205078125, 1.61181640625, 3.203125, 4.79443359375, 6.3857421875, 7.97705078125, 9.568359375, 11.15966796875, 12.7509765625, 14.34228515625, 15.93359375, 17.52490234375, 19.1162109375, 20.70751953125, 22.298828125, 23.89013671875, 25.4814453125, 27.07275390625, 28.6640625, 30.25537109375, 31.8466796875, 33.43798828125, 35.029296875, 36.62060546875, 38.2119140625, 39.80322265625, 41.39453125, 42.98583984375, 44.5771484375, 46.16845703125, 47.759765625, 49.35107421875, 50.9423828125, 52.53369140625, 54.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 16.0, 22.0, 26.0, 25.0, 43.0, 32.0, 67.0, 79.0, 112.0, 190.0, 430.0, 1066.0, 4057.0, 22589.0, 171148.0, 636515.0, 181928.0, 23756.0, 4189.0, 1145.0, 406.0, 202.0, 113.0, 72.0, 60.0, 43.0, 41.0, 29.0, 25.0, 20.0, 20.0, 17.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.98046875, -7.71893310546875, -7.4573974609375, -7.19586181640625, -6.934326171875, -6.67279052734375, -6.4112548828125, -6.14971923828125, -5.88818359375, -5.62664794921875, -5.3651123046875, -5.10357666015625, -4.842041015625, -4.58050537109375, -4.3189697265625, -4.05743408203125, -3.7958984375, -3.53436279296875, -3.2728271484375, -3.01129150390625, -2.749755859375, -2.48822021484375, -2.2266845703125, -1.96514892578125, -1.70361328125, -1.44207763671875, -1.1805419921875, -0.91900634765625, -0.657470703125, -0.39593505859375, -0.1343994140625, 0.12713623046875, 0.388671875, 0.65020751953125, 0.9117431640625, 1.17327880859375, 1.434814453125, 1.69635009765625, 1.9578857421875, 2.21942138671875, 2.48095703125, 2.74249267578125, 3.0040283203125, 3.26556396484375, 3.527099609375, 3.78863525390625, 4.0501708984375, 4.31170654296875, 4.5732421875, 4.83477783203125, 5.0963134765625, 5.35784912109375, 5.619384765625, 5.88092041015625, 6.1424560546875, 6.40399169921875, 6.66552734375, 6.92706298828125, 7.1885986328125, 7.45013427734375, 7.711669921875, 7.97320556640625, 8.2347412109375, 8.49627685546875, 8.7578125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 5.0, 13.0, 15.0, 19.0, 26.0, 44.0, 45.0, 52.0, 49.0, 61.0, 52.0, 75.0, 2117.0, 75.0, 80.0, 66.0, 51.0, 46.0, 33.0, 27.0, 27.0, 15.0, 15.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-105.4375, -102.5517578125, -99.666015625, -96.7802734375, -93.89453125, -91.0087890625, -88.123046875, -85.2373046875, -82.3515625, -79.4658203125, -76.580078125, -73.6943359375, -70.80859375, -67.9228515625, -65.037109375, -62.1513671875, -59.265625, -56.3798828125, -53.494140625, -50.6083984375, -47.72265625, -44.8369140625, -41.951171875, -39.0654296875, -36.1796875, -33.2939453125, -30.408203125, -27.5224609375, -24.63671875, -21.7509765625, -18.865234375, -15.9794921875, -13.09375, -10.2080078125, -7.322265625, -4.4365234375, -1.55078125, 1.3349609375, 4.220703125, 7.1064453125, 9.9921875, 12.8779296875, 15.763671875, 18.6494140625, 21.53515625, 24.4208984375, 27.306640625, 30.1923828125, 33.078125, 35.9638671875, 38.849609375, 41.7353515625, 44.62109375, 47.5068359375, 50.392578125, 53.2783203125, 56.1640625, 59.0498046875, 61.935546875, 64.8212890625, 67.70703125, 70.5927734375, 73.478515625, 76.3642578125, 79.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 19.0, 34.0, 43.0, 46.0, 92.0, 162.0, 315.0, 446.0, 877.0, 1976.0, 5950.0, 29657.0, 228575.0, 2731176.0, 121407.0, 17484.0, 4072.0, 1487.0, 761.0, 407.0, 247.0, 143.0, 90.0, 63.0, 34.0, 35.0, 14.0, 13.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40264892578125, -6.1685791015625, -5.93450927734375, -5.700439453125, -5.46636962890625, -5.2322998046875, -4.99822998046875, -4.76416015625, -4.53009033203125, -4.2960205078125, -4.06195068359375, -3.827880859375, -3.59381103515625, -3.3597412109375, -3.12567138671875, -2.8916015625, -2.65753173828125, -2.4234619140625, -2.18939208984375, -1.955322265625, -1.72125244140625, -1.4871826171875, -1.25311279296875, -1.01904296875, -0.78497314453125, -0.5509033203125, -0.31683349609375, -0.082763671875, 0.15130615234375, 0.3853759765625, 0.61944580078125, 0.853515625, 1.08758544921875, 1.3216552734375, 1.55572509765625, 1.789794921875, 2.02386474609375, 2.2579345703125, 2.49200439453125, 2.72607421875, 2.96014404296875, 3.1942138671875, 3.42828369140625, 3.662353515625, 3.89642333984375, 4.1304931640625, 4.36456298828125, 4.5986328125, 4.83270263671875, 5.0667724609375, 5.30084228515625, 5.534912109375, 5.76898193359375, 6.0030517578125, 6.23712158203125, 6.47119140625, 6.70526123046875, 6.9393310546875, 7.17340087890625, 7.407470703125, 7.64154052734375, 7.8756103515625, 8.10968017578125, 8.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 34.0, 96.0, 342.0, 331.0, 102.0, 39.0, 23.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.48118591308594, -124.69154357910156, -116.90190124511719, -109.11225891113281, -101.32261657714844, -93.53297424316406, -85.74333190917969, -77.95368957519531, -70.16404724121094, -62.37440490722656, -54.58476257324219, -46.79512023925781, -39.00547790527344, -31.215835571289062, -23.426193237304688, -15.636550903320312, -7.8469085693359375, -0.0572662353515625, 7.7323760986328125, 15.522018432617188, 23.311660766601562, 31.101303100585938, 38.89094543457031, 46.68058776855469, 54.47023010253906, 62.25987243652344, 70.04951477050781, 77.83915710449219, 85.62879943847656, 93.41844177246094, 101.20808410644531, 108.99772644042969, 116.787353515625, 124.57699584960938, 132.36663818359375, 140.15628051757812, 147.9459228515625, 155.73556518554688, 163.52520751953125, 171.31484985351562, 179.1044921875, 186.89413452148438, 194.68377685546875, 202.47341918945312, 210.2630615234375, 218.05270385742188, 225.84234619140625, 233.63198852539062, 241.421630859375, 249.21127319335938, 257.00091552734375, 264.7905578613281, 272.5802001953125, 280.3698425292969, 288.15948486328125, 295.9491271972656, 303.73876953125, 311.5284118652344, 319.31805419921875, 327.1076965332031, 334.8973388671875, 342.6869812011719, 350.47662353515625, 358.2662658691406, 366.055908203125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 11.0, 12.0, 12.0, 14.0, 16.0, 23.0, 25.0, 28.0, 26.0, 36.0, 46.0, 37.0, 47.0, 46.0, 46.0, 52.0, 48.0, 31.0, 42.0, 33.0, 26.0, 44.0, 40.0, 29.0, 25.0, 23.0, 24.0, 15.0, 22.0, 26.0, 10.0, 11.0, 6.0, 11.0, 9.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.71125030517578, -78.79401397705078, -75.87677001953125, -72.95953369140625, -70.04229736328125, -67.12506103515625, -64.20781707763672, -61.29058074951172, -58.37334442138672, -55.45610427856445, -52.53886795043945, -49.62162780761719, -46.70439147949219, -43.78715133666992, -40.869911193847656, -37.952674865722656, -35.03543472290039, -32.118194580078125, -29.200958251953125, -26.28371810913086, -23.36648178100586, -20.449241638183594, -17.53200340270996, -14.614765167236328, -11.697526931762695, -8.780288696289062, -5.8630499839782715, -2.9458112716674805, -0.028573036193847656, 2.888665199279785, 5.805904388427734, 8.723142623901367, 11.640380859375, 14.557619094848633, 17.474857330322266, 20.39209747314453, 23.30933380126953, 26.226573944091797, 29.14381217956543, 32.06105041503906, 34.97828674316406, 37.89552688598633, 40.81276321411133, 43.730003356933594, 46.647239685058594, 49.56447982788086, 52.481719970703125, 55.398956298828125, 58.31619644165039, 61.233436584472656, 64.15067291259766, 67.06790924072266, 69.98515319824219, 72.90238952636719, 75.81962585449219, 78.73686218261719, 81.65410614013672, 84.57134246826172, 87.48858642578125, 90.40582275390625, 93.32305908203125, 96.24029541015625, 99.15753936767578, 102.07477569580078, 104.99201202392578]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 9.0, 13.0, 20.0, 16.0, 15.0, 22.0, 35.0, 43.0, 56.0, 78.0, 103.0, 127.0, 185.0, 285.0, 475.0, 731.0, 1338.0, 3104.0, 1025392.0, 11026.0, 2426.0, 1023.0, 634.0, 398.0, 293.0, 168.0, 126.0, 85.0, 65.0, 48.0, 53.0, 32.0, 27.0, 21.0, 23.0, 14.0, 12.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.460712432861328, -25.603782653808594, -24.74685287475586, -23.889923095703125, -23.032995223999023, -22.17606544494629, -21.319135665893555, -20.46220588684082, -19.60527801513672, -18.748348236083984, -17.89141845703125, -17.034488677978516, -16.177560806274414, -15.32063102722168, -14.463701248168945, -13.606771469116211, -12.749841690063477, -11.892911911010742, -11.035983085632324, -10.17905330657959, -9.322124481201172, -8.465194702148438, -7.608264923095703, -6.751335620880127, -5.894406318664551, -5.037477016448975, -4.180547714233398, -3.323617935180664, -2.466688632965088, -1.6097593307495117, -0.7528295516967773, 0.10409975051879883, 0.9610271453857422, 1.817956566810608, 2.6748859882354736, 3.531815528869629, 4.388744831085205, 5.245674133300781, 6.102603912353516, 6.959533214569092, 7.816462516784668, 8.673392295837402, 9.53032112121582, 10.387250900268555, 11.244180679321289, 12.101109504699707, 12.958039283752441, 13.81496810913086, 14.671897888183594, 15.528827667236328, 16.385757446289062, 17.242687225341797, 18.0996150970459, 18.956544876098633, 19.813474655151367, 20.6704044342041, 21.527332305908203, 22.384262084960938, 23.241191864013672, 24.098121643066406, 24.955049514770508, 25.811979293823242, 26.668909072875977, 27.52583885192871, 28.382768630981445]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 39.0, 596.0, 51462116.0, 354.0, 23.0, 9.0, 0.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3868.11083984375, -3772.389892578125, -3676.668701171875, -3580.94775390625, -3485.226806640625, -3389.505859375, -3293.78466796875, -3198.063720703125, -3102.3427734375, -3006.621826171875, -2910.900634765625, -2815.1796875, -2719.458740234375, -2623.73779296875, -2528.0166015625, -2432.295654296875, -2336.574462890625, -2240.853515625, -2145.13232421875, -2049.411376953125, -1953.6904296875, -1857.9693603515625, -1762.248291015625, -1666.52734375, -1570.8062744140625, -1475.085205078125, -1379.3642578125, -1283.6431884765625, -1187.922119140625, -1092.201171875, -996.4801025390625, -900.7590942382812, -805.037841796875, -709.3168334960938, -613.5958251953125, -517.874755859375, -422.15374755859375, -326.4327392578125, -230.711669921875, -134.99066162109375, -39.2696533203125, 56.45137023925781, 152.17239379882812, 247.8934326171875, 343.61444091796875, 439.33544921875, 535.0565185546875, 630.7775268554688, 726.49853515625, 822.2195434570312, 917.9405517578125, 1013.66162109375, 1109.382568359375, 1205.1036376953125, 1300.82470703125, 1396.545654296875, 1492.2667236328125, 1587.98779296875, 1683.708740234375, 1779.4298095703125, 1875.15087890625, 1970.871826171875, 2066.5927734375, 2162.31396484375, 2258.034912109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 21.0, 36.0, 50.0, 81.0, 133.0, 181.0, 272.0, 431.0, 680.0, 1070.0, 1775.0, 2839.0, 4880.0, 8802.0, 15621.0, 29268.0, 58469.0, 125211.0, 297986.0, 919622.0, 3504103.0, 808701.0, 275663.0, 117125.0, 54991.0, 27986.0, 14940.0, 8423.0, 4700.0, 2698.0, 1703.0, 1092.0, 639.0, 429.0, 236.0, 182.0, 113.0, 77.0, 58.0, 28.0, 24.0, 17.0, 14.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.265625, -15.71337890625, -15.1611328125, -14.60888671875, -14.056640625, -13.50439453125, -12.9521484375, -12.39990234375, -11.84765625, -11.29541015625, -10.7431640625, -10.19091796875, -9.638671875, -9.08642578125, -8.5341796875, -7.98193359375, -7.4296875, -6.87744140625, -6.3251953125, -5.77294921875, -5.220703125, -4.66845703125, -4.1162109375, -3.56396484375, -3.01171875, -2.45947265625, -1.9072265625, -1.35498046875, -0.802734375, -0.25048828125, 0.3017578125, 0.85400390625, 1.40625, 1.95849609375, 2.5107421875, 3.06298828125, 3.615234375, 4.16748046875, 4.7197265625, 5.27197265625, 5.82421875, 6.37646484375, 6.9287109375, 7.48095703125, 8.033203125, 8.58544921875, 9.1376953125, 9.68994140625, 10.2421875, 10.79443359375, 11.3466796875, 11.89892578125, 12.451171875, 13.00341796875, 13.5556640625, 14.10791015625, 14.66015625, 15.21240234375, 15.7646484375, 16.31689453125, 16.869140625, 17.42138671875, 17.9736328125, 18.52587890625, 19.078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 10.0, 5.0, 12.0, 21.0, 18.0, 11.0, 20.0, 18.0, 32.0, 34.0, 21.0, 25.0, 31.0, 39.0, 45.0, 72.0, 130.0, 296.0, 459.0, 207.0, 93.0, 58.0, 42.0, 38.0, 32.0, 40.0, 34.0, 28.0, 20.0, 19.0, 23.0, 18.0, 13.0, 12.0, 9.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.625, -21.96484375, -21.3046875, -20.64453125, -19.984375, -19.32421875, -18.6640625, -18.00390625, -17.34375, -16.68359375, -16.0234375, -15.36328125, -14.703125, -14.04296875, -13.3828125, -12.72265625, -12.0625, -11.40234375, -10.7421875, -10.08203125, -9.421875, -8.76171875, -8.1015625, -7.44140625, -6.78125, -6.12109375, -5.4609375, -4.80078125, -4.140625, -3.48046875, -2.8203125, -2.16015625, -1.5, -0.83984375, -0.1796875, 0.48046875, 1.140625, 1.80078125, 2.4609375, 3.12109375, 3.78125, 4.44140625, 5.1015625, 5.76171875, 6.421875, 7.08203125, 7.7421875, 8.40234375, 9.0625, 9.72265625, 10.3828125, 11.04296875, 11.703125, 12.36328125, 13.0234375, 13.68359375, 14.34375, 15.00390625, 15.6640625, 16.32421875, 16.984375, 17.64453125, 18.3046875, 18.96484375, 19.625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 13.0, 26.0, 36.0, 55.0, 73.0, 93.0, 146.0, 207.0, 327.0, 408.0, 621.0, 870.0, 1382.0, 2039.0, 3249.0, 4947.0, 7784.0, 12736.0, 20596.0, 34537.0, 58981.0, 100216.0, 173628.0, 296755.0, 556631.0, 2300921.0, 1597311.0, 475200.0, 264279.0, 153846.0, 89678.0, 52171.0, 31039.0, 18677.0, 11342.0, 7031.0, 4501.0, 2861.0, 1966.0, 1322.0, 896.0, 615.0, 419.0, 307.0, 213.0, 148.0, 96.0, 91.0, 52.0, 37.0, 20.0, 17.0, 3.0, 8.0, 5.0, 1.0, 4.0], "bins": [-7.18359375, -6.96514892578125, -6.7467041015625, -6.52825927734375, -6.309814453125, -6.09136962890625, -5.8729248046875, -5.65447998046875, -5.43603515625, -5.21759033203125, -4.9991455078125, -4.78070068359375, -4.562255859375, -4.34381103515625, -4.1253662109375, -3.90692138671875, -3.6884765625, -3.47003173828125, -3.2515869140625, -3.03314208984375, -2.814697265625, -2.59625244140625, -2.3778076171875, -2.15936279296875, -1.94091796875, -1.72247314453125, -1.5040283203125, -1.28558349609375, -1.067138671875, -0.84869384765625, -0.6302490234375, -0.41180419921875, -0.193359375, 0.02508544921875, 0.2435302734375, 0.46197509765625, 0.680419921875, 0.89886474609375, 1.1173095703125, 1.33575439453125, 1.55419921875, 1.77264404296875, 1.9910888671875, 2.20953369140625, 2.427978515625, 2.64642333984375, 2.8648681640625, 3.08331298828125, 3.3017578125, 3.52020263671875, 3.7386474609375, 3.95709228515625, 4.175537109375, 4.39398193359375, 4.6124267578125, 4.83087158203125, 5.04931640625, 5.26776123046875, 5.4862060546875, 5.70465087890625, 5.923095703125, 6.14154052734375, 6.3599853515625, 6.57843017578125, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 8.0, 5.0, 19.0, 21.0, 22.0, 29.0, 24.0, 35.0, 34.0, 45.0, 36.0, 55.0, 68.0, 174.0, 542.0, 351.0, 114.0, 60.0, 50.0, 38.0, 36.0, 34.0, 35.0, 34.0, 25.0, 28.0, 16.0, 14.0, 15.0, 13.0, 5.0, 3.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.24853515625, -35.9970703125, -34.74560546875, -33.494140625, -32.24267578125, -30.9912109375, -29.73974609375, -28.48828125, -27.23681640625, -25.9853515625, -24.73388671875, -23.482421875, -22.23095703125, -20.9794921875, -19.72802734375, -18.4765625, -17.22509765625, -15.9736328125, -14.72216796875, -13.470703125, -12.21923828125, -10.9677734375, -9.71630859375, -8.46484375, -7.21337890625, -5.9619140625, -4.71044921875, -3.458984375, -2.20751953125, -0.9560546875, 0.29541015625, 1.546875, 2.79833984375, 4.0498046875, 5.30126953125, 6.552734375, 7.80419921875, 9.0556640625, 10.30712890625, 11.55859375, 12.81005859375, 14.0615234375, 15.31298828125, 16.564453125, 17.81591796875, 19.0673828125, 20.31884765625, 21.5703125, 22.82177734375, 24.0732421875, 25.32470703125, 26.576171875, 27.82763671875, 29.0791015625, 30.33056640625, 31.58203125, 32.83349609375, 34.0849609375, 35.33642578125, 36.587890625, 37.83935546875, 39.0908203125, 40.34228515625, 41.59375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 14.0, 16.0, 12.0, 35.0, 48.0, 81.0, 108.0, 126.0, 190.0, 258.0, 377.0, 542.0, 773.0, 1241.0, 1934.0, 3044.0, 5519.0, 11276.0, 26282.0, 67939.0, 227579.0, 5735172.0, 126301.0, 44862.0, 17998.0, 8226.0, 4295.0, 2454.0, 1506.0, 989.0, 651.0, 469.0, 312.0, 212.0, 177.0, 110.0, 83.0, 43.0, 42.0, 26.0, 26.0, 18.0, 14.0, 8.0, 4.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0], "bins": [-39.90625, -38.67041015625, -37.4345703125, -36.19873046875, -34.962890625, -33.72705078125, -32.4912109375, -31.25537109375, -30.01953125, -28.78369140625, -27.5478515625, -26.31201171875, -25.076171875, -23.84033203125, -22.6044921875, -21.36865234375, -20.1328125, -18.89697265625, -17.6611328125, -16.42529296875, -15.189453125, -13.95361328125, -12.7177734375, -11.48193359375, -10.24609375, -9.01025390625, -7.7744140625, -6.53857421875, -5.302734375, -4.06689453125, -2.8310546875, -1.59521484375, -0.359375, 0.87646484375, 2.1123046875, 3.34814453125, 4.583984375, 5.81982421875, 7.0556640625, 8.29150390625, 9.52734375, 10.76318359375, 11.9990234375, 13.23486328125, 14.470703125, 15.70654296875, 16.9423828125, 18.17822265625, 19.4140625, 20.64990234375, 21.8857421875, 23.12158203125, 24.357421875, 25.59326171875, 26.8291015625, 28.06494140625, 29.30078125, 30.53662109375, 31.7724609375, 33.00830078125, 34.244140625, 35.47998046875, 36.7158203125, 37.95166015625, 39.1875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 7.0, 4.0, 4.0, 6.0, 10.0, 8.0, 18.0, 6.0, 19.0, 14.0, 16.0, 17.0, 29.0, 31.0, 39.0, 28.0, 32.0, 27.0, 33.0, 56.0, 119.0, 703.0, 291.0, 81.0, 36.0, 31.0, 36.0, 40.0, 28.0, 26.0, 26.0, 20.0, 22.0, 22.0, 25.0, 19.0, 8.0, 9.0, 23.0, 11.0, 9.0, 9.0, 5.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3388671875, -60.240234375, -58.1416015625, -56.04296875, -53.9443359375, -51.845703125, -49.7470703125, -47.6484375, -45.5498046875, -43.451171875, -41.3525390625, -39.25390625, -37.1552734375, -35.056640625, -32.9580078125, -30.859375, -28.7607421875, -26.662109375, -24.5634765625, -22.46484375, -20.3662109375, -18.267578125, -16.1689453125, -14.0703125, -11.9716796875, -9.873046875, -7.7744140625, -5.67578125, -3.5771484375, -1.478515625, 0.6201171875, 2.71875, 4.8173828125, 6.916015625, 9.0146484375, 11.11328125, 13.2119140625, 15.310546875, 17.4091796875, 19.5078125, 21.6064453125, 23.705078125, 25.8037109375, 27.90234375, 30.0009765625, 32.099609375, 34.1982421875, 36.296875, 38.3955078125, 40.494140625, 42.5927734375, 44.69140625, 46.7900390625, 48.888671875, 50.9873046875, 53.0859375, 55.1845703125, 57.283203125, 59.3818359375, 61.48046875, 63.5791015625, 65.677734375, 67.7763671875, 69.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 35.0, 461.0, 433.0, 29.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.9376831054688, -490.0948486328125, -461.25201416015625, -432.4091796875, -403.56634521484375, -374.7235107421875, -345.8807067871094, -317.0378723144531, -288.1950378417969, -259.3522033691406, -230.50936889648438, -201.6665496826172, -172.82371520996094, -143.9808807373047, -115.1380615234375, -86.29522705078125, -57.452392578125, -28.609561920166016, 0.23326873779296875, 29.076095581054688, 57.91893005371094, 86.76176452636719, 115.60458374023438, 144.44741821289062, 173.29025268554688, 202.13308715820312, 230.97592163085938, 259.8187255859375, 288.66156005859375, 317.50439453125, 346.34722900390625, 375.1900634765625, 404.0328369140625, 432.87567138671875, 461.718505859375, 490.56134033203125, 519.4041748046875, 548.2470092773438, 577.08984375, 605.9326171875, 634.7755126953125, 663.6183471679688, 692.461181640625, 721.3040161132812, 750.1468505859375, 778.9896850585938, 807.83251953125, 836.67529296875, 865.5181274414062, 894.3609619140625, 923.2037963867188, 952.046630859375, 980.8894653320312, 1009.7322998046875, 1038.5750732421875, 1067.41796875, 1096.2607421875, 1125.103515625, 1153.9464111328125, 1182.7891845703125, 1211.632080078125, 1240.474853515625, 1269.3177490234375, 1298.1605224609375, 1327.00341796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 8.0, 12.0, 15.0, 17.0, 18.0, 24.0, 71.0, 425.0, 234.0, 37.0, 24.0, 14.0, 20.0, 10.0, 7.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-519.654296875, -503.79681396484375, -487.9393310546875, -472.08184814453125, -456.224365234375, -440.36688232421875, -424.5093994140625, -408.65191650390625, -392.79443359375, -376.93695068359375, -361.0794677734375, -345.22198486328125, -329.364501953125, -313.50701904296875, -297.6495361328125, -281.79205322265625, -265.9345703125, -250.07708740234375, -234.2196044921875, -218.36212158203125, -202.504638671875, -186.64715576171875, -170.7896728515625, -154.93218994140625, -139.07467651367188, -123.21719360351562, -107.35971069335938, -91.50222778320312, -75.64474487304688, -59.787254333496094, -43.929771423339844, -28.072288513183594, -12.214813232421875, 3.6426706314086914, 19.500154495239258, 35.35763931274414, 51.21512222290039, 67.0726089477539, 82.93009185791016, 98.7875747680664, 114.64505767822266, 130.50254821777344, 146.3600311279297, 162.21751403808594, 178.0749969482422, 193.93247985839844, 209.7899627685547, 225.64744567871094, 241.5049285888672, 257.3624267578125, 273.21990966796875, 289.077392578125, 304.93487548828125, 320.7923583984375, 336.64984130859375, 352.50732421875, 368.36480712890625, 384.2222900390625, 400.07977294921875, 415.937255859375, 431.79473876953125, 447.6522216796875, 463.50970458984375, 479.3671875, 495.22467041015625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 16.0, 14.0, 18.0, 38.0, 52.0, 74.0, 98.0, 163.0, 242.0, 392.0, 673.0, 1194.0, 2144.0, 4426.0, 11405.0, 63006.0, 4059775.0, 33895.0, 8474.0, 3643.0, 1737.0, 1028.0, 602.0, 414.0, 259.0, 146.0, 94.0, 74.0, 55.0, 34.0, 35.0, 19.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8590087890625, -2.764892578125, -2.6707763671875, -2.57666015625, -2.4825439453125, -2.388427734375, -2.2943115234375, -2.2001953125, -2.1060791015625, -2.011962890625, -1.9178466796875, -1.82373046875, -1.7296142578125, -1.635498046875, -1.5413818359375, -1.447265625, -1.3531494140625, -1.259033203125, -1.1649169921875, -1.07080078125, -0.9766845703125, -0.882568359375, -0.7884521484375, -0.6943359375, -0.6002197265625, -0.506103515625, -0.4119873046875, -0.31787109375, -0.2237548828125, -0.129638671875, -0.0355224609375, 0.05859375, 0.1527099609375, 0.246826171875, 0.3409423828125, 0.43505859375, 0.5291748046875, 0.623291015625, 0.7174072265625, 0.8115234375, 0.9056396484375, 0.999755859375, 1.0938720703125, 1.18798828125, 1.2821044921875, 1.376220703125, 1.4703369140625, 1.564453125, 1.6585693359375, 1.752685546875, 1.8468017578125, 1.94091796875, 2.0350341796875, 2.129150390625, 2.2232666015625, 2.3173828125, 2.4114990234375, 2.505615234375, 2.5997314453125, 2.69384765625, 2.7879638671875, 2.882080078125, 2.9761962890625, 3.0703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 9.0, 12.0, 13.0, 12.0, 17.0, 113.0, 649.0, 35.0, 14.0, 10.0, 9.0, 5.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8466796875, -0.814453125, -0.7822265625, -0.75, -0.7177734375, -0.685546875, -0.6533203125, -0.62109375, -0.5888671875, -0.556640625, -0.5244140625, -0.4921875, -0.4599609375, -0.427734375, -0.3955078125, -0.36328125, -0.3310546875, -0.298828125, -0.2666015625, -0.234375, -0.2021484375, -0.169921875, -0.1376953125, -0.10546875, -0.0732421875, -0.041015625, -0.0087890625, 0.0234375, 0.0556640625, 0.087890625, 0.1201171875, 0.15234375, 0.1845703125, 0.216796875, 0.2490234375, 0.28125, 0.3134765625, 0.345703125, 0.3779296875, 0.41015625, 0.4423828125, 0.474609375, 0.5068359375, 0.5390625, 0.5712890625, 0.603515625, 0.6357421875, 0.66796875, 0.7001953125, 0.732421875, 0.7646484375, 0.796875, 0.8291015625, 0.861328125, 0.8935546875, 0.92578125, 0.9580078125, 0.990234375, 1.0224609375, 1.0546875, 1.0869140625, 1.119140625, 1.1513671875, 1.18359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 17.0, 24.0, 18.0, 28.0, 46.0, 71.0, 128.0, 214.0, 381.0, 684.0, 1344.0, 2533.0, 5148.0, 11090.0, 28513.0, 101133.0, 3090342.0, 831353.0, 77627.0, 23925.0, 9816.0, 4644.0, 2338.0, 1192.0, 689.0, 359.0, 222.0, 128.0, 80.0, 61.0, 40.0, 19.0, 12.0, 10.0, 11.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.816009521484375, -2.72186279296875, -2.627716064453125, -2.5335693359375, -2.439422607421875, -2.34527587890625, -2.251129150390625, -2.156982421875, -2.062835693359375, -1.96868896484375, -1.874542236328125, -1.7803955078125, -1.686248779296875, -1.59210205078125, -1.497955322265625, -1.40380859375, -1.309661865234375, -1.21551513671875, -1.121368408203125, -1.0272216796875, -0.933074951171875, -0.83892822265625, -0.744781494140625, -0.650634765625, -0.556488037109375, -0.46234130859375, -0.368194580078125, -0.2740478515625, -0.179901123046875, -0.08575439453125, 0.008392333984375, 0.1025390625, 0.196685791015625, 0.29083251953125, 0.384979248046875, 0.4791259765625, 0.573272705078125, 0.66741943359375, 0.761566162109375, 0.855712890625, 0.949859619140625, 1.04400634765625, 1.138153076171875, 1.2322998046875, 1.326446533203125, 1.42059326171875, 1.514739990234375, 1.60888671875, 1.703033447265625, 1.79718017578125, 1.891326904296875, 1.9854736328125, 2.079620361328125, 2.17376708984375, 2.267913818359375, 2.362060546875, 2.456207275390625, 2.55035400390625, 2.644500732421875, 2.7386474609375, 2.832794189453125, 2.92694091796875, 3.021087646484375, 3.115234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 9.0, 6.0, 9.0, 14.0, 19.0, 25.0, 35.0, 34.0, 56.0, 84.0, 115.0, 229.0, 802.0, 1739.0, 337.0, 154.0, 101.0, 67.0, 40.0, 34.0, 23.0, 27.0, 15.0, 11.0, 14.0, 12.0, 5.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.896484375, -0.8677520751953125, -0.839019775390625, -0.8102874755859375, -0.78155517578125, -0.7528228759765625, -0.724090576171875, -0.6953582763671875, -0.6666259765625, -0.6378936767578125, -0.609161376953125, -0.5804290771484375, -0.55169677734375, -0.5229644775390625, -0.494232177734375, -0.4654998779296875, -0.436767578125, -0.4080352783203125, -0.379302978515625, -0.3505706787109375, -0.32183837890625, -0.2931060791015625, -0.264373779296875, -0.2356414794921875, -0.2069091796875, -0.1781768798828125, -0.149444580078125, -0.1207122802734375, -0.09197998046875, -0.0632476806640625, -0.034515380859375, -0.0057830810546875, 0.02294921875, 0.0516815185546875, 0.080413818359375, 0.1091461181640625, 0.13787841796875, 0.1666107177734375, 0.195343017578125, 0.2240753173828125, 0.2528076171875, 0.2815399169921875, 0.310272216796875, 0.3390045166015625, 0.36773681640625, 0.3964691162109375, 0.425201416015625, 0.4539337158203125, 0.482666015625, 0.5113983154296875, 0.540130615234375, 0.5688629150390625, 0.59759521484375, 0.6263275146484375, 0.655059814453125, 0.6837921142578125, 0.7125244140625, 0.7412567138671875, 0.769989013671875, 0.7987213134765625, 0.82745361328125, 0.8561859130859375, 0.884918212890625, 0.9136505126953125, 0.9423828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 12.0, 114.0, 493.0, 328.0, 40.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.387290000915527, -10.665428161621094, -9.943567276000977, -9.221705436706543, -8.49984359741211, -7.777982711791992, -7.056120872497559, -6.334259510040283, -5.612398147583008, -4.890536785125732, -4.168675422668457, -3.4468135833740234, -2.724952220916748, -2.0030908584594727, -1.281229019165039, -0.5593676567077637, 0.16249370574951172, 0.8843551874160767, 1.6062166690826416, 2.328078269958496, 3.0499396324157715, 3.771800994873047, 4.4936628341674805, 5.215524196624756, 5.937385559082031, 6.659246921539307, 7.381108283996582, 8.102970123291016, 8.824831008911133, 9.546692848205566, 10.2685546875, 10.990415573120117, 11.712276458740234, 12.434138298034668, 13.155999183654785, 13.877861022949219, 14.599721908569336, 15.32158374786377, 16.043445587158203, 16.76530647277832, 17.487167358398438, 18.209028244018555, 18.930891036987305, 19.652751922607422, 20.37461280822754, 21.096473693847656, 21.818336486816406, 22.540197372436523, 23.262060165405273, 23.98392105102539, 24.70578384399414, 25.427644729614258, 26.149505615234375, 26.871368408203125, 27.593229293823242, 28.31509017944336, 29.03695297241211, 29.758813858032227, 30.480676651000977, 31.202537536621094, 31.92439842224121, 32.64625930786133, 33.36812210083008, 34.08998489379883, 34.81184387207031]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 3.0, 9.0, 5.0, 6.0, 16.0, 17.0, 20.0, 24.0, 29.0, 35.0, 62.0, 51.0, 49.0, 30.0, 51.0, 59.0, 60.0, 54.0, 53.0, 56.0, 52.0, 42.0, 31.0, 44.0, 39.0, 22.0, 21.0, 16.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.881981134414673, -2.762664556503296, -2.643348217010498, -2.524031639099121, -2.4047152996063232, -2.2853987216949463, -2.1660823822021484, -2.0467658042907715, -1.927449345588684, -1.8081328868865967, -1.6888164281845093, -1.5694999694824219, -1.450183391571045, -1.330867052078247, -1.2115504741668701, -1.0922340154647827, -0.9729175567626953, -0.8536010980606079, -0.7342846393585205, -0.6149681210517883, -0.4956516623497009, -0.3763352036476135, -0.25701868534088135, -0.13770222663879395, -0.018385767936706543, 0.10093070566654205, 0.22024717926979065, 0.33956366777420044, 0.45888012647628784, 0.5781965851783752, 0.6975131034851074, 0.8168295621871948, 0.9361462593078613, 1.0554627180099487, 1.1747791767120361, 1.294095754623413, 1.413412094116211, 1.532728672027588, 1.6520451307296753, 1.7713615894317627, 1.89067804813385, 2.0099945068359375, 2.1293110847473145, 2.2486274242401123, 2.3679440021514893, 2.487260341644287, 2.606576919555664, 2.725893497467041, 2.845209836959839, 2.964526414871216, 3.0838427543640137, 3.2031593322753906, 3.3224756717681885, 3.4417922496795654, 3.5611085891723633, 3.6804251670837402, 3.799741744995117, 3.919058322906494, 4.038374900817871, 4.15769100189209, 4.277007579803467, 4.396324157714844, 4.515640735626221, 4.634957313537598, 4.754273414611816]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 11.0, 12.0, 15.0, 25.0, 36.0, 44.0, 87.0, 96.0, 146.0, 213.0, 347.0, 496.0, 746.0, 1116.0, 1710.0, 2821.0, 4319.0, 7288.0, 12899.0, 25208.0, 72145.0, 835237.0, 39005.0, 18473.0, 10201.0, 5763.0, 3567.0, 2166.0, 1491.0, 973.0, 566.0, 424.0, 330.0, 199.0, 123.0, 76.0, 61.0, 44.0, 29.0, 17.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.591796875, -2.52227783203125, -2.4527587890625, -2.38323974609375, -2.313720703125, -2.24420166015625, -2.1746826171875, -2.10516357421875, -2.03564453125, -1.96612548828125, -1.8966064453125, -1.82708740234375, -1.757568359375, -1.68804931640625, -1.6185302734375, -1.54901123046875, -1.4794921875, -1.40997314453125, -1.3404541015625, -1.27093505859375, -1.201416015625, -1.13189697265625, -1.0623779296875, -0.99285888671875, -0.92333984375, -0.85382080078125, -0.7843017578125, -0.71478271484375, -0.645263671875, -0.57574462890625, -0.5062255859375, -0.43670654296875, -0.3671875, -0.29766845703125, -0.2281494140625, -0.15863037109375, -0.089111328125, -0.01959228515625, 0.0499267578125, 0.11944580078125, 0.18896484375, 0.25848388671875, 0.3280029296875, 0.39752197265625, 0.467041015625, 0.53656005859375, 0.6060791015625, 0.67559814453125, 0.7451171875, 0.81463623046875, 0.8841552734375, 0.95367431640625, 1.023193359375, 1.09271240234375, 1.1622314453125, 1.23175048828125, 1.30126953125, 1.37078857421875, 1.4403076171875, 1.50982666015625, 1.579345703125, 1.64886474609375, 1.7183837890625, 1.78790283203125, 1.857421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 11.0, 11.0, 129.0, 553.0, 116.0, 12.0, 13.0, 12.0, 6.0, 7.0, 5.0, 4.0, 8.0, 6.0, 2.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8037109375, -0.773284912109375, -0.74285888671875, -0.712432861328125, -0.6820068359375, -0.651580810546875, -0.62115478515625, -0.590728759765625, -0.560302734375, -0.529876708984375, -0.49945068359375, -0.469024658203125, -0.4385986328125, -0.408172607421875, -0.37774658203125, -0.347320556640625, -0.31689453125, -0.286468505859375, -0.25604248046875, -0.225616455078125, -0.1951904296875, -0.164764404296875, -0.13433837890625, -0.103912353515625, -0.073486328125, -0.043060302734375, -0.01263427734375, 0.017791748046875, 0.0482177734375, 0.078643798828125, 0.10906982421875, 0.139495849609375, 0.169921875, 0.200347900390625, 0.23077392578125, 0.261199951171875, 0.2916259765625, 0.322052001953125, 0.35247802734375, 0.382904052734375, 0.413330078125, 0.443756103515625, 0.47418212890625, 0.504608154296875, 0.5350341796875, 0.565460205078125, 0.59588623046875, 0.626312255859375, 0.65673828125, 0.687164306640625, 0.71759033203125, 0.748016357421875, 0.7784423828125, 0.808868408203125, 0.83929443359375, 0.869720458984375, 0.900146484375, 0.930572509765625, 0.96099853515625, 0.991424560546875, 1.0218505859375, 1.052276611328125, 1.08270263671875, 1.113128662109375, 1.1435546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 10.0, 6.0, 14.0, 17.0, 18.0, 22.0, 35.0, 53.0, 87.0, 119.0, 189.0, 351.0, 753.0, 1618.0, 3931.0, 11433.0, 39126.0, 176126.0, 576732.0, 179234.0, 39854.0, 11497.0, 3995.0, 1606.0, 714.0, 371.0, 213.0, 145.0, 92.0, 44.0, 31.0, 29.0, 19.0, 21.0, 11.0, 7.0, 8.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.4671630859375, -2.383544921875, -2.2999267578125, -2.21630859375, -2.1326904296875, -2.049072265625, -1.9654541015625, -1.8818359375, -1.7982177734375, -1.714599609375, -1.6309814453125, -1.54736328125, -1.4637451171875, -1.380126953125, -1.2965087890625, -1.212890625, -1.1292724609375, -1.045654296875, -0.9620361328125, -0.87841796875, -0.7947998046875, -0.711181640625, -0.6275634765625, -0.5439453125, -0.4603271484375, -0.376708984375, -0.2930908203125, -0.20947265625, -0.1258544921875, -0.042236328125, 0.0413818359375, 0.125, 0.2086181640625, 0.292236328125, 0.3758544921875, 0.45947265625, 0.5430908203125, 0.626708984375, 0.7103271484375, 0.7939453125, 0.8775634765625, 0.961181640625, 1.0447998046875, 1.12841796875, 1.2120361328125, 1.295654296875, 1.3792724609375, 1.462890625, 1.5465087890625, 1.630126953125, 1.7137451171875, 1.79736328125, 1.8809814453125, 1.964599609375, 2.0482177734375, 2.1318359375, 2.2154541015625, 2.299072265625, 2.3826904296875, 2.46630859375, 2.5499267578125, 2.633544921875, 2.7171630859375, 2.80078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 17.0, 31.0, 20.0, 20.0, 36.0, 24.0, 37.0, 29.0, 35.0, 34.0, 39.0, 42.0, 43.0, 43.0, 55.0, 55.0, 39.0, 52.0, 33.0, 42.0, 29.0, 28.0, 32.0, 25.0, 25.0, 25.0, 9.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0], "bins": [-4.734375, -4.611480712890625, -4.48858642578125, -4.365692138671875, -4.2427978515625, -4.119903564453125, -3.99700927734375, -3.874114990234375, -3.751220703125, -3.628326416015625, -3.50543212890625, -3.382537841796875, -3.2596435546875, -3.136749267578125, -3.01385498046875, -2.890960693359375, -2.76806640625, -2.645172119140625, -2.52227783203125, -2.399383544921875, -2.2764892578125, -2.153594970703125, -2.03070068359375, -1.907806396484375, -1.784912109375, -1.662017822265625, -1.53912353515625, -1.416229248046875, -1.2933349609375, -1.170440673828125, -1.04754638671875, -0.924652099609375, -0.8017578125, -0.678863525390625, -0.55596923828125, -0.433074951171875, -0.3101806640625, -0.187286376953125, -0.06439208984375, 0.058502197265625, 0.181396484375, 0.304290771484375, 0.42718505859375, 0.550079345703125, 0.6729736328125, 0.795867919921875, 0.91876220703125, 1.041656494140625, 1.16455078125, 1.287445068359375, 1.41033935546875, 1.533233642578125, 1.6561279296875, 1.779022216796875, 1.90191650390625, 2.024810791015625, 2.147705078125, 2.270599365234375, 2.39349365234375, 2.516387939453125, 2.6392822265625, 2.762176513671875, 2.88507080078125, 3.007965087890625, 3.130859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 14.0, 17.0, 31.0, 35.0, 62.0, 93.0, 150.0, 303.0, 522.0, 1226.0, 2982.0, 8955.0, 36460.0, 327064.0, 590653.0, 60423.0, 12429.0, 3998.0, 1610.0, 722.0, 342.0, 164.0, 114.0, 54.0, 26.0, 29.0, 24.0, 10.0, 8.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.340484619140625, -2.24737548828125, -2.154266357421875, -2.0611572265625, -1.968048095703125, -1.87493896484375, -1.781829833984375, -1.688720703125, -1.595611572265625, -1.50250244140625, -1.409393310546875, -1.3162841796875, -1.223175048828125, -1.13006591796875, -1.036956787109375, -0.94384765625, -0.850738525390625, -0.75762939453125, -0.664520263671875, -0.5714111328125, -0.478302001953125, -0.38519287109375, -0.292083740234375, -0.198974609375, -0.105865478515625, -0.01275634765625, 0.080352783203125, 0.1734619140625, 0.266571044921875, 0.35968017578125, 0.452789306640625, 0.5458984375, 0.639007568359375, 0.73211669921875, 0.825225830078125, 0.9183349609375, 1.011444091796875, 1.10455322265625, 1.197662353515625, 1.290771484375, 1.383880615234375, 1.47698974609375, 1.570098876953125, 1.6632080078125, 1.756317138671875, 1.84942626953125, 1.942535400390625, 2.03564453125, 2.128753662109375, 2.22186279296875, 2.314971923828125, 2.4080810546875, 2.501190185546875, 2.59429931640625, 2.687408447265625, 2.780517578125, 2.873626708984375, 2.96673583984375, 3.059844970703125, 3.1529541015625, 3.246063232421875, 3.33917236328125, 3.432281494140625, 3.525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 5.0, 11.0, 15.0, 23.0, 28.0, 39.0, 52.0, 62.0, 79.0, 68.0, 94.0, 91.0, 86.0, 60.0, 61.0, 41.0, 36.0, 40.0, 23.0, 14.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011790171265602112, -0.00011301785707473755, -0.00010813400149345398, -0.00010325014591217041, -9.836629033088684e-05, -9.348243474960327e-05, -8.85985791683197e-05, -8.371472358703613e-05, -7.883086800575256e-05, -7.3947012424469e-05, -6.906315684318542e-05, -6.417930126190186e-05, -5.9295445680618286e-05, -5.441159009933472e-05, -4.952773451805115e-05, -4.464387893676758e-05, -3.976002335548401e-05, -3.487616777420044e-05, -2.999231219291687e-05, -2.51084566116333e-05, -2.022460103034973e-05, -1.5340745449066162e-05, -1.0456889867782593e-05, -5.5730342864990234e-06, -6.891787052154541e-07, 4.194676876068115e-06, 9.078532457351685e-06, 1.3962388038635254e-05, 1.8846243619918823e-05, 2.3730099201202393e-05, 2.8613954782485962e-05, 3.349781036376953e-05, 3.83816659450531e-05, 4.326552152633667e-05, 4.814937710762024e-05, 5.303323268890381e-05, 5.791708827018738e-05, 6.280094385147095e-05, 6.768479943275452e-05, 7.256865501403809e-05, 7.745251059532166e-05, 8.233636617660522e-05, 8.72202217578888e-05, 9.210407733917236e-05, 9.698793292045593e-05, 0.0001018717885017395, 0.00010675564408302307, 0.00011163949966430664, 0.00011652335524559021, 0.00012140721082687378, 0.00012629106640815735, 0.00013117492198944092, 0.0001360587775707245, 0.00014094263315200806, 0.00014582648873329163, 0.0001507103443145752, 0.00015559419989585876, 0.00016047805547714233, 0.0001653619110584259, 0.00017024576663970947, 0.00017512962222099304, 0.0001800134778022766, 0.00018489733338356018, 0.00018978118896484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 16.0, 12.0, 24.0, 31.0, 64.0, 113.0, 197.0, 446.0, 1017.0, 2667.0, 9912.0, 73714.0, 773111.0, 164765.0, 16152.0, 3893.0, 1268.0, 544.0, 257.0, 142.0, 81.0, 46.0, 30.0, 12.0, 10.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.593963623046875, -4.46136474609375, -4.328765869140625, -4.1961669921875, -4.063568115234375, -3.93096923828125, -3.798370361328125, -3.665771484375, -3.533172607421875, -3.40057373046875, -3.267974853515625, -3.1353759765625, -3.002777099609375, -2.87017822265625, -2.737579345703125, -2.60498046875, -2.472381591796875, -2.33978271484375, -2.207183837890625, -2.0745849609375, -1.941986083984375, -1.80938720703125, -1.676788330078125, -1.544189453125, -1.411590576171875, -1.27899169921875, -1.146392822265625, -1.0137939453125, -0.881195068359375, -0.74859619140625, -0.615997314453125, -0.4833984375, -0.350799560546875, -0.21820068359375, -0.085601806640625, 0.0469970703125, 0.179595947265625, 0.31219482421875, 0.444793701171875, 0.577392578125, 0.709991455078125, 0.84259033203125, 0.975189208984375, 1.1077880859375, 1.240386962890625, 1.37298583984375, 1.505584716796875, 1.63818359375, 1.770782470703125, 1.90338134765625, 2.035980224609375, 2.1685791015625, 2.301177978515625, 2.43377685546875, 2.566375732421875, 2.698974609375, 2.831573486328125, 2.96417236328125, 3.096771240234375, 3.2293701171875, 3.361968994140625, 3.49456787109375, 3.627166748046875, 3.759765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 11.0, 20.0, 23.0, 38.0, 43.0, 47.0, 76.0, 86.0, 86.0, 114.0, 104.0, 89.0, 62.0, 47.0, 38.0, 33.0, 17.0, 18.0, 11.0, 13.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.326080322265625, -2.26153564453125, -2.196990966796875, -2.1324462890625, -2.067901611328125, -2.00335693359375, -1.938812255859375, -1.874267578125, -1.809722900390625, -1.74517822265625, -1.680633544921875, -1.6160888671875, -1.551544189453125, -1.48699951171875, -1.422454833984375, -1.35791015625, -1.293365478515625, -1.22882080078125, -1.164276123046875, -1.0997314453125, -1.035186767578125, -0.97064208984375, -0.906097412109375, -0.841552734375, -0.777008056640625, -0.71246337890625, -0.647918701171875, -0.5833740234375, -0.518829345703125, -0.45428466796875, -0.389739990234375, -0.3251953125, -0.260650634765625, -0.19610595703125, -0.131561279296875, -0.0670166015625, -0.002471923828125, 0.06207275390625, 0.126617431640625, 0.191162109375, 0.255706787109375, 0.32025146484375, 0.384796142578125, 0.4493408203125, 0.513885498046875, 0.57843017578125, 0.642974853515625, 0.70751953125, 0.772064208984375, 0.83660888671875, 0.901153564453125, 0.9656982421875, 1.030242919921875, 1.09478759765625, 1.159332275390625, 1.223876953125, 1.288421630859375, 1.35296630859375, 1.417510986328125, 1.4820556640625, 1.546600341796875, 1.61114501953125, 1.675689697265625, 1.740234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 16.0, 52.0, 371.0, 491.0, 59.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.24732971191406, -120.71041107177734, -117.17349243164062, -113.63656616210938, -110.09964752197266, -106.56272888183594, -103.02580261230469, -99.48888397216797, -95.95196533203125, -92.41504669189453, -88.87812805175781, -85.34120178222656, -81.80428314208984, -78.26736450195312, -74.73043823242188, -71.19351959228516, -67.65660095214844, -64.11968231201172, -60.582759857177734, -57.04583740234375, -53.50891876220703, -49.97200012207031, -46.43507766723633, -42.898155212402344, -39.361236572265625, -35.824317932128906, -32.28739547729492, -28.75047492980957, -25.21355438232422, -21.676633834838867, -18.139713287353516, -14.602792739868164, -11.065872192382812, -7.528951644897461, -3.9920310974121094, -0.4551105499267578, 3.0818099975585938, 6.618730545043945, 10.155651092529297, 13.692571640014648, 17.2294921875, 20.76641273498535, 24.303333282470703, 27.840253829956055, 31.377174377441406, 34.914093017578125, 38.45101547241211, 41.987937927246094, 45.52485656738281, 49.06177520751953, 52.598697662353516, 56.1356201171875, 59.67253875732422, 63.20945739746094, 66.74638366699219, 70.2833023071289, 73.82022094726562, 77.35713958740234, 80.89405822753906, 84.43098449707031, 87.96790313720703, 91.50482177734375, 95.041748046875, 98.57866668701172, 102.11558532714844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 3.0, 7.0, 9.0, 12.0, 20.0, 29.0, 38.0, 64.0, 109.0, 123.0, 150.0, 117.0, 87.0, 72.0, 36.0, 16.0, 12.0, 12.0, 15.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.0882339477539, -61.97610855102539, -59.863983154296875, -57.751861572265625, -55.63973617553711, -53.527610778808594, -51.41548538208008, -49.30335998535156, -47.19123840332031, -45.0791130065918, -42.96698760986328, -40.85486602783203, -38.742740631103516, -36.630615234375, -34.518489837646484, -32.40636444091797, -30.294239044189453, -28.182113647460938, -26.069990158081055, -23.95786476135254, -21.845741271972656, -19.73361587524414, -17.621490478515625, -15.509366035461426, -13.397241592407227, -11.285117149353027, -9.172992706298828, -7.0608673095703125, -4.948742866516113, -2.836618423461914, -0.7244930267333984, 1.3876314163208008, 3.499755859375, 5.611880302429199, 7.724005222320557, 9.836130142211914, 11.948254585266113, 14.060379028320312, 16.172504425048828, 18.284629821777344, 20.396753311157227, 22.508878707885742, 24.621002197265625, 26.73312759399414, 28.845252990722656, 30.95737648010254, 33.06950378417969, 35.18162536621094, 37.29375076293945, 39.40587615966797, 41.518001556396484, 43.630126953125, 45.74224853515625, 47.854373931884766, 49.96649932861328, 52.0786247253418, 54.19075012207031, 56.30287551879883, 58.415000915527344, 60.527122497558594, 62.63924789428711, 64.75137329101562, 66.86349487304688, 68.97562408447266, 71.0877456665039]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 6.0, 10.0, 14.0, 23.0, 46.0, 46.0, 71.0, 98.0, 121.0, 202.0, 299.0, 429.0, 677.0, 1101.0, 1763.0, 3029.0, 5592.0, 12177.0, 35067.0, 3594586.0, 486835.0, 29786.0, 10367.0, 4822.0, 2644.0, 1499.0, 941.0, 588.0, 432.0, 298.0, 203.0, 148.0, 77.0, 71.0, 44.0, 37.0, 29.0, 23.0, 17.0, 8.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.87890625, -7.65972900390625, -7.4405517578125, -7.22137451171875, -7.002197265625, -6.78302001953125, -6.5638427734375, -6.34466552734375, -6.12548828125, -5.90631103515625, -5.6871337890625, -5.46795654296875, -5.248779296875, -5.02960205078125, -4.8104248046875, -4.59124755859375, -4.3720703125, -4.15289306640625, -3.9337158203125, -3.71453857421875, -3.495361328125, -3.27618408203125, -3.0570068359375, -2.83782958984375, -2.61865234375, -2.39947509765625, -2.1802978515625, -1.96112060546875, -1.741943359375, -1.52276611328125, -1.3035888671875, -1.08441162109375, -0.865234375, -0.64605712890625, -0.4268798828125, -0.20770263671875, 0.011474609375, 0.23065185546875, 0.4498291015625, 0.66900634765625, 0.88818359375, 1.10736083984375, 1.3265380859375, 1.54571533203125, 1.764892578125, 1.98406982421875, 2.2032470703125, 2.42242431640625, 2.6416015625, 2.86077880859375, 3.0799560546875, 3.29913330078125, 3.518310546875, 3.73748779296875, 3.9566650390625, 4.17584228515625, 4.39501953125, 4.61419677734375, 4.8333740234375, 5.05255126953125, 5.271728515625, 5.49090576171875, 5.7100830078125, 5.92926025390625, 6.1484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 16.0, 14.0, 9.0, 19.0, 22.0, 140.0, 357.0, 244.0, 61.0, 19.0, 12.0, 12.0, 7.0, 8.0, 9.0, 6.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6816787719726562, -0.6529083251953125, -0.6241378784179688, -0.595367431640625, -0.5665969848632812, -0.5378265380859375, -0.5090560913085938, -0.48028564453125, -0.45151519775390625, -0.4227447509765625, -0.39397430419921875, -0.365203857421875, -0.33643341064453125, -0.3076629638671875, -0.27889251708984375, -0.2501220703125, -0.22135162353515625, -0.1925811767578125, -0.16381072998046875, -0.135040283203125, -0.10626983642578125, -0.0774993896484375, -0.04872894287109375, -0.01995849609375, 0.00881195068359375, 0.0375823974609375, 0.06635284423828125, 0.095123291015625, 0.12389373779296875, 0.1526641845703125, 0.18143463134765625, 0.210205078125, 0.23897552490234375, 0.2677459716796875, 0.29651641845703125, 0.325286865234375, 0.35405731201171875, 0.3828277587890625, 0.41159820556640625, 0.44036865234375, 0.46913909912109375, 0.4979095458984375, 0.5266799926757812, 0.555450439453125, 0.5842208862304688, 0.6129913330078125, 0.6417617797851562, 0.6705322265625, 0.6993026733398438, 0.7280731201171875, 0.7568435668945312, 0.785614013671875, 0.8143844604492188, 0.8431549072265625, 0.8719253540039062, 0.90069580078125, 0.9294662475585938, 0.9582366943359375, 0.9870071411132812, 1.015777587890625, 1.0445480346679688, 1.0733184814453125, 1.1020889282226562, 1.130859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 7.0, 17.0, 25.0, 33.0, 51.0, 61.0, 138.0, 222.0, 448.0, 988.0, 2234.0, 5843.0, 17948.0, 84015.0, 3640573.0, 383782.0, 40267.0, 10724.0, 3909.0, 1570.0, 654.0, 361.0, 167.0, 90.0, 48.0, 36.0, 22.0, 12.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.59552001953125, -7.3707275390625, -7.14593505859375, -6.921142578125, -6.69635009765625, -6.4715576171875, -6.24676513671875, -6.02197265625, -5.79718017578125, -5.5723876953125, -5.34759521484375, -5.122802734375, -4.89801025390625, -4.6732177734375, -4.44842529296875, -4.2236328125, -3.99884033203125, -3.7740478515625, -3.54925537109375, -3.324462890625, -3.09967041015625, -2.8748779296875, -2.65008544921875, -2.42529296875, -2.20050048828125, -1.9757080078125, -1.75091552734375, -1.526123046875, -1.30133056640625, -1.0765380859375, -0.85174560546875, -0.626953125, -0.40216064453125, -0.1773681640625, 0.04742431640625, 0.272216796875, 0.49700927734375, 0.7218017578125, 0.94659423828125, 1.17138671875, 1.39617919921875, 1.6209716796875, 1.84576416015625, 2.070556640625, 2.29534912109375, 2.5201416015625, 2.74493408203125, 2.9697265625, 3.19451904296875, 3.4193115234375, 3.64410400390625, 3.868896484375, 4.09368896484375, 4.3184814453125, 4.54327392578125, 4.76806640625, 4.99285888671875, 5.2176513671875, 5.44244384765625, 5.667236328125, 5.89202880859375, 6.1168212890625, 6.34161376953125, 6.56640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 14.0, 18.0, 14.0, 19.0, 33.0, 59.0, 93.0, 178.0, 325.0, 2147.0, 615.0, 214.0, 134.0, 66.0, 37.0, 30.0, 24.0, 20.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2167816162109375, -1.184539794921875, -1.1522979736328125, -1.12005615234375, -1.0878143310546875, -1.055572509765625, -1.0233306884765625, -0.9910888671875, -0.9588470458984375, -0.926605224609375, -0.8943634033203125, -0.86212158203125, -0.8298797607421875, -0.797637939453125, -0.7653961181640625, -0.733154296875, -0.7009124755859375, -0.668670654296875, -0.6364288330078125, -0.60418701171875, -0.5719451904296875, -0.539703369140625, -0.5074615478515625, -0.4752197265625, -0.4429779052734375, -0.410736083984375, -0.3784942626953125, -0.34625244140625, -0.3140106201171875, -0.281768798828125, -0.2495269775390625, -0.21728515625, -0.1850433349609375, -0.152801513671875, -0.1205596923828125, -0.08831787109375, -0.0560760498046875, -0.023834228515625, 0.0084075927734375, 0.0406494140625, 0.0728912353515625, 0.105133056640625, 0.1373748779296875, 0.16961669921875, 0.2018585205078125, 0.234100341796875, 0.2663421630859375, 0.298583984375, 0.3308258056640625, 0.363067626953125, 0.3953094482421875, 0.42755126953125, 0.4597930908203125, 0.492034912109375, 0.5242767333984375, 0.5565185546875, 0.5887603759765625, 0.621002197265625, 0.6532440185546875, 0.68548583984375, 0.7177276611328125, 0.749969482421875, 0.7822113037109375, 0.814453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 48.0, 169.0, 450.0, 246.0, 56.0, 16.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.364155769348145, -9.9586820602417, -9.553208351135254, -9.147734642028809, -8.742260932922363, -8.336787223815918, -7.9313130378723145, -7.525839328765869, -7.120365619659424, -6.7148919105529785, -6.309418201446533, -5.90394401550293, -5.498470306396484, -5.092996597290039, -4.687522888183594, -4.282049179077148, -3.876575469970703, -3.471101760864258, -3.0656280517578125, -2.660154104232788, -2.2546803951263428, -1.8492066860198975, -1.443732738494873, -1.0382590293884277, -0.6327853202819824, -0.22731155157089233, 0.17816221714019775, 0.5836360454559326, 0.9891097545623779, 1.3945834636688232, 1.8000574111938477, 2.205531120300293, 2.611003875732422, 3.016477584838867, 3.4219512939453125, 3.827425241470337, 4.232898712158203, 4.638372421264648, 5.043846607208252, 5.449320316314697, 5.854794025421143, 6.260267734527588, 6.665741443634033, 7.071215629577637, 7.476689338684082, 7.882163047790527, 8.287636756896973, 8.693110466003418, 9.098584175109863, 9.504057884216309, 9.909531593322754, 10.3150053024292, 10.720479011535645, 11.12595272064209, 11.531427383422852, 11.936901092529297, 12.342374801635742, 12.747848510742188, 13.153322219848633, 13.558795928955078, 13.964269638061523, 14.369743347167969, 14.775217056274414, 15.18069076538086, 15.586164474487305]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 10.0, 8.0, 11.0, 16.0, 15.0, 34.0, 34.0, 34.0, 44.0, 63.0, 80.0, 65.0, 75.0, 68.0, 55.0, 79.0, 43.0, 58.0, 37.0, 28.0, 24.0, 25.0, 19.0, 16.0, 11.0, 9.0, 2.0, 4.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.959841251373291, -3.85481333732605, -3.7497856616973877, -3.6447577476501465, -3.5397298336029053, -3.434701919555664, -3.329674243927002, -3.2246463298797607, -3.1196184158325195, -3.0145905017852783, -2.909562826156616, -2.804534912109375, -2.699506998062134, -2.5944790840148926, -2.4894514083862305, -2.3844234943389893, -2.279395818710327, -2.174367904663086, -2.069340229034424, -1.9643123149871826, -1.8592844009399414, -1.7542566061019897, -1.649228811264038, -1.5442008972167969, -1.4391731023788452, -1.3341453075408936, -1.2291173934936523, -1.1240895986557007, -1.019061803817749, -0.9140338897705078, -0.8090060949325562, -0.7039782404899597, -0.5989501476287842, -0.49392229318618774, -0.3888944685459137, -0.28386664390563965, -0.1788387894630432, -0.07381093502044678, 0.031216859817504883, 0.13624471426010132, 0.24127256870269775, 0.3463004231452942, 0.45132824778556824, 0.5563560724258423, 0.6613839268684387, 0.7664117813110352, 0.8714395761489868, 0.9764674305915833, 1.0814952850341797, 1.1865230798721313, 1.2915509939193726, 1.3965787887573242, 1.5016067028045654, 1.606634497642517, 1.7116622924804688, 1.81669020652771, 1.9217180013656616, 2.0267457962036133, 2.1317737102508545, 2.2368016242980957, 2.341829299926758, 2.446857213973999, 2.5518851280212402, 2.6569128036499023, 2.7619407176971436]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 12.0, 8.0, 12.0, 16.0, 21.0, 24.0, 30.0, 46.0, 55.0, 94.0, 142.0, 164.0, 233.0, 374.0, 569.0, 936.0, 1510.0, 2494.0, 4326.0, 8399.0, 19191.0, 71619.0, 816896.0, 81192.0, 20206.0, 8621.0, 4401.0, 2520.0, 1565.0, 1001.0, 620.0, 359.0, 273.0, 193.0, 120.0, 93.0, 64.0, 38.0, 29.0, 28.0, 17.0, 13.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.9375, -4.79022216796875, -4.6429443359375, -4.49566650390625, -4.348388671875, -4.20111083984375, -4.0538330078125, -3.90655517578125, -3.75927734375, -3.61199951171875, -3.4647216796875, -3.31744384765625, -3.170166015625, -3.02288818359375, -2.8756103515625, -2.72833251953125, -2.5810546875, -2.43377685546875, -2.2864990234375, -2.13922119140625, -1.991943359375, -1.84466552734375, -1.6973876953125, -1.55010986328125, -1.40283203125, -1.25555419921875, -1.1082763671875, -0.96099853515625, -0.813720703125, -0.66644287109375, -0.5191650390625, -0.37188720703125, -0.224609375, -0.07733154296875, 0.0699462890625, 0.21722412109375, 0.364501953125, 0.51177978515625, 0.6590576171875, 0.80633544921875, 0.95361328125, 1.10089111328125, 1.2481689453125, 1.39544677734375, 1.542724609375, 1.69000244140625, 1.8372802734375, 1.98455810546875, 2.1318359375, 2.27911376953125, 2.4263916015625, 2.57366943359375, 2.720947265625, 2.86822509765625, 3.0155029296875, 3.16278076171875, 3.31005859375, 3.45733642578125, 3.6046142578125, 3.75189208984375, 3.899169921875, 4.04644775390625, 4.1937255859375, 4.34100341796875, 4.48828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 10.0, 3.0, 7.0, 18.0, 13.0, 27.0, 80.0, 221.0, 335.0, 161.0, 35.0, 19.0, 8.0, 11.0, 13.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7085494995117188, -0.6793060302734375, -0.6500625610351562, -0.620819091796875, -0.5915756225585938, -0.5623321533203125, -0.5330886840820312, -0.50384521484375, -0.47460174560546875, -0.4453582763671875, -0.41611480712890625, -0.386871337890625, -0.35762786865234375, -0.3283843994140625, -0.29914093017578125, -0.2698974609375, -0.24065399169921875, -0.2114105224609375, -0.18216705322265625, -0.152923583984375, -0.12368011474609375, -0.0944366455078125, -0.06519317626953125, -0.03594970703125, -0.00670623779296875, 0.0225372314453125, 0.05178070068359375, 0.081024169921875, 0.11026763916015625, 0.1395111083984375, 0.16875457763671875, 0.197998046875, 0.22724151611328125, 0.2564849853515625, 0.28572845458984375, 0.314971923828125, 0.34421539306640625, 0.3734588623046875, 0.40270233154296875, 0.43194580078125, 0.46118927001953125, 0.4904327392578125, 0.5196762084960938, 0.548919677734375, 0.5781631469726562, 0.6074066162109375, 0.6366500854492188, 0.6658935546875, 0.6951370239257812, 0.7243804931640625, 0.7536239624023438, 0.782867431640625, 0.8121109008789062, 0.8413543701171875, 0.8705978393554688, 0.89984130859375, 0.9290847778320312, 0.9583282470703125, 0.9875717163085938, 1.016815185546875, 1.0460586547851562, 1.0753021240234375, 1.1045455932617188, 1.1337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 11.0, 28.0, 39.0, 50.0, 93.0, 130.0, 266.0, 508.0, 1103.0, 2501.0, 6683.0, 23871.0, 171364.0, 706805.0, 109010.0, 17475.0, 4996.0, 1870.0, 804.0, 399.0, 209.0, 116.0, 74.0, 50.0, 24.0, 9.0, 13.0, 15.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.33843994140625, -4.2003173828125, -4.06219482421875, -3.924072265625, -3.78594970703125, -3.6478271484375, -3.50970458984375, -3.37158203125, -3.23345947265625, -3.0953369140625, -2.95721435546875, -2.819091796875, -2.68096923828125, -2.5428466796875, -2.40472412109375, -2.2666015625, -2.12847900390625, -1.9903564453125, -1.85223388671875, -1.714111328125, -1.57598876953125, -1.4378662109375, -1.29974365234375, -1.16162109375, -1.02349853515625, -0.8853759765625, -0.74725341796875, -0.609130859375, -0.47100830078125, -0.3328857421875, -0.19476318359375, -0.056640625, 0.08148193359375, 0.2196044921875, 0.35772705078125, 0.495849609375, 0.63397216796875, 0.7720947265625, 0.91021728515625, 1.04833984375, 1.18646240234375, 1.3245849609375, 1.46270751953125, 1.600830078125, 1.73895263671875, 1.8770751953125, 2.01519775390625, 2.1533203125, 2.29144287109375, 2.4295654296875, 2.56768798828125, 2.705810546875, 2.84393310546875, 2.9820556640625, 3.12017822265625, 3.25830078125, 3.39642333984375, 3.5345458984375, 3.67266845703125, 3.810791015625, 3.94891357421875, 4.0870361328125, 4.22515869140625, 4.36328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 10.0, 7.0, 17.0, 20.0, 29.0, 33.0, 30.0, 59.0, 46.0, 50.0, 54.0, 50.0, 56.0, 57.0, 49.0, 59.0, 57.0, 52.0, 55.0, 33.0, 38.0, 24.0, 20.0, 13.0, 17.0, 9.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.311767578125, -2.23095703125, -2.150146484375, -2.0693359375, -1.988525390625, -1.90771484375, -1.826904296875, -1.74609375, -1.665283203125, -1.58447265625, -1.503662109375, -1.4228515625, -1.342041015625, -1.26123046875, -1.180419921875, -1.099609375, -1.018798828125, -0.93798828125, -0.857177734375, -0.7763671875, -0.695556640625, -0.61474609375, -0.533935546875, -0.453125, -0.372314453125, -0.29150390625, -0.210693359375, -0.1298828125, -0.049072265625, 0.03173828125, 0.112548828125, 0.193359375, 0.274169921875, 0.35498046875, 0.435791015625, 0.5166015625, 0.597412109375, 0.67822265625, 0.759033203125, 0.83984375, 0.920654296875, 1.00146484375, 1.082275390625, 1.1630859375, 1.243896484375, 1.32470703125, 1.405517578125, 1.486328125, 1.567138671875, 1.64794921875, 1.728759765625, 1.8095703125, 1.890380859375, 1.97119140625, 2.052001953125, 2.1328125, 2.213623046875, 2.29443359375, 2.375244140625, 2.4560546875, 2.536865234375, 2.61767578125, 2.698486328125, 2.779296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 2.0, 4.0, 6.0, 13.0, 16.0, 27.0, 33.0, 42.0, 83.0, 96.0, 158.0, 200.0, 344.0, 504.0, 855.0, 1437.0, 2501.0, 5119.0, 10919.0, 28276.0, 93382.0, 376147.0, 382392.0, 94680.0, 28702.0, 11088.0, 5105.0, 2602.0, 1454.0, 860.0, 455.0, 328.0, 231.0, 145.0, 90.0, 72.0, 41.0, 30.0, 31.0, 22.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.865234375, -2.769744873046875, -2.67425537109375, -2.578765869140625, -2.4832763671875, -2.387786865234375, -2.29229736328125, -2.196807861328125, -2.101318359375, -2.005828857421875, -1.91033935546875, -1.814849853515625, -1.7193603515625, -1.623870849609375, -1.52838134765625, -1.432891845703125, -1.33740234375, -1.241912841796875, -1.14642333984375, -1.050933837890625, -0.9554443359375, -0.859954833984375, -0.76446533203125, -0.668975830078125, -0.573486328125, -0.477996826171875, -0.38250732421875, -0.287017822265625, -0.1915283203125, -0.096038818359375, -0.00054931640625, 0.094940185546875, 0.1904296875, 0.285919189453125, 0.38140869140625, 0.476898193359375, 0.5723876953125, 0.667877197265625, 0.76336669921875, 0.858856201171875, 0.954345703125, 1.049835205078125, 1.14532470703125, 1.240814208984375, 1.3363037109375, 1.431793212890625, 1.52728271484375, 1.622772216796875, 1.71826171875, 1.813751220703125, 1.90924072265625, 2.004730224609375, 2.1002197265625, 2.195709228515625, 2.29119873046875, 2.386688232421875, 2.482177734375, 2.577667236328125, 2.67315673828125, 2.768646240234375, 2.8641357421875, 2.959625244140625, 3.05511474609375, 3.150604248046875, 3.24609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 10.0, 15.0, 18.0, 32.0, 63.0, 120.0, 213.0, 187.0, 140.0, 76.0, 41.0, 24.0, 14.0, 9.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006275177001953125, -0.0006133057177066803, -0.0005990937352180481, -0.0005848817527294159, -0.0005706697702407837, -0.0005564577877521515, -0.0005422458052635193, -0.0005280338227748871, -0.0005138218402862549, -0.0004996098577976227, -0.0004853978753089905, -0.0004711858928203583, -0.0004569739103317261, -0.00044276192784309387, -0.00042854994535446167, -0.00041433796286582947, -0.00040012598037719727, -0.00038591399788856506, -0.00037170201539993286, -0.00035749003291130066, -0.00034327805042266846, -0.00032906606793403625, -0.00031485408544540405, -0.00030064210295677185, -0.00028643012046813965, -0.00027221813797950745, -0.00025800615549087524, -0.00024379417300224304, -0.00022958219051361084, -0.00021537020802497864, -0.00020115822553634644, -0.00018694624304771423, -0.00017273426055908203, -0.00015852227807044983, -0.00014431029558181763, -0.00013009831309318542, -0.00011588633060455322, -0.00010167434811592102, -8.746236562728882e-05, -7.325038313865662e-05, -5.9038400650024414e-05, -4.482641816139221e-05, -3.061443567276001e-05, -1.6402453184127808e-05, -2.1904706954956055e-06, 1.2021511793136597e-05, 2.62334942817688e-05, 4.0445476770401e-05, 5.46574592590332e-05, 6.88694417476654e-05, 8.308142423629761e-05, 9.729340672492981e-05, 0.00011150538921356201, 0.00012571737170219421, 0.00013992935419082642, 0.00015414133667945862, 0.00016835331916809082, 0.00018256530165672302, 0.00019677728414535522, 0.00021098926663398743, 0.00022520124912261963, 0.00023941323161125183, 0.00025362521409988403, 0.00026783719658851624, 0.00028204917907714844]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 6.0, 6.0, 9.0, 21.0, 24.0, 28.0, 27.0, 60.0, 98.0, 135.0, 220.0, 373.0, 653.0, 1156.0, 2226.0, 4661.0, 10747.0, 30802.0, 114591.0, 448379.0, 320218.0, 75375.0, 22356.0, 8429.0, 3635.0, 1818.0, 1024.0, 544.0, 312.0, 190.0, 119.0, 85.0, 53.0, 45.0, 30.0, 24.0, 16.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.2236328125, -3.119140625, -3.0146484375, -2.91015625, -2.8056640625, -2.701171875, -2.5966796875, -2.4921875, -2.3876953125, -2.283203125, -2.1787109375, -2.07421875, -1.9697265625, -1.865234375, -1.7607421875, -1.65625, -1.5517578125, -1.447265625, -1.3427734375, -1.23828125, -1.1337890625, -1.029296875, -0.9248046875, -0.8203125, -0.7158203125, -0.611328125, -0.5068359375, -0.40234375, -0.2978515625, -0.193359375, -0.0888671875, 0.015625, 0.1201171875, 0.224609375, 0.3291015625, 0.43359375, 0.5380859375, 0.642578125, 0.7470703125, 0.8515625, 0.9560546875, 1.060546875, 1.1650390625, 1.26953125, 1.3740234375, 1.478515625, 1.5830078125, 1.6875, 1.7919921875, 1.896484375, 2.0009765625, 2.10546875, 2.2099609375, 2.314453125, 2.4189453125, 2.5234375, 2.6279296875, 2.732421875, 2.8369140625, 2.94140625, 3.0458984375, 3.150390625, 3.2548828125, 3.359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 8.0, 11.0, 11.0, 9.0, 25.0, 19.0, 38.0, 43.0, 48.0, 59.0, 58.0, 97.0, 82.0, 70.0, 70.0, 54.0, 46.0, 47.0, 37.0, 35.0, 26.0, 21.0, 21.0, 9.0, 9.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.79913330078125, -1.7388916015625, -1.67864990234375, -1.618408203125, -1.55816650390625, -1.4979248046875, -1.43768310546875, -1.37744140625, -1.31719970703125, -1.2569580078125, -1.19671630859375, -1.136474609375, -1.07623291015625, -1.0159912109375, -0.95574951171875, -0.8955078125, -0.83526611328125, -0.7750244140625, -0.71478271484375, -0.654541015625, -0.59429931640625, -0.5340576171875, -0.47381591796875, -0.41357421875, -0.35333251953125, -0.2930908203125, -0.23284912109375, -0.172607421875, -0.11236572265625, -0.0521240234375, 0.00811767578125, 0.068359375, 0.12860107421875, 0.1888427734375, 0.24908447265625, 0.309326171875, 0.36956787109375, 0.4298095703125, 0.49005126953125, 0.55029296875, 0.61053466796875, 0.6707763671875, 0.73101806640625, 0.791259765625, 0.85150146484375, 0.9117431640625, 0.97198486328125, 1.0322265625, 1.09246826171875, 1.1527099609375, 1.21295166015625, 1.273193359375, 1.33343505859375, 1.3936767578125, 1.45391845703125, 1.51416015625, 1.57440185546875, 1.6346435546875, 1.69488525390625, 1.755126953125, 1.81536865234375, 1.8756103515625, 1.93585205078125, 1.99609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 24.0, 46.0, 92.0, 181.0, 258.0, 190.0, 110.0, 47.0, 24.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.348005294799805, -16.413665771484375, -15.479326248168945, -14.544986724853516, -13.610647201538086, -12.676307678222656, -11.741968154907227, -10.807628631591797, -9.873289108276367, -8.938949584960938, -8.004610061645508, -7.070270538330078, -6.135931015014648, -5.201591491699219, -4.267251968383789, -3.3329124450683594, -2.3985729217529297, -1.4642333984375, -0.5298938751220703, 0.4044456481933594, 1.338785171508789, 2.2731246948242188, 3.2074642181396484, 4.141803741455078, 5.076143264770508, 6.0104827880859375, 6.944822311401367, 7.879161834716797, 8.813501358032227, 9.747840881347656, 10.682180404663086, 11.616519927978516, 12.550857543945312, 13.485197067260742, 14.419536590576172, 15.353876113891602, 16.28821563720703, 17.22255516052246, 18.15689468383789, 19.09123420715332, 20.02557373046875, 20.95991325378418, 21.89425277709961, 22.82859230041504, 23.76293182373047, 24.6972713470459, 25.631610870361328, 26.565950393676758, 27.500289916992188, 28.434629440307617, 29.368968963623047, 30.303308486938477, 31.237648010253906, 32.17198944091797, 33.106327056884766, 34.04066467285156, 34.975006103515625, 35.90934753417969, 36.843685150146484, 37.77802276611328, 38.712364196777344, 39.646705627441406, 40.5810432434082, 41.515380859375, 42.44972229003906]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 12.0, 11.0, 11.0, 15.0, 22.0, 31.0, 34.0, 48.0, 43.0, 50.0, 63.0, 81.0, 68.0, 64.0, 69.0, 61.0, 57.0, 71.0, 40.0, 28.0, 26.0, 28.0, 13.0, 10.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.886821746826172, -17.308025360107422, -16.729228973388672, -16.150432586669922, -15.571636199951172, -14.992839813232422, -14.414044380187988, -13.835247993469238, -13.256451606750488, -12.677655220031738, -12.098858833312988, -11.520062446594238, -10.941267013549805, -10.362470626831055, -9.783674240112305, -9.204877853393555, -8.626081466674805, -8.047285079956055, -7.468488693237305, -6.889692783355713, -6.310896396636963, -5.732100009918213, -5.153304100036621, -4.574507713317871, -3.995711326599121, -3.416914939880371, -2.8381187915802, -2.2593226432800293, -1.6805262565612793, -1.1017298698425293, -0.5229337215423584, 0.0558624267578125, 0.6346588134765625, 1.213455080986023, 1.7922513484954834, 2.3710474967956543, 2.9498438835144043, 3.5286402702331543, 4.107436180114746, 4.686232566833496, 5.265028953552246, 5.843825340270996, 6.422621726989746, 7.001417636871338, 7.580214023590088, 8.15900993347168, 8.73780632019043, 9.31660270690918, 9.89539909362793, 10.47419548034668, 11.05299186706543, 11.63178825378418, 12.21058464050293, 12.78938102722168, 13.368176460266113, 13.946972846984863, 14.525769233703613, 15.104565620422363, 15.683362007141113, 16.262157440185547, 16.840953826904297, 17.419750213623047, 17.998546600341797, 18.577342987060547, 19.156139373779297]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 22.0, 21.0, 42.0, 51.0, 77.0, 100.0, 145.0, 225.0, 355.0, 448.0, 753.0, 1253.0, 2364.0, 4718.0, 11505.0, 45814.0, 3873722.0, 217062.0, 20971.0, 7079.0, 3088.0, 1709.0, 954.0, 607.0, 369.0, 256.0, 156.0, 111.0, 72.0, 65.0, 35.0, 22.0, 22.0, 12.0, 19.0, 6.0, 9.0, 3.0, 4.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9921875, -11.6370849609375, -11.281982421875, -10.9268798828125, -10.57177734375, -10.2166748046875, -9.861572265625, -9.5064697265625, -9.1513671875, -8.7962646484375, -8.441162109375, -8.0860595703125, -7.73095703125, -7.3758544921875, -7.020751953125, -6.6656494140625, -6.310546875, -5.9554443359375, -5.600341796875, -5.2452392578125, -4.89013671875, -4.5350341796875, -4.179931640625, -3.8248291015625, -3.4697265625, -3.1146240234375, -2.759521484375, -2.4044189453125, -2.04931640625, -1.6942138671875, -1.339111328125, -0.9840087890625, -0.62890625, -0.2738037109375, 0.081298828125, 0.4364013671875, 0.79150390625, 1.1466064453125, 1.501708984375, 1.8568115234375, 2.2119140625, 2.5670166015625, 2.922119140625, 3.2772216796875, 3.63232421875, 3.9874267578125, 4.342529296875, 4.6976318359375, 5.052734375, 5.4078369140625, 5.762939453125, 6.1180419921875, 6.47314453125, 6.8282470703125, 7.183349609375, 7.5384521484375, 7.8935546875, 8.2486572265625, 8.603759765625, 8.9588623046875, 9.31396484375, 9.6690673828125, 10.024169921875, 10.3792724609375, 10.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 11.0, 7.0, 18.0, 31.0, 54.0, 171.0, 287.0, 208.0, 101.0, 31.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7702255249023438, -0.7401580810546875, -0.7100906372070312, -0.680023193359375, -0.6499557495117188, -0.6198883056640625, -0.5898208618164062, -0.55975341796875, -0.5296859741210938, -0.4996185302734375, -0.46955108642578125, -0.439483642578125, -0.40941619873046875, -0.3793487548828125, -0.34928131103515625, -0.3192138671875, -0.28914642333984375, -0.2590789794921875, -0.22901153564453125, -0.198944091796875, -0.16887664794921875, -0.1388092041015625, -0.10874176025390625, -0.07867431640625, -0.04860687255859375, -0.0185394287109375, 0.01152801513671875, 0.041595458984375, 0.07166290283203125, 0.1017303466796875, 0.13179779052734375, 0.161865234375, 0.19193267822265625, 0.2220001220703125, 0.25206756591796875, 0.282135009765625, 0.31220245361328125, 0.3422698974609375, 0.37233734130859375, 0.40240478515625, 0.43247222900390625, 0.4625396728515625, 0.49260711669921875, 0.522674560546875, 0.5527420043945312, 0.5828094482421875, 0.6128768920898438, 0.6429443359375, 0.6730117797851562, 0.7030792236328125, 0.7331466674804688, 0.763214111328125, 0.7932815551757812, 0.8233489990234375, 0.8534164428710938, 0.88348388671875, 0.9135513305664062, 0.9436187744140625, 0.9736862182617188, 1.003753662109375, 1.0338211059570312, 1.0638885498046875, 1.0939559936523438, 1.1240234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 19.0, 34.0, 48.0, 86.0, 181.0, 335.0, 702.0, 1723.0, 4663.0, 15274.0, 63631.0, 653954.0, 3311489.0, 108230.0, 22858.0, 6786.0, 2382.0, 972.0, 400.0, 211.0, 118.0, 68.0, 36.0, 25.0, 10.0, 5.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.6072998046875, -8.339599609375, -8.0718994140625, -7.80419921875, -7.5364990234375, -7.268798828125, -7.0010986328125, -6.7333984375, -6.4656982421875, -6.197998046875, -5.9302978515625, -5.66259765625, -5.3948974609375, -5.127197265625, -4.8594970703125, -4.591796875, -4.3240966796875, -4.056396484375, -3.7886962890625, -3.52099609375, -3.2532958984375, -2.985595703125, -2.7178955078125, -2.4501953125, -2.1824951171875, -1.914794921875, -1.6470947265625, -1.37939453125, -1.1116943359375, -0.843994140625, -0.5762939453125, -0.30859375, -0.0408935546875, 0.226806640625, 0.4945068359375, 0.76220703125, 1.0299072265625, 1.297607421875, 1.5653076171875, 1.8330078125, 2.1007080078125, 2.368408203125, 2.6361083984375, 2.90380859375, 3.1715087890625, 3.439208984375, 3.7069091796875, 3.974609375, 4.2423095703125, 4.510009765625, 4.7777099609375, 5.04541015625, 5.3131103515625, 5.580810546875, 5.8485107421875, 6.1162109375, 6.3839111328125, 6.651611328125, 6.9193115234375, 7.18701171875, 7.4547119140625, 7.722412109375, 7.9901123046875, 8.2578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 7.0, 13.0, 20.0, 11.0, 25.0, 33.0, 50.0, 58.0, 112.0, 172.0, 293.0, 640.0, 1705.0, 383.0, 157.0, 111.0, 69.0, 45.0, 43.0, 27.0, 21.0, 11.0, 15.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.203125, -1.169891357421875, -1.13665771484375, -1.103424072265625, -1.0701904296875, -1.036956787109375, -1.00372314453125, -0.970489501953125, -0.937255859375, -0.904022216796875, -0.87078857421875, -0.837554931640625, -0.8043212890625, -0.771087646484375, -0.73785400390625, -0.704620361328125, -0.67138671875, -0.638153076171875, -0.60491943359375, -0.571685791015625, -0.5384521484375, -0.505218505859375, -0.47198486328125, -0.438751220703125, -0.405517578125, -0.372283935546875, -0.33905029296875, -0.305816650390625, -0.2725830078125, -0.239349365234375, -0.20611572265625, -0.172882080078125, -0.1396484375, -0.106414794921875, -0.07318115234375, -0.039947509765625, -0.0067138671875, 0.026519775390625, 0.05975341796875, 0.092987060546875, 0.126220703125, 0.159454345703125, 0.19268798828125, 0.225921630859375, 0.2591552734375, 0.292388916015625, 0.32562255859375, 0.358856201171875, 0.39208984375, 0.425323486328125, 0.45855712890625, 0.491790771484375, 0.5250244140625, 0.558258056640625, 0.59149169921875, 0.624725341796875, 0.657958984375, 0.691192626953125, 0.72442626953125, 0.757659912109375, 0.7908935546875, 0.824127197265625, 0.85736083984375, 0.890594482421875, 0.923828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 12.0, 30.0, 42.0, 113.0, 169.0, 245.0, 185.0, 96.0, 51.0, 26.0, 15.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.81429672241211, -16.46824836730957, -16.1221981048584, -15.776148796081543, -15.430099487304688, -15.084050178527832, -14.738000869750977, -14.391952514648438, -14.045902252197266, -13.69985294342041, -13.353803634643555, -13.0077543258667, -12.661705017089844, -12.315655708312988, -11.969606399536133, -11.623558044433594, -11.277508735656738, -10.931459426879883, -10.585410118103027, -10.239360809326172, -9.893311500549316, -9.547262191772461, -9.201213836669922, -8.85516357421875, -8.509115219116211, -8.163065910339355, -7.8170166015625, -7.4709672927856445, -7.124917984008789, -6.778868675231934, -6.432819843292236, -6.086770534515381, -5.740721702575684, -5.394672393798828, -5.048623085021973, -4.702573776245117, -4.356524467468262, -4.010475158691406, -3.664426326751709, -3.3183770179748535, -2.972327709197998, -2.6262784004211426, -2.280229091644287, -1.9341800212860107, -1.5881307125091553, -1.2420814037322998, -0.8960323333740234, -0.549983024597168, -0.2039337158203125, 0.1421155333518982, 0.4881647825241089, 0.8342139720916748, 1.1802632808685303, 1.5263125896453857, 1.872361660003662, 2.2184109687805176, 2.564460277557373, 2.9105095863342285, 3.256558895111084, 3.6026079654693604, 3.948657274246216, 4.294706344604492, 4.640755653381348, 4.986804962158203, 5.332854270935059]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 7.0, 6.0, 10.0, 14.0, 13.0, 14.0, 24.0, 21.0, 34.0, 28.0, 25.0, 27.0, 36.0, 40.0, 36.0, 47.0, 43.0, 34.0, 40.0, 35.0, 40.0, 46.0, 34.0, 34.0, 32.0, 42.0, 41.0, 23.0, 25.0, 20.0, 28.0, 14.0, 14.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2092902660369873, -3.1037561893463135, -2.9982218742370605, -2.8926877975463867, -2.787153720855713, -2.681619644165039, -2.5760855674743652, -2.4705512523651123, -2.3650171756744385, -2.2594830989837646, -2.1539487838745117, -2.048414707183838, -1.942880630493164, -1.8373465538024902, -1.7318123579025269, -1.6262781620025635, -1.5207440853118896, -1.4152100086212158, -1.3096758127212524, -1.204141616821289, -1.0986075401306152, -0.9930734038352966, -0.887539267539978, -0.7820051312446594, -0.6764709949493408, -0.5709368586540222, -0.4654027223587036, -0.359868586063385, -0.2543344497680664, -0.1488003134727478, -0.0432661771774292, 0.062267959117889404, 0.1678023338317871, 0.2733364701271057, 0.3788706064224243, 0.4844047427177429, 0.5899388790130615, 0.6954730153083801, 0.8010071516036987, 0.9065412878990173, 1.012075424194336, 1.1176095008850098, 1.2231436967849731, 1.3286778926849365, 1.4342119693756104, 1.5397460460662842, 1.6452802419662476, 1.750814437866211, 1.8563485145568848, 1.9618825912475586, 2.0674166679382324, 2.1729509830474854, 2.278485059738159, 2.384019136428833, 2.489553451538086, 2.5950875282287598, 2.7006216049194336, 2.8061556816101074, 2.9116897583007812, 3.017224073410034, 3.122758150100708, 3.228292226791382, 3.3338265419006348, 3.4393606185913086, 3.5448946952819824]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 13.0, 16.0, 19.0, 24.0, 31.0, 54.0, 73.0, 87.0, 109.0, 153.0, 238.0, 350.0, 523.0, 720.0, 1019.0, 1721.0, 2740.0, 5000.0, 10529.0, 28765.0, 145161.0, 653135.0, 145427.0, 28923.0, 10583.0, 5234.0, 2829.0, 1640.0, 1092.0, 681.0, 472.0, 340.0, 252.0, 166.0, 129.0, 90.0, 56.0, 38.0, 37.0, 22.0, 16.0, 13.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.953125, -5.76995849609375, -5.5867919921875, -5.40362548828125, -5.220458984375, -5.03729248046875, -4.8541259765625, -4.67095947265625, -4.48779296875, -4.30462646484375, -4.1214599609375, -3.93829345703125, -3.755126953125, -3.57196044921875, -3.3887939453125, -3.20562744140625, -3.0224609375, -2.83929443359375, -2.6561279296875, -2.47296142578125, -2.289794921875, -2.10662841796875, -1.9234619140625, -1.74029541015625, -1.55712890625, -1.37396240234375, -1.1907958984375, -1.00762939453125, -0.824462890625, -0.64129638671875, -0.4581298828125, -0.27496337890625, -0.091796875, 0.09136962890625, 0.2745361328125, 0.45770263671875, 0.640869140625, 0.82403564453125, 1.0072021484375, 1.19036865234375, 1.37353515625, 1.55670166015625, 1.7398681640625, 1.92303466796875, 2.106201171875, 2.28936767578125, 2.4725341796875, 2.65570068359375, 2.8388671875, 3.02203369140625, 3.2052001953125, 3.38836669921875, 3.571533203125, 3.75469970703125, 3.9378662109375, 4.12103271484375, 4.30419921875, 4.48736572265625, 4.6705322265625, 4.85369873046875, 5.036865234375, 5.22003173828125, 5.4031982421875, 5.58636474609375, 5.76953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 8.0, 23.0, 39.0, 100.0, 181.0, 232.0, 184.0, 106.0, 40.0, 22.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.771484375, -0.74224853515625, -0.7130126953125, -0.68377685546875, -0.654541015625, -0.62530517578125, -0.5960693359375, -0.56683349609375, -0.53759765625, -0.50836181640625, -0.4791259765625, -0.44989013671875, -0.420654296875, -0.39141845703125, -0.3621826171875, -0.33294677734375, -0.3037109375, -0.27447509765625, -0.2452392578125, -0.21600341796875, -0.186767578125, -0.15753173828125, -0.1282958984375, -0.09906005859375, -0.06982421875, -0.04058837890625, -0.0113525390625, 0.01788330078125, 0.047119140625, 0.07635498046875, 0.1055908203125, 0.13482666015625, 0.1640625, 0.19329833984375, 0.2225341796875, 0.25177001953125, 0.281005859375, 0.31024169921875, 0.3394775390625, 0.36871337890625, 0.39794921875, 0.42718505859375, 0.4564208984375, 0.48565673828125, 0.514892578125, 0.54412841796875, 0.5733642578125, 0.60260009765625, 0.6318359375, 0.66107177734375, 0.6903076171875, 0.71954345703125, 0.748779296875, 0.77801513671875, 0.8072509765625, 0.83648681640625, 0.86572265625, 0.89495849609375, 0.9241943359375, 0.95343017578125, 0.982666015625, 1.01190185546875, 1.0411376953125, 1.07037353515625, 1.099609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 2.0, 9.0, 9.0, 12.0, 15.0, 29.0, 34.0, 36.0, 81.0, 99.0, 124.0, 249.0, 370.0, 654.0, 1230.0, 2689.0, 6844.0, 21901.0, 87491.0, 390794.0, 407232.0, 93030.0, 22956.0, 6888.0, 2684.0, 1278.0, 681.0, 363.0, 239.0, 175.0, 93.0, 64.0, 48.0, 44.0, 25.0, 17.0, 12.0, 11.0, 9.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.48046875, -6.29541015625, -6.1103515625, -5.92529296875, -5.740234375, -5.55517578125, -5.3701171875, -5.18505859375, -5.0, -4.81494140625, -4.6298828125, -4.44482421875, -4.259765625, -4.07470703125, -3.8896484375, -3.70458984375, -3.51953125, -3.33447265625, -3.1494140625, -2.96435546875, -2.779296875, -2.59423828125, -2.4091796875, -2.22412109375, -2.0390625, -1.85400390625, -1.6689453125, -1.48388671875, -1.298828125, -1.11376953125, -0.9287109375, -0.74365234375, -0.55859375, -0.37353515625, -0.1884765625, -0.00341796875, 0.181640625, 0.36669921875, 0.5517578125, 0.73681640625, 0.921875, 1.10693359375, 1.2919921875, 1.47705078125, 1.662109375, 1.84716796875, 2.0322265625, 2.21728515625, 2.40234375, 2.58740234375, 2.7724609375, 2.95751953125, 3.142578125, 3.32763671875, 3.5126953125, 3.69775390625, 3.8828125, 4.06787109375, 4.2529296875, 4.43798828125, 4.623046875, 4.80810546875, 4.9931640625, 5.17822265625, 5.36328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 5.0, 13.0, 9.0, 19.0, 23.0, 13.0, 29.0, 29.0, 30.0, 38.0, 54.0, 45.0, 61.0, 51.0, 47.0, 39.0, 52.0, 53.0, 45.0, 42.0, 47.0, 39.0, 27.0, 19.0, 38.0, 18.0, 19.0, 16.0, 14.0, 8.0, 10.0, 4.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.95703125, -2.875640869140625, -2.79425048828125, -2.712860107421875, -2.6314697265625, -2.550079345703125, -2.46868896484375, -2.387298583984375, -2.305908203125, -2.224517822265625, -2.14312744140625, -2.061737060546875, -1.9803466796875, -1.898956298828125, -1.81756591796875, -1.736175537109375, -1.65478515625, -1.573394775390625, -1.49200439453125, -1.410614013671875, -1.3292236328125, -1.247833251953125, -1.16644287109375, -1.085052490234375, -1.003662109375, -0.922271728515625, -0.84088134765625, -0.759490966796875, -0.6781005859375, -0.596710205078125, -0.51531982421875, -0.433929443359375, -0.3525390625, -0.271148681640625, -0.18975830078125, -0.108367919921875, -0.0269775390625, 0.054412841796875, 0.13580322265625, 0.217193603515625, 0.298583984375, 0.379974365234375, 0.46136474609375, 0.542755126953125, 0.6241455078125, 0.705535888671875, 0.78692626953125, 0.868316650390625, 0.94970703125, 1.031097412109375, 1.11248779296875, 1.193878173828125, 1.2752685546875, 1.356658935546875, 1.43804931640625, 1.519439697265625, 1.600830078125, 1.682220458984375, 1.76361083984375, 1.845001220703125, 1.9263916015625, 2.007781982421875, 2.08917236328125, 2.170562744140625, 2.251953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 18.0, 21.0, 33.0, 59.0, 81.0, 131.0, 174.0, 293.0, 490.0, 840.0, 1589.0, 3063.0, 6688.0, 15785.0, 48731.0, 234242.0, 568875.0, 116137.0, 30152.0, 10957.0, 4837.0, 2325.0, 1213.0, 670.0, 405.0, 241.0, 155.0, 104.0, 62.0, 39.0, 32.0, 21.0, 19.0, 8.0, 12.0, 4.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.54296875, -6.36273193359375, -6.1824951171875, -6.00225830078125, -5.822021484375, -5.64178466796875, -5.4615478515625, -5.28131103515625, -5.10107421875, -4.92083740234375, -4.7406005859375, -4.56036376953125, -4.380126953125, -4.19989013671875, -4.0196533203125, -3.83941650390625, -3.6591796875, -3.47894287109375, -3.2987060546875, -3.11846923828125, -2.938232421875, -2.75799560546875, -2.5777587890625, -2.39752197265625, -2.21728515625, -2.03704833984375, -1.8568115234375, -1.67657470703125, -1.496337890625, -1.31610107421875, -1.1358642578125, -0.95562744140625, -0.775390625, -0.59515380859375, -0.4149169921875, -0.23468017578125, -0.054443359375, 0.12579345703125, 0.3060302734375, 0.48626708984375, 0.66650390625, 0.84674072265625, 1.0269775390625, 1.20721435546875, 1.387451171875, 1.56768798828125, 1.7479248046875, 1.92816162109375, 2.1083984375, 2.28863525390625, 2.4688720703125, 2.64910888671875, 2.829345703125, 3.00958251953125, 3.1898193359375, 3.37005615234375, 3.55029296875, 3.73052978515625, 3.9107666015625, 4.09100341796875, 4.271240234375, 4.45147705078125, 4.6317138671875, 4.81195068359375, 4.9921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 10.0, 20.0, 30.0, 47.0, 66.0, 125.0, 172.0, 162.0, 101.0, 57.0, 49.0, 41.0, 16.0, 21.0, 13.0, 7.0, 6.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000965118408203125, -0.0009358823299407959, -0.0009066462516784668, -0.0008774101734161377, -0.0008481740951538086, -0.0008189380168914795, -0.0007897019386291504, -0.0007604658603668213, -0.0007312297821044922, -0.0007019937038421631, -0.000672757625579834, -0.0006435215473175049, -0.0006142854690551758, -0.0005850493907928467, -0.0005558133125305176, -0.0005265772342681885, -0.0004973411560058594, -0.0004681050777435303, -0.00043886899948120117, -0.00040963292121887207, -0.00038039684295654297, -0.00035116076469421387, -0.00032192468643188477, -0.00029268860816955566, -0.00026345252990722656, -0.00023421645164489746, -0.00020498037338256836, -0.00017574429512023926, -0.00014650821685791016, -0.00011727213859558105, -8.803606033325195e-05, -5.879998207092285e-05, -2.956390380859375e-05, -3.2782554626464844e-07, 2.8908252716064453e-05, 5.8144330978393555e-05, 8.738040924072266e-05, 0.00011661648750305176, 0.00014585256576538086, 0.00017508864402770996, 0.00020432472229003906, 0.00023356080055236816, 0.00026279687881469727, 0.00029203295707702637, 0.00032126903533935547, 0.00035050511360168457, 0.00037974119186401367, 0.0004089772701263428, 0.0004382133483886719, 0.000467449426651001, 0.0004966855049133301, 0.0005259215831756592, 0.0005551576614379883, 0.0005843937397003174, 0.0006136298179626465, 0.0006428658962249756, 0.0006721019744873047, 0.0007013380527496338, 0.0007305741310119629, 0.000759810209274292, 0.0007890462875366211, 0.0008182823657989502, 0.0008475184440612793, 0.0008767545223236084, 0.0009059906005859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 11.0, 14.0, 15.0, 19.0, 21.0, 38.0, 64.0, 90.0, 105.0, 202.0, 323.0, 558.0, 1041.0, 2177.0, 4694.0, 12211.0, 41054.0, 301913.0, 593989.0, 62293.0, 16286.0, 5886.0, 2580.0, 1188.0, 711.0, 366.0, 233.0, 131.0, 79.0, 69.0, 52.0, 28.0, 35.0, 13.0, 13.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.947998046875, -7.70068359375, -7.453369140625, -7.2060546875, -6.958740234375, -6.71142578125, -6.464111328125, -6.216796875, -5.969482421875, -5.72216796875, -5.474853515625, -5.2275390625, -4.980224609375, -4.73291015625, -4.485595703125, -4.23828125, -3.990966796875, -3.74365234375, -3.496337890625, -3.2490234375, -3.001708984375, -2.75439453125, -2.507080078125, -2.259765625, -2.012451171875, -1.76513671875, -1.517822265625, -1.2705078125, -1.023193359375, -0.77587890625, -0.528564453125, -0.28125, -0.033935546875, 0.21337890625, 0.460693359375, 0.7080078125, 0.955322265625, 1.20263671875, 1.449951171875, 1.697265625, 1.944580078125, 2.19189453125, 2.439208984375, 2.6865234375, 2.933837890625, 3.18115234375, 3.428466796875, 3.67578125, 3.923095703125, 4.17041015625, 4.417724609375, 4.6650390625, 4.912353515625, 5.15966796875, 5.406982421875, 5.654296875, 5.901611328125, 6.14892578125, 6.396240234375, 6.6435546875, 6.890869140625, 7.13818359375, 7.385498046875, 7.6328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 13.0, 11.0, 14.0, 14.0, 22.0, 28.0, 26.0, 60.0, 86.0, 102.0, 126.0, 120.0, 94.0, 66.0, 33.0, 32.0, 23.0, 21.0, 14.0, 16.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.265625, -3.165283203125, -3.06494140625, -2.964599609375, -2.8642578125, -2.763916015625, -2.66357421875, -2.563232421875, -2.462890625, -2.362548828125, -2.26220703125, -2.161865234375, -2.0615234375, -1.961181640625, -1.86083984375, -1.760498046875, -1.66015625, -1.559814453125, -1.45947265625, -1.359130859375, -1.2587890625, -1.158447265625, -1.05810546875, -0.957763671875, -0.857421875, -0.757080078125, -0.65673828125, -0.556396484375, -0.4560546875, -0.355712890625, -0.25537109375, -0.155029296875, -0.0546875, 0.045654296875, 0.14599609375, 0.246337890625, 0.3466796875, 0.447021484375, 0.54736328125, 0.647705078125, 0.748046875, 0.848388671875, 0.94873046875, 1.049072265625, 1.1494140625, 1.249755859375, 1.35009765625, 1.450439453125, 1.55078125, 1.651123046875, 1.75146484375, 1.851806640625, 1.9521484375, 2.052490234375, 2.15283203125, 2.253173828125, 2.353515625, 2.453857421875, 2.55419921875, 2.654541015625, 2.7548828125, 2.855224609375, 2.95556640625, 3.055908203125, 3.15625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 9.0, 8.0, 13.0, 23.0, 56.0, 136.0, 213.0, 258.0, 169.0, 60.0, 34.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.481258392333984, -39.60136795043945, -37.721473693847656, -35.841583251953125, -33.961692810058594, -32.08180236816406, -30.201908111572266, -28.322017669677734, -26.44212532043457, -24.562232971191406, -22.682342529296875, -20.80245018005371, -18.922557830810547, -17.042667388916016, -15.162775039672852, -13.282883644104004, -11.402992248535156, -9.523100852966309, -7.643208980560303, -5.763317108154297, -3.883425712585449, -2.0035343170166016, -0.1236419677734375, 1.7562494277954102, 3.636140823364258, 5.5160322189331055, 7.395924091339111, 9.275815963745117, 11.155707359313965, 13.035598754882812, 14.915491104125977, 16.79538345336914, 18.675270080566406, 20.55516242980957, 22.4350528717041, 24.314945220947266, 26.194835662841797, 28.07472801208496, 29.954620361328125, 31.834510803222656, 33.71440124511719, 35.59429168701172, 37.474185943603516, 39.35407638549805, 41.23396682739258, 43.113861083984375, 44.993751525878906, 46.87364196777344, 48.753536224365234, 50.633426666259766, 52.51332092285156, 54.393211364746094, 56.273101806640625, 58.152992248535156, 60.03288650512695, 61.912776947021484, 63.79267120361328, 65.67256164550781, 67.55245208740234, 69.43234252929688, 71.31224060058594, 73.19213104248047, 75.072021484375, 76.95191192626953, 78.83180236816406]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 10.0, 12.0, 10.0, 27.0, 14.0, 31.0, 44.0, 42.0, 36.0, 37.0, 62.0, 59.0, 49.0, 62.0, 51.0, 62.0, 72.0, 49.0, 35.0, 39.0, 38.0, 30.0, 27.0, 18.0, 22.0, 9.0, 11.0, 13.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.923093795776367, -19.154081344604492, -18.385068893432617, -17.616056442260742, -16.847043991088867, -16.078033447265625, -15.309020042419434, -14.540008544921875, -13.77099609375, -13.001983642578125, -12.23297119140625, -11.463958740234375, -10.694947242736816, -9.925934791564941, -9.156922340393066, -8.387910842895508, -7.618897438049316, -6.849884986877441, -6.080873012542725, -5.31186056137085, -4.542848587036133, -3.773836135864258, -3.004823684692383, -2.235811710357666, -1.466799259185791, -0.6977869868278503, 0.07122528553009033, 0.8402376174926758, 1.6092498302459717, 2.3782620429992676, 3.1472744941711426, 3.9162864685058594, 4.685298919677734, 5.454311370849609, 6.223323345184326, 6.992335796356201, 7.761347770690918, 8.530360221862793, 9.299372673034668, 10.068384170532227, 10.837396621704102, 11.606409072875977, 12.375421524047852, 13.144433975219727, 13.913445472717285, 14.68245792388916, 15.451470375061035, 16.220481872558594, 16.98949432373047, 17.758506774902344, 18.52751922607422, 19.296531677246094, 20.06554412841797, 20.834556579589844, 21.60356903076172, 22.37257957458496, 23.14159393310547, 23.910606384277344, 24.67961883544922, 25.448631286621094, 26.21764373779297, 26.986656188964844, 27.75566864013672, 28.52467918395996, 29.293691635131836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 7.0, 12.0, 23.0, 59.0, 103.0, 188.0, 462.0, 1393.0, 6387.0, 145844.0, 4020212.0, 16420.0, 2106.0, 592.0, 244.0, 111.0, 43.0, 25.0, 15.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.372314453125, -20.55712890625, -19.741943359375, -18.9267578125, -18.111572265625, -17.29638671875, -16.481201171875, -15.666015625, -14.850830078125, -14.03564453125, -13.220458984375, -12.4052734375, -11.590087890625, -10.77490234375, -9.959716796875, -9.14453125, -8.329345703125, -7.51416015625, -6.698974609375, -5.8837890625, -5.068603515625, -4.25341796875, -3.438232421875, -2.623046875, -1.807861328125, -0.99267578125, -0.177490234375, 0.6376953125, 1.452880859375, 2.26806640625, 3.083251953125, 3.8984375, 4.713623046875, 5.52880859375, 6.343994140625, 7.1591796875, 7.974365234375, 8.78955078125, 9.604736328125, 10.419921875, 11.235107421875, 12.05029296875, 12.865478515625, 13.6806640625, 14.495849609375, 15.31103515625, 16.126220703125, 16.94140625, 17.756591796875, 18.57177734375, 19.386962890625, 20.2021484375, 21.017333984375, 21.83251953125, 22.647705078125, 23.462890625, 24.278076171875, 25.09326171875, 25.908447265625, 26.7236328125, 27.538818359375, 28.35400390625, 29.169189453125, 29.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 10.0, 29.0, 54.0, 83.0, 153.0, 202.0, 184.0, 127.0, 57.0, 41.0, 21.0, 5.0, 5.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06781005859375, -1.0291748046875, -0.99053955078125, -0.951904296875, -0.91326904296875, -0.8746337890625, -0.83599853515625, -0.79736328125, -0.75872802734375, -0.7200927734375, -0.68145751953125, -0.642822265625, -0.60418701171875, -0.5655517578125, -0.52691650390625, -0.48828125, -0.44964599609375, -0.4110107421875, -0.37237548828125, -0.333740234375, -0.29510498046875, -0.2564697265625, -0.21783447265625, -0.17919921875, -0.14056396484375, -0.1019287109375, -0.06329345703125, -0.024658203125, 0.01397705078125, 0.0526123046875, 0.09124755859375, 0.1298828125, 0.16851806640625, 0.2071533203125, 0.24578857421875, 0.284423828125, 0.32305908203125, 0.3616943359375, 0.40032958984375, 0.43896484375, 0.47760009765625, 0.5162353515625, 0.55487060546875, 0.593505859375, 0.63214111328125, 0.6707763671875, 0.70941162109375, 0.748046875, 0.78668212890625, 0.8253173828125, 0.86395263671875, 0.902587890625, 0.94122314453125, 0.9798583984375, 1.01849365234375, 1.05712890625, 1.09576416015625, 1.1343994140625, 1.17303466796875, 1.211669921875, 1.25030517578125, 1.2889404296875, 1.32757568359375, 1.3662109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 14.0, 15.0, 24.0, 31.0, 47.0, 92.0, 122.0, 252.0, 467.0, 893.0, 2000.0, 5125.0, 14209.0, 49329.0, 265451.0, 3451968.0, 322015.0, 56395.0, 16041.0, 5547.0, 2209.0, 960.0, 484.0, 240.0, 127.0, 90.0, 41.0, 38.0, 22.0, 17.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.6640625, -8.43328857421875, -8.2025146484375, -7.97174072265625, -7.740966796875, -7.51019287109375, -7.2794189453125, -7.04864501953125, -6.81787109375, -6.58709716796875, -6.3563232421875, -6.12554931640625, -5.894775390625, -5.66400146484375, -5.4332275390625, -5.20245361328125, -4.9716796875, -4.74090576171875, -4.5101318359375, -4.27935791015625, -4.048583984375, -3.81781005859375, -3.5870361328125, -3.35626220703125, -3.12548828125, -2.89471435546875, -2.6639404296875, -2.43316650390625, -2.202392578125, -1.97161865234375, -1.7408447265625, -1.51007080078125, -1.279296875, -1.04852294921875, -0.8177490234375, -0.58697509765625, -0.356201171875, -0.12542724609375, 0.1053466796875, 0.33612060546875, 0.56689453125, 0.79766845703125, 1.0284423828125, 1.25921630859375, 1.489990234375, 1.72076416015625, 1.9515380859375, 2.18231201171875, 2.4130859375, 2.64385986328125, 2.8746337890625, 3.10540771484375, 3.336181640625, 3.56695556640625, 3.7977294921875, 4.02850341796875, 4.25927734375, 4.49005126953125, 4.7208251953125, 4.95159912109375, 5.182373046875, 5.41314697265625, 5.6439208984375, 5.87469482421875, 6.10546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 12.0, 11.0, 13.0, 15.0, 36.0, 44.0, 74.0, 84.0, 132.0, 222.0, 452.0, 1610.0, 575.0, 288.0, 141.0, 102.0, 58.0, 48.0, 31.0, 31.0, 14.0, 11.0, 15.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5686492919921875, -1.526947021484375, -1.4852447509765625, -1.44354248046875, -1.4018402099609375, -1.360137939453125, -1.3184356689453125, -1.2767333984375, -1.2350311279296875, -1.193328857421875, -1.1516265869140625, -1.10992431640625, -1.0682220458984375, -1.026519775390625, -0.9848175048828125, -0.943115234375, -0.9014129638671875, -0.859710693359375, -0.8180084228515625, -0.77630615234375, -0.7346038818359375, -0.692901611328125, -0.6511993408203125, -0.6094970703125, -0.5677947998046875, -0.526092529296875, -0.4843902587890625, -0.44268798828125, -0.4009857177734375, -0.359283447265625, -0.3175811767578125, -0.27587890625, -0.2341766357421875, -0.192474365234375, -0.1507720947265625, -0.10906982421875, -0.0673675537109375, -0.025665283203125, 0.0160369873046875, 0.0577392578125, 0.0994415283203125, 0.141143798828125, 0.1828460693359375, 0.22454833984375, 0.2662506103515625, 0.307952880859375, 0.3496551513671875, 0.391357421875, 0.4330596923828125, 0.474761962890625, 0.5164642333984375, 0.55816650390625, 0.5998687744140625, 0.641571044921875, 0.6832733154296875, 0.7249755859375, 0.7666778564453125, 0.808380126953125, 0.8500823974609375, 0.89178466796875, 0.9334869384765625, 0.975189208984375, 1.0168914794921875, 1.05859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 8.0, 18.0, 30.0, 81.0, 100.0, 177.0, 197.0, 165.0, 104.0, 62.0, 28.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.885089874267578, -17.483036041259766, -17.080982208251953, -16.678926467895508, -16.276872634887695, -15.874818801879883, -15.47276496887207, -15.070710182189941, -14.668655395507812, -14.2666015625, -13.864546775817871, -13.462492942810059, -13.06043815612793, -12.658384323120117, -12.256330490112305, -11.854275703430176, -11.452221870422363, -11.05016803741455, -10.648113250732422, -10.24605941772461, -9.84400463104248, -9.441950798034668, -9.039896011352539, -8.637842178344727, -8.235788345336914, -7.833734035491943, -7.431679725646973, -7.02962589263916, -6.627571105957031, -6.225517272949219, -5.823462963104248, -5.421408653259277, -5.019352912902832, -4.617298603057861, -4.215244293212891, -3.813190221786499, -3.4111359119415283, -3.0090816020965576, -2.607027530670166, -2.2049732208251953, -1.8029189109802246, -1.400864601135254, -0.9988104104995728, -0.5967562198638916, -0.1947019100189209, 0.2073523998260498, 0.6094064712524414, 1.011460781097412, 1.4135150909423828, 1.8155694007873535, 2.217623710632324, 2.619677782058716, 3.0217320919036865, 3.4237864017486572, 3.825840473175049, 4.2278947830200195, 4.62994909286499, 5.032003402709961, 5.434057712554932, 5.836112022399902, 6.238165855407715, 6.640220642089844, 7.042274475097656, 7.444328784942627, 7.846383094787598]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 9.0, 6.0, 8.0, 14.0, 10.0, 12.0, 16.0, 18.0, 19.0, 26.0, 26.0, 22.0, 28.0, 29.0, 34.0, 35.0, 32.0, 37.0, 28.0, 38.0, 41.0, 39.0, 28.0, 39.0, 31.0, 26.0, 35.0, 34.0, 20.0, 24.0, 24.0, 32.0, 22.0, 23.0, 20.0, 14.0, 20.0, 14.0, 7.0, 5.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.4001901149749756, -3.2787041664123535, -3.1572182178497314, -3.0357322692871094, -2.914246082305908, -2.792760133743286, -2.671274185180664, -2.549788236618042, -2.42830228805542, -2.306816339492798, -2.185330390930176, -2.0638442039489746, -1.9423582553863525, -1.8208723068237305, -1.6993863582611084, -1.5779004096984863, -1.4564142227172852, -1.334928274154663, -1.2134422063827515, -1.0919562578201294, -0.9704702496528625, -0.8489842414855957, -0.7274982929229736, -0.6060122847557068, -0.48452627658843994, -0.3630402684211731, -0.24155429005622864, -0.12006831169128418, 0.001417696475982666, 0.12290370464324951, 0.24438965320587158, 0.3658756613731384, 0.4873619079589844, 0.6088479161262512, 0.7303339242935181, 0.8518198728561401, 0.973305881023407, 1.0947918891906738, 1.216277837753296, 1.337763786315918, 1.4592498540878296, 1.5807358026504517, 1.7022218704223633, 1.8237078189849854, 1.9451937675476074, 2.0666799545288086, 2.1881656646728516, 2.3096518516540527, 2.431137800216675, 2.552623748779297, 2.674109697341919, 2.795595645904541, 2.917081832885742, 3.0385677814483643, 3.1600537300109863, 3.2815396785736084, 3.4030256271362305, 3.5245115756988525, 3.6459975242614746, 3.767483711242676, 3.888969659805298, 4.01045560836792, 4.131941795349121, 4.253427505493164, 4.374913692474365]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 4.0, 12.0, 19.0, 17.0, 42.0, 46.0, 59.0, 111.0, 160.0, 237.0, 419.0, 680.0, 1180.0, 2105.0, 4493.0, 11510.0, 42890.0, 239968.0, 571687.0, 130760.0, 26437.0, 8082.0, 3373.0, 1699.0, 1022.0, 603.0, 323.0, 178.0, 151.0, 80.0, 68.0, 48.0, 23.0, 15.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.86737060546875, -5.6527099609375, -5.43804931640625, -5.223388671875, -5.00872802734375, -4.7940673828125, -4.57940673828125, -4.36474609375, -4.15008544921875, -3.9354248046875, -3.72076416015625, -3.506103515625, -3.29144287109375, -3.0767822265625, -2.86212158203125, -2.6474609375, -2.43280029296875, -2.2181396484375, -2.00347900390625, -1.788818359375, -1.57415771484375, -1.3594970703125, -1.14483642578125, -0.93017578125, -0.71551513671875, -0.5008544921875, -0.28619384765625, -0.071533203125, 0.14312744140625, 0.3577880859375, 0.57244873046875, 0.787109375, 1.00177001953125, 1.2164306640625, 1.43109130859375, 1.645751953125, 1.86041259765625, 2.0750732421875, 2.28973388671875, 2.50439453125, 2.71905517578125, 2.9337158203125, 3.14837646484375, 3.363037109375, 3.57769775390625, 3.7923583984375, 4.00701904296875, 4.2216796875, 4.43634033203125, 4.6510009765625, 4.86566162109375, 5.080322265625, 5.29498291015625, 5.5096435546875, 5.72430419921875, 5.93896484375, 6.15362548828125, 6.3682861328125, 6.58294677734375, 6.797607421875, 7.01226806640625, 7.2269287109375, 7.44158935546875, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 7.0, 11.0, 14.0, 28.0, 42.0, 75.0, 129.0, 152.0, 188.0, 125.0, 113.0, 53.0, 31.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0396575927734375, -1.001190185546875, -0.9627227783203125, -0.92425537109375, -0.8857879638671875, -0.847320556640625, -0.8088531494140625, -0.7703857421875, -0.7319183349609375, -0.693450927734375, -0.6549835205078125, -0.61651611328125, -0.5780487060546875, -0.539581298828125, -0.5011138916015625, -0.462646484375, -0.4241790771484375, -0.385711669921875, -0.3472442626953125, -0.30877685546875, -0.2703094482421875, -0.231842041015625, -0.1933746337890625, -0.1549072265625, -0.1164398193359375, -0.077972412109375, -0.0395050048828125, -0.00103759765625, 0.0374298095703125, 0.075897216796875, 0.1143646240234375, 0.15283203125, 0.1912994384765625, 0.229766845703125, 0.2682342529296875, 0.30670166015625, 0.3451690673828125, 0.383636474609375, 0.4221038818359375, 0.4605712890625, 0.4990386962890625, 0.537506103515625, 0.5759735107421875, 0.61444091796875, 0.6529083251953125, 0.691375732421875, 0.7298431396484375, 0.768310546875, 0.8067779541015625, 0.845245361328125, 0.8837127685546875, 0.92218017578125, 0.9606475830078125, 0.999114990234375, 1.0375823974609375, 1.0760498046875, 1.1145172119140625, 1.152984619140625, 1.1914520263671875, 1.22991943359375, 1.2683868408203125, 1.306854248046875, 1.3453216552734375, 1.3837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 15.0, 23.0, 38.0, 56.0, 86.0, 141.0, 256.0, 479.0, 903.0, 2403.0, 7191.0, 32804.0, 203136.0, 625222.0, 142090.0, 24083.0, 5758.0, 2002.0, 824.0, 404.0, 232.0, 134.0, 70.0, 65.0, 30.0, 18.0, 13.0, 11.0, 11.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70050048828125, -8.4400634765625, -8.17962646484375, -7.919189453125, -7.65875244140625, -7.3983154296875, -7.13787841796875, -6.87744140625, -6.61700439453125, -6.3565673828125, -6.09613037109375, -5.835693359375, -5.57525634765625, -5.3148193359375, -5.05438232421875, -4.7939453125, -4.53350830078125, -4.2730712890625, -4.01263427734375, -3.752197265625, -3.49176025390625, -3.2313232421875, -2.97088623046875, -2.71044921875, -2.45001220703125, -2.1895751953125, -1.92913818359375, -1.668701171875, -1.40826416015625, -1.1478271484375, -0.88739013671875, -0.626953125, -0.36651611328125, -0.1060791015625, 0.15435791015625, 0.414794921875, 0.67523193359375, 0.9356689453125, 1.19610595703125, 1.45654296875, 1.71697998046875, 1.9774169921875, 2.23785400390625, 2.498291015625, 2.75872802734375, 3.0191650390625, 3.27960205078125, 3.5400390625, 3.80047607421875, 4.0609130859375, 4.32135009765625, 4.581787109375, 4.84222412109375, 5.1026611328125, 5.36309814453125, 5.62353515625, 5.88397216796875, 6.1444091796875, 6.40484619140625, 6.665283203125, 6.92572021484375, 7.1861572265625, 7.44659423828125, 7.70703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 10.0, 7.0, 15.0, 15.0, 33.0, 34.0, 47.0, 40.0, 36.0, 45.0, 48.0, 62.0, 67.0, 67.0, 53.0, 53.0, 45.0, 46.0, 42.0, 31.0, 39.0, 28.0, 23.0, 14.0, 18.0, 14.0, 12.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.33526611328125, -3.2135009765625, -3.09173583984375, -2.969970703125, -2.84820556640625, -2.7264404296875, -2.60467529296875, -2.48291015625, -2.36114501953125, -2.2393798828125, -2.11761474609375, -1.995849609375, -1.87408447265625, -1.7523193359375, -1.63055419921875, -1.5087890625, -1.38702392578125, -1.2652587890625, -1.14349365234375, -1.021728515625, -0.89996337890625, -0.7781982421875, -0.65643310546875, -0.53466796875, -0.41290283203125, -0.2911376953125, -0.16937255859375, -0.047607421875, 0.07415771484375, 0.1959228515625, 0.31768798828125, 0.439453125, 0.56121826171875, 0.6829833984375, 0.80474853515625, 0.926513671875, 1.04827880859375, 1.1700439453125, 1.29180908203125, 1.41357421875, 1.53533935546875, 1.6571044921875, 1.77886962890625, 1.900634765625, 2.02239990234375, 2.1441650390625, 2.26593017578125, 2.3876953125, 2.50946044921875, 2.6312255859375, 2.75299072265625, 2.874755859375, 2.99652099609375, 3.1182861328125, 3.24005126953125, 3.36181640625, 3.48358154296875, 3.6053466796875, 3.72711181640625, 3.848876953125, 3.97064208984375, 4.0924072265625, 4.21417236328125, 4.3359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 11.0, 18.0, 26.0, 31.0, 44.0, 55.0, 80.0, 109.0, 189.0, 301.0, 474.0, 700.0, 1161.0, 2024.0, 3493.0, 6328.0, 11906.0, 25485.0, 59884.0, 169111.0, 423191.0, 211939.0, 72035.0, 29632.0, 13778.0, 7043.0, 3785.0, 2205.0, 1284.0, 780.0, 476.0, 283.0, 226.0, 134.0, 91.0, 77.0, 45.0, 30.0, 20.0, 17.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.00830078125, -2.9130859375, -2.81787109375, -2.72265625, -2.62744140625, -2.5322265625, -2.43701171875, -2.341796875, -2.24658203125, -2.1513671875, -2.05615234375, -1.9609375, -1.86572265625, -1.7705078125, -1.67529296875, -1.580078125, -1.48486328125, -1.3896484375, -1.29443359375, -1.19921875, -1.10400390625, -1.0087890625, -0.91357421875, -0.818359375, -0.72314453125, -0.6279296875, -0.53271484375, -0.4375, -0.34228515625, -0.2470703125, -0.15185546875, -0.056640625, 0.03857421875, 0.1337890625, 0.22900390625, 0.32421875, 0.41943359375, 0.5146484375, 0.60986328125, 0.705078125, 0.80029296875, 0.8955078125, 0.99072265625, 1.0859375, 1.18115234375, 1.2763671875, 1.37158203125, 1.466796875, 1.56201171875, 1.6572265625, 1.75244140625, 1.84765625, 1.94287109375, 2.0380859375, 2.13330078125, 2.228515625, 2.32373046875, 2.4189453125, 2.51416015625, 2.609375, 2.70458984375, 2.7998046875, 2.89501953125, 2.990234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 25.0, 23.0, 27.0, 56.0, 83.0, 98.0, 164.0, 130.0, 88.0, 56.0, 38.0, 31.0, 29.0, 23.0, 14.0, 16.0, 9.0, 11.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006909370422363281, -0.0006668046116828918, -0.0006426721811294556, -0.0006185397505760193, -0.000594407320022583, -0.0005702748894691467, -0.0005461424589157104, -0.0005220100283622742, -0.0004978775978088379, -0.0004737451672554016, -0.00044961273670196533, -0.00042548030614852905, -0.0004013478755950928, -0.0003772154450416565, -0.0003530830144882202, -0.00032895058393478394, -0.00030481815338134766, -0.0002806857228279114, -0.0002565532922744751, -0.00023242086172103882, -0.00020828843116760254, -0.00018415600061416626, -0.00016002357006072998, -0.0001358911395072937, -0.00011175870895385742, -8.762627840042114e-05, -6.349384784698486e-05, -3.9361417293548584e-05, -1.5228986740112305e-05, 8.903443813323975e-06, 3.3035874366760254e-05, 5.716830492019653e-05, 8.130073547363281e-05, 0.00010543316602706909, 0.00012956559658050537, 0.00015369802713394165, 0.00017783045768737793, 0.0002019628882408142, 0.0002260953187942505, 0.00025022774934768677, 0.00027436017990112305, 0.0002984926104545593, 0.0003226250410079956, 0.0003467574715614319, 0.00037088990211486816, 0.00039502233266830444, 0.0004191547632217407, 0.000443287193775177, 0.0004674196243286133, 0.0004915520548820496, 0.0005156844854354858, 0.0005398169159889221, 0.0005639493465423584, 0.0005880817770957947, 0.000612214207649231, 0.0006363466382026672, 0.0006604790687561035, 0.0006846114993095398, 0.0007087439298629761, 0.0007328763604164124, 0.0007570087909698486, 0.0007811412215232849, 0.0008052736520767212, 0.0008294060826301575, 0.0008535385131835938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 16.0, 25.0, 39.0, 41.0, 93.0, 160.0, 327.0, 676.0, 1715.0, 5229.0, 20304.0, 132743.0, 761225.0, 101652.0, 17079.0, 4424.0, 1496.0, 579.0, 292.0, 153.0, 77.0, 48.0, 32.0, 26.0, 18.0, 13.0, 5.0, 3.0, 4.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-9.0625, -8.79150390625, -8.5205078125, -8.24951171875, -7.978515625, -7.70751953125, -7.4365234375, -7.16552734375, -6.89453125, -6.62353515625, -6.3525390625, -6.08154296875, -5.810546875, -5.53955078125, -5.2685546875, -4.99755859375, -4.7265625, -4.45556640625, -4.1845703125, -3.91357421875, -3.642578125, -3.37158203125, -3.1005859375, -2.82958984375, -2.55859375, -2.28759765625, -2.0166015625, -1.74560546875, -1.474609375, -1.20361328125, -0.9326171875, -0.66162109375, -0.390625, -0.11962890625, 0.1513671875, 0.42236328125, 0.693359375, 0.96435546875, 1.2353515625, 1.50634765625, 1.77734375, 2.04833984375, 2.3193359375, 2.59033203125, 2.861328125, 3.13232421875, 3.4033203125, 3.67431640625, 3.9453125, 4.21630859375, 4.4873046875, 4.75830078125, 5.029296875, 5.30029296875, 5.5712890625, 5.84228515625, 6.11328125, 6.38427734375, 6.6552734375, 6.92626953125, 7.197265625, 7.46826171875, 7.7392578125, 8.01025390625, 8.28125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 10.0, 9.0, 19.0, 20.0, 16.0, 24.0, 32.0, 50.0, 82.0, 104.0, 135.0, 128.0, 99.0, 58.0, 42.0, 31.0, 32.0, 14.0, 17.0, 8.0, 8.0, 7.0, 5.0, 7.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.515625, -3.40191650390625, -3.2882080078125, -3.17449951171875, -3.060791015625, -2.94708251953125, -2.8333740234375, -2.71966552734375, -2.60595703125, -2.49224853515625, -2.3785400390625, -2.26483154296875, -2.151123046875, -2.03741455078125, -1.9237060546875, -1.80999755859375, -1.6962890625, -1.58258056640625, -1.4688720703125, -1.35516357421875, -1.241455078125, -1.12774658203125, -1.0140380859375, -0.90032958984375, -0.78662109375, -0.67291259765625, -0.5592041015625, -0.44549560546875, -0.331787109375, -0.21807861328125, -0.1043701171875, 0.00933837890625, 0.123046875, 0.23675537109375, 0.3504638671875, 0.46417236328125, 0.577880859375, 0.69158935546875, 0.8052978515625, 0.91900634765625, 1.03271484375, 1.14642333984375, 1.2601318359375, 1.37384033203125, 1.487548828125, 1.60125732421875, 1.7149658203125, 1.82867431640625, 1.9423828125, 2.05609130859375, 2.1697998046875, 2.28350830078125, 2.397216796875, 2.51092529296875, 2.6246337890625, 2.73834228515625, 2.85205078125, 2.96575927734375, 3.0794677734375, 3.19317626953125, 3.306884765625, 3.42059326171875, 3.5343017578125, 3.64801025390625, 3.76171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 20.0, 49.0, 117.0, 194.0, 278.0, 187.0, 90.0, 29.0, 16.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.77375411987305, -57.32360076904297, -54.87344741821289, -52.42329406738281, -49.97313690185547, -47.522987365722656, -45.07283020019531, -42.622676849365234, -40.172523498535156, -37.72237014770508, -35.272216796875, -32.82206344604492, -30.37190818786621, -27.921754837036133, -25.471599578857422, -23.021446228027344, -20.571292877197266, -18.121139526367188, -15.670985221862793, -13.220830917358398, -10.77067756652832, -8.320524215698242, -5.870369911193848, -3.420215606689453, -0.970062255859375, 1.4800915718078613, 3.9302453994750977, 6.380399227142334, 8.83055305480957, 11.280706405639648, 13.730860710144043, 16.181015014648438, 18.63116455078125, 21.081317901611328, 23.531471252441406, 25.981626510620117, 28.431779861450195, 30.881933212280273, 33.332088470458984, 35.78224182128906, 38.23239517211914, 40.68254852294922, 43.1327018737793, 45.582855224609375, 48.03301239013672, 50.48316192626953, 52.933319091796875, 55.38347244262695, 57.83362579345703, 60.28377914428711, 62.73393249511719, 65.18408966064453, 67.63423919677734, 70.08439636230469, 72.5345458984375, 74.98470306396484, 77.43486022949219, 79.88501739501953, 82.33516693115234, 84.78532409667969, 87.2354736328125, 89.68563079833984, 92.13578033447266, 94.5859375, 97.03608703613281]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 17.0, 18.0, 23.0, 13.0, 29.0, 35.0, 39.0, 35.0, 35.0, 43.0, 60.0, 58.0, 54.0, 45.0, 64.0, 51.0, 50.0, 46.0, 40.0, 37.0, 38.0, 36.0, 14.0, 27.0, 19.0, 12.0, 12.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.994770050048828, -28.134937286376953, -27.275104522705078, -26.415271759033203, -25.555437088012695, -24.69560432434082, -23.835771560668945, -22.97593879699707, -22.116104125976562, -21.256271362304688, -20.396438598632812, -19.536605834960938, -18.67677116394043, -17.816938400268555, -16.95710563659668, -16.097272872924805, -15.23744010925293, -14.377607345581055, -13.517773628234863, -12.657940864562988, -11.798107147216797, -10.938274383544922, -10.078441619873047, -9.218608856201172, -8.35877513885498, -7.498941898345947, -6.639108657836914, -5.779275894165039, -4.919442653656006, -4.059609413146973, -3.1997766494750977, -2.3399434089660645, -1.480112075805664, -0.6202789545059204, 0.23955416679382324, 1.0993871688842773, 1.9592204093933105, 2.8190536499023438, 3.6788864135742188, 4.538719654083252, 5.398552894592285, 6.258386135101318, 7.118219375610352, 7.978052139282227, 8.837884902954102, 9.697718620300293, 10.557551383972168, 11.41738510131836, 12.277217864990234, 13.13705062866211, 13.9968843460083, 14.856717109680176, 15.716550827026367, 16.576383590698242, 17.436216354370117, 18.296049118041992, 19.1558837890625, 20.015716552734375, 20.87554931640625, 21.735382080078125, 22.595216751098633, 23.455049514770508, 24.314882278442383, 25.174715042114258, 26.034547805786133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 16.0, 22.0, 58.0, 58.0, 118.0, 194.0, 324.0, 782.0, 1832.0, 5656.0, 27244.0, 626878.0, 3481757.0, 38190.0, 7131.0, 2134.0, 860.0, 436.0, 213.0, 108.0, 79.0, 49.0, 35.0, 20.0, 12.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.05926513671875, -6.7396240234375, -6.41998291015625, -6.100341796875, -5.78070068359375, -5.4610595703125, -5.14141845703125, -4.82177734375, -4.50213623046875, -4.1824951171875, -3.86285400390625, -3.543212890625, -3.22357177734375, -2.9039306640625, -2.58428955078125, -2.2646484375, -1.94500732421875, -1.6253662109375, -1.30572509765625, -0.986083984375, -0.66644287109375, -0.3468017578125, -0.02716064453125, 0.29248046875, 0.61212158203125, 0.9317626953125, 1.25140380859375, 1.571044921875, 1.89068603515625, 2.2103271484375, 2.52996826171875, 2.849609375, 3.16925048828125, 3.4888916015625, 3.80853271484375, 4.128173828125, 4.44781494140625, 4.7674560546875, 5.08709716796875, 5.40673828125, 5.72637939453125, 6.0460205078125, 6.36566162109375, 6.685302734375, 7.00494384765625, 7.3245849609375, 7.64422607421875, 7.9638671875, 8.28350830078125, 8.6031494140625, 8.92279052734375, 9.242431640625, 9.56207275390625, 9.8817138671875, 10.20135498046875, 10.52099609375, 10.84063720703125, 11.1602783203125, 11.47991943359375, 11.799560546875, 12.11920166015625, 12.4388427734375, 12.75848388671875, 13.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 16.0, 30.0, 46.0, 55.0, 95.0, 98.0, 138.0, 135.0, 111.0, 78.0, 72.0, 50.0, 25.0, 11.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.01593017578125, -0.9752197265625, -0.93450927734375, -0.893798828125, -0.85308837890625, -0.8123779296875, -0.77166748046875, -0.73095703125, -0.69024658203125, -0.6495361328125, -0.60882568359375, -0.568115234375, -0.52740478515625, -0.4866943359375, -0.44598388671875, -0.4052734375, -0.36456298828125, -0.3238525390625, -0.28314208984375, -0.242431640625, -0.20172119140625, -0.1610107421875, -0.12030029296875, -0.07958984375, -0.03887939453125, 0.0018310546875, 0.04254150390625, 0.083251953125, 0.12396240234375, 0.1646728515625, 0.20538330078125, 0.24609375, 0.28680419921875, 0.3275146484375, 0.36822509765625, 0.408935546875, 0.44964599609375, 0.4903564453125, 0.53106689453125, 0.57177734375, 0.61248779296875, 0.6531982421875, 0.69390869140625, 0.734619140625, 0.77532958984375, 0.8160400390625, 0.85675048828125, 0.8974609375, 0.93817138671875, 0.9788818359375, 1.01959228515625, 1.060302734375, 1.10101318359375, 1.1417236328125, 1.18243408203125, 1.22314453125, 1.26385498046875, 1.3045654296875, 1.34527587890625, 1.385986328125, 1.42669677734375, 1.4674072265625, 1.50811767578125, 1.548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 0.0, 7.0, 12.0, 25.0, 29.0, 42.0, 57.0, 98.0, 148.0, 222.0, 372.0, 648.0, 1113.0, 1958.0, 3672.0, 7020.0, 14395.0, 33207.0, 96828.0, 500747.0, 3151702.0, 266699.0, 66730.0, 24830.0, 11204.0, 5696.0, 2902.0, 1566.0, 906.0, 503.0, 319.0, 206.0, 140.0, 82.0, 45.0, 42.0, 34.0, 17.0, 14.0, 12.0, 14.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.18359375, -4.05010986328125, -3.9166259765625, -3.78314208984375, -3.649658203125, -3.51617431640625, -3.3826904296875, -3.24920654296875, -3.11572265625, -2.98223876953125, -2.8487548828125, -2.71527099609375, -2.581787109375, -2.44830322265625, -2.3148193359375, -2.18133544921875, -2.0478515625, -1.91436767578125, -1.7808837890625, -1.64739990234375, -1.513916015625, -1.38043212890625, -1.2469482421875, -1.11346435546875, -0.97998046875, -0.84649658203125, -0.7130126953125, -0.57952880859375, -0.446044921875, -0.31256103515625, -0.1790771484375, -0.04559326171875, 0.087890625, 0.22137451171875, 0.3548583984375, 0.48834228515625, 0.621826171875, 0.75531005859375, 0.8887939453125, 1.02227783203125, 1.15576171875, 1.28924560546875, 1.4227294921875, 1.55621337890625, 1.689697265625, 1.82318115234375, 1.9566650390625, 2.09014892578125, 2.2236328125, 2.35711669921875, 2.4906005859375, 2.62408447265625, 2.757568359375, 2.89105224609375, 3.0245361328125, 3.15802001953125, 3.29150390625, 3.42498779296875, 3.5584716796875, 3.69195556640625, 3.825439453125, 3.95892333984375, 4.0924072265625, 4.22589111328125, 4.359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 10.0, 8.0, 11.0, 16.0, 28.0, 34.0, 50.0, 67.0, 109.0, 158.0, 291.0, 731.0, 1479.0, 377.0, 212.0, 132.0, 80.0, 50.0, 57.0, 25.0, 19.0, 16.0, 14.0, 16.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9782867431640625, -0.940948486328125, -0.9036102294921875, -0.86627197265625, -0.8289337158203125, -0.791595458984375, -0.7542572021484375, -0.7169189453125, -0.6795806884765625, -0.642242431640625, -0.6049041748046875, -0.56756591796875, -0.5302276611328125, -0.492889404296875, -0.4555511474609375, -0.418212890625, -0.3808746337890625, -0.343536376953125, -0.3061981201171875, -0.26885986328125, -0.2315216064453125, -0.194183349609375, -0.1568450927734375, -0.1195068359375, -0.0821685791015625, -0.044830322265625, -0.0074920654296875, 0.02984619140625, 0.0671844482421875, 0.104522705078125, 0.1418609619140625, 0.17919921875, 0.2165374755859375, 0.253875732421875, 0.2912139892578125, 0.32855224609375, 0.3658905029296875, 0.403228759765625, 0.4405670166015625, 0.4779052734375, 0.5152435302734375, 0.552581787109375, 0.5899200439453125, 0.62725830078125, 0.6645965576171875, 0.701934814453125, 0.7392730712890625, 0.776611328125, 0.8139495849609375, 0.851287841796875, 0.8886260986328125, 0.92596435546875, 0.9633026123046875, 1.000640869140625, 1.0379791259765625, 1.0753173828125, 1.1126556396484375, 1.149993896484375, 1.1873321533203125, 1.22467041015625, 1.2620086669921875, 1.299346923828125, 1.3366851806640625, 1.3740234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 21.0, 19.0, 33.0, 67.0, 128.0, 181.0, 198.0, 145.0, 90.0, 53.0, 36.0, 14.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.241500854492188, -19.847503662109375, -19.45350456237793, -19.059507369995117, -18.665508270263672, -18.27151107788086, -17.877513885498047, -17.4835147857666, -17.08951759338379, -16.695520401000977, -16.30152130126953, -15.907524108886719, -15.51352596282959, -15.119527816772461, -14.725530624389648, -14.33153247833252, -13.93753433227539, -13.543536186218262, -13.149538040161133, -12.75554084777832, -12.361542701721191, -11.967544555664062, -11.57354736328125, -11.179549217224121, -10.785551071166992, -10.391552925109863, -9.997554779052734, -9.603557586669922, -9.209559440612793, -8.815561294555664, -8.421564102172852, -8.027565956115723, -7.633566856384277, -7.239568710327148, -6.845571041107178, -6.451573371887207, -6.057575225830078, -5.663577079772949, -5.2695794105529785, -4.875581741333008, -4.481583595275879, -4.08758544921875, -3.6935877799987793, -3.2995898723602295, -2.9055919647216797, -2.51159405708313, -2.11759614944458, -1.7235982418060303, -1.3296003341674805, -0.9356024265289307, -0.5416045188903809, -0.14760661125183105, 0.24639129638671875, 0.6403892040252686, 1.0343871116638184, 1.4283850193023682, 1.822382926940918, 2.2163808345794678, 2.6103787422180176, 3.0043766498565674, 3.398374557495117, 3.792372465133667, 4.186370372772217, 4.5803680419921875, 4.974366188049316]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 7.0, 6.0, 7.0, 7.0, 13.0, 9.0, 9.0, 13.0, 17.0, 25.0, 33.0, 25.0, 30.0, 35.0, 48.0, 49.0, 45.0, 45.0, 54.0, 41.0, 64.0, 50.0, 41.0, 37.0, 48.0, 28.0, 42.0, 25.0, 28.0, 18.0, 23.0, 20.0, 18.0, 7.0, 14.0, 6.0, 10.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.262031316757202, -3.100661277770996, -2.93929123878479, -2.777921199798584, -2.616550922393799, -2.455181121826172, -2.2938108444213867, -2.1324408054351807, -1.9710707664489746, -1.8097007274627686, -1.6483306884765625, -1.486960530281067, -1.3255904912948608, -1.1642204523086548, -1.0028502941131592, -0.8414802551269531, -0.6801102161407471, -0.518740177154541, -0.3573700785636902, -0.19600000977516174, -0.0346299409866333, 0.12674009799957275, 0.2881101965904236, 0.4494802951812744, 0.6108503341674805, 0.7722203731536865, 0.9335904717445374, 1.0949605703353882, 1.2563306093215942, 1.4177006483078003, 1.579070806503296, 1.740440845489502, 1.901810646057129, 2.063180685043335, 2.224550724029541, 2.385920763015747, 2.547290802001953, 2.7086610794067383, 2.8700311183929443, 3.0314011573791504, 3.1927711963653564, 3.3541412353515625, 3.5155112743377686, 3.6768813133239746, 3.8382515907287598, 3.9996213912963867, 4.160991668701172, 4.322361946105957, 4.483731746673584, 4.645102024078369, 4.806471824645996, 4.967842102050781, 5.129211902618408, 5.290582180023193, 5.45195198059082, 5.6133222579956055, 5.774692535400391, 5.936062812805176, 6.097432613372803, 6.258802890777588, 6.420172691345215, 6.58154296875, 6.742912769317627, 6.904283046722412, 7.065652847290039]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 9.0, 4.0, 6.0, 14.0, 21.0, 28.0, 36.0, 59.0, 66.0, 125.0, 157.0, 253.0, 430.0, 605.0, 1049.0, 1742.0, 3388.0, 7162.0, 17812.0, 50655.0, 161836.0, 431787.0, 249894.0, 75936.0, 25553.0, 9890.0, 4519.0, 2169.0, 1207.0, 745.0, 444.0, 291.0, 222.0, 117.0, 95.0, 71.0, 29.0, 29.0, 25.0, 11.0, 14.0, 10.0, 11.0, 4.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.8125, -4.66961669921875, -4.5267333984375, -4.38385009765625, -4.240966796875, -4.09808349609375, -3.9552001953125, -3.81231689453125, -3.66943359375, -3.52655029296875, -3.3836669921875, -3.24078369140625, -3.097900390625, -2.95501708984375, -2.8121337890625, -2.66925048828125, -2.5263671875, -2.38348388671875, -2.2406005859375, -2.09771728515625, -1.954833984375, -1.81195068359375, -1.6690673828125, -1.52618408203125, -1.38330078125, -1.24041748046875, -1.0975341796875, -0.95465087890625, -0.811767578125, -0.66888427734375, -0.5260009765625, -0.38311767578125, -0.240234375, -0.09735107421875, 0.0455322265625, 0.18841552734375, 0.331298828125, 0.47418212890625, 0.6170654296875, 0.75994873046875, 0.90283203125, 1.04571533203125, 1.1885986328125, 1.33148193359375, 1.474365234375, 1.61724853515625, 1.7601318359375, 1.90301513671875, 2.0458984375, 2.18878173828125, 2.3316650390625, 2.47454833984375, 2.617431640625, 2.76031494140625, 2.9031982421875, 3.04608154296875, 3.18896484375, 3.33184814453125, 3.4747314453125, 3.61761474609375, 3.760498046875, 3.90338134765625, 4.0462646484375, 4.18914794921875, 4.33203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 4.0, 3.0, 5.0, 10.0, 12.0, 25.0, 30.0, 69.0, 70.0, 91.0, 117.0, 131.0, 112.0, 94.0, 84.0, 55.0, 36.0, 31.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.062347412109375, -1.02215576171875, -0.981964111328125, -0.9417724609375, -0.901580810546875, -0.86138916015625, -0.821197509765625, -0.781005859375, -0.740814208984375, -0.70062255859375, -0.660430908203125, -0.6202392578125, -0.580047607421875, -0.53985595703125, -0.499664306640625, -0.45947265625, -0.419281005859375, -0.37908935546875, -0.338897705078125, -0.2987060546875, -0.258514404296875, -0.21832275390625, -0.178131103515625, -0.137939453125, -0.097747802734375, -0.05755615234375, -0.017364501953125, 0.0228271484375, 0.063018798828125, 0.10321044921875, 0.143402099609375, 0.18359375, 0.223785400390625, 0.26397705078125, 0.304168701171875, 0.3443603515625, 0.384552001953125, 0.42474365234375, 0.464935302734375, 0.505126953125, 0.545318603515625, 0.58551025390625, 0.625701904296875, 0.6658935546875, 0.706085205078125, 0.74627685546875, 0.786468505859375, 0.82666015625, 0.866851806640625, 0.90704345703125, 0.947235107421875, 0.9874267578125, 1.027618408203125, 1.06781005859375, 1.108001708984375, 1.148193359375, 1.188385009765625, 1.22857666015625, 1.268768310546875, 1.3089599609375, 1.349151611328125, 1.38934326171875, 1.429534912109375, 1.4697265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 1.0, 6.0, 4.0, 4.0, 11.0, 15.0, 25.0, 39.0, 40.0, 86.0, 137.0, 210.0, 366.0, 739.0, 1474.0, 3810.0, 12596.0, 52643.0, 259240.0, 532264.0, 142092.0, 29710.0, 7937.0, 2642.0, 1102.0, 556.0, 264.0, 178.0, 102.0, 80.0, 61.0, 30.0, 20.0, 18.0, 13.0, 10.0, 9.0, 1.0, 2.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.6798095703125, -5.492431640625, -5.3050537109375, -5.11767578125, -4.9302978515625, -4.742919921875, -4.5555419921875, -4.3681640625, -4.1807861328125, -3.993408203125, -3.8060302734375, -3.61865234375, -3.4312744140625, -3.243896484375, -3.0565185546875, -2.869140625, -2.6817626953125, -2.494384765625, -2.3070068359375, -2.11962890625, -1.9322509765625, -1.744873046875, -1.5574951171875, -1.3701171875, -1.1827392578125, -0.995361328125, -0.8079833984375, -0.62060546875, -0.4332275390625, -0.245849609375, -0.0584716796875, 0.12890625, 0.3162841796875, 0.503662109375, 0.6910400390625, 0.87841796875, 1.0657958984375, 1.253173828125, 1.4405517578125, 1.6279296875, 1.8153076171875, 2.002685546875, 2.1900634765625, 2.37744140625, 2.5648193359375, 2.752197265625, 2.9395751953125, 3.126953125, 3.3143310546875, 3.501708984375, 3.6890869140625, 3.87646484375, 4.0638427734375, 4.251220703125, 4.4385986328125, 4.6259765625, 4.8133544921875, 5.000732421875, 5.1881103515625, 5.37548828125, 5.5628662109375, 5.750244140625, 5.9376220703125, 6.125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 11.0, 9.0, 10.0, 15.0, 15.0, 29.0, 17.0, 32.0, 40.0, 39.0, 40.0, 50.0, 44.0, 34.0, 43.0, 44.0, 56.0, 48.0, 46.0, 34.0, 46.0, 37.0, 36.0, 36.0, 18.0, 22.0, 27.0, 19.0, 12.0, 19.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.604583740234375, -3.49237060546875, -3.380157470703125, -3.2679443359375, -3.155731201171875, -3.04351806640625, -2.931304931640625, -2.819091796875, -2.706878662109375, -2.59466552734375, -2.482452392578125, -2.3702392578125, -2.258026123046875, -2.14581298828125, -2.033599853515625, -1.92138671875, -1.809173583984375, -1.69696044921875, -1.584747314453125, -1.4725341796875, -1.360321044921875, -1.24810791015625, -1.135894775390625, -1.023681640625, -0.911468505859375, -0.79925537109375, -0.687042236328125, -0.5748291015625, -0.462615966796875, -0.35040283203125, -0.238189697265625, -0.1259765625, -0.013763427734375, 0.09844970703125, 0.210662841796875, 0.3228759765625, 0.435089111328125, 0.54730224609375, 0.659515380859375, 0.771728515625, 0.883941650390625, 0.99615478515625, 1.108367919921875, 1.2205810546875, 1.332794189453125, 1.44500732421875, 1.557220458984375, 1.66943359375, 1.781646728515625, 1.89385986328125, 2.006072998046875, 2.1182861328125, 2.230499267578125, 2.34271240234375, 2.454925537109375, 2.567138671875, 2.679351806640625, 2.79156494140625, 2.903778076171875, 3.0159912109375, 3.128204345703125, 3.24041748046875, 3.352630615234375, 3.46484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 9.0, 19.0, 41.0, 40.0, 68.0, 103.0, 179.0, 287.0, 505.0, 983.0, 1942.0, 3864.0, 9139.0, 21850.0, 61417.0, 198992.0, 431662.0, 211673.0, 64951.0, 23139.0, 9180.0, 4166.0, 1977.0, 974.0, 528.0, 315.0, 183.0, 110.0, 64.0, 55.0, 36.0, 18.0, 23.0, 13.0, 6.0, 10.0, 3.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.33258056640625, -2.2608642578125, -2.18914794921875, -2.117431640625, -2.04571533203125, -1.9739990234375, -1.90228271484375, -1.83056640625, -1.75885009765625, -1.6871337890625, -1.61541748046875, -1.543701171875, -1.47198486328125, -1.4002685546875, -1.32855224609375, -1.2568359375, -1.18511962890625, -1.1134033203125, -1.04168701171875, -0.969970703125, -0.89825439453125, -0.8265380859375, -0.75482177734375, -0.68310546875, -0.61138916015625, -0.5396728515625, -0.46795654296875, -0.396240234375, -0.32452392578125, -0.2528076171875, -0.18109130859375, -0.109375, -0.03765869140625, 0.0340576171875, 0.10577392578125, 0.177490234375, 0.24920654296875, 0.3209228515625, 0.39263916015625, 0.46435546875, 0.53607177734375, 0.6077880859375, 0.67950439453125, 0.751220703125, 0.82293701171875, 0.8946533203125, 0.96636962890625, 1.0380859375, 1.10980224609375, 1.1815185546875, 1.25323486328125, 1.324951171875, 1.39666748046875, 1.4683837890625, 1.54010009765625, 1.61181640625, 1.68353271484375, 1.7552490234375, 1.82696533203125, 1.898681640625, 1.97039794921875, 2.0421142578125, 2.11383056640625, 2.185546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 6.0, 11.0, 18.0, 14.0, 22.0, 18.0, 40.0, 40.0, 62.0, 83.0, 96.0, 142.0, 103.0, 86.0, 62.0, 43.0, 36.0, 20.0, 19.0, 15.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006465911865234375, -0.0006297975778579712, -0.0006130039691925049, -0.0005962103605270386, -0.0005794167518615723, -0.000562623143196106, -0.0005458295345306396, -0.0005290359258651733, -0.000512242317199707, -0.0004954487085342407, -0.0004786550998687744, -0.0004618614912033081, -0.0004450678825378418, -0.0004282742738723755, -0.0004114806652069092, -0.00039468705654144287, -0.00037789344787597656, -0.00036109983921051025, -0.00034430623054504395, -0.00032751262187957764, -0.00031071901321411133, -0.000293925404548645, -0.0002771317958831787, -0.0002603381872177124, -0.0002435445785522461, -0.00022675096988677979, -0.00020995736122131348, -0.00019316375255584717, -0.00017637014389038086, -0.00015957653522491455, -0.00014278292655944824, -0.00012598931789398193, -0.00010919570922851562, -9.240210056304932e-05, -7.560849189758301e-05, -5.88148832321167e-05, -4.202127456665039e-05, -2.5227665901184082e-05, -8.434057235717773e-06, 8.359551429748535e-06, 2.5153160095214844e-05, 4.194676876068115e-05, 5.874037742614746e-05, 7.553398609161377e-05, 9.232759475708008e-05, 0.00010912120342254639, 0.0001259148120880127, 0.000142708420753479, 0.0001595020294189453, 0.00017629563808441162, 0.00019308924674987793, 0.00020988285541534424, 0.00022667646408081055, 0.00024347007274627686, 0.00026026368141174316, 0.00027705729007720947, 0.0002938508987426758, 0.0003106445074081421, 0.0003274381160736084, 0.0003442317247390747, 0.000361025333404541, 0.0003778189420700073, 0.00039461255073547363, 0.00041140615940093994, 0.00042819976806640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 17.0, 26.0, 33.0, 81.0, 136.0, 283.0, 661.0, 1782.0, 6038.0, 29931.0, 266575.0, 653319.0, 72826.0, 12132.0, 2916.0, 952.0, 397.0, 175.0, 104.0, 55.0, 27.0, 20.0, 13.0, 9.0, 5.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4493408203125, -4.297119140625, -4.1448974609375, -3.99267578125, -3.8404541015625, -3.688232421875, -3.5360107421875, -3.3837890625, -3.2315673828125, -3.079345703125, -2.9271240234375, -2.77490234375, -2.6226806640625, -2.470458984375, -2.3182373046875, -2.166015625, -2.0137939453125, -1.861572265625, -1.7093505859375, -1.55712890625, -1.4049072265625, -1.252685546875, -1.1004638671875, -0.9482421875, -0.7960205078125, -0.643798828125, -0.4915771484375, -0.33935546875, -0.1871337890625, -0.034912109375, 0.1173095703125, 0.26953125, 0.4217529296875, 0.573974609375, 0.7261962890625, 0.87841796875, 1.0306396484375, 1.182861328125, 1.3350830078125, 1.4873046875, 1.6395263671875, 1.791748046875, 1.9439697265625, 2.09619140625, 2.2484130859375, 2.400634765625, 2.5528564453125, 2.705078125, 2.8572998046875, 3.009521484375, 3.1617431640625, 3.31396484375, 3.4661865234375, 3.618408203125, 3.7706298828125, 3.9228515625, 4.0750732421875, 4.227294921875, 4.3795166015625, 4.53173828125, 4.6839599609375, 4.836181640625, 4.9884033203125, 5.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 5.0, 8.0, 4.0, 10.0, 8.0, 10.0, 18.0, 20.0, 14.0, 23.0, 36.0, 46.0, 56.0, 59.0, 63.0, 81.0, 86.0, 67.0, 83.0, 55.0, 55.0, 41.0, 32.0, 30.0, 18.0, 14.0, 10.0, 15.0, 7.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6953125, -1.63916015625, -1.5830078125, -1.52685546875, -1.470703125, -1.41455078125, -1.3583984375, -1.30224609375, -1.24609375, -1.18994140625, -1.1337890625, -1.07763671875, -1.021484375, -0.96533203125, -0.9091796875, -0.85302734375, -0.796875, -0.74072265625, -0.6845703125, -0.62841796875, -0.572265625, -0.51611328125, -0.4599609375, -0.40380859375, -0.34765625, -0.29150390625, -0.2353515625, -0.17919921875, -0.123046875, -0.06689453125, -0.0107421875, 0.04541015625, 0.1015625, 0.15771484375, 0.2138671875, 0.27001953125, 0.326171875, 0.38232421875, 0.4384765625, 0.49462890625, 0.55078125, 0.60693359375, 0.6630859375, 0.71923828125, 0.775390625, 0.83154296875, 0.8876953125, 0.94384765625, 1.0, 1.05615234375, 1.1123046875, 1.16845703125, 1.224609375, 1.28076171875, 1.3369140625, 1.39306640625, 1.44921875, 1.50537109375, 1.5615234375, 1.61767578125, 1.673828125, 1.72998046875, 1.7861328125, 1.84228515625, 1.8984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 10.0, 25.0, 46.0, 86.0, 192.0, 213.0, 219.0, 107.0, 70.0, 21.0, 13.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.60674285888672, -48.90692901611328, -47.20711898803711, -45.50730514526367, -43.807491302490234, -42.10768127441406, -40.407867431640625, -38.70805358886719, -37.00823974609375, -35.30842590332031, -33.60861587524414, -31.908802032470703, -30.208988189697266, -28.50917625427246, -26.809364318847656, -25.10955047607422, -23.409740447998047, -21.709928512573242, -20.010114669799805, -18.310302734375, -16.610488891601562, -14.910676956176758, -13.210865020751953, -11.511052131652832, -9.811239242553711, -8.11142635345459, -6.411613941192627, -4.711801528930664, -3.011988639831543, -1.3121757507324219, 0.3876361846923828, 2.087449073791504, 3.7872581481933594, 5.4870710372924805, 7.186883449554443, 8.886695861816406, 10.586508750915527, 12.286321640014648, 13.986133575439453, 15.685946464538574, 17.385759353637695, 19.0855712890625, 20.785385131835938, 22.485197067260742, 24.185009002685547, 25.884822845458984, 27.58463478088379, 29.284446716308594, 30.98426055908203, 32.68407440185547, 34.38388442993164, 36.08369827270508, 37.783512115478516, 39.48332214355469, 41.183135986328125, 42.88294982910156, 44.582763671875, 46.28257751464844, 47.98238754272461, 49.68220138549805, 51.382015228271484, 53.081825256347656, 54.781639099121094, 56.48145294189453, 58.1812629699707]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 18.0, 12.0, 16.0, 16.0, 17.0, 28.0, 28.0, 34.0, 31.0, 49.0, 33.0, 40.0, 49.0, 51.0, 39.0, 40.0, 40.0, 35.0, 45.0, 32.0, 35.0, 28.0, 22.0, 30.0, 16.0, 28.0, 23.0, 18.0, 14.0, 15.0, 12.0, 9.0, 10.0, 5.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.762094497680664, -18.190765380859375, -17.61943817138672, -17.04810905456543, -16.47677993774414, -15.905450820922852, -15.334122657775879, -14.762794494628906, -14.191465377807617, -13.620136260986328, -13.048808097839355, -12.477479934692383, -11.906150817871094, -11.334821701049805, -10.763493537902832, -10.19216537475586, -9.62083625793457, -9.049507141113281, -8.478178977966309, -7.906850337982178, -7.335521697998047, -6.764193058013916, -6.192864418029785, -5.621535778045654, -5.050207138061523, -4.478878498077393, -3.9075498580932617, -3.336221218109131, -2.764892578125, -2.193563938140869, -1.6222352981567383, -1.0509066581726074, -0.47957611083984375, 0.09175252914428711, 0.663081169128418, 1.2344098091125488, 1.8057384490966797, 2.3770670890808105, 2.9483957290649414, 3.5197243690490723, 4.091053009033203, 4.662381649017334, 5.233710289001465, 5.805038928985596, 6.376367568969727, 6.947696208953857, 7.519024848937988, 8.090353012084961, 8.66168212890625, 9.233011245727539, 9.804339408874512, 10.375667572021484, 10.946996688842773, 11.518325805664062, 12.089653968811035, 12.660982131958008, 13.232311248779297, 13.803640365600586, 14.374968528747559, 14.946296691894531, 15.51762580871582, 16.08895492553711, 16.660282135009766, 17.231611251831055, 17.802940368652344]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 10.0, 5.0, 16.0, 18.0, 32.0, 58.0, 124.0, 172.0, 375.0, 849.0, 2433.0, 8437.0, 52844.0, 3877006.0, 226523.0, 18629.0, 4189.0, 1348.0, 567.0, 281.0, 147.0, 85.0, 49.0, 26.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.73583984375, -8.4091796875, -8.08251953125, -7.755859375, -7.42919921875, -7.1025390625, -6.77587890625, -6.44921875, -6.12255859375, -5.7958984375, -5.46923828125, -5.142578125, -4.81591796875, -4.4892578125, -4.16259765625, -3.8359375, -3.50927734375, -3.1826171875, -2.85595703125, -2.529296875, -2.20263671875, -1.8759765625, -1.54931640625, -1.22265625, -0.89599609375, -0.5693359375, -0.24267578125, 0.083984375, 0.41064453125, 0.7373046875, 1.06396484375, 1.390625, 1.71728515625, 2.0439453125, 2.37060546875, 2.697265625, 3.02392578125, 3.3505859375, 3.67724609375, 4.00390625, 4.33056640625, 4.6572265625, 4.98388671875, 5.310546875, 5.63720703125, 5.9638671875, 6.29052734375, 6.6171875, 6.94384765625, 7.2705078125, 7.59716796875, 7.923828125, 8.25048828125, 8.5771484375, 8.90380859375, 9.23046875, 9.55712890625, 9.8837890625, 10.21044921875, 10.537109375, 10.86376953125, 11.1904296875, 11.51708984375, 11.84375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 11.0, 12.0, 16.0, 36.0, 45.0, 67.0, 69.0, 85.0, 101.0, 114.0, 95.0, 91.0, 74.0, 57.0, 48.0, 27.0, 15.0, 16.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.2063446044921875, -1.166595458984375, -1.1268463134765625, -1.08709716796875, -1.0473480224609375, -1.007598876953125, -0.9678497314453125, -0.9281005859375, -0.8883514404296875, -0.848602294921875, -0.8088531494140625, -0.76910400390625, -0.7293548583984375, -0.689605712890625, -0.6498565673828125, -0.610107421875, -0.5703582763671875, -0.530609130859375, -0.4908599853515625, -0.45111083984375, -0.4113616943359375, -0.371612548828125, -0.3318634033203125, -0.2921142578125, -0.2523651123046875, -0.212615966796875, -0.1728668212890625, -0.13311767578125, -0.0933685302734375, -0.053619384765625, -0.0138702392578125, 0.02587890625, 0.0656280517578125, 0.105377197265625, 0.1451263427734375, 0.18487548828125, 0.2246246337890625, 0.264373779296875, 0.3041229248046875, 0.3438720703125, 0.3836212158203125, 0.423370361328125, 0.4631195068359375, 0.50286865234375, 0.5426177978515625, 0.582366943359375, 0.6221160888671875, 0.661865234375, 0.7016143798828125, 0.741363525390625, 0.7811126708984375, 0.82086181640625, 0.8606109619140625, 0.900360107421875, 0.9401092529296875, 0.9798583984375, 1.0196075439453125, 1.059356689453125, 1.0991058349609375, 1.13885498046875, 1.1786041259765625, 1.218353271484375, 1.2581024169921875, 1.2978515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 8.0, 11.0, 29.0, 43.0, 83.0, 104.0, 164.0, 272.0, 429.0, 768.0, 1307.0, 2433.0, 5325.0, 12096.0, 31155.0, 106755.0, 858664.0, 2940553.0, 161164.0, 42999.0, 15817.0, 6814.0, 3344.0, 1757.0, 933.0, 496.0, 281.0, 195.0, 98.0, 58.0, 37.0, 23.0, 25.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.29296875, -5.150421142578125, -5.00787353515625, -4.865325927734375, -4.7227783203125, -4.580230712890625, -4.43768310546875, -4.295135498046875, -4.152587890625, -4.010040283203125, -3.86749267578125, -3.724945068359375, -3.5823974609375, -3.439849853515625, -3.29730224609375, -3.154754638671875, -3.01220703125, -2.869659423828125, -2.72711181640625, -2.584564208984375, -2.4420166015625, -2.299468994140625, -2.15692138671875, -2.014373779296875, -1.871826171875, -1.729278564453125, -1.58673095703125, -1.444183349609375, -1.3016357421875, -1.159088134765625, -1.01654052734375, -0.873992919921875, -0.7314453125, -0.588897705078125, -0.44635009765625, -0.303802490234375, -0.1612548828125, -0.018707275390625, 0.12384033203125, 0.266387939453125, 0.408935546875, 0.551483154296875, 0.69403076171875, 0.836578369140625, 0.9791259765625, 1.121673583984375, 1.26422119140625, 1.406768798828125, 1.54931640625, 1.691864013671875, 1.83441162109375, 1.976959228515625, 2.1195068359375, 2.262054443359375, 2.40460205078125, 2.547149658203125, 2.689697265625, 2.832244873046875, 2.97479248046875, 3.117340087890625, 3.2598876953125, 3.402435302734375, 3.54498291015625, 3.687530517578125, 3.830078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 12.0, 12.0, 18.0, 29.0, 24.0, 50.0, 51.0, 90.0, 149.0, 234.0, 600.0, 1646.0, 481.0, 199.0, 146.0, 76.0, 60.0, 38.0, 31.0, 26.0, 16.0, 9.0, 22.0, 10.0, 0.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.3683929443359375, -1.328582763671875, -1.2887725830078125, -1.24896240234375, -1.2091522216796875, -1.169342041015625, -1.1295318603515625, -1.0897216796875, -1.0499114990234375, -1.010101318359375, -0.9702911376953125, -0.93048095703125, -0.8906707763671875, -0.850860595703125, -0.8110504150390625, -0.771240234375, -0.7314300537109375, -0.691619873046875, -0.6518096923828125, -0.61199951171875, -0.5721893310546875, -0.532379150390625, -0.4925689697265625, -0.4527587890625, -0.4129486083984375, -0.373138427734375, -0.3333282470703125, -0.29351806640625, -0.2537078857421875, -0.213897705078125, -0.1740875244140625, -0.13427734375, -0.0944671630859375, -0.054656982421875, -0.0148468017578125, 0.02496337890625, 0.0647735595703125, 0.104583740234375, 0.1443939208984375, 0.1842041015625, 0.2240142822265625, 0.263824462890625, 0.3036346435546875, 0.34344482421875, 0.3832550048828125, 0.423065185546875, 0.4628753662109375, 0.502685546875, 0.5424957275390625, 0.582305908203125, 0.6221160888671875, 0.66192626953125, 0.7017364501953125, 0.741546630859375, 0.7813568115234375, 0.8211669921875, 0.8609771728515625, 0.900787353515625, 0.9405975341796875, 0.98040771484375, 1.0202178955078125, 1.060028076171875, 1.0998382568359375, 1.1396484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 23.0, 39.0, 103.0, 199.0, 244.0, 201.0, 122.0, 43.0, 14.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.255008697509766, -8.690715789794922, -8.126422882080078, -7.562129974365234, -6.997837066650391, -6.433544158935547, -5.869251251220703, -5.304958343505859, -4.740665435791016, -4.176372528076172, -3.612079620361328, -3.0477867126464844, -2.4834938049316406, -1.9192008972167969, -1.3549079895019531, -0.7906150817871094, -0.22632217407226562, 0.3379707336425781, 0.9022636413574219, 1.4665565490722656, 2.0308494567871094, 2.595142364501953, 3.159435272216797, 3.7237281799316406, 4.288021087646484, 4.852313995361328, 5.416606903076172, 5.980899810791016, 6.545192718505859, 7.109485626220703, 7.673778533935547, 8.23807144165039, 8.802366256713867, 9.366659164428711, 9.930952072143555, 10.495244979858398, 11.059537887573242, 11.623830795288086, 12.18812370300293, 12.752416610717773, 13.316709518432617, 13.881002426147461, 14.445295333862305, 15.009588241577148, 15.573881149291992, 16.138174057006836, 16.70246696472168, 17.266759872436523, 17.831052780151367, 18.39534568786621, 18.959638595581055, 19.5239315032959, 20.088224411010742, 20.652517318725586, 21.21681022644043, 21.781103134155273, 22.345396041870117, 22.90968894958496, 23.473981857299805, 24.03827476501465, 24.602567672729492, 25.166860580444336, 25.73115348815918, 26.295446395874023, 26.859739303588867]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 8.0, 7.0, 13.0, 5.0, 13.0, 16.0, 19.0, 19.0, 16.0, 12.0, 25.0, 40.0, 30.0, 34.0, 48.0, 34.0, 49.0, 39.0, 49.0, 55.0, 48.0, 54.0, 43.0, 44.0, 34.0, 33.0, 27.0, 23.0, 31.0, 15.0, 20.0, 19.0, 11.0, 15.0, 9.0, 11.0, 8.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.036235809326172, -4.883856296539307, -4.7314772605896, -4.579097747802734, -4.426718711853027, -4.274339199066162, -4.121959686279297, -3.9695804119110107, -3.8172011375427246, -3.6648218631744385, -3.5124425888061523, -3.360063076019287, -3.207683801651001, -3.055304527282715, -2.9029250144958496, -2.7505457401275635, -2.5981664657592773, -2.445787191390991, -2.293407917022705, -2.14102840423584, -1.9886491298675537, -1.8362698554992676, -1.683890461921692, -1.5315110683441162, -1.37913179397583, -1.226752519607544, -1.0743731260299683, -0.9219937920570374, -0.7696144580841064, -0.6172351241111755, -0.46485579013824463, -0.31247639656066895, -0.1600966453552246, -0.007717311382293701, 0.1446620225906372, 0.2970413565635681, 0.449420690536499, 0.6018000245094299, 0.7541793584823608, 0.9065587520599365, 1.0589380264282227, 1.2113173007965088, 1.3636966943740845, 1.5160760879516602, 1.6684553623199463, 1.8208346366882324, 1.973214030265808, 2.125593423843384, 2.27797269821167, 2.430351972579956, 2.582731246948242, 2.7351107597351074, 2.8874900341033936, 3.0398693084716797, 3.192248821258545, 3.344628095626831, 3.497007369995117, 3.6493866443634033, 3.8017659187316895, 3.9541454315185547, 4.106524467468262, 4.258903980255127, 4.411283493041992, 4.563662528991699, 4.7160420417785645]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 12.0, 20.0, 21.0, 35.0, 56.0, 67.0, 138.0, 224.0, 403.0, 637.0, 1264.0, 2524.0, 5935.0, 16749.0, 58984.0, 249263.0, 507625.0, 147737.0, 36771.0, 11397.0, 4421.0, 1929.0, 949.0, 570.0, 303.0, 177.0, 116.0, 73.0, 44.0, 39.0, 17.0, 9.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.71539306640625, -4.5362548828125, -4.35711669921875, -4.177978515625, -3.99884033203125, -3.8197021484375, -3.64056396484375, -3.46142578125, -3.28228759765625, -3.1031494140625, -2.92401123046875, -2.744873046875, -2.56573486328125, -2.3865966796875, -2.20745849609375, -2.0283203125, -1.84918212890625, -1.6700439453125, -1.49090576171875, -1.311767578125, -1.13262939453125, -0.9534912109375, -0.77435302734375, -0.59521484375, -0.41607666015625, -0.2369384765625, -0.05780029296875, 0.121337890625, 0.30047607421875, 0.4796142578125, 0.65875244140625, 0.837890625, 1.01702880859375, 1.1961669921875, 1.37530517578125, 1.554443359375, 1.73358154296875, 1.9127197265625, 2.09185791015625, 2.27099609375, 2.45013427734375, 2.6292724609375, 2.80841064453125, 2.987548828125, 3.16668701171875, 3.3458251953125, 3.52496337890625, 3.7041015625, 3.88323974609375, 4.0623779296875, 4.24151611328125, 4.420654296875, 4.59979248046875, 4.7789306640625, 4.95806884765625, 5.13720703125, 5.31634521484375, 5.4954833984375, 5.67462158203125, 5.853759765625, 6.03289794921875, 6.2120361328125, 6.39117431640625, 6.5703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 9.0, 14.0, 21.0, 26.0, 60.0, 52.0, 63.0, 68.0, 95.0, 99.0, 99.0, 88.0, 77.0, 61.0, 51.0, 32.0, 25.0, 21.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.0929718017578125, -1.056060791015625, -1.0191497802734375, -0.98223876953125, -0.9453277587890625, -0.908416748046875, -0.8715057373046875, -0.8345947265625, -0.7976837158203125, -0.760772705078125, -0.7238616943359375, -0.68695068359375, -0.6500396728515625, -0.613128662109375, -0.5762176513671875, -0.539306640625, -0.5023956298828125, -0.465484619140625, -0.4285736083984375, -0.39166259765625, -0.3547515869140625, -0.317840576171875, -0.2809295654296875, -0.2440185546875, -0.2071075439453125, -0.170196533203125, -0.1332855224609375, -0.09637451171875, -0.0594635009765625, -0.022552490234375, 0.0143585205078125, 0.05126953125, 0.0881805419921875, 0.125091552734375, 0.1620025634765625, 0.19891357421875, 0.2358245849609375, 0.272735595703125, 0.3096466064453125, 0.3465576171875, 0.3834686279296875, 0.420379638671875, 0.4572906494140625, 0.49420166015625, 0.5311126708984375, 0.568023681640625, 0.6049346923828125, 0.641845703125, 0.6787567138671875, 0.715667724609375, 0.7525787353515625, 0.78948974609375, 0.8264007568359375, 0.863311767578125, 0.9002227783203125, 0.9371337890625, 0.9740447998046875, 1.010955810546875, 1.0478668212890625, 1.08477783203125, 1.1216888427734375, 1.158599853515625, 1.1955108642578125, 1.232421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 7.0, 6.0, 14.0, 12.0, 16.0, 13.0, 32.0, 33.0, 51.0, 77.0, 127.0, 221.0, 357.0, 604.0, 1232.0, 3127.0, 10091.0, 45702.0, 255098.0, 563580.0, 132593.0, 24930.0, 6258.0, 2169.0, 953.0, 485.0, 281.0, 167.0, 92.0, 60.0, 48.0, 25.0, 16.0, 20.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.30078125, -6.11163330078125, -5.9224853515625, -5.73333740234375, -5.544189453125, -5.35504150390625, -5.1658935546875, -4.97674560546875, -4.78759765625, -4.59844970703125, -4.4093017578125, -4.22015380859375, -4.031005859375, -3.84185791015625, -3.6527099609375, -3.46356201171875, -3.2744140625, -3.08526611328125, -2.8961181640625, -2.70697021484375, -2.517822265625, -2.32867431640625, -2.1395263671875, -1.95037841796875, -1.76123046875, -1.57208251953125, -1.3829345703125, -1.19378662109375, -1.004638671875, -0.81549072265625, -0.6263427734375, -0.43719482421875, -0.248046875, -0.05889892578125, 0.1302490234375, 0.31939697265625, 0.508544921875, 0.69769287109375, 0.8868408203125, 1.07598876953125, 1.26513671875, 1.45428466796875, 1.6434326171875, 1.83258056640625, 2.021728515625, 2.21087646484375, 2.4000244140625, 2.58917236328125, 2.7783203125, 2.96746826171875, 3.1566162109375, 3.34576416015625, 3.534912109375, 3.72406005859375, 3.9132080078125, 4.10235595703125, 4.29150390625, 4.48065185546875, 4.6697998046875, 4.85894775390625, 5.048095703125, 5.23724365234375, 5.4263916015625, 5.61553955078125, 5.8046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 2.0, 9.0, 7.0, 13.0, 4.0, 15.0, 13.0, 16.0, 17.0, 33.0, 27.0, 33.0, 23.0, 38.0, 29.0, 32.0, 34.0, 34.0, 35.0, 33.0, 43.0, 41.0, 44.0, 26.0, 39.0, 39.0, 29.0, 34.0, 26.0, 35.0, 34.0, 27.0, 20.0, 26.0, 10.0, 9.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.947265625, -2.85589599609375, -2.7645263671875, -2.67315673828125, -2.581787109375, -2.49041748046875, -2.3990478515625, -2.30767822265625, -2.21630859375, -2.12493896484375, -2.0335693359375, -1.94219970703125, -1.850830078125, -1.75946044921875, -1.6680908203125, -1.57672119140625, -1.4853515625, -1.39398193359375, -1.3026123046875, -1.21124267578125, -1.119873046875, -1.02850341796875, -0.9371337890625, -0.84576416015625, -0.75439453125, -0.66302490234375, -0.5716552734375, -0.48028564453125, -0.388916015625, -0.29754638671875, -0.2061767578125, -0.11480712890625, -0.0234375, 0.06793212890625, 0.1593017578125, 0.25067138671875, 0.342041015625, 0.43341064453125, 0.5247802734375, 0.61614990234375, 0.70751953125, 0.79888916015625, 0.8902587890625, 0.98162841796875, 1.072998046875, 1.16436767578125, 1.2557373046875, 1.34710693359375, 1.4384765625, 1.52984619140625, 1.6212158203125, 1.71258544921875, 1.803955078125, 1.89532470703125, 1.9866943359375, 2.07806396484375, 2.16943359375, 2.26080322265625, 2.3521728515625, 2.44354248046875, 2.534912109375, 2.62628173828125, 2.7176513671875, 2.80902099609375, 2.900390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 12.0, 38.0, 57.0, 106.0, 251.0, 595.0, 1508.0, 4319.0, 20946.0, 250414.0, 706343.0, 51986.0, 7984.0, 2411.0, 861.0, 371.0, 152.0, 71.0, 39.0, 23.0, 15.0, 12.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.647216796875, -5.46630859375, -5.285400390625, -5.1044921875, -4.923583984375, -4.74267578125, -4.561767578125, -4.380859375, -4.199951171875, -4.01904296875, -3.838134765625, -3.6572265625, -3.476318359375, -3.29541015625, -3.114501953125, -2.93359375, -2.752685546875, -2.57177734375, -2.390869140625, -2.2099609375, -2.029052734375, -1.84814453125, -1.667236328125, -1.486328125, -1.305419921875, -1.12451171875, -0.943603515625, -0.7626953125, -0.581787109375, -0.40087890625, -0.219970703125, -0.0390625, 0.141845703125, 0.32275390625, 0.503662109375, 0.6845703125, 0.865478515625, 1.04638671875, 1.227294921875, 1.408203125, 1.589111328125, 1.77001953125, 1.950927734375, 2.1318359375, 2.312744140625, 2.49365234375, 2.674560546875, 2.85546875, 3.036376953125, 3.21728515625, 3.398193359375, 3.5791015625, 3.760009765625, 3.94091796875, 4.121826171875, 4.302734375, 4.483642578125, 4.66455078125, 4.845458984375, 5.0263671875, 5.207275390625, 5.38818359375, 5.569091796875, 5.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 5.0, 14.0, 10.0, 23.0, 37.0, 50.0, 87.0, 138.0, 214.0, 157.0, 86.0, 50.0, 35.0, 33.0, 16.0, 13.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010004043579101562, -0.0009697899222373962, -0.0009391754865646362, -0.0009085610508918762, -0.0008779466152191162, -0.0008473321795463562, -0.0008167177438735962, -0.0007861033082008362, -0.0007554888725280762, -0.0007248744368553162, -0.0006942600011825562, -0.0006636455655097961, -0.0006330311298370361, -0.0006024166941642761, -0.0005718022584915161, -0.0005411878228187561, -0.0005105733871459961, -0.0004799589514732361, -0.0004493445158004761, -0.00041873008012771606, -0.00038811564445495605, -0.00035750120878219604, -0.00032688677310943604, -0.000296272337436676, -0.000265657901763916, -0.000235043466091156, -0.000204429030418396, -0.00017381459474563599, -0.00014320015907287598, -0.00011258572340011597, -8.197128772735596e-05, -5.135685205459595e-05, -2.0742416381835938e-05, 9.872019290924072e-06, 4.048645496368408e-05, 7.110089063644409e-05, 0.0001017153263092041, 0.0001323297619819641, 0.00016294419765472412, 0.00019355863332748413, 0.00022417306900024414, 0.00025478750467300415, 0.00028540194034576416, 0.00031601637601852417, 0.0003466308116912842, 0.0003772452473640442, 0.0004078596830368042, 0.0004384741187095642, 0.0004690885543823242, 0.0004997029900550842, 0.0005303174257278442, 0.0005609318614006042, 0.0005915462970733643, 0.0006221607327461243, 0.0006527751684188843, 0.0006833896040916443, 0.0007140040397644043, 0.0007446184754371643, 0.0007752329111099243, 0.0008058473467826843, 0.0008364617824554443, 0.0008670762181282043, 0.0008976906538009644, 0.0009283050894737244, 0.0009589195251464844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 21.0, 30.0, 46.0, 95.0, 165.0, 430.0, 943.0, 2772.0, 12141.0, 201717.0, 793554.0, 29205.0, 4933.0, 1426.0, 515.0, 259.0, 131.0, 72.0, 19.0, 13.0, 19.0, 4.0, 7.0, 12.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.95574951171875, -7.7161865234375, -7.47662353515625, -7.237060546875, -6.99749755859375, -6.7579345703125, -6.51837158203125, -6.27880859375, -6.03924560546875, -5.7996826171875, -5.56011962890625, -5.320556640625, -5.08099365234375, -4.8414306640625, -4.60186767578125, -4.3623046875, -4.12274169921875, -3.8831787109375, -3.64361572265625, -3.404052734375, -3.16448974609375, -2.9249267578125, -2.68536376953125, -2.44580078125, -2.20623779296875, -1.9666748046875, -1.72711181640625, -1.487548828125, -1.24798583984375, -1.0084228515625, -0.76885986328125, -0.529296875, -0.28973388671875, -0.0501708984375, 0.18939208984375, 0.428955078125, 0.66851806640625, 0.9080810546875, 1.14764404296875, 1.38720703125, 1.62677001953125, 1.8663330078125, 2.10589599609375, 2.345458984375, 2.58502197265625, 2.8245849609375, 3.06414794921875, 3.3037109375, 3.54327392578125, 3.7828369140625, 4.02239990234375, 4.261962890625, 4.50152587890625, 4.7410888671875, 4.98065185546875, 5.22021484375, 5.45977783203125, 5.6993408203125, 5.93890380859375, 6.178466796875, 6.41802978515625, 6.6575927734375, 6.89715576171875, 7.13671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 4.0, 10.0, 8.0, 11.0, 24.0, 30.0, 61.0, 112.0, 140.0, 170.0, 145.0, 108.0, 48.0, 29.0, 19.0, 21.0, 13.0, 9.0, 8.0, 3.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4765625, -3.36602783203125, -3.2554931640625, -3.14495849609375, -3.034423828125, -2.92388916015625, -2.8133544921875, -2.70281982421875, -2.59228515625, -2.48175048828125, -2.3712158203125, -2.26068115234375, -2.150146484375, -2.03961181640625, -1.9290771484375, -1.81854248046875, -1.7080078125, -1.59747314453125, -1.4869384765625, -1.37640380859375, -1.265869140625, -1.15533447265625, -1.0447998046875, -0.93426513671875, -0.82373046875, -0.71319580078125, -0.6026611328125, -0.49212646484375, -0.381591796875, -0.27105712890625, -0.1605224609375, -0.04998779296875, 0.060546875, 0.17108154296875, 0.2816162109375, 0.39215087890625, 0.502685546875, 0.61322021484375, 0.7237548828125, 0.83428955078125, 0.94482421875, 1.05535888671875, 1.1658935546875, 1.27642822265625, 1.386962890625, 1.49749755859375, 1.6080322265625, 1.71856689453125, 1.8291015625, 1.93963623046875, 2.0501708984375, 2.16070556640625, 2.271240234375, 2.38177490234375, 2.4923095703125, 2.60284423828125, 2.71337890625, 2.82391357421875, 2.9344482421875, 3.04498291015625, 3.155517578125, 3.26605224609375, 3.3765869140625, 3.48712158203125, 3.59765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 22.0, 32.0, 56.0, 79.0, 121.0, 123.0, 134.0, 132.0, 101.0, 69.0, 30.0, 24.0, 20.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.876922607421875, -17.836334228515625, -16.795745849609375, -15.755155563354492, -14.714567184448242, -13.673978805541992, -12.633389472961426, -11.59280014038086, -10.55221176147461, -9.51162338256836, -8.471034049987793, -7.430445194244385, -6.389856338500977, -5.349267482757568, -4.30867862701416, -3.268089771270752, -2.2275009155273438, -1.1869120597839355, -0.14632320404052734, 0.8942656517028809, 1.934854507446289, 2.9754433631896973, 4.0160322189331055, 5.056621074676514, 6.097209930419922, 7.13779878616333, 8.178387641906738, 9.218976974487305, 10.259565353393555, 11.300153732299805, 12.340743064880371, 13.381332397460938, 14.421920776367188, 15.462509155273438, 16.503097534179688, 17.54368782043457, 18.58427619934082, 19.62486457824707, 20.665454864501953, 21.706043243408203, 22.746631622314453, 23.787220001220703, 24.827808380126953, 25.868398666381836, 26.908987045288086, 27.949575424194336, 28.99016571044922, 30.03075408935547, 31.07134246826172, 32.11193084716797, 33.15251922607422, 34.19310760498047, 35.23369598388672, 36.274288177490234, 37.314876556396484, 38.355464935302734, 39.396053314208984, 40.436641693115234, 41.477230072021484, 42.517818450927734, 43.55841064453125, 44.5989990234375, 45.63958740234375, 46.68017578125, 47.72076416015625]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 8.0, 3.0, 7.0, 8.0, 12.0, 9.0, 16.0, 11.0, 16.0, 14.0, 21.0, 21.0, 33.0, 35.0, 37.0, 41.0, 44.0, 34.0, 51.0, 51.0, 52.0, 50.0, 53.0, 54.0, 37.0, 37.0, 41.0, 34.0, 31.0, 24.0, 24.0, 22.0, 11.0, 15.0, 7.0, 6.0, 6.0, 5.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.13074493408203, -19.472129821777344, -18.813514709472656, -18.1549015045166, -17.496286392211914, -16.837671279907227, -16.179058074951172, -15.520442962646484, -14.861827850341797, -14.20321273803711, -13.544598579406738, -12.885984420776367, -12.22736930847168, -11.568754196166992, -10.910140037536621, -10.25152587890625, -9.592910766601562, -8.934295654296875, -8.275681495666504, -7.617066860198975, -6.958452224731445, -6.299837589263916, -5.641222953796387, -4.982608318328857, -4.323993682861328, -3.665379047393799, -3.0067644119262695, -2.3481497764587402, -1.689535140991211, -1.0309205055236816, -0.37230587005615234, 0.28630876541137695, 0.9449214935302734, 1.6035361289978027, 2.262150764465332, 2.9207653999328613, 3.5793800354003906, 4.23799467086792, 4.896609306335449, 5.5552239418029785, 6.213838577270508, 6.872453212738037, 7.531067848205566, 8.189682006835938, 8.848297119140625, 9.506912231445312, 10.165526390075684, 10.824140548706055, 11.482755661010742, 12.14137077331543, 12.7999849319458, 13.458599090576172, 14.11721420288086, 14.775829315185547, 15.434443473815918, 16.09305763244629, 16.751672744750977, 17.410287857055664, 18.06890106201172, 18.727516174316406, 19.386131286621094, 20.04474639892578, 20.70336151123047, 21.361974716186523, 22.02058982849121]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 15.0, 14.0, 32.0, 56.0, 89.0, 171.0, 323.0, 782.0, 2145.0, 7431.0, 37323.0, 728180.0, 3346537.0, 56766.0, 9883.0, 2724.0, 974.0, 398.0, 179.0, 93.0, 57.0, 29.0, 30.0, 13.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.25238037109375, -4.9774169921875, -4.70245361328125, -4.427490234375, -4.15252685546875, -3.8775634765625, -3.60260009765625, -3.32763671875, -3.05267333984375, -2.7777099609375, -2.50274658203125, -2.227783203125, -1.95281982421875, -1.6778564453125, -1.40289306640625, -1.1279296875, -0.85296630859375, -0.5780029296875, -0.30303955078125, -0.028076171875, 0.24688720703125, 0.5218505859375, 0.79681396484375, 1.07177734375, 1.34674072265625, 1.6217041015625, 1.89666748046875, 2.171630859375, 2.44659423828125, 2.7215576171875, 2.99652099609375, 3.271484375, 3.54644775390625, 3.8214111328125, 4.09637451171875, 4.371337890625, 4.64630126953125, 4.9212646484375, 5.19622802734375, 5.47119140625, 5.74615478515625, 6.0211181640625, 6.29608154296875, 6.571044921875, 6.84600830078125, 7.1209716796875, 7.39593505859375, 7.6708984375, 7.94586181640625, 8.2208251953125, 8.49578857421875, 8.770751953125, 9.04571533203125, 9.3206787109375, 9.59564208984375, 9.87060546875, 10.14556884765625, 10.4205322265625, 10.69549560546875, 10.970458984375, 11.24542236328125, 11.5203857421875, 11.79534912109375, 12.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 16.0, 20.0, 27.0, 45.0, 54.0, 55.0, 76.0, 69.0, 88.0, 86.0, 98.0, 74.0, 70.0, 53.0, 44.0, 30.0, 30.0, 17.0, 7.0, 3.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1135101318359375, -1.076629638671875, -1.0397491455078125, -1.00286865234375, -0.9659881591796875, -0.929107666015625, -0.8922271728515625, -0.8553466796875, -0.8184661865234375, -0.781585693359375, -0.7447052001953125, -0.70782470703125, -0.6709442138671875, -0.634063720703125, -0.5971832275390625, -0.560302734375, -0.5234222412109375, -0.486541748046875, -0.4496612548828125, -0.41278076171875, -0.3759002685546875, -0.339019775390625, -0.3021392822265625, -0.2652587890625, -0.2283782958984375, -0.191497802734375, -0.1546173095703125, -0.11773681640625, -0.0808563232421875, -0.043975830078125, -0.0070953369140625, 0.02978515625, 0.0666656494140625, 0.103546142578125, 0.1404266357421875, 0.17730712890625, 0.2141876220703125, 0.251068115234375, 0.2879486083984375, 0.3248291015625, 0.3617095947265625, 0.398590087890625, 0.4354705810546875, 0.47235107421875, 0.5092315673828125, 0.546112060546875, 0.5829925537109375, 0.619873046875, 0.6567535400390625, 0.693634033203125, 0.7305145263671875, 0.76739501953125, 0.8042755126953125, 0.841156005859375, 0.8780364990234375, 0.9149169921875, 0.9517974853515625, 0.988677978515625, 1.0255584716796875, 1.06243896484375, 1.0993194580078125, 1.136199951171875, 1.1730804443359375, 1.2099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 17.0, 15.0, 18.0, 34.0, 31.0, 38.0, 71.0, 113.0, 162.0, 246.0, 410.0, 702.0, 1271.0, 2203.0, 4345.0, 9463.0, 22310.0, 63793.0, 228615.0, 2433427.0, 1171587.0, 169443.0, 50498.0, 18662.0, 8103.0, 3994.0, 1928.0, 1060.0, 611.0, 397.0, 224.0, 146.0, 90.0, 72.0, 49.0, 26.0, 27.0, 12.0, 9.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.92578125, -3.809967041015625, -3.69415283203125, -3.578338623046875, -3.4625244140625, -3.346710205078125, -3.23089599609375, -3.115081787109375, -2.999267578125, -2.883453369140625, -2.76763916015625, -2.651824951171875, -2.5360107421875, -2.420196533203125, -2.30438232421875, -2.188568115234375, -2.07275390625, -1.956939697265625, -1.84112548828125, -1.725311279296875, -1.6094970703125, -1.493682861328125, -1.37786865234375, -1.262054443359375, -1.146240234375, -1.030426025390625, -0.91461181640625, -0.798797607421875, -0.6829833984375, -0.567169189453125, -0.45135498046875, -0.335540771484375, -0.2197265625, -0.103912353515625, 0.01190185546875, 0.127716064453125, 0.2435302734375, 0.359344482421875, 0.47515869140625, 0.590972900390625, 0.706787109375, 0.822601318359375, 0.93841552734375, 1.054229736328125, 1.1700439453125, 1.285858154296875, 1.40167236328125, 1.517486572265625, 1.63330078125, 1.749114990234375, 1.86492919921875, 1.980743408203125, 2.0965576171875, 2.212371826171875, 2.32818603515625, 2.444000244140625, 2.559814453125, 2.675628662109375, 2.79144287109375, 2.907257080078125, 3.0230712890625, 3.138885498046875, 3.25469970703125, 3.370513916015625, 3.486328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 21.0, 18.0, 21.0, 36.0, 48.0, 58.0, 71.0, 112.0, 198.0, 298.0, 687.0, 1234.0, 471.0, 231.0, 166.0, 91.0, 72.0, 59.0, 39.0, 29.0, 18.0, 22.0, 10.0, 6.0, 10.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.625244140625, -1.56982421875, -1.514404296875, -1.458984375, -1.403564453125, -1.34814453125, -1.292724609375, -1.2373046875, -1.181884765625, -1.12646484375, -1.071044921875, -1.015625, -0.960205078125, -0.90478515625, -0.849365234375, -0.7939453125, -0.738525390625, -0.68310546875, -0.627685546875, -0.572265625, -0.516845703125, -0.46142578125, -0.406005859375, -0.3505859375, -0.295166015625, -0.23974609375, -0.184326171875, -0.12890625, -0.073486328125, -0.01806640625, 0.037353515625, 0.0927734375, 0.148193359375, 0.20361328125, 0.259033203125, 0.314453125, 0.369873046875, 0.42529296875, 0.480712890625, 0.5361328125, 0.591552734375, 0.64697265625, 0.702392578125, 0.7578125, 0.813232421875, 0.86865234375, 0.924072265625, 0.9794921875, 1.034912109375, 1.09033203125, 1.145751953125, 1.201171875, 1.256591796875, 1.31201171875, 1.367431640625, 1.4228515625, 1.478271484375, 1.53369140625, 1.589111328125, 1.64453125, 1.699951171875, 1.75537109375, 1.810791015625, 1.8662109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 13.0, 10.0, 17.0, 12.0, 27.0, 45.0, 70.0, 63.0, 72.0, 97.0, 91.0, 87.0, 73.0, 72.0, 65.0, 61.0, 31.0, 23.0, 19.0, 11.0, 1.0, 7.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.557207107543945, -12.254907608032227, -11.952608108520508, -11.650307655334473, -11.348008155822754, -11.045708656311035, -10.743408203125, -10.441108703613281, -10.138809204101562, -9.836509704589844, -9.534210205078125, -9.23190975189209, -8.929610252380371, -8.627310752868652, -8.325010299682617, -8.022710800170898, -7.72041130065918, -7.418111801147461, -7.115811824798584, -6.813511848449707, -6.511212348937988, -6.2089128494262695, -5.906612873077393, -5.604312896728516, -5.302013397216797, -4.999713897705078, -4.697413921356201, -4.395113945007324, -4.0928144454956055, -3.7905147075653076, -3.4882149696350098, -3.185915231704712, -2.8836164474487305, -2.5813167095184326, -2.2790169715881348, -1.976717233657837, -1.674417495727539, -1.3721177577972412, -1.0698180198669434, -0.7675182819366455, -0.46521854400634766, -0.1629188060760498, 0.13938093185424805, 0.4416806697845459, 0.7439804077148438, 1.0462801456451416, 1.3485798835754395, 1.6508796215057373, 1.9531793594360352, 2.255479097366333, 2.557778835296631, 2.8600785732269287, 3.1623783111572266, 3.4646780490875244, 3.7669777870178223, 4.069277763366699, 4.371577262878418, 4.673876762390137, 4.976176738739014, 5.278476715087891, 5.580776214599609, 5.883075714111328, 6.185375690460205, 6.487675666809082, 6.789975166320801]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 13.0, 10.0, 13.0, 19.0, 20.0, 23.0, 24.0, 21.0, 39.0, 28.0, 36.0, 38.0, 42.0, 43.0, 42.0, 52.0, 35.0, 20.0, 40.0, 31.0, 37.0, 34.0, 43.0, 39.0, 22.0, 27.0, 21.0, 26.0, 26.0, 23.0, 13.0, 14.0, 8.0, 10.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.001309394836426, -5.808198928833008, -5.61508846282959, -5.421977996826172, -5.228867530822754, -5.035757064819336, -4.842646598815918, -4.649536609649658, -4.45642614364624, -4.263315677642822, -4.070205211639404, -3.8770947456359863, -3.6839845180511475, -3.4908740520477295, -3.2977635860443115, -3.1046533584594727, -2.9115426540374756, -2.7184321880340576, -2.5253217220306396, -2.332211494445801, -2.139101028442383, -1.9459905624389648, -1.7528800964355469, -1.5597697496414185, -1.3666592836380005, -1.1735488176345825, -0.9804384708404541, -0.7873280048370361, -0.5942175984382629, -0.40110719203948975, -0.20799672603607178, -0.01488637924194336, 0.1782240867614746, 0.3713344931602478, 0.564444899559021, 0.757555365562439, 0.9506657719612122, 1.1437761783599854, 1.3368866443634033, 1.5299969911575317, 1.7231074571609497, 1.9162179231643677, 2.109328269958496, 2.302438735961914, 2.495549201965332, 2.68865966796875, 2.881770133972168, 3.074880361557007, 3.267990827560425, 3.4611012935638428, 3.6542117595672607, 3.8473219871520996, 4.040432453155518, 4.2335429191589355, 4.4266533851623535, 4.6197638511657715, 4.8128743171691895, 5.005984783172607, 5.199095249176025, 5.392205715179443, 5.585316181182861, 5.778426170349121, 5.971536636352539, 6.164647102355957, 6.357757568359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 18.0, 23.0, 37.0, 61.0, 66.0, 116.0, 205.0, 350.0, 529.0, 931.0, 1829.0, 3563.0, 7608.0, 17744.0, 46329.0, 143289.0, 461900.0, 245233.0, 72031.0, 26134.0, 10571.0, 4680.0, 2273.0, 1190.0, 691.0, 418.0, 230.0, 149.0, 108.0, 62.0, 41.0, 33.0, 18.0, 14.0, 9.0, 15.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.6484375, -5.498626708984375, -5.34881591796875, -5.199005126953125, -5.0491943359375, -4.899383544921875, -4.74957275390625, -4.599761962890625, -4.449951171875, -4.300140380859375, -4.15032958984375, -4.000518798828125, -3.8507080078125, -3.700897216796875, -3.55108642578125, -3.401275634765625, -3.25146484375, -3.101654052734375, -2.95184326171875, -2.802032470703125, -2.6522216796875, -2.502410888671875, -2.35260009765625, -2.202789306640625, -2.052978515625, -1.903167724609375, -1.75335693359375, -1.603546142578125, -1.4537353515625, -1.303924560546875, -1.15411376953125, -1.004302978515625, -0.8544921875, -0.704681396484375, -0.55487060546875, -0.405059814453125, -0.2552490234375, -0.105438232421875, 0.04437255859375, 0.194183349609375, 0.343994140625, 0.493804931640625, 0.64361572265625, 0.793426513671875, 0.9432373046875, 1.093048095703125, 1.24285888671875, 1.392669677734375, 1.54248046875, 1.692291259765625, 1.84210205078125, 1.991912841796875, 2.1417236328125, 2.291534423828125, 2.44134521484375, 2.591156005859375, 2.740966796875, 2.890777587890625, 3.04058837890625, 3.190399169921875, 3.3402099609375, 3.490020751953125, 3.63983154296875, 3.789642333984375, 3.939453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 13.0, 13.0, 21.0, 29.0, 39.0, 45.0, 44.0, 64.0, 74.0, 77.0, 92.0, 83.0, 70.0, 80.0, 65.0, 49.0, 43.0, 25.0, 24.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.09783935546875, -1.0609130859375, -1.02398681640625, -0.987060546875, -0.95013427734375, -0.9132080078125, -0.87628173828125, -0.83935546875, -0.80242919921875, -0.7655029296875, -0.72857666015625, -0.691650390625, -0.65472412109375, -0.6177978515625, -0.58087158203125, -0.5439453125, -0.50701904296875, -0.4700927734375, -0.43316650390625, -0.396240234375, -0.35931396484375, -0.3223876953125, -0.28546142578125, -0.24853515625, -0.21160888671875, -0.1746826171875, -0.13775634765625, -0.100830078125, -0.06390380859375, -0.0269775390625, 0.00994873046875, 0.046875, 0.08380126953125, 0.1207275390625, 0.15765380859375, 0.194580078125, 0.23150634765625, 0.2684326171875, 0.30535888671875, 0.34228515625, 0.37921142578125, 0.4161376953125, 0.45306396484375, 0.489990234375, 0.52691650390625, 0.5638427734375, 0.60076904296875, 0.6376953125, 0.67462158203125, 0.7115478515625, 0.74847412109375, 0.785400390625, 0.82232666015625, 0.8592529296875, 0.89617919921875, 0.93310546875, 0.97003173828125, 1.0069580078125, 1.04388427734375, 1.080810546875, 1.11773681640625, 1.1546630859375, 1.19158935546875, 1.228515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 11.0, 13.0, 18.0, 32.0, 40.0, 55.0, 81.0, 149.0, 232.0, 409.0, 810.0, 1687.0, 4137.0, 13064.0, 47918.0, 224149.0, 578638.0, 131655.0, 30762.0, 8697.0, 3118.0, 1271.0, 637.0, 343.0, 199.0, 114.0, 85.0, 50.0, 46.0, 29.0, 27.0, 15.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.890625, -4.71173095703125, -4.5328369140625, -4.35394287109375, -4.175048828125, -3.99615478515625, -3.8172607421875, -3.63836669921875, -3.45947265625, -3.28057861328125, -3.1016845703125, -2.92279052734375, -2.743896484375, -2.56500244140625, -2.3861083984375, -2.20721435546875, -2.0283203125, -1.84942626953125, -1.6705322265625, -1.49163818359375, -1.312744140625, -1.13385009765625, -0.9549560546875, -0.77606201171875, -0.59716796875, -0.41827392578125, -0.2393798828125, -0.06048583984375, 0.118408203125, 0.29730224609375, 0.4761962890625, 0.65509033203125, 0.833984375, 1.01287841796875, 1.1917724609375, 1.37066650390625, 1.549560546875, 1.72845458984375, 1.9073486328125, 2.08624267578125, 2.26513671875, 2.44403076171875, 2.6229248046875, 2.80181884765625, 2.980712890625, 3.15960693359375, 3.3385009765625, 3.51739501953125, 3.6962890625, 3.87518310546875, 4.0540771484375, 4.23297119140625, 4.411865234375, 4.59075927734375, 4.7696533203125, 4.94854736328125, 5.12744140625, 5.30633544921875, 5.4852294921875, 5.66412353515625, 5.843017578125, 6.02191162109375, 6.2008056640625, 6.37969970703125, 6.55859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 8.0, 15.0, 19.0, 14.0, 16.0, 25.0, 23.0, 38.0, 36.0, 40.0, 49.0, 52.0, 43.0, 50.0, 56.0, 53.0, 45.0, 48.0, 50.0, 53.0, 35.0, 40.0, 24.0, 25.0, 23.0, 19.0, 25.0, 11.0, 8.0, 6.0, 9.0, 11.0, 1.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.977783203125, -3.84619140625, -3.714599609375, -3.5830078125, -3.451416015625, -3.31982421875, -3.188232421875, -3.056640625, -2.925048828125, -2.79345703125, -2.661865234375, -2.5302734375, -2.398681640625, -2.26708984375, -2.135498046875, -2.00390625, -1.872314453125, -1.74072265625, -1.609130859375, -1.4775390625, -1.345947265625, -1.21435546875, -1.082763671875, -0.951171875, -0.819580078125, -0.68798828125, -0.556396484375, -0.4248046875, -0.293212890625, -0.16162109375, -0.030029296875, 0.1015625, 0.233154296875, 0.36474609375, 0.496337890625, 0.6279296875, 0.759521484375, 0.89111328125, 1.022705078125, 1.154296875, 1.285888671875, 1.41748046875, 1.549072265625, 1.6806640625, 1.812255859375, 1.94384765625, 2.075439453125, 2.20703125, 2.338623046875, 2.47021484375, 2.601806640625, 2.7333984375, 2.864990234375, 2.99658203125, 3.128173828125, 3.259765625, 3.391357421875, 3.52294921875, 3.654541015625, 3.7861328125, 3.917724609375, 4.04931640625, 4.180908203125, 4.3125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 14.0, 18.0, 28.0, 52.0, 80.0, 167.0, 340.0, 733.0, 1689.0, 5140.0, 22475.0, 180985.0, 720277.0, 95582.0, 14499.0, 3878.0, 1386.0, 609.0, 251.0, 140.0, 79.0, 36.0, 26.0, 15.0, 10.0, 9.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.85247802734375, -5.6658935546875, -5.47930908203125, -5.292724609375, -5.10614013671875, -4.9195556640625, -4.73297119140625, -4.54638671875, -4.35980224609375, -4.1732177734375, -3.98663330078125, -3.800048828125, -3.61346435546875, -3.4268798828125, -3.24029541015625, -3.0537109375, -2.86712646484375, -2.6805419921875, -2.49395751953125, -2.307373046875, -2.12078857421875, -1.9342041015625, -1.74761962890625, -1.56103515625, -1.37445068359375, -1.1878662109375, -1.00128173828125, -0.814697265625, -0.62811279296875, -0.4415283203125, -0.25494384765625, -0.068359375, 0.11822509765625, 0.3048095703125, 0.49139404296875, 0.677978515625, 0.86456298828125, 1.0511474609375, 1.23773193359375, 1.42431640625, 1.61090087890625, 1.7974853515625, 1.98406982421875, 2.170654296875, 2.35723876953125, 2.5438232421875, 2.73040771484375, 2.9169921875, 3.10357666015625, 3.2901611328125, 3.47674560546875, 3.663330078125, 3.84991455078125, 4.0364990234375, 4.22308349609375, 4.40966796875, 4.59625244140625, 4.7828369140625, 4.96942138671875, 5.156005859375, 5.34259033203125, 5.5291748046875, 5.71575927734375, 5.90234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 19.0, 21.0, 22.0, 36.0, 84.0, 180.0, 257.0, 126.0, 83.0, 48.0, 29.0, 16.0, 14.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.0009905099868774414, -0.0009529590606689453, -0.0009154081344604492, -0.0008778572082519531, -0.000840306282043457, -0.0008027553558349609, -0.0007652044296264648, -0.0007276535034179688, -0.0006901025772094727, -0.0006525516510009766, -0.0006150007247924805, -0.0005774497985839844, -0.0005398988723754883, -0.0005023479461669922, -0.0004647970199584961, -0.00042724609375, -0.0003896951675415039, -0.0003521442413330078, -0.0003145933151245117, -0.0002770423889160156, -0.00023949146270751953, -0.00020194053649902344, -0.00016438961029052734, -0.00012683868408203125, -8.928775787353516e-05, -5.173683166503906e-05, -1.4185905456542969e-05, 2.3365020751953125e-05, 6.091594696044922e-05, 9.846687316894531e-05, 0.0001360177993774414, 0.0001735687255859375, 0.0002111196517944336, 0.0002486705780029297, 0.0002862215042114258, 0.0003237724304199219, 0.00036132335662841797, 0.00039887428283691406, 0.00043642520904541016, 0.00047397613525390625, 0.0005115270614624023, 0.0005490779876708984, 0.0005866289138793945, 0.0006241798400878906, 0.0006617307662963867, 0.0006992816925048828, 0.0007368326187133789, 0.000774383544921875, 0.0008119344711303711, 0.0008494853973388672, 0.0008870363235473633, 0.0009245872497558594, 0.0009621381759643555, 0.0009996891021728516, 0.0010372400283813477, 0.0010747909545898438, 0.0011123418807983398, 0.001149892807006836, 0.001187443733215332, 0.0012249946594238281, 0.0012625455856323242, 0.0013000965118408203, 0.0013376474380493164, 0.0013751983642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 6.0, 8.0, 10.0, 12.0, 23.0, 41.0, 33.0, 48.0, 112.0, 211.0, 509.0, 1216.0, 3551.0, 13769.0, 88331.0, 731933.0, 178599.0, 22049.0, 5269.0, 1581.0, 605.0, 292.0, 129.0, 88.0, 44.0, 30.0, 18.0, 17.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.9296875, -6.7503662109375, -6.571044921875, -6.3917236328125, -6.21240234375, -6.0330810546875, -5.853759765625, -5.6744384765625, -5.4951171875, -5.3157958984375, -5.136474609375, -4.9571533203125, -4.77783203125, -4.5985107421875, -4.419189453125, -4.2398681640625, -4.060546875, -3.8812255859375, -3.701904296875, -3.5225830078125, -3.34326171875, -3.1639404296875, -2.984619140625, -2.8052978515625, -2.6259765625, -2.4466552734375, -2.267333984375, -2.0880126953125, -1.90869140625, -1.7293701171875, -1.550048828125, -1.3707275390625, -1.19140625, -1.0120849609375, -0.832763671875, -0.6534423828125, -0.47412109375, -0.2947998046875, -0.115478515625, 0.0638427734375, 0.2431640625, 0.4224853515625, 0.601806640625, 0.7811279296875, 0.96044921875, 1.1397705078125, 1.319091796875, 1.4984130859375, 1.677734375, 1.8570556640625, 2.036376953125, 2.2156982421875, 2.39501953125, 2.5743408203125, 2.753662109375, 2.9329833984375, 3.1123046875, 3.2916259765625, 3.470947265625, 3.6502685546875, 3.82958984375, 4.0089111328125, 4.188232421875, 4.3675537109375, 4.546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 6.0, 14.0, 23.0, 30.0, 52.0, 60.0, 81.0, 132.0, 153.0, 121.0, 77.0, 54.0, 39.0, 33.0, 22.0, 19.0, 14.0, 14.0, 6.0, 5.0, 2.0, 1.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.91156005859375, -3.8074951171875, -3.70343017578125, -3.599365234375, -3.49530029296875, -3.3912353515625, -3.28717041015625, -3.18310546875, -3.07904052734375, -2.9749755859375, -2.87091064453125, -2.766845703125, -2.66278076171875, -2.5587158203125, -2.45465087890625, -2.3505859375, -2.24652099609375, -2.1424560546875, -2.03839111328125, -1.934326171875, -1.83026123046875, -1.7261962890625, -1.62213134765625, -1.51806640625, -1.41400146484375, -1.3099365234375, -1.20587158203125, -1.101806640625, -0.99774169921875, -0.8936767578125, -0.78961181640625, -0.685546875, -0.58148193359375, -0.4774169921875, -0.37335205078125, -0.269287109375, -0.16522216796875, -0.0611572265625, 0.04290771484375, 0.14697265625, 0.25103759765625, 0.3551025390625, 0.45916748046875, 0.563232421875, 0.66729736328125, 0.7713623046875, 0.87542724609375, 0.9794921875, 1.08355712890625, 1.1876220703125, 1.29168701171875, 1.395751953125, 1.49981689453125, 1.6038818359375, 1.70794677734375, 1.81201171875, 1.91607666015625, 2.0201416015625, 2.12420654296875, 2.228271484375, 2.33233642578125, 2.4364013671875, 2.54046630859375, 2.64453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 16.0, 30.0, 33.0, 46.0, 97.0, 138.0, 122.0, 125.0, 96.0, 101.0, 68.0, 46.0, 32.0, 17.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.55727767944336, -18.358530044555664, -17.15978240966797, -15.961034774780273, -14.762287139892578, -13.563539505004883, -12.364792823791504, -11.166045188903809, -9.967297554016113, -8.768549919128418, -7.569802284240723, -6.3710551261901855, -5.17230749130249, -3.973559856414795, -2.774812698364258, -1.5760650634765625, -0.3773174285888672, 0.8214300870895386, 2.0201776027679443, 3.2189249992370605, 4.417672634124756, 5.616420269012451, 6.815167427062988, 8.013915061950684, 9.212662696838379, 10.411410331726074, 11.61015796661377, 12.808904647827148, 14.007652282714844, 15.206399917602539, 16.405147552490234, 17.60389518737793, 18.802642822265625, 20.00139045715332, 21.200138092041016, 22.39888572692871, 23.597633361816406, 24.7963809967041, 25.995128631591797, 27.19387435913086, 28.392623901367188, 29.591371536254883, 30.790119171142578, 31.988866806030273, 33.18761444091797, 34.38636016845703, 35.58510971069336, 36.78385543823242, 37.98260498046875, 39.18135070800781, 40.38010025024414, 41.5788459777832, 42.77759552001953, 43.976341247558594, 45.17509078979492, 46.373836517333984, 47.57258224487305, 48.77132797241211, 49.97007751464844, 51.1688232421875, 52.36757278442383, 53.56631851196289, 54.76506805419922, 55.96381378173828, 57.16256332397461]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 4.0, 6.0, 7.0, 15.0, 7.0, 13.0, 18.0, 21.0, 17.0, 21.0, 26.0, 40.0, 31.0, 35.0, 51.0, 41.0, 46.0, 57.0, 55.0, 53.0, 42.0, 44.0, 45.0, 43.0, 42.0, 28.0, 34.0, 28.0, 17.0, 21.0, 15.0, 10.0, 9.0, 9.0, 13.0, 7.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.261754989624023, -22.515945434570312, -21.770137786865234, -21.024328231811523, -20.278520584106445, -19.532711029052734, -18.786903381347656, -18.041093826293945, -17.295284271240234, -16.549474716186523, -15.803667068481445, -15.057857513427734, -14.312049865722656, -13.566240310668945, -12.82043170928955, -12.074623107910156, -11.328815460205078, -10.583006858825684, -9.837198257446289, -9.091388702392578, -8.3455810546875, -7.599771976470947, -6.8539628982543945, -6.108154296875, -5.3623456954956055, -4.616537094116211, -3.8707282543182373, -3.1249194145202637, -2.379110813140869, -1.6333022117614746, -0.8874931335449219, -0.14168453216552734, 0.6041259765625, 1.349934697151184, 2.095743417739868, 2.841552257537842, 3.5873608589172363, 4.333169460296631, 5.078978538513184, 5.824787139892578, 6.570595741271973, 7.316404342651367, 8.062212944030762, 8.808021545410156, 9.553831100463867, 10.299638748168945, 11.045448303222656, 11.79125690460205, 12.537065505981445, 13.28287410736084, 14.028682708740234, 14.774492263793945, 15.520299911499023, 16.266109466552734, 17.011917114257812, 17.757726669311523, 18.503536224365234, 19.249345779418945, 19.995153427124023, 20.740962982177734, 21.486770629882812, 22.232580184936523, 22.978389739990234, 23.724197387695312, 24.47000503540039]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 13.0, 37.0, 44.0, 70.0, 129.0, 190.0, 315.0, 656.0, 1445.0, 3117.0, 8351.0, 28304.0, 147610.0, 3687280.0, 259215.0, 39554.0, 10922.0, 3875.0, 1561.0, 712.0, 360.0, 200.0, 96.0, 51.0, 44.0, 34.0, 25.0, 10.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.3046875, -6.0987548828125, -5.892822265625, -5.6868896484375, -5.48095703125, -5.2750244140625, -5.069091796875, -4.8631591796875, -4.6572265625, -4.4512939453125, -4.245361328125, -4.0394287109375, -3.83349609375, -3.6275634765625, -3.421630859375, -3.2156982421875, -3.009765625, -2.8038330078125, -2.597900390625, -2.3919677734375, -2.18603515625, -1.9801025390625, -1.774169921875, -1.5682373046875, -1.3623046875, -1.1563720703125, -0.950439453125, -0.7445068359375, -0.53857421875, -0.3326416015625, -0.126708984375, 0.0792236328125, 0.28515625, 0.4910888671875, 0.697021484375, 0.9029541015625, 1.10888671875, 1.3148193359375, 1.520751953125, 1.7266845703125, 1.9326171875, 2.1385498046875, 2.344482421875, 2.5504150390625, 2.75634765625, 2.9622802734375, 3.168212890625, 3.3741455078125, 3.580078125, 3.7860107421875, 3.991943359375, 4.1978759765625, 4.40380859375, 4.6097412109375, 4.815673828125, 5.0216064453125, 5.2275390625, 5.4334716796875, 5.639404296875, 5.8453369140625, 6.05126953125, 6.2572021484375, 6.463134765625, 6.6690673828125, 6.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 14.0, 24.0, 30.0, 21.0, 28.0, 49.0, 51.0, 72.0, 72.0, 75.0, 71.0, 68.0, 59.0, 68.0, 59.0, 44.0, 36.0, 35.0, 29.0, 22.0, 13.0, 7.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.090240478515625, -1.05352783203125, -1.016815185546875, -0.9801025390625, -0.943389892578125, -0.90667724609375, -0.869964599609375, -0.833251953125, -0.796539306640625, -0.75982666015625, -0.723114013671875, -0.6864013671875, -0.649688720703125, -0.61297607421875, -0.576263427734375, -0.53955078125, -0.502838134765625, -0.46612548828125, -0.429412841796875, -0.3927001953125, -0.355987548828125, -0.31927490234375, -0.282562255859375, -0.245849609375, -0.209136962890625, -0.17242431640625, -0.135711669921875, -0.0989990234375, -0.062286376953125, -0.02557373046875, 0.011138916015625, 0.0478515625, 0.084564208984375, 0.12127685546875, 0.157989501953125, 0.1947021484375, 0.231414794921875, 0.26812744140625, 0.304840087890625, 0.341552734375, 0.378265380859375, 0.41497802734375, 0.451690673828125, 0.4884033203125, 0.525115966796875, 0.56182861328125, 0.598541259765625, 0.63525390625, 0.671966552734375, 0.70867919921875, 0.745391845703125, 0.7821044921875, 0.818817138671875, 0.85552978515625, 0.892242431640625, 0.928955078125, 0.965667724609375, 1.00238037109375, 1.039093017578125, 1.0758056640625, 1.112518310546875, 1.14923095703125, 1.185943603515625, 1.22265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 17.0, 22.0, 19.0, 29.0, 61.0, 90.0, 127.0, 165.0, 298.0, 445.0, 760.0, 1339.0, 2495.0, 4737.0, 10565.0, 26543.0, 79723.0, 372464.0, 3268576.0, 309986.0, 71362.0, 24352.0, 9928.0, 4515.0, 2311.0, 1270.0, 776.0, 433.0, 266.0, 183.0, 118.0, 81.0, 65.0, 43.0, 18.0, 18.0, 19.0, 11.0, 6.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0234375, -4.86865234375, -4.7138671875, -4.55908203125, -4.404296875, -4.24951171875, -4.0947265625, -3.93994140625, -3.78515625, -3.63037109375, -3.4755859375, -3.32080078125, -3.166015625, -3.01123046875, -2.8564453125, -2.70166015625, -2.546875, -2.39208984375, -2.2373046875, -2.08251953125, -1.927734375, -1.77294921875, -1.6181640625, -1.46337890625, -1.30859375, -1.15380859375, -0.9990234375, -0.84423828125, -0.689453125, -0.53466796875, -0.3798828125, -0.22509765625, -0.0703125, 0.08447265625, 0.2392578125, 0.39404296875, 0.548828125, 0.70361328125, 0.8583984375, 1.01318359375, 1.16796875, 1.32275390625, 1.4775390625, 1.63232421875, 1.787109375, 1.94189453125, 2.0966796875, 2.25146484375, 2.40625, 2.56103515625, 2.7158203125, 2.87060546875, 3.025390625, 3.18017578125, 3.3349609375, 3.48974609375, 3.64453125, 3.79931640625, 3.9541015625, 4.10888671875, 4.263671875, 4.41845703125, 4.5732421875, 4.72802734375, 4.8828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 15.0, 25.0, 39.0, 51.0, 72.0, 109.0, 174.0, 403.0, 1709.0, 755.0, 273.0, 155.0, 83.0, 46.0, 35.0, 37.0, 17.0, 13.0, 4.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.705322265625, -2.62744140625, -2.549560546875, -2.4716796875, -2.393798828125, -2.31591796875, -2.238037109375, -2.16015625, -2.082275390625, -2.00439453125, -1.926513671875, -1.8486328125, -1.770751953125, -1.69287109375, -1.614990234375, -1.537109375, -1.459228515625, -1.38134765625, -1.303466796875, -1.2255859375, -1.147705078125, -1.06982421875, -0.991943359375, -0.9140625, -0.836181640625, -0.75830078125, -0.680419921875, -0.6025390625, -0.524658203125, -0.44677734375, -0.368896484375, -0.291015625, -0.213134765625, -0.13525390625, -0.057373046875, 0.0205078125, 0.098388671875, 0.17626953125, 0.254150390625, 0.33203125, 0.409912109375, 0.48779296875, 0.565673828125, 0.6435546875, 0.721435546875, 0.79931640625, 0.877197265625, 0.955078125, 1.032958984375, 1.11083984375, 1.188720703125, 1.2666015625, 1.344482421875, 1.42236328125, 1.500244140625, 1.578125, 1.656005859375, 1.73388671875, 1.811767578125, 1.8896484375, 1.967529296875, 2.04541015625, 2.123291015625, 2.201171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 30.0, 80.0, 171.0, 237.0, 230.0, 137.0, 60.0, 18.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.856782913208008, -29.00043296813965, -28.14408302307129, -27.28773307800293, -26.431381225585938, -25.575031280517578, -24.71868133544922, -23.86233139038086, -23.0059814453125, -22.14963150024414, -21.29328155517578, -20.436931610107422, -19.580581665039062, -18.724231719970703, -17.86787986755371, -17.01152992248535, -16.155179977416992, -15.298830032348633, -14.442480087280273, -13.586129188537598, -12.729779243469238, -11.873429298400879, -11.017078399658203, -10.160728454589844, -9.304378509521484, -8.448028564453125, -7.591678142547607, -6.73532772064209, -5.8789777755737305, -5.022627830505371, -4.1662774085998535, -3.309926986694336, -2.4535751342773438, -1.5972249507904053, -0.7408747673034668, 0.11547541618347168, 0.9718255996704102, 1.8281755447387695, 2.684525966644287, 3.5408763885498047, 4.397226333618164, 5.253576278686523, 6.109926700592041, 6.966277122497559, 7.822627067565918, 8.678977012634277, 9.535327911376953, 10.391677856445312, 11.248027801513672, 12.104377746582031, 12.96072769165039, 13.817078590393066, 14.673428535461426, 15.529778480529785, 16.38612937927246, 17.24247932434082, 18.09882926940918, 18.95517921447754, 19.8115291595459, 20.667879104614258, 21.52423095703125, 22.38058090209961, 23.23693084716797, 24.093280792236328, 24.949630737304688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 2.0, 11.0, 19.0, 17.0, 24.0, 22.0, 32.0, 29.0, 43.0, 35.0, 47.0, 38.0, 63.0, 52.0, 47.0, 48.0, 48.0, 56.0, 35.0, 41.0, 45.0, 33.0, 32.0, 33.0, 26.0, 20.0, 19.0, 17.0, 11.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.195155143737793, -7.932441234588623, -7.669727325439453, -7.407013893127441, -7.1442999839782715, -6.881586074829102, -6.61887264251709, -6.35615873336792, -6.09344482421875, -5.83073091506958, -5.56801700592041, -5.305303573608398, -5.0425896644592285, -4.779875755310059, -4.517162322998047, -4.254448413848877, -3.991734504699707, -3.729020595550537, -3.4663069248199463, -3.2035932540893555, -2.9408793449401855, -2.6781654357910156, -2.415451765060425, -2.152738094329834, -1.890024185180664, -1.6273103952407837, -1.3645966053009033, -1.101882815361023, -0.8391690254211426, -0.5764552354812622, -0.31374144554138184, -0.051027655601501465, 0.2116870880126953, 0.4744008779525757, 0.737114667892456, 0.9998284578323364, 1.2625422477722168, 1.5252560377120972, 1.7879698276519775, 2.0506834983825684, 2.3133974075317383, 2.576111316680908, 2.838824987411499, 3.10153865814209, 3.3642525672912598, 3.6269664764404297, 3.8896801471710205, 4.152393817901611, 4.415107727050781, 4.677821636199951, 4.940535545349121, 5.203248977661133, 5.465962886810303, 5.728676795959473, 5.991390228271484, 6.254104137420654, 6.516818046569824, 6.779531955718994, 7.042245864868164, 7.304959297180176, 7.567673206329346, 7.830387115478516, 8.093100547790527, 8.355814933776855, 8.618528366088867]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 8.0, 19.0, 18.0, 20.0, 35.0, 51.0, 88.0, 122.0, 223.0, 342.0, 608.0, 1307.0, 2633.0, 5583.0, 13045.0, 32509.0, 88298.0, 278579.0, 413352.0, 132316.0, 46381.0, 18195.0, 7632.0, 3457.0, 1757.0, 847.0, 435.0, 250.0, 135.0, 98.0, 68.0, 49.0, 25.0, 21.0, 9.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.87591552734375, -4.7088623046875, -4.54180908203125, -4.374755859375, -4.20770263671875, -4.0406494140625, -3.87359619140625, -3.70654296875, -3.53948974609375, -3.3724365234375, -3.20538330078125, -3.038330078125, -2.87127685546875, -2.7042236328125, -2.53717041015625, -2.3701171875, -2.20306396484375, -2.0360107421875, -1.86895751953125, -1.701904296875, -1.53485107421875, -1.3677978515625, -1.20074462890625, -1.03369140625, -0.86663818359375, -0.6995849609375, -0.53253173828125, -0.365478515625, -0.19842529296875, -0.0313720703125, 0.13568115234375, 0.302734375, 0.46978759765625, 0.6368408203125, 0.80389404296875, 0.970947265625, 1.13800048828125, 1.3050537109375, 1.47210693359375, 1.63916015625, 1.80621337890625, 1.9732666015625, 2.14031982421875, 2.307373046875, 2.47442626953125, 2.6414794921875, 2.80853271484375, 2.9755859375, 3.14263916015625, 3.3096923828125, 3.47674560546875, 3.643798828125, 3.81085205078125, 3.9779052734375, 4.14495849609375, 4.31201171875, 4.47906494140625, 4.6461181640625, 4.81317138671875, 4.980224609375, 5.14727783203125, 5.3143310546875, 5.48138427734375, 5.6484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 6.0, 10.0, 13.0, 16.0, 11.0, 21.0, 21.0, 23.0, 31.0, 33.0, 44.0, 52.0, 61.0, 76.0, 56.0, 62.0, 57.0, 61.0, 55.0, 44.0, 41.0, 39.0, 40.0, 35.0, 19.0, 20.0, 8.0, 13.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.898040771484375, -0.86541748046875, -0.832794189453125, -0.8001708984375, -0.767547607421875, -0.73492431640625, -0.702301025390625, -0.669677734375, -0.637054443359375, -0.60443115234375, -0.571807861328125, -0.5391845703125, -0.506561279296875, -0.47393798828125, -0.441314697265625, -0.40869140625, -0.376068115234375, -0.34344482421875, -0.310821533203125, -0.2781982421875, -0.245574951171875, -0.21295166015625, -0.180328369140625, -0.147705078125, -0.115081787109375, -0.08245849609375, -0.049835205078125, -0.0172119140625, 0.015411376953125, 0.04803466796875, 0.080657958984375, 0.11328125, 0.145904541015625, 0.17852783203125, 0.211151123046875, 0.2437744140625, 0.276397705078125, 0.30902099609375, 0.341644287109375, 0.374267578125, 0.406890869140625, 0.43951416015625, 0.472137451171875, 0.5047607421875, 0.537384033203125, 0.57000732421875, 0.602630615234375, 0.63525390625, 0.667877197265625, 0.70050048828125, 0.733123779296875, 0.7657470703125, 0.798370361328125, 0.83099365234375, 0.863616943359375, 0.896240234375, 0.928863525390625, 0.96148681640625, 0.994110107421875, 1.0267333984375, 1.059356689453125, 1.09197998046875, 1.124603271484375, 1.1572265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 13.0, 10.0, 11.0, 15.0, 34.0, 33.0, 54.0, 75.0, 111.0, 196.0, 346.0, 583.0, 1245.0, 3311.0, 13385.0, 79009.0, 573452.0, 319610.0, 43967.0, 8559.0, 2387.0, 963.0, 434.0, 240.0, 161.0, 109.0, 81.0, 32.0, 30.0, 18.0, 15.0, 14.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.89306640625, -6.6455078125, -6.39794921875, -6.150390625, -5.90283203125, -5.6552734375, -5.40771484375, -5.16015625, -4.91259765625, -4.6650390625, -4.41748046875, -4.169921875, -3.92236328125, -3.6748046875, -3.42724609375, -3.1796875, -2.93212890625, -2.6845703125, -2.43701171875, -2.189453125, -1.94189453125, -1.6943359375, -1.44677734375, -1.19921875, -0.95166015625, -0.7041015625, -0.45654296875, -0.208984375, 0.03857421875, 0.2861328125, 0.53369140625, 0.78125, 1.02880859375, 1.2763671875, 1.52392578125, 1.771484375, 2.01904296875, 2.2666015625, 2.51416015625, 2.76171875, 3.00927734375, 3.2568359375, 3.50439453125, 3.751953125, 3.99951171875, 4.2470703125, 4.49462890625, 4.7421875, 4.98974609375, 5.2373046875, 5.48486328125, 5.732421875, 5.97998046875, 6.2275390625, 6.47509765625, 6.72265625, 6.97021484375, 7.2177734375, 7.46533203125, 7.712890625, 7.96044921875, 8.2080078125, 8.45556640625, 8.703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 5.0, 10.0, 7.0, 12.0, 11.0, 15.0, 16.0, 21.0, 35.0, 32.0, 30.0, 30.0, 53.0, 44.0, 49.0, 61.0, 54.0, 45.0, 57.0, 42.0, 60.0, 33.0, 41.0, 48.0, 34.0, 29.0, 16.0, 28.0, 11.0, 16.0, 17.0, 11.0, 4.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.222412109375, -4.07763671875, -3.932861328125, -3.7880859375, -3.643310546875, -3.49853515625, -3.353759765625, -3.208984375, -3.064208984375, -2.91943359375, -2.774658203125, -2.6298828125, -2.485107421875, -2.34033203125, -2.195556640625, -2.05078125, -1.906005859375, -1.76123046875, -1.616455078125, -1.4716796875, -1.326904296875, -1.18212890625, -1.037353515625, -0.892578125, -0.747802734375, -0.60302734375, -0.458251953125, -0.3134765625, -0.168701171875, -0.02392578125, 0.120849609375, 0.265625, 0.410400390625, 0.55517578125, 0.699951171875, 0.8447265625, 0.989501953125, 1.13427734375, 1.279052734375, 1.423828125, 1.568603515625, 1.71337890625, 1.858154296875, 2.0029296875, 2.147705078125, 2.29248046875, 2.437255859375, 2.58203125, 2.726806640625, 2.87158203125, 3.016357421875, 3.1611328125, 3.305908203125, 3.45068359375, 3.595458984375, 3.740234375, 3.885009765625, 4.02978515625, 4.174560546875, 4.3193359375, 4.464111328125, 4.60888671875, 4.753662109375, 4.8984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 5.0, 17.0, 15.0, 34.0, 40.0, 60.0, 99.0, 130.0, 219.0, 448.0, 1001.0, 2514.0, 9453.0, 84466.0, 836295.0, 98544.0, 10387.0, 2634.0, 1051.0, 480.0, 241.0, 141.0, 93.0, 44.0, 42.0, 30.0, 19.0, 13.0, 6.0, 6.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58203125, -7.29620361328125, -7.0103759765625, -6.72454833984375, -6.438720703125, -6.15289306640625, -5.8670654296875, -5.58123779296875, -5.29541015625, -5.00958251953125, -4.7237548828125, -4.43792724609375, -4.152099609375, -3.86627197265625, -3.5804443359375, -3.29461669921875, -3.0087890625, -2.72296142578125, -2.4371337890625, -2.15130615234375, -1.865478515625, -1.57965087890625, -1.2938232421875, -1.00799560546875, -0.72216796875, -0.43634033203125, -0.1505126953125, 0.13531494140625, 0.421142578125, 0.70697021484375, 0.9927978515625, 1.27862548828125, 1.564453125, 1.85028076171875, 2.1361083984375, 2.42193603515625, 2.707763671875, 2.99359130859375, 3.2794189453125, 3.56524658203125, 3.85107421875, 4.13690185546875, 4.4227294921875, 4.70855712890625, 4.994384765625, 5.28021240234375, 5.5660400390625, 5.85186767578125, 6.1376953125, 6.42352294921875, 6.7093505859375, 6.99517822265625, 7.281005859375, 7.56683349609375, 7.8526611328125, 8.13848876953125, 8.42431640625, 8.71014404296875, 8.9959716796875, 9.28179931640625, 9.567626953125, 9.85345458984375, 10.1392822265625, 10.42510986328125, 10.7109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 13.0, 12.0, 17.0, 24.0, 43.0, 41.0, 61.0, 134.0, 141.0, 142.0, 91.0, 43.0, 45.0, 29.0, 19.0, 19.0, 21.0, 10.0, 6.0, 10.0, 3.0, 8.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008206367492675781, -0.0007954463362693787, -0.0007702559232711792, -0.0007450655102729797, -0.0007198750972747803, -0.0006946846842765808, -0.0006694942712783813, -0.0006443038582801819, -0.0006191134452819824, -0.000593923032283783, -0.0005687326192855835, -0.000543542206287384, -0.0005183517932891846, -0.0004931613802909851, -0.00046797096729278564, -0.0004427805542945862, -0.0004175901412963867, -0.00039239972829818726, -0.0003672093152999878, -0.00034201890230178833, -0.00031682848930358887, -0.0002916380763053894, -0.00026644766330718994, -0.00024125725030899048, -0.00021606683731079102, -0.00019087642431259155, -0.0001656860113143921, -0.00014049559831619263, -0.00011530518531799316, -9.01147723197937e-05, -6.492435932159424e-05, -3.9733946323394775e-05, -1.4543533325195312e-05, 1.064687967300415e-05, 3.583729267120361e-05, 6.1027705669403076e-05, 8.621811866760254e-05, 0.000111408531665802, 0.00013659894466400146, 0.00016178935766220093, 0.0001869797706604004, 0.00021217018365859985, 0.00023736059665679932, 0.0002625510096549988, 0.00028774142265319824, 0.0003129318356513977, 0.00033812224864959717, 0.00036331266164779663, 0.0003885030746459961, 0.00041369348764419556, 0.000438883900642395, 0.0004640743136405945, 0.0004892647266387939, 0.0005144551396369934, 0.0005396455526351929, 0.0005648359656333923, 0.0005900263786315918, 0.0006152167916297913, 0.0006404072046279907, 0.0006655976176261902, 0.0006907880306243896, 0.0007159784436225891, 0.0007411688566207886, 0.000766359269618988, 0.0007915496826171875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 27.0, 32.0, 74.0, 124.0, 284.0, 772.0, 2704.0, 15629.0, 792614.0, 225289.0, 8176.0, 1681.0, 621.0, 235.0, 121.0, 56.0, 26.0, 18.0, 16.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.015625, -15.592529296875, -15.16943359375, -14.746337890625, -14.3232421875, -13.900146484375, -13.47705078125, -13.053955078125, -12.630859375, -12.207763671875, -11.78466796875, -11.361572265625, -10.9384765625, -10.515380859375, -10.09228515625, -9.669189453125, -9.24609375, -8.822998046875, -8.39990234375, -7.976806640625, -7.5537109375, -7.130615234375, -6.70751953125, -6.284423828125, -5.861328125, -5.438232421875, -5.01513671875, -4.592041015625, -4.1689453125, -3.745849609375, -3.32275390625, -2.899658203125, -2.4765625, -2.053466796875, -1.63037109375, -1.207275390625, -0.7841796875, -0.361083984375, 0.06201171875, 0.485107421875, 0.908203125, 1.331298828125, 1.75439453125, 2.177490234375, 2.6005859375, 3.023681640625, 3.44677734375, 3.869873046875, 4.29296875, 4.716064453125, 5.13916015625, 5.562255859375, 5.9853515625, 6.408447265625, 6.83154296875, 7.254638671875, 7.677734375, 8.100830078125, 8.52392578125, 8.947021484375, 9.3701171875, 9.793212890625, 10.21630859375, 10.639404296875, 11.0625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 7.0, 18.0, 21.0, 32.0, 71.0, 96.0, 130.0, 168.0, 135.0, 95.0, 69.0, 51.0, 29.0, 9.0, 14.0, 5.0, 10.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.33721923828125, -4.1744384765625, -4.01165771484375, -3.848876953125, -3.68609619140625, -3.5233154296875, -3.36053466796875, -3.19775390625, -3.03497314453125, -2.8721923828125, -2.70941162109375, -2.546630859375, -2.38385009765625, -2.2210693359375, -2.05828857421875, -1.8955078125, -1.73272705078125, -1.5699462890625, -1.40716552734375, -1.244384765625, -1.08160400390625, -0.9188232421875, -0.75604248046875, -0.59326171875, -0.43048095703125, -0.2677001953125, -0.10491943359375, 0.057861328125, 0.22064208984375, 0.3834228515625, 0.54620361328125, 0.708984375, 0.87176513671875, 1.0345458984375, 1.19732666015625, 1.360107421875, 1.52288818359375, 1.6856689453125, 1.84844970703125, 2.01123046875, 2.17401123046875, 2.3367919921875, 2.49957275390625, 2.662353515625, 2.82513427734375, 2.9879150390625, 3.15069580078125, 3.3134765625, 3.47625732421875, 3.6390380859375, 3.80181884765625, 3.964599609375, 4.12738037109375, 4.2901611328125, 4.45294189453125, 4.61572265625, 4.77850341796875, 4.9412841796875, 5.10406494140625, 5.266845703125, 5.42962646484375, 5.5924072265625, 5.75518798828125, 5.91796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 13.0, 37.0, 150.0, 317.0, 277.0, 149.0, 39.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.17984008789062, -138.70510864257812, -135.23037719726562, -131.7556610107422, -128.2809295654297, -124.80619812011719, -121.33146667480469, -117.85674285888672, -114.38201141357422, -110.90727996826172, -107.43255615234375, -103.95782470703125, -100.48310089111328, -97.00836944580078, -93.53364562988281, -90.05891418457031, -86.58418273925781, -83.10945129394531, -79.63472747802734, -76.15999603271484, -72.68527221679688, -69.21054077148438, -65.73580932617188, -62.261085510253906, -58.78636169433594, -55.3116340637207, -51.83690643310547, -48.36217498779297, -44.887447357177734, -41.4127197265625, -37.937992095947266, -34.46326446533203, -30.98853302001953, -27.513805389404297, -24.03907585144043, -20.564348220825195, -17.089618682861328, -13.614891052246094, -10.14016342163086, -6.665433883666992, -3.190706253051758, 0.28402209281921387, 3.7587504386901855, 7.233478546142578, 10.708207130432129, 14.18293571472168, 17.657663345336914, 21.13239288330078, 24.607120513916016, 28.08184814453125, 31.556577682495117, 35.03130340576172, 38.50603485107422, 41.98076248168945, 45.45549011230469, 48.93022155761719, 52.404945373535156, 55.87967300415039, 59.354400634765625, 62.829132080078125, 66.3038558959961, 69.7785873413086, 73.25331115722656, 76.72804260253906, 80.20277404785156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 13.0, 10.0, 14.0, 8.0, 25.0, 23.0, 18.0, 24.0, 22.0, 34.0, 24.0, 35.0, 30.0, 54.0, 40.0, 42.0, 43.0, 45.0, 39.0, 45.0, 45.0, 33.0, 45.0, 31.0, 23.0, 32.0, 28.0, 15.0, 16.0, 18.0, 11.0, 12.0, 16.0, 20.0, 7.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.59099769592285, -21.890220642089844, -21.189443588256836, -20.488666534423828, -19.78788948059082, -19.087112426757812, -18.386335372924805, -17.685558319091797, -16.98478126525879, -16.28400421142578, -15.583227157592773, -14.882450103759766, -14.181673049926758, -13.48089599609375, -12.780118942260742, -12.079341888427734, -11.378564834594727, -10.677787780761719, -9.977010726928711, -9.276233673095703, -8.575456619262695, -7.8746795654296875, -7.17390251159668, -6.473125457763672, -5.772348403930664, -5.071571350097656, -4.370794296264648, -3.6700172424316406, -2.969240188598633, -2.268463134765625, -1.5676860809326172, -0.8669090270996094, -0.16613388061523438, 0.5346431732177734, 1.2354202270507812, 1.936197280883789, 2.636974334716797, 3.3377513885498047, 4.0385284423828125, 4.73930549621582, 5.440082550048828, 6.140859603881836, 6.841636657714844, 7.542413711547852, 8.24319076538086, 8.943967819213867, 9.644744873046875, 10.345521926879883, 11.04629898071289, 11.747076034545898, 12.447853088378906, 13.148630142211914, 13.849407196044922, 14.55018424987793, 15.250961303710938, 15.951738357543945, 16.652515411376953, 17.35329246520996, 18.05406951904297, 18.754846572875977, 19.455623626708984, 20.156400680541992, 20.857177734375, 21.557954788208008, 22.258731842041016]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 20.0, 24.0, 24.0, 50.0, 67.0, 135.0, 213.0, 387.0, 696.0, 1410.0, 3332.0, 8569.0, 26686.0, 118018.0, 3131608.0, 794106.0, 77981.0, 19704.0, 6503.0, 2466.0, 1111.0, 503.0, 283.0, 144.0, 85.0, 46.0, 30.0, 27.0, 14.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -3.97454833984375, -3.7928466796875, -3.61114501953125, -3.429443359375, -3.24774169921875, -3.0660400390625, -2.88433837890625, -2.70263671875, -2.52093505859375, -2.3392333984375, -2.15753173828125, -1.975830078125, -1.79412841796875, -1.6124267578125, -1.43072509765625, -1.2490234375, -1.06732177734375, -0.8856201171875, -0.70391845703125, -0.522216796875, -0.34051513671875, -0.1588134765625, 0.02288818359375, 0.20458984375, 0.38629150390625, 0.5679931640625, 0.74969482421875, 0.931396484375, 1.11309814453125, 1.2947998046875, 1.47650146484375, 1.658203125, 1.83990478515625, 2.0216064453125, 2.20330810546875, 2.385009765625, 2.56671142578125, 2.7484130859375, 2.93011474609375, 3.11181640625, 3.29351806640625, 3.4752197265625, 3.65692138671875, 3.838623046875, 4.02032470703125, 4.2020263671875, 4.38372802734375, 4.5654296875, 4.74713134765625, 4.9288330078125, 5.11053466796875, 5.292236328125, 5.47393798828125, 5.6556396484375, 5.83734130859375, 6.01904296875, 6.20074462890625, 6.3824462890625, 6.56414794921875, 6.745849609375, 6.92755126953125, 7.1092529296875, 7.29095458984375, 7.47265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 5.0, 8.0, 12.0, 5.0, 18.0, 27.0, 15.0, 31.0, 42.0, 46.0, 62.0, 52.0, 56.0, 55.0, 62.0, 67.0, 51.0, 56.0, 59.0, 50.0, 49.0, 38.0, 25.0, 35.0, 13.0, 12.0, 10.0, 4.0, 6.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -1.0113372802734375, -0.974822998046875, -0.9383087158203125, -0.90179443359375, -0.8652801513671875, -0.828765869140625, -0.7922515869140625, -0.7557373046875, -0.7192230224609375, -0.682708740234375, -0.6461944580078125, -0.60968017578125, -0.5731658935546875, -0.536651611328125, -0.5001373291015625, -0.463623046875, -0.4271087646484375, -0.390594482421875, -0.3540802001953125, -0.31756591796875, -0.2810516357421875, -0.244537353515625, -0.2080230712890625, -0.1715087890625, -0.1349945068359375, -0.098480224609375, -0.0619659423828125, -0.02545166015625, 0.0110626220703125, 0.047576904296875, 0.0840911865234375, 0.12060546875, 0.1571197509765625, 0.193634033203125, 0.2301483154296875, 0.26666259765625, 0.3031768798828125, 0.339691162109375, 0.3762054443359375, 0.4127197265625, 0.4492340087890625, 0.485748291015625, 0.5222625732421875, 0.55877685546875, 0.5952911376953125, 0.631805419921875, 0.6683197021484375, 0.704833984375, 0.7413482666015625, 0.777862548828125, 0.8143768310546875, 0.85089111328125, 0.8874053955078125, 0.923919677734375, 0.9604339599609375, 0.9969482421875, 1.0334625244140625, 1.069976806640625, 1.1064910888671875, 1.14300537109375, 1.1795196533203125, 1.216033935546875, 1.2525482177734375, 1.2890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 9.0, 16.0, 24.0, 30.0, 48.0, 72.0, 124.0, 211.0, 333.0, 607.0, 1049.0, 1938.0, 3647.0, 7759.0, 17973.0, 49154.0, 177594.0, 2260314.0, 1437548.0, 158003.0, 45190.0, 17102.0, 7528.0, 3657.0, 1790.0, 1022.0, 559.0, 317.0, 208.0, 151.0, 103.0, 62.0, 50.0, 19.0, 27.0, 5.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.05859375, -4.91387939453125, -4.7691650390625, -4.62445068359375, -4.479736328125, -4.33502197265625, -4.1903076171875, -4.04559326171875, -3.90087890625, -3.75616455078125, -3.6114501953125, -3.46673583984375, -3.322021484375, -3.17730712890625, -3.0325927734375, -2.88787841796875, -2.7431640625, -2.59844970703125, -2.4537353515625, -2.30902099609375, -2.164306640625, -2.01959228515625, -1.8748779296875, -1.73016357421875, -1.58544921875, -1.44073486328125, -1.2960205078125, -1.15130615234375, -1.006591796875, -0.86187744140625, -0.7171630859375, -0.57244873046875, -0.427734375, -0.28302001953125, -0.1383056640625, 0.00640869140625, 0.151123046875, 0.29583740234375, 0.4405517578125, 0.58526611328125, 0.72998046875, 0.87469482421875, 1.0194091796875, 1.16412353515625, 1.308837890625, 1.45355224609375, 1.5982666015625, 1.74298095703125, 1.8876953125, 2.03240966796875, 2.1771240234375, 2.32183837890625, 2.466552734375, 2.61126708984375, 2.7559814453125, 2.90069580078125, 3.04541015625, 3.19012451171875, 3.3348388671875, 3.47955322265625, 3.624267578125, 3.76898193359375, 3.9136962890625, 4.05841064453125, 4.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 21.0, 19.0, 25.0, 40.0, 42.0, 84.0, 129.0, 192.0, 345.0, 1015.0, 1057.0, 395.0, 193.0, 140.0, 95.0, 57.0, 33.0, 32.0, 22.0, 18.0, 12.0, 16.0, 12.0, 10.0, 3.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.060546875, -1.991973876953125, -1.92340087890625, -1.854827880859375, -1.7862548828125, -1.717681884765625, -1.64910888671875, -1.580535888671875, -1.511962890625, -1.443389892578125, -1.37481689453125, -1.306243896484375, -1.2376708984375, -1.169097900390625, -1.10052490234375, -1.031951904296875, -0.96337890625, -0.894805908203125, -0.82623291015625, -0.757659912109375, -0.6890869140625, -0.620513916015625, -0.55194091796875, -0.483367919921875, -0.414794921875, -0.346221923828125, -0.27764892578125, -0.209075927734375, -0.1405029296875, -0.071929931640625, -0.00335693359375, 0.065216064453125, 0.1337890625, 0.202362060546875, 0.27093505859375, 0.339508056640625, 0.4080810546875, 0.476654052734375, 0.54522705078125, 0.613800048828125, 0.682373046875, 0.750946044921875, 0.81951904296875, 0.888092041015625, 0.9566650390625, 1.025238037109375, 1.09381103515625, 1.162384033203125, 1.23095703125, 1.299530029296875, 1.36810302734375, 1.436676025390625, 1.5052490234375, 1.573822021484375, 1.64239501953125, 1.710968017578125, 1.779541015625, 1.848114013671875, 1.91668701171875, 1.985260009765625, 2.0538330078125, 2.122406005859375, 2.19097900390625, 2.259552001953125, 2.328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 17.0, 50.0, 87.0, 164.0, 207.0, 212.0, 127.0, 62.0, 31.0, 20.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.24348258972168, -21.3341121673584, -20.424741744995117, -19.515371322631836, -18.606000900268555, -17.696630477905273, -16.787261962890625, -15.877890586853027, -14.968520164489746, -14.059149742126465, -13.149779319763184, -12.240409851074219, -11.331039428710938, -10.421669006347656, -9.512298583984375, -8.602928161621094, -7.6935577392578125, -6.784187316894531, -5.87481689453125, -4.965446949005127, -4.056076526641846, -3.1467061042785645, -2.2373361587524414, -1.3279657363891602, -0.4185953140258789, 0.4907749891281128, 1.4001452922821045, 2.3095154762268066, 3.218885898590088, 4.128256320953369, 5.037626266479492, 5.946996688842773, 6.856365203857422, 7.765735626220703, 8.675106048583984, 9.584476470947266, 10.493846893310547, 11.403217315673828, 12.312586784362793, 13.221957206726074, 14.131327629089355, 15.040698051452637, 15.950068473815918, 16.859437942504883, 17.768808364868164, 18.678178787231445, 19.587549209594727, 20.496919631958008, 21.40629005432129, 22.31566047668457, 23.22503089904785, 24.134401321411133, 25.043771743774414, 25.953142166137695, 26.862510681152344, 27.771881103515625, 28.681251525878906, 29.590621948242188, 30.49999237060547, 31.40936279296875, 32.31873321533203, 33.22810363769531, 34.137474060058594, 35.046844482421875, 35.956214904785156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 4.0, 8.0, 15.0, 11.0, 16.0, 19.0, 25.0, 29.0, 34.0, 30.0, 36.0, 44.0, 37.0, 46.0, 45.0, 51.0, 53.0, 36.0, 39.0, 44.0, 39.0, 46.0, 35.0, 31.0, 36.0, 31.0, 26.0, 22.0, 16.0, 28.0, 14.0, 7.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203773498535156, -8.894710540771484, -8.585647583007812, -8.27658462524414, -7.967521667480469, -7.658458709716797, -7.349395751953125, -7.040332794189453, -6.731269836425781, -6.422206878662109, -6.1131439208984375, -5.804080963134766, -5.495018005371094, -5.185955047607422, -4.87689208984375, -4.567829132080078, -4.258766174316406, -3.9497032165527344, -3.6406402587890625, -3.3315773010253906, -3.0225143432617188, -2.713451385498047, -2.404388427734375, -2.095325469970703, -1.7862625122070312, -1.4771995544433594, -1.1681365966796875, -0.8590736389160156, -0.5500106811523438, -0.24094772338867188, 0.068115234375, 0.3771781921386719, 0.6862411499023438, 0.9953041076660156, 1.3043670654296875, 1.6134300231933594, 1.9224929809570312, 2.231555938720703, 2.540618896484375, 2.849681854248047, 3.1587448120117188, 3.4678077697753906, 3.7768707275390625, 4.085933685302734, 4.394996643066406, 4.704059600830078, 5.01312255859375, 5.322185516357422, 5.631248474121094, 5.940311431884766, 6.2493743896484375, 6.558437347412109, 6.867500305175781, 7.176563262939453, 7.485626220703125, 7.794689178466797, 8.103752136230469, 8.41281509399414, 8.721878051757812, 9.030941009521484, 9.340003967285156, 9.649066925048828, 9.9581298828125, 10.267192840576172, 10.576255798339844]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 19.0, 15.0, 22.0, 28.0, 44.0, 95.0, 127.0, 274.0, 420.0, 778.0, 1505.0, 3078.0, 6518.0, 15613.0, 39708.0, 118723.0, 645624.0, 139889.0, 44807.0, 17224.0, 7245.0, 3201.0, 1594.0, 850.0, 515.0, 257.0, 129.0, 92.0, 57.0, 35.0, 21.0, 21.0, 5.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.41998291015625, -6.2227783203125, -6.02557373046875, -5.828369140625, -5.63116455078125, -5.4339599609375, -5.23675537109375, -5.03955078125, -4.84234619140625, -4.6451416015625, -4.44793701171875, -4.250732421875, -4.05352783203125, -3.8563232421875, -3.65911865234375, -3.4619140625, -3.26470947265625, -3.0675048828125, -2.87030029296875, -2.673095703125, -2.47589111328125, -2.2786865234375, -2.08148193359375, -1.88427734375, -1.68707275390625, -1.4898681640625, -1.29266357421875, -1.095458984375, -0.89825439453125, -0.7010498046875, -0.50384521484375, -0.306640625, -0.10943603515625, 0.0877685546875, 0.28497314453125, 0.482177734375, 0.67938232421875, 0.8765869140625, 1.07379150390625, 1.27099609375, 1.46820068359375, 1.6654052734375, 1.86260986328125, 2.059814453125, 2.25701904296875, 2.4542236328125, 2.65142822265625, 2.8486328125, 3.04583740234375, 3.2430419921875, 3.44024658203125, 3.637451171875, 3.83465576171875, 4.0318603515625, 4.22906494140625, 4.42626953125, 4.62347412109375, 4.8206787109375, 5.01788330078125, 5.215087890625, 5.41229248046875, 5.6094970703125, 5.80670166015625, 6.00390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 8.0, 10.0, 18.0, 19.0, 19.0, 18.0, 35.0, 30.0, 39.0, 46.0, 54.0, 58.0, 52.0, 46.0, 64.0, 61.0, 50.0, 63.0, 48.0, 40.0, 32.0, 28.0, 25.0, 23.0, 19.0, 20.0, 11.0, 7.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.861358642578125, -0.82720947265625, -0.793060302734375, -0.7589111328125, -0.724761962890625, -0.69061279296875, -0.656463623046875, -0.622314453125, -0.588165283203125, -0.55401611328125, -0.519866943359375, -0.4857177734375, -0.451568603515625, -0.41741943359375, -0.383270263671875, -0.34912109375, -0.314971923828125, -0.28082275390625, -0.246673583984375, -0.2125244140625, -0.178375244140625, -0.14422607421875, -0.110076904296875, -0.075927734375, -0.041778564453125, -0.00762939453125, 0.026519775390625, 0.0606689453125, 0.094818115234375, 0.12896728515625, 0.163116455078125, 0.197265625, 0.231414794921875, 0.26556396484375, 0.299713134765625, 0.3338623046875, 0.368011474609375, 0.40216064453125, 0.436309814453125, 0.470458984375, 0.504608154296875, 0.53875732421875, 0.572906494140625, 0.6070556640625, 0.641204833984375, 0.67535400390625, 0.709503173828125, 0.74365234375, 0.777801513671875, 0.81195068359375, 0.846099853515625, 0.8802490234375, 0.914398193359375, 0.94854736328125, 0.982696533203125, 1.016845703125, 1.050994873046875, 1.08514404296875, 1.119293212890625, 1.1534423828125, 1.187591552734375, 1.22174072265625, 1.255889892578125, 1.2900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 13.0, 14.0, 18.0, 22.0, 29.0, 44.0, 57.0, 96.0, 138.0, 237.0, 409.0, 737.0, 1600.0, 4537.0, 17995.0, 91339.0, 768581.0, 128274.0, 24610.0, 5853.0, 1879.0, 798.0, 454.0, 279.0, 158.0, 99.0, 73.0, 51.0, 38.0, 31.0, 20.0, 9.0, 6.0, 10.0, 7.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1875, -7.910888671875, -7.63427734375, -7.357666015625, -7.0810546875, -6.804443359375, -6.52783203125, -6.251220703125, -5.974609375, -5.697998046875, -5.42138671875, -5.144775390625, -4.8681640625, -4.591552734375, -4.31494140625, -4.038330078125, -3.76171875, -3.485107421875, -3.20849609375, -2.931884765625, -2.6552734375, -2.378662109375, -2.10205078125, -1.825439453125, -1.548828125, -1.272216796875, -0.99560546875, -0.718994140625, -0.4423828125, -0.165771484375, 0.11083984375, 0.387451171875, 0.6640625, 0.940673828125, 1.21728515625, 1.493896484375, 1.7705078125, 2.047119140625, 2.32373046875, 2.600341796875, 2.876953125, 3.153564453125, 3.43017578125, 3.706787109375, 3.9833984375, 4.260009765625, 4.53662109375, 4.813232421875, 5.08984375, 5.366455078125, 5.64306640625, 5.919677734375, 6.1962890625, 6.472900390625, 6.74951171875, 7.026123046875, 7.302734375, 7.579345703125, 7.85595703125, 8.132568359375, 8.4091796875, 8.685791015625, 8.96240234375, 9.239013671875, 9.515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 7.0, 12.0, 10.0, 27.0, 36.0, 36.0, 51.0, 43.0, 43.0, 61.0, 61.0, 64.0, 43.0, 68.0, 48.0, 53.0, 52.0, 49.0, 41.0, 39.0, 28.0, 32.0, 17.0, 13.0, 10.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.9375, -5.767333984375, -5.59716796875, -5.427001953125, -5.2568359375, -5.086669921875, -4.91650390625, -4.746337890625, -4.576171875, -4.406005859375, -4.23583984375, -4.065673828125, -3.8955078125, -3.725341796875, -3.55517578125, -3.385009765625, -3.21484375, -3.044677734375, -2.87451171875, -2.704345703125, -2.5341796875, -2.364013671875, -2.19384765625, -2.023681640625, -1.853515625, -1.683349609375, -1.51318359375, -1.343017578125, -1.1728515625, -1.002685546875, -0.83251953125, -0.662353515625, -0.4921875, -0.322021484375, -0.15185546875, 0.018310546875, 0.1884765625, 0.358642578125, 0.52880859375, 0.698974609375, 0.869140625, 1.039306640625, 1.20947265625, 1.379638671875, 1.5498046875, 1.719970703125, 1.89013671875, 2.060302734375, 2.23046875, 2.400634765625, 2.57080078125, 2.740966796875, 2.9111328125, 3.081298828125, 3.25146484375, 3.421630859375, 3.591796875, 3.761962890625, 3.93212890625, 4.102294921875, 4.2724609375, 4.442626953125, 4.61279296875, 4.782958984375, 4.953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 20.0, 29.0, 43.0, 58.0, 112.0, 172.0, 302.0, 540.0, 1160.0, 2275.0, 5742.0, 15629.0, 46922.0, 203773.0, 631187.0, 93405.0, 29439.0, 10284.0, 3848.0, 1717.0, 853.0, 411.0, 228.0, 121.0, 71.0, 68.0, 42.0, 28.0, 16.0, 9.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.3428955078125, -3.228759765625, -3.1146240234375, -3.00048828125, -2.8863525390625, -2.772216796875, -2.6580810546875, -2.5439453125, -2.4298095703125, -2.315673828125, -2.2015380859375, -2.08740234375, -1.9732666015625, -1.859130859375, -1.7449951171875, -1.630859375, -1.5167236328125, -1.402587890625, -1.2884521484375, -1.17431640625, -1.0601806640625, -0.946044921875, -0.8319091796875, -0.7177734375, -0.6036376953125, -0.489501953125, -0.3753662109375, -0.26123046875, -0.1470947265625, -0.032958984375, 0.0811767578125, 0.1953125, 0.3094482421875, 0.423583984375, 0.5377197265625, 0.65185546875, 0.7659912109375, 0.880126953125, 0.9942626953125, 1.1083984375, 1.2225341796875, 1.336669921875, 1.4508056640625, 1.56494140625, 1.6790771484375, 1.793212890625, 1.9073486328125, 2.021484375, 2.1356201171875, 2.249755859375, 2.3638916015625, 2.47802734375, 2.5921630859375, 2.706298828125, 2.8204345703125, 2.9345703125, 3.0487060546875, 3.162841796875, 3.2769775390625, 3.39111328125, 3.5052490234375, 3.619384765625, 3.7335205078125, 3.84765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 9.0, 3.0, 5.0, 13.0, 4.0, 10.0, 8.0, 14.0, 22.0, 22.0, 32.0, 51.0, 122.0, 326.0, 148.0, 55.0, 28.0, 36.0, 17.0, 10.0, 8.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010080337524414062, -0.0009760856628417969, -0.0009441375732421875, -0.0009121894836425781, -0.0008802413940429688, -0.0008482933044433594, -0.00081634521484375, -0.0007843971252441406, -0.0007524490356445312, -0.0007205009460449219, -0.0006885528564453125, -0.0006566047668457031, -0.0006246566772460938, -0.0005927085876464844, -0.000560760498046875, -0.0005288124084472656, -0.0004968643188476562, -0.0004649162292480469, -0.0004329681396484375, -0.0004010200500488281, -0.00036907196044921875, -0.0003371238708496094, -0.00030517578125, -0.0002732276916503906, -0.00024127960205078125, -0.00020933151245117188, -0.0001773834228515625, -0.00014543533325195312, -0.00011348724365234375, -8.153915405273438e-05, -4.9591064453125e-05, -1.7642974853515625e-05, 1.430511474609375e-05, 4.6253204345703125e-05, 7.82012939453125e-05, 0.00011014938354492188, 0.00014209747314453125, 0.00017404556274414062, 0.00020599365234375, 0.00023794174194335938, 0.00026988983154296875, 0.0003018379211425781, 0.0003337860107421875, 0.0003657341003417969, 0.00039768218994140625, 0.0004296302795410156, 0.000461578369140625, 0.0004935264587402344, 0.0005254745483398438, 0.0005574226379394531, 0.0005893707275390625, 0.0006213188171386719, 0.0006532669067382812, 0.0006852149963378906, 0.0007171630859375, 0.0007491111755371094, 0.0007810592651367188, 0.0008130073547363281, 0.0008449554443359375, 0.0008769035339355469, 0.0009088516235351562, 0.0009407997131347656, 0.000972747802734375, 0.0010046958923339844, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 9.0, 7.0, 19.0, 23.0, 34.0, 62.0, 105.0, 117.0, 264.0, 560.0, 1469.0, 5220.0, 31444.0, 350213.0, 606255.0, 43164.0, 6534.0, 1666.0, 649.0, 306.0, 163.0, 89.0, 56.0, 30.0, 21.0, 16.0, 10.0, 10.0, 5.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.34246826171875, -4.1693115234375, -3.99615478515625, -3.822998046875, -3.64984130859375, -3.4766845703125, -3.30352783203125, -3.13037109375, -2.95721435546875, -2.7840576171875, -2.61090087890625, -2.437744140625, -2.26458740234375, -2.0914306640625, -1.91827392578125, -1.7451171875, -1.57196044921875, -1.3988037109375, -1.22564697265625, -1.052490234375, -0.87933349609375, -0.7061767578125, -0.53302001953125, -0.35986328125, -0.18670654296875, -0.0135498046875, 0.15960693359375, 0.332763671875, 0.50592041015625, 0.6790771484375, 0.85223388671875, 1.025390625, 1.19854736328125, 1.3717041015625, 1.54486083984375, 1.718017578125, 1.89117431640625, 2.0643310546875, 2.23748779296875, 2.41064453125, 2.58380126953125, 2.7569580078125, 2.93011474609375, 3.103271484375, 3.27642822265625, 3.4495849609375, 3.62274169921875, 3.7958984375, 3.96905517578125, 4.1422119140625, 4.31536865234375, 4.488525390625, 4.66168212890625, 4.8348388671875, 5.00799560546875, 5.18115234375, 5.35430908203125, 5.5274658203125, 5.70062255859375, 5.873779296875, 6.04693603515625, 6.2200927734375, 6.39324951171875, 6.56640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 16.0, 3.0, 7.0, 8.0, 9.0, 20.0, 14.0, 28.0, 19.0, 26.0, 41.0, 65.0, 117.0, 134.0, 108.0, 102.0, 69.0, 29.0, 26.0, 22.0, 16.0, 13.0, 21.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.509735107421875, -2.43939208984375, -2.369049072265625, -2.2987060546875, -2.228363037109375, -2.15802001953125, -2.087677001953125, -2.017333984375, -1.946990966796875, -1.87664794921875, -1.806304931640625, -1.7359619140625, -1.665618896484375, -1.59527587890625, -1.524932861328125, -1.45458984375, -1.384246826171875, -1.31390380859375, -1.243560791015625, -1.1732177734375, -1.102874755859375, -1.03253173828125, -0.962188720703125, -0.891845703125, -0.821502685546875, -0.75115966796875, -0.680816650390625, -0.6104736328125, -0.540130615234375, -0.46978759765625, -0.399444580078125, -0.3291015625, -0.258758544921875, -0.18841552734375, -0.118072509765625, -0.0477294921875, 0.022613525390625, 0.09295654296875, 0.163299560546875, 0.233642578125, 0.303985595703125, 0.37432861328125, 0.444671630859375, 0.5150146484375, 0.585357666015625, 0.65570068359375, 0.726043701171875, 0.79638671875, 0.866729736328125, 0.93707275390625, 1.007415771484375, 1.0777587890625, 1.148101806640625, 1.21844482421875, 1.288787841796875, 1.359130859375, 1.429473876953125, 1.49981689453125, 1.570159912109375, 1.6405029296875, 1.710845947265625, 1.78118896484375, 1.851531982421875, 1.921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 13.0, 32.0, 78.0, 180.0, 246.0, 265.0, 107.0, 59.0, 13.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.47672653198242, -35.871986389160156, -33.26724624633789, -30.662508010864258, -28.057769775390625, -25.45302963256836, -22.848289489746094, -20.24355125427246, -17.638811111450195, -15.034071922302246, -12.429332733154297, -9.824592590332031, -7.219853401184082, -4.615114212036133, -2.010374069213867, 0.5943641662597656, 3.1991043090820312, 5.8038434982299805, 8.40858268737793, 11.013322830200195, 13.618062019348145, 16.222801208496094, 18.82754135131836, 21.432279586791992, 24.037019729614258, 26.641759872436523, 29.246498107910156, 31.851238250732422, 34.45597839355469, 37.06071472167969, 39.66545867919922, 42.27019500732422, 44.87493133544922, 47.479671478271484, 50.08441162109375, 52.68914794921875, 55.293888092041016, 57.89862823486328, 60.50336837768555, 63.10810852050781, 65.71284484863281, 68.31758117675781, 70.92232513427734, 73.52706146240234, 76.13180541992188, 78.73654174804688, 81.34127807617188, 83.9460220336914, 86.55076599121094, 89.15550231933594, 91.76024627685547, 94.36498260498047, 96.9697265625, 99.574462890625, 102.17919921875, 104.78394317626953, 107.38867950439453, 109.99341583251953, 112.59815979003906, 115.20289611816406, 117.8076400756836, 120.4123764038086, 123.01712036132812, 125.62185668945312, 128.22659301757812]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 10.0, 16.0, 11.0, 15.0, 13.0, 19.0, 34.0, 24.0, 28.0, 35.0, 34.0, 49.0, 39.0, 49.0, 49.0, 48.0, 46.0, 45.0, 45.0, 37.0, 41.0, 40.0, 34.0, 31.0, 36.0, 24.0, 18.0, 23.0, 20.0, 13.0, 9.0, 12.0, 9.0, 3.0, 7.0, 2.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.024023056030273, -23.28664779663086, -22.549270629882812, -21.8118953704834, -21.074520111083984, -20.337142944335938, -19.599767684936523, -18.86239242553711, -18.125015258789062, -17.38763999938965, -16.6502628326416, -15.912887573242188, -15.175512313842773, -14.438136100769043, -13.700759887695312, -12.963384628295898, -12.226009368896484, -11.488633155822754, -10.75125789642334, -10.01388168334961, -9.276506423950195, -8.539130210876465, -7.801753997802734, -7.064378261566162, -6.32700252532959, -5.589626789093018, -4.852251052856445, -4.114874839782715, -3.3774991035461426, -2.6401233673095703, -1.9027471542358398, -1.1653714179992676, -0.4279975891113281, 0.3093782663345337, 1.0467541217803955, 1.7841300964355469, 2.521505832672119, 3.2588815689086914, 3.996257781982422, 4.733633518218994, 5.471009254455566, 6.208384990692139, 6.945760726928711, 7.683136940002441, 8.420513153076172, 9.157888412475586, 9.895264625549316, 10.632640838623047, 11.370016098022461, 12.107392311096191, 12.844767570495605, 13.582143783569336, 14.31951904296875, 15.05689525604248, 15.794271469116211, 16.531646728515625, 17.269023895263672, 18.006399154663086, 18.743776321411133, 19.481151580810547, 20.21852684020996, 20.955902099609375, 21.693279266357422, 22.430654525756836, 23.16802978515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 11.0, 19.0, 24.0, 29.0, 48.0, 83.0, 153.0, 297.0, 553.0, 1172.0, 2470.0, 6197.0, 17621.0, 65191.0, 641809.0, 3320005.0, 100923.0, 24117.0, 7829.0, 3075.0, 1322.0, 621.0, 327.0, 131.0, 96.0, 59.0, 26.0, 20.0, 13.0, 5.0, 7.0, 9.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.78594970703125, -6.5679931640625, -6.35003662109375, -6.132080078125, -5.91412353515625, -5.6961669921875, -5.47821044921875, -5.26025390625, -5.04229736328125, -4.8243408203125, -4.60638427734375, -4.388427734375, -4.17047119140625, -3.9525146484375, -3.73455810546875, -3.5166015625, -3.29864501953125, -3.0806884765625, -2.86273193359375, -2.644775390625, -2.42681884765625, -2.2088623046875, -1.99090576171875, -1.77294921875, -1.55499267578125, -1.3370361328125, -1.11907958984375, -0.901123046875, -0.68316650390625, -0.4652099609375, -0.24725341796875, -0.029296875, 0.18865966796875, 0.4066162109375, 0.62457275390625, 0.842529296875, 1.06048583984375, 1.2784423828125, 1.49639892578125, 1.71435546875, 1.93231201171875, 2.1502685546875, 2.36822509765625, 2.586181640625, 2.80413818359375, 3.0220947265625, 3.24005126953125, 3.4580078125, 3.67596435546875, 3.8939208984375, 4.11187744140625, 4.329833984375, 4.54779052734375, 4.7657470703125, 4.98370361328125, 5.20166015625, 5.41961669921875, 5.6375732421875, 5.85552978515625, 6.073486328125, 6.29144287109375, 6.5093994140625, 6.72735595703125, 6.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 11.0, 10.0, 15.0, 15.0, 16.0, 24.0, 29.0, 38.0, 50.0, 44.0, 55.0, 52.0, 59.0, 57.0, 73.0, 66.0, 54.0, 58.0, 44.0, 40.0, 49.0, 28.0, 30.0, 15.0, 14.0, 12.0, 11.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2109375, -1.1689910888671875, -1.127044677734375, -1.0850982666015625, -1.04315185546875, -1.0012054443359375, -0.959259033203125, -0.9173126220703125, -0.8753662109375, -0.8334197998046875, -0.791473388671875, -0.7495269775390625, -0.70758056640625, -0.6656341552734375, -0.623687744140625, -0.5817413330078125, -0.539794921875, -0.4978485107421875, -0.455902099609375, -0.4139556884765625, -0.37200927734375, -0.3300628662109375, -0.288116455078125, -0.2461700439453125, -0.2042236328125, -0.1622772216796875, -0.120330810546875, -0.0783843994140625, -0.03643798828125, 0.0055084228515625, 0.047454833984375, 0.0894012451171875, 0.13134765625, 0.1732940673828125, 0.215240478515625, 0.2571868896484375, 0.29913330078125, 0.3410797119140625, 0.383026123046875, 0.4249725341796875, 0.4669189453125, 0.5088653564453125, 0.550811767578125, 0.5927581787109375, 0.63470458984375, 0.6766510009765625, 0.718597412109375, 0.7605438232421875, 0.802490234375, 0.8444366455078125, 0.886383056640625, 0.9283294677734375, 0.97027587890625, 1.0122222900390625, 1.054168701171875, 1.0961151123046875, 1.1380615234375, 1.1800079345703125, 1.221954345703125, 1.2639007568359375, 1.30584716796875, 1.3477935791015625, 1.389739990234375, 1.4316864013671875, 1.4736328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 9.0, 8.0, 12.0, 17.0, 30.0, 62.0, 102.0, 133.0, 229.0, 414.0, 706.0, 1221.0, 2433.0, 4868.0, 11026.0, 29162.0, 97115.0, 640439.0, 3141840.0, 186708.0, 47249.0, 16565.0, 6772.0, 3305.0, 1683.0, 883.0, 523.0, 311.0, 165.0, 119.0, 68.0, 39.0, 22.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69952392578125, -5.5279541015625, -5.35638427734375, -5.184814453125, -5.01324462890625, -4.8416748046875, -4.67010498046875, -4.49853515625, -4.32696533203125, -4.1553955078125, -3.98382568359375, -3.812255859375, -3.64068603515625, -3.4691162109375, -3.29754638671875, -3.1259765625, -2.95440673828125, -2.7828369140625, -2.61126708984375, -2.439697265625, -2.26812744140625, -2.0965576171875, -1.92498779296875, -1.75341796875, -1.58184814453125, -1.4102783203125, -1.23870849609375, -1.067138671875, -0.89556884765625, -0.7239990234375, -0.55242919921875, -0.380859375, -0.20928955078125, -0.0377197265625, 0.13385009765625, 0.305419921875, 0.47698974609375, 0.6485595703125, 0.82012939453125, 0.99169921875, 1.16326904296875, 1.3348388671875, 1.50640869140625, 1.677978515625, 1.84954833984375, 2.0211181640625, 2.19268798828125, 2.3642578125, 2.53582763671875, 2.7073974609375, 2.87896728515625, 3.050537109375, 3.22210693359375, 3.3936767578125, 3.56524658203125, 3.73681640625, 3.90838623046875, 4.0799560546875, 4.25152587890625, 4.423095703125, 4.59466552734375, 4.7662353515625, 4.93780517578125, 5.109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 18.0, 13.0, 23.0, 30.0, 50.0, 74.0, 108.0, 190.0, 395.0, 1640.0, 818.0, 277.0, 129.0, 66.0, 52.0, 44.0, 30.0, 24.0, 16.0, 11.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.554412841796875, -2.47406005859375, -2.393707275390625, -2.3133544921875, -2.233001708984375, -2.15264892578125, -2.072296142578125, -1.991943359375, -1.911590576171875, -1.83123779296875, -1.750885009765625, -1.6705322265625, -1.590179443359375, -1.50982666015625, -1.429473876953125, -1.34912109375, -1.268768310546875, -1.18841552734375, -1.108062744140625, -1.0277099609375, -0.947357177734375, -0.86700439453125, -0.786651611328125, -0.706298828125, -0.625946044921875, -0.54559326171875, -0.465240478515625, -0.3848876953125, -0.304534912109375, -0.22418212890625, -0.143829345703125, -0.0634765625, 0.016876220703125, 0.09722900390625, 0.177581787109375, 0.2579345703125, 0.338287353515625, 0.41864013671875, 0.498992919921875, 0.579345703125, 0.659698486328125, 0.74005126953125, 0.820404052734375, 0.9007568359375, 0.981109619140625, 1.06146240234375, 1.141815185546875, 1.22216796875, 1.302520751953125, 1.38287353515625, 1.463226318359375, 1.5435791015625, 1.623931884765625, 1.70428466796875, 1.784637451171875, 1.864990234375, 1.945343017578125, 2.02569580078125, 2.106048583984375, 2.1864013671875, 2.266754150390625, 2.34710693359375, 2.427459716796875, 2.5078125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 21.0, 37.0, 77.0, 168.0, 224.0, 190.0, 147.0, 79.0, 27.0, 12.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.649436950683594, -27.853559494018555, -27.057682037353516, -26.261804580688477, -25.465927124023438, -24.6700496673584, -23.87417221069336, -23.078292846679688, -22.28241729736328, -21.486539840698242, -20.690662384033203, -19.894784927368164, -19.098907470703125, -18.303030014038086, -17.507152557373047, -16.711273193359375, -15.915395736694336, -15.119518280029297, -14.323640823364258, -13.527763366699219, -12.73188591003418, -11.93600845336914, -11.140130043029785, -10.344252586364746, -9.548375129699707, -8.752497673034668, -7.956620216369629, -7.160742282867432, -6.364864826202393, -5.5689873695373535, -4.773109436035156, -3.977231979370117, -3.181354522705078, -2.385477066040039, -1.589599370956421, -0.7937216758728027, 0.002155780792236328, 0.7980332374572754, 1.5939111709594727, 2.3897886276245117, 3.185666084289551, 3.98154354095459, 4.777420997619629, 5.573298931121826, 6.369176387786865, 7.165053844451904, 7.960931777954102, 8.75680923461914, 9.55268669128418, 10.348564147949219, 11.144441604614258, 11.940319061279297, 12.736196517944336, 13.532073974609375, 14.32795238494873, 15.12382984161377, 15.919707298278809, 16.715585708618164, 17.511463165283203, 18.307340621948242, 19.10321807861328, 19.89909553527832, 20.69497299194336, 21.4908504486084, 22.286727905273438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 9.0, 7.0, 9.0, 19.0, 17.0, 27.0, 17.0, 19.0, 37.0, 38.0, 38.0, 40.0, 42.0, 42.0, 52.0, 47.0, 47.0, 48.0, 50.0, 42.0, 44.0, 50.0, 23.0, 36.0, 28.0, 32.0, 23.0, 22.0, 11.0, 14.0, 19.0, 10.0, 6.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.208544731140137, -7.939805507659912, -7.6710662841796875, -7.402327060699463, -7.133587837219238, -6.864849090576172, -6.596109867095947, -6.327370643615723, -6.058631420135498, -5.789892196655273, -5.521152973175049, -5.252413749694824, -4.983675003051758, -4.714935302734375, -4.446196556091309, -4.177457332611084, -3.9087181091308594, -3.6399788856506348, -3.37123966217041, -3.1025006771087646, -2.83376145362854, -2.5650222301483154, -2.29628324508667, -2.0275440216064453, -1.7588047981262207, -1.490065574645996, -1.221326470375061, -0.9525873064994812, -0.6838481426239014, -0.41510891914367676, -0.1463698148727417, 0.12236928939819336, 0.39110851287841797, 0.6598476767539978, 0.9285868406295776, 1.1973259449005127, 1.4660651683807373, 1.734804391860962, 2.0035433769226074, 2.272282600402832, 2.5410218238830566, 2.8097610473632812, 3.078500270843506, 3.3472392559051514, 3.615978479385376, 3.8847177028656006, 4.153456687927246, 4.422195911407471, 4.690935134887695, 4.95967435836792, 5.2284135818481445, 5.497152805328369, 5.765892028808594, 6.03463077545166, 6.303369998931885, 6.572109222412109, 6.840848445892334, 7.109587669372559, 7.378326892852783, 7.647066116333008, 7.915804862976074, 8.184544563293457, 8.453283309936523, 8.722023010253906, 8.990761756896973]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 12.0, 19.0, 24.0, 30.0, 43.0, 74.0, 110.0, 164.0, 253.0, 486.0, 920.0, 1778.0, 3610.0, 7745.0, 16602.0, 35793.0, 104619.0, 578180.0, 206443.0, 49669.0, 22057.0, 10158.0, 4779.0, 2368.0, 1118.0, 608.0, 338.0, 193.0, 115.0, 89.0, 49.0, 28.0, 20.0, 15.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.468475341796875, -3.33343505859375, -3.198394775390625, -3.0633544921875, -2.928314208984375, -2.79327392578125, -2.658233642578125, -2.523193359375, -2.388153076171875, -2.25311279296875, -2.118072509765625, -1.9830322265625, -1.847991943359375, -1.71295166015625, -1.577911376953125, -1.44287109375, -1.307830810546875, -1.17279052734375, -1.037750244140625, -0.9027099609375, -0.767669677734375, -0.63262939453125, -0.497589111328125, -0.362548828125, -0.227508544921875, -0.09246826171875, 0.042572021484375, 0.1776123046875, 0.312652587890625, 0.44769287109375, 0.582733154296875, 0.7177734375, 0.852813720703125, 0.98785400390625, 1.122894287109375, 1.2579345703125, 1.392974853515625, 1.52801513671875, 1.663055419921875, 1.798095703125, 1.933135986328125, 2.06817626953125, 2.203216552734375, 2.3382568359375, 2.473297119140625, 2.60833740234375, 2.743377685546875, 2.87841796875, 3.013458251953125, 3.14849853515625, 3.283538818359375, 3.4185791015625, 3.553619384765625, 3.68865966796875, 3.823699951171875, 3.958740234375, 4.093780517578125, 4.22882080078125, 4.363861083984375, 4.4989013671875, 4.633941650390625, 4.76898193359375, 4.904022216796875, 5.0390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 8.0, 13.0, 14.0, 17.0, 15.0, 25.0, 24.0, 36.0, 40.0, 36.0, 39.0, 55.0, 43.0, 51.0, 66.0, 70.0, 53.0, 49.0, 43.0, 53.0, 45.0, 41.0, 39.0, 16.0, 28.0, 13.0, 21.0, 12.0, 1.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1874542236328125, -1.147369384765625, -1.1072845458984375, -1.06719970703125, -1.0271148681640625, -0.987030029296875, -0.9469451904296875, -0.9068603515625, -0.8667755126953125, -0.826690673828125, -0.7866058349609375, -0.74652099609375, -0.7064361572265625, -0.666351318359375, -0.6262664794921875, -0.586181640625, -0.5460968017578125, -0.506011962890625, -0.4659271240234375, -0.42584228515625, -0.3857574462890625, -0.345672607421875, -0.3055877685546875, -0.2655029296875, -0.2254180908203125, -0.185333251953125, -0.1452484130859375, -0.10516357421875, -0.0650787353515625, -0.024993896484375, 0.0150909423828125, 0.05517578125, 0.0952606201171875, 0.135345458984375, 0.1754302978515625, 0.21551513671875, 0.2555999755859375, 0.295684814453125, 0.3357696533203125, 0.3758544921875, 0.4159393310546875, 0.456024169921875, 0.4961090087890625, 0.53619384765625, 0.5762786865234375, 0.616363525390625, 0.6564483642578125, 0.696533203125, 0.7366180419921875, 0.776702880859375, 0.8167877197265625, 0.85687255859375, 0.8969573974609375, 0.937042236328125, 0.9771270751953125, 1.0172119140625, 1.0572967529296875, 1.097381591796875, 1.1374664306640625, 1.17755126953125, 1.2176361083984375, 1.257720947265625, 1.2978057861328125, 1.337890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 7.0, 14.0, 20.0, 14.0, 23.0, 40.0, 43.0, 88.0, 107.0, 209.0, 371.0, 791.0, 1934.0, 5495.0, 17180.0, 57144.0, 687099.0, 222431.0, 37457.0, 11539.0, 3769.0, 1426.0, 612.0, 287.0, 162.0, 94.0, 56.0, 44.0, 29.0, 11.0, 18.0, 13.0, 7.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.98828125, -7.7713623046875, -7.554443359375, -7.3375244140625, -7.12060546875, -6.9036865234375, -6.686767578125, -6.4698486328125, -6.2529296875, -6.0360107421875, -5.819091796875, -5.6021728515625, -5.38525390625, -5.1683349609375, -4.951416015625, -4.7344970703125, -4.517578125, -4.3006591796875, -4.083740234375, -3.8668212890625, -3.64990234375, -3.4329833984375, -3.216064453125, -2.9991455078125, -2.7822265625, -2.5653076171875, -2.348388671875, -2.1314697265625, -1.91455078125, -1.6976318359375, -1.480712890625, -1.2637939453125, -1.046875, -0.8299560546875, -0.613037109375, -0.3961181640625, -0.17919921875, 0.0377197265625, 0.254638671875, 0.4715576171875, 0.6884765625, 0.9053955078125, 1.122314453125, 1.3392333984375, 1.55615234375, 1.7730712890625, 1.989990234375, 2.2069091796875, 2.423828125, 2.6407470703125, 2.857666015625, 3.0745849609375, 3.29150390625, 3.5084228515625, 3.725341796875, 3.9422607421875, 4.1591796875, 4.3760986328125, 4.593017578125, 4.8099365234375, 5.02685546875, 5.2437744140625, 5.460693359375, 5.6776123046875, 5.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 11.0, 8.0, 14.0, 17.0, 22.0, 35.0, 36.0, 59.0, 66.0, 79.0, 84.0, 79.0, 82.0, 66.0, 62.0, 62.0, 38.0, 41.0, 42.0, 21.0, 13.0, 9.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3671875, -9.12725830078125, -8.8873291015625, -8.64739990234375, -8.407470703125, -8.16754150390625, -7.9276123046875, -7.68768310546875, -7.44775390625, -7.20782470703125, -6.9678955078125, -6.72796630859375, -6.488037109375, -6.24810791015625, -6.0081787109375, -5.76824951171875, -5.5283203125, -5.28839111328125, -5.0484619140625, -4.80853271484375, -4.568603515625, -4.32867431640625, -4.0887451171875, -3.84881591796875, -3.60888671875, -3.36895751953125, -3.1290283203125, -2.88909912109375, -2.649169921875, -2.40924072265625, -2.1693115234375, -1.92938232421875, -1.689453125, -1.44952392578125, -1.2095947265625, -0.96966552734375, -0.729736328125, -0.48980712890625, -0.2498779296875, -0.00994873046875, 0.22998046875, 0.46990966796875, 0.7098388671875, 0.94976806640625, 1.189697265625, 1.42962646484375, 1.6695556640625, 1.90948486328125, 2.1494140625, 2.38934326171875, 2.6292724609375, 2.86920166015625, 3.109130859375, 3.34906005859375, 3.5889892578125, 3.82891845703125, 4.06884765625, 4.30877685546875, 4.5487060546875, 4.78863525390625, 5.028564453125, 5.26849365234375, 5.5084228515625, 5.74835205078125, 5.98828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 8.0, 26.0, 20.0, 29.0, 45.0, 81.0, 101.0, 176.0, 255.0, 446.0, 741.0, 1320.0, 2444.0, 4942.0, 10548.0, 24764.0, 65081.0, 410216.0, 415830.0, 65408.0, 24772.0, 10598.0, 4838.0, 2552.0, 1311.0, 794.0, 415.0, 293.0, 157.0, 124.0, 66.0, 41.0, 34.0, 18.0, 20.0, 12.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.583984375, -2.510162353515625, -2.43634033203125, -2.362518310546875, -2.2886962890625, -2.214874267578125, -2.14105224609375, -2.067230224609375, -1.993408203125, -1.919586181640625, -1.84576416015625, -1.771942138671875, -1.6981201171875, -1.624298095703125, -1.55047607421875, -1.476654052734375, -1.40283203125, -1.329010009765625, -1.25518798828125, -1.181365966796875, -1.1075439453125, -1.033721923828125, -0.95989990234375, -0.886077880859375, -0.812255859375, -0.738433837890625, -0.66461181640625, -0.590789794921875, -0.5169677734375, -0.443145751953125, -0.36932373046875, -0.295501708984375, -0.2216796875, -0.147857666015625, -0.07403564453125, -0.000213623046875, 0.0736083984375, 0.147430419921875, 0.22125244140625, 0.295074462890625, 0.368896484375, 0.442718505859375, 0.51654052734375, 0.590362548828125, 0.6641845703125, 0.738006591796875, 0.81182861328125, 0.885650634765625, 0.95947265625, 1.033294677734375, 1.10711669921875, 1.180938720703125, 1.2547607421875, 1.328582763671875, 1.40240478515625, 1.476226806640625, 1.550048828125, 1.623870849609375, 1.69769287109375, 1.771514892578125, 1.8453369140625, 1.919158935546875, 1.99298095703125, 2.066802978515625, 2.140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 7.0, 6.0, 13.0, 18.0, 14.0, 23.0, 46.0, 178.0, 383.0, 132.0, 39.0, 29.0, 23.0, 16.0, 19.0, 8.0, 5.0, 7.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008817464113235474, -0.000852733850479126, -0.0008237212896347046, -0.0007947087287902832, -0.0007656961679458618, -0.0007366836071014404, -0.000707671046257019, -0.0006786584854125977, -0.0006496459245681763, -0.0006206333637237549, -0.0005916208028793335, -0.0005626082420349121, -0.0005335956811904907, -0.0005045831203460693, -0.00047557055950164795, -0.00044655799865722656, -0.0004175454378128052, -0.0003885328769683838, -0.0003595203161239624, -0.000330507755279541, -0.00030149519443511963, -0.00027248263359069824, -0.00024347007274627686, -0.00021445751190185547, -0.00018544495105743408, -0.0001564323902130127, -0.0001274198293685913, -9.840726852416992e-05, -6.939470767974854e-05, -4.038214683532715e-05, -1.1369585990905762e-05, 1.7642974853515625e-05, 4.665553569793701e-05, 7.56680965423584e-05, 0.00010468065738677979, 0.00013369321823120117, 0.00016270577907562256, 0.00019171833992004395, 0.00022073090076446533, 0.0002497434616088867, 0.0002787560224533081, 0.0003077685832977295, 0.0003367811441421509, 0.00036579370498657227, 0.00039480626583099365, 0.00042381882667541504, 0.0004528313875198364, 0.0004818439483642578, 0.0005108565092086792, 0.0005398690700531006, 0.000568881630897522, 0.0005978941917419434, 0.0006269067525863647, 0.0006559193134307861, 0.0006849318742752075, 0.0007139444351196289, 0.0007429569959640503, 0.0007719695568084717, 0.0008009821176528931, 0.0008299946784973145, 0.0008590072393417358, 0.0008880198001861572, 0.0009170323610305786, 0.000946044921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 13.0, 16.0, 33.0, 39.0, 67.0, 101.0, 174.0, 269.0, 550.0, 1517.0, 4774.0, 20925.0, 121947.0, 794208.0, 81838.0, 15820.0, 3859.0, 1226.0, 505.0, 248.0, 146.0, 105.0, 53.0, 35.0, 20.0, 24.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.56640625, -4.43743896484375, -4.3084716796875, -4.17950439453125, -4.050537109375, -3.92156982421875, -3.7926025390625, -3.66363525390625, -3.53466796875, -3.40570068359375, -3.2767333984375, -3.14776611328125, -3.018798828125, -2.88983154296875, -2.7608642578125, -2.63189697265625, -2.5029296875, -2.37396240234375, -2.2449951171875, -2.11602783203125, -1.987060546875, -1.85809326171875, -1.7291259765625, -1.60015869140625, -1.47119140625, -1.34222412109375, -1.2132568359375, -1.08428955078125, -0.955322265625, -0.82635498046875, -0.6973876953125, -0.56842041015625, -0.439453125, -0.31048583984375, -0.1815185546875, -0.05255126953125, 0.076416015625, 0.20538330078125, 0.3343505859375, 0.46331787109375, 0.59228515625, 0.72125244140625, 0.8502197265625, 0.97918701171875, 1.108154296875, 1.23712158203125, 1.3660888671875, 1.49505615234375, 1.6240234375, 1.75299072265625, 1.8819580078125, 2.01092529296875, 2.139892578125, 2.26885986328125, 2.3978271484375, 2.52679443359375, 2.65576171875, 2.78472900390625, 2.9136962890625, 3.04266357421875, 3.171630859375, 3.30059814453125, 3.4295654296875, 3.55853271484375, 3.6875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 4.0, 10.0, 14.0, 13.0, 20.0, 12.0, 24.0, 33.0, 57.0, 118.0, 145.0, 165.0, 125.0, 51.0, 32.0, 33.0, 23.0, 20.0, 15.0, 14.0, 7.0, 12.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09375, -2.019378662109375, -1.94500732421875, -1.870635986328125, -1.7962646484375, -1.721893310546875, -1.64752197265625, -1.573150634765625, -1.498779296875, -1.424407958984375, -1.35003662109375, -1.275665283203125, -1.2012939453125, -1.126922607421875, -1.05255126953125, -0.978179931640625, -0.90380859375, -0.829437255859375, -0.75506591796875, -0.680694580078125, -0.6063232421875, -0.531951904296875, -0.45758056640625, -0.383209228515625, -0.308837890625, -0.234466552734375, -0.16009521484375, -0.085723876953125, -0.0113525390625, 0.063018798828125, 0.13739013671875, 0.211761474609375, 0.2861328125, 0.360504150390625, 0.43487548828125, 0.509246826171875, 0.5836181640625, 0.657989501953125, 0.73236083984375, 0.806732177734375, 0.881103515625, 0.955474853515625, 1.02984619140625, 1.104217529296875, 1.1785888671875, 1.252960205078125, 1.32733154296875, 1.401702880859375, 1.47607421875, 1.550445556640625, 1.62481689453125, 1.699188232421875, 1.7735595703125, 1.847930908203125, 1.92230224609375, 1.996673583984375, 2.071044921875, 2.145416259765625, 2.21978759765625, 2.294158935546875, 2.3685302734375, 2.442901611328125, 2.51727294921875, 2.591644287109375, 2.666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 28.0, 25.0, 53.0, 62.0, 82.0, 88.0, 115.0, 102.0, 101.0, 82.0, 69.0, 42.0, 36.0, 22.0, 23.0, 16.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.986961364746094, -31.047964096069336, -30.108964920043945, -29.169967651367188, -28.23097038269043, -27.291973114013672, -26.35297393798828, -25.413976669311523, -24.474979400634766, -23.535982131958008, -22.596982955932617, -21.65798568725586, -20.7189884185791, -19.779991149902344, -18.840991973876953, -17.901994705200195, -16.962995529174805, -16.023998260498047, -15.085000038146973, -14.146001815795898, -13.20700454711914, -12.268006324768066, -11.329008102416992, -10.390010833740234, -9.45101261138916, -8.512014389038086, -7.573017120361328, -6.634018898010254, -5.695021152496338, -4.756023406982422, -3.8170251846313477, -2.8780274391174316, -1.9390277862548828, -1.0000299215316772, -0.06103205680847168, 0.8779659271240234, 1.8169636726379395, 2.7559614181518555, 3.6949596405029297, 4.633957386016846, 5.572955131530762, 6.511952877044678, 7.450950622558594, 8.389948844909668, 9.328947067260742, 10.2679443359375, 11.206942558288574, 12.145940780639648, 13.084938049316406, 14.02393627166748, 14.962933540344238, 15.901931762695312, 16.84092903137207, 17.779926300048828, 18.71892547607422, 19.657922744750977, 20.596920013427734, 21.535917282104492, 22.474916458129883, 23.41391372680664, 24.3529109954834, 25.291908264160156, 26.230907440185547, 27.169904708862305, 28.108903884887695]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 5.0, 10.0, 4.0, 13.0, 14.0, 15.0, 22.0, 15.0, 17.0, 28.0, 28.0, 31.0, 34.0, 35.0, 37.0, 44.0, 54.0, 50.0, 48.0, 42.0, 39.0, 40.0, 45.0, 40.0, 32.0, 42.0, 25.0, 31.0, 21.0, 19.0, 15.0, 19.0, 16.0, 12.0, 7.0, 14.0, 3.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-24.45825958251953, -23.762027740478516, -23.0657958984375, -22.369564056396484, -21.67333221435547, -20.977100372314453, -20.280868530273438, -19.584636688232422, -18.888404846191406, -18.19217300415039, -17.495941162109375, -16.79970932006836, -16.103477478027344, -15.407245635986328, -14.711012840270996, -14.01478099822998, -13.318548202514648, -12.622316360473633, -11.926084518432617, -11.229852676391602, -10.533620834350586, -9.83738899230957, -9.141156196594238, -8.444924354553223, -7.748692512512207, -7.052460670471191, -6.356228828430176, -5.659996509552002, -4.963764667510986, -4.267532825469971, -3.571300506591797, -2.8750686645507812, -2.178834915161133, -1.4826029539108276, -0.7863709926605225, -0.09013891220092773, 0.6060929298400879, 1.3023247718811035, 1.9985570907592773, 2.694788932800293, 3.3910207748413086, 4.087252616882324, 4.78348445892334, 5.479716777801514, 6.175948619842529, 6.872180461883545, 7.568412780761719, 8.264644622802734, 8.96087646484375, 9.657108306884766, 10.353340148925781, 11.049571990966797, 11.745803833007812, 12.442035675048828, 13.13826847076416, 13.834500312805176, 14.530732154846191, 15.226963996887207, 15.923195838928223, 16.619428634643555, 17.31566047668457, 18.011892318725586, 18.7081241607666, 19.404356002807617, 20.100587844848633]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 17.0, 35.0, 38.0, 68.0, 108.0, 216.0, 456.0, 991.0, 2372.0, 6111.0, 17300.0, 68537.0, 1583259.0, 2416290.0, 70520.0, 17752.0, 6003.0, 2298.0, 978.0, 440.0, 216.0, 109.0, 59.0, 28.0, 18.0, 7.0, 15.0, 8.0, 4.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75, -7.4732666015625, -7.196533203125, -6.9197998046875, -6.64306640625, -6.3663330078125, -6.089599609375, -5.8128662109375, -5.5361328125, -5.2593994140625, -4.982666015625, -4.7059326171875, -4.42919921875, -4.1524658203125, -3.875732421875, -3.5989990234375, -3.322265625, -3.0455322265625, -2.768798828125, -2.4920654296875, -2.21533203125, -1.9385986328125, -1.661865234375, -1.3851318359375, -1.1083984375, -0.8316650390625, -0.554931640625, -0.2781982421875, -0.00146484375, 0.2752685546875, 0.552001953125, 0.8287353515625, 1.10546875, 1.3822021484375, 1.658935546875, 1.9356689453125, 2.21240234375, 2.4891357421875, 2.765869140625, 3.0426025390625, 3.3193359375, 3.5960693359375, 3.872802734375, 4.1495361328125, 4.42626953125, 4.7030029296875, 4.979736328125, 5.2564697265625, 5.533203125, 5.8099365234375, 6.086669921875, 6.3634033203125, 6.64013671875, 6.9168701171875, 7.193603515625, 7.4703369140625, 7.7470703125, 8.0238037109375, 8.300537109375, 8.5772705078125, 8.85400390625, 9.1307373046875, 9.407470703125, 9.6842041015625, 9.9609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 12.0, 11.0, 14.0, 16.0, 14.0, 15.0, 28.0, 18.0, 32.0, 36.0, 47.0, 30.0, 35.0, 62.0, 59.0, 54.0, 59.0, 67.0, 46.0, 48.0, 47.0, 40.0, 33.0, 38.0, 33.0, 36.0, 10.0, 18.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2179718017578125, -1.177154541015625, -1.1363372802734375, -1.09552001953125, -1.0547027587890625, -1.013885498046875, -0.9730682373046875, -0.9322509765625, -0.8914337158203125, -0.850616455078125, -0.8097991943359375, -0.76898193359375, -0.7281646728515625, -0.687347412109375, -0.6465301513671875, -0.605712890625, -0.5648956298828125, -0.524078369140625, -0.4832611083984375, -0.44244384765625, -0.4016265869140625, -0.360809326171875, -0.3199920654296875, -0.2791748046875, -0.2383575439453125, -0.197540283203125, -0.1567230224609375, -0.11590576171875, -0.0750885009765625, -0.034271240234375, 0.0065460205078125, 0.04736328125, 0.0881805419921875, 0.128997802734375, 0.1698150634765625, 0.21063232421875, 0.2514495849609375, 0.292266845703125, 0.3330841064453125, 0.3739013671875, 0.4147186279296875, 0.455535888671875, 0.4963531494140625, 0.53717041015625, 0.5779876708984375, 0.618804931640625, 0.6596221923828125, 0.700439453125, 0.7412567138671875, 0.782073974609375, 0.8228912353515625, 0.86370849609375, 0.9045257568359375, 0.945343017578125, 0.9861602783203125, 1.0269775390625, 1.0677947998046875, 1.108612060546875, 1.1494293212890625, 1.19024658203125, 1.2310638427734375, 1.271881103515625, 1.3126983642578125, 1.353515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 13.0, 11.0, 20.0, 33.0, 50.0, 80.0, 70.0, 127.0, 171.0, 222.0, 297.0, 497.0, 815.0, 1381.0, 2636.0, 5352.0, 12195.0, 30264.0, 97024.0, 718487.0, 3109359.0, 144639.0, 40798.0, 15409.0, 6567.0, 3247.0, 1675.0, 936.0, 565.0, 388.0, 274.0, 173.0, 132.0, 93.0, 63.0, 56.0, 39.0, 35.0, 23.0, 16.0, 14.0, 13.0, 9.0, 7.0, 1.0, 3.0], "bins": [-8.140625, -7.92718505859375, -7.7137451171875, -7.50030517578125, -7.286865234375, -7.07342529296875, -6.8599853515625, -6.64654541015625, -6.43310546875, -6.21966552734375, -6.0062255859375, -5.79278564453125, -5.579345703125, -5.36590576171875, -5.1524658203125, -4.93902587890625, -4.7255859375, -4.51214599609375, -4.2987060546875, -4.08526611328125, -3.871826171875, -3.65838623046875, -3.4449462890625, -3.23150634765625, -3.01806640625, -2.80462646484375, -2.5911865234375, -2.37774658203125, -2.164306640625, -1.95086669921875, -1.7374267578125, -1.52398681640625, -1.310546875, -1.09710693359375, -0.8836669921875, -0.67022705078125, -0.456787109375, -0.24334716796875, -0.0299072265625, 0.18353271484375, 0.39697265625, 0.61041259765625, 0.8238525390625, 1.03729248046875, 1.250732421875, 1.46417236328125, 1.6776123046875, 1.89105224609375, 2.1044921875, 2.31793212890625, 2.5313720703125, 2.74481201171875, 2.958251953125, 3.17169189453125, 3.3851318359375, 3.59857177734375, 3.81201171875, 4.02545166015625, 4.2388916015625, 4.45233154296875, 4.665771484375, 4.87921142578125, 5.0926513671875, 5.30609130859375, 5.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 12.0, 12.0, 16.0, 24.0, 30.0, 46.0, 65.0, 148.0, 290.0, 1484.0, 1301.0, 275.0, 109.0, 78.0, 41.0, 47.0, 17.0, 13.0, 14.0, 11.0, 4.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57421875, -2.4622802734375, -2.350341796875, -2.2384033203125, -2.12646484375, -2.0145263671875, -1.902587890625, -1.7906494140625, -1.6787109375, -1.5667724609375, -1.454833984375, -1.3428955078125, -1.23095703125, -1.1190185546875, -1.007080078125, -0.8951416015625, -0.783203125, -0.6712646484375, -0.559326171875, -0.4473876953125, -0.33544921875, -0.2235107421875, -0.111572265625, 0.0003662109375, 0.1123046875, 0.2242431640625, 0.336181640625, 0.4481201171875, 0.56005859375, 0.6719970703125, 0.783935546875, 0.8958740234375, 1.0078125, 1.1197509765625, 1.231689453125, 1.3436279296875, 1.45556640625, 1.5675048828125, 1.679443359375, 1.7913818359375, 1.9033203125, 2.0152587890625, 2.127197265625, 2.2391357421875, 2.35107421875, 2.4630126953125, 2.574951171875, 2.6868896484375, 2.798828125, 2.9107666015625, 3.022705078125, 3.1346435546875, 3.24658203125, 3.3585205078125, 3.470458984375, 3.5823974609375, 3.6943359375, 3.8062744140625, 3.918212890625, 4.0301513671875, 4.14208984375, 4.2540283203125, 4.365966796875, 4.4779052734375, 4.58984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 33.0, 53.0, 72.0, 132.0, 157.0, 151.0, 128.0, 91.0, 52.0, 36.0, 23.0, 10.0, 11.0, 10.0, 1.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.313812255859375, -15.635957717895508, -14.958102226257324, -14.280247688293457, -13.602392196655273, -12.924537658691406, -12.246683120727539, -11.568827629089355, -10.890972137451172, -10.213117599487305, -9.535262107849121, -8.857407569885254, -8.17955207824707, -7.501697540283203, -6.823842525482178, -6.145987510681152, -5.468132972717285, -4.79027795791626, -4.112422943115234, -3.434568166732788, -2.7567131519317627, -2.0788581371307373, -1.401003360748291, -0.7231483459472656, -0.045293331146240234, 0.6325616240501404, 1.310416579246521, 1.9882714748382568, 2.6661264896392822, 3.3439815044403076, 4.021836280822754, 4.699691295623779, 5.377546310424805, 6.05540132522583, 6.7332563400268555, 7.411110877990723, 8.088966369628906, 8.766820907592773, 9.44467544555664, 10.122530937194824, 10.800386428833008, 11.478240966796875, 12.156096458435059, 12.833950996398926, 13.51180648803711, 14.189661026000977, 14.867515563964844, 15.545371055603027, 16.223224639892578, 16.901079177856445, 17.578933715820312, 18.256790161132812, 18.93464469909668, 19.612499237060547, 20.290353775024414, 20.96820831298828, 21.64606475830078, 22.32391929626465, 23.001773834228516, 23.679630279541016, 24.357484817504883, 25.03533935546875, 25.713193893432617, 26.391048431396484, 27.068904876708984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 9.0, 8.0, 9.0, 10.0, 11.0, 17.0, 20.0, 27.0, 22.0, 23.0, 40.0, 43.0, 48.0, 41.0, 46.0, 57.0, 42.0, 44.0, 70.0, 55.0, 47.0, 48.0, 49.0, 34.0, 30.0, 35.0, 21.0, 23.0, 18.0, 14.0, 12.0, 7.0, 4.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.803576469421387, -10.422284126281738, -10.04099178314209, -9.659699440002441, -9.278407096862793, -8.897113800048828, -8.51582145690918, -8.134529113769531, -7.753236770629883, -7.371944427490234, -6.990652084350586, -6.6093597412109375, -6.228066921234131, -5.846774578094482, -5.465482234954834, -5.084189414978027, -4.702897548675537, -4.321605205535889, -3.940312623977661, -3.5590202808380127, -3.177727699279785, -2.7964353561401367, -2.4151430130004883, -2.0338504314422607, -1.6525580883026123, -1.2712656259536743, -0.8899732232093811, -0.5086808204650879, -0.1273883581161499, 0.2539041042327881, 0.6351964473724365, 1.016489028930664, 1.3977813720703125, 1.7790738344192505, 2.1603662967681885, 2.541658639907837, 2.9229512214660645, 3.304243564605713, 3.6855359077453613, 4.066828727722168, 4.448121070861816, 4.829413414001465, 5.210705757141113, 5.591998100280762, 5.973290920257568, 6.354583263397217, 6.735875606536865, 7.117168426513672, 7.498460292816162, 7.8797526359558105, 8.261045455932617, 8.642337799072266, 9.023630142211914, 9.404922485351562, 9.786214828491211, 10.16750717163086, 10.548799514770508, 10.930091857910156, 11.311384201049805, 11.692676544189453, 12.073968887329102, 12.45526123046875, 12.836553573608398, 13.217846870422363, 13.599139213562012]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 17.0, 19.0, 34.0, 40.0, 72.0, 85.0, 136.0, 185.0, 334.0, 527.0, 922.0, 1864.0, 3714.0, 8368.0, 19525.0, 46241.0, 116123.0, 355675.0, 316337.0, 103347.0, 42112.0, 17620.0, 7794.0, 3513.0, 1657.0, 875.0, 507.0, 281.0, 197.0, 112.0, 66.0, 70.0, 50.0, 33.0, 28.0, 19.0, 12.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-5.08203125, -4.93231201171875, -4.7825927734375, -4.63287353515625, -4.483154296875, -4.33343505859375, -4.1837158203125, -4.03399658203125, -3.88427734375, -3.73455810546875, -3.5848388671875, -3.43511962890625, -3.285400390625, -3.13568115234375, -2.9859619140625, -2.83624267578125, -2.6865234375, -2.53680419921875, -2.3870849609375, -2.23736572265625, -2.087646484375, -1.93792724609375, -1.7882080078125, -1.63848876953125, -1.48876953125, -1.33905029296875, -1.1893310546875, -1.03961181640625, -0.889892578125, -0.74017333984375, -0.5904541015625, -0.44073486328125, -0.291015625, -0.14129638671875, 0.0084228515625, 0.15814208984375, 0.307861328125, 0.45758056640625, 0.6072998046875, 0.75701904296875, 0.90673828125, 1.05645751953125, 1.2061767578125, 1.35589599609375, 1.505615234375, 1.65533447265625, 1.8050537109375, 1.95477294921875, 2.1044921875, 2.25421142578125, 2.4039306640625, 2.55364990234375, 2.703369140625, 2.85308837890625, 3.0028076171875, 3.15252685546875, 3.30224609375, 3.45196533203125, 3.6016845703125, 3.75140380859375, 3.901123046875, 4.05084228515625, 4.2005615234375, 4.35028076171875, 4.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 18.0, 14.0, 17.0, 17.0, 17.0, 28.0, 34.0, 36.0, 35.0, 40.0, 51.0, 45.0, 60.0, 64.0, 55.0, 50.0, 63.0, 41.0, 40.0, 37.0, 39.0, 32.0, 29.0, 27.0, 20.0, 17.0, 24.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3803253173828125, -1.335845947265625, -1.2913665771484375, -1.24688720703125, -1.2024078369140625, -1.157928466796875, -1.1134490966796875, -1.0689697265625, -1.0244903564453125, -0.980010986328125, -0.9355316162109375, -0.89105224609375, -0.8465728759765625, -0.802093505859375, -0.7576141357421875, -0.713134765625, -0.6686553955078125, -0.624176025390625, -0.5796966552734375, -0.53521728515625, -0.4907379150390625, -0.446258544921875, -0.4017791748046875, -0.3572998046875, -0.3128204345703125, -0.268341064453125, -0.2238616943359375, -0.17938232421875, -0.1349029541015625, -0.090423583984375, -0.0459442138671875, -0.00146484375, 0.0430145263671875, 0.087493896484375, 0.1319732666015625, 0.17645263671875, 0.2209320068359375, 0.265411376953125, 0.3098907470703125, 0.3543701171875, 0.3988494873046875, 0.443328857421875, 0.4878082275390625, 0.53228759765625, 0.5767669677734375, 0.621246337890625, 0.6657257080078125, 0.710205078125, 0.7546844482421875, 0.799163818359375, 0.8436431884765625, 0.88812255859375, 0.9326019287109375, 0.977081298828125, 1.0215606689453125, 1.0660400390625, 1.1105194091796875, 1.154998779296875, 1.1994781494140625, 1.24395751953125, 1.2884368896484375, 1.332916259765625, 1.3773956298828125, 1.421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 14.0, 25.0, 51.0, 57.0, 77.0, 170.0, 256.0, 412.0, 764.0, 1855.0, 6301.0, 38539.0, 387533.0, 551943.0, 48835.0, 7647.0, 2010.0, 893.0, 426.0, 263.0, 159.0, 104.0, 61.0, 34.0, 28.0, 22.0, 16.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.11712646484375, -6.8084716796875, -6.49981689453125, -6.191162109375, -5.88250732421875, -5.5738525390625, -5.26519775390625, -4.95654296875, -4.64788818359375, -4.3392333984375, -4.03057861328125, -3.721923828125, -3.41326904296875, -3.1046142578125, -2.79595947265625, -2.4873046875, -2.17864990234375, -1.8699951171875, -1.56134033203125, -1.252685546875, -0.94403076171875, -0.6353759765625, -0.32672119140625, -0.01806640625, 0.29058837890625, 0.5992431640625, 0.90789794921875, 1.216552734375, 1.52520751953125, 1.8338623046875, 2.14251708984375, 2.451171875, 2.75982666015625, 3.0684814453125, 3.37713623046875, 3.685791015625, 3.99444580078125, 4.3031005859375, 4.61175537109375, 4.92041015625, 5.22906494140625, 5.5377197265625, 5.84637451171875, 6.155029296875, 6.46368408203125, 6.7723388671875, 7.08099365234375, 7.3896484375, 7.69830322265625, 8.0069580078125, 8.31561279296875, 8.624267578125, 8.93292236328125, 9.2415771484375, 9.55023193359375, 9.85888671875, 10.16754150390625, 10.4761962890625, 10.78485107421875, 11.093505859375, 11.40216064453125, 11.7108154296875, 12.01947021484375, 12.328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 7.0, 8.0, 10.0, 9.0, 15.0, 19.0, 19.0, 20.0, 25.0, 41.0, 34.0, 40.0, 38.0, 41.0, 49.0, 44.0, 39.0, 55.0, 57.0, 50.0, 46.0, 40.0, 30.0, 38.0, 27.0, 29.0, 33.0, 23.0, 28.0, 14.0, 14.0, 8.0, 3.0, 6.0, 8.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7984619140625, -5.612548828125, -5.4266357421875, -5.24072265625, -5.0548095703125, -4.868896484375, -4.6829833984375, -4.4970703125, -4.3111572265625, -4.125244140625, -3.9393310546875, -3.75341796875, -3.5675048828125, -3.381591796875, -3.1956787109375, -3.009765625, -2.8238525390625, -2.637939453125, -2.4520263671875, -2.26611328125, -2.0802001953125, -1.894287109375, -1.7083740234375, -1.5224609375, -1.3365478515625, -1.150634765625, -0.9647216796875, -0.77880859375, -0.5928955078125, -0.406982421875, -0.2210693359375, -0.03515625, 0.1507568359375, 0.336669921875, 0.5225830078125, 0.70849609375, 0.8944091796875, 1.080322265625, 1.2662353515625, 1.4521484375, 1.6380615234375, 1.823974609375, 2.0098876953125, 2.19580078125, 2.3817138671875, 2.567626953125, 2.7535400390625, 2.939453125, 3.1253662109375, 3.311279296875, 3.4971923828125, 3.68310546875, 3.8690185546875, 4.054931640625, 4.2408447265625, 4.4267578125, 4.6126708984375, 4.798583984375, 4.9844970703125, 5.17041015625, 5.3563232421875, 5.542236328125, 5.7281494140625, 5.9140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 13.0, 23.0, 22.0, 34.0, 58.0, 93.0, 175.0, 298.0, 622.0, 1246.0, 3039.0, 8145.0, 23854.0, 75957.0, 330608.0, 462081.0, 96846.0, 28849.0, 9854.0, 3695.0, 1498.0, 693.0, 337.0, 204.0, 101.0, 59.0, 43.0, 30.0, 21.0, 14.0, 8.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.015625, -3.91546630859375, -3.8153076171875, -3.71514892578125, -3.614990234375, -3.51483154296875, -3.4146728515625, -3.31451416015625, -3.21435546875, -3.11419677734375, -3.0140380859375, -2.91387939453125, -2.813720703125, -2.71356201171875, -2.6134033203125, -2.51324462890625, -2.4130859375, -2.31292724609375, -2.2127685546875, -2.11260986328125, -2.012451171875, -1.91229248046875, -1.8121337890625, -1.71197509765625, -1.61181640625, -1.51165771484375, -1.4114990234375, -1.31134033203125, -1.211181640625, -1.11102294921875, -1.0108642578125, -0.91070556640625, -0.810546875, -0.71038818359375, -0.6102294921875, -0.51007080078125, -0.409912109375, -0.30975341796875, -0.2095947265625, -0.10943603515625, -0.00927734375, 0.09088134765625, 0.1910400390625, 0.29119873046875, 0.391357421875, 0.49151611328125, 0.5916748046875, 0.69183349609375, 0.7919921875, 0.89215087890625, 0.9923095703125, 1.09246826171875, 1.192626953125, 1.29278564453125, 1.3929443359375, 1.49310302734375, 1.59326171875, 1.69342041015625, 1.7935791015625, 1.89373779296875, 1.993896484375, 2.09405517578125, 2.1942138671875, 2.29437255859375, 2.39453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 19.0, 10.0, 17.0, 27.0, 26.0, 38.0, 45.0, 55.0, 99.0, 207.0, 140.0, 62.0, 41.0, 29.0, 30.0, 25.0, 21.0, 17.0, 16.0, 11.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000835418701171875, -0.0008098036050796509, -0.0007841885089874268, -0.0007585734128952026, -0.0007329583168029785, -0.0007073432207107544, -0.0006817281246185303, -0.0006561130285263062, -0.000630497932434082, -0.0006048828363418579, -0.0005792677402496338, -0.0005536526441574097, -0.0005280375480651855, -0.0005024224519729614, -0.0004768073558807373, -0.0004511922597885132, -0.00042557716369628906, -0.00039996206760406494, -0.0003743469715118408, -0.0003487318754196167, -0.0003231167793273926, -0.00029750168323516846, -0.00027188658714294434, -0.0002462714910507202, -0.0002206563949584961, -0.00019504129886627197, -0.00016942620277404785, -0.00014381110668182373, -0.00011819601058959961, -9.258091449737549e-05, -6.696581840515137e-05, -4.1350722312927246e-05, -1.5735626220703125e-05, 9.879469871520996e-06, 3.549456596374512e-05, 6.110966205596924e-05, 8.672475814819336e-05, 0.00011233985424041748, 0.0001379549503326416, 0.00016357004642486572, 0.00018918514251708984, 0.00021480023860931396, 0.00024041533470153809, 0.0002660304307937622, 0.00029164552688598633, 0.00031726062297821045, 0.00034287571907043457, 0.0003684908151626587, 0.0003941059112548828, 0.00041972100734710693, 0.00044533610343933105, 0.0004709511995315552, 0.0004965662956237793, 0.0005221813917160034, 0.0005477964878082275, 0.0005734115839004517, 0.0005990266799926758, 0.0006246417760848999, 0.000650256872177124, 0.0006758719682693481, 0.0007014870643615723, 0.0007271021604537964, 0.0007527172565460205, 0.0007783323526382446, 0.0008039474487304688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 10.0, 18.0, 19.0, 20.0, 43.0, 51.0, 85.0, 163.0, 314.0, 560.0, 1420.0, 4589.0, 22625.0, 173400.0, 709442.0, 113809.0, 16021.0, 3655.0, 1154.0, 509.0, 241.0, 127.0, 85.0, 48.0, 34.0, 17.0, 22.0, 21.0, 10.0, 11.0, 8.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.1875, -6.0220947265625, -5.856689453125, -5.6912841796875, -5.52587890625, -5.3604736328125, -5.195068359375, -5.0296630859375, -4.8642578125, -4.6988525390625, -4.533447265625, -4.3680419921875, -4.20263671875, -4.0372314453125, -3.871826171875, -3.7064208984375, -3.541015625, -3.3756103515625, -3.210205078125, -3.0447998046875, -2.87939453125, -2.7139892578125, -2.548583984375, -2.3831787109375, -2.2177734375, -2.0523681640625, -1.886962890625, -1.7215576171875, -1.55615234375, -1.3907470703125, -1.225341796875, -1.0599365234375, -0.89453125, -0.7291259765625, -0.563720703125, -0.3983154296875, -0.23291015625, -0.0675048828125, 0.097900390625, 0.2633056640625, 0.4287109375, 0.5941162109375, 0.759521484375, 0.9249267578125, 1.09033203125, 1.2557373046875, 1.421142578125, 1.5865478515625, 1.751953125, 1.9173583984375, 2.082763671875, 2.2481689453125, 2.41357421875, 2.5789794921875, 2.744384765625, 2.9097900390625, 3.0751953125, 3.2406005859375, 3.406005859375, 3.5714111328125, 3.73681640625, 3.9022216796875, 4.067626953125, 4.2330322265625, 4.3984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 12.0, 19.0, 15.0, 31.0, 42.0, 69.0, 89.0, 118.0, 145.0, 126.0, 93.0, 70.0, 44.0, 33.0, 24.0, 10.0, 13.0, 11.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.26953125, -6.1324462890625, -5.995361328125, -5.8582763671875, -5.72119140625, -5.5841064453125, -5.447021484375, -5.3099365234375, -5.1728515625, -5.0357666015625, -4.898681640625, -4.7615966796875, -4.62451171875, -4.4874267578125, -4.350341796875, -4.2132568359375, -4.076171875, -3.9390869140625, -3.802001953125, -3.6649169921875, -3.52783203125, -3.3907470703125, -3.253662109375, -3.1165771484375, -2.9794921875, -2.8424072265625, -2.705322265625, -2.5682373046875, -2.43115234375, -2.2940673828125, -2.156982421875, -2.0198974609375, -1.8828125, -1.7457275390625, -1.608642578125, -1.4715576171875, -1.33447265625, -1.1973876953125, -1.060302734375, -0.9232177734375, -0.7861328125, -0.6490478515625, -0.511962890625, -0.3748779296875, -0.23779296875, -0.1007080078125, 0.036376953125, 0.1734619140625, 0.310546875, 0.4476318359375, 0.584716796875, 0.7218017578125, 0.85888671875, 0.9959716796875, 1.133056640625, 1.2701416015625, 1.4072265625, 1.5443115234375, 1.681396484375, 1.8184814453125, 1.95556640625, 2.0926513671875, 2.229736328125, 2.3668212890625, 2.50390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 21.0, 65.0, 181.0, 338.0, 251.0, 103.0, 24.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.445945739746094, -42.7911262512207, -39.13630676269531, -35.48148727416992, -31.82666778564453, -28.17184829711914, -24.51702880859375, -20.86220932006836, -17.20738983154297, -13.552570343017578, -9.897750854492188, -6.242931365966797, -2.5881118774414062, 1.0667076110839844, 4.721527099609375, 8.376346588134766, 12.031166076660156, 15.685985565185547, 19.340805053710938, 22.995624542236328, 26.65044403076172, 30.30526351928711, 33.9600830078125, 37.61490249633789, 41.26972198486328, 44.92454147338867, 48.57936096191406, 52.23418045043945, 55.888999938964844, 59.543819427490234, 63.198638916015625, 66.85345458984375, 70.50827026367188, 74.1630859375, 77.81790924072266, 81.47273254394531, 85.12754821777344, 88.78236389160156, 92.43718719482422, 96.09201049804688, 99.746826171875, 103.40164184570312, 107.05646514892578, 110.71128845214844, 114.36610412597656, 118.02091979980469, 121.67574310302734, 125.33056640625, 128.98538208007812, 132.64019775390625, 136.29501342773438, 139.94984436035156, 143.6046600341797, 147.2594757080078, 150.914306640625, 154.56912231445312, 158.22393798828125, 161.87875366210938, 165.5335693359375, 169.1884002685547, 172.8432159423828, 176.49803161621094, 180.15286254882812, 183.80767822265625, 187.46249389648438]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 8.0, 13.0, 13.0, 15.0, 15.0, 23.0, 20.0, 22.0, 17.0, 25.0, 36.0, 44.0, 33.0, 52.0, 35.0, 41.0, 45.0, 50.0, 43.0, 35.0, 45.0, 39.0, 44.0, 27.0, 29.0, 28.0, 27.0, 20.0, 22.0, 17.0, 18.0, 16.0, 11.0, 11.0, 6.0, 6.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.444995880126953, -28.50366973876953, -27.56234359741211, -26.621017456054688, -25.679691314697266, -24.738365173339844, -23.797039031982422, -22.855712890625, -21.914386749267578, -20.973060607910156, -20.031734466552734, -19.090408325195312, -18.14908218383789, -17.20775604248047, -16.266429901123047, -15.325104713439941, -14.383779525756836, -13.442453384399414, -12.501127243041992, -11.55980110168457, -10.618474960327148, -9.677148818969727, -8.735823631286621, -7.794497489929199, -6.853171348571777, -5.9118452072143555, -4.970519065856934, -4.02919340133667, -3.087867259979248, -2.146541118621826, -1.2052154541015625, -0.2638893127441406, 0.6774368286132812, 1.6187628507614136, 2.560088872909546, 3.5014147758483887, 4.4427409172058105, 5.384067058563232, 6.325392723083496, 7.266718864440918, 8.20804500579834, 9.149371147155762, 10.090697288513184, 11.032022476196289, 11.973348617553711, 12.914674758911133, 13.856000900268555, 14.797327041625977, 15.738653182983398, 16.67997932434082, 17.621305465698242, 18.562631607055664, 19.503957748413086, 20.445283889770508, 21.386608123779297, 22.32793426513672, 23.26926040649414, 24.210586547851562, 25.151912689208984, 26.093238830566406, 27.034564971923828, 27.97589111328125, 28.917217254638672, 29.858543395996094, 30.799869537353516]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 12.0, 21.0, 25.0, 59.0, 110.0, 221.0, 571.0, 1665.0, 6552.0, 32435.0, 398894.0, 3672063.0, 66051.0, 11341.0, 2787.0, 860.0, 294.0, 134.0, 74.0, 33.0, 27.0, 18.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7454833984375, -9.342529296875, -8.9395751953125, -8.53662109375, -8.1336669921875, -7.730712890625, -7.3277587890625, -6.9248046875, -6.5218505859375, -6.118896484375, -5.7159423828125, -5.31298828125, -4.9100341796875, -4.507080078125, -4.1041259765625, -3.701171875, -3.2982177734375, -2.895263671875, -2.4923095703125, -2.08935546875, -1.6864013671875, -1.283447265625, -0.8804931640625, -0.4775390625, -0.0745849609375, 0.328369140625, 0.7313232421875, 1.13427734375, 1.5372314453125, 1.940185546875, 2.3431396484375, 2.74609375, 3.1490478515625, 3.552001953125, 3.9549560546875, 4.35791015625, 4.7608642578125, 5.163818359375, 5.5667724609375, 5.9697265625, 6.3726806640625, 6.775634765625, 7.1785888671875, 7.58154296875, 7.9844970703125, 8.387451171875, 8.7904052734375, 9.193359375, 9.5963134765625, 9.999267578125, 10.4022216796875, 10.80517578125, 11.2081298828125, 11.611083984375, 12.0140380859375, 12.4169921875, 12.8199462890625, 13.222900390625, 13.6258544921875, 14.02880859375, 14.4317626953125, 14.834716796875, 15.2376708984375, 15.640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 5.0, 9.0, 11.0, 11.0, 14.0, 15.0, 25.0, 22.0, 33.0, 31.0, 41.0, 41.0, 42.0, 43.0, 35.0, 48.0, 61.0, 59.0, 52.0, 46.0, 35.0, 44.0, 39.0, 36.0, 34.0, 36.0, 22.0, 13.0, 22.0, 16.0, 17.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3505859375, -1.3067779541015625, -1.262969970703125, -1.2191619873046875, -1.17535400390625, -1.1315460205078125, -1.087738037109375, -1.0439300537109375, -1.0001220703125, -0.9563140869140625, -0.912506103515625, -0.8686981201171875, -0.82489013671875, -0.7810821533203125, -0.737274169921875, -0.6934661865234375, -0.649658203125, -0.6058502197265625, -0.562042236328125, -0.5182342529296875, -0.47442626953125, -0.4306182861328125, -0.386810302734375, -0.3430023193359375, -0.2991943359375, -0.2553863525390625, -0.211578369140625, -0.1677703857421875, -0.12396240234375, -0.0801544189453125, -0.036346435546875, 0.0074615478515625, 0.05126953125, 0.0950775146484375, 0.138885498046875, 0.1826934814453125, 0.22650146484375, 0.2703094482421875, 0.314117431640625, 0.3579254150390625, 0.4017333984375, 0.4455413818359375, 0.489349365234375, 0.5331573486328125, 0.57696533203125, 0.6207733154296875, 0.664581298828125, 0.7083892822265625, 0.752197265625, 0.7960052490234375, 0.839813232421875, 0.8836212158203125, 0.92742919921875, 0.9712371826171875, 1.015045166015625, 1.0588531494140625, 1.1026611328125, 1.1464691162109375, 1.190277099609375, 1.2340850830078125, 1.27789306640625, 1.3217010498046875, 1.365509033203125, 1.4093170166015625, 1.453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 10.0, 9.0, 8.0, 12.0, 12.0, 25.0, 34.0, 49.0, 65.0, 90.0, 133.0, 188.0, 284.0, 444.0, 737.0, 1215.0, 2190.0, 4384.0, 9058.0, 20804.0, 56349.0, 205633.0, 3089075.0, 633878.0, 107111.0, 34773.0, 13884.0, 6298.0, 3162.0, 1665.0, 962.0, 578.0, 367.0, 257.0, 147.0, 113.0, 78.0, 62.0, 38.0, 32.0, 19.0, 12.0, 10.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.24609375, -6.04949951171875, -5.8529052734375, -5.65631103515625, -5.459716796875, -5.26312255859375, -5.0665283203125, -4.86993408203125, -4.67333984375, -4.47674560546875, -4.2801513671875, -4.08355712890625, -3.886962890625, -3.69036865234375, -3.4937744140625, -3.29718017578125, -3.1005859375, -2.90399169921875, -2.7073974609375, -2.51080322265625, -2.314208984375, -2.11761474609375, -1.9210205078125, -1.72442626953125, -1.52783203125, -1.33123779296875, -1.1346435546875, -0.93804931640625, -0.741455078125, -0.54486083984375, -0.3482666015625, -0.15167236328125, 0.044921875, 0.24151611328125, 0.4381103515625, 0.63470458984375, 0.831298828125, 1.02789306640625, 1.2244873046875, 1.42108154296875, 1.61767578125, 1.81427001953125, 2.0108642578125, 2.20745849609375, 2.404052734375, 2.60064697265625, 2.7972412109375, 2.99383544921875, 3.1904296875, 3.38702392578125, 3.5836181640625, 3.78021240234375, 3.976806640625, 4.17340087890625, 4.3699951171875, 4.56658935546875, 4.76318359375, 4.95977783203125, 5.1563720703125, 5.35296630859375, 5.549560546875, 5.74615478515625, 5.9427490234375, 6.13934326171875, 6.3359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 14.0, 17.0, 29.0, 41.0, 58.0, 92.0, 140.0, 245.0, 736.0, 1684.0, 401.0, 189.0, 109.0, 63.0, 45.0, 42.0, 28.0, 19.0, 20.0, 12.0, 8.0, 7.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.16015625, -3.04815673828125, -2.9361572265625, -2.82415771484375, -2.712158203125, -2.60015869140625, -2.4881591796875, -2.37615966796875, -2.26416015625, -2.15216064453125, -2.0401611328125, -1.92816162109375, -1.816162109375, -1.70416259765625, -1.5921630859375, -1.48016357421875, -1.3681640625, -1.25616455078125, -1.1441650390625, -1.03216552734375, -0.920166015625, -0.80816650390625, -0.6961669921875, -0.58416748046875, -0.47216796875, -0.36016845703125, -0.2481689453125, -0.13616943359375, -0.024169921875, 0.08782958984375, 0.1998291015625, 0.31182861328125, 0.423828125, 0.53582763671875, 0.6478271484375, 0.75982666015625, 0.871826171875, 0.98382568359375, 1.0958251953125, 1.20782470703125, 1.31982421875, 1.43182373046875, 1.5438232421875, 1.65582275390625, 1.767822265625, 1.87982177734375, 1.9918212890625, 2.10382080078125, 2.2158203125, 2.32781982421875, 2.4398193359375, 2.55181884765625, 2.663818359375, 2.77581787109375, 2.8878173828125, 2.99981689453125, 3.11181640625, 3.22381591796875, 3.3358154296875, 3.44781494140625, 3.559814453125, 3.67181396484375, 3.7838134765625, 3.89581298828125, 4.0078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 11.0, 14.0, 27.0, 39.0, 46.0, 78.0, 105.0, 106.0, 130.0, 121.0, 77.0, 70.0, 62.0, 39.0, 28.0, 15.0, 7.0, 10.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.542293548583984, -11.814962387084961, -11.087631225585938, -10.360299110412598, -9.632967948913574, -8.90563678741455, -8.178304672241211, -7.4509735107421875, -6.723642349243164, -5.996311187744141, -5.268979549407959, -4.541647911071777, -3.814316749572754, -3.0869853496551514, -2.359653949737549, -1.6323223114013672, -0.9049911499023438, -0.1776597499847412, 0.5496716499328613, 1.2770030498504639, 2.0043344497680664, 2.731665849685669, 3.4589972496032715, 4.186328887939453, 4.913660049438477, 5.6409912109375, 6.368322849273682, 7.095654487609863, 7.822985649108887, 8.55031681060791, 9.27764892578125, 10.004980087280273, 10.732311248779297, 11.45964241027832, 12.186973571777344, 12.914305686950684, 13.641636848449707, 14.36896800994873, 15.09630012512207, 15.823631286621094, 16.550962448120117, 17.27829360961914, 18.005624771118164, 18.732955932617188, 19.460289001464844, 20.187620162963867, 20.91495132446289, 21.642282485961914, 22.369613647460938, 23.09694480895996, 23.824275970458984, 24.551607131958008, 25.27893829345703, 26.006271362304688, 26.73360252380371, 27.460933685302734, 28.188264846801758, 28.91559600830078, 29.642927169799805, 30.370258331298828, 31.097591400146484, 31.824922561645508, 32.55225372314453, 33.27958679199219, 34.00691604614258]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 14.0, 15.0, 18.0, 19.0, 23.0, 23.0, 36.0, 26.0, 27.0, 31.0, 31.0, 35.0, 42.0, 43.0, 48.0, 43.0, 44.0, 34.0, 40.0, 32.0, 46.0, 31.0, 29.0, 33.0, 27.0, 28.0, 18.0, 15.0, 17.0, 19.0, 16.0, 9.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.027045249938965, -10.672649383544922, -10.318252563476562, -9.96385669708252, -9.609460830688477, -9.255064010620117, -8.900668144226074, -8.546272277832031, -8.191875457763672, -7.837479114532471, -7.4830827713012695, -7.128686904907227, -6.774290561676025, -6.419894218444824, -6.065498352050781, -5.71110200881958, -5.356705665588379, -5.002309322357178, -4.647912979125977, -4.293517112731934, -3.9391207695007324, -3.5847244262695312, -3.230328321456909, -2.875932216644287, -2.521535873413086, -2.1671395301818848, -1.8127434253692627, -1.458347201347351, -1.1039509773254395, -0.7495547533035278, -0.3951585292816162, -0.04076242446899414, 0.31363487243652344, 0.6680310964584351, 1.0224273204803467, 1.3768235445022583, 1.73121976852417, 2.085616111755371, 2.440012216567993, 2.7944083213806152, 3.1488046646118164, 3.5032010078430176, 3.8575971126556396, 4.211993217468262, 4.566389560699463, 4.920785903930664, 5.275181770324707, 5.629578113555908, 5.983974456787109, 6.3383708000183105, 6.692767143249512, 7.047163009643555, 7.401559352874756, 7.755955696105957, 8.1103515625, 8.46474838256836, 8.819144248962402, 9.173540115356445, 9.527936935424805, 9.882332801818848, 10.23672866821289, 10.59112548828125, 10.945521354675293, 11.299917221069336, 11.654314041137695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 19.0, 23.0, 26.0, 68.0, 96.0, 168.0, 289.0, 615.0, 1291.0, 3147.0, 8648.0, 28011.0, 102977.0, 384054.0, 377173.0, 100549.0, 27158.0, 8557.0, 3101.0, 1288.0, 570.0, 291.0, 188.0, 94.0, 59.0, 26.0, 18.0, 10.0, 7.0, 7.0, 3.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.63739013671875, -6.4232177734375, -6.20904541015625, -5.994873046875, -5.78070068359375, -5.5665283203125, -5.35235595703125, -5.13818359375, -4.92401123046875, -4.7098388671875, -4.49566650390625, -4.281494140625, -4.06732177734375, -3.8531494140625, -3.63897705078125, -3.4248046875, -3.21063232421875, -2.9964599609375, -2.78228759765625, -2.568115234375, -2.35394287109375, -2.1397705078125, -1.92559814453125, -1.71142578125, -1.49725341796875, -1.2830810546875, -1.06890869140625, -0.854736328125, -0.64056396484375, -0.4263916015625, -0.21221923828125, 0.001953125, 0.21612548828125, 0.4302978515625, 0.64447021484375, 0.858642578125, 1.07281494140625, 1.2869873046875, 1.50115966796875, 1.71533203125, 1.92950439453125, 2.1436767578125, 2.35784912109375, 2.572021484375, 2.78619384765625, 3.0003662109375, 3.21453857421875, 3.4287109375, 3.64288330078125, 3.8570556640625, 4.07122802734375, 4.285400390625, 4.49957275390625, 4.7137451171875, 4.92791748046875, 5.14208984375, 5.35626220703125, 5.5704345703125, 5.78460693359375, 5.998779296875, 6.21295166015625, 6.4271240234375, 6.64129638671875, 6.85546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 4.0, 8.0, 15.0, 17.0, 22.0, 19.0, 25.0, 28.0, 34.0, 39.0, 53.0, 43.0, 46.0, 54.0, 42.0, 49.0, 61.0, 59.0, 50.0, 38.0, 56.0, 38.0, 41.0, 27.0, 29.0, 23.0, 20.0, 18.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.638671875, -1.5885772705078125, -1.538482666015625, -1.4883880615234375, -1.43829345703125, -1.3881988525390625, -1.338104248046875, -1.2880096435546875, -1.2379150390625, -1.1878204345703125, -1.137725830078125, -1.0876312255859375, -1.03753662109375, -0.9874420166015625, -0.937347412109375, -0.8872528076171875, -0.837158203125, -0.7870635986328125, -0.736968994140625, -0.6868743896484375, -0.63677978515625, -0.5866851806640625, -0.536590576171875, -0.4864959716796875, -0.4364013671875, -0.3863067626953125, -0.336212158203125, -0.2861175537109375, -0.23602294921875, -0.1859283447265625, -0.135833740234375, -0.0857391357421875, -0.03564453125, 0.0144500732421875, 0.064544677734375, 0.1146392822265625, 0.16473388671875, 0.2148284912109375, 0.264923095703125, 0.3150177001953125, 0.3651123046875, 0.4152069091796875, 0.465301513671875, 0.5153961181640625, 0.56549072265625, 0.6155853271484375, 0.665679931640625, 0.7157745361328125, 0.765869140625, 0.8159637451171875, 0.866058349609375, 0.9161529541015625, 0.96624755859375, 1.0163421630859375, 1.066436767578125, 1.1165313720703125, 1.1666259765625, 1.2167205810546875, 1.266815185546875, 1.3169097900390625, 1.36700439453125, 1.4170989990234375, 1.467193603515625, 1.5172882080078125, 1.5673828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 7.0, 6.0, 10.0, 12.0, 13.0, 24.0, 37.0, 31.0, 80.0, 130.0, 221.0, 356.0, 660.0, 1360.0, 3668.0, 14321.0, 107283.0, 718131.0, 173607.0, 20488.0, 4614.0, 1656.0, 812.0, 417.0, 223.0, 140.0, 73.0, 61.0, 35.0, 21.0, 16.0, 9.0, 20.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -11.03271484375, -10.7138671875, -10.39501953125, -10.076171875, -9.75732421875, -9.4384765625, -9.11962890625, -8.80078125, -8.48193359375, -8.1630859375, -7.84423828125, -7.525390625, -7.20654296875, -6.8876953125, -6.56884765625, -6.25, -5.93115234375, -5.6123046875, -5.29345703125, -4.974609375, -4.65576171875, -4.3369140625, -4.01806640625, -3.69921875, -3.38037109375, -3.0615234375, -2.74267578125, -2.423828125, -2.10498046875, -1.7861328125, -1.46728515625, -1.1484375, -0.82958984375, -0.5107421875, -0.19189453125, 0.126953125, 0.44580078125, 0.7646484375, 1.08349609375, 1.40234375, 1.72119140625, 2.0400390625, 2.35888671875, 2.677734375, 2.99658203125, 3.3154296875, 3.63427734375, 3.953125, 4.27197265625, 4.5908203125, 4.90966796875, 5.228515625, 5.54736328125, 5.8662109375, 6.18505859375, 6.50390625, 6.82275390625, 7.1416015625, 7.46044921875, 7.779296875, 8.09814453125, 8.4169921875, 8.73583984375, 9.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 9.0, 19.0, 24.0, 16.0, 24.0, 24.0, 24.0, 32.0, 36.0, 36.0, 38.0, 32.0, 46.0, 47.0, 50.0, 44.0, 44.0, 37.0, 46.0, 45.0, 56.0, 31.0, 31.0, 26.0, 22.0, 26.0, 19.0, 23.0, 14.0, 9.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.23046875, -7.008544921875, -6.78662109375, -6.564697265625, -6.3427734375, -6.120849609375, -5.89892578125, -5.677001953125, -5.455078125, -5.233154296875, -5.01123046875, -4.789306640625, -4.5673828125, -4.345458984375, -4.12353515625, -3.901611328125, -3.6796875, -3.457763671875, -3.23583984375, -3.013916015625, -2.7919921875, -2.570068359375, -2.34814453125, -2.126220703125, -1.904296875, -1.682373046875, -1.46044921875, -1.238525390625, -1.0166015625, -0.794677734375, -0.57275390625, -0.350830078125, -0.12890625, 0.093017578125, 0.31494140625, 0.536865234375, 0.7587890625, 0.980712890625, 1.20263671875, 1.424560546875, 1.646484375, 1.868408203125, 2.09033203125, 2.312255859375, 2.5341796875, 2.756103515625, 2.97802734375, 3.199951171875, 3.421875, 3.643798828125, 3.86572265625, 4.087646484375, 4.3095703125, 4.531494140625, 4.75341796875, 4.975341796875, 5.197265625, 5.419189453125, 5.64111328125, 5.863037109375, 6.0849609375, 6.306884765625, 6.52880859375, 6.750732421875, 6.97265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 11.0, 12.0, 30.0, 36.0, 79.0, 103.0, 242.0, 494.0, 1150.0, 3110.0, 10778.0, 56634.0, 394649.0, 488475.0, 73377.0, 13415.0, 3506.0, 1271.0, 539.0, 281.0, 134.0, 81.0, 53.0, 22.0, 24.0, 11.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.899169921875, -4.75537109375, -4.611572265625, -4.4677734375, -4.323974609375, -4.18017578125, -4.036376953125, -3.892578125, -3.748779296875, -3.60498046875, -3.461181640625, -3.3173828125, -3.173583984375, -3.02978515625, -2.885986328125, -2.7421875, -2.598388671875, -2.45458984375, -2.310791015625, -2.1669921875, -2.023193359375, -1.87939453125, -1.735595703125, -1.591796875, -1.447998046875, -1.30419921875, -1.160400390625, -1.0166015625, -0.872802734375, -0.72900390625, -0.585205078125, -0.44140625, -0.297607421875, -0.15380859375, -0.010009765625, 0.1337890625, 0.277587890625, 0.42138671875, 0.565185546875, 0.708984375, 0.852783203125, 0.99658203125, 1.140380859375, 1.2841796875, 1.427978515625, 1.57177734375, 1.715576171875, 1.859375, 2.003173828125, 2.14697265625, 2.290771484375, 2.4345703125, 2.578369140625, 2.72216796875, 2.865966796875, 3.009765625, 3.153564453125, 3.29736328125, 3.441162109375, 3.5849609375, 3.728759765625, 3.87255859375, 4.016357421875, 4.16015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 18.0, 12.0, 24.0, 28.0, 30.0, 47.0, 61.0, 70.0, 76.0, 101.0, 100.0, 78.0, 64.0, 60.0, 38.0, 28.0, 28.0, 23.0, 21.0, 11.0, 12.0, 6.0, 3.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006122589111328125, -0.0005916431546211243, -0.000571027398109436, -0.0005504116415977478, -0.0005297958850860596, -0.0005091801285743713, -0.0004885643720626831, -0.0004679486155509949, -0.00044733285903930664, -0.0004267171025276184, -0.0004061013460159302, -0.00038548558950424194, -0.0003648698329925537, -0.0003442540764808655, -0.00032363831996917725, -0.000303022563457489, -0.0002824068069458008, -0.00026179105043411255, -0.00024117529392242432, -0.00022055953741073608, -0.00019994378089904785, -0.00017932802438735962, -0.0001587122678756714, -0.00013809651136398315, -0.00011748075485229492, -9.686499834060669e-05, -7.624924182891846e-05, -5.5633485317230225e-05, -3.501772880554199e-05, -1.440197229385376e-05, 6.213784217834473e-06, 2.6829540729522705e-05, 4.744529724121094e-05, 6.806105375289917e-05, 8.86768102645874e-05, 0.00010929256677627563, 0.00012990832328796387, 0.0001505240797996521, 0.00017113983631134033, 0.00019175559282302856, 0.0002123713493347168, 0.00023298710584640503, 0.00025360286235809326, 0.0002742186188697815, 0.0002948343753814697, 0.00031545013189315796, 0.0003360658884048462, 0.0003566816449165344, 0.00037729740142822266, 0.0003979131579399109, 0.0004185289144515991, 0.00043914467096328735, 0.0004597604274749756, 0.0004803761839866638, 0.000500991940498352, 0.0005216076970100403, 0.0005422234535217285, 0.0005628392100334167, 0.000583454966545105, 0.0006040707230567932, 0.0006246864795684814, 0.0006453022360801697, 0.0006659179925918579, 0.0006865337491035461, 0.0007071495056152344]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 16.0, 41.0, 63.0, 187.0, 493.0, 1576.0, 8214.0, 109368.0, 841762.0, 77975.0, 6720.0, 1378.0, 414.0, 178.0, 77.0, 39.0, 15.0, 9.0, 7.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5152587890625, -7.241455078125, -6.9676513671875, -6.69384765625, -6.4200439453125, -6.146240234375, -5.8724365234375, -5.5986328125, -5.3248291015625, -5.051025390625, -4.7772216796875, -4.50341796875, -4.2296142578125, -3.955810546875, -3.6820068359375, -3.408203125, -3.1343994140625, -2.860595703125, -2.5867919921875, -2.31298828125, -2.0391845703125, -1.765380859375, -1.4915771484375, -1.2177734375, -0.9439697265625, -0.670166015625, -0.3963623046875, -0.12255859375, 0.1512451171875, 0.425048828125, 0.6988525390625, 0.97265625, 1.2464599609375, 1.520263671875, 1.7940673828125, 2.06787109375, 2.3416748046875, 2.615478515625, 2.8892822265625, 3.1630859375, 3.4368896484375, 3.710693359375, 3.9844970703125, 4.25830078125, 4.5321044921875, 4.805908203125, 5.0797119140625, 5.353515625, 5.6273193359375, 5.901123046875, 6.1749267578125, 6.44873046875, 6.7225341796875, 6.996337890625, 7.2701416015625, 7.5439453125, 7.8177490234375, 8.091552734375, 8.3653564453125, 8.63916015625, 8.9129638671875, 9.186767578125, 9.4605712890625, 9.734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 8.0, 15.0, 14.0, 16.0, 25.0, 39.0, 38.0, 64.0, 66.0, 65.0, 85.0, 84.0, 45.0, 70.0, 69.0, 66.0, 31.0, 33.0, 34.0, 24.0, 20.0, 11.0, 10.0, 9.0, 2.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.931640625, -2.841827392578125, -2.75201416015625, -2.662200927734375, -2.5723876953125, -2.482574462890625, -2.39276123046875, -2.302947998046875, -2.213134765625, -2.123321533203125, -2.03350830078125, -1.943695068359375, -1.8538818359375, -1.764068603515625, -1.67425537109375, -1.584442138671875, -1.49462890625, -1.404815673828125, -1.31500244140625, -1.225189208984375, -1.1353759765625, -1.045562744140625, -0.95574951171875, -0.865936279296875, -0.776123046875, -0.686309814453125, -0.59649658203125, -0.506683349609375, -0.4168701171875, -0.327056884765625, -0.23724365234375, -0.147430419921875, -0.0576171875, 0.032196044921875, 0.12200927734375, 0.211822509765625, 0.3016357421875, 0.391448974609375, 0.48126220703125, 0.571075439453125, 0.660888671875, 0.750701904296875, 0.84051513671875, 0.930328369140625, 1.0201416015625, 1.109954833984375, 1.19976806640625, 1.289581298828125, 1.37939453125, 1.469207763671875, 1.55902099609375, 1.648834228515625, 1.7386474609375, 1.828460693359375, 1.91827392578125, 2.008087158203125, 2.097900390625, 2.187713623046875, 2.27752685546875, 2.367340087890625, 2.4571533203125, 2.546966552734375, 2.63677978515625, 2.726593017578125, 2.81640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 13.0, 12.0, 22.0, 33.0, 29.0, 49.0, 68.0, 99.0, 93.0, 132.0, 94.0, 89.0, 81.0, 54.0, 42.0, 31.0, 23.0, 5.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.91415786743164, -41.5188102722168, -40.12346267700195, -38.72811508178711, -37.33277130126953, -35.93742370605469, -34.542076110839844, -33.146728515625, -31.751380920410156, -30.356033325195312, -28.96068572998047, -27.565340042114258, -26.169992446899414, -24.77464485168457, -23.37929916381836, -21.983951568603516, -20.588603973388672, -19.193256378173828, -17.797908782958984, -16.402563095092773, -15.00721549987793, -13.611867904663086, -12.216521263122559, -10.821174621582031, -9.425827026367188, -8.030479431152344, -6.635132789611816, -5.239785671234131, -3.8444385528564453, -2.4490914344787598, -1.0537443161010742, 0.3416023254394531, 1.7369461059570312, 3.132293224334717, 4.527640342712402, 5.922987461090088, 7.318334579467773, 8.713682174682617, 10.109028816223145, 11.504375457763672, 12.899723052978516, 14.29507064819336, 15.690417289733887, 17.085763931274414, 18.481111526489258, 19.8764591217041, 21.271804809570312, 22.667152404785156, 24.0625, 25.457847595214844, 26.853195190429688, 28.2485408782959, 29.643888473510742, 31.039236068725586, 32.4345817565918, 33.82992935180664, 35.225276947021484, 36.62062454223633, 38.01597213745117, 39.411319732666016, 40.806663513183594, 42.20201110839844, 43.59735870361328, 44.992706298828125, 46.38805389404297]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 9.0, 13.0, 8.0, 12.0, 26.0, 26.0, 23.0, 41.0, 38.0, 36.0, 44.0, 40.0, 44.0, 49.0, 42.0, 48.0, 48.0, 50.0, 41.0, 44.0, 29.0, 33.0, 27.0, 35.0, 25.0, 18.0, 27.0, 18.0, 12.0, 10.0, 10.0, 9.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.061729431152344, -31.95173454284668, -30.841739654541016, -29.731746673583984, -28.62175178527832, -27.511756896972656, -26.401763916015625, -25.29176902770996, -24.181774139404297, -23.071779251098633, -21.96178436279297, -20.851791381835938, -19.741796493530273, -18.63180160522461, -17.521808624267578, -16.411813735961914, -15.30181884765625, -14.191823959350586, -13.081830024719238, -11.97183609008789, -10.861841201782227, -9.751846313476562, -8.641852378845215, -7.531857967376709, -6.421863555908203, -5.311869144439697, -4.201874732971191, -3.0918803215026855, -1.9818859100341797, -0.8718914985656738, 0.23810291290283203, 1.348097324371338, 2.4580917358398438, 3.5680861473083496, 4.6780805587768555, 5.788074970245361, 6.898069381713867, 8.008064270019531, 9.118058204650879, 10.228052139282227, 11.33804702758789, 12.448041915893555, 13.558035850524902, 14.66802978515625, 15.778024673461914, 16.888019561767578, 17.99801254272461, 19.108007431030273, 20.218002319335938, 21.3279972076416, 22.437992095947266, 23.547985076904297, 24.65797996520996, 25.767974853515625, 26.877967834472656, 27.98796272277832, 29.097957611083984, 30.20795249938965, 31.317947387695312, 32.427940368652344, 33.537933349609375, 34.64793014526367, 35.7579231262207, 36.867919921875, 37.97791290283203]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 17.0, 5.0, 6.0, 14.0, 25.0, 23.0, 43.0, 68.0, 106.0, 149.0, 233.0, 380.0, 654.0, 1084.0, 1793.0, 3522.0, 7646.0, 24925.0, 3926244.0, 196586.0, 17639.0, 6108.0, 2900.0, 1585.0, 948.0, 555.0, 344.0, 229.0, 140.0, 92.0, 64.0, 50.0, 33.0, 25.0, 15.0, 11.0, 7.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.390625, -11.081787109375, -10.77294921875, -10.464111328125, -10.1552734375, -9.846435546875, -9.53759765625, -9.228759765625, -8.919921875, -8.611083984375, -8.30224609375, -7.993408203125, -7.6845703125, -7.375732421875, -7.06689453125, -6.758056640625, -6.44921875, -6.140380859375, -5.83154296875, -5.522705078125, -5.2138671875, -4.905029296875, -4.59619140625, -4.287353515625, -3.978515625, -3.669677734375, -3.36083984375, -3.052001953125, -2.7431640625, -2.434326171875, -2.12548828125, -1.816650390625, -1.5078125, -1.198974609375, -0.89013671875, -0.581298828125, -0.2724609375, 0.036376953125, 0.34521484375, 0.654052734375, 0.962890625, 1.271728515625, 1.58056640625, 1.889404296875, 2.1982421875, 2.507080078125, 2.81591796875, 3.124755859375, 3.43359375, 3.742431640625, 4.05126953125, 4.360107421875, 4.6689453125, 4.977783203125, 5.28662109375, 5.595458984375, 5.904296875, 6.213134765625, 6.52197265625, 6.830810546875, 7.1396484375, 7.448486328125, 7.75732421875, 8.066162109375, 8.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 7.0, 7.0, 9.0, 23.0, 24.0, 24.0, 30.0, 34.0, 52.0, 43.0, 48.0, 48.0, 63.0, 69.0, 71.0, 61.0, 72.0, 59.0, 37.0, 49.0, 34.0, 32.0, 20.0, 12.0, 16.0, 12.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.8614044189453125, -1.800933837890625, -1.7404632568359375, -1.67999267578125, -1.6195220947265625, -1.559051513671875, -1.4985809326171875, -1.4381103515625, -1.3776397705078125, -1.317169189453125, -1.2566986083984375, -1.19622802734375, -1.1357574462890625, -1.075286865234375, -1.0148162841796875, -0.954345703125, -0.8938751220703125, -0.833404541015625, -0.7729339599609375, -0.71246337890625, -0.6519927978515625, -0.591522216796875, -0.5310516357421875, -0.4705810546875, -0.4101104736328125, -0.349639892578125, -0.2891693115234375, -0.22869873046875, -0.1682281494140625, -0.107757568359375, -0.0472869873046875, 0.01318359375, 0.0736541748046875, 0.134124755859375, 0.1945953369140625, 0.25506591796875, 0.3155364990234375, 0.376007080078125, 0.4364776611328125, 0.4969482421875, 0.5574188232421875, 0.617889404296875, 0.6783599853515625, 0.73883056640625, 0.7993011474609375, 0.859771728515625, 0.9202423095703125, 0.980712890625, 1.0411834716796875, 1.101654052734375, 1.1621246337890625, 1.22259521484375, 1.2830657958984375, 1.343536376953125, 1.4040069580078125, 1.4644775390625, 1.5249481201171875, 1.585418701171875, 1.6458892822265625, 1.70635986328125, 1.7668304443359375, 1.827301025390625, 1.8877716064453125, 1.9482421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 10.0, 19.0, 21.0, 36.0, 62.0, 75.0, 115.0, 179.0, 252.0, 374.0, 583.0, 945.0, 1899.0, 4773.0, 27763.0, 4080460.0, 64413.0, 6914.0, 2341.0, 1132.0, 637.0, 390.0, 269.0, 191.0, 126.0, 83.0, 66.0, 48.0, 20.0, 18.0, 9.0, 14.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.278564453125, -12.81494140625, -12.351318359375, -11.8876953125, -11.424072265625, -10.96044921875, -10.496826171875, -10.033203125, -9.569580078125, -9.10595703125, -8.642333984375, -8.1787109375, -7.715087890625, -7.25146484375, -6.787841796875, -6.32421875, -5.860595703125, -5.39697265625, -4.933349609375, -4.4697265625, -4.006103515625, -3.54248046875, -3.078857421875, -2.615234375, -2.151611328125, -1.68798828125, -1.224365234375, -0.7607421875, -0.297119140625, 0.16650390625, 0.630126953125, 1.09375, 1.557373046875, 2.02099609375, 2.484619140625, 2.9482421875, 3.411865234375, 3.87548828125, 4.339111328125, 4.802734375, 5.266357421875, 5.72998046875, 6.193603515625, 6.6572265625, 7.120849609375, 7.58447265625, 8.048095703125, 8.51171875, 8.975341796875, 9.43896484375, 9.902587890625, 10.3662109375, 10.829833984375, 11.29345703125, 11.757080078125, 12.220703125, 12.684326171875, 13.14794921875, 13.611572265625, 14.0751953125, 14.538818359375, 15.00244140625, 15.466064453125, 15.9296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 17.0, 20.0, 47.0, 156.0, 3519.0, 210.0, 47.0, 25.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.133392333984375, -2.04998779296875, -1.966583251953125, -1.8831787109375, -1.799774169921875, -1.71636962890625, -1.632965087890625, -1.549560546875, -1.466156005859375, -1.38275146484375, -1.299346923828125, -1.2159423828125, -1.132537841796875, -1.04913330078125, -0.965728759765625, -0.88232421875, -0.798919677734375, -0.71551513671875, -0.632110595703125, -0.5487060546875, -0.465301513671875, -0.38189697265625, -0.298492431640625, -0.215087890625, -0.131683349609375, -0.04827880859375, 0.035125732421875, 0.1185302734375, 0.201934814453125, 0.28533935546875, 0.368743896484375, 0.4521484375, 0.535552978515625, 0.61895751953125, 0.702362060546875, 0.7857666015625, 0.869171142578125, 0.95257568359375, 1.035980224609375, 1.119384765625, 1.202789306640625, 1.28619384765625, 1.369598388671875, 1.4530029296875, 1.536407470703125, 1.61981201171875, 1.703216552734375, 1.78662109375, 1.870025634765625, 1.95343017578125, 2.036834716796875, 2.1202392578125, 2.203643798828125, 2.28704833984375, 2.370452880859375, 2.453857421875, 2.537261962890625, 2.62066650390625, 2.704071044921875, 2.7874755859375, 2.870880126953125, 2.95428466796875, 3.037689208984375, 3.12109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 11.0, 10.0, 25.0, 26.0, 35.0, 41.0, 68.0, 84.0, 105.0, 115.0, 88.0, 99.0, 75.0, 70.0, 50.0, 28.0, 17.0, 22.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.274593353271484, -8.061896324157715, -7.849198341369629, -7.636501312255859, -7.423803806304932, -7.211106300354004, -6.998409271240234, -6.785711765289307, -6.573014259338379, -6.360316753387451, -6.147619247436523, -5.934922218322754, -5.722224712371826, -5.509527206420898, -5.296830177307129, -5.084132671356201, -4.871435165405273, -4.658737659454346, -4.446040153503418, -4.233343124389648, -4.020645618438721, -3.807948112487793, -3.5952508449554443, -3.3825535774230957, -3.169856071472168, -2.9571585655212402, -2.7444612979888916, -2.531764030456543, -2.3190665245056152, -2.1063690185546875, -1.8936717510223389, -1.6809743642807007, -1.4682765007019043, -1.2555791139602661, -1.042881727218628, -0.8301843404769897, -0.6174869537353516, -0.4047895669937134, -0.1920921802520752, 0.02060520648956299, 0.23330259323120117, 0.44599997997283936, 0.6586973667144775, 0.8713947534561157, 1.084092140197754, 1.296789526939392, 1.5094869136810303, 1.7221843004226685, 1.9348816871643066, 2.1475791931152344, 2.360276460647583, 2.5729737281799316, 2.7856712341308594, 2.998368740081787, 3.2110660076141357, 3.4237632751464844, 3.636460781097412, 3.84915828704834, 4.061855316162109, 4.274552822113037, 4.487250328063965, 4.699947834014893, 4.91264533996582, 5.12534236907959, 5.338039875030518]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 16.0, 10.0, 11.0, 20.0, 22.0, 28.0, 29.0, 22.0, 25.0, 33.0, 38.0, 27.0, 45.0, 41.0, 47.0, 41.0, 48.0, 37.0, 38.0, 44.0, 45.0, 26.0, 34.0, 41.0, 23.0, 32.0, 20.0, 27.0, 17.0, 14.0, 13.0, 17.0, 9.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.4689292907714844, -3.3560986518859863, -3.2432680130004883, -3.130437135696411, -3.017606496810913, -2.904775857925415, -2.791944980621338, -2.67911434173584, -2.566283702850342, -2.4534530639648438, -2.3406224250793457, -2.2277915477752686, -2.1149609088897705, -2.0021302700042725, -1.8892995119094849, -1.7764687538146973, -1.6636381149291992, -1.5508074760437012, -1.4379767179489136, -1.325145959854126, -1.212315320968628, -1.0994846820831299, -0.9866539239883423, -0.8738232254981995, -0.7609925270080566, -0.6481618285179138, -0.535331130027771, -0.4225004315376282, -0.30966973304748535, -0.19683903455734253, -0.08400833606719971, 0.028822362422943115, 0.14165306091308594, 0.25448375940322876, 0.3673144578933716, 0.4801451563835144, 0.5929758548736572, 0.7058065533638, 0.8186372518539429, 0.9314679503440857, 1.0442986488342285, 1.1571292877197266, 1.2699600458145142, 1.3827908039093018, 1.4956214427947998, 1.6084520816802979, 1.7212828397750854, 1.834113597869873, 1.946944236755371, 2.059774875640869, 2.172605514526367, 2.2854363918304443, 2.3982670307159424, 2.5110976696014404, 2.6239285469055176, 2.7367591857910156, 2.8495898246765137, 2.9624204635620117, 3.0752511024475098, 3.188081979751587, 3.300912618637085, 3.413743257522583, 3.52657413482666, 3.639404773712158, 3.7522354125976562]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 11.0, 9.0, 10.0, 24.0, 42.0, 67.0, 120.0, 211.0, 421.0, 797.0, 1930.0, 4705.0, 13189.0, 39208.0, 128568.0, 376640.0, 327687.0, 104684.0, 32302.0, 10640.0, 4085.0, 1642.0, 757.0, 362.0, 185.0, 100.0, 48.0, 35.0, 22.0, 14.0, 15.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.80859375, -6.6241455078125, -6.439697265625, -6.2552490234375, -6.07080078125, -5.8863525390625, -5.701904296875, -5.5174560546875, -5.3330078125, -5.1485595703125, -4.964111328125, -4.7796630859375, -4.59521484375, -4.4107666015625, -4.226318359375, -4.0418701171875, -3.857421875, -3.6729736328125, -3.488525390625, -3.3040771484375, -3.11962890625, -2.9351806640625, -2.750732421875, -2.5662841796875, -2.3818359375, -2.1973876953125, -2.012939453125, -1.8284912109375, -1.64404296875, -1.4595947265625, -1.275146484375, -1.0906982421875, -0.90625, -0.7218017578125, -0.537353515625, -0.3529052734375, -0.16845703125, 0.0159912109375, 0.200439453125, 0.3848876953125, 0.5693359375, 0.7537841796875, 0.938232421875, 1.1226806640625, 1.30712890625, 1.4915771484375, 1.676025390625, 1.8604736328125, 2.044921875, 2.2293701171875, 2.413818359375, 2.5982666015625, 2.78271484375, 2.9671630859375, 3.151611328125, 3.3360595703125, 3.5205078125, 3.7049560546875, 3.889404296875, 4.0738525390625, 4.25830078125, 4.4427490234375, 4.627197265625, 4.8116455078125, 4.99609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 7.0, 9.0, 12.0, 18.0, 19.0, 19.0, 29.0, 22.0, 32.0, 29.0, 49.0, 50.0, 43.0, 48.0, 55.0, 67.0, 51.0, 54.0, 55.0, 56.0, 50.0, 49.0, 45.0, 27.0, 29.0, 10.0, 19.0, 8.0, 5.0, 11.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.892547607421875, -1.83099365234375, -1.769439697265625, -1.7078857421875, -1.646331787109375, -1.58477783203125, -1.523223876953125, -1.461669921875, -1.400115966796875, -1.33856201171875, -1.277008056640625, -1.2154541015625, -1.153900146484375, -1.09234619140625, -1.030792236328125, -0.96923828125, -0.907684326171875, -0.84613037109375, -0.784576416015625, -0.7230224609375, -0.661468505859375, -0.59991455078125, -0.538360595703125, -0.476806640625, -0.415252685546875, -0.35369873046875, -0.292144775390625, -0.2305908203125, -0.169036865234375, -0.10748291015625, -0.045928955078125, 0.015625, 0.077178955078125, 0.13873291015625, 0.200286865234375, 0.2618408203125, 0.323394775390625, 0.38494873046875, 0.446502685546875, 0.508056640625, 0.569610595703125, 0.63116455078125, 0.692718505859375, 0.7542724609375, 0.815826416015625, 0.87738037109375, 0.938934326171875, 1.00048828125, 1.062042236328125, 1.12359619140625, 1.185150146484375, 1.2467041015625, 1.308258056640625, 1.36981201171875, 1.431365966796875, 1.492919921875, 1.554473876953125, 1.61602783203125, 1.677581787109375, 1.7391357421875, 1.800689697265625, 1.86224365234375, 1.923797607421875, 1.9853515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 9.0, 13.0, 22.0, 36.0, 51.0, 73.0, 121.0, 171.0, 249.0, 422.0, 779.0, 1379.0, 3271.0, 10537.0, 47454.0, 328767.0, 548957.0, 81912.0, 15853.0, 4462.0, 1735.0, 914.0, 497.0, 291.0, 181.0, 126.0, 92.0, 48.0, 27.0, 23.0, 12.0, 13.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.62249755859375, -7.3778076171875, -7.13311767578125, -6.888427734375, -6.64373779296875, -6.3990478515625, -6.15435791015625, -5.90966796875, -5.66497802734375, -5.4202880859375, -5.17559814453125, -4.930908203125, -4.68621826171875, -4.4415283203125, -4.19683837890625, -3.9521484375, -3.70745849609375, -3.4627685546875, -3.21807861328125, -2.973388671875, -2.72869873046875, -2.4840087890625, -2.23931884765625, -1.99462890625, -1.74993896484375, -1.5052490234375, -1.26055908203125, -1.015869140625, -0.77117919921875, -0.5264892578125, -0.28179931640625, -0.037109375, 0.20758056640625, 0.4522705078125, 0.69696044921875, 0.941650390625, 1.18634033203125, 1.4310302734375, 1.67572021484375, 1.92041015625, 2.16510009765625, 2.4097900390625, 2.65447998046875, 2.899169921875, 3.14385986328125, 3.3885498046875, 3.63323974609375, 3.8779296875, 4.12261962890625, 4.3673095703125, 4.61199951171875, 4.856689453125, 5.10137939453125, 5.3460693359375, 5.59075927734375, 5.83544921875, 6.08013916015625, 6.3248291015625, 6.56951904296875, 6.814208984375, 7.05889892578125, 7.3035888671875, 7.54827880859375, 7.79296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 9.0, 13.0, 18.0, 20.0, 16.0, 32.0, 24.0, 26.0, 24.0, 22.0, 34.0, 29.0, 40.0, 37.0, 47.0, 48.0, 31.0, 52.0, 36.0, 41.0, 41.0, 33.0, 46.0, 33.0, 23.0, 28.0, 21.0, 32.0, 21.0, 17.0, 12.0, 9.0, 8.0, 16.0, 6.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.31640625, -7.08319091796875, -6.8499755859375, -6.61676025390625, -6.383544921875, -6.15032958984375, -5.9171142578125, -5.68389892578125, -5.45068359375, -5.21746826171875, -4.9842529296875, -4.75103759765625, -4.517822265625, -4.28460693359375, -4.0513916015625, -3.81817626953125, -3.5849609375, -3.35174560546875, -3.1185302734375, -2.88531494140625, -2.652099609375, -2.41888427734375, -2.1856689453125, -1.95245361328125, -1.71923828125, -1.48602294921875, -1.2528076171875, -1.01959228515625, -0.786376953125, -0.55316162109375, -0.3199462890625, -0.08673095703125, 0.146484375, 0.37969970703125, 0.6129150390625, 0.84613037109375, 1.079345703125, 1.31256103515625, 1.5457763671875, 1.77899169921875, 2.01220703125, 2.24542236328125, 2.4786376953125, 2.71185302734375, 2.945068359375, 3.17828369140625, 3.4114990234375, 3.64471435546875, 3.8779296875, 4.11114501953125, 4.3443603515625, 4.57757568359375, 4.810791015625, 5.04400634765625, 5.2772216796875, 5.51043701171875, 5.74365234375, 5.97686767578125, 6.2100830078125, 6.44329833984375, 6.676513671875, 6.90972900390625, 7.1429443359375, 7.37615966796875, 7.609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 13.0, 21.0, 29.0, 44.0, 74.0, 134.0, 273.0, 500.0, 1060.0, 2578.0, 7634.0, 28102.0, 147204.0, 604107.0, 205183.0, 36458.0, 9393.0, 3234.0, 1274.0, 559.0, 304.0, 151.0, 84.0, 46.0, 30.0, 15.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.677734375, -3.56488037109375, -3.4520263671875, -3.33917236328125, -3.226318359375, -3.11346435546875, -3.0006103515625, -2.88775634765625, -2.77490234375, -2.66204833984375, -2.5491943359375, -2.43634033203125, -2.323486328125, -2.21063232421875, -2.0977783203125, -1.98492431640625, -1.8720703125, -1.75921630859375, -1.6463623046875, -1.53350830078125, -1.420654296875, -1.30780029296875, -1.1949462890625, -1.08209228515625, -0.96923828125, -0.85638427734375, -0.7435302734375, -0.63067626953125, -0.517822265625, -0.40496826171875, -0.2921142578125, -0.17926025390625, -0.06640625, 0.04644775390625, 0.1593017578125, 0.27215576171875, 0.385009765625, 0.49786376953125, 0.6107177734375, 0.72357177734375, 0.83642578125, 0.94927978515625, 1.0621337890625, 1.17498779296875, 1.287841796875, 1.40069580078125, 1.5135498046875, 1.62640380859375, 1.7392578125, 1.85211181640625, 1.9649658203125, 2.07781982421875, 2.190673828125, 2.30352783203125, 2.4163818359375, 2.52923583984375, 2.64208984375, 2.75494384765625, 2.8677978515625, 2.98065185546875, 3.093505859375, 3.20635986328125, 3.3192138671875, 3.43206787109375, 3.544921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 8.0, 9.0, 9.0, 12.0, 22.0, 23.0, 32.0, 45.0, 60.0, 76.0, 110.0, 113.0, 102.0, 84.0, 72.0, 49.0, 43.0, 30.0, 26.0, 23.0, 12.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00079345703125, -0.0007698088884353638, -0.0007461607456207275, -0.0007225126028060913, -0.0006988644599914551, -0.0006752163171768188, -0.0006515681743621826, -0.0006279200315475464, -0.0006042718887329102, -0.0005806237459182739, -0.0005569756031036377, -0.0005333274602890015, -0.0005096793174743652, -0.000486031174659729, -0.0004623830318450928, -0.00043873488903045654, -0.0004150867462158203, -0.0003914386034011841, -0.00036779046058654785, -0.0003441423177719116, -0.0003204941749572754, -0.00029684603214263916, -0.00027319788932800293, -0.0002495497465133667, -0.00022590160369873047, -0.00020225346088409424, -0.000178605318069458, -0.00015495717525482178, -0.00013130903244018555, -0.00010766088962554932, -8.401274681091309e-05, -6.0364603996276855e-05, -3.6716461181640625e-05, -1.3068318367004395e-05, 1.0579824447631836e-05, 3.4227967262268066e-05, 5.78761100769043e-05, 8.152425289154053e-05, 0.00010517239570617676, 0.000128820538520813, 0.00015246868133544922, 0.00017611682415008545, 0.00019976496696472168, 0.0002234131097793579, 0.00024706125259399414, 0.00027070939540863037, 0.0002943575382232666, 0.00031800568103790283, 0.00034165382385253906, 0.0003653019666671753, 0.0003889501094818115, 0.00041259825229644775, 0.000436246395111084, 0.0004598945379257202, 0.00048354268074035645, 0.0005071908235549927, 0.0005308389663696289, 0.0005544871091842651, 0.0005781352519989014, 0.0006017833948135376, 0.0006254315376281738, 0.0006490796804428101, 0.0006727278232574463, 0.0006963759660720825, 0.0007200241088867188]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 21.0, 34.0, 53.0, 79.0, 139.0, 282.0, 557.0, 1410.0, 4586.0, 21904.0, 240558.0, 691339.0, 73082.0, 10099.0, 2618.0, 921.0, 390.0, 180.0, 113.0, 53.0, 41.0, 18.0, 22.0, 10.0, 7.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9921875, -5.8314208984375, -5.670654296875, -5.5098876953125, -5.34912109375, -5.1883544921875, -5.027587890625, -4.8668212890625, -4.7060546875, -4.5452880859375, -4.384521484375, -4.2237548828125, -4.06298828125, -3.9022216796875, -3.741455078125, -3.5806884765625, -3.419921875, -3.2591552734375, -3.098388671875, -2.9376220703125, -2.77685546875, -2.6160888671875, -2.455322265625, -2.2945556640625, -2.1337890625, -1.9730224609375, -1.812255859375, -1.6514892578125, -1.49072265625, -1.3299560546875, -1.169189453125, -1.0084228515625, -0.84765625, -0.6868896484375, -0.526123046875, -0.3653564453125, -0.20458984375, -0.0438232421875, 0.116943359375, 0.2777099609375, 0.4384765625, 0.5992431640625, 0.760009765625, 0.9207763671875, 1.08154296875, 1.2423095703125, 1.403076171875, 1.5638427734375, 1.724609375, 1.8853759765625, 2.046142578125, 2.2069091796875, 2.36767578125, 2.5284423828125, 2.689208984375, 2.8499755859375, 3.0107421875, 3.1715087890625, 3.332275390625, 3.4930419921875, 3.65380859375, 3.8145751953125, 3.975341796875, 4.1361083984375, 4.296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 10.0, 6.0, 6.0, 13.0, 15.0, 14.0, 26.0, 20.0, 46.0, 39.0, 56.0, 56.0, 73.0, 66.0, 61.0, 75.0, 65.0, 56.0, 57.0, 36.0, 37.0, 37.0, 32.0, 18.0, 16.0, 14.0, 10.0, 6.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98095703125, -1.9013671875, -1.82177734375, -1.7421875, -1.66259765625, -1.5830078125, -1.50341796875, -1.423828125, -1.34423828125, -1.2646484375, -1.18505859375, -1.10546875, -1.02587890625, -0.9462890625, -0.86669921875, -0.787109375, -0.70751953125, -0.6279296875, -0.54833984375, -0.46875, -0.38916015625, -0.3095703125, -0.22998046875, -0.150390625, -0.07080078125, 0.0087890625, 0.08837890625, 0.16796875, 0.24755859375, 0.3271484375, 0.40673828125, 0.486328125, 0.56591796875, 0.6455078125, 0.72509765625, 0.8046875, 0.88427734375, 0.9638671875, 1.04345703125, 1.123046875, 1.20263671875, 1.2822265625, 1.36181640625, 1.44140625, 1.52099609375, 1.6005859375, 1.68017578125, 1.759765625, 1.83935546875, 1.9189453125, 1.99853515625, 2.078125, 2.15771484375, 2.2373046875, 2.31689453125, 2.396484375, 2.47607421875, 2.5556640625, 2.63525390625, 2.71484375, 2.79443359375, 2.8740234375, 2.95361328125, 3.033203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 17.0, 25.0, 42.0, 78.0, 94.0, 124.0, 147.0, 120.0, 113.0, 71.0, 66.0, 31.0, 25.0, 9.0, 9.0, 6.0, 2.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.62795639038086, -59.896305084228516, -58.16465377807617, -56.43300247192383, -54.70135498046875, -52.969703674316406, -51.23805236816406, -49.50640106201172, -47.774749755859375, -46.04309844970703, -44.31144714355469, -42.579795837402344, -40.84814453125, -39.116493225097656, -37.38484573364258, -35.653194427490234, -33.92154312133789, -32.18989181518555, -30.458240509033203, -28.726591110229492, -26.99493980407715, -25.263288497924805, -23.531639099121094, -21.79998779296875, -20.068336486816406, -18.336685180664062, -16.60503387451172, -14.873384475708008, -13.141733169555664, -11.41008186340332, -9.678431510925293, -7.946781158447266, -6.2151336669921875, -4.483482837677002, -2.7518320083618164, -1.0201811790466309, 0.7114696502685547, 2.4431209564208984, 4.174771308898926, 5.906421661376953, 7.638072967529297, 9.36972427368164, 11.101374626159668, 12.833024978637695, 14.564676284790039, 16.296327590942383, 18.027976989746094, 19.759628295898438, 21.49127960205078, 23.222930908203125, 24.95458221435547, 26.68623161315918, 28.417882919311523, 30.149534225463867, 31.881183624267578, 33.61283493041992, 35.344486236572266, 37.07613754272461, 38.80778884887695, 40.5394401550293, 42.271087646484375, 44.00273895263672, 45.73439025878906, 47.466041564941406, 49.19769287109375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 9.0, 13.0, 27.0, 18.0, 27.0, 17.0, 41.0, 47.0, 33.0, 31.0, 42.0, 50.0, 56.0, 55.0, 59.0, 49.0, 62.0, 46.0, 31.0, 28.0, 30.0, 27.0, 29.0, 28.0, 17.0, 21.0, 17.0, 11.0, 7.0, 7.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.503570556640625, -43.09716033935547, -41.69075393676758, -40.28434371948242, -38.87793731689453, -37.471527099609375, -36.06511688232422, -34.65871047973633, -33.25230026245117, -31.84589195251465, -30.439483642578125, -29.03307342529297, -27.626665115356445, -26.220256805419922, -24.8138484954834, -23.407440185546875, -22.00103187561035, -20.594623565673828, -19.188215255737305, -17.78180694580078, -16.375396728515625, -14.968988418579102, -13.562580108642578, -12.156170845031738, -10.749762535095215, -9.343354225158691, -7.936944961547852, -6.530536651611328, -5.1241278648376465, -3.717719078063965, -2.3113107681274414, -0.9049015045166016, 0.5015068054199219, 1.907915472984314, 3.314324140548706, 4.720732688903809, 6.12714147567749, 7.533550262451172, 8.939958572387695, 10.346367835998535, 11.752776145935059, 13.159184455871582, 14.565593719482422, 15.972002029418945, 17.37841033935547, 18.784820556640625, 20.191226959228516, 21.597637176513672, 23.004045486450195, 24.41045379638672, 25.816862106323242, 27.223270416259766, 28.629680633544922, 30.036088943481445, 31.44249725341797, 32.848907470703125, 34.255313873291016, 35.66172409057617, 37.06813049316406, 38.47454071044922, 39.88094711303711, 41.287357330322266, 42.693763732910156, 44.10017395019531, 45.50658416748047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 14.0, 21.0, 41.0, 56.0, 100.0, 178.0, 321.0, 716.0, 1782.0, 6294.0, 55760.0, 4103617.0, 19271.0, 3727.0, 1254.0, 526.0, 265.0, 150.0, 72.0, 39.0, 28.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.14111328125, -14.6416015625, -14.14208984375, -13.642578125, -13.14306640625, -12.6435546875, -12.14404296875, -11.64453125, -11.14501953125, -10.6455078125, -10.14599609375, -9.646484375, -9.14697265625, -8.6474609375, -8.14794921875, -7.6484375, -7.14892578125, -6.6494140625, -6.14990234375, -5.650390625, -5.15087890625, -4.6513671875, -4.15185546875, -3.65234375, -3.15283203125, -2.6533203125, -2.15380859375, -1.654296875, -1.15478515625, -0.6552734375, -0.15576171875, 0.34375, 0.84326171875, 1.3427734375, 1.84228515625, 2.341796875, 2.84130859375, 3.3408203125, 3.84033203125, 4.33984375, 4.83935546875, 5.3388671875, 5.83837890625, 6.337890625, 6.83740234375, 7.3369140625, 7.83642578125, 8.3359375, 8.83544921875, 9.3349609375, 9.83447265625, 10.333984375, 10.83349609375, 11.3330078125, 11.83251953125, 12.33203125, 12.83154296875, 13.3310546875, 13.83056640625, 14.330078125, 14.82958984375, 15.3291015625, 15.82861328125, 16.328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 8.0, 21.0, 13.0, 26.0, 32.0, 42.0, 47.0, 53.0, 26.0, 46.0, 55.0, 64.0, 61.0, 51.0, 43.0, 50.0, 50.0, 44.0, 50.0, 29.0, 27.0, 26.0, 34.0, 15.0, 19.0, 11.0, 11.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.880859375, -1.82232666015625, -1.7637939453125, -1.70526123046875, -1.646728515625, -1.58819580078125, -1.5296630859375, -1.47113037109375, -1.41259765625, -1.35406494140625, -1.2955322265625, -1.23699951171875, -1.178466796875, -1.11993408203125, -1.0614013671875, -1.00286865234375, -0.9443359375, -0.88580322265625, -0.8272705078125, -0.76873779296875, -0.710205078125, -0.65167236328125, -0.5931396484375, -0.53460693359375, -0.47607421875, -0.41754150390625, -0.3590087890625, -0.30047607421875, -0.241943359375, -0.18341064453125, -0.1248779296875, -0.06634521484375, -0.0078125, 0.05072021484375, 0.1092529296875, 0.16778564453125, 0.226318359375, 0.28485107421875, 0.3433837890625, 0.40191650390625, 0.46044921875, 0.51898193359375, 0.5775146484375, 0.63604736328125, 0.694580078125, 0.75311279296875, 0.8116455078125, 0.87017822265625, 0.9287109375, 0.98724365234375, 1.0457763671875, 1.10430908203125, 1.162841796875, 1.22137451171875, 1.2799072265625, 1.33843994140625, 1.39697265625, 1.45550537109375, 1.5140380859375, 1.57257080078125, 1.631103515625, 1.68963623046875, 1.7481689453125, 1.80670166015625, 1.865234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 10.0, 20.0, 26.0, 26.0, 44.0, 59.0, 72.0, 103.0, 122.0, 183.0, 252.0, 371.0, 577.0, 1022.0, 1742.0, 3686.0, 8743.0, 27661.0, 260649.0, 3819073.0, 46848.0, 12580.0, 4768.0, 2200.0, 1217.0, 690.0, 429.0, 314.0, 218.0, 143.0, 106.0, 72.0, 55.0, 39.0, 37.0, 19.0, 24.0, 15.0, 11.0, 6.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.26171875, -6.04705810546875, -5.8323974609375, -5.61773681640625, -5.403076171875, -5.18841552734375, -4.9737548828125, -4.75909423828125, -4.54443359375, -4.32977294921875, -4.1151123046875, -3.90045166015625, -3.685791015625, -3.47113037109375, -3.2564697265625, -3.04180908203125, -2.8271484375, -2.61248779296875, -2.3978271484375, -2.18316650390625, -1.968505859375, -1.75384521484375, -1.5391845703125, -1.32452392578125, -1.10986328125, -0.89520263671875, -0.6805419921875, -0.46588134765625, -0.251220703125, -0.03656005859375, 0.1781005859375, 0.39276123046875, 0.607421875, 0.82208251953125, 1.0367431640625, 1.25140380859375, 1.466064453125, 1.68072509765625, 1.8953857421875, 2.11004638671875, 2.32470703125, 2.53936767578125, 2.7540283203125, 2.96868896484375, 3.183349609375, 3.39801025390625, 3.6126708984375, 3.82733154296875, 4.0419921875, 4.25665283203125, 4.4713134765625, 4.68597412109375, 4.900634765625, 5.11529541015625, 5.3299560546875, 5.54461669921875, 5.75927734375, 5.97393798828125, 6.1885986328125, 6.40325927734375, 6.617919921875, 6.83258056640625, 7.0472412109375, 7.26190185546875, 7.4765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 34.0, 99.0, 364.0, 3151.0, 173.0, 60.0, 32.0, 23.0, 10.0, 10.0, 10.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.248504638671875, -1.19232177734375, -1.136138916015625, -1.0799560546875, -1.023773193359375, -0.96759033203125, -0.911407470703125, -0.855224609375, -0.799041748046875, -0.74285888671875, -0.686676025390625, -0.6304931640625, -0.574310302734375, -0.51812744140625, -0.461944580078125, -0.40576171875, -0.349578857421875, -0.29339599609375, -0.237213134765625, -0.1810302734375, -0.124847412109375, -0.06866455078125, -0.012481689453125, 0.043701171875, 0.099884033203125, 0.15606689453125, 0.212249755859375, 0.2684326171875, 0.324615478515625, 0.38079833984375, 0.436981201171875, 0.4931640625, 0.549346923828125, 0.60552978515625, 0.661712646484375, 0.7178955078125, 0.774078369140625, 0.83026123046875, 0.886444091796875, 0.942626953125, 0.998809814453125, 1.05499267578125, 1.111175537109375, 1.1673583984375, 1.223541259765625, 1.27972412109375, 1.335906982421875, 1.39208984375, 1.448272705078125, 1.50445556640625, 1.560638427734375, 1.6168212890625, 1.673004150390625, 1.72918701171875, 1.785369873046875, 1.841552734375, 1.897735595703125, 1.95391845703125, 2.010101318359375, 2.0662841796875, 2.122467041015625, 2.17864990234375, 2.234832763671875, 2.291015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 24.0, 18.0, 35.0, 62.0, 88.0, 94.0, 125.0, 121.0, 112.0, 102.0, 67.0, 53.0, 23.0, 17.0, 15.0, 18.0, 10.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.574706077575684, -8.327876091003418, -8.081045150756836, -7.83421516418457, -7.587385177612305, -7.340554714202881, -7.093724250793457, -6.846894264221191, -6.600064277648926, -6.353233814239502, -6.106403827667236, -5.8595733642578125, -5.612743377685547, -5.365912914276123, -5.119082450866699, -4.872252464294434, -4.62542200088501, -4.378591537475586, -4.13176155090332, -3.8849310874938965, -3.638101100921631, -3.391270637512207, -3.1444404125213623, -2.8976101875305176, -2.650779962539673, -2.403949737548828, -2.1571195125579834, -1.9102891683578491, -1.6634589433670044, -1.4166287183761597, -1.1697983741760254, -0.9229681491851807, -0.6761379241943359, -0.4293076694011688, -0.1824774146080017, 0.06435286998748779, 0.3111830949783325, 0.5580133199691772, 0.8048436641693115, 1.0516738891601562, 1.298504114151001, 1.5453343391418457, 1.7921645641326904, 2.038994789123535, 2.285825252532959, 2.5326552391052246, 2.7794857025146484, 3.026315927505493, 3.273146152496338, 3.5199763774871826, 3.7668066024780273, 4.013637065887451, 4.260467052459717, 4.507297515869141, 4.754127502441406, 5.00095796585083, 5.247788429260254, 5.494618892669678, 5.741448879241943, 5.988279342651367, 6.235109329223633, 6.481939792633057, 6.7287702560424805, 6.975600242614746, 7.222430229187012]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 15.0, 15.0, 16.0, 24.0, 17.0, 27.0, 35.0, 35.0, 45.0, 28.0, 37.0, 49.0, 48.0, 42.0, 42.0, 41.0, 41.0, 46.0, 41.0, 38.0, 41.0, 21.0, 34.0, 39.0, 34.0, 25.0, 22.0, 17.0, 13.0, 6.0, 7.0, 12.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.112955093383789, -3.997013568878174, -3.8810720443725586, -3.7651305198669434, -3.6491892337799072, -3.533247709274292, -3.4173061847686768, -3.3013646602630615, -3.1854231357574463, -3.069481611251831, -2.953540086746216, -2.8375988006591797, -2.7216572761535645, -2.605715751647949, -2.489774227142334, -2.3738327026367188, -2.2578911781311035, -2.1419496536254883, -2.026008129119873, -1.9100667238235474, -1.7941251993179321, -1.6781837940216064, -1.5622422695159912, -1.446300745010376, -1.3303594589233398, -1.2144179344177246, -1.098476529121399, -0.9825350046157837, -0.8665934801101685, -0.750652015209198, -0.6347105503082275, -0.5187690258026123, -0.40282750129699707, -0.2868860065937042, -0.17094452679157257, -0.05500304698944092, 0.06093844771385193, 0.17687994241714478, 0.29282140731811523, 0.40876293182373047, 0.5247043967247009, 0.6406458616256714, 0.7565873861312866, 0.8725288510322571, 0.9884703159332275, 1.1044118404388428, 1.220353364944458, 1.3362948894500732, 1.452236294746399, 1.5681778192520142, 1.6841192245483398, 1.800060749053955, 1.9160022735595703, 2.0319437980651855, 2.147885322570801, 2.263826847076416, 2.379768133163452, 2.4957096576690674, 2.6116511821746826, 2.7275924682617188, 2.843533992767334, 2.959475517272949, 3.0754170417785645, 3.1913585662841797, 3.307300090789795]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 42.0, 74.0, 119.0, 202.0, 324.0, 641.0, 1262.0, 2333.0, 4979.0, 11450.0, 29618.0, 85347.0, 245795.0, 376364.0, 186541.0, 63356.0, 22754.0, 9091.0, 4023.0, 1928.0, 962.0, 540.0, 309.0, 157.0, 88.0, 61.0, 42.0, 19.0, 21.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.1640625, -4.03924560546875, -3.9144287109375, -3.78961181640625, -3.664794921875, -3.53997802734375, -3.4151611328125, -3.29034423828125, -3.16552734375, -3.04071044921875, -2.9158935546875, -2.79107666015625, -2.666259765625, -2.54144287109375, -2.4166259765625, -2.29180908203125, -2.1669921875, -2.04217529296875, -1.9173583984375, -1.79254150390625, -1.667724609375, -1.54290771484375, -1.4180908203125, -1.29327392578125, -1.16845703125, -1.04364013671875, -0.9188232421875, -0.79400634765625, -0.669189453125, -0.54437255859375, -0.4195556640625, -0.29473876953125, -0.169921875, -0.04510498046875, 0.0797119140625, 0.20452880859375, 0.329345703125, 0.45416259765625, 0.5789794921875, 0.70379638671875, 0.82861328125, 0.95343017578125, 1.0782470703125, 1.20306396484375, 1.327880859375, 1.45269775390625, 1.5775146484375, 1.70233154296875, 1.8271484375, 1.95196533203125, 2.0767822265625, 2.20159912109375, 2.326416015625, 2.45123291015625, 2.5760498046875, 2.70086669921875, 2.82568359375, 2.95050048828125, 3.0753173828125, 3.20013427734375, 3.324951171875, 3.44976806640625, 3.5745849609375, 3.69940185546875, 3.82421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 13.0, 15.0, 20.0, 21.0, 22.0, 33.0, 39.0, 30.0, 51.0, 45.0, 41.0, 51.0, 49.0, 59.0, 47.0, 66.0, 58.0, 48.0, 49.0, 36.0, 39.0, 25.0, 35.0, 24.0, 18.0, 16.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.7986907958984375, -1.737030029296875, -1.6753692626953125, -1.61370849609375, -1.5520477294921875, -1.490386962890625, -1.4287261962890625, -1.3670654296875, -1.3054046630859375, -1.243743896484375, -1.1820831298828125, -1.12042236328125, -1.0587615966796875, -0.997100830078125, -0.9354400634765625, -0.873779296875, -0.8121185302734375, -0.750457763671875, -0.6887969970703125, -0.62713623046875, -0.5654754638671875, -0.503814697265625, -0.4421539306640625, -0.3804931640625, -0.3188323974609375, -0.257171630859375, -0.1955108642578125, -0.13385009765625, -0.0721893310546875, -0.010528564453125, 0.0511322021484375, 0.11279296875, 0.1744537353515625, 0.236114501953125, 0.2977752685546875, 0.35943603515625, 0.4210968017578125, 0.482757568359375, 0.5444183349609375, 0.6060791015625, 0.6677398681640625, 0.729400634765625, 0.7910614013671875, 0.85272216796875, 0.9143829345703125, 0.976043701171875, 1.0377044677734375, 1.099365234375, 1.1610260009765625, 1.222686767578125, 1.2843475341796875, 1.34600830078125, 1.4076690673828125, 1.469329833984375, 1.5309906005859375, 1.5926513671875, 1.6543121337890625, 1.715972900390625, 1.7776336669921875, 1.83929443359375, 1.9009552001953125, 1.962615966796875, 2.0242767333984375, 2.0859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 10.0, 12.0, 15.0, 26.0, 25.0, 35.0, 53.0, 83.0, 125.0, 209.0, 316.0, 500.0, 923.0, 2045.0, 5785.0, 27246.0, 292348.0, 642134.0, 60904.0, 9901.0, 2939.0, 1311.0, 578.0, 392.0, 225.0, 122.0, 95.0, 45.0, 51.0, 25.0, 15.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.796875, -7.56884765625, -7.3408203125, -7.11279296875, -6.884765625, -6.65673828125, -6.4287109375, -6.20068359375, -5.97265625, -5.74462890625, -5.5166015625, -5.28857421875, -5.060546875, -4.83251953125, -4.6044921875, -4.37646484375, -4.1484375, -3.92041015625, -3.6923828125, -3.46435546875, -3.236328125, -3.00830078125, -2.7802734375, -2.55224609375, -2.32421875, -2.09619140625, -1.8681640625, -1.64013671875, -1.412109375, -1.18408203125, -0.9560546875, -0.72802734375, -0.5, -0.27197265625, -0.0439453125, 0.18408203125, 0.412109375, 0.64013671875, 0.8681640625, 1.09619140625, 1.32421875, 1.55224609375, 1.7802734375, 2.00830078125, 2.236328125, 2.46435546875, 2.6923828125, 2.92041015625, 3.1484375, 3.37646484375, 3.6044921875, 3.83251953125, 4.060546875, 4.28857421875, 4.5166015625, 4.74462890625, 4.97265625, 5.20068359375, 5.4287109375, 5.65673828125, 5.884765625, 6.11279296875, 6.3408203125, 6.56884765625, 6.796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 8.0, 14.0, 14.0, 12.0, 12.0, 12.0, 27.0, 22.0, 29.0, 25.0, 29.0, 39.0, 44.0, 46.0, 39.0, 47.0, 56.0, 42.0, 61.0, 51.0, 47.0, 40.0, 44.0, 44.0, 37.0, 34.0, 27.0, 17.0, 13.0, 17.0, 7.0, 12.0, 14.0, 1.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.28948974609375, -8.0399169921875, -7.79034423828125, -7.540771484375, -7.29119873046875, -7.0416259765625, -6.79205322265625, -6.54248046875, -6.29290771484375, -6.0433349609375, -5.79376220703125, -5.544189453125, -5.29461669921875, -5.0450439453125, -4.79547119140625, -4.5458984375, -4.29632568359375, -4.0467529296875, -3.79718017578125, -3.547607421875, -3.29803466796875, -3.0484619140625, -2.79888916015625, -2.54931640625, -2.29974365234375, -2.0501708984375, -1.80059814453125, -1.551025390625, -1.30145263671875, -1.0518798828125, -0.80230712890625, -0.552734375, -0.30316162109375, -0.0535888671875, 0.19598388671875, 0.445556640625, 0.69512939453125, 0.9447021484375, 1.19427490234375, 1.44384765625, 1.69342041015625, 1.9429931640625, 2.19256591796875, 2.442138671875, 2.69171142578125, 2.9412841796875, 3.19085693359375, 3.4404296875, 3.69000244140625, 3.9395751953125, 4.18914794921875, 4.438720703125, 4.68829345703125, 4.9378662109375, 5.18743896484375, 5.43701171875, 5.68658447265625, 5.9361572265625, 6.18572998046875, 6.435302734375, 6.68487548828125, 6.9344482421875, 7.18402099609375, 7.43359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 5.0, 14.0, 31.0, 27.0, 38.0, 61.0, 81.0, 157.0, 310.0, 660.0, 1674.0, 5768.0, 31078.0, 315974.0, 615924.0, 63387.0, 9187.0, 2300.0, 900.0, 426.0, 192.0, 106.0, 61.0, 53.0, 37.0, 23.0, 14.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.80078125, -3.67047119140625, -3.5401611328125, -3.40985107421875, -3.279541015625, -3.14923095703125, -3.0189208984375, -2.88861083984375, -2.75830078125, -2.62799072265625, -2.4976806640625, -2.36737060546875, -2.237060546875, -2.10675048828125, -1.9764404296875, -1.84613037109375, -1.7158203125, -1.58551025390625, -1.4552001953125, -1.32489013671875, -1.194580078125, -1.06427001953125, -0.9339599609375, -0.80364990234375, -0.67333984375, -0.54302978515625, -0.4127197265625, -0.28240966796875, -0.152099609375, -0.02178955078125, 0.1085205078125, 0.23883056640625, 0.369140625, 0.49945068359375, 0.6297607421875, 0.76007080078125, 0.890380859375, 1.02069091796875, 1.1510009765625, 1.28131103515625, 1.41162109375, 1.54193115234375, 1.6722412109375, 1.80255126953125, 1.932861328125, 2.06317138671875, 2.1934814453125, 2.32379150390625, 2.4541015625, 2.58441162109375, 2.7147216796875, 2.84503173828125, 2.975341796875, 3.10565185546875, 3.2359619140625, 3.36627197265625, 3.49658203125, 3.62689208984375, 3.7572021484375, 3.88751220703125, 4.017822265625, 4.14813232421875, 4.2784423828125, 4.40875244140625, 4.5390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 15.0, 18.0, 26.0, 17.0, 28.0, 27.0, 53.0, 51.0, 80.0, 75.0, 89.0, 85.0, 75.0, 63.0, 56.0, 44.0, 35.0, 14.0, 25.0, 15.0, 14.0, 10.0, 10.0, 15.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005002021789550781, -0.00048532336950302124, -0.00047044456005096436, -0.00045556575059890747, -0.0004406869411468506, -0.0004258081316947937, -0.0004109293222427368, -0.00039605051279067993, -0.00038117170333862305, -0.00036629289388656616, -0.0003514140844345093, -0.0003365352749824524, -0.0003216564655303955, -0.0003067776560783386, -0.00029189884662628174, -0.00027702003717422485, -0.00026214122772216797, -0.0002472624182701111, -0.0002323836088180542, -0.00021750479936599731, -0.00020262598991394043, -0.00018774718046188354, -0.00017286837100982666, -0.00015798956155776978, -0.0001431107521057129, -0.000128231942653656, -0.00011335313320159912, -9.847432374954224e-05, -8.359551429748535e-05, -6.871670484542847e-05, -5.383789539337158e-05, -3.89590859413147e-05, -2.4080276489257812e-05, -9.201467037200928e-06, 5.677342414855957e-06, 2.0556151866912842e-05, 3.5434961318969727e-05, 5.031377077102661e-05, 6.51925802230835e-05, 8.007138967514038e-05, 9.495019912719727e-05, 0.00010982900857925415, 0.00012470781803131104, 0.00013958662748336792, 0.0001544654369354248, 0.0001693442463874817, 0.00018422305583953857, 0.00019910186529159546, 0.00021398067474365234, 0.00022885948419570923, 0.0002437382936477661, 0.000258617103099823, 0.0002734959125518799, 0.00028837472200393677, 0.00030325353145599365, 0.00031813234090805054, 0.0003330111503601074, 0.0003478899598121643, 0.0003627687692642212, 0.0003776475787162781, 0.00039252638816833496, 0.00040740519762039185, 0.00042228400707244873, 0.0004371628165245056, 0.0004520416259765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 9.0, 9.0, 15.0, 20.0, 30.0, 56.0, 84.0, 174.0, 372.0, 1201.0, 5894.0, 111012.0, 883976.0, 40511.0, 3634.0, 881.0, 325.0, 152.0, 71.0, 50.0, 25.0, 16.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.9432373046875, -6.714599609375, -6.4859619140625, -6.25732421875, -6.0286865234375, -5.800048828125, -5.5714111328125, -5.3427734375, -5.1141357421875, -4.885498046875, -4.6568603515625, -4.42822265625, -4.1995849609375, -3.970947265625, -3.7423095703125, -3.513671875, -3.2850341796875, -3.056396484375, -2.8277587890625, -2.59912109375, -2.3704833984375, -2.141845703125, -1.9132080078125, -1.6845703125, -1.4559326171875, -1.227294921875, -0.9986572265625, -0.77001953125, -0.5413818359375, -0.312744140625, -0.0841064453125, 0.14453125, 0.3731689453125, 0.601806640625, 0.8304443359375, 1.05908203125, 1.2877197265625, 1.516357421875, 1.7449951171875, 1.9736328125, 2.2022705078125, 2.430908203125, 2.6595458984375, 2.88818359375, 3.1168212890625, 3.345458984375, 3.5740966796875, 3.802734375, 4.0313720703125, 4.260009765625, 4.4886474609375, 4.71728515625, 4.9459228515625, 5.174560546875, 5.4031982421875, 5.6318359375, 5.8604736328125, 6.089111328125, 6.3177490234375, 6.54638671875, 6.7750244140625, 7.003662109375, 7.2322998046875, 7.4609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 7.0, 20.0, 27.0, 25.0, 44.0, 49.0, 54.0, 57.0, 68.0, 71.0, 71.0, 62.0, 64.0, 62.0, 65.0, 44.0, 38.0, 32.0, 28.0, 16.0, 14.0, 15.0, 8.0, 6.0, 3.0, 8.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.10546875, -2.029296875, -1.953125, -1.876953125, -1.80078125, -1.724609375, -1.6484375, -1.572265625, -1.49609375, -1.419921875, -1.34375, -1.267578125, -1.19140625, -1.115234375, -1.0390625, -0.962890625, -0.88671875, -0.810546875, -0.734375, -0.658203125, -0.58203125, -0.505859375, -0.4296875, -0.353515625, -0.27734375, -0.201171875, -0.125, -0.048828125, 0.02734375, 0.103515625, 0.1796875, 0.255859375, 0.33203125, 0.408203125, 0.484375, 0.560546875, 0.63671875, 0.712890625, 0.7890625, 0.865234375, 0.94140625, 1.017578125, 1.09375, 1.169921875, 1.24609375, 1.322265625, 1.3984375, 1.474609375, 1.55078125, 1.626953125, 1.703125, 1.779296875, 1.85546875, 1.931640625, 2.0078125, 2.083984375, 2.16015625, 2.236328125, 2.3125, 2.388671875, 2.46484375, 2.541015625, 2.6171875, 2.693359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 9.0, 14.0, 22.0, 42.0, 78.0, 112.0, 167.0, 169.0, 161.0, 95.0, 62.0, 38.0, 19.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-80.1387710571289, -78.24723815917969, -76.35569763183594, -74.46415710449219, -72.57262420654297, -70.68109130859375, -68.78955078125, -66.89801025390625, -65.00647735595703, -63.11494064331055, -61.22340393066406, -59.33186721801758, -57.440330505371094, -55.54879379272461, -53.657257080078125, -51.76572036743164, -49.874183654785156, -47.98264694213867, -46.09111022949219, -44.1995735168457, -42.30803680419922, -40.416500091552734, -38.52496337890625, -36.633426666259766, -34.74188995361328, -32.8503532409668, -30.958816528320312, -29.067279815673828, -27.175743103027344, -25.28420639038086, -23.392669677734375, -21.50113296508789, -19.609596252441406, -17.718059539794922, -15.826522827148438, -13.934986114501953, -12.043449401855469, -10.151912689208984, -8.2603759765625, -6.368839263916016, -4.477302551269531, -2.585765838623047, -0.6942291259765625, 1.1973075866699219, 3.0888442993164062, 4.980381011962891, 6.871917724609375, 8.76345443725586, 10.654991149902344, 12.546527862548828, 14.438064575195312, 16.329601287841797, 18.22113800048828, 20.112674713134766, 22.00421142578125, 23.895748138427734, 25.78728485107422, 27.678821563720703, 29.570358276367188, 31.461894989013672, 33.353431701660156, 35.24496841430664, 37.136505126953125, 39.02804183959961, 40.919578552246094]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 13.0, 25.0, 23.0, 22.0, 28.0, 37.0, 32.0, 40.0, 44.0, 51.0, 56.0, 57.0, 50.0, 44.0, 55.0, 39.0, 40.0, 31.0, 38.0, 34.0, 31.0, 23.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.078405380249023, -30.00717544555664, -28.935945510864258, -27.864715576171875, -26.79348373413086, -25.72225570678711, -24.651023864746094, -23.57979393005371, -22.508563995361328, -21.437334060668945, -20.366104125976562, -19.29487419128418, -18.223644256591797, -17.15241241455078, -16.0811824798584, -15.009952545166016, -13.938722610473633, -12.86749267578125, -11.796262741088867, -10.725031852722168, -9.653801918029785, -8.582571983337402, -7.511341571807861, -6.44011116027832, -5.3688812255859375, -4.297651290893555, -3.2264208793640137, -2.1551907062530518, -1.0839605331420898, -0.012730598449707031, 1.058499813079834, 2.129730224609375, 3.2009620666503906, 4.272192001342773, 5.3434224128723145, 6.4146528244018555, 7.485882759094238, 8.557112693786621, 9.62834358215332, 10.699573516845703, 11.770803451538086, 12.842033386230469, 13.913263320922852, 14.98449420928955, 16.05572509765625, 17.126953125, 18.198184967041016, 19.2694149017334, 20.34064483642578, 21.411874771118164, 22.483104705810547, 23.55433464050293, 24.625564575195312, 25.696796417236328, 26.76802635192871, 27.839256286621094, 28.910486221313477, 29.98171615600586, 31.052946090698242, 32.124176025390625, 33.19540786743164, 34.26663589477539, 35.337867736816406, 36.409095764160156, 37.48032760620117]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 11.0, 22.0, 38.0, 88.0, 170.0, 253.0, 439.0, 833.0, 1843.0, 5771.0, 57627.0, 4110120.0, 11767.0, 2859.0, 1120.0, 564.0, 309.0, 175.0, 116.0, 61.0, 43.0, 21.0, 13.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.46044921875, -12.9833984375, -12.50634765625, -12.029296875, -11.55224609375, -11.0751953125, -10.59814453125, -10.12109375, -9.64404296875, -9.1669921875, -8.68994140625, -8.212890625, -7.73583984375, -7.2587890625, -6.78173828125, -6.3046875, -5.82763671875, -5.3505859375, -4.87353515625, -4.396484375, -3.91943359375, -3.4423828125, -2.96533203125, -2.48828125, -2.01123046875, -1.5341796875, -1.05712890625, -0.580078125, -0.10302734375, 0.3740234375, 0.85107421875, 1.328125, 1.80517578125, 2.2822265625, 2.75927734375, 3.236328125, 3.71337890625, 4.1904296875, 4.66748046875, 5.14453125, 5.62158203125, 6.0986328125, 6.57568359375, 7.052734375, 7.52978515625, 8.0068359375, 8.48388671875, 8.9609375, 9.43798828125, 9.9150390625, 10.39208984375, 10.869140625, 11.34619140625, 11.8232421875, 12.30029296875, 12.77734375, 13.25439453125, 13.7314453125, 14.20849609375, 14.685546875, 15.16259765625, 15.6396484375, 16.11669921875, 16.59375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 8.0, 17.0, 15.0, 24.0, 35.0, 32.0, 46.0, 39.0, 50.0, 41.0, 56.0, 53.0, 60.0, 62.0, 63.0, 55.0, 52.0, 49.0, 46.0, 36.0, 32.0, 18.0, 20.0, 16.0, 14.0, 13.0, 7.0, 7.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1328125, -2.066497802734375, -2.00018310546875, -1.933868408203125, -1.8675537109375, -1.801239013671875, -1.73492431640625, -1.668609619140625, -1.602294921875, -1.535980224609375, -1.46966552734375, -1.403350830078125, -1.3370361328125, -1.270721435546875, -1.20440673828125, -1.138092041015625, -1.07177734375, -1.005462646484375, -0.93914794921875, -0.872833251953125, -0.8065185546875, -0.740203857421875, -0.67388916015625, -0.607574462890625, -0.541259765625, -0.474945068359375, -0.40863037109375, -0.342315673828125, -0.2760009765625, -0.209686279296875, -0.14337158203125, -0.077056884765625, -0.0107421875, 0.055572509765625, 0.12188720703125, 0.188201904296875, 0.2545166015625, 0.320831298828125, 0.38714599609375, 0.453460693359375, 0.519775390625, 0.586090087890625, 0.65240478515625, 0.718719482421875, 0.7850341796875, 0.851348876953125, 0.91766357421875, 0.983978271484375, 1.05029296875, 1.116607666015625, 1.18292236328125, 1.249237060546875, 1.3155517578125, 1.381866455078125, 1.44818115234375, 1.514495849609375, 1.580810546875, 1.647125244140625, 1.71343994140625, 1.779754638671875, 1.8460693359375, 1.912384033203125, 1.97869873046875, 2.045013427734375, 2.111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 9.0, 10.0, 16.0, 24.0, 29.0, 34.0, 46.0, 88.0, 122.0, 176.0, 329.0, 619.0, 1123.0, 2358.0, 6967.0, 42662.0, 4081714.0, 45675.0, 7246.0, 2409.0, 1134.0, 597.0, 338.0, 189.0, 104.0, 62.0, 57.0, 40.0, 24.0, 13.0, 11.0, 10.0, 8.0, 6.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.9375, -11.6353759765625, -11.333251953125, -11.0311279296875, -10.72900390625, -10.4268798828125, -10.124755859375, -9.8226318359375, -9.5205078125, -9.2183837890625, -8.916259765625, -8.6141357421875, -8.31201171875, -8.0098876953125, -7.707763671875, -7.4056396484375, -7.103515625, -6.8013916015625, -6.499267578125, -6.1971435546875, -5.89501953125, -5.5928955078125, -5.290771484375, -4.9886474609375, -4.6865234375, -4.3843994140625, -4.082275390625, -3.7801513671875, -3.47802734375, -3.1759033203125, -2.873779296875, -2.5716552734375, -2.26953125, -1.9674072265625, -1.665283203125, -1.3631591796875, -1.06103515625, -0.7589111328125, -0.456787109375, -0.1546630859375, 0.1474609375, 0.4495849609375, 0.751708984375, 1.0538330078125, 1.35595703125, 1.6580810546875, 1.960205078125, 2.2623291015625, 2.564453125, 2.8665771484375, 3.168701171875, 3.4708251953125, 3.77294921875, 4.0750732421875, 4.377197265625, 4.6793212890625, 4.9814453125, 5.2835693359375, 5.585693359375, 5.8878173828125, 6.18994140625, 6.4920654296875, 6.794189453125, 7.0963134765625, 7.3984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 11.0, 19.0, 46.0, 161.0, 3553.0, 158.0, 39.0, 24.0, 19.0, 14.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.784088134765625, -2.71856689453125, -2.653045654296875, -2.5875244140625, -2.522003173828125, -2.45648193359375, -2.390960693359375, -2.325439453125, -2.259918212890625, -2.19439697265625, -2.128875732421875, -2.0633544921875, -1.997833251953125, -1.93231201171875, -1.866790771484375, -1.80126953125, -1.735748291015625, -1.67022705078125, -1.604705810546875, -1.5391845703125, -1.473663330078125, -1.40814208984375, -1.342620849609375, -1.277099609375, -1.211578369140625, -1.14605712890625, -1.080535888671875, -1.0150146484375, -0.949493408203125, -0.88397216796875, -0.818450927734375, -0.7529296875, -0.687408447265625, -0.62188720703125, -0.556365966796875, -0.4908447265625, -0.425323486328125, -0.35980224609375, -0.294281005859375, -0.228759765625, -0.163238525390625, -0.09771728515625, -0.032196044921875, 0.0333251953125, 0.098846435546875, 0.16436767578125, 0.229888916015625, 0.29541015625, 0.360931396484375, 0.42645263671875, 0.491973876953125, 0.5574951171875, 0.623016357421875, 0.68853759765625, 0.754058837890625, 0.819580078125, 0.885101318359375, 0.95062255859375, 1.016143798828125, 1.0816650390625, 1.147186279296875, 1.21270751953125, 1.278228759765625, 1.34375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 13.0, 28.0, 35.0, 56.0, 119.0, 153.0, 204.0, 167.0, 108.0, 52.0, 29.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.651954650878906, -7.372481346130371, -7.093008518218994, -6.813535213470459, -6.534062385559082, -6.254589080810547, -5.975115776062012, -5.695642948150635, -5.416170120239258, -5.136696815490723, -4.857223987579346, -4.5777506828308105, -4.298277854919434, -4.018804550170898, -3.7393314838409424, -3.4598584175109863, -3.180385112762451, -2.900912046432495, -2.621438980102539, -2.341965675354004, -2.062492847442627, -1.7830196619033813, -1.5035464763641357, -1.2240734100341797, -0.9446003437042236, -0.6651272773742676, -0.38565415143966675, -0.10618102550506592, 0.17329204082489014, 0.4527651071548462, 0.7322382926940918, 1.0117113590240479, 1.291184425354004, 1.57065749168396, 1.850130558013916, 2.129603862762451, 2.409076690673828, 2.6885499954223633, 2.9680230617523193, 3.2474961280822754, 3.5269691944122314, 3.8064422607421875, 4.085915565490723, 4.3653883934021, 4.644861698150635, 4.924334526062012, 5.203807830810547, 5.483281135559082, 5.762753963470459, 6.042227268218994, 6.321700096130371, 6.601173400878906, 6.880646228790283, 7.160119533538818, 7.439592361450195, 7.7190656661987305, 7.998538970947266, 8.2780122756958, 8.557485580444336, 8.836957931518555, 9.11643123626709, 9.395904541015625, 9.67537784576416, 9.954851150512695, 10.234323501586914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 3.0, 10.0, 5.0, 11.0, 9.0, 9.0, 11.0, 18.0, 21.0, 22.0, 22.0, 32.0, 27.0, 34.0, 36.0, 40.0, 40.0, 49.0, 47.0, 57.0, 47.0, 43.0, 46.0, 37.0, 43.0, 39.0, 32.0, 32.0, 28.0, 21.0, 23.0, 22.0, 18.0, 14.0, 9.0, 12.0, 3.0, 3.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-3.4852757453918457, -3.389942169189453, -3.2946088314056396, -3.199275255203247, -3.1039419174194336, -3.008608341217041, -2.9132747650146484, -2.817941188812256, -2.7226078510284424, -2.62727427482605, -2.5319409370422363, -2.4366073608398438, -2.341273784637451, -2.2459404468536377, -2.150606870651245, -2.0552735328674316, -1.959939956665039, -1.864606499671936, -1.769273042678833, -1.6739394664764404, -1.5786060094833374, -1.4832725524902344, -1.3879389762878418, -1.2926055192947388, -1.1972720623016357, -1.1019386053085327, -1.0066051483154297, -0.9112715721130371, -0.8159381151199341, -0.720604658126831, -0.6252711415290833, -0.5299376249313354, -0.4346041679382324, -0.339270681142807, -0.2439371943473816, -0.14860370755195618, -0.05327022075653076, 0.04206326603889465, 0.13739675283432007, 0.23273026943206787, 0.3280637264251709, 0.4233972132205963, 0.5187307000160217, 0.6140642166137695, 0.7093976736068726, 0.8047311305999756, 0.9000646471977234, 0.9953981637954712, 1.0907316207885742, 1.1860650777816772, 1.2813985347747803, 1.3767321109771729, 1.4720655679702759, 1.567399024963379, 1.6627326011657715, 1.7580660581588745, 1.8533995151519775, 1.9487329721450806, 2.0440664291381836, 2.139400005340576, 2.2347335815429688, 2.3300669193267822, 2.425400495529175, 2.5207338333129883, 2.616067409515381]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 7.0, 11.0, 19.0, 15.0, 26.0, 52.0, 64.0, 109.0, 160.0, 277.0, 437.0, 698.0, 1157.0, 2162.0, 3993.0, 7905.0, 17595.0, 41488.0, 104303.0, 262260.0, 338252.0, 157974.0, 61327.0, 24994.0, 11167.0, 5503.0, 2796.0, 1498.0, 848.0, 537.0, 313.0, 200.0, 138.0, 74.0, 59.0, 37.0, 28.0, 21.0, 17.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.533203125, -3.438262939453125, -3.34332275390625, -3.248382568359375, -3.1534423828125, -3.058502197265625, -2.96356201171875, -2.868621826171875, -2.773681640625, -2.678741455078125, -2.58380126953125, -2.488861083984375, -2.3939208984375, -2.298980712890625, -2.20404052734375, -2.109100341796875, -2.01416015625, -1.919219970703125, -1.82427978515625, -1.729339599609375, -1.6343994140625, -1.539459228515625, -1.44451904296875, -1.349578857421875, -1.254638671875, -1.159698486328125, -1.06475830078125, -0.969818115234375, -0.8748779296875, -0.779937744140625, -0.68499755859375, -0.590057373046875, -0.4951171875, -0.400177001953125, -0.30523681640625, -0.210296630859375, -0.1153564453125, -0.020416259765625, 0.07452392578125, 0.169464111328125, 0.264404296875, 0.359344482421875, 0.45428466796875, 0.549224853515625, 0.6441650390625, 0.739105224609375, 0.83404541015625, 0.928985595703125, 1.02392578125, 1.118865966796875, 1.21380615234375, 1.308746337890625, 1.4036865234375, 1.498626708984375, 1.59356689453125, 1.688507080078125, 1.783447265625, 1.878387451171875, 1.97332763671875, 2.068267822265625, 2.1632080078125, 2.258148193359375, 2.35308837890625, 2.448028564453125, 2.54296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 14.0, 30.0, 31.0, 22.0, 40.0, 41.0, 46.0, 46.0, 36.0, 53.0, 58.0, 55.0, 50.0, 60.0, 47.0, 51.0, 61.0, 43.0, 37.0, 27.0, 26.0, 23.0, 15.0, 12.0, 8.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.995513916015625, -1.93048095703125, -1.865447998046875, -1.8004150390625, -1.735382080078125, -1.67034912109375, -1.605316162109375, -1.540283203125, -1.475250244140625, -1.41021728515625, -1.345184326171875, -1.2801513671875, -1.215118408203125, -1.15008544921875, -1.085052490234375, -1.02001953125, -0.954986572265625, -0.88995361328125, -0.824920654296875, -0.7598876953125, -0.694854736328125, -0.62982177734375, -0.564788818359375, -0.499755859375, -0.434722900390625, -0.36968994140625, -0.304656982421875, -0.2396240234375, -0.174591064453125, -0.10955810546875, -0.044525146484375, 0.0205078125, 0.085540771484375, 0.15057373046875, 0.215606689453125, 0.2806396484375, 0.345672607421875, 0.41070556640625, 0.475738525390625, 0.540771484375, 0.605804443359375, 0.67083740234375, 0.735870361328125, 0.8009033203125, 0.865936279296875, 0.93096923828125, 0.996002197265625, 1.06103515625, 1.126068115234375, 1.19110107421875, 1.256134033203125, 1.3211669921875, 1.386199951171875, 1.45123291015625, 1.516265869140625, 1.581298828125, 1.646331787109375, 1.71136474609375, 1.776397705078125, 1.8414306640625, 1.906463623046875, 1.97149658203125, 2.036529541015625, 2.1015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 6.0, 9.0, 7.0, 13.0, 17.0, 21.0, 45.0, 49.0, 80.0, 109.0, 154.0, 248.0, 366.0, 618.0, 1088.0, 2496.0, 7560.0, 43327.0, 607667.0, 346510.0, 27804.0, 5755.0, 2106.0, 944.0, 537.0, 326.0, 214.0, 146.0, 100.0, 61.0, 49.0, 31.0, 29.0, 22.0, 18.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.46484375, -6.26214599609375, -6.0594482421875, -5.85675048828125, -5.654052734375, -5.45135498046875, -5.2486572265625, -5.04595947265625, -4.84326171875, -4.64056396484375, -4.4378662109375, -4.23516845703125, -4.032470703125, -3.82977294921875, -3.6270751953125, -3.42437744140625, -3.2216796875, -3.01898193359375, -2.8162841796875, -2.61358642578125, -2.410888671875, -2.20819091796875, -2.0054931640625, -1.80279541015625, -1.60009765625, -1.39739990234375, -1.1947021484375, -0.99200439453125, -0.789306640625, -0.58660888671875, -0.3839111328125, -0.18121337890625, 0.021484375, 0.22418212890625, 0.4268798828125, 0.62957763671875, 0.832275390625, 1.03497314453125, 1.2376708984375, 1.44036865234375, 1.64306640625, 1.84576416015625, 2.0484619140625, 2.25115966796875, 2.453857421875, 2.65655517578125, 2.8592529296875, 3.06195068359375, 3.2646484375, 3.46734619140625, 3.6700439453125, 3.87274169921875, 4.075439453125, 4.27813720703125, 4.4808349609375, 4.68353271484375, 4.88623046875, 5.08892822265625, 5.2916259765625, 5.49432373046875, 5.697021484375, 5.89971923828125, 6.1024169921875, 6.30511474609375, 6.5078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 15.0, 7.0, 5.0, 13.0, 23.0, 21.0, 13.0, 24.0, 29.0, 26.0, 24.0, 44.0, 50.0, 26.0, 43.0, 37.0, 35.0, 49.0, 47.0, 43.0, 37.0, 43.0, 38.0, 40.0, 28.0, 29.0, 20.0, 21.0, 24.0, 21.0, 17.0, 18.0, 16.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.8125, -6.61279296875, -6.4130859375, -6.21337890625, -6.013671875, -5.81396484375, -5.6142578125, -5.41455078125, -5.21484375, -5.01513671875, -4.8154296875, -4.61572265625, -4.416015625, -4.21630859375, -4.0166015625, -3.81689453125, -3.6171875, -3.41748046875, -3.2177734375, -3.01806640625, -2.818359375, -2.61865234375, -2.4189453125, -2.21923828125, -2.01953125, -1.81982421875, -1.6201171875, -1.42041015625, -1.220703125, -1.02099609375, -0.8212890625, -0.62158203125, -0.421875, -0.22216796875, -0.0224609375, 0.17724609375, 0.376953125, 0.57666015625, 0.7763671875, 0.97607421875, 1.17578125, 1.37548828125, 1.5751953125, 1.77490234375, 1.974609375, 2.17431640625, 2.3740234375, 2.57373046875, 2.7734375, 2.97314453125, 3.1728515625, 3.37255859375, 3.572265625, 3.77197265625, 3.9716796875, 4.17138671875, 4.37109375, 4.57080078125, 4.7705078125, 4.97021484375, 5.169921875, 5.36962890625, 5.5693359375, 5.76904296875, 5.96875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 10.0, 19.0, 18.0, 32.0, 45.0, 85.0, 180.0, 366.0, 1073.0, 4428.0, 42956.0, 855178.0, 133012.0, 8510.0, 1662.0, 501.0, 224.0, 94.0, 57.0, 33.0, 16.0, 18.0, 12.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640625, -4.478759765625, -4.31689453125, -4.155029296875, -3.9931640625, -3.831298828125, -3.66943359375, -3.507568359375, -3.345703125, -3.183837890625, -3.02197265625, -2.860107421875, -2.6982421875, -2.536376953125, -2.37451171875, -2.212646484375, -2.05078125, -1.888916015625, -1.72705078125, -1.565185546875, -1.4033203125, -1.241455078125, -1.07958984375, -0.917724609375, -0.755859375, -0.593994140625, -0.43212890625, -0.270263671875, -0.1083984375, 0.053466796875, 0.21533203125, 0.377197265625, 0.5390625, 0.700927734375, 0.86279296875, 1.024658203125, 1.1865234375, 1.348388671875, 1.51025390625, 1.672119140625, 1.833984375, 1.995849609375, 2.15771484375, 2.319580078125, 2.4814453125, 2.643310546875, 2.80517578125, 2.967041015625, 3.12890625, 3.290771484375, 3.45263671875, 3.614501953125, 3.7763671875, 3.938232421875, 4.10009765625, 4.261962890625, 4.423828125, 4.585693359375, 4.74755859375, 4.909423828125, 5.0712890625, 5.233154296875, 5.39501953125, 5.556884765625, 5.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 14.0, 18.0, 18.0, 31.0, 63.0, 90.0, 189.0, 185.0, 134.0, 70.0, 47.0, 36.0, 21.0, 7.0, 14.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007348060607910156, -0.0007087960839271545, -0.0006827861070632935, -0.0006567761301994324, -0.0006307661533355713, -0.0006047561764717102, -0.0005787461996078491, -0.000552736222743988, -0.000526726245880127, -0.0005007162690162659, -0.0004747062921524048, -0.0004486963152885437, -0.0004226863384246826, -0.00039667636156082153, -0.00037066638469696045, -0.00034465640783309937, -0.0003186464309692383, -0.0002926364541053772, -0.0002666264772415161, -0.00024061650037765503, -0.00021460652351379395, -0.00018859654664993286, -0.00016258656978607178, -0.0001365765929222107, -0.00011056661605834961, -8.455663919448853e-05, -5.854666233062744e-05, -3.253668546676636e-05, -6.5267086029052734e-06, 1.948326826095581e-05, 4.5493245124816895e-05, 7.150322198867798e-05, 9.751319885253906e-05, 0.00012352317571640015, 0.00014953315258026123, 0.00017554312944412231, 0.0002015531063079834, 0.00022756308317184448, 0.00025357306003570557, 0.00027958303689956665, 0.00030559301376342773, 0.0003316029906272888, 0.0003576129674911499, 0.000383622944355011, 0.00040963292121887207, 0.00043564289808273315, 0.00046165287494659424, 0.0004876628518104553, 0.0005136728286743164, 0.0005396828055381775, 0.0005656927824020386, 0.0005917027592658997, 0.0006177127361297607, 0.0006437227129936218, 0.0006697326898574829, 0.000695742666721344, 0.0007217526435852051, 0.0007477626204490662, 0.0007737725973129272, 0.0007997825741767883, 0.0008257925510406494, 0.0008518025279045105, 0.0008778125047683716, 0.0009038224816322327, 0.0009298324584960938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 20.0, 17.0, 28.0, 46.0, 79.0, 132.0, 212.0, 422.0, 840.0, 1859.0, 5178.0, 22440.0, 185323.0, 705192.0, 104737.0, 14912.0, 3952.0, 1508.0, 707.0, 386.0, 204.0, 126.0, 69.0, 37.0, 37.0, 20.0, 11.0, 12.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.842559814453125, -3.73394775390625, -3.625335693359375, -3.5167236328125, -3.408111572265625, -3.29949951171875, -3.190887451171875, -3.082275390625, -2.973663330078125, -2.86505126953125, -2.756439208984375, -2.6478271484375, -2.539215087890625, -2.43060302734375, -2.321990966796875, -2.21337890625, -2.104766845703125, -1.99615478515625, -1.887542724609375, -1.7789306640625, -1.670318603515625, -1.56170654296875, -1.453094482421875, -1.344482421875, -1.235870361328125, -1.12725830078125, -1.018646240234375, -0.9100341796875, -0.801422119140625, -0.69281005859375, -0.584197998046875, -0.4755859375, -0.366973876953125, -0.25836181640625, -0.149749755859375, -0.0411376953125, 0.067474365234375, 0.17608642578125, 0.284698486328125, 0.393310546875, 0.501922607421875, 0.61053466796875, 0.719146728515625, 0.8277587890625, 0.936370849609375, 1.04498291015625, 1.153594970703125, 1.26220703125, 1.370819091796875, 1.47943115234375, 1.588043212890625, 1.6966552734375, 1.805267333984375, 1.91387939453125, 2.022491455078125, 2.131103515625, 2.239715576171875, 2.34832763671875, 2.456939697265625, 2.5655517578125, 2.674163818359375, 2.78277587890625, 2.891387939453125, 3.0]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 24.0, 34.0, 30.0, 42.0, 44.0, 71.0, 64.0, 69.0, 96.0, 97.0, 77.0, 83.0, 59.0, 52.0, 32.0, 26.0, 17.0, 16.0, 10.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.011810302734375, -2.92987060546875, -2.847930908203125, -2.7659912109375, -2.684051513671875, -2.60211181640625, -2.520172119140625, -2.438232421875, -2.356292724609375, -2.27435302734375, -2.192413330078125, -2.1104736328125, -2.028533935546875, -1.94659423828125, -1.864654541015625, -1.78271484375, -1.700775146484375, -1.61883544921875, -1.536895751953125, -1.4549560546875, -1.373016357421875, -1.29107666015625, -1.209136962890625, -1.127197265625, -1.045257568359375, -0.96331787109375, -0.881378173828125, -0.7994384765625, -0.717498779296875, -0.63555908203125, -0.553619384765625, -0.4716796875, -0.389739990234375, -0.30780029296875, -0.225860595703125, -0.1439208984375, -0.061981201171875, 0.01995849609375, 0.101898193359375, 0.183837890625, 0.265777587890625, 0.34771728515625, 0.429656982421875, 0.5115966796875, 0.593536376953125, 0.67547607421875, 0.757415771484375, 0.83935546875, 0.921295166015625, 1.00323486328125, 1.085174560546875, 1.1671142578125, 1.249053955078125, 1.33099365234375, 1.412933349609375, 1.494873046875, 1.576812744140625, 1.65875244140625, 1.740692138671875, 1.8226318359375, 1.904571533203125, 1.98651123046875, 2.068450927734375, 2.150390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 30.0, 89.0, 178.0, 288.0, 245.0, 89.0, 39.0, 18.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.6630630493164, -92.97833251953125, -90.29359436035156, -87.6088638305664, -84.92412567138672, -82.23939514160156, -79.55465698242188, -76.86992645263672, -74.18519592285156, -71.5004653930664, -68.81572723388672, -66.13099670410156, -63.446258544921875, -60.76152801513672, -58.0767936706543, -55.392059326171875, -52.70732116699219, -50.022586822509766, -47.337852478027344, -44.65312194824219, -41.9683837890625, -39.283653259277344, -36.59891891479492, -33.9141845703125, -31.229450225830078, -28.544715881347656, -25.859981536865234, -23.175249099731445, -20.490514755249023, -17.8057804107666, -15.121047973632812, -12.43631362915039, -9.7515869140625, -7.066853046417236, -4.382119178771973, -1.6973857879638672, 0.9873485565185547, 3.6720829010009766, 6.356815338134766, 9.041549682617188, 11.72628402709961, 14.411018371582031, 17.095752716064453, 19.780485153198242, 22.465219497680664, 25.149953842163086, 27.834686279296875, 30.519420623779297, 33.20415496826172, 35.88888931274414, 38.57362365722656, 41.25835418701172, 43.943092346191406, 46.62782287597656, 49.312557220458984, 51.997291564941406, 54.68202590942383, 57.36676025390625, 60.05149459838867, 62.736228942871094, 65.42095947265625, 68.10569763183594, 70.7904281616211, 73.47515869140625, 76.15989685058594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 5.0, 11.0, 11.0, 12.0, 20.0, 29.0, 23.0, 28.0, 43.0, 47.0, 48.0, 52.0, 78.0, 75.0, 70.0, 66.0, 55.0, 51.0, 34.0, 46.0, 33.0, 37.0, 22.0, 20.0, 12.0, 18.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.164466857910156, -51.79619216918945, -50.427913665771484, -49.05963897705078, -47.69136428833008, -46.323089599609375, -44.954811096191406, -43.5865364074707, -42.21826171875, -40.8499870300293, -39.48170852661133, -38.113433837890625, -36.74515914916992, -35.37688446044922, -34.00860595703125, -32.64033126831055, -31.27205467224121, -29.903778076171875, -28.535503387451172, -27.167226791381836, -25.798952102661133, -24.430675506591797, -23.062400817871094, -21.694124221801758, -20.325847625732422, -18.957571029663086, -17.589296340942383, -16.221019744873047, -14.852745056152344, -13.484468460083008, -12.116192817687988, -10.747917175292969, -9.379642486572266, -8.011366844177246, -6.643091201782227, -5.274815082550049, -3.9065394401550293, -2.5382637977600098, -1.169987678527832, 0.1982879638671875, 1.566563606262207, 2.9348392486572266, 4.303114891052246, 5.671391010284424, 7.039666652679443, 8.407941818237305, 9.77621841430664, 11.14449405670166, 12.51276969909668, 13.8810453414917, 15.249320983886719, 16.617597579956055, 17.985872268676758, 19.354148864746094, 20.722423553466797, 22.090700149536133, 23.45897674560547, 24.827253341674805, 26.195528030395508, 27.563804626464844, 28.932079315185547, 30.300355911254883, 31.66863250732422, 33.03690719604492, 34.405181884765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 9.0, 20.0, 17.0, 29.0, 57.0, 100.0, 191.0, 347.0, 716.0, 1525.0, 3426.0, 9330.0, 38199.0, 3975536.0, 138118.0, 16995.0, 5215.0, 2245.0, 1046.0, 492.0, 300.0, 164.0, 75.0, 34.0, 34.0, 21.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.0087890625, -5.775390625, -5.5419921875, -5.30859375, -5.0751953125, -4.841796875, -4.6083984375, -4.375, -4.1416015625, -3.908203125, -3.6748046875, -3.44140625, -3.2080078125, -2.974609375, -2.7412109375, -2.5078125, -2.2744140625, -2.041015625, -1.8076171875, -1.57421875, -1.3408203125, -1.107421875, -0.8740234375, -0.640625, -0.4072265625, -0.173828125, 0.0595703125, 0.29296875, 0.5263671875, 0.759765625, 0.9931640625, 1.2265625, 1.4599609375, 1.693359375, 1.9267578125, 2.16015625, 2.3935546875, 2.626953125, 2.8603515625, 3.09375, 3.3271484375, 3.560546875, 3.7939453125, 4.02734375, 4.2607421875, 4.494140625, 4.7275390625, 4.9609375, 5.1943359375, 5.427734375, 5.6611328125, 5.89453125, 6.1279296875, 6.361328125, 6.5947265625, 6.828125, 7.0615234375, 7.294921875, 7.5283203125, 7.76171875, 7.9951171875, 8.228515625, 8.4619140625, 8.6953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 7.0, 14.0, 21.0, 18.0, 21.0, 33.0, 28.0, 40.0, 50.0, 57.0, 53.0, 67.0, 69.0, 59.0, 57.0, 64.0, 57.0, 54.0, 43.0, 32.0, 29.0, 37.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.556640625, -2.487640380859375, -2.41864013671875, -2.349639892578125, -2.2806396484375, -2.211639404296875, -2.14263916015625, -2.073638916015625, -2.004638671875, -1.935638427734375, -1.86663818359375, -1.797637939453125, -1.7286376953125, -1.659637451171875, -1.59063720703125, -1.521636962890625, -1.45263671875, -1.383636474609375, -1.31463623046875, -1.245635986328125, -1.1766357421875, -1.107635498046875, -1.03863525390625, -0.969635009765625, -0.900634765625, -0.831634521484375, -0.76263427734375, -0.693634033203125, -0.6246337890625, -0.555633544921875, -0.48663330078125, -0.417633056640625, -0.3486328125, -0.279632568359375, -0.21063232421875, -0.141632080078125, -0.0726318359375, -0.003631591796875, 0.06536865234375, 0.134368896484375, 0.203369140625, 0.272369384765625, 0.34136962890625, 0.410369873046875, 0.4793701171875, 0.548370361328125, 0.61737060546875, 0.686370849609375, 0.75537109375, 0.824371337890625, 0.89337158203125, 0.962371826171875, 1.0313720703125, 1.100372314453125, 1.16937255859375, 1.238372802734375, 1.307373046875, 1.376373291015625, 1.44537353515625, 1.514373779296875, 1.5833740234375, 1.652374267578125, 1.72137451171875, 1.790374755859375, 1.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 16.0, 16.0, 34.0, 35.0, 51.0, 78.0, 115.0, 179.0, 268.0, 421.0, 707.0, 1152.0, 1934.0, 3424.0, 7092.0, 18143.0, 77336.0, 3801452.0, 230352.0, 30511.0, 10381.0, 4413.0, 2483.0, 1351.0, 896.0, 482.0, 299.0, 214.0, 137.0, 84.0, 67.0, 42.0, 19.0, 21.0, 18.0, 9.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.33837890625, -4.1923828125, -4.04638671875, -3.900390625, -3.75439453125, -3.6083984375, -3.46240234375, -3.31640625, -3.17041015625, -3.0244140625, -2.87841796875, -2.732421875, -2.58642578125, -2.4404296875, -2.29443359375, -2.1484375, -2.00244140625, -1.8564453125, -1.71044921875, -1.564453125, -1.41845703125, -1.2724609375, -1.12646484375, -0.98046875, -0.83447265625, -0.6884765625, -0.54248046875, -0.396484375, -0.25048828125, -0.1044921875, 0.04150390625, 0.1875, 0.33349609375, 0.4794921875, 0.62548828125, 0.771484375, 0.91748046875, 1.0634765625, 1.20947265625, 1.35546875, 1.50146484375, 1.6474609375, 1.79345703125, 1.939453125, 2.08544921875, 2.2314453125, 2.37744140625, 2.5234375, 2.66943359375, 2.8154296875, 2.96142578125, 3.107421875, 3.25341796875, 3.3994140625, 3.54541015625, 3.69140625, 3.83740234375, 3.9833984375, 4.12939453125, 4.275390625, 4.42138671875, 4.5673828125, 4.71337890625, 4.859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 9.0, 12.0, 11.0, 20.0, 54.0, 90.0, 245.0, 2856.0, 469.0, 126.0, 57.0, 33.0, 21.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.94854736328125, -1.8756103515625, -1.80267333984375, -1.729736328125, -1.65679931640625, -1.5838623046875, -1.51092529296875, -1.43798828125, -1.36505126953125, -1.2921142578125, -1.21917724609375, -1.146240234375, -1.07330322265625, -1.0003662109375, -0.92742919921875, -0.8544921875, -0.78155517578125, -0.7086181640625, -0.63568115234375, -0.562744140625, -0.48980712890625, -0.4168701171875, -0.34393310546875, -0.27099609375, -0.19805908203125, -0.1251220703125, -0.05218505859375, 0.020751953125, 0.09368896484375, 0.1666259765625, 0.23956298828125, 0.3125, 0.38543701171875, 0.4583740234375, 0.53131103515625, 0.604248046875, 0.67718505859375, 0.7501220703125, 0.82305908203125, 0.89599609375, 0.96893310546875, 1.0418701171875, 1.11480712890625, 1.187744140625, 1.26068115234375, 1.3336181640625, 1.40655517578125, 1.4794921875, 1.55242919921875, 1.6253662109375, 1.69830322265625, 1.771240234375, 1.84417724609375, 1.9171142578125, 1.99005126953125, 2.06298828125, 2.13592529296875, 2.2088623046875, 2.28179931640625, 2.354736328125, 2.42767333984375, 2.5006103515625, 2.57354736328125, 2.646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 7.0, 6.0, 19.0, 27.0, 37.0, 58.0, 99.0, 133.0, 145.0, 161.0, 118.0, 74.0, 47.0, 23.0, 22.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.110759735107422, -9.742130279541016, -9.37350082397461, -9.004871368408203, -8.636241912841797, -8.26761245727539, -7.898983478546143, -7.530354022979736, -7.16172456741333, -6.793095111846924, -6.424465656280518, -6.0558366775512695, -5.687207221984863, -5.318577766418457, -4.949948310852051, -4.5813188552856445, -4.212689399719238, -3.844059944152832, -3.475430488586426, -3.1068012714385986, -2.7381718158721924, -2.369542360305786, -2.000913143157959, -1.6322836875915527, -1.2636542320251465, -0.895024836063385, -0.5263954401016235, -0.15776610374450684, 0.21086335182189941, 0.5794928073883057, 0.9481220245361328, 1.316751480102539, 1.685379981994629, 2.054009437561035, 2.4226388931274414, 2.7912681102752686, 3.159897565841675, 3.528527021408081, 3.897156238555908, 4.2657856941223145, 4.634415149688721, 5.003044605255127, 5.371674060821533, 5.740303039550781, 6.1089324951171875, 6.477561950683594, 6.84619140625, 7.214820861816406, 7.5834503173828125, 7.952079772949219, 8.320709228515625, 8.689338684082031, 9.057968139648438, 9.426597595214844, 9.79522705078125, 10.163856506347656, 10.532485961914062, 10.901115417480469, 11.269744873046875, 11.638374328613281, 12.007003784179688, 12.375633239746094, 12.7442626953125, 13.112892150878906, 13.481520652770996]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 5.0, 17.0, 16.0, 13.0, 22.0, 26.0, 22.0, 40.0, 23.0, 37.0, 43.0, 38.0, 47.0, 45.0, 44.0, 59.0, 50.0, 36.0, 38.0, 41.0, 29.0, 44.0, 36.0, 31.0, 30.0, 31.0, 26.0, 17.0, 15.0, 12.0, 20.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.804723262786865, -4.625757217407227, -4.44679069519043, -4.267824649810791, -4.088858604431152, -3.9098923206329346, -3.730926036834717, -3.551959991455078, -3.3729937076568604, -3.1940274238586426, -3.015061378479004, -2.836095094680786, -2.6571288108825684, -2.4781627655029297, -2.299196481704712, -2.120230197906494, -1.9412641525268555, -1.7622979879379272, -1.583331823348999, -1.4043655395507812, -1.225399374961853, -1.0464332103729248, -0.867466926574707, -0.6885007619857788, -0.5095345973968506, -0.3305684030056, -0.15160220861434937, 0.027364015579223633, 0.20633018016815186, 0.3852963447570801, 0.5642626285552979, 0.7432287931442261, 0.9221954345703125, 1.1011615991592407, 1.280127763748169, 1.4590940475463867, 1.638060212135315, 1.8170263767242432, 1.995992660522461, 2.1749587059020996, 2.3539249897003174, 2.532891273498535, 2.711857318878174, 2.8908236026763916, 3.0697898864746094, 3.248755931854248, 3.427722215652466, 3.6066884994506836, 3.7856545448303223, 3.96462082862854, 4.143587112426758, 4.3225531578063965, 4.501519203186035, 4.680485725402832, 4.859451770782471, 5.038417816162109, 5.217384338378906, 5.396350383758545, 5.575316905975342, 5.7542829513549805, 5.933248996734619, 6.112215042114258, 6.291181564331055, 6.470147609710693, 6.649113655090332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 3.0, 11.0, 17.0, 16.0, 43.0, 69.0, 120.0, 233.0, 472.0, 1169.0, 2903.0, 8065.0, 27037.0, 105325.0, 464332.0, 334662.0, 73743.0, 20001.0, 6296.0, 2265.0, 924.0, 408.0, 201.0, 89.0, 57.0, 32.0, 23.0, 10.0, 12.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.49493408203125, -4.2984619140625, -4.10198974609375, -3.905517578125, -3.70904541015625, -3.5125732421875, -3.31610107421875, -3.11962890625, -2.92315673828125, -2.7266845703125, -2.53021240234375, -2.333740234375, -2.13726806640625, -1.9407958984375, -1.74432373046875, -1.5478515625, -1.35137939453125, -1.1549072265625, -0.95843505859375, -0.761962890625, -0.56549072265625, -0.3690185546875, -0.17254638671875, 0.02392578125, 0.22039794921875, 0.4168701171875, 0.61334228515625, 0.809814453125, 1.00628662109375, 1.2027587890625, 1.39923095703125, 1.595703125, 1.79217529296875, 1.9886474609375, 2.18511962890625, 2.381591796875, 2.57806396484375, 2.7745361328125, 2.97100830078125, 3.16748046875, 3.36395263671875, 3.5604248046875, 3.75689697265625, 3.953369140625, 4.14984130859375, 4.3463134765625, 4.54278564453125, 4.7392578125, 4.93572998046875, 5.1322021484375, 5.32867431640625, 5.525146484375, 5.72161865234375, 5.9180908203125, 6.11456298828125, 6.31103515625, 6.50750732421875, 6.7039794921875, 6.90045166015625, 7.096923828125, 7.29339599609375, 7.4898681640625, 7.68634033203125, 7.8828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 14.0, 20.0, 20.0, 27.0, 21.0, 30.0, 36.0, 33.0, 49.0, 53.0, 54.0, 57.0, 55.0, 54.0, 48.0, 52.0, 54.0, 44.0, 51.0, 34.0, 43.0, 21.0, 20.0, 20.0, 16.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.15625, -2.0941314697265625, -2.032012939453125, -1.9698944091796875, -1.90777587890625, -1.8456573486328125, -1.783538818359375, -1.7214202880859375, -1.6593017578125, -1.5971832275390625, -1.535064697265625, -1.4729461669921875, -1.41082763671875, -1.3487091064453125, -1.286590576171875, -1.2244720458984375, -1.162353515625, -1.1002349853515625, -1.038116455078125, -0.9759979248046875, -0.91387939453125, -0.8517608642578125, -0.789642333984375, -0.7275238037109375, -0.6654052734375, -0.6032867431640625, -0.541168212890625, -0.4790496826171875, -0.41693115234375, -0.3548126220703125, -0.292694091796875, -0.2305755615234375, -0.16845703125, -0.1063385009765625, -0.044219970703125, 0.0178985595703125, 0.08001708984375, 0.1421356201171875, 0.204254150390625, 0.2663726806640625, 0.3284912109375, 0.3906097412109375, 0.452728271484375, 0.5148468017578125, 0.57696533203125, 0.6390838623046875, 0.701202392578125, 0.7633209228515625, 0.825439453125, 0.8875579833984375, 0.949676513671875, 1.0117950439453125, 1.07391357421875, 1.1360321044921875, 1.198150634765625, 1.2602691650390625, 1.3223876953125, 1.3845062255859375, 1.446624755859375, 1.5087432861328125, 1.57086181640625, 1.6329803466796875, 1.695098876953125, 1.7572174072265625, 1.8193359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 11.0, 21.0, 13.0, 20.0, 33.0, 29.0, 48.0, 75.0, 94.0, 137.0, 196.0, 322.0, 437.0, 707.0, 1194.0, 2467.0, 6475.0, 28654.0, 219443.0, 682245.0, 83539.0, 13957.0, 3931.0, 1795.0, 968.0, 564.0, 361.0, 228.0, 152.0, 111.0, 95.0, 58.0, 52.0, 29.0, 24.0, 20.0, 9.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.94140625, -7.7283935546875, -7.515380859375, -7.3023681640625, -7.08935546875, -6.8763427734375, -6.663330078125, -6.4503173828125, -6.2373046875, -6.0242919921875, -5.811279296875, -5.5982666015625, -5.38525390625, -5.1722412109375, -4.959228515625, -4.7462158203125, -4.533203125, -4.3201904296875, -4.107177734375, -3.8941650390625, -3.68115234375, -3.4681396484375, -3.255126953125, -3.0421142578125, -2.8291015625, -2.6160888671875, -2.403076171875, -2.1900634765625, -1.97705078125, -1.7640380859375, -1.551025390625, -1.3380126953125, -1.125, -0.9119873046875, -0.698974609375, -0.4859619140625, -0.27294921875, -0.0599365234375, 0.153076171875, 0.3660888671875, 0.5791015625, 0.7921142578125, 1.005126953125, 1.2181396484375, 1.43115234375, 1.6441650390625, 1.857177734375, 2.0701904296875, 2.283203125, 2.4962158203125, 2.709228515625, 2.9222412109375, 3.13525390625, 3.3482666015625, 3.561279296875, 3.7742919921875, 3.9873046875, 4.2003173828125, 4.413330078125, 4.6263427734375, 4.83935546875, 5.0523681640625, 5.265380859375, 5.4783935546875, 5.69140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 3.0, 10.0, 13.0, 15.0, 18.0, 17.0, 30.0, 29.0, 30.0, 45.0, 47.0, 60.0, 52.0, 48.0, 53.0, 62.0, 67.0, 50.0, 53.0, 41.0, 44.0, 36.0, 26.0, 25.0, 28.0, 22.0, 16.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.6484375, -9.403076171875, -9.15771484375, -8.912353515625, -8.6669921875, -8.421630859375, -8.17626953125, -7.930908203125, -7.685546875, -7.440185546875, -7.19482421875, -6.949462890625, -6.7041015625, -6.458740234375, -6.21337890625, -5.968017578125, -5.72265625, -5.477294921875, -5.23193359375, -4.986572265625, -4.7412109375, -4.495849609375, -4.25048828125, -4.005126953125, -3.759765625, -3.514404296875, -3.26904296875, -3.023681640625, -2.7783203125, -2.532958984375, -2.28759765625, -2.042236328125, -1.796875, -1.551513671875, -1.30615234375, -1.060791015625, -0.8154296875, -0.570068359375, -0.32470703125, -0.079345703125, 0.166015625, 0.411376953125, 0.65673828125, 0.902099609375, 1.1474609375, 1.392822265625, 1.63818359375, 1.883544921875, 2.12890625, 2.374267578125, 2.61962890625, 2.864990234375, 3.1103515625, 3.355712890625, 3.60107421875, 3.846435546875, 4.091796875, 4.337158203125, 4.58251953125, 4.827880859375, 5.0732421875, 5.318603515625, 5.56396484375, 5.809326171875, 6.0546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 7.0, 9.0, 6.0, 21.0, 23.0, 34.0, 55.0, 50.0, 79.0, 115.0, 153.0, 222.0, 332.0, 615.0, 950.0, 1782.0, 3486.0, 7622.0, 19299.0, 55593.0, 179897.0, 510079.0, 178105.0, 55123.0, 19161.0, 7785.0, 3507.0, 1797.0, 962.0, 542.0, 361.0, 200.0, 173.0, 106.0, 83.0, 48.0, 34.0, 22.0, 17.0, 16.0, 9.0, 18.0, 6.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0], "bins": [-1.6611328125, -1.610015869140625, -1.55889892578125, -1.507781982421875, -1.4566650390625, -1.405548095703125, -1.35443115234375, -1.303314208984375, -1.252197265625, -1.201080322265625, -1.14996337890625, -1.098846435546875, -1.0477294921875, -0.996612548828125, -0.94549560546875, -0.894378662109375, -0.84326171875, -0.792144775390625, -0.74102783203125, -0.689910888671875, -0.6387939453125, -0.587677001953125, -0.53656005859375, -0.485443115234375, -0.434326171875, -0.383209228515625, -0.33209228515625, -0.280975341796875, -0.2298583984375, -0.178741455078125, -0.12762451171875, -0.076507568359375, -0.025390625, 0.025726318359375, 0.07684326171875, 0.127960205078125, 0.1790771484375, 0.230194091796875, 0.28131103515625, 0.332427978515625, 0.383544921875, 0.434661865234375, 0.48577880859375, 0.536895751953125, 0.5880126953125, 0.639129638671875, 0.69024658203125, 0.741363525390625, 0.79248046875, 0.843597412109375, 0.89471435546875, 0.945831298828125, 0.9969482421875, 1.048065185546875, 1.09918212890625, 1.150299072265625, 1.201416015625, 1.252532958984375, 1.30364990234375, 1.354766845703125, 1.4058837890625, 1.457000732421875, 1.50811767578125, 1.559234619140625, 1.6103515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 11.0, 4.0, 11.0, 9.0, 27.0, 30.0, 38.0, 45.0, 60.0, 90.0, 145.0, 188.0, 110.0, 57.0, 40.0, 43.0, 18.0, 24.0, 18.0, 14.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009059906005859375, -0.0008816048502922058, -0.0008572190999984741, -0.0008328333497047424, -0.0008084475994110107, -0.000784061849117279, -0.0007596760988235474, -0.0007352903485298157, -0.000710904598236084, -0.0006865188479423523, -0.0006621330976486206, -0.0006377473473548889, -0.0006133615970611572, -0.0005889758467674255, -0.0005645900964736938, -0.0005402043461799622, -0.0005158185958862305, -0.0004914328455924988, -0.0004670470952987671, -0.0004426613450050354, -0.0004182755947113037, -0.000393889844417572, -0.00036950409412384033, -0.00034511834383010864, -0.00032073259353637695, -0.00029634684324264526, -0.0002719610929489136, -0.0002475753426551819, -0.0002231895923614502, -0.0001988038420677185, -0.00017441809177398682, -0.00015003234148025513, -0.00012564659118652344, -0.00010126084089279175, -7.687509059906006e-05, -5.248934030532837e-05, -2.810359001159668e-05, -3.7178397178649902e-06, 2.06679105758667e-05, 4.505366086959839e-05, 6.943941116333008e-05, 9.382516145706177e-05, 0.00011821091175079346, 0.00014259666204452515, 0.00016698241233825684, 0.00019136816263198853, 0.00021575391292572021, 0.0002401396632194519, 0.0002645254135131836, 0.0002889111638069153, 0.00031329691410064697, 0.00033768266439437866, 0.00036206841468811035, 0.00038645416498184204, 0.00041083991527557373, 0.0004352256655693054, 0.0004596114158630371, 0.0004839971661567688, 0.0005083829164505005, 0.0005327686667442322, 0.0005571544170379639, 0.0005815401673316956, 0.0006059259176254272, 0.0006303116679191589, 0.0006546974182128906]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 5.0, 9.0, 15.0, 21.0, 30.0, 45.0, 48.0, 65.0, 118.0, 179.0, 262.0, 437.0, 842.0, 1558.0, 3540.0, 10174.0, 40402.0, 225977.0, 602687.0, 124945.0, 24565.0, 6912.0, 2661.0, 1231.0, 709.0, 369.0, 259.0, 162.0, 107.0, 62.0, 42.0, 34.0, 20.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.272735595703125, -2.19781494140625, -2.122894287109375, -2.0479736328125, -1.973052978515625, -1.89813232421875, -1.823211669921875, -1.748291015625, -1.673370361328125, -1.59844970703125, -1.523529052734375, -1.4486083984375, -1.373687744140625, -1.29876708984375, -1.223846435546875, -1.14892578125, -1.074005126953125, -0.99908447265625, -0.924163818359375, -0.8492431640625, -0.774322509765625, -0.69940185546875, -0.624481201171875, -0.549560546875, -0.474639892578125, -0.39971923828125, -0.324798583984375, -0.2498779296875, -0.174957275390625, -0.10003662109375, -0.025115966796875, 0.0498046875, 0.124725341796875, 0.19964599609375, 0.274566650390625, 0.3494873046875, 0.424407958984375, 0.49932861328125, 0.574249267578125, 0.649169921875, 0.724090576171875, 0.79901123046875, 0.873931884765625, 0.9488525390625, 1.023773193359375, 1.09869384765625, 1.173614501953125, 1.24853515625, 1.323455810546875, 1.39837646484375, 1.473297119140625, 1.5482177734375, 1.623138427734375, 1.69805908203125, 1.772979736328125, 1.847900390625, 1.922821044921875, 1.99774169921875, 2.072662353515625, 2.1475830078125, 2.222503662109375, 2.29742431640625, 2.372344970703125, 2.447265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 8.0, 16.0, 19.0, 12.0, 26.0, 27.0, 19.0, 34.0, 41.0, 47.0, 56.0, 67.0, 84.0, 52.0, 80.0, 64.0, 56.0, 48.0, 22.0, 25.0, 26.0, 15.0, 28.0, 18.0, 15.0, 11.0, 12.0, 10.0, 3.0, 11.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61260986328125, -1.5592041015625, -1.50579833984375, -1.452392578125, -1.39898681640625, -1.3455810546875, -1.29217529296875, -1.23876953125, -1.18536376953125, -1.1319580078125, -1.07855224609375, -1.025146484375, -0.97174072265625, -0.9183349609375, -0.86492919921875, -0.8115234375, -0.75811767578125, -0.7047119140625, -0.65130615234375, -0.597900390625, -0.54449462890625, -0.4910888671875, -0.43768310546875, -0.38427734375, -0.33087158203125, -0.2774658203125, -0.22406005859375, -0.170654296875, -0.11724853515625, -0.0638427734375, -0.01043701171875, 0.04296875, 0.09637451171875, 0.1497802734375, 0.20318603515625, 0.256591796875, 0.30999755859375, 0.3634033203125, 0.41680908203125, 0.47021484375, 0.52362060546875, 0.5770263671875, 0.63043212890625, 0.683837890625, 0.73724365234375, 0.7906494140625, 0.84405517578125, 0.8974609375, 0.95086669921875, 1.0042724609375, 1.05767822265625, 1.111083984375, 1.16448974609375, 1.2178955078125, 1.27130126953125, 1.32470703125, 1.37811279296875, 1.4315185546875, 1.48492431640625, 1.538330078125, 1.59173583984375, 1.6451416015625, 1.69854736328125, 1.751953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 23.0, 82.0, 179.0, 253.0, 248.0, 117.0, 54.0, 22.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.33924865722656, -51.71582794189453, -49.0924072265625, -46.46898651123047, -43.8455696105957, -41.22214889526367, -38.59872817993164, -35.975311279296875, -33.351890563964844, -30.728469848632812, -28.105051040649414, -25.481630325317383, -22.858211517333984, -20.234790802001953, -17.611370086669922, -14.987951278686523, -12.36452865600586, -9.741108894348145, -7.1176886558532715, -4.494268417358398, -1.8708486557006836, 0.7525711059570312, 3.3759918212890625, 5.999410629272461, 8.622831344604492, 11.246251106262207, 13.869670867919922, 16.493091583251953, 19.116512298583984, 21.739931106567383, 24.363351821899414, 26.986770629882812, 29.610191345214844, 32.233612060546875, 34.857032775878906, 37.48045349121094, 40.1038703918457, 42.727291107177734, 45.350711822509766, 47.97412872314453, 50.59754943847656, 53.220970153808594, 55.844390869140625, 58.467811584472656, 61.09122848510742, 63.71464920043945, 66.33807373046875, 68.96148681640625, 71.58491516113281, 74.20833587646484, 76.83175659179688, 79.4551773071289, 82.07859802246094, 84.70201110839844, 87.325439453125, 89.9488525390625, 92.57227325439453, 95.19569396972656, 97.8191146850586, 100.44253540039062, 103.06595611572266, 105.68937683105469, 108.31278991699219, 110.93621063232422, 113.55963134765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 17.0, 50.0, 39.0, 38.0, 32.0, 44.0, 52.0, 50.0, 55.0, 39.0, 47.0, 30.0, 45.0, 39.0, 40.0, 37.0, 30.0, 22.0, 31.0, 24.0, 18.0, 15.0, 11.0, 12.0, 7.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.92465591430664, -24.99482536315918, -24.064992904663086, -23.135162353515625, -22.205331802368164, -21.275501251220703, -20.34566879272461, -19.41583824157715, -18.486007690429688, -17.556177139282227, -16.626344680786133, -15.696514129638672, -14.766683578491211, -13.836852073669434, -12.907020568847656, -11.977190017700195, -11.047358512878418, -10.11752700805664, -9.18769645690918, -8.257864952087402, -7.328034400939941, -6.398202896118164, -5.468371868133545, -4.538540840148926, -3.6087098121643066, -2.6788787841796875, -1.7490476369857788, -0.8192164897918701, 0.11061453819274902, 1.0404458045959473, 1.9702768325805664, 2.9001078605651855, 3.8299388885498047, 4.759769916534424, 5.689600944519043, 6.61943244934082, 7.549263000488281, 8.479094505310059, 9.408926010131836, 10.338756561279297, 11.268587112426758, 12.198418617248535, 13.128249168395996, 14.058080673217773, 14.987911224365234, 15.917742729187012, 16.84757423400879, 17.77740478515625, 18.707237243652344, 19.637067794799805, 20.5669002532959, 21.49673080444336, 22.42656135559082, 23.35639190673828, 24.286224365234375, 25.216054916381836, 26.145885467529297, 27.075716018676758, 28.00554847717285, 28.935379028320312, 29.865209579467773, 30.795040130615234, 31.724872589111328, 32.654701232910156, 33.58453369140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 13.0, 16.0, 27.0, 50.0, 82.0, 134.0, 218.0, 378.0, 730.0, 1398.0, 2791.0, 6263.0, 15490.0, 46147.0, 221830.0, 3062423.0, 714655.0, 81176.0, 23810.0, 9025.0, 3785.0, 1796.0, 880.0, 473.0, 279.0, 165.0, 81.0, 60.0, 39.0, 23.0, 16.0, 5.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.806640625, -3.682708740234375, -3.55877685546875, -3.434844970703125, -3.3109130859375, -3.186981201171875, -3.06304931640625, -2.939117431640625, -2.815185546875, -2.691253662109375, -2.56732177734375, -2.443389892578125, -2.3194580078125, -2.195526123046875, -2.07159423828125, -1.947662353515625, -1.82373046875, -1.699798583984375, -1.57586669921875, -1.451934814453125, -1.3280029296875, -1.204071044921875, -1.08013916015625, -0.956207275390625, -0.832275390625, -0.708343505859375, -0.58441162109375, -0.460479736328125, -0.3365478515625, -0.212615966796875, -0.08868408203125, 0.035247802734375, 0.1591796875, 0.283111572265625, 0.40704345703125, 0.530975341796875, 0.6549072265625, 0.778839111328125, 0.90277099609375, 1.026702880859375, 1.150634765625, 1.274566650390625, 1.39849853515625, 1.522430419921875, 1.6463623046875, 1.770294189453125, 1.89422607421875, 2.018157958984375, 2.14208984375, 2.266021728515625, 2.38995361328125, 2.513885498046875, 2.6378173828125, 2.761749267578125, 2.88568115234375, 3.009613037109375, 3.133544921875, 3.257476806640625, 3.38140869140625, 3.505340576171875, 3.6292724609375, 3.753204345703125, 3.87713623046875, 4.001068115234375, 4.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 2.0, 10.0, 14.0, 16.0, 11.0, 17.0, 29.0, 24.0, 37.0, 30.0, 37.0, 55.0, 46.0, 56.0, 55.0, 58.0, 49.0, 52.0, 51.0, 46.0, 47.0, 42.0, 37.0, 34.0, 37.0, 27.0, 21.0, 13.0, 12.0, 8.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.09765625, -2.0394134521484375, -1.981170654296875, -1.9229278564453125, -1.86468505859375, -1.8064422607421875, -1.748199462890625, -1.6899566650390625, -1.6317138671875, -1.5734710693359375, -1.515228271484375, -1.4569854736328125, -1.39874267578125, -1.3404998779296875, -1.282257080078125, -1.2240142822265625, -1.165771484375, -1.1075286865234375, -1.049285888671875, -0.9910430908203125, -0.93280029296875, -0.8745574951171875, -0.816314697265625, -0.7580718994140625, -0.6998291015625, -0.6415863037109375, -0.583343505859375, -0.5251007080078125, -0.46685791015625, -0.4086151123046875, -0.350372314453125, -0.2921295166015625, -0.23388671875, -0.1756439208984375, -0.117401123046875, -0.0591583251953125, -0.00091552734375, 0.0573272705078125, 0.115570068359375, 0.1738128662109375, 0.2320556640625, 0.2902984619140625, 0.348541259765625, 0.4067840576171875, 0.46502685546875, 0.5232696533203125, 0.581512451171875, 0.6397552490234375, 0.697998046875, 0.7562408447265625, 0.814483642578125, 0.8727264404296875, 0.93096923828125, 0.9892120361328125, 1.047454833984375, 1.1056976318359375, 1.1639404296875, 1.2221832275390625, 1.280426025390625, 1.3386688232421875, 1.39691162109375, 1.4551544189453125, 1.513397216796875, 1.5716400146484375, 1.6298828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 15.0, 18.0, 27.0, 27.0, 47.0, 72.0, 100.0, 161.0, 301.0, 481.0, 998.0, 2225.0, 5333.0, 14975.0, 55191.0, 409637.0, 3402055.0, 242913.0, 40631.0, 11417.0, 4124.0, 1687.0, 820.0, 417.0, 224.0, 133.0, 81.0, 51.0, 32.0, 12.0, 14.0, 22.0, 7.0, 8.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.1644287109375, -4.012451171875, -3.8604736328125, -3.70849609375, -3.5565185546875, -3.404541015625, -3.2525634765625, -3.1005859375, -2.9486083984375, -2.796630859375, -2.6446533203125, -2.49267578125, -2.3406982421875, -2.188720703125, -2.0367431640625, -1.884765625, -1.7327880859375, -1.580810546875, -1.4288330078125, -1.27685546875, -1.1248779296875, -0.972900390625, -0.8209228515625, -0.6689453125, -0.5169677734375, -0.364990234375, -0.2130126953125, -0.06103515625, 0.0909423828125, 0.242919921875, 0.3948974609375, 0.546875, 0.6988525390625, 0.850830078125, 1.0028076171875, 1.15478515625, 1.3067626953125, 1.458740234375, 1.6107177734375, 1.7626953125, 1.9146728515625, 2.066650390625, 2.2186279296875, 2.37060546875, 2.5225830078125, 2.674560546875, 2.8265380859375, 2.978515625, 3.1304931640625, 3.282470703125, 3.4344482421875, 3.58642578125, 3.7384033203125, 3.890380859375, 4.0423583984375, 4.1943359375, 4.3463134765625, 4.498291015625, 4.6502685546875, 4.80224609375, 4.9542236328125, 5.106201171875, 5.2581787109375, 5.41015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 11.0, 23.0, 23.0, 22.0, 47.0, 54.0, 94.0, 160.0, 294.0, 828.0, 1213.0, 620.0, 307.0, 144.0, 71.0, 44.0, 32.0, 14.0, 16.0, 6.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7998046875, -5.615234375, -5.4306640625, -5.24609375, -5.0615234375, -4.876953125, -4.6923828125, -4.5078125, -4.3232421875, -4.138671875, -3.9541015625, -3.76953125, -3.5849609375, -3.400390625, -3.2158203125, -3.03125, -2.8466796875, -2.662109375, -2.4775390625, -2.29296875, -2.1083984375, -1.923828125, -1.7392578125, -1.5546875, -1.3701171875, -1.185546875, -1.0009765625, -0.81640625, -0.6318359375, -0.447265625, -0.2626953125, -0.078125, 0.1064453125, 0.291015625, 0.4755859375, 0.66015625, 0.8447265625, 1.029296875, 1.2138671875, 1.3984375, 1.5830078125, 1.767578125, 1.9521484375, 2.13671875, 2.3212890625, 2.505859375, 2.6904296875, 2.875, 3.0595703125, 3.244140625, 3.4287109375, 3.61328125, 3.7978515625, 3.982421875, 4.1669921875, 4.3515625, 4.5361328125, 4.720703125, 4.9052734375, 5.08984375, 5.2744140625, 5.458984375, 5.6435546875, 5.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 0.0, 3.0, 4.0, 8.0, 6.0, 12.0, 20.0, 20.0, 42.0, 57.0, 116.0, 174.0, 215.0, 155.0, 85.0, 41.0, 16.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.24077606201172, -80.50762176513672, -78.77445983886719, -77.04130554199219, -75.30814361572266, -73.57498931884766, -71.84182739257812, -70.10867309570312, -68.3755111694336, -66.6423568725586, -64.90919494628906, -63.1760368347168, -61.44287872314453, -59.709720611572266, -57.9765625, -56.243404388427734, -54.51024627685547, -52.7770881652832, -51.04393005371094, -49.31077194213867, -47.577613830566406, -45.84445571899414, -44.111297607421875, -42.37813949584961, -40.64498519897461, -38.911827087402344, -37.17866897583008, -35.44551086425781, -33.71235275268555, -31.97919464111328, -30.246036529541016, -28.51287841796875, -26.779720306396484, -25.04656219482422, -23.313404083251953, -21.580245971679688, -19.847087860107422, -18.113929748535156, -16.38077163696289, -14.647614479064941, -12.914456367492676, -11.18129825592041, -9.448140144348145, -7.714982509613037, -5.9818243980407715, -4.248666763305664, -2.5155086517333984, -0.7823505401611328, 0.9508075714111328, 2.6839656829833984, 4.417123794555664, 6.1502814292907715, 7.883439540863037, 9.616597175598145, 11.34975528717041, 13.082913398742676, 14.816071510314941, 16.54922866821289, 18.282386779785156, 20.015544891357422, 21.748703002929688, 23.481861114501953, 25.21501922607422, 26.948177337646484, 28.68133544921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 15.0, 22.0, 22.0, 17.0, 25.0, 30.0, 24.0, 26.0, 39.0, 39.0, 31.0, 36.0, 38.0, 47.0, 38.0, 37.0, 43.0, 40.0, 33.0, 48.0, 38.0, 36.0, 38.0, 29.0, 39.0, 24.0, 24.0, 19.0, 18.0, 19.0, 6.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.709545135498047, -22.95271110534668, -22.195877075195312, -21.439043045043945, -20.682209014892578, -19.92537498474121, -19.168540954589844, -18.41170883178711, -17.65487289428711, -16.898038864135742, -16.141204833984375, -15.384370803833008, -14.62753677368164, -13.870702743530273, -13.113869667053223, -12.357035636901855, -11.600202560424805, -10.843368530273438, -10.08653450012207, -9.329700469970703, -8.572866439819336, -7.816032886505127, -7.059199333190918, -6.302365303039551, -5.545531272888184, -4.788697242736816, -4.031863212585449, -3.2750296592712402, -2.518195629119873, -1.7613615989685059, -1.0045280456542969, -0.2476940155029297, 0.5091381072998047, 1.2659720182418823, 2.02280592918396, 2.779639720916748, 3.5364737510681152, 4.293307781219482, 5.050141334533691, 5.806975364685059, 6.563809394836426, 7.320643424987793, 8.07747745513916, 8.834310531616211, 9.591144561767578, 10.347978591918945, 11.104812622070312, 11.86164665222168, 12.618480682373047, 13.375314712524414, 14.132148742675781, 14.888982772827148, 15.645816802978516, 16.402650833129883, 17.15948486328125, 17.916316986083984, 18.673152923583984, 19.42998695373535, 20.18682098388672, 20.943655014038086, 21.700489044189453, 22.45732307434082, 23.214157104492188, 23.970989227294922, 24.72782325744629]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 5.0, 18.0, 22.0, 35.0, 52.0, 85.0, 157.0, 235.0, 412.0, 721.0, 1248.0, 2263.0, 4441.0, 9073.0, 20757.0, 54174.0, 214790.0, 534412.0, 134038.0, 40176.0, 15953.0, 7209.0, 3651.0, 1978.0, 1121.0, 604.0, 347.0, 201.0, 146.0, 94.0, 45.0, 36.0, 16.0, 19.0, 14.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.82275390625, -4.6689453125, -4.51513671875, -4.361328125, -4.20751953125, -4.0537109375, -3.89990234375, -3.74609375, -3.59228515625, -3.4384765625, -3.28466796875, -3.130859375, -2.97705078125, -2.8232421875, -2.66943359375, -2.515625, -2.36181640625, -2.2080078125, -2.05419921875, -1.900390625, -1.74658203125, -1.5927734375, -1.43896484375, -1.28515625, -1.13134765625, -0.9775390625, -0.82373046875, -0.669921875, -0.51611328125, -0.3623046875, -0.20849609375, -0.0546875, 0.09912109375, 0.2529296875, 0.40673828125, 0.560546875, 0.71435546875, 0.8681640625, 1.02197265625, 1.17578125, 1.32958984375, 1.4833984375, 1.63720703125, 1.791015625, 1.94482421875, 2.0986328125, 2.25244140625, 2.40625, 2.56005859375, 2.7138671875, 2.86767578125, 3.021484375, 3.17529296875, 3.3291015625, 3.48291015625, 3.63671875, 3.79052734375, 3.9443359375, 4.09814453125, 4.251953125, 4.40576171875, 4.5595703125, 4.71337890625, 4.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 9.0, 17.0, 14.0, 19.0, 28.0, 26.0, 32.0, 30.0, 35.0, 35.0, 41.0, 43.0, 52.0, 40.0, 56.0, 55.0, 53.0, 48.0, 60.0, 39.0, 34.0, 32.0, 31.0, 29.0, 25.0, 22.0, 24.0, 16.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.172637939453125, -2.11480712890625, -2.056976318359375, -1.9991455078125, -1.941314697265625, -1.88348388671875, -1.825653076171875, -1.767822265625, -1.709991455078125, -1.65216064453125, -1.594329833984375, -1.5364990234375, -1.478668212890625, -1.42083740234375, -1.363006591796875, -1.30517578125, -1.247344970703125, -1.18951416015625, -1.131683349609375, -1.0738525390625, -1.016021728515625, -0.95819091796875, -0.900360107421875, -0.842529296875, -0.784698486328125, -0.72686767578125, -0.669036865234375, -0.6112060546875, -0.553375244140625, -0.49554443359375, -0.437713623046875, -0.3798828125, -0.322052001953125, -0.26422119140625, -0.206390380859375, -0.1485595703125, -0.090728759765625, -0.03289794921875, 0.024932861328125, 0.082763671875, 0.140594482421875, 0.19842529296875, 0.256256103515625, 0.3140869140625, 0.371917724609375, 0.42974853515625, 0.487579345703125, 0.54541015625, 0.603240966796875, 0.66107177734375, 0.718902587890625, 0.7767333984375, 0.834564208984375, 0.89239501953125, 0.950225830078125, 1.008056640625, 1.065887451171875, 1.12371826171875, 1.181549072265625, 1.2393798828125, 1.297210693359375, 1.35504150390625, 1.412872314453125, 1.470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 4.0, 9.0, 9.0, 20.0, 25.0, 39.0, 57.0, 91.0, 131.0, 209.0, 348.0, 601.0, 1139.0, 2652.0, 9504.0, 72258.0, 869258.0, 76908.0, 9888.0, 2738.0, 1208.0, 542.0, 314.0, 207.0, 131.0, 68.0, 65.0, 45.0, 19.0, 19.0, 14.0, 13.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0440673828125, -7.728759765625, -7.4134521484375, -7.09814453125, -6.7828369140625, -6.467529296875, -6.1522216796875, -5.8369140625, -5.5216064453125, -5.206298828125, -4.8909912109375, -4.57568359375, -4.2603759765625, -3.945068359375, -3.6297607421875, -3.314453125, -2.9991455078125, -2.683837890625, -2.3685302734375, -2.05322265625, -1.7379150390625, -1.422607421875, -1.1072998046875, -0.7919921875, -0.4766845703125, -0.161376953125, 0.1539306640625, 0.46923828125, 0.7845458984375, 1.099853515625, 1.4151611328125, 1.73046875, 2.0457763671875, 2.361083984375, 2.6763916015625, 2.99169921875, 3.3070068359375, 3.622314453125, 3.9376220703125, 4.2529296875, 4.5682373046875, 4.883544921875, 5.1988525390625, 5.51416015625, 5.8294677734375, 6.144775390625, 6.4600830078125, 6.775390625, 7.0906982421875, 7.406005859375, 7.7213134765625, 8.03662109375, 8.3519287109375, 8.667236328125, 8.9825439453125, 9.2978515625, 9.6131591796875, 9.928466796875, 10.2437744140625, 10.55908203125, 10.8743896484375, 11.189697265625, 11.5050048828125, 11.8203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 9.0, 6.0, 8.0, 3.0, 7.0, 9.0, 13.0, 13.0, 17.0, 25.0, 42.0, 27.0, 33.0, 40.0, 44.0, 57.0, 56.0, 57.0, 42.0, 48.0, 47.0, 55.0, 58.0, 44.0, 53.0, 37.0, 24.0, 35.0, 24.0, 19.0, 19.0, 6.0, 7.0, 4.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.89453125, -7.63128662109375, -7.3680419921875, -7.10479736328125, -6.841552734375, -6.57830810546875, -6.3150634765625, -6.05181884765625, -5.78857421875, -5.52532958984375, -5.2620849609375, -4.99884033203125, -4.735595703125, -4.47235107421875, -4.2091064453125, -3.94586181640625, -3.6826171875, -3.41937255859375, -3.1561279296875, -2.89288330078125, -2.629638671875, -2.36639404296875, -2.1031494140625, -1.83990478515625, -1.57666015625, -1.31341552734375, -1.0501708984375, -0.78692626953125, -0.523681640625, -0.26043701171875, 0.0028076171875, 0.26605224609375, 0.529296875, 0.79254150390625, 1.0557861328125, 1.31903076171875, 1.582275390625, 1.84552001953125, 2.1087646484375, 2.37200927734375, 2.63525390625, 2.89849853515625, 3.1617431640625, 3.42498779296875, 3.688232421875, 3.95147705078125, 4.2147216796875, 4.47796630859375, 4.7412109375, 5.00445556640625, 5.2677001953125, 5.53094482421875, 5.794189453125, 6.05743408203125, 6.3206787109375, 6.58392333984375, 6.84716796875, 7.11041259765625, 7.3736572265625, 7.63690185546875, 7.900146484375, 8.16339111328125, 8.4266357421875, 8.68988037109375, 8.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 16.0, 18.0, 25.0, 36.0, 51.0, 100.0, 166.0, 326.0, 588.0, 1319.0, 3443.0, 10184.0, 37700.0, 444717.0, 494895.0, 38450.0, 10274.0, 3521.0, 1364.0, 589.0, 293.0, 178.0, 99.0, 52.0, 32.0, 24.0, 19.0, 14.0, 13.0, 8.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0], "bins": [-5.20703125, -5.080047607421875, -4.95306396484375, -4.826080322265625, -4.6990966796875, -4.572113037109375, -4.44512939453125, -4.318145751953125, -4.191162109375, -4.064178466796875, -3.93719482421875, -3.810211181640625, -3.6832275390625, -3.556243896484375, -3.42926025390625, -3.302276611328125, -3.17529296875, -3.048309326171875, -2.92132568359375, -2.794342041015625, -2.6673583984375, -2.540374755859375, -2.41339111328125, -2.286407470703125, -2.159423828125, -2.032440185546875, -1.90545654296875, -1.778472900390625, -1.6514892578125, -1.524505615234375, -1.39752197265625, -1.270538330078125, -1.1435546875, -1.016571044921875, -0.88958740234375, -0.762603759765625, -0.6356201171875, -0.508636474609375, -0.38165283203125, -0.254669189453125, -0.127685546875, -0.000701904296875, 0.12628173828125, 0.253265380859375, 0.3802490234375, 0.507232666015625, 0.63421630859375, 0.761199951171875, 0.88818359375, 1.015167236328125, 1.14215087890625, 1.269134521484375, 1.3961181640625, 1.523101806640625, 1.65008544921875, 1.777069091796875, 1.904052734375, 2.031036376953125, 2.15802001953125, 2.285003662109375, 2.4119873046875, 2.538970947265625, 2.66595458984375, 2.792938232421875, 2.919921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 5.0, 6.0, 6.0, 7.0, 19.0, 17.0, 35.0, 38.0, 72.0, 198.0, 271.0, 134.0, 54.0, 27.0, 25.0, 17.0, 11.0, 5.0, 9.0, 4.0, 7.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011396408081054688, -0.0011032074689865112, -0.0010667741298675537, -0.0010303407907485962, -0.0009939074516296387, -0.0009574741125106812, -0.0009210407733917236, -0.0008846074342727661, -0.0008481740951538086, -0.0008117407560348511, -0.0007753074169158936, -0.000738874077796936, -0.0007024407386779785, -0.000666007399559021, -0.0006295740604400635, -0.000593140721321106, -0.0005567073822021484, -0.0005202740430831909, -0.0004838407039642334, -0.0004474073648452759, -0.00041097402572631836, -0.00037454068660736084, -0.0003381073474884033, -0.0003016740083694458, -0.0002652406692504883, -0.00022880733013153076, -0.00019237399101257324, -0.00015594065189361572, -0.0001195073127746582, -8.307397365570068e-05, -4.6640634536743164e-05, -1.0207295417785645e-05, 2.6226043701171875e-05, 6.26593828201294e-05, 9.909272193908691e-05, 0.00013552606105804443, 0.00017195940017700195, 0.00020839273929595947, 0.000244826078414917, 0.0002812594175338745, 0.00031769275665283203, 0.00035412609577178955, 0.00039055943489074707, 0.0004269927740097046, 0.0004634261131286621, 0.0004998594522476196, 0.0005362927913665771, 0.0005727261304855347, 0.0006091594696044922, 0.0006455928087234497, 0.0006820261478424072, 0.0007184594869613647, 0.0007548928260803223, 0.0007913261651992798, 0.0008277595043182373, 0.0008641928434371948, 0.0009006261825561523, 0.0009370595216751099, 0.0009734928607940674, 0.001009926199913025, 0.0010463595390319824, 0.00108279287815094, 0.0011192262172698975, 0.001155659556388855, 0.0011920928955078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 9.0, 8.0, 21.0, 19.0, 33.0, 45.0, 107.0, 160.0, 276.0, 534.0, 1222.0, 3217.0, 11507.0, 71179.0, 830680.0, 108069.0, 14768.0, 3920.0, 1381.0, 632.0, 300.0, 181.0, 90.0, 67.0, 41.0, 28.0, 18.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.015625, -4.86627197265625, -4.7169189453125, -4.56756591796875, -4.418212890625, -4.26885986328125, -4.1195068359375, -3.97015380859375, -3.82080078125, -3.67144775390625, -3.5220947265625, -3.37274169921875, -3.223388671875, -3.07403564453125, -2.9246826171875, -2.77532958984375, -2.6259765625, -2.47662353515625, -2.3272705078125, -2.17791748046875, -2.028564453125, -1.87921142578125, -1.7298583984375, -1.58050537109375, -1.43115234375, -1.28179931640625, -1.1324462890625, -0.98309326171875, -0.833740234375, -0.68438720703125, -0.5350341796875, -0.38568115234375, -0.236328125, -0.08697509765625, 0.0623779296875, 0.21173095703125, 0.361083984375, 0.51043701171875, 0.6597900390625, 0.80914306640625, 0.95849609375, 1.10784912109375, 1.2572021484375, 1.40655517578125, 1.555908203125, 1.70526123046875, 1.8546142578125, 2.00396728515625, 2.1533203125, 2.30267333984375, 2.4520263671875, 2.60137939453125, 2.750732421875, 2.90008544921875, 3.0494384765625, 3.19879150390625, 3.34814453125, 3.49749755859375, 3.6468505859375, 3.79620361328125, 3.945556640625, 4.09490966796875, 4.2442626953125, 4.39361572265625, 4.54296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 6.0, 7.0, 12.0, 16.0, 18.0, 26.0, 38.0, 45.0, 65.0, 97.0, 123.0, 114.0, 110.0, 81.0, 51.0, 45.0, 31.0, 29.0, 21.0, 13.0, 7.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.39666748046875, -2.2933349609375, -2.19000244140625, -2.086669921875, -1.98333740234375, -1.8800048828125, -1.77667236328125, -1.67333984375, -1.57000732421875, -1.4666748046875, -1.36334228515625, -1.260009765625, -1.15667724609375, -1.0533447265625, -0.95001220703125, -0.8466796875, -0.74334716796875, -0.6400146484375, -0.53668212890625, -0.433349609375, -0.33001708984375, -0.2266845703125, -0.12335205078125, -0.02001953125, 0.08331298828125, 0.1866455078125, 0.28997802734375, 0.393310546875, 0.49664306640625, 0.5999755859375, 0.70330810546875, 0.806640625, 0.90997314453125, 1.0133056640625, 1.11663818359375, 1.219970703125, 1.32330322265625, 1.4266357421875, 1.52996826171875, 1.63330078125, 1.73663330078125, 1.8399658203125, 1.94329833984375, 2.046630859375, 2.14996337890625, 2.2532958984375, 2.35662841796875, 2.4599609375, 2.56329345703125, 2.6666259765625, 2.76995849609375, 2.873291015625, 2.97662353515625, 3.0799560546875, 3.18328857421875, 3.28662109375, 3.38995361328125, 3.4932861328125, 3.59661865234375, 3.699951171875, 3.80328369140625, 3.9066162109375, 4.00994873046875, 4.11328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 1.0, 5.0, 5.0, 13.0, 26.0, 42.0, 83.0, 93.0, 141.0, 159.0, 139.0, 94.0, 75.0, 42.0, 32.0, 14.0, 11.0, 5.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.12789535522461, -34.59796905517578, -33.06803894042969, -31.53811264038086, -30.00818634033203, -28.47825813293457, -26.94832992553711, -25.41840362548828, -23.88847541809082, -22.35854721069336, -20.82862091064453, -19.29869270324707, -17.76876449584961, -16.23883819580078, -14.70890998840332, -13.178982734680176, -11.649055480957031, -10.119128227233887, -8.589200973510742, -7.059272766113281, -5.529345512390137, -3.999418258666992, -2.4694900512695312, -0.9395627975463867, 0.5903644561767578, 2.1202919483184814, 3.650219440460205, 5.180147171020508, 6.710074424743652, 8.240001678466797, 9.769929885864258, 11.299857139587402, 12.829784393310547, 14.359711647033691, 15.889638900756836, 17.419567108154297, 18.949493408203125, 20.479421615600586, 22.009349822998047, 23.539276123046875, 25.069204330444336, 26.599132537841797, 28.129058837890625, 29.658987045288086, 31.188915252685547, 32.718841552734375, 34.24877166748047, 35.7786979675293, 37.308624267578125, 38.83855056762695, 40.36848068237305, 41.898406982421875, 43.4283332824707, 44.95825958251953, 46.488189697265625, 48.01811599731445, 49.54804229736328, 51.07796859741211, 52.6078987121582, 54.13782501220703, 55.66775131225586, 57.19767761230469, 58.72760772705078, 60.25753402709961, 61.7874641418457]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 5.0, 9.0, 9.0, 16.0, 8.0, 18.0, 15.0, 26.0, 17.0, 15.0, 18.0, 27.0, 29.0, 26.0, 29.0, 33.0, 52.0, 42.0, 47.0, 41.0, 47.0, 49.0, 43.0, 50.0, 31.0, 35.0, 24.0, 31.0, 41.0, 22.0, 15.0, 23.0, 16.0, 16.0, 10.0, 16.0, 10.0, 8.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.409465789794922, -26.574079513549805, -25.738693237304688, -24.903305053710938, -24.06791877746582, -23.232532501220703, -22.397144317626953, -21.561758041381836, -20.72637176513672, -19.8909854888916, -19.055599212646484, -18.220211029052734, -17.384824752807617, -16.5494384765625, -15.714051246643066, -14.878664016723633, -14.043277740478516, -13.207891464233398, -12.372504234313965, -11.537117004394531, -10.701730728149414, -9.866344451904297, -9.030957221984863, -8.19556999206543, -7.3601837158203125, -6.524796962738037, -5.689410209655762, -4.854023456573486, -4.018636703491211, -3.1832499504089355, -2.34786319732666, -1.5124764442443848, -0.6770896911621094, 0.15829706192016602, 0.9936838150024414, 1.8290705680847168, 2.664457321166992, 3.4998440742492676, 4.335230827331543, 5.170617580413818, 6.006004333496094, 6.841391086578369, 7.6767778396606445, 8.512165069580078, 9.347551345825195, 10.182937622070312, 11.018324851989746, 11.85371208190918, 12.689098358154297, 13.524484634399414, 14.359871864318848, 15.195259094238281, 16.0306453704834, 16.866031646728516, 17.701419830322266, 18.536806106567383, 19.3721923828125, 20.207578659057617, 21.042964935302734, 21.878353118896484, 22.7137393951416, 23.54912567138672, 24.38451385498047, 25.219900131225586, 26.055286407470703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 10.0, 19.0, 21.0, 19.0, 36.0, 46.0, 72.0, 77.0, 130.0, 240.0, 795.0, 9504.0, 2650207.0, 1523389.0, 8351.0, 713.0, 200.0, 132.0, 76.0, 54.0, 47.0, 37.0, 20.0, 17.0, 21.0, 11.0, 6.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.2342529296875, -9.788818359375, -9.3433837890625, -8.89794921875, -8.4525146484375, -8.007080078125, -7.5616455078125, -7.1162109375, -6.6707763671875, -6.225341796875, -5.7799072265625, -5.33447265625, -4.8890380859375, -4.443603515625, -3.9981689453125, -3.552734375, -3.1072998046875, -2.661865234375, -2.2164306640625, -1.77099609375, -1.3255615234375, -0.880126953125, -0.4346923828125, 0.0107421875, 0.4561767578125, 0.901611328125, 1.3470458984375, 1.79248046875, 2.2379150390625, 2.683349609375, 3.1287841796875, 3.57421875, 4.0196533203125, 4.465087890625, 4.9105224609375, 5.35595703125, 5.8013916015625, 6.246826171875, 6.6922607421875, 7.1376953125, 7.5831298828125, 8.028564453125, 8.4739990234375, 8.91943359375, 9.3648681640625, 9.810302734375, 10.2557373046875, 10.701171875, 11.1466064453125, 11.592041015625, 12.0374755859375, 12.48291015625, 12.9283447265625, 13.373779296875, 13.8192138671875, 14.2646484375, 14.7100830078125, 15.155517578125, 15.6009521484375, 16.04638671875, 16.4918212890625, 16.937255859375, 17.3826904296875, 17.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 8.0, 15.0, 19.0, 16.0, 20.0, 22.0, 34.0, 45.0, 34.0, 42.0, 54.0, 58.0, 59.0, 76.0, 39.0, 50.0, 52.0, 58.0, 60.0, 44.0, 26.0, 31.0, 35.0, 20.0, 20.0, 17.0, 7.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.12127685546875, -2.0589599609375, -1.99664306640625, -1.934326171875, -1.87200927734375, -1.8096923828125, -1.74737548828125, -1.68505859375, -1.62274169921875, -1.5604248046875, -1.49810791015625, -1.435791015625, -1.37347412109375, -1.3111572265625, -1.24884033203125, -1.1865234375, -1.12420654296875, -1.0618896484375, -0.99957275390625, -0.937255859375, -0.87493896484375, -0.8126220703125, -0.75030517578125, -0.68798828125, -0.62567138671875, -0.5633544921875, -0.50103759765625, -0.438720703125, -0.37640380859375, -0.3140869140625, -0.25177001953125, -0.189453125, -0.12713623046875, -0.0648193359375, -0.00250244140625, 0.059814453125, 0.12213134765625, 0.1844482421875, 0.24676513671875, 0.30908203125, 0.37139892578125, 0.4337158203125, 0.49603271484375, 0.558349609375, 0.62066650390625, 0.6829833984375, 0.74530029296875, 0.8076171875, 0.86993408203125, 0.9322509765625, 0.99456787109375, 1.056884765625, 1.11920166015625, 1.1815185546875, 1.24383544921875, 1.30615234375, 1.36846923828125, 1.4307861328125, 1.49310302734375, 1.555419921875, 1.61773681640625, 1.6800537109375, 1.74237060546875, 1.8046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 19.0, 34.0, 31.0, 53.0, 92.0, 174.0, 239.0, 436.0, 855.0, 1449.0, 2980.0, 5939.0, 12725.0, 31139.0, 94880.0, 517164.0, 2870596.0, 505603.0, 94379.0, 30657.0, 12413.0, 5840.0, 2870.0, 1581.0, 848.0, 492.0, 281.0, 190.0, 104.0, 70.0, 37.0, 27.0, 20.0, 10.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.139251708984375, -3.03631591796875, -2.933380126953125, -2.8304443359375, -2.727508544921875, -2.62457275390625, -2.521636962890625, -2.418701171875, -2.315765380859375, -2.21282958984375, -2.109893798828125, -2.0069580078125, -1.904022216796875, -1.80108642578125, -1.698150634765625, -1.59521484375, -1.492279052734375, -1.38934326171875, -1.286407470703125, -1.1834716796875, -1.080535888671875, -0.97760009765625, -0.874664306640625, -0.771728515625, -0.668792724609375, -0.56585693359375, -0.462921142578125, -0.3599853515625, -0.257049560546875, -0.15411376953125, -0.051177978515625, 0.0517578125, 0.154693603515625, 0.25762939453125, 0.360565185546875, 0.4635009765625, 0.566436767578125, 0.66937255859375, 0.772308349609375, 0.875244140625, 0.978179931640625, 1.08111572265625, 1.184051513671875, 1.2869873046875, 1.389923095703125, 1.49285888671875, 1.595794677734375, 1.69873046875, 1.801666259765625, 1.90460205078125, 2.007537841796875, 2.1104736328125, 2.213409423828125, 2.31634521484375, 2.419281005859375, 2.522216796875, 2.625152587890625, 2.72808837890625, 2.831024169921875, 2.9339599609375, 3.036895751953125, 3.13983154296875, 3.242767333984375, 3.345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 11.0, 12.0, 10.0, 18.0, 15.0, 32.0, 38.0, 58.0, 74.0, 119.0, 203.0, 368.0, 654.0, 878.0, 601.0, 346.0, 219.0, 130.0, 73.0, 50.0, 36.0, 27.0, 19.0, 21.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.69921875, -3.56488037109375, -3.4305419921875, -3.29620361328125, -3.161865234375, -3.02752685546875, -2.8931884765625, -2.75885009765625, -2.62451171875, -2.49017333984375, -2.3558349609375, -2.22149658203125, -2.087158203125, -1.95281982421875, -1.8184814453125, -1.68414306640625, -1.5498046875, -1.41546630859375, -1.2811279296875, -1.14678955078125, -1.012451171875, -0.87811279296875, -0.7437744140625, -0.60943603515625, -0.47509765625, -0.34075927734375, -0.2064208984375, -0.07208251953125, 0.062255859375, 0.19659423828125, 0.3309326171875, 0.46527099609375, 0.599609375, 0.73394775390625, 0.8682861328125, 1.00262451171875, 1.136962890625, 1.27130126953125, 1.4056396484375, 1.53997802734375, 1.67431640625, 1.80865478515625, 1.9429931640625, 2.07733154296875, 2.211669921875, 2.34600830078125, 2.4803466796875, 2.61468505859375, 2.7490234375, 2.88336181640625, 3.0177001953125, 3.15203857421875, 3.286376953125, 3.42071533203125, 3.5550537109375, 3.68939208984375, 3.82373046875, 3.95806884765625, 4.0924072265625, 4.22674560546875, 4.361083984375, 4.49542236328125, 4.6297607421875, 4.76409912109375, 4.8984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 37.0, 132.0, 365.0, 326.0, 84.0, 31.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.76509094238281, -65.88572692871094, -63.006370544433594, -60.127010345458984, -57.247650146484375, -54.368289947509766, -51.488929748535156, -48.60956573486328, -45.73020935058594, -42.85084915161133, -39.97148895263672, -37.09212875366211, -34.2127685546875, -31.33340835571289, -28.45404624938965, -25.57468605041504, -22.695323944091797, -19.815963745117188, -16.936603546142578, -14.057242393493652, -11.177882194519043, -8.298521995544434, -5.419160842895508, -2.5398006439208984, 0.33955955505371094, 3.2189199924468994, 6.098280429840088, 8.977641105651855, 11.857001304626465, 14.736361503601074, 17.61572265625, 20.49508285522461, 23.37444305419922, 26.253803253173828, 29.133163452148438, 32.01252365112305, 34.891883850097656, 37.771244049072266, 40.650604248046875, 43.52996826171875, 46.409324645996094, 49.2886848449707, 52.16804504394531, 55.04740524291992, 57.92676544189453, 60.80612564086914, 63.68548583984375, 66.56484985351562, 69.4442138671875, 72.32357788085938, 75.20293426513672, 78.0822982788086, 80.96165466308594, 83.84101867675781, 86.72037506103516, 89.59973907470703, 92.47909545898438, 95.35845947265625, 98.2378158569336, 101.11717987060547, 103.99653625488281, 106.87590026855469, 109.75525665283203, 112.6346206665039, 115.51397705078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 4.0, 7.0, 7.0, 4.0, 9.0, 6.0, 15.0, 10.0, 13.0, 19.0, 24.0, 20.0, 30.0, 25.0, 30.0, 28.0, 52.0, 44.0, 28.0, 51.0, 36.0, 41.0, 46.0, 44.0, 35.0, 37.0, 46.0, 36.0, 29.0, 33.0, 17.0, 28.0, 20.0, 21.0, 19.0, 11.0, 7.0, 7.0, 9.0, 5.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.872273445129395, -15.355517387390137, -14.838761329650879, -14.322005271911621, -13.805248260498047, -13.288492202758789, -12.771736145019531, -12.254980087280273, -11.738224029541016, -11.221467971801758, -10.7047119140625, -10.187955856323242, -9.671199798583984, -9.154443740844727, -8.637686729431152, -8.120930671691895, -7.604174613952637, -7.087418556213379, -6.570662498474121, -6.053905963897705, -5.537149906158447, -5.0203938484191895, -4.503637313842773, -3.9868812561035156, -3.470125198364258, -2.953369140625, -2.436612844467163, -1.9198566675186157, -1.4031004905700684, -0.8863444328308105, -0.36958813667297363, 0.14716815948486328, 0.6639251708984375, 1.1806813478469849, 1.6974375247955322, 2.214193820953369, 2.730949878692627, 3.2477059364318848, 3.7644622325897217, 4.281218528747559, 4.797974586486816, 5.314730644226074, 5.831486701965332, 6.348243236541748, 6.864999294281006, 7.381755352020264, 7.89851188659668, 8.415267944335938, 8.932024002075195, 9.448780059814453, 9.965536117553711, 10.482292175292969, 10.999048233032227, 11.515804290771484, 12.032561302185059, 12.549317359924316, 13.066073417663574, 13.582829475402832, 14.09958553314209, 14.616341590881348, 15.133098602294922, 15.64985466003418, 16.166610717773438, 16.683366775512695, 17.200122833251953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 7.0, 9.0, 17.0, 29.0, 28.0, 44.0, 75.0, 90.0, 134.0, 217.0, 344.0, 540.0, 895.0, 1813.0, 3478.0, 7481.0, 17962.0, 48083.0, 196729.0, 561021.0, 141883.0, 39349.0, 15144.0, 6389.0, 3085.0, 1553.0, 773.0, 466.0, 274.0, 203.0, 145.0, 79.0, 67.0, 35.0, 24.0, 26.0, 16.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.386962890625, -4.24267578125, -4.098388671875, -3.9541015625, -3.809814453125, -3.66552734375, -3.521240234375, -3.376953125, -3.232666015625, -3.08837890625, -2.944091796875, -2.7998046875, -2.655517578125, -2.51123046875, -2.366943359375, -2.22265625, -2.078369140625, -1.93408203125, -1.789794921875, -1.6455078125, -1.501220703125, -1.35693359375, -1.212646484375, -1.068359375, -0.924072265625, -0.77978515625, -0.635498046875, -0.4912109375, -0.346923828125, -0.20263671875, -0.058349609375, 0.0859375, 0.230224609375, 0.37451171875, 0.518798828125, 0.6630859375, 0.807373046875, 0.95166015625, 1.095947265625, 1.240234375, 1.384521484375, 1.52880859375, 1.673095703125, 1.8173828125, 1.961669921875, 2.10595703125, 2.250244140625, 2.39453125, 2.538818359375, 2.68310546875, 2.827392578125, 2.9716796875, 3.115966796875, 3.26025390625, 3.404541015625, 3.548828125, 3.693115234375, 3.83740234375, 3.981689453125, 4.1259765625, 4.270263671875, 4.41455078125, 4.558837890625, 4.703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 10.0, 8.0, 19.0, 22.0, 15.0, 17.0, 25.0, 32.0, 32.0, 41.0, 39.0, 47.0, 47.0, 37.0, 50.0, 55.0, 41.0, 47.0, 45.0, 44.0, 33.0, 31.0, 48.0, 27.0, 27.0, 27.0, 25.0, 13.0, 17.0, 17.0, 11.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -2.0131378173828125, -1.959869384765625, -1.9066009521484375, -1.85333251953125, -1.8000640869140625, -1.746795654296875, -1.6935272216796875, -1.6402587890625, -1.5869903564453125, -1.533721923828125, -1.4804534912109375, -1.42718505859375, -1.3739166259765625, -1.320648193359375, -1.2673797607421875, -1.214111328125, -1.1608428955078125, -1.107574462890625, -1.0543060302734375, -1.00103759765625, -0.9477691650390625, -0.894500732421875, -0.8412322998046875, -0.7879638671875, -0.7346954345703125, -0.681427001953125, -0.6281585693359375, -0.57489013671875, -0.5216217041015625, -0.468353271484375, -0.4150848388671875, -0.36181640625, -0.3085479736328125, -0.255279541015625, -0.2020111083984375, -0.14874267578125, -0.0954742431640625, -0.042205810546875, 0.0110626220703125, 0.0643310546875, 0.1175994873046875, 0.170867919921875, 0.2241363525390625, 0.27740478515625, 0.3306732177734375, 0.383941650390625, 0.4372100830078125, 0.490478515625, 0.5437469482421875, 0.597015380859375, 0.6502838134765625, 0.70355224609375, 0.7568206787109375, 0.810089111328125, 0.8633575439453125, 0.9166259765625, 0.9698944091796875, 1.023162841796875, 1.0764312744140625, 1.12969970703125, 1.1829681396484375, 1.236236572265625, 1.2895050048828125, 1.3427734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 10.0, 11.0, 9.0, 15.0, 22.0, 24.0, 33.0, 40.0, 58.0, 99.0, 138.0, 224.0, 344.0, 627.0, 1287.0, 3094.0, 9175.0, 36008.0, 313049.0, 614501.0, 50560.0, 12074.0, 3764.0, 1527.0, 682.0, 421.0, 251.0, 158.0, 103.0, 80.0, 44.0, 36.0, 18.0, 7.0, 15.0, 14.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-7.73046875, -7.527587890625, -7.32470703125, -7.121826171875, -6.9189453125, -6.716064453125, -6.51318359375, -6.310302734375, -6.107421875, -5.904541015625, -5.70166015625, -5.498779296875, -5.2958984375, -5.093017578125, -4.89013671875, -4.687255859375, -4.484375, -4.281494140625, -4.07861328125, -3.875732421875, -3.6728515625, -3.469970703125, -3.26708984375, -3.064208984375, -2.861328125, -2.658447265625, -2.45556640625, -2.252685546875, -2.0498046875, -1.846923828125, -1.64404296875, -1.441162109375, -1.23828125, -1.035400390625, -0.83251953125, -0.629638671875, -0.4267578125, -0.223876953125, -0.02099609375, 0.181884765625, 0.384765625, 0.587646484375, 0.79052734375, 0.993408203125, 1.1962890625, 1.399169921875, 1.60205078125, 1.804931640625, 2.0078125, 2.210693359375, 2.41357421875, 2.616455078125, 2.8193359375, 3.022216796875, 3.22509765625, 3.427978515625, 3.630859375, 3.833740234375, 4.03662109375, 4.239501953125, 4.4423828125, 4.645263671875, 4.84814453125, 5.051025390625, 5.25390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 6.0, 15.0, 10.0, 21.0, 17.0, 28.0, 29.0, 33.0, 44.0, 60.0, 53.0, 59.0, 55.0, 61.0, 69.0, 51.0, 51.0, 51.0, 52.0, 45.0, 29.0, 34.0, 25.0, 22.0, 18.0, 15.0, 7.0, 4.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.0108642578125, -7.756103515625, -7.5013427734375, -7.24658203125, -6.9918212890625, -6.737060546875, -6.4822998046875, -6.2275390625, -5.9727783203125, -5.718017578125, -5.4632568359375, -5.20849609375, -4.9537353515625, -4.698974609375, -4.4442138671875, -4.189453125, -3.9346923828125, -3.679931640625, -3.4251708984375, -3.17041015625, -2.9156494140625, -2.660888671875, -2.4061279296875, -2.1513671875, -1.8966064453125, -1.641845703125, -1.3870849609375, -1.13232421875, -0.8775634765625, -0.622802734375, -0.3680419921875, -0.11328125, 0.1414794921875, 0.396240234375, 0.6510009765625, 0.90576171875, 1.1605224609375, 1.415283203125, 1.6700439453125, 1.9248046875, 2.1795654296875, 2.434326171875, 2.6890869140625, 2.94384765625, 3.1986083984375, 3.453369140625, 3.7081298828125, 3.962890625, 4.2176513671875, 4.472412109375, 4.7271728515625, 4.98193359375, 5.2366943359375, 5.491455078125, 5.7462158203125, 6.0009765625, 6.2557373046875, 6.510498046875, 6.7652587890625, 7.02001953125, 7.2747802734375, 7.529541015625, 7.7843017578125, 8.0390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 17.0, 21.0, 43.0, 85.0, 160.0, 381.0, 1127.0, 3974.0, 22097.0, 589497.0, 405792.0, 19839.0, 3717.0, 1054.0, 388.0, 154.0, 72.0, 42.0, 28.0, 19.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.390625, -6.2177734375, -6.044921875, -5.8720703125, -5.69921875, -5.5263671875, -5.353515625, -5.1806640625, -5.0078125, -4.8349609375, -4.662109375, -4.4892578125, -4.31640625, -4.1435546875, -3.970703125, -3.7978515625, -3.625, -3.4521484375, -3.279296875, -3.1064453125, -2.93359375, -2.7607421875, -2.587890625, -2.4150390625, -2.2421875, -2.0693359375, -1.896484375, -1.7236328125, -1.55078125, -1.3779296875, -1.205078125, -1.0322265625, -0.859375, -0.6865234375, -0.513671875, -0.3408203125, -0.16796875, 0.0048828125, 0.177734375, 0.3505859375, 0.5234375, 0.6962890625, 0.869140625, 1.0419921875, 1.21484375, 1.3876953125, 1.560546875, 1.7333984375, 1.90625, 2.0791015625, 2.251953125, 2.4248046875, 2.59765625, 2.7705078125, 2.943359375, 3.1162109375, 3.2890625, 3.4619140625, 3.634765625, 3.8076171875, 3.98046875, 4.1533203125, 4.326171875, 4.4990234375, 4.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 3.0, 10.0, 14.0, 4.0, 15.0, 13.0, 25.0, 40.0, 59.0, 97.0, 143.0, 184.0, 111.0, 69.0, 49.0, 43.0, 31.0, 14.0, 12.0, 14.0, 3.0, 5.0, 5.0, 11.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00080108642578125, -0.0007783696055412292, -0.0007556527853012085, -0.0007329359650611877, -0.000710219144821167, -0.0006875023245811462, -0.0006647855043411255, -0.0006420686841011047, -0.000619351863861084, -0.0005966350436210632, -0.0005739182233810425, -0.0005512014031410217, -0.000528484582901001, -0.0005057677626609802, -0.00048305094242095947, -0.0004603341221809387, -0.00043761730194091797, -0.0004149004817008972, -0.00039218366146087646, -0.0003694668412208557, -0.00034675002098083496, -0.0003240332007408142, -0.00030131638050079346, -0.0002785995602607727, -0.00025588274002075195, -0.0002331659197807312, -0.00021044909954071045, -0.0001877322793006897, -0.00016501545906066895, -0.0001422986388206482, -0.00011958181858062744, -9.686499834060669e-05, -7.414817810058594e-05, -5.1431357860565186e-05, -2.8714537620544434e-05, -5.997717380523682e-06, 1.671910285949707e-05, 3.943592309951782e-05, 6.215274333953857e-05, 8.486956357955933e-05, 0.00010758638381958008, 0.00013030320405960083, 0.00015302002429962158, 0.00017573684453964233, 0.00019845366477966309, 0.00022117048501968384, 0.0002438873052597046, 0.00026660412549972534, 0.0002893209457397461, 0.00031203776597976685, 0.0003347545862197876, 0.00035747140645980835, 0.0003801882266998291, 0.00040290504693984985, 0.0004256218671798706, 0.00044833868741989136, 0.0004710555076599121, 0.0004937723278999329, 0.0005164891481399536, 0.0005392059683799744, 0.0005619227886199951, 0.0005846396088600159, 0.0006073564291000366, 0.0006300732493400574, 0.0006527900695800781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 12.0, 9.0, 15.0, 34.0, 65.0, 112.0, 148.0, 268.0, 495.0, 948.0, 2083.0, 5288.0, 20155.0, 171669.0, 766134.0, 63127.0, 11299.0, 3522.0, 1484.0, 696.0, 400.0, 223.0, 138.0, 85.0, 44.0, 37.0, 19.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.46875, -3.34619140625, -3.2236328125, -3.10107421875, -2.978515625, -2.85595703125, -2.7333984375, -2.61083984375, -2.48828125, -2.36572265625, -2.2431640625, -2.12060546875, -1.998046875, -1.87548828125, -1.7529296875, -1.63037109375, -1.5078125, -1.38525390625, -1.2626953125, -1.14013671875, -1.017578125, -0.89501953125, -0.7724609375, -0.64990234375, -0.52734375, -0.40478515625, -0.2822265625, -0.15966796875, -0.037109375, 0.08544921875, 0.2080078125, 0.33056640625, 0.453125, 0.57568359375, 0.6982421875, 0.82080078125, 0.943359375, 1.06591796875, 1.1884765625, 1.31103515625, 1.43359375, 1.55615234375, 1.6787109375, 1.80126953125, 1.923828125, 2.04638671875, 2.1689453125, 2.29150390625, 2.4140625, 2.53662109375, 2.6591796875, 2.78173828125, 2.904296875, 3.02685546875, 3.1494140625, 3.27197265625, 3.39453125, 3.51708984375, 3.6396484375, 3.76220703125, 3.884765625, 4.00732421875, 4.1298828125, 4.25244140625, 4.375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 2.0, 13.0, 18.0, 15.0, 19.0, 27.0, 54.0, 75.0, 116.0, 127.0, 130.0, 105.0, 74.0, 55.0, 45.0, 23.0, 17.0, 9.0, 15.0, 10.0, 2.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.506744384765625, -2.41387939453125, -2.321014404296875, -2.2281494140625, -2.135284423828125, -2.04241943359375, -1.949554443359375, -1.856689453125, -1.763824462890625, -1.67095947265625, -1.578094482421875, -1.4852294921875, -1.392364501953125, -1.29949951171875, -1.206634521484375, -1.11376953125, -1.020904541015625, -0.92803955078125, -0.835174560546875, -0.7423095703125, -0.649444580078125, -0.55657958984375, -0.463714599609375, -0.370849609375, -0.277984619140625, -0.18511962890625, -0.092254638671875, 0.0006103515625, 0.093475341796875, 0.18634033203125, 0.279205322265625, 0.3720703125, 0.464935302734375, 0.55780029296875, 0.650665283203125, 0.7435302734375, 0.836395263671875, 0.92926025390625, 1.022125244140625, 1.114990234375, 1.207855224609375, 1.30072021484375, 1.393585205078125, 1.4864501953125, 1.579315185546875, 1.67218017578125, 1.765045166015625, 1.85791015625, 1.950775146484375, 2.04364013671875, 2.136505126953125, 2.2293701171875, 2.322235107421875, 2.41510009765625, 2.507965087890625, 2.600830078125, 2.693695068359375, 2.78656005859375, 2.879425048828125, 2.9722900390625, 3.065155029296875, 3.15802001953125, 3.250885009765625, 3.34375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 38.0, 87.0, 217.0, 337.0, 196.0, 53.0, 25.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.62693786621094, -117.05058288574219, -114.47422790527344, -111.89787292480469, -109.32151794433594, -106.74517059326172, -104.16881561279297, -101.59246063232422, -99.01610565185547, -96.43975067138672, -93.86339569091797, -91.28704071044922, -88.710693359375, -86.13433837890625, -83.5579833984375, -80.98162841796875, -78.4052734375, -75.82891845703125, -73.2525634765625, -70.67620849609375, -68.099853515625, -65.52350616455078, -62.94715118408203, -60.37079620361328, -57.79444122314453, -55.21808624267578, -52.64173126220703, -50.06538009643555, -47.4890251159668, -44.91267013549805, -42.33631896972656, -39.75996398925781, -37.183616638183594, -34.607261657714844, -32.030906677246094, -29.45455551147461, -26.87820053100586, -24.30184555053711, -21.725492477416992, -19.149139404296875, -16.572784423828125, -13.996430397033691, -11.420076370239258, -8.843722343444824, -6.267368316650391, -3.691014289855957, -1.1146602630615234, 1.4616928100585938, 4.038047790527344, 6.614401817321777, 9.190755844116211, 11.767109870910645, 14.343463897705078, 16.919818878173828, 19.496171951293945, 22.072525024414062, 24.648880004882812, 27.225234985351562, 29.80158805847168, 32.3779411315918, 34.95429611206055, 37.5306510925293, 40.10700225830078, 42.68335723876953, 45.25971221923828]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 9.0, 20.0, 21.0, 18.0, 24.0, 19.0, 20.0, 27.0, 28.0, 35.0, 38.0, 55.0, 44.0, 55.0, 68.0, 45.0, 52.0, 38.0, 42.0, 36.0, 36.0, 32.0, 27.0, 21.0, 27.0, 24.0, 18.0, 24.0, 16.0, 7.0, 15.0, 5.0, 9.0, 6.0, 6.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.12070083618164, -24.28488540649414, -23.449068069458008, -22.613252639770508, -21.777437210083008, -20.941619873046875, -20.105804443359375, -19.269989013671875, -18.434173583984375, -17.598358154296875, -16.762540817260742, -15.926725387573242, -15.090909957885742, -14.255093574523926, -13.41927719116211, -12.58346176147461, -11.747644424438477, -10.91182804107666, -10.07601261138916, -9.240196228027344, -8.404380798339844, -7.568564414978027, -6.732748031616211, -5.896932125091553, -5.0611162185668945, -4.225300312042236, -3.389484167098999, -2.5536680221557617, -1.7178521156311035, -0.8820362091064453, -0.046219825744628906, 0.7895960807800293, 1.6254119873046875, 2.4612278938293457, 3.297044038772583, 4.13286018371582, 4.9686760902404785, 5.804491996765137, 6.640308380126953, 7.476124286651611, 8.31194019317627, 9.147756576538086, 9.983572006225586, 10.819388389587402, 11.655204772949219, 12.491020202636719, 13.326836585998535, 14.162652969360352, 14.998468399047852, 15.834284782409668, 16.670101165771484, 17.505916595458984, 18.341732025146484, 19.177547454833984, 20.013364791870117, 20.849180221557617, 21.68499755859375, 22.52081298828125, 23.356630325317383, 24.192445755004883, 25.028261184692383, 25.864078521728516, 26.699893951416016, 27.535709381103516, 28.371524810791016]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 11.0, 12.0, 16.0, 17.0, 51.0, 83.0, 97.0, 175.0, 303.0, 536.0, 938.0, 1821.0, 3442.0, 7060.0, 16181.0, 39772.0, 121458.0, 586430.0, 2406296.0, 776869.0, 150948.0, 47334.0, 18301.0, 8101.0, 3846.0, 1836.0, 985.0, 560.0, 300.0, 191.0, 100.0, 71.0, 40.0, 27.0, 23.0, 15.0, 8.0, 12.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.90374755859375, -2.8172607421875, -2.73077392578125, -2.644287109375, -2.55780029296875, -2.4713134765625, -2.38482666015625, -2.29833984375, -2.21185302734375, -2.1253662109375, -2.03887939453125, -1.952392578125, -1.86590576171875, -1.7794189453125, -1.69293212890625, -1.6064453125, -1.51995849609375, -1.4334716796875, -1.34698486328125, -1.260498046875, -1.17401123046875, -1.0875244140625, -1.00103759765625, -0.91455078125, -0.82806396484375, -0.7415771484375, -0.65509033203125, -0.568603515625, -0.48211669921875, -0.3956298828125, -0.30914306640625, -0.22265625, -0.13616943359375, -0.0496826171875, 0.03680419921875, 0.123291015625, 0.20977783203125, 0.2962646484375, 0.38275146484375, 0.46923828125, 0.55572509765625, 0.6422119140625, 0.72869873046875, 0.815185546875, 0.90167236328125, 0.9881591796875, 1.07464599609375, 1.1611328125, 1.24761962890625, 1.3341064453125, 1.42059326171875, 1.507080078125, 1.59356689453125, 1.6800537109375, 1.76654052734375, 1.85302734375, 1.93951416015625, 2.0260009765625, 2.11248779296875, 2.198974609375, 2.28546142578125, 2.3719482421875, 2.45843505859375, 2.544921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 10.0, 7.0, 9.0, 18.0, 25.0, 20.0, 25.0, 27.0, 32.0, 25.0, 53.0, 39.0, 42.0, 36.0, 52.0, 52.0, 54.0, 48.0, 37.0, 45.0, 32.0, 35.0, 38.0, 36.0, 30.0, 37.0, 25.0, 19.0, 20.0, 10.0, 11.0, 16.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.8515625, -1.8030242919921875, -1.754486083984375, -1.7059478759765625, -1.65740966796875, -1.6088714599609375, -1.560333251953125, -1.5117950439453125, -1.4632568359375, -1.4147186279296875, -1.366180419921875, -1.3176422119140625, -1.26910400390625, -1.2205657958984375, -1.172027587890625, -1.1234893798828125, -1.074951171875, -1.0264129638671875, -0.977874755859375, -0.9293365478515625, -0.88079833984375, -0.8322601318359375, -0.783721923828125, -0.7351837158203125, -0.6866455078125, -0.6381072998046875, -0.589569091796875, -0.5410308837890625, -0.49249267578125, -0.4439544677734375, -0.395416259765625, -0.3468780517578125, -0.29833984375, -0.2498016357421875, -0.201263427734375, -0.1527252197265625, -0.10418701171875, -0.0556488037109375, -0.007110595703125, 0.0414276123046875, 0.0899658203125, 0.1385040283203125, 0.187042236328125, 0.2355804443359375, 0.28411865234375, 0.3326568603515625, 0.381195068359375, 0.4297332763671875, 0.478271484375, 0.5268096923828125, 0.575347900390625, 0.6238861083984375, 0.67242431640625, 0.7209625244140625, 0.769500732421875, 0.8180389404296875, 0.8665771484375, 0.9151153564453125, 0.963653564453125, 1.0121917724609375, 1.06072998046875, 1.1092681884765625, 1.157806396484375, 1.2063446044921875, 1.2548828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 12.0, 26.0, 30.0, 45.0, 83.0, 151.0, 248.0, 551.0, 973.0, 2423.0, 7166.0, 25878.0, 128970.0, 1794426.0, 2038948.0, 149610.0, 30764.0, 8512.0, 2908.0, 1212.0, 602.0, 294.0, 175.0, 95.0, 56.0, 31.0, 21.0, 20.0, 13.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.84100341796875, -4.6741943359375, -4.50738525390625, -4.340576171875, -4.17376708984375, -4.0069580078125, -3.84014892578125, -3.67333984375, -3.50653076171875, -3.3397216796875, -3.17291259765625, -3.006103515625, -2.83929443359375, -2.6724853515625, -2.50567626953125, -2.3388671875, -2.17205810546875, -2.0052490234375, -1.83843994140625, -1.671630859375, -1.50482177734375, -1.3380126953125, -1.17120361328125, -1.00439453125, -0.83758544921875, -0.6707763671875, -0.50396728515625, -0.337158203125, -0.17034912109375, -0.0035400390625, 0.16326904296875, 0.330078125, 0.49688720703125, 0.6636962890625, 0.83050537109375, 0.997314453125, 1.16412353515625, 1.3309326171875, 1.49774169921875, 1.66455078125, 1.83135986328125, 1.9981689453125, 2.16497802734375, 2.331787109375, 2.49859619140625, 2.6654052734375, 2.83221435546875, 2.9990234375, 3.16583251953125, 3.3326416015625, 3.49945068359375, 3.666259765625, 3.83306884765625, 3.9998779296875, 4.16668701171875, 4.33349609375, 4.50030517578125, 4.6671142578125, 4.83392333984375, 5.000732421875, 5.16754150390625, 5.3343505859375, 5.50115966796875, 5.66796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 15.0, 11.0, 21.0, 34.0, 42.0, 64.0, 92.0, 123.0, 223.0, 362.0, 677.0, 800.0, 530.0, 331.0, 218.0, 133.0, 101.0, 65.0, 57.0, 41.0, 18.0, 26.0, 13.0, 15.0, 7.0, 8.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.34765625, -6.17340087890625, -5.9991455078125, -5.82489013671875, -5.650634765625, -5.47637939453125, -5.3021240234375, -5.12786865234375, -4.95361328125, -4.77935791015625, -4.6051025390625, -4.43084716796875, -4.256591796875, -4.08233642578125, -3.9080810546875, -3.73382568359375, -3.5595703125, -3.38531494140625, -3.2110595703125, -3.03680419921875, -2.862548828125, -2.68829345703125, -2.5140380859375, -2.33978271484375, -2.16552734375, -1.99127197265625, -1.8170166015625, -1.64276123046875, -1.468505859375, -1.29425048828125, -1.1199951171875, -0.94573974609375, -0.771484375, -0.59722900390625, -0.4229736328125, -0.24871826171875, -0.074462890625, 0.09979248046875, 0.2740478515625, 0.44830322265625, 0.62255859375, 0.79681396484375, 0.9710693359375, 1.14532470703125, 1.319580078125, 1.49383544921875, 1.6680908203125, 1.84234619140625, 2.0166015625, 2.19085693359375, 2.3651123046875, 2.53936767578125, 2.713623046875, 2.88787841796875, 3.0621337890625, 3.23638916015625, 3.41064453125, 3.58489990234375, 3.7591552734375, 3.93341064453125, 4.107666015625, 4.28192138671875, 4.4561767578125, 4.63043212890625, 4.8046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 21.0, 45.0, 68.0, 123.0, 211.0, 190.0, 118.0, 95.0, 39.0, 27.0, 13.0, 5.0, 10.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.571048736572266, -44.5204963684082, -42.469940185546875, -40.41938781738281, -38.36883544921875, -36.31828308105469, -34.267730712890625, -32.2171745300293, -30.166622161865234, -28.116069793701172, -26.065515518188477, -24.01496124267578, -21.96440887451172, -19.913856506347656, -17.86330223083496, -15.812748908996582, -13.762195587158203, -11.711642265319824, -9.661088943481445, -7.610535621643066, -5.5599822998046875, -3.5094289779663086, -1.4588756561279297, 0.5916776657104492, 2.642230987548828, 4.692784309387207, 6.743337631225586, 8.793890953063965, 10.844444274902344, 12.894997596740723, 14.945550918579102, 16.996105194091797, 19.046661376953125, 21.097213745117188, 23.147768020629883, 25.198322296142578, 27.24887466430664, 29.299427032470703, 31.3499813079834, 33.400535583496094, 35.451087951660156, 37.50164031982422, 39.55219268798828, 41.60274887084961, 43.65330123901367, 45.703853607177734, 47.75440979003906, 49.804962158203125, 51.85551452636719, 53.90606689453125, 55.95661926269531, 58.00717544555664, 60.0577278137207, 62.108280181884766, 64.1588363647461, 66.20938873291016, 68.25994110107422, 70.31049346923828, 72.36104583740234, 74.4115982055664, 76.462158203125, 78.51271057128906, 80.56326293945312, 82.61381530761719, 84.66436767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 8.0, 16.0, 17.0, 19.0, 17.0, 21.0, 25.0, 32.0, 33.0, 41.0, 32.0, 43.0, 36.0, 49.0, 49.0, 53.0, 43.0, 40.0, 43.0, 45.0, 44.0, 45.0, 29.0, 26.0, 31.0, 27.0, 19.0, 18.0, 16.0, 7.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.193378448486328, -29.28727149963379, -28.381162643432617, -27.475055694580078, -26.568946838378906, -25.662839889526367, -24.756732940673828, -23.850624084472656, -22.944517135620117, -22.038410186767578, -21.132301330566406, -20.226194381713867, -19.320087432861328, -18.413978576660156, -17.507871627807617, -16.601764678955078, -15.695655822753906, -14.78954792022705, -13.883440017700195, -12.977333068847656, -12.0712251663208, -11.165117263793945, -10.259010314941406, -9.35290241241455, -8.446794509887695, -7.54068660736084, -6.634579181671143, -5.728471755981445, -4.82236385345459, -3.9162559509277344, -3.010148525238037, -2.10404109954834, -1.1979351043701172, -0.2918274402618408, 0.6142802238464355, 1.520387887954712, 2.4264955520629883, 3.3326034545898438, 4.238710880279541, 5.144818305969238, 6.050926208496094, 6.957034111022949, 7.8631415367126465, 8.769248962402344, 9.6753568649292, 10.581464767456055, 11.487571716308594, 12.39367961883545, 13.299787521362305, 14.20589542388916, 15.112003326416016, 16.018110275268555, 16.924217224121094, 17.830326080322266, 18.736433029174805, 19.642539978027344, 20.548648834228516, 21.454755783081055, 22.360864639282227, 23.266971588134766, 24.173080444335938, 25.079187393188477, 25.985294342041016, 26.891403198242188, 27.797510147094727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 14.0, 19.0, 36.0, 46.0, 113.0, 191.0, 495.0, 1221.0, 2994.0, 9012.0, 31260.0, 130595.0, 602408.0, 206221.0, 44887.0, 12426.0, 4033.0, 1409.0, 599.0, 275.0, 131.0, 76.0, 32.0, 20.0, 19.0, 9.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.9344482421875, -6.728271484375, -6.5220947265625, -6.31591796875, -6.1097412109375, -5.903564453125, -5.6973876953125, -5.4912109375, -5.2850341796875, -5.078857421875, -4.8726806640625, -4.66650390625, -4.4603271484375, -4.254150390625, -4.0479736328125, -3.841796875, -3.6356201171875, -3.429443359375, -3.2232666015625, -3.01708984375, -2.8109130859375, -2.604736328125, -2.3985595703125, -2.1923828125, -1.9862060546875, -1.780029296875, -1.5738525390625, -1.36767578125, -1.1614990234375, -0.955322265625, -0.7491455078125, -0.54296875, -0.3367919921875, -0.130615234375, 0.0755615234375, 0.28173828125, 0.4879150390625, 0.694091796875, 0.9002685546875, 1.1064453125, 1.3126220703125, 1.518798828125, 1.7249755859375, 1.93115234375, 2.1373291015625, 2.343505859375, 2.5496826171875, 2.755859375, 2.9620361328125, 3.168212890625, 3.3743896484375, 3.58056640625, 3.7867431640625, 3.992919921875, 4.1990966796875, 4.4052734375, 4.6114501953125, 4.817626953125, 5.0238037109375, 5.22998046875, 5.4361572265625, 5.642333984375, 5.8485107421875, 6.0546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 11.0, 19.0, 28.0, 19.0, 35.0, 39.0, 42.0, 35.0, 45.0, 46.0, 61.0, 64.0, 64.0, 67.0, 57.0, 53.0, 48.0, 41.0, 39.0, 37.0, 29.0, 28.0, 24.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 0.0, 1.0, 3.0], "bins": [-2.98828125, -2.9210205078125, -2.853759765625, -2.7864990234375, -2.71923828125, -2.6519775390625, -2.584716796875, -2.5174560546875, -2.4501953125, -2.3829345703125, -2.315673828125, -2.2484130859375, -2.18115234375, -2.1138916015625, -2.046630859375, -1.9793701171875, -1.912109375, -1.8448486328125, -1.777587890625, -1.7103271484375, -1.64306640625, -1.5758056640625, -1.508544921875, -1.4412841796875, -1.3740234375, -1.3067626953125, -1.239501953125, -1.1722412109375, -1.10498046875, -1.0377197265625, -0.970458984375, -0.9031982421875, -0.8359375, -0.7686767578125, -0.701416015625, -0.6341552734375, -0.56689453125, -0.4996337890625, -0.432373046875, -0.3651123046875, -0.2978515625, -0.2305908203125, -0.163330078125, -0.0960693359375, -0.02880859375, 0.0384521484375, 0.105712890625, 0.1729736328125, 0.240234375, 0.3074951171875, 0.374755859375, 0.4420166015625, 0.50927734375, 0.5765380859375, 0.643798828125, 0.7110595703125, 0.7783203125, 0.8455810546875, 0.912841796875, 0.9801025390625, 1.04736328125, 1.1146240234375, 1.181884765625, 1.2491455078125, 1.31640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 20.0, 20.0, 33.0, 61.0, 80.0, 136.0, 229.0, 348.0, 599.0, 1126.0, 2498.0, 6922.0, 33266.0, 647087.0, 319965.0, 25523.0, 5806.0, 2264.0, 1029.0, 576.0, 326.0, 224.0, 123.0, 70.0, 65.0, 37.0, 24.0, 10.0, 12.0, 9.0, 4.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0546875, -10.718994140625, -10.38330078125, -10.047607421875, -9.7119140625, -9.376220703125, -9.04052734375, -8.704833984375, -8.369140625, -8.033447265625, -7.69775390625, -7.362060546875, -7.0263671875, -6.690673828125, -6.35498046875, -6.019287109375, -5.68359375, -5.347900390625, -5.01220703125, -4.676513671875, -4.3408203125, -4.005126953125, -3.66943359375, -3.333740234375, -2.998046875, -2.662353515625, -2.32666015625, -1.990966796875, -1.6552734375, -1.319580078125, -0.98388671875, -0.648193359375, -0.3125, 0.023193359375, 0.35888671875, 0.694580078125, 1.0302734375, 1.365966796875, 1.70166015625, 2.037353515625, 2.373046875, 2.708740234375, 3.04443359375, 3.380126953125, 3.7158203125, 4.051513671875, 4.38720703125, 4.722900390625, 5.05859375, 5.394287109375, 5.72998046875, 6.065673828125, 6.4013671875, 6.737060546875, 7.07275390625, 7.408447265625, 7.744140625, 8.079833984375, 8.41552734375, 8.751220703125, 9.0869140625, 9.422607421875, 9.75830078125, 10.093994140625, 10.4296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 15.0, 24.0, 21.0, 21.0, 26.0, 30.0, 38.0, 40.0, 30.0, 35.0, 62.0, 42.0, 51.0, 51.0, 48.0, 57.0, 36.0, 36.0, 36.0, 38.0, 38.0, 41.0, 27.0, 15.0, 20.0, 12.0, 16.0, 8.0, 11.0, 6.0, 6.0, 8.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.078125, -7.8057861328125, -7.533447265625, -7.2611083984375, -6.98876953125, -6.7164306640625, -6.444091796875, -6.1717529296875, -5.8994140625, -5.6270751953125, -5.354736328125, -5.0823974609375, -4.81005859375, -4.5377197265625, -4.265380859375, -3.9930419921875, -3.720703125, -3.4483642578125, -3.176025390625, -2.9036865234375, -2.63134765625, -2.3590087890625, -2.086669921875, -1.8143310546875, -1.5419921875, -1.2696533203125, -0.997314453125, -0.7249755859375, -0.45263671875, -0.1802978515625, 0.092041015625, 0.3643798828125, 0.63671875, 0.9090576171875, 1.181396484375, 1.4537353515625, 1.72607421875, 1.9984130859375, 2.270751953125, 2.5430908203125, 2.8154296875, 3.0877685546875, 3.360107421875, 3.6324462890625, 3.90478515625, 4.1771240234375, 4.449462890625, 4.7218017578125, 4.994140625, 5.2664794921875, 5.538818359375, 5.8111572265625, 6.08349609375, 6.3558349609375, 6.628173828125, 6.9005126953125, 7.1728515625, 7.4451904296875, 7.717529296875, 7.9898681640625, 8.26220703125, 8.5345458984375, 8.806884765625, 9.0792236328125, 9.3515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 12.0, 14.0, 11.0, 25.0, 40.0, 51.0, 81.0, 112.0, 176.0, 293.0, 472.0, 808.0, 1557.0, 2923.0, 6744.0, 17495.0, 53191.0, 243205.0, 599157.0, 80909.0, 24213.0, 8792.0, 3836.0, 1877.0, 989.0, 567.0, 324.0, 220.0, 136.0, 95.0, 69.0, 40.0, 26.0, 22.0, 14.0, 5.0, 6.0, 10.0, 9.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.693878173828125, -2.60455322265625, -2.515228271484375, -2.4259033203125, -2.336578369140625, -2.24725341796875, -2.157928466796875, -2.068603515625, -1.979278564453125, -1.88995361328125, -1.800628662109375, -1.7113037109375, -1.621978759765625, -1.53265380859375, -1.443328857421875, -1.35400390625, -1.264678955078125, -1.17535400390625, -1.086029052734375, -0.9967041015625, -0.907379150390625, -0.81805419921875, -0.728729248046875, -0.639404296875, -0.550079345703125, -0.46075439453125, -0.371429443359375, -0.2821044921875, -0.192779541015625, -0.10345458984375, -0.014129638671875, 0.0751953125, 0.164520263671875, 0.25384521484375, 0.343170166015625, 0.4324951171875, 0.521820068359375, 0.61114501953125, 0.700469970703125, 0.789794921875, 0.879119873046875, 0.96844482421875, 1.057769775390625, 1.1470947265625, 1.236419677734375, 1.32574462890625, 1.415069580078125, 1.50439453125, 1.593719482421875, 1.68304443359375, 1.772369384765625, 1.8616943359375, 1.951019287109375, 2.04034423828125, 2.129669189453125, 2.218994140625, 2.308319091796875, 2.39764404296875, 2.486968994140625, 2.5762939453125, 2.665618896484375, 2.75494384765625, 2.844268798828125, 2.93359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 9.0, 7.0, 16.0, 17.0, 15.0, 26.0, 29.0, 44.0, 58.0, 84.0, 212.0, 145.0, 80.0, 57.0, 35.0, 33.0, 27.0, 19.0, 16.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00118255615234375, -0.001147627830505371, -0.0011126995086669922, -0.0010777711868286133, -0.0010428428649902344, -0.0010079145431518555, -0.0009729862213134766, -0.0009380578994750977, -0.0009031295776367188, -0.0008682012557983398, -0.0008332729339599609, -0.000798344612121582, -0.0007634162902832031, -0.0007284879684448242, -0.0006935596466064453, -0.0006586313247680664, -0.0006237030029296875, -0.0005887746810913086, -0.0005538463592529297, -0.0005189180374145508, -0.0004839897155761719, -0.00044906139373779297, -0.00041413307189941406, -0.00037920475006103516, -0.00034427642822265625, -0.00030934810638427734, -0.00027441978454589844, -0.00023949146270751953, -0.00020456314086914062, -0.00016963481903076172, -0.0001347064971923828, -9.97781753540039e-05, -6.4849853515625e-05, -2.9921531677246094e-05, 5.0067901611328125e-06, 3.993511199951172e-05, 7.486343383789062e-05, 0.00010979175567626953, 0.00014472007751464844, 0.00017964839935302734, 0.00021457672119140625, 0.00024950504302978516, 0.00028443336486816406, 0.00031936168670654297, 0.0003542900085449219, 0.0003892183303833008, 0.0004241466522216797, 0.0004590749740600586, 0.0004940032958984375, 0.0005289316177368164, 0.0005638599395751953, 0.0005987882614135742, 0.0006337165832519531, 0.000668644905090332, 0.0007035732269287109, 0.0007385015487670898, 0.0007734298706054688, 0.0008083581924438477, 0.0008432865142822266, 0.0008782148361206055, 0.0009131431579589844, 0.0009480714797973633, 0.0009829998016357422, 0.001017928123474121, 0.0010528564453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 17.0, 23.0, 39.0, 47.0, 63.0, 125.0, 178.0, 321.0, 570.0, 1039.0, 2117.0, 5057.0, 15002.0, 62453.0, 599093.0, 297054.0, 45394.0, 11795.0, 4085.0, 1864.0, 931.0, 488.0, 279.0, 156.0, 113.0, 78.0, 43.0, 29.0, 17.0, 9.0, 17.0, 12.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.928253173828125, -2.82330322265625, -2.718353271484375, -2.6134033203125, -2.508453369140625, -2.40350341796875, -2.298553466796875, -2.193603515625, -2.088653564453125, -1.98370361328125, -1.878753662109375, -1.7738037109375, -1.668853759765625, -1.56390380859375, -1.458953857421875, -1.35400390625, -1.249053955078125, -1.14410400390625, -1.039154052734375, -0.9342041015625, -0.829254150390625, -0.72430419921875, -0.619354248046875, -0.514404296875, -0.409454345703125, -0.30450439453125, -0.199554443359375, -0.0946044921875, 0.010345458984375, 0.11529541015625, 0.220245361328125, 0.3251953125, 0.430145263671875, 0.53509521484375, 0.640045166015625, 0.7449951171875, 0.849945068359375, 0.95489501953125, 1.059844970703125, 1.164794921875, 1.269744873046875, 1.37469482421875, 1.479644775390625, 1.5845947265625, 1.689544677734375, 1.79449462890625, 1.899444580078125, 2.00439453125, 2.109344482421875, 2.21429443359375, 2.319244384765625, 2.4241943359375, 2.529144287109375, 2.63409423828125, 2.739044189453125, 2.843994140625, 2.948944091796875, 3.05389404296875, 3.158843994140625, 3.2637939453125, 3.368743896484375, 3.47369384765625, 3.578643798828125, 3.68359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 4.0, 4.0, 14.0, 8.0, 12.0, 18.0, 16.0, 18.0, 36.0, 28.0, 20.0, 38.0, 34.0, 58.0, 53.0, 75.0, 68.0, 79.0, 62.0, 50.0, 40.0, 29.0, 24.0, 26.0, 19.0, 19.0, 15.0, 12.0, 16.0, 14.0, 13.0, 11.0, 3.0, 7.0, 6.0, 5.0, 7.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.248046875, -2.178863525390625, -2.10968017578125, -2.040496826171875, -1.9713134765625, -1.902130126953125, -1.83294677734375, -1.763763427734375, -1.694580078125, -1.625396728515625, -1.55621337890625, -1.487030029296875, -1.4178466796875, -1.348663330078125, -1.27947998046875, -1.210296630859375, -1.14111328125, -1.071929931640625, -1.00274658203125, -0.933563232421875, -0.8643798828125, -0.795196533203125, -0.72601318359375, -0.656829833984375, -0.587646484375, -0.518463134765625, -0.44927978515625, -0.380096435546875, -0.3109130859375, -0.241729736328125, -0.17254638671875, -0.103363037109375, -0.0341796875, 0.035003662109375, 0.10418701171875, 0.173370361328125, 0.2425537109375, 0.311737060546875, 0.38092041015625, 0.450103759765625, 0.519287109375, 0.588470458984375, 0.65765380859375, 0.726837158203125, 0.7960205078125, 0.865203857421875, 0.93438720703125, 1.003570556640625, 1.07275390625, 1.141937255859375, 1.21112060546875, 1.280303955078125, 1.3494873046875, 1.418670654296875, 1.48785400390625, 1.557037353515625, 1.626220703125, 1.695404052734375, 1.76458740234375, 1.833770751953125, 1.9029541015625, 1.972137451171875, 2.04132080078125, 2.110504150390625, 2.1796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 9.0, 15.0, 49.0, 114.0, 217.0, 304.0, 157.0, 75.0, 17.0, 15.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-75.54513549804688, -72.65704345703125, -69.7689437866211, -66.88085174560547, -63.99275207519531, -61.10465621948242, -58.21656036376953, -55.328468322753906, -52.44036865234375, -49.55227279663086, -46.66417694091797, -43.77608108520508, -40.88798522949219, -37.9998893737793, -35.111793518066406, -32.22370147705078, -29.33560562133789, -26.447509765625, -23.55941390991211, -20.67131805419922, -17.783222198486328, -14.895127296447754, -12.00703239440918, -9.118936538696289, -6.230840682983398, -3.342745065689087, -0.4546494483947754, 2.433445930480957, 5.321541786193848, 8.209637641906738, 11.097732543945312, 13.985828399658203, 16.873924255371094, 19.762020111083984, 22.650115966796875, 25.538211822509766, 28.426307678222656, 31.314403533935547, 34.20249938964844, 37.09059143066406, 39.97869110107422, 42.86678695678711, 45.7548828125, 48.64297866821289, 51.53107452392578, 54.41917037963867, 57.30726623535156, 60.19535827636719, 63.08345413208008, 65.97154998779297, 68.8596420288086, 71.74774169921875, 74.63583374023438, 77.52393341064453, 80.41202545166016, 83.30012512207031, 86.18821716308594, 89.07630920410156, 91.96440887451172, 94.85250091552734, 97.7406005859375, 100.62869262695312, 103.51679229736328, 106.4048843383789, 109.29298400878906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 8.0, 9.0, 9.0, 11.0, 6.0, 15.0, 17.0, 18.0, 27.0, 29.0, 27.0, 34.0, 24.0, 29.0, 33.0, 48.0, 46.0, 48.0, 65.0, 42.0, 46.0, 38.0, 36.0, 45.0, 12.0, 29.0, 23.0, 32.0, 17.0, 22.0, 15.0, 15.0, 16.0, 21.0, 8.0, 9.0, 12.0, 5.0, 6.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.49323081970215, -22.629426956176758, -21.765621185302734, -20.901817321777344, -20.038013458251953, -19.17420768737793, -18.31040382385254, -17.446598052978516, -16.582794189453125, -15.718989372253418, -14.855184555053711, -13.99138069152832, -13.127575874328613, -12.263771057128906, -11.399967193603516, -10.536162376403809, -9.672357559204102, -8.808552742004395, -7.944748401641846, -7.080944061279297, -6.21713924407959, -5.353334426879883, -4.489530086517334, -3.625725746154785, -2.761920928955078, -1.8981163501739502, -1.0343117713928223, -0.17050719261169434, 0.6932973861694336, 1.5571022033691406, 2.4209065437316895, 3.2847108840942383, 4.148517608642578, 5.012322425842285, 5.876126766204834, 6.739931106567383, 7.60373592376709, 8.467540740966797, 9.331344604492188, 10.195149421691895, 11.058954238891602, 11.922759056091309, 12.786563873291016, 13.650367736816406, 14.514172554016113, 15.37797737121582, 16.24178123474121, 17.105587005615234, 17.969390869140625, 18.833194732666016, 19.69700050354004, 20.56080436706543, 21.424610137939453, 22.288414001464844, 23.152217864990234, 24.016021728515625, 24.87982749938965, 25.74363136291504, 26.607437133789062, 27.471240997314453, 28.335044860839844, 29.198850631713867, 30.062654495239258, 30.92646026611328, 31.790264129638672]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 9.0, 19.0, 25.0, 33.0, 40.0, 55.0, 78.0, 105.0, 184.0, 301.0, 450.0, 740.0, 1422.0, 2520.0, 5222.0, 11600.0, 29860.0, 99581.0, 577906.0, 2602619.0, 688151.0, 115385.0, 33306.0, 12867.0, 5518.0, 2714.0, 1467.0, 764.0, 447.0, 271.0, 200.0, 127.0, 81.0, 52.0, 36.0, 23.0, 20.0, 14.0, 13.0, 10.0, 1.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.86328125, -2.76953125, -2.67578125, -2.58203125, -2.48828125, -2.39453125, -2.30078125, -2.20703125, -2.11328125, -2.01953125, -1.92578125, -1.83203125, -1.73828125, -1.64453125, -1.55078125, -1.45703125, -1.36328125, -1.26953125, -1.17578125, -1.08203125, -0.98828125, -0.89453125, -0.80078125, -0.70703125, -0.61328125, -0.51953125, -0.42578125, -0.33203125, -0.23828125, -0.14453125, -0.05078125, 0.04296875, 0.13671875, 0.23046875, 0.32421875, 0.41796875, 0.51171875, 0.60546875, 0.69921875, 0.79296875, 0.88671875, 0.98046875, 1.07421875, 1.16796875, 1.26171875, 1.35546875, 1.44921875, 1.54296875, 1.63671875, 1.73046875, 1.82421875, 1.91796875, 2.01171875, 2.10546875, 2.19921875, 2.29296875, 2.38671875, 2.48046875, 2.57421875, 2.66796875, 2.76171875, 2.85546875, 2.94921875, 3.04296875, 3.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 2.0, 7.0, 10.0, 9.0, 8.0, 15.0, 17.0, 17.0, 32.0, 34.0, 35.0, 36.0, 41.0, 55.0, 50.0, 65.0, 59.0, 59.0, 71.0, 46.0, 41.0, 53.0, 38.0, 46.0, 33.0, 28.0, 28.0, 18.0, 18.0, 12.0, 7.0, 8.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.865234375, -2.7971343994140625, -2.729034423828125, -2.6609344482421875, -2.59283447265625, -2.5247344970703125, -2.456634521484375, -2.3885345458984375, -2.3204345703125, -2.2523345947265625, -2.184234619140625, -2.1161346435546875, -2.04803466796875, -1.9799346923828125, -1.911834716796875, -1.8437347412109375, -1.775634765625, -1.7075347900390625, -1.639434814453125, -1.5713348388671875, -1.50323486328125, -1.4351348876953125, -1.367034912109375, -1.2989349365234375, -1.2308349609375, -1.1627349853515625, -1.094635009765625, -1.0265350341796875, -0.95843505859375, -0.8903350830078125, -0.822235107421875, -0.7541351318359375, -0.68603515625, -0.6179351806640625, -0.549835205078125, -0.4817352294921875, -0.41363525390625, -0.3455352783203125, -0.277435302734375, -0.2093353271484375, -0.1412353515625, -0.0731353759765625, -0.005035400390625, 0.0630645751953125, 0.13116455078125, 0.1992645263671875, 0.267364501953125, 0.3354644775390625, 0.403564453125, 0.4716644287109375, 0.539764404296875, 0.6078643798828125, 0.67596435546875, 0.7440643310546875, 0.812164306640625, 0.8802642822265625, 0.9483642578125, 1.0164642333984375, 1.084564208984375, 1.1526641845703125, 1.22076416015625, 1.2888641357421875, 1.356964111328125, 1.4250640869140625, 1.4931640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 11.0, 9.0, 27.0, 45.0, 65.0, 137.0, 330.0, 825.0, 2479.0, 9527.0, 55307.0, 773655.0, 3185266.0, 140944.0, 18764.0, 4325.0, 1382.0, 591.0, 258.0, 145.0, 72.0, 40.0, 28.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.72650146484375, -4.5037841796875, -4.28106689453125, -4.058349609375, -3.83563232421875, -3.6129150390625, -3.39019775390625, -3.16748046875, -2.94476318359375, -2.7220458984375, -2.49932861328125, -2.276611328125, -2.05389404296875, -1.8311767578125, -1.60845947265625, -1.3857421875, -1.16302490234375, -0.9403076171875, -0.71759033203125, -0.494873046875, -0.27215576171875, -0.0494384765625, 0.17327880859375, 0.39599609375, 0.61871337890625, 0.8414306640625, 1.06414794921875, 1.286865234375, 1.50958251953125, 1.7322998046875, 1.95501708984375, 2.177734375, 2.40045166015625, 2.6231689453125, 2.84588623046875, 3.068603515625, 3.29132080078125, 3.5140380859375, 3.73675537109375, 3.95947265625, 4.18218994140625, 4.4049072265625, 4.62762451171875, 4.850341796875, 5.07305908203125, 5.2957763671875, 5.51849365234375, 5.7412109375, 5.96392822265625, 6.1866455078125, 6.40936279296875, 6.632080078125, 6.85479736328125, 7.0775146484375, 7.30023193359375, 7.52294921875, 7.74566650390625, 7.9683837890625, 8.19110107421875, 8.413818359375, 8.63653564453125, 8.8592529296875, 9.08197021484375, 9.3046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 7.0, 4.0, 15.0, 8.0, 36.0, 41.0, 57.0, 84.0, 115.0, 201.0, 368.0, 667.0, 948.0, 652.0, 316.0, 203.0, 107.0, 73.0, 54.0, 24.0, 30.0, 19.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.2088623046875, -4.995849609375, -4.7828369140625, -4.56982421875, -4.3568115234375, -4.143798828125, -3.9307861328125, -3.7177734375, -3.5047607421875, -3.291748046875, -3.0787353515625, -2.86572265625, -2.6527099609375, -2.439697265625, -2.2266845703125, -2.013671875, -1.8006591796875, -1.587646484375, -1.3746337890625, -1.16162109375, -0.9486083984375, -0.735595703125, -0.5225830078125, -0.3095703125, -0.0965576171875, 0.116455078125, 0.3294677734375, 0.54248046875, 0.7554931640625, 0.968505859375, 1.1815185546875, 1.39453125, 1.6075439453125, 1.820556640625, 2.0335693359375, 2.24658203125, 2.4595947265625, 2.672607421875, 2.8856201171875, 3.0986328125, 3.3116455078125, 3.524658203125, 3.7376708984375, 3.95068359375, 4.1636962890625, 4.376708984375, 4.5897216796875, 4.802734375, 5.0157470703125, 5.228759765625, 5.4417724609375, 5.65478515625, 5.8677978515625, 6.080810546875, 6.2938232421875, 6.5068359375, 6.7198486328125, 6.932861328125, 7.1458740234375, 7.35888671875, 7.5718994140625, 7.784912109375, 7.9979248046875, 8.2109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 9.0, 15.0, 100.0, 282.0, 404.0, 138.0, 35.0, 13.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.06217956542969, -76.85025024414062, -72.6383285522461, -68.42640686035156, -64.2144775390625, -60.0025520324707, -55.790626525878906, -51.57870101928711, -47.36677551269531, -43.154850006103516, -38.94292449951172, -34.73099899291992, -30.519073486328125, -26.307147979736328, -22.09522247314453, -17.883296966552734, -13.671371459960938, -9.45944595336914, -5.247520446777344, -1.0355949401855469, 3.17633056640625, 7.388256072998047, 11.600181579589844, 15.81210708618164, 20.024032592773438, 24.235958099365234, 28.44788360595703, 32.65980911254883, 36.871734619140625, 41.08366012573242, 45.29558563232422, 49.507511138916016, 53.719451904296875, 57.93137741088867, 62.14330291748047, 66.355224609375, 70.56715393066406, 74.77908325195312, 78.99100494384766, 83.20292663574219, 87.41485595703125, 91.62678527832031, 95.83870697021484, 100.05062866210938, 104.26255798339844, 108.4744873046875, 112.68640899658203, 116.89833068847656, 121.11026000976562, 125.32218933105469, 129.53411865234375, 133.74603271484375, 137.9579620361328, 142.16989135742188, 146.38180541992188, 150.59373474121094, 154.8056640625, 159.01759338378906, 163.22952270507812, 167.44143676757812, 171.6533660888672, 175.86529541015625, 180.07720947265625, 184.2891387939453, 188.50106811523438]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 16.0, 12.0, 29.0, 37.0, 52.0, 37.0, 50.0, 54.0, 77.0, 92.0, 68.0, 95.0, 65.0, 69.0, 59.0, 44.0, 38.0, 23.0, 21.0, 15.0, 8.0, 4.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.531421661376953, -20.19291114807129, -18.854402542114258, -17.515892028808594, -16.177383422851562, -14.838872909545898, -13.500362396240234, -12.161852836608887, -10.823343276977539, -9.484833717346191, -8.146324157714844, -6.80781364440918, -5.469304084777832, -4.130794525146484, -2.7922840118408203, -1.4537744522094727, -0.115264892578125, 1.2232449054718018, 2.5617547035217285, 3.9002647399902344, 5.238774299621582, 6.57728385925293, 7.915794372558594, 9.254303932189941, 10.592813491821289, 11.931323051452637, 13.269832611083984, 14.608343124389648, 15.946852684020996, 17.285362243652344, 18.623872756958008, 19.962383270263672, 21.30089569091797, 22.639406204223633, 23.977914810180664, 25.316425323486328, 26.65493392944336, 27.993444442749023, 29.331954956054688, 30.67046356201172, 32.00897216796875, 33.34748077392578, 34.68599319458008, 36.02450180053711, 37.36301040649414, 38.70152282714844, 40.04003143310547, 41.3785400390625, 42.7170524597168, 44.05556106567383, 45.394073486328125, 46.732582092285156, 48.07109069824219, 49.40959930419922, 50.748111724853516, 52.08662033081055, 53.425132751464844, 54.763641357421875, 56.10215377807617, 57.4406623840332, 58.779170989990234, 60.11768341064453, 61.45619201660156, 62.794700622558594, 64.13320922851562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 30.0, 49.0, 65.0, 111.0, 211.0, 308.0, 608.0, 1142.0, 2452.0, 5553.0, 14072.0, 43485.0, 221011.0, 594097.0, 117993.0, 29059.0, 10087.0, 4151.0, 1955.0, 906.0, 462.0, 274.0, 175.0, 93.0, 54.0, 37.0, 26.0, 18.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.53955078125, -4.3603515625, -4.18115234375, -4.001953125, -3.82275390625, -3.6435546875, -3.46435546875, -3.28515625, -3.10595703125, -2.9267578125, -2.74755859375, -2.568359375, -2.38916015625, -2.2099609375, -2.03076171875, -1.8515625, -1.67236328125, -1.4931640625, -1.31396484375, -1.134765625, -0.95556640625, -0.7763671875, -0.59716796875, -0.41796875, -0.23876953125, -0.0595703125, 0.11962890625, 0.298828125, 0.47802734375, 0.6572265625, 0.83642578125, 1.015625, 1.19482421875, 1.3740234375, 1.55322265625, 1.732421875, 1.91162109375, 2.0908203125, 2.27001953125, 2.44921875, 2.62841796875, 2.8076171875, 2.98681640625, 3.166015625, 3.34521484375, 3.5244140625, 3.70361328125, 3.8828125, 4.06201171875, 4.2412109375, 4.42041015625, 4.599609375, 4.77880859375, 4.9580078125, 5.13720703125, 5.31640625, 5.49560546875, 5.6748046875, 5.85400390625, 6.033203125, 6.21240234375, 6.3916015625, 6.57080078125, 6.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 17.0, 12.0, 15.0, 18.0, 27.0, 32.0, 27.0, 36.0, 34.0, 48.0, 38.0, 59.0, 62.0, 49.0, 54.0, 64.0, 52.0, 56.0, 53.0, 38.0, 39.0, 37.0, 21.0, 18.0, 22.0, 12.0, 13.0, 8.0, 5.0, 10.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.498046875, -2.4297943115234375, -2.361541748046875, -2.2932891845703125, -2.22503662109375, -2.1567840576171875, -2.088531494140625, -2.0202789306640625, -1.9520263671875, -1.8837738037109375, -1.815521240234375, -1.7472686767578125, -1.67901611328125, -1.6107635498046875, -1.542510986328125, -1.4742584228515625, -1.406005859375, -1.3377532958984375, -1.269500732421875, -1.2012481689453125, -1.13299560546875, -1.0647430419921875, -0.996490478515625, -0.9282379150390625, -0.8599853515625, -0.7917327880859375, -0.723480224609375, -0.6552276611328125, -0.58697509765625, -0.5187225341796875, -0.450469970703125, -0.3822174072265625, -0.31396484375, -0.2457122802734375, -0.177459716796875, -0.1092071533203125, -0.04095458984375, 0.0272979736328125, 0.095550537109375, 0.1638031005859375, 0.2320556640625, 0.3003082275390625, 0.368560791015625, 0.4368133544921875, 0.50506591796875, 0.5733184814453125, 0.641571044921875, 0.7098236083984375, 0.778076171875, 0.8463287353515625, 0.914581298828125, 0.9828338623046875, 1.05108642578125, 1.1193389892578125, 1.187591552734375, 1.2558441162109375, 1.3240966796875, 1.3923492431640625, 1.460601806640625, 1.5288543701171875, 1.59710693359375, 1.6653594970703125, 1.733612060546875, 1.8018646240234375, 1.8701171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 21.0, 20.0, 28.0, 40.0, 45.0, 68.0, 120.0, 168.0, 286.0, 490.0, 892.0, 1770.0, 4364.0, 14404.0, 79786.0, 809453.0, 109615.0, 17626.0, 5092.0, 1950.0, 926.0, 477.0, 313.0, 182.0, 119.0, 69.0, 63.0, 37.0, 28.0, 18.0, 14.0, 7.0, 9.0, 7.0, 5.0, 6.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7421875, -9.47576904296875, -9.2093505859375, -8.94293212890625, -8.676513671875, -8.41009521484375, -8.1436767578125, -7.87725830078125, -7.61083984375, -7.34442138671875, -7.0780029296875, -6.81158447265625, -6.545166015625, -6.27874755859375, -6.0123291015625, -5.74591064453125, -5.4794921875, -5.21307373046875, -4.9466552734375, -4.68023681640625, -4.413818359375, -4.14739990234375, -3.8809814453125, -3.61456298828125, -3.34814453125, -3.08172607421875, -2.8153076171875, -2.54888916015625, -2.282470703125, -2.01605224609375, -1.7496337890625, -1.48321533203125, -1.216796875, -0.95037841796875, -0.6839599609375, -0.41754150390625, -0.151123046875, 0.11529541015625, 0.3817138671875, 0.64813232421875, 0.91455078125, 1.18096923828125, 1.4473876953125, 1.71380615234375, 1.980224609375, 2.24664306640625, 2.5130615234375, 2.77947998046875, 3.0458984375, 3.31231689453125, 3.5787353515625, 3.84515380859375, 4.111572265625, 4.37799072265625, 4.6444091796875, 4.91082763671875, 5.17724609375, 5.44366455078125, 5.7100830078125, 5.97650146484375, 6.242919921875, 6.50933837890625, 6.7757568359375, 7.04217529296875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 18.0, 11.0, 12.0, 16.0, 23.0, 32.0, 40.0, 44.0, 51.0, 51.0, 53.0, 56.0, 62.0, 74.0, 59.0, 58.0, 50.0, 38.0, 28.0, 39.0, 27.0, 21.0, 17.0, 13.0, 14.0, 15.0, 14.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.8934326171875, -7.607177734375, -7.3209228515625, -7.03466796875, -6.7484130859375, -6.462158203125, -6.1759033203125, -5.8896484375, -5.6033935546875, -5.317138671875, -5.0308837890625, -4.74462890625, -4.4583740234375, -4.172119140625, -3.8858642578125, -3.599609375, -3.3133544921875, -3.027099609375, -2.7408447265625, -2.45458984375, -2.1683349609375, -1.882080078125, -1.5958251953125, -1.3095703125, -1.0233154296875, -0.737060546875, -0.4508056640625, -0.16455078125, 0.1217041015625, 0.407958984375, 0.6942138671875, 0.98046875, 1.2667236328125, 1.552978515625, 1.8392333984375, 2.12548828125, 2.4117431640625, 2.697998046875, 2.9842529296875, 3.2705078125, 3.5567626953125, 3.843017578125, 4.1292724609375, 4.41552734375, 4.7017822265625, 4.988037109375, 5.2742919921875, 5.560546875, 5.8468017578125, 6.133056640625, 6.4193115234375, 6.70556640625, 6.9918212890625, 7.278076171875, 7.5643310546875, 7.8505859375, 8.1368408203125, 8.423095703125, 8.7093505859375, 8.99560546875, 9.2818603515625, 9.568115234375, 9.8543701171875, 10.140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 18.0, 28.0, 35.0, 69.0, 79.0, 161.0, 311.0, 546.0, 1159.0, 2636.0, 6806.0, 20439.0, 80486.0, 645501.0, 228415.0, 41815.0, 12162.0, 4241.0, 1797.0, 767.0, 379.0, 222.0, 148.0, 87.0, 54.0, 38.0, 27.0, 18.0, 15.0, 13.0, 13.0, 2.0, 2.0, 10.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.31451416015625, -2.2247314453125, -2.13494873046875, -2.045166015625, -1.95538330078125, -1.8656005859375, -1.77581787109375, -1.68603515625, -1.59625244140625, -1.5064697265625, -1.41668701171875, -1.326904296875, -1.23712158203125, -1.1473388671875, -1.05755615234375, -0.9677734375, -0.87799072265625, -0.7882080078125, -0.69842529296875, -0.608642578125, -0.51885986328125, -0.4290771484375, -0.33929443359375, -0.24951171875, -0.15972900390625, -0.0699462890625, 0.01983642578125, 0.109619140625, 0.19940185546875, 0.2891845703125, 0.37896728515625, 0.46875, 0.55853271484375, 0.6483154296875, 0.73809814453125, 0.827880859375, 0.91766357421875, 1.0074462890625, 1.09722900390625, 1.18701171875, 1.27679443359375, 1.3665771484375, 1.45635986328125, 1.546142578125, 1.63592529296875, 1.7257080078125, 1.81549072265625, 1.9052734375, 1.99505615234375, 2.0848388671875, 2.17462158203125, 2.264404296875, 2.35418701171875, 2.4439697265625, 2.53375244140625, 2.62353515625, 2.71331787109375, 2.8031005859375, 2.89288330078125, 2.982666015625, 3.07244873046875, 3.1622314453125, 3.25201416015625, 3.341796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 7.0, 19.0, 21.0, 24.0, 43.0, 57.0, 101.0, 134.0, 158.0, 118.0, 67.0, 55.0, 42.0, 28.0, 18.0, 21.0, 18.0, 6.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006933212280273438, -0.0006669163703918457, -0.0006405115127563477, -0.0006141066551208496, -0.0005877017974853516, -0.0005612969398498535, -0.0005348920822143555, -0.0005084872245788574, -0.0004820823669433594, -0.00045567750930786133, -0.0004292726516723633, -0.00040286779403686523, -0.0003764629364013672, -0.00035005807876586914, -0.0003236532211303711, -0.00029724836349487305, -0.000270843505859375, -0.00024443864822387695, -0.0002180337905883789, -0.00019162893295288086, -0.0001652240753173828, -0.00013881921768188477, -0.00011241436004638672, -8.600950241088867e-05, -5.9604644775390625e-05, -3.319978713989258e-05, -6.794929504394531e-06, 1.9609928131103516e-05, 4.601478576660156e-05, 7.241964340209961e-05, 9.882450103759766e-05, 0.0001252293586730957, 0.00015163421630859375, 0.0001780390739440918, 0.00020444393157958984, 0.0002308487892150879, 0.00025725364685058594, 0.000283658504486084, 0.00031006336212158203, 0.0003364682197570801, 0.0003628730773925781, 0.00038927793502807617, 0.0004156827926635742, 0.00044208765029907227, 0.0004684925079345703, 0.0004948973655700684, 0.0005213022232055664, 0.0005477070808410645, 0.0005741119384765625, 0.0006005167961120605, 0.0006269216537475586, 0.0006533265113830566, 0.0006797313690185547, 0.0007061362266540527, 0.0007325410842895508, 0.0007589459419250488, 0.0007853507995605469, 0.0008117556571960449, 0.000838160514831543, 0.000864565372467041, 0.0008909702301025391, 0.0009173750877380371, 0.0009437799453735352, 0.0009701848030090332, 0.0009965896606445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 3.0, 12.0, 14.0, 8.0, 14.0, 17.0, 27.0, 33.0, 62.0, 83.0, 121.0, 160.0, 221.0, 330.0, 567.0, 950.0, 1804.0, 3617.0, 8204.0, 21249.0, 65794.0, 289415.0, 527231.0, 84303.0, 25588.0, 9734.0, 4136.0, 1947.0, 1119.0, 623.0, 377.0, 244.0, 160.0, 95.0, 92.0, 57.0, 27.0, 29.0, 21.0, 20.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.176422119140625, -2.11065673828125, -2.044891357421875, -1.9791259765625, -1.913360595703125, -1.84759521484375, -1.781829833984375, -1.716064453125, -1.650299072265625, -1.58453369140625, -1.518768310546875, -1.4530029296875, -1.387237548828125, -1.32147216796875, -1.255706787109375, -1.18994140625, -1.124176025390625, -1.05841064453125, -0.992645263671875, -0.9268798828125, -0.861114501953125, -0.79534912109375, -0.729583740234375, -0.663818359375, -0.598052978515625, -0.53228759765625, -0.466522216796875, -0.4007568359375, -0.334991455078125, -0.26922607421875, -0.203460693359375, -0.1376953125, -0.071929931640625, -0.00616455078125, 0.059600830078125, 0.1253662109375, 0.191131591796875, 0.25689697265625, 0.322662353515625, 0.388427734375, 0.454193115234375, 0.51995849609375, 0.585723876953125, 0.6514892578125, 0.717254638671875, 0.78302001953125, 0.848785400390625, 0.91455078125, 0.980316162109375, 1.04608154296875, 1.111846923828125, 1.1776123046875, 1.243377685546875, 1.30914306640625, 1.374908447265625, 1.440673828125, 1.506439208984375, 1.57220458984375, 1.637969970703125, 1.7037353515625, 1.769500732421875, 1.83526611328125, 1.901031494140625, 1.966796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 11.0, 6.0, 15.0, 8.0, 12.0, 14.0, 20.0, 39.0, 35.0, 42.0, 64.0, 74.0, 80.0, 107.0, 105.0, 83.0, 43.0, 37.0, 41.0, 38.0, 22.0, 21.0, 11.0, 15.0, 13.0, 8.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.38739013671875, -2.3099365234375, -2.23248291015625, -2.155029296875, -2.07757568359375, -2.0001220703125, -1.92266845703125, -1.84521484375, -1.76776123046875, -1.6903076171875, -1.61285400390625, -1.535400390625, -1.45794677734375, -1.3804931640625, -1.30303955078125, -1.2255859375, -1.14813232421875, -1.0706787109375, -0.99322509765625, -0.915771484375, -0.83831787109375, -0.7608642578125, -0.68341064453125, -0.60595703125, -0.52850341796875, -0.4510498046875, -0.37359619140625, -0.296142578125, -0.21868896484375, -0.1412353515625, -0.06378173828125, 0.013671875, 0.09112548828125, 0.1685791015625, 0.24603271484375, 0.323486328125, 0.40093994140625, 0.4783935546875, 0.55584716796875, 0.63330078125, 0.71075439453125, 0.7882080078125, 0.86566162109375, 0.943115234375, 1.02056884765625, 1.0980224609375, 1.17547607421875, 1.2529296875, 1.33038330078125, 1.4078369140625, 1.48529052734375, 1.562744140625, 1.64019775390625, 1.7176513671875, 1.79510498046875, 1.87255859375, 1.95001220703125, 2.0274658203125, 2.10491943359375, 2.182373046875, 2.25982666015625, 2.3372802734375, 2.41473388671875, 2.4921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 11.0, 31.0, 63.0, 133.0, 217.0, 209.0, 133.0, 91.0, 53.0, 20.0, 7.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.09856414794922, -53.26109313964844, -51.42361831665039, -49.58614730834961, -47.74867630004883, -45.91120147705078, -44.07373046875, -42.23625946044922, -40.39878845214844, -38.561317443847656, -36.72384262084961, -34.88637161254883, -33.04890060424805, -31.211427688598633, -29.37395477294922, -27.536483764648438, -25.699010848999023, -23.86153793334961, -22.024066925048828, -20.186594009399414, -18.349123001098633, -16.51165008544922, -14.674178123474121, -12.836706161499023, -10.999234199523926, -9.161762237548828, -7.3242902755737305, -5.486817836761475, -3.649345874786377, -1.811873435974121, 0.025598526000976562, 1.8630704879760742, 3.700542449951172, 5.5380144119262695, 7.375486373901367, 9.212959289550781, 11.050430297851562, 12.887903213500977, 14.725375175476074, 16.562847137451172, 18.400318145751953, 20.237791061401367, 22.07526206970215, 23.912734985351562, 25.750205993652344, 27.587678909301758, 29.425151824951172, 31.262622833251953, 33.10009765625, 34.93756866455078, 36.77504348754883, 38.61251449584961, 40.44998550415039, 42.28746032714844, 44.12493133544922, 45.96240234375, 47.79987335205078, 49.63734436035156, 51.47481918334961, 53.31229019165039, 55.14976119995117, 56.98723602294922, 58.82470703125, 60.66217803955078, 62.49964904785156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 2.0, 19.0, 16.0, 19.0, 17.0, 14.0, 21.0, 27.0, 31.0, 29.0, 44.0, 50.0, 47.0, 77.0, 75.0, 62.0, 58.0, 76.0, 36.0, 37.0, 42.0, 27.0, 27.0, 31.0, 18.0, 13.0, 13.0, 10.0, 7.0, 10.0, 4.0, 9.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.8331413269043, -34.77885818481445, -33.72457504272461, -32.67029571533203, -31.616012573242188, -30.561729431152344, -29.5074462890625, -28.453163146972656, -27.398881912231445, -26.3445987701416, -25.29031753540039, -24.236034393310547, -23.181751251220703, -22.127470016479492, -21.07318687438965, -20.018905639648438, -18.964622497558594, -17.91033935546875, -16.85605812072754, -15.801774978637695, -14.747492790222168, -13.69321060180664, -12.638927459716797, -11.58464527130127, -10.530363082885742, -9.476080894470215, -8.421798706054688, -7.367515563964844, -6.313233375549316, -5.258951187133789, -4.2046685218811035, -3.150385856628418, -2.096101760864258, -1.0418193340301514, 0.012463092803955078, 1.0667455196380615, 2.121027946472168, 3.1753101348876953, 4.229592800140381, 5.283875465393066, 6.338157653808594, 7.392439842224121, 8.446722030639648, 9.501005172729492, 10.55528736114502, 11.609569549560547, 12.66385269165039, 13.718134880065918, 14.772417068481445, 15.826699256896973, 16.8809814453125, 17.935264587402344, 18.989547729492188, 20.0438289642334, 21.098112106323242, 22.152393341064453, 23.206676483154297, 24.26095962524414, 25.31524085998535, 26.369524002075195, 27.423805236816406, 28.47808837890625, 29.532371520996094, 30.586654663085938, 31.64093589782715]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 5.0, 5.0, 15.0, 7.0, 16.0, 22.0, 31.0, 36.0, 77.0, 103.0, 186.0, 328.0, 646.0, 1432.0, 3471.0, 9644.0, 32890.0, 186602.0, 2523138.0, 1294798.0, 104330.0, 23444.0, 7708.0, 2893.0, 1252.0, 558.0, 270.0, 149.0, 71.0, 37.0, 33.0, 28.0, 15.0, 9.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0], "bins": [-5.25, -5.12750244140625, -5.0050048828125, -4.88250732421875, -4.760009765625, -4.63751220703125, -4.5150146484375, -4.39251708984375, -4.27001953125, -4.14752197265625, -4.0250244140625, -3.90252685546875, -3.780029296875, -3.65753173828125, -3.5350341796875, -3.41253662109375, -3.2900390625, -3.16754150390625, -3.0450439453125, -2.92254638671875, -2.800048828125, -2.67755126953125, -2.5550537109375, -2.43255615234375, -2.31005859375, -2.18756103515625, -2.0650634765625, -1.94256591796875, -1.820068359375, -1.69757080078125, -1.5750732421875, -1.45257568359375, -1.330078125, -1.20758056640625, -1.0850830078125, -0.96258544921875, -0.840087890625, -0.71759033203125, -0.5950927734375, -0.47259521484375, -0.35009765625, -0.22760009765625, -0.1051025390625, 0.01739501953125, 0.139892578125, 0.26239013671875, 0.3848876953125, 0.50738525390625, 0.6298828125, 0.75238037109375, 0.8748779296875, 0.99737548828125, 1.119873046875, 1.24237060546875, 1.3648681640625, 1.48736572265625, 1.60986328125, 1.73236083984375, 1.8548583984375, 1.97735595703125, 2.099853515625, 2.22235107421875, 2.3448486328125, 2.46734619140625, 2.58984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 7.0, 16.0, 12.0, 14.0, 20.0, 21.0, 25.0, 35.0, 37.0, 52.0, 47.0, 50.0, 67.0, 62.0, 53.0, 59.0, 55.0, 51.0, 61.0, 60.0, 41.0, 33.0, 22.0, 25.0, 23.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.904144287109375, -2.83172607421875, -2.759307861328125, -2.6868896484375, -2.614471435546875, -2.54205322265625, -2.469635009765625, -2.397216796875, -2.324798583984375, -2.25238037109375, -2.179962158203125, -2.1075439453125, -2.035125732421875, -1.96270751953125, -1.890289306640625, -1.81787109375, -1.745452880859375, -1.67303466796875, -1.600616455078125, -1.5281982421875, -1.455780029296875, -1.38336181640625, -1.310943603515625, -1.238525390625, -1.166107177734375, -1.09368896484375, -1.021270751953125, -0.9488525390625, -0.876434326171875, -0.80401611328125, -0.731597900390625, -0.6591796875, -0.586761474609375, -0.51434326171875, -0.441925048828125, -0.3695068359375, -0.297088623046875, -0.22467041015625, -0.152252197265625, -0.079833984375, -0.007415771484375, 0.06500244140625, 0.137420654296875, 0.2098388671875, 0.282257080078125, 0.35467529296875, 0.427093505859375, 0.49951171875, 0.571929931640625, 0.64434814453125, 0.716766357421875, 0.7891845703125, 0.861602783203125, 0.93402099609375, 1.006439208984375, 1.078857421875, 1.151275634765625, 1.22369384765625, 1.296112060546875, 1.3685302734375, 1.440948486328125, 1.51336669921875, 1.585784912109375, 1.658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 10.0, 9.0, 5.0, 5.0, 12.0, 13.0, 26.0, 33.0, 55.0, 106.0, 170.0, 346.0, 683.0, 1426.0, 3606.0, 9987.0, 32886.0, 170092.0, 2864419.0, 996518.0, 82217.0, 19958.0, 6637.0, 2547.0, 1156.0, 562.0, 304.0, 183.0, 105.0, 52.0, 44.0, 36.0, 14.0, 14.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.8037109375, -4.642578125, -4.4814453125, -4.3203125, -4.1591796875, -3.998046875, -3.8369140625, -3.67578125, -3.5146484375, -3.353515625, -3.1923828125, -3.03125, -2.8701171875, -2.708984375, -2.5478515625, -2.38671875, -2.2255859375, -2.064453125, -1.9033203125, -1.7421875, -1.5810546875, -1.419921875, -1.2587890625, -1.09765625, -0.9365234375, -0.775390625, -0.6142578125, -0.453125, -0.2919921875, -0.130859375, 0.0302734375, 0.19140625, 0.3525390625, 0.513671875, 0.6748046875, 0.8359375, 0.9970703125, 1.158203125, 1.3193359375, 1.48046875, 1.6416015625, 1.802734375, 1.9638671875, 2.125, 2.2861328125, 2.447265625, 2.6083984375, 2.76953125, 2.9306640625, 3.091796875, 3.2529296875, 3.4140625, 3.5751953125, 3.736328125, 3.8974609375, 4.05859375, 4.2197265625, 4.380859375, 4.5419921875, 4.703125, 4.8642578125, 5.025390625, 5.1865234375, 5.34765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 18.0, 16.0, 21.0, 25.0, 38.0, 57.0, 78.0, 113.0, 182.0, 365.0, 704.0, 850.0, 638.0, 385.0, 205.0, 127.0, 63.0, 43.0, 36.0, 19.0, 14.0, 18.0, 7.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.99029541015625, -3.8126220703125, -3.63494873046875, -3.457275390625, -3.27960205078125, -3.1019287109375, -2.92425537109375, -2.74658203125, -2.56890869140625, -2.3912353515625, -2.21356201171875, -2.035888671875, -1.85821533203125, -1.6805419921875, -1.50286865234375, -1.3251953125, -1.14752197265625, -0.9698486328125, -0.79217529296875, -0.614501953125, -0.43682861328125, -0.2591552734375, -0.08148193359375, 0.09619140625, 0.27386474609375, 0.4515380859375, 0.62921142578125, 0.806884765625, 0.98455810546875, 1.1622314453125, 1.33990478515625, 1.517578125, 1.69525146484375, 1.8729248046875, 2.05059814453125, 2.228271484375, 2.40594482421875, 2.5836181640625, 2.76129150390625, 2.93896484375, 3.11663818359375, 3.2943115234375, 3.47198486328125, 3.649658203125, 3.82733154296875, 4.0050048828125, 4.18267822265625, 4.3603515625, 4.53802490234375, 4.7156982421875, 4.89337158203125, 5.071044921875, 5.24871826171875, 5.4263916015625, 5.60406494140625, 5.78173828125, 5.95941162109375, 6.1370849609375, 6.31475830078125, 6.492431640625, 6.67010498046875, 6.8477783203125, 7.02545166015625, 7.203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 12.0, 23.0, 79.0, 150.0, 251.0, 245.0, 140.0, 50.0, 18.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.43997192382812, -87.19168853759766, -84.94339752197266, -82.69511413574219, -80.44683074951172, -78.19854736328125, -75.95025634765625, -73.70197296142578, -71.45368957519531, -69.20540618896484, -66.95711517333984, -64.70883178710938, -62.460548400878906, -60.21226119995117, -57.96397399902344, -55.71569061279297, -53.467403411865234, -51.2191162109375, -48.97083282470703, -46.7225456237793, -44.47426223754883, -42.225975036621094, -39.977691650390625, -37.72940444946289, -35.481117248535156, -33.23283004760742, -30.984546661376953, -28.73625946044922, -26.48797607421875, -24.239688873291016, -21.991403579711914, -19.743118286132812, -17.494834899902344, -15.246549606323242, -12.99826431274414, -10.749978065490723, -8.501692771911621, -6.2534074783325195, -4.005121231079102, -1.7568359375, 0.49144935607910156, 2.7397348880767822, 4.988020420074463, 7.236306190490723, 9.484591484069824, 11.732876777648926, 13.981163024902344, 16.229448318481445, 18.477733612060547, 20.72601890563965, 22.97430419921875, 25.222591400146484, 27.470874786376953, 29.719161987304688, 31.96744728088379, 34.21573257446289, 36.464019775390625, 38.71230697631836, 40.96059036254883, 43.20887756347656, 45.45716094970703, 47.705448150634766, 49.9537353515625, 52.20201873779297, 54.45030212402344]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 13.0, 9.0, 15.0, 21.0, 24.0, 19.0, 18.0, 19.0, 20.0, 35.0, 46.0, 30.0, 38.0, 48.0, 57.0, 53.0, 37.0, 48.0, 52.0, 34.0, 44.0, 32.0, 44.0, 21.0, 25.0, 25.0, 27.0, 27.0, 20.0, 12.0, 17.0, 16.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.417434692382812, -21.777280807495117, -21.137126922607422, -20.49697494506836, -19.856821060180664, -19.21666717529297, -18.576513290405273, -17.936359405517578, -17.296207427978516, -16.65605354309082, -16.015899658203125, -15.375746726989746, -14.735593795776367, -14.095439910888672, -13.455286026000977, -12.815133094787598, -12.174979209899902, -11.534825325012207, -10.894672393798828, -10.254518508911133, -9.614365577697754, -8.974211692810059, -8.33405876159668, -7.693904876708984, -7.053751468658447, -6.41359806060791, -5.773444652557373, -5.133291244506836, -4.493137359619141, -3.8529841899871826, -3.2128305435180664, -2.5726771354675293, -1.9325237274169922, -1.292370319366455, -0.6522167921066284, -0.012063264846801758, 0.6280901432037354, 1.2682435512542725, 1.9083971977233887, 2.548550605773926, 3.188704013824463, 3.828857421875, 4.469010829925537, 5.109164237976074, 5.7493181228637695, 6.389471054077148, 7.029624938964844, 7.669778347015381, 8.309931755065918, 8.950085639953613, 9.590238571166992, 10.230392456054688, 10.870545387268066, 11.510699272155762, 12.15085220336914, 12.791006088256836, 13.431159973144531, 14.071313858032227, 14.711466789245605, 15.3516206741333, 15.99177360534668, 16.631927490234375, 17.27208137512207, 17.912235260009766, 18.552387237548828]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 24.0, 17.0, 40.0, 46.0, 57.0, 106.0, 156.0, 239.0, 387.0, 573.0, 951.0, 1729.0, 3391.0, 7068.0, 18173.0, 64472.0, 289377.0, 467499.0, 139740.0, 33015.0, 10933.0, 4843.0, 2380.0, 1259.0, 738.0, 455.0, 294.0, 184.0, 106.0, 96.0, 62.0, 38.0, 27.0, 22.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.09173583984375, -2.9822998046875, -2.87286376953125, -2.763427734375, -2.65399169921875, -2.5445556640625, -2.43511962890625, -2.32568359375, -2.21624755859375, -2.1068115234375, -1.99737548828125, -1.887939453125, -1.77850341796875, -1.6690673828125, -1.55963134765625, -1.4501953125, -1.34075927734375, -1.2313232421875, -1.12188720703125, -1.012451171875, -0.90301513671875, -0.7935791015625, -0.68414306640625, -0.57470703125, -0.46527099609375, -0.3558349609375, -0.24639892578125, -0.136962890625, -0.02752685546875, 0.0819091796875, 0.19134521484375, 0.30078125, 0.41021728515625, 0.5196533203125, 0.62908935546875, 0.738525390625, 0.84796142578125, 0.9573974609375, 1.06683349609375, 1.17626953125, 1.28570556640625, 1.3951416015625, 1.50457763671875, 1.614013671875, 1.72344970703125, 1.8328857421875, 1.94232177734375, 2.0517578125, 2.16119384765625, 2.2706298828125, 2.38006591796875, 2.489501953125, 2.59893798828125, 2.7083740234375, 2.81781005859375, 2.92724609375, 3.03668212890625, 3.1461181640625, 3.25555419921875, 3.364990234375, 3.47442626953125, 3.5838623046875, 3.69329833984375, 3.802734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 17.0, 16.0, 21.0, 27.0, 18.0, 29.0, 46.0, 42.0, 44.0, 61.0, 50.0, 57.0, 53.0, 64.0, 66.0, 57.0, 46.0, 36.0, 36.0, 31.0, 32.0, 24.0, 21.0, 12.0, 16.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.869140625, -2.7957916259765625, -2.722442626953125, -2.6490936279296875, -2.57574462890625, -2.5023956298828125, -2.429046630859375, -2.3556976318359375, -2.2823486328125, -2.2089996337890625, -2.135650634765625, -2.0623016357421875, -1.98895263671875, -1.9156036376953125, -1.842254638671875, -1.7689056396484375, -1.695556640625, -1.6222076416015625, -1.548858642578125, -1.4755096435546875, -1.40216064453125, -1.3288116455078125, -1.255462646484375, -1.1821136474609375, -1.1087646484375, -1.0354156494140625, -0.962066650390625, -0.8887176513671875, -0.81536865234375, -0.7420196533203125, -0.668670654296875, -0.5953216552734375, -0.52197265625, -0.4486236572265625, -0.375274658203125, -0.3019256591796875, -0.22857666015625, -0.1552276611328125, -0.081878662109375, -0.0085296630859375, 0.0648193359375, 0.1381683349609375, 0.211517333984375, 0.2848663330078125, 0.35821533203125, 0.4315643310546875, 0.504913330078125, 0.5782623291015625, 0.651611328125, 0.7249603271484375, 0.798309326171875, 0.8716583251953125, 0.94500732421875, 1.0183563232421875, 1.091705322265625, 1.1650543212890625, 1.2384033203125, 1.3117523193359375, 1.385101318359375, 1.4584503173828125, 1.53179931640625, 1.6051483154296875, 1.678497314453125, 1.7518463134765625, 1.8251953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 10.0, 20.0, 25.0, 39.0, 62.0, 93.0, 128.0, 279.0, 615.0, 1414.0, 3743.0, 15811.0, 161969.0, 778769.0, 71215.0, 9423.0, 2776.0, 1057.0, 477.0, 261.0, 139.0, 73.0, 46.0, 33.0, 21.0, 13.0, 9.0, 9.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.2042236328125, -5.013916015625, -4.8236083984375, -4.63330078125, -4.4429931640625, -4.252685546875, -4.0623779296875, -3.8720703125, -3.6817626953125, -3.491455078125, -3.3011474609375, -3.11083984375, -2.9205322265625, -2.730224609375, -2.5399169921875, -2.349609375, -2.1593017578125, -1.968994140625, -1.7786865234375, -1.58837890625, -1.3980712890625, -1.207763671875, -1.0174560546875, -0.8271484375, -0.6368408203125, -0.446533203125, -0.2562255859375, -0.06591796875, 0.1243896484375, 0.314697265625, 0.5050048828125, 0.6953125, 0.8856201171875, 1.075927734375, 1.2662353515625, 1.45654296875, 1.6468505859375, 1.837158203125, 2.0274658203125, 2.2177734375, 2.4080810546875, 2.598388671875, 2.7886962890625, 2.97900390625, 3.1693115234375, 3.359619140625, 3.5499267578125, 3.740234375, 3.9305419921875, 4.120849609375, 4.3111572265625, 4.50146484375, 4.6917724609375, 4.882080078125, 5.0723876953125, 5.2626953125, 5.4530029296875, 5.643310546875, 5.8336181640625, 6.02392578125, 6.2142333984375, 6.404541015625, 6.5948486328125, 6.78515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 11.0, 15.0, 23.0, 13.0, 18.0, 19.0, 24.0, 42.0, 51.0, 37.0, 41.0, 41.0, 45.0, 50.0, 57.0, 59.0, 39.0, 51.0, 36.0, 45.0, 30.0, 25.0, 28.0, 25.0, 31.0, 24.0, 26.0, 12.0, 13.0, 17.0, 2.0, 3.0, 8.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.63671875, -7.4022216796875, -7.167724609375, -6.9332275390625, -6.69873046875, -6.4642333984375, -6.229736328125, -5.9952392578125, -5.7607421875, -5.5262451171875, -5.291748046875, -5.0572509765625, -4.82275390625, -4.5882568359375, -4.353759765625, -4.1192626953125, -3.884765625, -3.6502685546875, -3.415771484375, -3.1812744140625, -2.94677734375, -2.7122802734375, -2.477783203125, -2.2432861328125, -2.0087890625, -1.7742919921875, -1.539794921875, -1.3052978515625, -1.07080078125, -0.8363037109375, -0.601806640625, -0.3673095703125, -0.1328125, 0.1016845703125, 0.336181640625, 0.5706787109375, 0.80517578125, 1.0396728515625, 1.274169921875, 1.5086669921875, 1.7431640625, 1.9776611328125, 2.212158203125, 2.4466552734375, 2.68115234375, 2.9156494140625, 3.150146484375, 3.3846435546875, 3.619140625, 3.8536376953125, 4.088134765625, 4.3226318359375, 4.55712890625, 4.7916259765625, 5.026123046875, 5.2606201171875, 5.4951171875, 5.7296142578125, 5.964111328125, 6.1986083984375, 6.43310546875, 6.6676025390625, 6.902099609375, 7.1365966796875, 7.37109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 14.0, 13.0, 36.0, 78.0, 126.0, 246.0, 513.0, 1099.0, 2867.0, 10215.0, 48258.0, 349253.0, 563153.0, 55687.0, 11370.0, 3415.0, 1171.0, 498.0, 251.0, 112.0, 82.0, 36.0, 16.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.229400634765625, -2.16192626953125, -2.094451904296875, -2.0269775390625, -1.959503173828125, -1.89202880859375, -1.824554443359375, -1.757080078125, -1.689605712890625, -1.62213134765625, -1.554656982421875, -1.4871826171875, -1.419708251953125, -1.35223388671875, -1.284759521484375, -1.21728515625, -1.149810791015625, -1.08233642578125, -1.014862060546875, -0.9473876953125, -0.879913330078125, -0.81243896484375, -0.744964599609375, -0.677490234375, -0.610015869140625, -0.54254150390625, -0.475067138671875, -0.4075927734375, -0.340118408203125, -0.27264404296875, -0.205169677734375, -0.1376953125, -0.070220947265625, -0.00274658203125, 0.064727783203125, 0.1322021484375, 0.199676513671875, 0.26715087890625, 0.334625244140625, 0.402099609375, 0.469573974609375, 0.53704833984375, 0.604522705078125, 0.6719970703125, 0.739471435546875, 0.80694580078125, 0.874420166015625, 0.94189453125, 1.009368896484375, 1.07684326171875, 1.144317626953125, 1.2117919921875, 1.279266357421875, 1.34674072265625, 1.414215087890625, 1.481689453125, 1.549163818359375, 1.61663818359375, 1.684112548828125, 1.7515869140625, 1.819061279296875, 1.88653564453125, 1.954010009765625, 2.021484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 11.0, 5.0, 16.0, 13.0, 15.0, 29.0, 47.0, 52.0, 70.0, 111.0, 112.0, 125.0, 117.0, 81.0, 67.0, 25.0, 30.0, 16.0, 15.0, 10.0, 3.0, 6.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038123130798339844, -0.00036537274718284607, -0.0003495141863822937, -0.00033365562558174133, -0.00031779706478118896, -0.0003019385039806366, -0.00028607994318008423, -0.00027022138237953186, -0.0002543628215789795, -0.00023850426077842712, -0.00022264569997787476, -0.0002067871391773224, -0.00019092857837677002, -0.00017507001757621765, -0.00015921145677566528, -0.00014335289597511292, -0.00012749433517456055, -0.00011163577437400818, -9.577721357345581e-05, -7.991865277290344e-05, -6.406009197235107e-05, -4.8201531171798706e-05, -3.234297037124634e-05, -1.648440957069397e-05, -6.258487701416016e-07, 1.5232712030410767e-05, 3.1091272830963135e-05, 4.69498336315155e-05, 6.280839443206787e-05, 7.866695523262024e-05, 9.452551603317261e-05, 0.00011038407683372498, 0.00012624263763427734, 0.0001421011984348297, 0.00015795975923538208, 0.00017381832003593445, 0.00018967688083648682, 0.00020553544163703918, 0.00022139400243759155, 0.00023725256323814392, 0.0002531111240386963, 0.00026896968483924866, 0.000284828245639801, 0.0003006868064403534, 0.00031654536724090576, 0.00033240392804145813, 0.0003482624888420105, 0.00036412104964256287, 0.00037997961044311523, 0.0003958381712436676, 0.00041169673204421997, 0.00042755529284477234, 0.0004434138536453247, 0.0004592724144458771, 0.00047513097524642944, 0.0004909895360469818, 0.0005068480968475342, 0.0005227066576480865, 0.0005385652184486389, 0.0005544237792491913, 0.0005702823400497437, 0.000586140900850296, 0.0006019994616508484, 0.0006178580224514008, 0.0006337165832519531]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 12.0, 30.0, 45.0, 80.0, 151.0, 346.0, 1132.0, 5459.0, 60354.0, 884139.0, 87844.0, 6841.0, 1349.0, 406.0, 155.0, 99.0, 38.0, 24.0, 11.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.938812255859375, -4.80731201171875, -4.675811767578125, -4.5443115234375, -4.412811279296875, -4.28131103515625, -4.149810791015625, -4.018310546875, -3.886810302734375, -3.75531005859375, -3.623809814453125, -3.4923095703125, -3.360809326171875, -3.22930908203125, -3.097808837890625, -2.96630859375, -2.834808349609375, -2.70330810546875, -2.571807861328125, -2.4403076171875, -2.308807373046875, -2.17730712890625, -2.045806884765625, -1.914306640625, -1.782806396484375, -1.65130615234375, -1.519805908203125, -1.3883056640625, -1.256805419921875, -1.12530517578125, -0.993804931640625, -0.8623046875, -0.730804443359375, -0.59930419921875, -0.467803955078125, -0.3363037109375, -0.204803466796875, -0.07330322265625, 0.058197021484375, 0.189697265625, 0.321197509765625, 0.45269775390625, 0.584197998046875, 0.7156982421875, 0.847198486328125, 0.97869873046875, 1.110198974609375, 1.24169921875, 1.373199462890625, 1.50469970703125, 1.636199951171875, 1.7677001953125, 1.899200439453125, 2.03070068359375, 2.162200927734375, 2.293701171875, 2.425201416015625, 2.55670166015625, 2.688201904296875, 2.8197021484375, 2.951202392578125, 3.08270263671875, 3.214202880859375, 3.345703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 11.0, 7.0, 12.0, 22.0, 19.0, 38.0, 39.0, 57.0, 65.0, 84.0, 86.0, 80.0, 98.0, 87.0, 75.0, 45.0, 32.0, 33.0, 18.0, 22.0, 11.0, 12.0, 5.0, 7.0, 9.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.35791015625, -2.2958984375, -2.23388671875, -2.171875, -2.10986328125, -2.0478515625, -1.98583984375, -1.923828125, -1.86181640625, -1.7998046875, -1.73779296875, -1.67578125, -1.61376953125, -1.5517578125, -1.48974609375, -1.427734375, -1.36572265625, -1.3037109375, -1.24169921875, -1.1796875, -1.11767578125, -1.0556640625, -0.99365234375, -0.931640625, -0.86962890625, -0.8076171875, -0.74560546875, -0.68359375, -0.62158203125, -0.5595703125, -0.49755859375, -0.435546875, -0.37353515625, -0.3115234375, -0.24951171875, -0.1875, -0.12548828125, -0.0634765625, -0.00146484375, 0.060546875, 0.12255859375, 0.1845703125, 0.24658203125, 0.30859375, 0.37060546875, 0.4326171875, 0.49462890625, 0.556640625, 0.61865234375, 0.6806640625, 0.74267578125, 0.8046875, 0.86669921875, 0.9287109375, 0.99072265625, 1.052734375, 1.11474609375, 1.1767578125, 1.23876953125, 1.30078125, 1.36279296875, 1.4248046875, 1.48681640625, 1.548828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 8.0, 16.0, 19.0, 32.0, 78.0, 144.0, 247.0, 228.0, 116.0, 55.0, 24.0, 8.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.43402862548828, -44.93017578125, -43.42632293701172, -41.9224739074707, -40.41862106323242, -38.91476821899414, -37.410919189453125, -35.907066345214844, -34.40321350097656, -32.89936065673828, -31.395509719848633, -29.891658782958984, -28.387805938720703, -26.883953094482422, -25.380102157592773, -23.876251220703125, -22.372398376464844, -20.868545532226562, -19.364694595336914, -17.860843658447266, -16.356990814208984, -14.85313892364502, -13.349287033081055, -11.84543514251709, -10.341583251953125, -8.83773136138916, -7.333879470825195, -5.8300275802612305, -4.326175689697266, -2.822323799133301, -1.318471908569336, 0.1853799819946289, 1.6892318725585938, 3.1930837631225586, 4.696935653686523, 6.200787544250488, 7.704639434814453, 9.208491325378418, 10.712343215942383, 12.216195106506348, 13.720046997070312, 15.223898887634277, 16.727750778198242, 18.23160171508789, 19.735454559326172, 21.239307403564453, 22.7431583404541, 24.24700927734375, 25.75086212158203, 27.254714965820312, 28.75856590270996, 30.26241683959961, 31.76626968383789, 33.27012252807617, 34.77397155761719, 36.27782440185547, 37.78167724609375, 39.28553009033203, 40.78938293457031, 42.29323196411133, 43.79708480834961, 45.30093765258789, 46.804786682128906, 48.30863952636719, 49.81249237060547]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 4.0, 12.0, 10.0, 11.0, 17.0, 12.0, 18.0, 27.0, 16.0, 27.0, 33.0, 28.0, 39.0, 34.0, 60.0, 68.0, 80.0, 63.0, 73.0, 56.0, 42.0, 30.0, 32.0, 27.0, 20.0, 19.0, 31.0, 14.0, 10.0, 15.0, 10.0, 9.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.821874618530273, -29.876317977905273, -28.930763244628906, -27.985206604003906, -27.039649963378906, -26.094093322753906, -25.148536682128906, -24.20298194885254, -23.25742530822754, -22.31186866760254, -21.366313934326172, -20.420757293701172, -19.475200653076172, -18.529644012451172, -17.584087371826172, -16.638532638549805, -15.692975997924805, -14.747419357299805, -13.801863670349121, -12.856307983398438, -11.910751342773438, -10.965194702148438, -10.019639015197754, -9.07408332824707, -8.12852668762207, -7.1829705238342285, -6.237414360046387, -5.291858196258545, -4.346302032470703, -3.4007458686828613, -2.4551897048950195, -1.5096335411071777, -0.5640754699707031, 0.38148069381713867, 1.3270368576049805, 2.2725930213928223, 3.218149185180664, 4.163705348968506, 5.109261512756348, 6.0548176765441895, 7.000373840332031, 7.945930004119873, 8.891486167907715, 9.837041854858398, 10.782598495483398, 11.728155136108398, 12.673710823059082, 13.619266510009766, 14.564823150634766, 15.510379791259766, 16.455936431884766, 17.401491165161133, 18.347047805786133, 19.292604446411133, 20.2381591796875, 21.1837158203125, 22.1292724609375, 23.0748291015625, 24.0203857421875, 24.965940475463867, 25.911497116088867, 26.857053756713867, 27.802608489990234, 28.748165130615234, 29.693721771240234]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 16.0, 18.0, 46.0, 55.0, 97.0, 180.0, 334.0, 557.0, 1181.0, 2680.0, 6723.0, 20845.0, 100576.0, 1197512.0, 2591532.0, 220243.0, 34329.0, 9964.0, 3914.0, 1664.0, 814.0, 432.0, 211.0, 131.0, 65.0, 50.0, 29.0, 22.0, 9.0, 11.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.244293212890625, -3.13311767578125, -3.021942138671875, -2.9107666015625, -2.799591064453125, -2.68841552734375, -2.577239990234375, -2.466064453125, -2.354888916015625, -2.24371337890625, -2.132537841796875, -2.0213623046875, -1.910186767578125, -1.79901123046875, -1.687835693359375, -1.57666015625, -1.465484619140625, -1.35430908203125, -1.243133544921875, -1.1319580078125, -1.020782470703125, -0.90960693359375, -0.798431396484375, -0.687255859375, -0.576080322265625, -0.46490478515625, -0.353729248046875, -0.2425537109375, -0.131378173828125, -0.02020263671875, 0.090972900390625, 0.2021484375, 0.313323974609375, 0.42449951171875, 0.535675048828125, 0.6468505859375, 0.758026123046875, 0.86920166015625, 0.980377197265625, 1.091552734375, 1.202728271484375, 1.31390380859375, 1.425079345703125, 1.5362548828125, 1.647430419921875, 1.75860595703125, 1.869781494140625, 1.98095703125, 2.092132568359375, 2.20330810546875, 2.314483642578125, 2.4256591796875, 2.536834716796875, 2.64801025390625, 2.759185791015625, 2.870361328125, 2.981536865234375, 3.09271240234375, 3.203887939453125, 3.3150634765625, 3.426239013671875, 3.53741455078125, 3.648590087890625, 3.759765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 8.0, 10.0, 16.0, 9.0, 23.0, 21.0, 20.0, 37.0, 33.0, 46.0, 39.0, 47.0, 43.0, 47.0, 46.0, 54.0, 50.0, 47.0, 47.0, 43.0, 47.0, 50.0, 34.0, 35.0, 23.0, 18.0, 24.0, 17.0, 11.0, 15.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3984375, -2.33551025390625, -2.2725830078125, -2.20965576171875, -2.146728515625, -2.08380126953125, -2.0208740234375, -1.95794677734375, -1.89501953125, -1.83209228515625, -1.7691650390625, -1.70623779296875, -1.643310546875, -1.58038330078125, -1.5174560546875, -1.45452880859375, -1.3916015625, -1.32867431640625, -1.2657470703125, -1.20281982421875, -1.139892578125, -1.07696533203125, -1.0140380859375, -0.95111083984375, -0.88818359375, -0.82525634765625, -0.7623291015625, -0.69940185546875, -0.636474609375, -0.57354736328125, -0.5106201171875, -0.44769287109375, -0.384765625, -0.32183837890625, -0.2589111328125, -0.19598388671875, -0.133056640625, -0.07012939453125, -0.0072021484375, 0.05572509765625, 0.11865234375, 0.18157958984375, 0.2445068359375, 0.30743408203125, 0.370361328125, 0.43328857421875, 0.4962158203125, 0.55914306640625, 0.6220703125, 0.68499755859375, 0.7479248046875, 0.81085205078125, 0.873779296875, 0.93670654296875, 0.9996337890625, 1.06256103515625, 1.12548828125, 1.18841552734375, 1.2513427734375, 1.31427001953125, 1.377197265625, 1.44012451171875, 1.5030517578125, 1.56597900390625, 1.62890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 17.0, 13.0, 20.0, 29.0, 52.0, 100.0, 202.0, 512.0, 1536.0, 5289.0, 26583.0, 329817.0, 3647591.0, 159001.0, 17471.0, 3883.0, 1223.0, 463.0, 201.0, 112.0, 55.0, 29.0, 20.0, 18.0, 9.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.06951904296875, -6.8577880859375, -6.64605712890625, -6.434326171875, -6.22259521484375, -6.0108642578125, -5.79913330078125, -5.58740234375, -5.37567138671875, -5.1639404296875, -4.95220947265625, -4.740478515625, -4.52874755859375, -4.3170166015625, -4.10528564453125, -3.8935546875, -3.68182373046875, -3.4700927734375, -3.25836181640625, -3.046630859375, -2.83489990234375, -2.6231689453125, -2.41143798828125, -2.19970703125, -1.98797607421875, -1.7762451171875, -1.56451416015625, -1.352783203125, -1.14105224609375, -0.9293212890625, -0.71759033203125, -0.505859375, -0.29412841796875, -0.0823974609375, 0.12933349609375, 0.341064453125, 0.55279541015625, 0.7645263671875, 0.97625732421875, 1.18798828125, 1.39971923828125, 1.6114501953125, 1.82318115234375, 2.034912109375, 2.24664306640625, 2.4583740234375, 2.67010498046875, 2.8818359375, 3.09356689453125, 3.3052978515625, 3.51702880859375, 3.728759765625, 3.94049072265625, 4.1522216796875, 4.36395263671875, 4.57568359375, 4.78741455078125, 4.9991455078125, 5.21087646484375, 5.422607421875, 5.63433837890625, 5.8460693359375, 6.05780029296875, 6.26953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 9.0, 12.0, 6.0, 9.0, 15.0, 16.0, 25.0, 36.0, 63.0, 61.0, 97.0, 182.0, 320.0, 528.0, 822.0, 693.0, 427.0, 265.0, 159.0, 95.0, 70.0, 37.0, 26.0, 28.0, 18.0, 10.0, 9.0, 5.0, 4.0, 11.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.380615234375, -4.23388671875, -4.087158203125, -3.9404296875, -3.793701171875, -3.64697265625, -3.500244140625, -3.353515625, -3.206787109375, -3.06005859375, -2.913330078125, -2.7666015625, -2.619873046875, -2.47314453125, -2.326416015625, -2.1796875, -2.032958984375, -1.88623046875, -1.739501953125, -1.5927734375, -1.446044921875, -1.29931640625, -1.152587890625, -1.005859375, -0.859130859375, -0.71240234375, -0.565673828125, -0.4189453125, -0.272216796875, -0.12548828125, 0.021240234375, 0.16796875, 0.314697265625, 0.46142578125, 0.608154296875, 0.7548828125, 0.901611328125, 1.04833984375, 1.195068359375, 1.341796875, 1.488525390625, 1.63525390625, 1.781982421875, 1.9287109375, 2.075439453125, 2.22216796875, 2.368896484375, 2.515625, 2.662353515625, 2.80908203125, 2.955810546875, 3.1025390625, 3.249267578125, 3.39599609375, 3.542724609375, 3.689453125, 3.836181640625, 3.98291015625, 4.129638671875, 4.2763671875, 4.423095703125, 4.56982421875, 4.716552734375, 4.86328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 27.0, 56.0, 70.0, 104.0, 138.0, 125.0, 128.0, 96.0, 81.0, 44.0, 34.0, 25.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59521484375, -39.510807037353516, -38.42639923095703, -37.34198760986328, -36.2575798034668, -35.17317199707031, -34.08876037597656, -33.00435256958008, -31.919944763183594, -30.83553695678711, -29.751127243041992, -28.666717529296875, -27.58230972290039, -26.497901916503906, -25.41349220275879, -24.329082489013672, -23.244674682617188, -22.160266876220703, -21.075857162475586, -19.99144744873047, -18.907039642333984, -17.8226318359375, -16.738222122192383, -15.653813362121582, -14.569404602050781, -13.48499584197998, -12.40058708190918, -11.316178321838379, -10.231769561767578, -9.147360801696777, -8.062952041625977, -6.978543281555176, -5.894136428833008, -4.809727668762207, -3.7253189086914062, -2.6409101486206055, -1.5565013885498047, -0.4720926284790039, 0.6123161315917969, 1.6967248916625977, 2.7811336517333984, 3.865542411804199, 4.949951171875, 6.034359931945801, 7.118768692016602, 8.203177452087402, 9.287586212158203, 10.371994972229004, 11.456403732299805, 12.540812492370605, 13.625221252441406, 14.709630012512207, 15.794038772583008, 16.878448486328125, 17.96285629272461, 19.047264099121094, 20.13167381286621, 21.216083526611328, 22.300491333007812, 23.384899139404297, 24.469308853149414, 25.55371856689453, 26.638126373291016, 27.7225341796875, 28.806943893432617]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 14.0, 23.0, 18.0, 20.0, 37.0, 37.0, 35.0, 51.0, 55.0, 46.0, 55.0, 69.0, 88.0, 66.0, 63.0, 47.0, 35.0, 40.0, 34.0, 33.0, 20.0, 21.0, 20.0, 21.0, 5.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-29.58866310119629, -28.84001922607422, -28.09137535095215, -27.342731475830078, -26.59408950805664, -25.84544563293457, -25.0968017578125, -24.34815788269043, -23.59951400756836, -22.85087013244629, -22.10222625732422, -21.35358428955078, -20.60494041442871, -19.85629653930664, -19.10765266418457, -18.3590087890625, -17.610366821289062, -16.861722946166992, -16.113079071044922, -15.364436149597168, -14.615793228149414, -13.867149353027344, -13.118505477905273, -12.369861602783203, -11.62121868133545, -10.872574806213379, -10.123931884765625, -9.375288009643555, -8.626644134521484, -7.8780012130737305, -7.12935733795166, -6.380713939666748, -5.632072448730469, -4.883429050445557, -4.1347856521606445, -3.386141777038574, -2.637498378753662, -1.88885498046875, -1.1402111053466797, -0.3915677070617676, 0.35707569122314453, 1.1057192087173462, 1.8543627262115479, 2.603006362915039, 3.351649761199951, 4.100293159484863, 4.848937034606934, 5.597580432891846, 6.346223831176758, 7.09486722946167, 7.843510627746582, 8.592154502868652, 9.340797424316406, 10.089441299438477, 10.838085174560547, 11.586729049682617, 12.335371971130371, 13.084015846252441, 13.832658767700195, 14.581302642822266, 15.329946517944336, 16.078590393066406, 16.827232360839844, 17.575876235961914, 18.324520111083984]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 10.0, 14.0, 27.0, 28.0, 79.0, 94.0, 196.0, 332.0, 592.0, 1227.0, 2710.0, 7500.0, 27449.0, 171932.0, 638496.0, 159553.0, 25979.0, 7050.0, 2723.0, 1142.0, 574.0, 334.0, 205.0, 125.0, 62.0, 34.0, 27.0, 18.0, 17.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.02423095703125, -3.8922119140625, -3.76019287109375, -3.628173828125, -3.49615478515625, -3.3641357421875, -3.23211669921875, -3.10009765625, -2.96807861328125, -2.8360595703125, -2.70404052734375, -2.572021484375, -2.44000244140625, -2.3079833984375, -2.17596435546875, -2.0439453125, -1.91192626953125, -1.7799072265625, -1.64788818359375, -1.515869140625, -1.38385009765625, -1.2518310546875, -1.11981201171875, -0.98779296875, -0.85577392578125, -0.7237548828125, -0.59173583984375, -0.459716796875, -0.32769775390625, -0.1956787109375, -0.06365966796875, 0.068359375, 0.20037841796875, 0.3323974609375, 0.46441650390625, 0.596435546875, 0.72845458984375, 0.8604736328125, 0.99249267578125, 1.12451171875, 1.25653076171875, 1.3885498046875, 1.52056884765625, 1.652587890625, 1.78460693359375, 1.9166259765625, 2.04864501953125, 2.1806640625, 2.31268310546875, 2.4447021484375, 2.57672119140625, 2.708740234375, 2.84075927734375, 2.9727783203125, 3.10479736328125, 3.23681640625, 3.36883544921875, 3.5008544921875, 3.63287353515625, 3.764892578125, 3.89691162109375, 4.0289306640625, 4.16094970703125, 4.29296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 15.0, 8.0, 10.0, 12.0, 17.0, 21.0, 18.0, 22.0, 28.0, 34.0, 41.0, 46.0, 58.0, 57.0, 57.0, 50.0, 58.0, 41.0, 52.0, 54.0, 56.0, 42.0, 30.0, 33.0, 28.0, 16.0, 24.0, 20.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.158233642578125, -2.08599853515625, -2.013763427734375, -1.9415283203125, -1.869293212890625, -1.79705810546875, -1.724822998046875, -1.652587890625, -1.580352783203125, -1.50811767578125, -1.435882568359375, -1.3636474609375, -1.291412353515625, -1.21917724609375, -1.146942138671875, -1.07470703125, -1.002471923828125, -0.93023681640625, -0.858001708984375, -0.7857666015625, -0.713531494140625, -0.64129638671875, -0.569061279296875, -0.496826171875, -0.424591064453125, -0.35235595703125, -0.280120849609375, -0.2078857421875, -0.135650634765625, -0.06341552734375, 0.008819580078125, 0.0810546875, 0.153289794921875, 0.22552490234375, 0.297760009765625, 0.3699951171875, 0.442230224609375, 0.51446533203125, 0.586700439453125, 0.658935546875, 0.731170654296875, 0.80340576171875, 0.875640869140625, 0.9478759765625, 1.020111083984375, 1.09234619140625, 1.164581298828125, 1.23681640625, 1.309051513671875, 1.38128662109375, 1.453521728515625, 1.5257568359375, 1.597991943359375, 1.67022705078125, 1.742462158203125, 1.814697265625, 1.886932373046875, 1.95916748046875, 2.031402587890625, 2.1036376953125, 2.175872802734375, 2.24810791015625, 2.320343017578125, 2.392578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 4.0, 10.0, 10.0, 13.0, 19.0, 30.0, 36.0, 56.0, 79.0, 83.0, 140.0, 213.0, 334.0, 656.0, 1234.0, 2831.0, 8809.0, 43177.0, 517772.0, 417327.0, 41492.0, 8501.0, 2835.0, 1239.0, 601.0, 348.0, 207.0, 152.0, 93.0, 61.0, 50.0, 53.0, 19.0, 14.0, 13.0, 12.0, 8.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.046875, -4.906646728515625, -4.76641845703125, -4.626190185546875, -4.4859619140625, -4.345733642578125, -4.20550537109375, -4.065277099609375, -3.925048828125, -3.784820556640625, -3.64459228515625, -3.504364013671875, -3.3641357421875, -3.223907470703125, -3.08367919921875, -2.943450927734375, -2.80322265625, -2.662994384765625, -2.52276611328125, -2.382537841796875, -2.2423095703125, -2.102081298828125, -1.96185302734375, -1.821624755859375, -1.681396484375, -1.541168212890625, -1.40093994140625, -1.260711669921875, -1.1204833984375, -0.980255126953125, -0.84002685546875, -0.699798583984375, -0.5595703125, -0.419342041015625, -0.27911376953125, -0.138885498046875, 0.0013427734375, 0.141571044921875, 0.28179931640625, 0.422027587890625, 0.562255859375, 0.702484130859375, 0.84271240234375, 0.982940673828125, 1.1231689453125, 1.263397216796875, 1.40362548828125, 1.543853759765625, 1.68408203125, 1.824310302734375, 1.96453857421875, 2.104766845703125, 2.2449951171875, 2.385223388671875, 2.52545166015625, 2.665679931640625, 2.805908203125, 2.946136474609375, 3.08636474609375, 3.226593017578125, 3.3668212890625, 3.507049560546875, 3.64727783203125, 3.787506103515625, 3.927734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 15.0, 14.0, 13.0, 25.0, 26.0, 34.0, 35.0, 52.0, 53.0, 44.0, 65.0, 64.0, 52.0, 64.0, 54.0, 76.0, 49.0, 53.0, 37.0, 27.0, 23.0, 26.0, 16.0, 11.0, 9.0, 7.0, 6.0, 6.0, 6.0, 0.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8187255859375, -8.535888671875, -8.2530517578125, -7.97021484375, -7.6873779296875, -7.404541015625, -7.1217041015625, -6.8388671875, -6.5560302734375, -6.273193359375, -5.9903564453125, -5.70751953125, -5.4246826171875, -5.141845703125, -4.8590087890625, -4.576171875, -4.2933349609375, -4.010498046875, -3.7276611328125, -3.44482421875, -3.1619873046875, -2.879150390625, -2.5963134765625, -2.3134765625, -2.0306396484375, -1.747802734375, -1.4649658203125, -1.18212890625, -0.8992919921875, -0.616455078125, -0.3336181640625, -0.05078125, 0.2320556640625, 0.514892578125, 0.7977294921875, 1.08056640625, 1.3634033203125, 1.646240234375, 1.9290771484375, 2.2119140625, 2.4947509765625, 2.777587890625, 3.0604248046875, 3.34326171875, 3.6260986328125, 3.908935546875, 4.1917724609375, 4.474609375, 4.7574462890625, 5.040283203125, 5.3231201171875, 5.60595703125, 5.8887939453125, 6.171630859375, 6.4544677734375, 6.7373046875, 7.0201416015625, 7.302978515625, 7.5858154296875, 7.86865234375, 8.1514892578125, 8.434326171875, 8.7171630859375, 9.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 17.0, 24.0, 22.0, 62.0, 82.0, 129.0, 199.0, 323.0, 570.0, 1057.0, 2388.0, 5594.0, 15649.0, 58456.0, 627585.0, 271626.0, 43318.0, 12552.0, 4659.0, 1962.0, 1023.0, 493.0, 280.0, 179.0, 87.0, 56.0, 42.0, 36.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7517242431640625, -1.696807861328125, -1.6418914794921875, -1.58697509765625, -1.5320587158203125, -1.477142333984375, -1.4222259521484375, -1.3673095703125, -1.3123931884765625, -1.257476806640625, -1.2025604248046875, -1.14764404296875, -1.0927276611328125, -1.037811279296875, -0.9828948974609375, -0.927978515625, -0.8730621337890625, -0.818145751953125, -0.7632293701171875, -0.70831298828125, -0.6533966064453125, -0.598480224609375, -0.5435638427734375, -0.4886474609375, -0.4337310791015625, -0.378814697265625, -0.3238983154296875, -0.26898193359375, -0.2140655517578125, -0.159149169921875, -0.1042327880859375, -0.04931640625, 0.0055999755859375, 0.060516357421875, 0.1154327392578125, 0.17034912109375, 0.2252655029296875, 0.280181884765625, 0.3350982666015625, 0.3900146484375, 0.4449310302734375, 0.499847412109375, 0.5547637939453125, 0.60968017578125, 0.6645965576171875, 0.719512939453125, 0.7744293212890625, 0.829345703125, 0.8842620849609375, 0.939178466796875, 0.9940948486328125, 1.04901123046875, 1.1039276123046875, 1.158843994140625, 1.2137603759765625, 1.2686767578125, 1.3235931396484375, 1.378509521484375, 1.4334259033203125, 1.48834228515625, 1.5432586669921875, 1.598175048828125, 1.6530914306640625, 1.7080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 4.0, 13.0, 20.0, 32.0, 46.0, 58.0, 80.0, 122.0, 150.0, 146.0, 74.0, 67.0, 47.0, 26.0, 23.0, 16.0, 10.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005035400390625, -0.0004870593547821045, -0.000470578670501709, -0.0004540979862213135, -0.00043761730194091797, -0.00042113661766052246, -0.00040465593338012695, -0.00038817524909973145, -0.00037169456481933594, -0.00035521388053894043, -0.0003387331962585449, -0.0003222525119781494, -0.0003057718276977539, -0.0002892911434173584, -0.0002728104591369629, -0.0002563297748565674, -0.00023984909057617188, -0.00022336840629577637, -0.00020688772201538086, -0.00019040703773498535, -0.00017392635345458984, -0.00015744566917419434, -0.00014096498489379883, -0.00012448430061340332, -0.00010800361633300781, -9.15229320526123e-05, -7.50422477722168e-05, -5.856156349182129e-05, -4.208087921142578e-05, -2.5600194931030273e-05, -9.119510650634766e-06, 7.361173629760742e-06, 2.384185791015625e-05, 4.032254219055176e-05, 5.6803226470947266e-05, 7.328391075134277e-05, 8.976459503173828e-05, 0.00010624527931213379, 0.0001227259635925293, 0.0001392066478729248, 0.0001556873321533203, 0.00017216801643371582, 0.00018864870071411133, 0.00020512938499450684, 0.00022161006927490234, 0.00023809075355529785, 0.00025457143783569336, 0.00027105212211608887, 0.0002875328063964844, 0.0003040134906768799, 0.0003204941749572754, 0.0003369748592376709, 0.0003534555435180664, 0.0003699362277984619, 0.0003864169120788574, 0.00040289759635925293, 0.00041937828063964844, 0.00043585896492004395, 0.00045233964920043945, 0.00046882033348083496, 0.00048530101776123047, 0.000501781702041626, 0.0005182623863220215, 0.000534743070602417, 0.0005512237548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 6.0, 8.0, 20.0, 29.0, 51.0, 64.0, 116.0, 279.0, 622.0, 1682.0, 5975.0, 35047.0, 746901.0, 231614.0, 19796.0, 4080.0, 1262.0, 472.0, 231.0, 87.0, 51.0, 52.0, 26.0, 14.0, 20.0, 10.0, 11.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.059234619140625, -2.96612548828125, -2.873016357421875, -2.7799072265625, -2.686798095703125, -2.59368896484375, -2.500579833984375, -2.407470703125, -2.314361572265625, -2.22125244140625, -2.128143310546875, -2.0350341796875, -1.941925048828125, -1.84881591796875, -1.755706787109375, -1.66259765625, -1.569488525390625, -1.47637939453125, -1.383270263671875, -1.2901611328125, -1.197052001953125, -1.10394287109375, -1.010833740234375, -0.917724609375, -0.824615478515625, -0.73150634765625, -0.638397216796875, -0.5452880859375, -0.452178955078125, -0.35906982421875, -0.265960693359375, -0.1728515625, -0.079742431640625, 0.01336669921875, 0.106475830078125, 0.1995849609375, 0.292694091796875, 0.38580322265625, 0.478912353515625, 0.572021484375, 0.665130615234375, 0.75823974609375, 0.851348876953125, 0.9444580078125, 1.037567138671875, 1.13067626953125, 1.223785400390625, 1.31689453125, 1.410003662109375, 1.50311279296875, 1.596221923828125, 1.6893310546875, 1.782440185546875, 1.87554931640625, 1.968658447265625, 2.061767578125, 2.154876708984375, 2.24798583984375, 2.341094970703125, 2.4342041015625, 2.527313232421875, 2.62042236328125, 2.713531494140625, 2.806640625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 14.0, 21.0, 27.0, 45.0, 69.0, 114.0, 178.0, 173.0, 119.0, 69.0, 54.0, 30.0, 24.0, 15.0, 11.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-4.16015625, -4.0716552734375, -3.983154296875, -3.8946533203125, -3.80615234375, -3.7176513671875, -3.629150390625, -3.5406494140625, -3.4521484375, -3.3636474609375, -3.275146484375, -3.1866455078125, -3.09814453125, -3.0096435546875, -2.921142578125, -2.8326416015625, -2.744140625, -2.6556396484375, -2.567138671875, -2.4786376953125, -2.39013671875, -2.3016357421875, -2.213134765625, -2.1246337890625, -2.0361328125, -1.9476318359375, -1.859130859375, -1.7706298828125, -1.68212890625, -1.5936279296875, -1.505126953125, -1.4166259765625, -1.328125, -1.2396240234375, -1.151123046875, -1.0626220703125, -0.97412109375, -0.8856201171875, -0.797119140625, -0.7086181640625, -0.6201171875, -0.5316162109375, -0.443115234375, -0.3546142578125, -0.26611328125, -0.1776123046875, -0.089111328125, -0.0006103515625, 0.087890625, 0.1763916015625, 0.264892578125, 0.3533935546875, 0.44189453125, 0.5303955078125, 0.618896484375, 0.7073974609375, 0.7958984375, 0.8843994140625, 0.972900390625, 1.0614013671875, 1.14990234375, 1.2384033203125, 1.326904296875, 1.4154052734375, 1.50390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 7.0, 15.0, 26.0, 63.0, 175.0, 430.0, 187.0, 64.0, 16.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.28250122070312, -78.20263671875, -76.12277221679688, -74.04290771484375, -71.96304321289062, -69.8831787109375, -67.80331420898438, -65.72344970703125, -63.64358139038086, -61.563716888427734, -59.48385238647461, -57.403987884521484, -55.324119567871094, -53.24425506591797, -51.164390563964844, -49.08452606201172, -47.004661560058594, -44.92479705810547, -42.844932556152344, -40.76506805419922, -38.685203552246094, -36.60533905029297, -34.52547073364258, -32.44560623168945, -30.365741729736328, -28.285877227783203, -26.206012725830078, -24.12614631652832, -22.046281814575195, -19.96641731262207, -17.886550903320312, -15.806686401367188, -13.726829528808594, -11.646965026855469, -9.567099571228027, -7.487234592437744, -5.407369613647461, -3.327505111694336, -1.2476396560668945, 0.8322257995605469, 2.912090301513672, 4.991955280303955, 7.071820259094238, 9.15168571472168, 11.231550216674805, 13.31141471862793, 15.391280174255371, 17.471145629882812, 19.551010131835938, 21.630874633789062, 23.710739135742188, 25.790605545043945, 27.87047004699707, 29.950334548950195, 32.03020095825195, 34.11006546020508, 36.1899299621582, 38.26979446411133, 40.34965896606445, 42.42952346801758, 44.50939178466797, 46.589256286621094, 48.66912078857422, 50.748985290527344, 52.82884979248047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 14.0, 14.0, 10.0, 30.0, 30.0, 19.0, 24.0, 32.0, 40.0, 53.0, 62.0, 82.0, 98.0, 84.0, 57.0, 54.0, 41.0, 35.0, 30.0, 30.0, 19.0, 18.0, 17.0, 18.0, 11.0, 16.0, 7.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.24529266357422, -29.26091194152832, -28.276531219482422, -27.29214859008789, -26.307767868041992, -25.323387145996094, -24.339006423950195, -23.354625701904297, -22.370243072509766, -21.385862350463867, -20.40148162841797, -19.417098999023438, -18.43271827697754, -17.44833755493164, -16.463956832885742, -15.479575157165527, -14.495194435119629, -13.51081371307373, -12.526432037353516, -11.542051315307617, -10.557669639587402, -9.573288917541504, -8.588907241821289, -7.604526519775391, -6.620145320892334, -5.635764122009277, -4.651382923126221, -3.667001962661743, -2.6826207637786865, -1.698239803314209, -0.7138586044311523, 0.2705225944519043, 1.254903793334961, 2.2392849922180176, 3.223666191101074, 4.208046913146973, 5.1924285888671875, 6.176809310913086, 7.161190509796143, 8.1455717086792, 9.129953384399414, 10.114334106445312, 11.098715782165527, 12.083096504211426, 13.06747817993164, 14.051858901977539, 15.036239624023438, 16.02062225341797, 17.005001068115234, 17.989381790161133, 18.97376251220703, 19.958145141601562, 20.94252586364746, 21.92690658569336, 22.911287307739258, 23.895668029785156, 24.880050659179688, 25.864431381225586, 26.848812103271484, 27.833194732666016, 28.817575454711914, 29.801956176757812, 30.78633689880371, 31.77071762084961, 32.75510025024414]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 5.0, 13.0, 14.0, 15.0, 29.0, 49.0, 75.0, 136.0, 217.0, 367.0, 789.0, 1715.0, 4001.0, 11012.0, 38705.0, 256075.0, 2713143.0, 1038481.0, 95883.0, 21038.0, 6984.0, 2829.0, 1307.0, 608.0, 312.0, 184.0, 93.0, 67.0, 46.0, 24.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.03515625, -3.915679931640625, -3.79620361328125, -3.676727294921875, -3.5572509765625, -3.437774658203125, -3.31829833984375, -3.198822021484375, -3.079345703125, -2.959869384765625, -2.84039306640625, -2.720916748046875, -2.6014404296875, -2.481964111328125, -2.36248779296875, -2.243011474609375, -2.12353515625, -2.004058837890625, -1.88458251953125, -1.765106201171875, -1.6456298828125, -1.526153564453125, -1.40667724609375, -1.287200927734375, -1.167724609375, -1.048248291015625, -0.92877197265625, -0.809295654296875, -0.6898193359375, -0.570343017578125, -0.45086669921875, -0.331390380859375, -0.2119140625, -0.092437744140625, 0.02703857421875, 0.146514892578125, 0.2659912109375, 0.385467529296875, 0.50494384765625, 0.624420166015625, 0.743896484375, 0.863372802734375, 0.98284912109375, 1.102325439453125, 1.2218017578125, 1.341278076171875, 1.46075439453125, 1.580230712890625, 1.69970703125, 1.819183349609375, 1.93865966796875, 2.058135986328125, 2.1776123046875, 2.297088623046875, 2.41656494140625, 2.536041259765625, 2.655517578125, 2.774993896484375, 2.89447021484375, 3.013946533203125, 3.1334228515625, 3.252899169921875, 3.37237548828125, 3.491851806640625, 3.611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 12.0, 11.0, 13.0, 19.0, 16.0, 31.0, 23.0, 32.0, 40.0, 38.0, 44.0, 52.0, 55.0, 52.0, 64.0, 69.0, 63.0, 48.0, 44.0, 48.0, 50.0, 29.0, 27.0, 24.0, 13.0, 19.0, 15.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.939453125, -2.8662872314453125, -2.793121337890625, -2.7199554443359375, -2.64678955078125, -2.5736236572265625, -2.500457763671875, -2.4272918701171875, -2.3541259765625, -2.2809600830078125, -2.207794189453125, -2.1346282958984375, -2.06146240234375, -1.9882965087890625, -1.915130615234375, -1.8419647216796875, -1.768798828125, -1.6956329345703125, -1.622467041015625, -1.5493011474609375, -1.47613525390625, -1.4029693603515625, -1.329803466796875, -1.2566375732421875, -1.1834716796875, -1.1103057861328125, -1.037139892578125, -0.9639739990234375, -0.89080810546875, -0.8176422119140625, -0.744476318359375, -0.6713104248046875, -0.59814453125, -0.5249786376953125, -0.451812744140625, -0.3786468505859375, -0.30548095703125, -0.2323150634765625, -0.159149169921875, -0.0859832763671875, -0.0128173828125, 0.0603485107421875, 0.133514404296875, 0.2066802978515625, 0.27984619140625, 0.3530120849609375, 0.426177978515625, 0.4993438720703125, 0.572509765625, 0.6456756591796875, 0.718841552734375, 0.7920074462890625, 0.86517333984375, 0.9383392333984375, 1.011505126953125, 1.0846710205078125, 1.1578369140625, 1.2310028076171875, 1.304168701171875, 1.3773345947265625, 1.45050048828125, 1.5236663818359375, 1.596832275390625, 1.6699981689453125, 1.7431640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 19.0, 25.0, 27.0, 43.0, 59.0, 128.0, 246.0, 587.0, 1479.0, 4560.0, 18414.0, 121670.0, 3057645.0, 915305.0, 57896.0, 11114.0, 3040.0, 1072.0, 430.0, 198.0, 114.0, 61.0, 37.0, 21.0, 26.0, 13.0, 13.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.1484375, -5.97186279296875, -5.7952880859375, -5.61871337890625, -5.442138671875, -5.26556396484375, -5.0889892578125, -4.91241455078125, -4.73583984375, -4.55926513671875, -4.3826904296875, -4.20611572265625, -4.029541015625, -3.85296630859375, -3.6763916015625, -3.49981689453125, -3.3232421875, -3.14666748046875, -2.9700927734375, -2.79351806640625, -2.616943359375, -2.44036865234375, -2.2637939453125, -2.08721923828125, -1.91064453125, -1.73406982421875, -1.5574951171875, -1.38092041015625, -1.204345703125, -1.02777099609375, -0.8511962890625, -0.67462158203125, -0.498046875, -0.32147216796875, -0.1448974609375, 0.03167724609375, 0.208251953125, 0.38482666015625, 0.5614013671875, 0.73797607421875, 0.91455078125, 1.09112548828125, 1.2677001953125, 1.44427490234375, 1.620849609375, 1.79742431640625, 1.9739990234375, 2.15057373046875, 2.3271484375, 2.50372314453125, 2.6802978515625, 2.85687255859375, 3.033447265625, 3.21002197265625, 3.3865966796875, 3.56317138671875, 3.73974609375, 3.91632080078125, 4.0928955078125, 4.26947021484375, 4.446044921875, 4.62261962890625, 4.7991943359375, 4.97576904296875, 5.15234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 12.0, 9.0, 13.0, 23.0, 42.0, 51.0, 60.0, 86.0, 129.0, 222.0, 376.0, 597.0, 772.0, 580.0, 340.0, 226.0, 128.0, 97.0, 68.0, 49.0, 37.0, 33.0, 27.0, 15.0, 11.0, 6.0, 13.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.9659423828125, -3.826416015625, -3.6868896484375, -3.54736328125, -3.4078369140625, -3.268310546875, -3.1287841796875, -2.9892578125, -2.8497314453125, -2.710205078125, -2.5706787109375, -2.43115234375, -2.2916259765625, -2.152099609375, -2.0125732421875, -1.873046875, -1.7335205078125, -1.593994140625, -1.4544677734375, -1.31494140625, -1.1754150390625, -1.035888671875, -0.8963623046875, -0.7568359375, -0.6173095703125, -0.477783203125, -0.3382568359375, -0.19873046875, -0.0592041015625, 0.080322265625, 0.2198486328125, 0.359375, 0.4989013671875, 0.638427734375, 0.7779541015625, 0.91748046875, 1.0570068359375, 1.196533203125, 1.3360595703125, 1.4755859375, 1.6151123046875, 1.754638671875, 1.8941650390625, 2.03369140625, 2.1732177734375, 2.312744140625, 2.4522705078125, 2.591796875, 2.7313232421875, 2.870849609375, 3.0103759765625, 3.14990234375, 3.2894287109375, 3.428955078125, 3.5684814453125, 3.7080078125, 3.8475341796875, 3.987060546875, 4.1265869140625, 4.26611328125, 4.4056396484375, 4.545166015625, 4.6846923828125, 4.82421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 7.0, 25.0, 63.0, 162.0, 278.0, 252.0, 128.0, 54.0, 13.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.43502426147461, -17.206241607666016, -14.977458953857422, -12.748676300048828, -10.519893646240234, -8.29111099243164, -6.062328338623047, -3.833545684814453, -1.6047630310058594, 0.6240196228027344, 2.852802276611328, 5.081584930419922, 7.310367584228516, 9.53915023803711, 11.767932891845703, 13.996715545654297, 16.22549819946289, 18.454280853271484, 20.683063507080078, 22.911846160888672, 25.140628814697266, 27.36941146850586, 29.598194122314453, 31.826976776123047, 34.05575942993164, 36.284542083740234, 38.51332473754883, 40.74210739135742, 42.970890045166016, 45.19967269897461, 47.4284553527832, 49.6572380065918, 51.886016845703125, 54.11479949951172, 56.34358215332031, 58.572364807128906, 60.8011474609375, 63.029930114746094, 65.25871276855469, 67.48749542236328, 69.71627807617188, 71.94506072998047, 74.17384338378906, 76.40262603759766, 78.63140869140625, 80.86019134521484, 83.08897399902344, 85.31775665283203, 87.54653930664062, 89.77532196044922, 92.00410461425781, 94.2328872680664, 96.461669921875, 98.6904525756836, 100.91923522949219, 103.14801788330078, 105.37680053710938, 107.60558319091797, 109.83436584472656, 112.06314849853516, 114.29193115234375, 116.52071380615234, 118.74949645996094, 120.97827911376953, 123.20706176757812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 6.0, 10.0, 14.0, 10.0, 12.0, 19.0, 21.0, 14.0, 25.0, 27.0, 23.0, 23.0, 33.0, 37.0, 48.0, 39.0, 41.0, 39.0, 44.0, 43.0, 39.0, 42.0, 52.0, 45.0, 38.0, 29.0, 31.0, 31.0, 27.0, 14.0, 16.0, 14.0, 13.0, 9.0, 10.0, 11.0, 15.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.35088539123535, -17.808513641357422, -17.266143798828125, -16.723772048950195, -16.181400299072266, -15.639029502868652, -15.096658706665039, -14.55428695678711, -14.011916160583496, -13.469545364379883, -12.927173614501953, -12.38480281829834, -11.842432022094727, -11.300060272216797, -10.757689476013184, -10.21531867980957, -9.67294692993164, -9.130576133728027, -8.588204383850098, -8.045833587646484, -7.503462314605713, -6.961091041564941, -6.418720245361328, -5.876348972320557, -5.333977699279785, -4.791606426239014, -4.249235153198242, -3.706864356994629, -3.1644930839538574, -2.622121810913086, -2.0797507762908936, -1.5373797416687012, -0.9950065612792969, -0.45263540744781494, 0.08973574638366699, 0.6321069002151489, 1.1744780540466309, 1.7168493270874023, 2.2592203617095947, 2.801591396331787, 3.3439626693725586, 3.88633394241333, 4.428705215454102, 4.971076011657715, 5.513447284698486, 6.055818557739258, 6.598189353942871, 7.140560626983643, 7.682931900024414, 8.225302696228027, 8.767674446105957, 9.31004524230957, 9.8524169921875, 10.394787788391113, 10.937158584594727, 11.479530334472656, 12.02190113067627, 12.564271926879883, 13.106643676757812, 13.649014472961426, 14.191385269165039, 14.733757019042969, 15.276127815246582, 15.818498611450195, 16.360870361328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 13.0, 15.0, 34.0, 35.0, 88.0, 121.0, 172.0, 292.0, 459.0, 934.0, 1989.0, 4221.0, 10510.0, 28967.0, 96860.0, 385302.0, 376936.0, 94628.0, 28222.0, 10400.0, 4260.0, 1910.0, 952.0, 490.0, 269.0, 171.0, 94.0, 75.0, 56.0, 23.0, 24.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.33447265625, -3.2333984375, -3.13232421875, -3.03125, -2.93017578125, -2.8291015625, -2.72802734375, -2.626953125, -2.52587890625, -2.4248046875, -2.32373046875, -2.22265625, -2.12158203125, -2.0205078125, -1.91943359375, -1.818359375, -1.71728515625, -1.6162109375, -1.51513671875, -1.4140625, -1.31298828125, -1.2119140625, -1.11083984375, -1.009765625, -0.90869140625, -0.8076171875, -0.70654296875, -0.60546875, -0.50439453125, -0.4033203125, -0.30224609375, -0.201171875, -0.10009765625, 0.0009765625, 0.10205078125, 0.203125, 0.30419921875, 0.4052734375, 0.50634765625, 0.607421875, 0.70849609375, 0.8095703125, 0.91064453125, 1.01171875, 1.11279296875, 1.2138671875, 1.31494140625, 1.416015625, 1.51708984375, 1.6181640625, 1.71923828125, 1.8203125, 1.92138671875, 2.0224609375, 2.12353515625, 2.224609375, 2.32568359375, 2.4267578125, 2.52783203125, 2.62890625, 2.72998046875, 2.8310546875, 2.93212890625, 3.033203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 6.0, 10.0, 10.0, 9.0, 14.0, 12.0, 16.0, 29.0, 25.0, 31.0, 29.0, 24.0, 34.0, 27.0, 31.0, 37.0, 42.0, 36.0, 55.0, 47.0, 46.0, 51.0, 32.0, 47.0, 35.0, 34.0, 31.0, 28.0, 34.0, 21.0, 19.0, 13.0, 17.0, 6.0, 9.0, 10.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.0382843017578125, -1.976959228515625, -1.9156341552734375, -1.85430908203125, -1.7929840087890625, -1.731658935546875, -1.6703338623046875, -1.6090087890625, -1.5476837158203125, -1.486358642578125, -1.4250335693359375, -1.36370849609375, -1.3023834228515625, -1.241058349609375, -1.1797332763671875, -1.118408203125, -1.0570831298828125, -0.995758056640625, -0.9344329833984375, -0.87310791015625, -0.8117828369140625, -0.750457763671875, -0.6891326904296875, -0.6278076171875, -0.5664825439453125, -0.505157470703125, -0.4438323974609375, -0.38250732421875, -0.3211822509765625, -0.259857177734375, -0.1985321044921875, -0.13720703125, -0.0758819580078125, -0.014556884765625, 0.0467681884765625, 0.10809326171875, 0.1694183349609375, 0.230743408203125, 0.2920684814453125, 0.3533935546875, 0.4147186279296875, 0.476043701171875, 0.5373687744140625, 0.59869384765625, 0.6600189208984375, 0.721343994140625, 0.7826690673828125, 0.843994140625, 0.9053192138671875, 0.966644287109375, 1.0279693603515625, 1.08929443359375, 1.1506195068359375, 1.211944580078125, 1.2732696533203125, 1.3345947265625, 1.3959197998046875, 1.457244873046875, 1.5185699462890625, 1.57989501953125, 1.6412200927734375, 1.702545166015625, 1.7638702392578125, 1.8251953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 15.0, 15.0, 16.0, 20.0, 34.0, 37.0, 43.0, 63.0, 94.0, 155.0, 254.0, 386.0, 634.0, 1092.0, 2358.0, 5917.0, 20900.0, 129893.0, 771564.0, 89035.0, 16307.0, 5061.0, 2083.0, 934.0, 518.0, 360.0, 253.0, 134.0, 111.0, 65.0, 57.0, 41.0, 22.0, 24.0, 11.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.1494140625, -3.998046875, -3.8466796875, -3.6953125, -3.5439453125, -3.392578125, -3.2412109375, -3.08984375, -2.9384765625, -2.787109375, -2.6357421875, -2.484375, -2.3330078125, -2.181640625, -2.0302734375, -1.87890625, -1.7275390625, -1.576171875, -1.4248046875, -1.2734375, -1.1220703125, -0.970703125, -0.8193359375, -0.66796875, -0.5166015625, -0.365234375, -0.2138671875, -0.0625, 0.0888671875, 0.240234375, 0.3916015625, 0.54296875, 0.6943359375, 0.845703125, 0.9970703125, 1.1484375, 1.2998046875, 1.451171875, 1.6025390625, 1.75390625, 1.9052734375, 2.056640625, 2.2080078125, 2.359375, 2.5107421875, 2.662109375, 2.8134765625, 2.96484375, 3.1162109375, 3.267578125, 3.4189453125, 3.5703125, 3.7216796875, 3.873046875, 4.0244140625, 4.17578125, 4.3271484375, 4.478515625, 4.6298828125, 4.78125, 4.9326171875, 5.083984375, 5.2353515625, 5.38671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 6.0, 6.0, 6.0, 9.0, 8.0, 25.0, 15.0, 21.0, 35.0, 33.0, 44.0, 63.0, 55.0, 56.0, 74.0, 68.0, 67.0, 68.0, 64.0, 57.0, 50.0, 31.0, 27.0, 21.0, 16.0, 24.0, 14.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.0960693359375, -8.778076171875, -8.4600830078125, -8.14208984375, -7.8240966796875, -7.506103515625, -7.1881103515625, -6.8701171875, -6.5521240234375, -6.234130859375, -5.9161376953125, -5.59814453125, -5.2801513671875, -4.962158203125, -4.6441650390625, -4.326171875, -4.0081787109375, -3.690185546875, -3.3721923828125, -3.05419921875, -2.7362060546875, -2.418212890625, -2.1002197265625, -1.7822265625, -1.4642333984375, -1.146240234375, -0.8282470703125, -0.51025390625, -0.1922607421875, 0.125732421875, 0.4437255859375, 0.76171875, 1.0797119140625, 1.397705078125, 1.7156982421875, 2.03369140625, 2.3516845703125, 2.669677734375, 2.9876708984375, 3.3056640625, 3.6236572265625, 3.941650390625, 4.2596435546875, 4.57763671875, 4.8956298828125, 5.213623046875, 5.5316162109375, 5.849609375, 6.1676025390625, 6.485595703125, 6.8035888671875, 7.12158203125, 7.4395751953125, 7.757568359375, 8.0755615234375, 8.3935546875, 8.7115478515625, 9.029541015625, 9.3475341796875, 9.66552734375, 9.9835205078125, 10.301513671875, 10.6195068359375, 10.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 12.0, 13.0, 18.0, 26.0, 60.0, 91.0, 122.0, 184.0, 285.0, 470.0, 814.0, 1447.0, 3127.0, 7910.0, 32942.0, 332038.0, 617047.0, 36446.0, 8571.0, 3200.0, 1511.0, 867.0, 497.0, 259.0, 183.0, 145.0, 83.0, 50.0, 45.0, 27.0, 18.0, 6.0, 11.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.7038726806640625, -1.648956298828125, -1.5940399169921875, -1.53912353515625, -1.4842071533203125, -1.429290771484375, -1.3743743896484375, -1.3194580078125, -1.2645416259765625, -1.209625244140625, -1.1547088623046875, -1.09979248046875, -1.0448760986328125, -0.989959716796875, -0.9350433349609375, -0.880126953125, -0.8252105712890625, -0.770294189453125, -0.7153778076171875, -0.66046142578125, -0.6055450439453125, -0.550628662109375, -0.4957122802734375, -0.4407958984375, -0.3858795166015625, -0.330963134765625, -0.2760467529296875, -0.22113037109375, -0.1662139892578125, -0.111297607421875, -0.0563812255859375, -0.00146484375, 0.0534515380859375, 0.108367919921875, 0.1632843017578125, 0.21820068359375, 0.2731170654296875, 0.328033447265625, 0.3829498291015625, 0.4378662109375, 0.4927825927734375, 0.547698974609375, 0.6026153564453125, 0.65753173828125, 0.7124481201171875, 0.767364501953125, 0.8222808837890625, 0.877197265625, 0.9321136474609375, 0.987030029296875, 1.0419464111328125, 1.09686279296875, 1.1517791748046875, 1.206695556640625, 1.2616119384765625, 1.3165283203125, 1.3714447021484375, 1.426361083984375, 1.4812774658203125, 1.53619384765625, 1.5911102294921875, 1.646026611328125, 1.7009429931640625, 1.755859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 9.0, 14.0, 17.0, 28.0, 46.0, 101.0, 153.0, 270.0, 168.0, 74.0, 44.0, 19.0, 16.0, 9.0, 6.0, 3.0, 8.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006971359252929688, -0.0006707906723022461, -0.0006444454193115234, -0.0006181001663208008, -0.0005917549133300781, -0.0005654096603393555, -0.0005390644073486328, -0.0005127191543579102, -0.0004863739013671875, -0.00046002864837646484, -0.0004336833953857422, -0.00040733814239501953, -0.0003809928894042969, -0.0003546476364135742, -0.00032830238342285156, -0.0003019571304321289, -0.00027561187744140625, -0.0002492666244506836, -0.00022292137145996094, -0.00019657611846923828, -0.00017023086547851562, -0.00014388561248779297, -0.00011754035949707031, -9.119510650634766e-05, -6.4849853515625e-05, -3.8504600524902344e-05, -1.2159347534179688e-05, 1.4185905456542969e-05, 4.0531158447265625e-05, 6.687641143798828e-05, 9.322166442871094e-05, 0.0001195669174194336, 0.00014591217041015625, 0.0001722574234008789, 0.00019860267639160156, 0.00022494792938232422, 0.0002512931823730469, 0.00027763843536376953, 0.0003039836883544922, 0.00033032894134521484, 0.0003566741943359375, 0.00038301944732666016, 0.0004093647003173828, 0.00043570995330810547, 0.0004620552062988281, 0.0004884004592895508, 0.0005147457122802734, 0.0005410909652709961, 0.0005674362182617188, 0.0005937814712524414, 0.0006201267242431641, 0.0006464719772338867, 0.0006728172302246094, 0.000699162483215332, 0.0007255077362060547, 0.0007518529891967773, 0.0007781982421875, 0.0008045434951782227, 0.0008308887481689453, 0.000857234001159668, 0.0008835792541503906, 0.0009099245071411133, 0.0009362697601318359, 0.0009626150131225586, 0.0009889602661132812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 10.0, 6.0, 10.0, 16.0, 24.0, 41.0, 63.0, 102.0, 190.0, 306.0, 615.0, 1319.0, 3072.0, 8589.0, 31210.0, 187497.0, 718816.0, 71877.0, 15744.0, 5047.0, 2010.0, 897.0, 453.0, 278.0, 112.0, 84.0, 60.0, 39.0, 23.0, 20.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.357421875, -1.3076171875, -1.2578125, -1.2080078125, -1.158203125, -1.1083984375, -1.05859375, -1.0087890625, -0.958984375, -0.9091796875, -0.859375, -0.8095703125, -0.759765625, -0.7099609375, -0.66015625, -0.6103515625, -0.560546875, -0.5107421875, -0.4609375, -0.4111328125, -0.361328125, -0.3115234375, -0.26171875, -0.2119140625, -0.162109375, -0.1123046875, -0.0625, -0.0126953125, 0.037109375, 0.0869140625, 0.13671875, 0.1865234375, 0.236328125, 0.2861328125, 0.3359375, 0.3857421875, 0.435546875, 0.4853515625, 0.53515625, 0.5849609375, 0.634765625, 0.6845703125, 0.734375, 0.7841796875, 0.833984375, 0.8837890625, 0.93359375, 0.9833984375, 1.033203125, 1.0830078125, 1.1328125, 1.1826171875, 1.232421875, 1.2822265625, 1.33203125, 1.3818359375, 1.431640625, 1.4814453125, 1.53125, 1.5810546875, 1.630859375, 1.6806640625, 1.73046875, 1.7802734375, 1.830078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 19.0, 24.0, 15.0, 48.0, 39.0, 53.0, 88.0, 117.0, 117.0, 127.0, 78.0, 55.0, 41.0, 47.0, 28.0, 27.0, 11.0, 13.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.919921875, -1.865875244140625, -1.81182861328125, -1.757781982421875, -1.7037353515625, -1.649688720703125, -1.59564208984375, -1.541595458984375, -1.487548828125, -1.433502197265625, -1.37945556640625, -1.325408935546875, -1.2713623046875, -1.217315673828125, -1.16326904296875, -1.109222412109375, -1.05517578125, -1.001129150390625, -0.94708251953125, -0.893035888671875, -0.8389892578125, -0.784942626953125, -0.73089599609375, -0.676849365234375, -0.622802734375, -0.568756103515625, -0.51470947265625, -0.460662841796875, -0.4066162109375, -0.352569580078125, -0.29852294921875, -0.244476318359375, -0.1904296875, -0.136383056640625, -0.08233642578125, -0.028289794921875, 0.0257568359375, 0.079803466796875, 0.13385009765625, 0.187896728515625, 0.241943359375, 0.295989990234375, 0.35003662109375, 0.404083251953125, 0.4581298828125, 0.512176513671875, 0.56622314453125, 0.620269775390625, 0.67431640625, 0.728363037109375, 0.78240966796875, 0.836456298828125, 0.8905029296875, 0.944549560546875, 0.99859619140625, 1.052642822265625, 1.106689453125, 1.160736083984375, 1.21478271484375, 1.268829345703125, 1.3228759765625, 1.376922607421875, 1.43096923828125, 1.485015869140625, 1.5390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 8.0, 30.0, 126.0, 594.0, 177.0, 39.0, 12.0, 9.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.8374786376953, -169.2025604248047, -165.567626953125, -161.93270874023438, -158.2977752685547, -154.66285705566406, -151.02792358398438, -147.39300537109375, -143.75808715820312, -140.1231689453125, -136.4882354736328, -132.8533172607422, -129.2183837890625, -125.58346557617188, -121.94853973388672, -118.31361389160156, -114.67868041992188, -111.04375457763672, -107.40882873535156, -103.77391052246094, -100.13898468017578, -96.50405883789062, -92.86913299560547, -89.23420715332031, -85.59928894042969, -81.96436309814453, -78.32943725585938, -74.69451904296875, -71.0595932006836, -67.42466735839844, -63.78974151611328, -60.154815673828125, -56.51988983154297, -52.88496398925781, -49.25004196166992, -45.615116119384766, -41.98019027709961, -38.34526824951172, -34.71034240722656, -31.075416564941406, -27.440492630004883, -23.80556869506836, -20.170642852783203, -16.53571891784668, -12.90079402923584, -9.265869140625, -5.630945205688477, -1.9960193634033203, 1.6389045715332031, 5.273829460144043, 8.908754348754883, 12.543678283691406, 16.178604125976562, 19.813528060913086, 23.44845199584961, 27.083377838134766, 30.71830177307129, 34.35322570800781, 37.98815155029297, 41.623077392578125, 45.257999420166016, 48.89292526245117, 52.52784729003906, 56.16277313232422, 59.797698974609375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 13.0, 7.0, 20.0, 14.0, 21.0, 24.0, 33.0, 34.0, 27.0, 28.0, 35.0, 51.0, 85.0, 96.0, 104.0, 86.0, 35.0, 33.0, 34.0, 18.0, 32.0, 19.0, 13.0, 16.0, 9.0, 15.0, 13.0, 3.0, 18.0, 7.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31207275390625, -28.33296012878418, -27.35384750366211, -26.374736785888672, -25.3956241607666, -24.41651153564453, -23.43739891052246, -22.45828628540039, -21.479175567626953, -20.500062942504883, -19.520950317382812, -18.541839599609375, -17.562726974487305, -16.583614349365234, -15.604501724243164, -14.625389099121094, -13.646276473999023, -12.667163848876953, -11.6880521774292, -10.708939552307129, -9.729827880859375, -8.750715255737305, -7.771602630615234, -6.792490482330322, -5.81337833404541, -4.834266185760498, -3.855153799057007, -2.8760414123535156, -1.8969292640686035, -0.9178171157836914, 0.061295509338378906, 1.040407657623291, 2.019519805908203, 2.9986319541931152, 3.9777443408966064, 4.956856727600098, 5.93596887588501, 6.915081024169922, 7.894193649291992, 8.873306274414062, 9.852417945861816, 10.831530570983887, 11.81064224243164, 12.789754867553711, 13.768867492675781, 14.747979164123535, 15.727091789245605, 16.70620346069336, 17.68531608581543, 18.6644287109375, 19.64354133605957, 20.62265396118164, 21.601764678955078, 22.58087730407715, 23.55998992919922, 24.53910255432129, 25.51821517944336, 26.49732780456543, 27.4764404296875, 28.455551147460938, 29.434663772583008, 30.413776397705078, 31.39288902282715, 32.37200164794922, 33.351112365722656]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 6.0, 5.0, 14.0, 23.0, 19.0, 39.0, 71.0, 101.0, 175.0, 357.0, 616.0, 1278.0, 2654.0, 6734.0, 20048.0, 74674.0, 457703.0, 2455829.0, 986113.0, 138410.0, 31940.0, 10056.0, 3806.0, 1770.0, 842.0, 428.0, 219.0, 150.0, 85.0, 41.0, 29.0, 21.0, 9.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.19921875, -6.046844482421875, -5.89447021484375, -5.742095947265625, -5.5897216796875, -5.437347412109375, -5.28497314453125, -5.132598876953125, -4.980224609375, -4.827850341796875, -4.67547607421875, -4.523101806640625, -4.3707275390625, -4.218353271484375, -4.06597900390625, -3.913604736328125, -3.76123046875, -3.608856201171875, -3.45648193359375, -3.304107666015625, -3.1517333984375, -2.999359130859375, -2.84698486328125, -2.694610595703125, -2.542236328125, -2.389862060546875, -2.23748779296875, -2.085113525390625, -1.9327392578125, -1.780364990234375, -1.62799072265625, -1.475616455078125, -1.3232421875, -1.170867919921875, -1.01849365234375, -0.866119384765625, -0.7137451171875, -0.561370849609375, -0.40899658203125, -0.256622314453125, -0.104248046875, 0.048126220703125, 0.20050048828125, 0.352874755859375, 0.5052490234375, 0.657623291015625, 0.80999755859375, 0.962371826171875, 1.11474609375, 1.267120361328125, 1.41949462890625, 1.571868896484375, 1.7242431640625, 1.876617431640625, 2.02899169921875, 2.181365966796875, 2.333740234375, 2.486114501953125, 2.63848876953125, 2.790863037109375, 2.9432373046875, 3.095611572265625, 3.24798583984375, 3.400360107421875, 3.552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 11.0, 12.0, 12.0, 15.0, 26.0, 25.0, 15.0, 28.0, 26.0, 30.0, 29.0, 32.0, 43.0, 39.0, 38.0, 41.0, 43.0, 62.0, 42.0, 50.0, 50.0, 43.0, 43.0, 45.0, 27.0, 24.0, 25.0, 9.0, 20.0, 15.0, 15.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-2.37890625, -2.315155029296875, -2.25140380859375, -2.187652587890625, -2.1239013671875, -2.060150146484375, -1.99639892578125, -1.932647705078125, -1.868896484375, -1.805145263671875, -1.74139404296875, -1.677642822265625, -1.6138916015625, -1.550140380859375, -1.48638916015625, -1.422637939453125, -1.35888671875, -1.295135498046875, -1.23138427734375, -1.167633056640625, -1.1038818359375, -1.040130615234375, -0.97637939453125, -0.912628173828125, -0.848876953125, -0.785125732421875, -0.72137451171875, -0.657623291015625, -0.5938720703125, -0.530120849609375, -0.46636962890625, -0.402618408203125, -0.3388671875, -0.275115966796875, -0.21136474609375, -0.147613525390625, -0.0838623046875, -0.020111083984375, 0.04364013671875, 0.107391357421875, 0.171142578125, 0.234893798828125, 0.29864501953125, 0.362396240234375, 0.4261474609375, 0.489898681640625, 0.55364990234375, 0.617401123046875, 0.68115234375, 0.744903564453125, 0.80865478515625, 0.872406005859375, 0.9361572265625, 0.999908447265625, 1.06365966796875, 1.127410888671875, 1.191162109375, 1.254913330078125, 1.31866455078125, 1.382415771484375, 1.4461669921875, 1.509918212890625, 1.57366943359375, 1.637420654296875, 1.701171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 15.0, 28.0, 17.0, 35.0, 49.0, 88.0, 122.0, 171.0, 317.0, 704.0, 1785.0, 7203.0, 100886.0, 3958150.0, 113907.0, 7537.0, 1754.0, 648.0, 323.0, 195.0, 122.0, 64.0, 39.0, 34.0, 20.0, 14.0, 8.0, 7.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.9920654296875, -16.499755859375, -16.0074462890625, -15.51513671875, -15.0228271484375, -14.530517578125, -14.0382080078125, -13.5458984375, -13.0535888671875, -12.561279296875, -12.0689697265625, -11.57666015625, -11.0843505859375, -10.592041015625, -10.0997314453125, -9.607421875, -9.1151123046875, -8.622802734375, -8.1304931640625, -7.63818359375, -7.1458740234375, -6.653564453125, -6.1612548828125, -5.6689453125, -5.1766357421875, -4.684326171875, -4.1920166015625, -3.69970703125, -3.2073974609375, -2.715087890625, -2.2227783203125, -1.73046875, -1.2381591796875, -0.745849609375, -0.2535400390625, 0.23876953125, 0.7310791015625, 1.223388671875, 1.7156982421875, 2.2080078125, 2.7003173828125, 3.192626953125, 3.6849365234375, 4.17724609375, 4.6695556640625, 5.161865234375, 5.6541748046875, 6.146484375, 6.6387939453125, 7.131103515625, 7.6234130859375, 8.11572265625, 8.6080322265625, 9.100341796875, 9.5926513671875, 10.0849609375, 10.5772705078125, 11.069580078125, 11.5618896484375, 12.05419921875, 12.5465087890625, 13.038818359375, 13.5311279296875, 14.0234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 5.0, 9.0, 10.0, 21.0, 23.0, 34.0, 45.0, 75.0, 88.0, 151.0, 220.0, 343.0, 528.0, 774.0, 611.0, 388.0, 250.0, 140.0, 120.0, 67.0, 52.0, 40.0, 33.0, 15.0, 11.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.671875, -9.392333984375, -9.11279296875, -8.833251953125, -8.5537109375, -8.274169921875, -7.99462890625, -7.715087890625, -7.435546875, -7.156005859375, -6.87646484375, -6.596923828125, -6.3173828125, -6.037841796875, -5.75830078125, -5.478759765625, -5.19921875, -4.919677734375, -4.64013671875, -4.360595703125, -4.0810546875, -3.801513671875, -3.52197265625, -3.242431640625, -2.962890625, -2.683349609375, -2.40380859375, -2.124267578125, -1.8447265625, -1.565185546875, -1.28564453125, -1.006103515625, -0.7265625, -0.447021484375, -0.16748046875, 0.112060546875, 0.3916015625, 0.671142578125, 0.95068359375, 1.230224609375, 1.509765625, 1.789306640625, 2.06884765625, 2.348388671875, 2.6279296875, 2.907470703125, 3.18701171875, 3.466552734375, 3.74609375, 4.025634765625, 4.30517578125, 4.584716796875, 4.8642578125, 5.143798828125, 5.42333984375, 5.702880859375, 5.982421875, 6.261962890625, 6.54150390625, 6.821044921875, 7.1005859375, 7.380126953125, 7.65966796875, 7.939208984375, 8.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 16.0, 15.0, 41.0, 64.0, 104.0, 153.0, 179.0, 163.0, 95.0, 59.0, 29.0, 25.0, 18.0, 7.0, 2.0, 8.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.10050964355469, -82.2998046875, -79.49910736083984, -76.69840240478516, -73.897705078125, -71.09700012207031, -68.29629516601562, -65.49559020996094, -62.69489288330078, -59.89419174194336, -57.09349060058594, -54.29278564453125, -51.49208450317383, -48.691383361816406, -45.89067840576172, -43.0899772644043, -40.289276123046875, -37.48857498168945, -34.68787384033203, -31.887168884277344, -29.086467742919922, -26.2857666015625, -23.485063552856445, -20.68436050415039, -17.88365936279297, -15.08295726776123, -12.282255172729492, -9.481553077697754, -6.680850982666016, -3.8801488876342773, -1.079446792602539, 1.7212562561035156, 4.521949768066406, 7.3226518630981445, 10.123353958129883, 12.924056053161621, 15.72475814819336, 18.52545928955078, 21.326162338256836, 24.12686538696289, 26.927566528320312, 29.728267669677734, 32.528968811035156, 35.329673767089844, 38.130374908447266, 40.93107604980469, 43.731781005859375, 46.5324821472168, 49.33318328857422, 52.13388442993164, 54.93458557128906, 57.73529052734375, 60.53599166870117, 63.336692810058594, 66.13739776611328, 68.93809509277344, 71.73880004882812, 74.53950500488281, 77.34020233154297, 80.14090728759766, 82.94160461425781, 85.7423095703125, 88.54301452636719, 91.34371948242188, 94.14441680908203]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 13.0, 11.0, 17.0, 17.0, 21.0, 17.0, 28.0, 28.0, 26.0, 38.0, 35.0, 43.0, 42.0, 31.0, 63.0, 54.0, 77.0, 65.0, 48.0, 35.0, 42.0, 33.0, 34.0, 29.0, 31.0, 24.0, 21.0, 15.0, 10.0, 13.0, 11.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.560752868652344, -41.1661262512207, -39.77149963378906, -38.37687301635742, -36.98224639892578, -35.587623596191406, -34.1929931640625, -32.798370361328125, -31.403743743896484, -30.009117126464844, -28.614490509033203, -27.219863891601562, -25.825239181518555, -24.430612564086914, -23.035985946655273, -21.641361236572266, -20.246732711791992, -18.85210609436035, -17.45747947692871, -16.062854766845703, -14.668228149414062, -13.273601531982422, -11.878974914550781, -10.484349250793457, -9.089722633361816, -7.695096492767334, -6.300470352172852, -4.905843734741211, -3.5112175941467285, -2.116591453552246, -0.7219648361206055, 0.6726608276367188, 2.0672874450683594, 3.461913585662842, 4.856539726257324, 6.251166343688965, 7.645792484283447, 9.04041862487793, 10.43504524230957, 11.829670906066895, 13.224297523498535, 14.618924140930176, 16.0135498046875, 17.40817642211914, 18.80280303955078, 20.197429656982422, 21.592056274414062, 22.98668098449707, 24.38130760192871, 25.77593421936035, 27.170560836791992, 28.565185546875, 29.95981216430664, 31.35443878173828, 32.74906539916992, 34.14369201660156, 35.5383186340332, 36.932945251464844, 38.327571868896484, 39.722198486328125, 41.116825103759766, 42.511451721191406, 43.90607452392578, 45.30070114135742, 46.69532775878906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 12.0, 21.0, 23.0, 47.0, 80.0, 149.0, 296.0, 627.0, 1335.0, 3488.0, 11567.0, 52423.0, 503832.0, 411947.0, 46219.0, 10639.0, 3328.0, 1276.0, 603.0, 288.0, 162.0, 84.0, 39.0, 33.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.48828125, -6.3173828125, -6.146484375, -5.9755859375, -5.8046875, -5.6337890625, -5.462890625, -5.2919921875, -5.12109375, -4.9501953125, -4.779296875, -4.6083984375, -4.4375, -4.2666015625, -4.095703125, -3.9248046875, -3.75390625, -3.5830078125, -3.412109375, -3.2412109375, -3.0703125, -2.8994140625, -2.728515625, -2.5576171875, -2.38671875, -2.2158203125, -2.044921875, -1.8740234375, -1.703125, -1.5322265625, -1.361328125, -1.1904296875, -1.01953125, -0.8486328125, -0.677734375, -0.5068359375, -0.3359375, -0.1650390625, 0.005859375, 0.1767578125, 0.34765625, 0.5185546875, 0.689453125, 0.8603515625, 1.03125, 1.2021484375, 1.373046875, 1.5439453125, 1.71484375, 1.8857421875, 2.056640625, 2.2275390625, 2.3984375, 2.5693359375, 2.740234375, 2.9111328125, 3.08203125, 3.2529296875, 3.423828125, 3.5947265625, 3.765625, 3.9365234375, 4.107421875, 4.2783203125, 4.44921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 6.0, 10.0, 6.0, 9.0, 26.0, 19.0, 20.0, 36.0, 33.0, 37.0, 37.0, 65.0, 51.0, 58.0, 54.0, 53.0, 89.0, 58.0, 58.0, 50.0, 42.0, 37.0, 33.0, 31.0, 16.0, 21.0, 9.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.49609375, -3.37030029296875, -3.2445068359375, -3.11871337890625, -2.992919921875, -2.86712646484375, -2.7413330078125, -2.61553955078125, -2.48974609375, -2.36395263671875, -2.2381591796875, -2.11236572265625, -1.986572265625, -1.86077880859375, -1.7349853515625, -1.60919189453125, -1.4833984375, -1.35760498046875, -1.2318115234375, -1.10601806640625, -0.980224609375, -0.85443115234375, -0.7286376953125, -0.60284423828125, -0.47705078125, -0.35125732421875, -0.2254638671875, -0.09967041015625, 0.026123046875, 0.15191650390625, 0.2777099609375, 0.40350341796875, 0.529296875, 0.65509033203125, 0.7808837890625, 0.90667724609375, 1.032470703125, 1.15826416015625, 1.2840576171875, 1.40985107421875, 1.53564453125, 1.66143798828125, 1.7872314453125, 1.91302490234375, 2.038818359375, 2.16461181640625, 2.2904052734375, 2.41619873046875, 2.5419921875, 2.66778564453125, 2.7935791015625, 2.91937255859375, 3.045166015625, 3.17095947265625, 3.2967529296875, 3.42254638671875, 3.54833984375, 3.67413330078125, 3.7999267578125, 3.92572021484375, 4.051513671875, 4.17730712890625, 4.3031005859375, 4.42889404296875, 4.5546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 10.0, 7.0, 21.0, 26.0, 37.0, 40.0, 71.0, 113.0, 185.0, 304.0, 533.0, 1169.0, 3408.0, 12334.0, 75402.0, 879342.0, 59583.0, 10544.0, 3002.0, 1111.0, 509.0, 272.0, 159.0, 92.0, 79.0, 61.0, 31.0, 22.0, 23.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0078125, -4.8377685546875, -4.667724609375, -4.4976806640625, -4.32763671875, -4.1575927734375, -3.987548828125, -3.8175048828125, -3.6474609375, -3.4774169921875, -3.307373046875, -3.1373291015625, -2.96728515625, -2.7972412109375, -2.627197265625, -2.4571533203125, -2.287109375, -2.1170654296875, -1.947021484375, -1.7769775390625, -1.60693359375, -1.4368896484375, -1.266845703125, -1.0968017578125, -0.9267578125, -0.7567138671875, -0.586669921875, -0.4166259765625, -0.24658203125, -0.0765380859375, 0.093505859375, 0.2635498046875, 0.43359375, 0.6036376953125, 0.773681640625, 0.9437255859375, 1.11376953125, 1.2838134765625, 1.453857421875, 1.6239013671875, 1.7939453125, 1.9639892578125, 2.134033203125, 2.3040771484375, 2.47412109375, 2.6441650390625, 2.814208984375, 2.9842529296875, 3.154296875, 3.3243408203125, 3.494384765625, 3.6644287109375, 3.83447265625, 4.0045166015625, 4.174560546875, 4.3446044921875, 4.5146484375, 4.6846923828125, 4.854736328125, 5.0247802734375, 5.19482421875, 5.3648681640625, 5.534912109375, 5.7049560546875, 5.875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 8.0, 8.0, 13.0, 14.0, 16.0, 18.0, 26.0, 31.0, 31.0, 33.0, 35.0, 55.0, 67.0, 73.0, 70.0, 67.0, 62.0, 61.0, 51.0, 41.0, 24.0, 22.0, 27.0, 9.0, 19.0, 18.0, 9.0, 6.0, 9.0, 8.0, 10.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-12.546875, -12.176513671875, -11.80615234375, -11.435791015625, -11.0654296875, -10.695068359375, -10.32470703125, -9.954345703125, -9.583984375, -9.213623046875, -8.84326171875, -8.472900390625, -8.1025390625, -7.732177734375, -7.36181640625, -6.991455078125, -6.62109375, -6.250732421875, -5.88037109375, -5.510009765625, -5.1396484375, -4.769287109375, -4.39892578125, -4.028564453125, -3.658203125, -3.287841796875, -2.91748046875, -2.547119140625, -2.1767578125, -1.806396484375, -1.43603515625, -1.065673828125, -0.6953125, -0.324951171875, 0.04541015625, 0.415771484375, 0.7861328125, 1.156494140625, 1.52685546875, 1.897216796875, 2.267578125, 2.637939453125, 3.00830078125, 3.378662109375, 3.7490234375, 4.119384765625, 4.48974609375, 4.860107421875, 5.23046875, 5.600830078125, 5.97119140625, 6.341552734375, 6.7119140625, 7.082275390625, 7.45263671875, 7.822998046875, 8.193359375, 8.563720703125, 8.93408203125, 9.304443359375, 9.6748046875, 10.045166015625, 10.41552734375, 10.785888671875, 11.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 4.0, 11.0, 12.0, 14.0, 22.0, 32.0, 31.0, 56.0, 70.0, 132.0, 197.0, 270.0, 503.0, 791.0, 1644.0, 3586.0, 8334.0, 23900.0, 105355.0, 796972.0, 74370.0, 18964.0, 7000.0, 2948.0, 1421.0, 703.0, 431.0, 256.0, 153.0, 112.0, 70.0, 49.0, 36.0, 24.0, 24.0, 14.0, 11.0, 9.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.82568359375, -0.8023605346679688, -0.7790374755859375, -0.7557144165039062, -0.732391357421875, -0.7090682983398438, -0.6857452392578125, -0.6624221801757812, -0.63909912109375, -0.6157760620117188, -0.5924530029296875, -0.5691299438476562, -0.545806884765625, -0.5224838256835938, -0.4991607666015625, -0.47583770751953125, -0.4525146484375, -0.42919158935546875, -0.4058685302734375, -0.38254547119140625, -0.359222412109375, -0.33589935302734375, -0.3125762939453125, -0.28925323486328125, -0.26593017578125, -0.24260711669921875, -0.2192840576171875, -0.19596099853515625, -0.172637939453125, -0.14931488037109375, -0.1259918212890625, -0.10266876220703125, -0.079345703125, -0.05602264404296875, -0.0326995849609375, -0.00937652587890625, 0.013946533203125, 0.03726959228515625, 0.0605926513671875, 0.08391571044921875, 0.10723876953125, 0.13056182861328125, 0.1538848876953125, 0.17720794677734375, 0.200531005859375, 0.22385406494140625, 0.2471771240234375, 0.27050018310546875, 0.2938232421875, 0.31714630126953125, 0.3404693603515625, 0.36379241943359375, 0.387115478515625, 0.41043853759765625, 0.4337615966796875, 0.45708465576171875, 0.48040771484375, 0.5037307739257812, 0.5270538330078125, 0.5503768920898438, 0.573699951171875, 0.5970230102539062, 0.6203460693359375, 0.6436691284179688, 0.6669921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 7.0, 6.0, 14.0, 25.0, 15.0, 42.0, 41.0, 48.0, 88.0, 102.0, 114.0, 109.0, 108.0, 66.0, 38.0, 40.0, 27.0, 21.0, 14.0, 15.0, 5.0, 8.0, 5.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002675056457519531, -0.0002602245658636093, -0.0002529434859752655, -0.0002456624060869217, -0.00023838132619857788, -0.00023110024631023407, -0.00022381916642189026, -0.00021653808653354645, -0.00020925700664520264, -0.00020197592675685883, -0.00019469484686851501, -0.0001874137669801712, -0.0001801326870918274, -0.00017285160720348358, -0.00016557052731513977, -0.00015828944742679596, -0.00015100836753845215, -0.00014372728765010834, -0.00013644620776176453, -0.00012916512787342072, -0.0001218840479850769, -0.0001146029680967331, -0.00010732188820838928, -0.00010004080832004547, -9.275972843170166e-05, -8.547864854335785e-05, -7.819756865501404e-05, -7.091648876667023e-05, -6.363540887832642e-05, -5.6354328989982605e-05, -4.9073249101638794e-05, -4.179216921329498e-05, -3.451108932495117e-05, -2.723000943660736e-05, -1.994892954826355e-05, -1.2667849659919739e-05, -5.386769771575928e-06, 1.8943101167678833e-06, 9.175390005111694e-06, 1.6456469893455505e-05, 2.3737549781799316e-05, 3.101862967014313e-05, 3.829970955848694e-05, 4.558078944683075e-05, 5.286186933517456e-05, 6.014294922351837e-05, 6.742402911186218e-05, 7.4705109000206e-05, 8.19861888885498e-05, 8.926726877689362e-05, 9.654834866523743e-05, 0.00010382942855358124, 0.00011111050844192505, 0.00011839158833026886, 0.00012567266821861267, 0.00013295374810695648, 0.0001402348279953003, 0.0001475159078836441, 0.00015479698777198792, 0.00016207806766033173, 0.00016935914754867554, 0.00017664022743701935, 0.00018392130732536316, 0.00019120238721370697, 0.00019848346710205078]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 16.0, 7.0, 12.0, 18.0, 26.0, 46.0, 76.0, 85.0, 128.0, 212.0, 328.0, 585.0, 991.0, 2026.0, 4190.0, 10450.0, 30537.0, 161880.0, 761164.0, 49798.0, 14657.0, 5631.0, 2503.0, 1313.0, 744.0, 403.0, 270.0, 157.0, 95.0, 65.0, 48.0, 38.0, 17.0, 14.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.86279296875, -0.8310546875, -0.79931640625, -0.767578125, -0.73583984375, -0.7041015625, -0.67236328125, -0.640625, -0.60888671875, -0.5771484375, -0.54541015625, -0.513671875, -0.48193359375, -0.4501953125, -0.41845703125, -0.38671875, -0.35498046875, -0.3232421875, -0.29150390625, -0.259765625, -0.22802734375, -0.1962890625, -0.16455078125, -0.1328125, -0.10107421875, -0.0693359375, -0.03759765625, -0.005859375, 0.02587890625, 0.0576171875, 0.08935546875, 0.12109375, 0.15283203125, 0.1845703125, 0.21630859375, 0.248046875, 0.27978515625, 0.3115234375, 0.34326171875, 0.375, 0.40673828125, 0.4384765625, 0.47021484375, 0.501953125, 0.53369140625, 0.5654296875, 0.59716796875, 0.62890625, 0.66064453125, 0.6923828125, 0.72412109375, 0.755859375, 0.78759765625, 0.8193359375, 0.85107421875, 0.8828125, 0.91455078125, 0.9462890625, 0.97802734375, 1.009765625, 1.04150390625, 1.0732421875, 1.10498046875, 1.13671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 10.0, 8.0, 9.0, 9.0, 15.0, 10.0, 9.0, 13.0, 18.0, 17.0, 23.0, 34.0, 45.0, 51.0, 65.0, 82.0, 100.0, 97.0, 89.0, 62.0, 45.0, 32.0, 24.0, 21.0, 15.0, 10.0, 13.0, 14.0, 10.0, 8.0, 11.0, 7.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.961090087890625, -0.93096923828125, -0.900848388671875, -0.8707275390625, -0.840606689453125, -0.81048583984375, -0.780364990234375, -0.750244140625, -0.720123291015625, -0.69000244140625, -0.659881591796875, -0.6297607421875, -0.599639892578125, -0.56951904296875, -0.539398193359375, -0.50927734375, -0.479156494140625, -0.44903564453125, -0.418914794921875, -0.3887939453125, -0.358673095703125, -0.32855224609375, -0.298431396484375, -0.268310546875, -0.238189697265625, -0.20806884765625, -0.177947998046875, -0.1478271484375, -0.117706298828125, -0.08758544921875, -0.057464599609375, -0.02734375, 0.002777099609375, 0.03289794921875, 0.063018798828125, 0.0931396484375, 0.123260498046875, 0.15338134765625, 0.183502197265625, 0.213623046875, 0.243743896484375, 0.27386474609375, 0.303985595703125, 0.3341064453125, 0.364227294921875, 0.39434814453125, 0.424468994140625, 0.45458984375, 0.484710693359375, 0.51483154296875, 0.544952392578125, 0.5750732421875, 0.605194091796875, 0.63531494140625, 0.665435791015625, 0.695556640625, 0.725677490234375, 0.75579833984375, 0.785919189453125, 0.8160400390625, 0.846160888671875, 0.87628173828125, 0.906402587890625, 0.9365234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 10.0, 4.0, 3.0, 9.0, 13.0, 17.0, 26.0, 46.0, 89.0, 322.0, 225.0, 96.0, 46.0, 40.0, 18.0, 16.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.705677032470703, -15.398041725158691, -14.09040641784668, -12.782772064208984, -11.475136756896973, -10.167501449584961, -8.859867095947266, -7.552231788635254, -6.244596481323242, -4.9369611740112305, -3.629326343536377, -2.3216912746429443, -1.0140562057495117, 0.2935791015625, 1.6012139320373535, 2.908848762512207, 4.216484069824219, 5.5241193771362305, 6.831754207611084, 8.139389038085938, 9.44702434539795, 10.754659652709961, 12.062294006347656, 13.369929313659668, 14.67756462097168, 15.985199928283691, 17.292835235595703, 18.6004695892334, 19.908103942871094, 21.215740203857422, 22.523374557495117, 23.831008911132812, 25.138648986816406, 26.4462833404541, 27.75391960144043, 29.061553955078125, 30.369190216064453, 31.67682456970215, 32.984458923339844, 34.29209518432617, 35.5997314453125, 36.90736770629883, 38.21500015258789, 39.52263641357422, 40.83027267456055, 42.137908935546875, 43.44554138183594, 44.753177642822266, 46.06081008911133, 47.368446350097656, 48.67607879638672, 49.98371505737305, 51.291351318359375, 52.59898376464844, 53.906620025634766, 55.214256286621094, 56.521888732910156, 57.829524993896484, 59.13715744018555, 60.444793701171875, 61.7524299621582, 63.06006622314453, 64.3676986694336, 65.67533111572266, 66.98297119140625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 7.0, 10.0, 6.0, 10.0, 6.0, 8.0, 9.0, 14.0, 27.0, 15.0, 21.0, 27.0, 41.0, 41.0, 77.0, 102.0, 128.0, 114.0, 76.0, 45.0, 19.0, 31.0, 14.0, 13.0, 14.0, 14.0, 12.0, 15.0, 12.0, 11.0, 7.0, 6.0, 7.0, 4.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.786760330200195, -30.809301376342773, -29.83184051513672, -28.854381561279297, -27.876920700073242, -26.89946174621582, -25.922000885009766, -24.944541931152344, -23.967082977294922, -22.9896240234375, -22.012163162231445, -21.034704208374023, -20.05724334716797, -19.079784393310547, -18.102325439453125, -17.12486457824707, -16.147403717041016, -15.169943809509277, -14.192483901977539, -13.215024948120117, -12.237564086914062, -11.26010513305664, -10.282645225524902, -9.305185317993164, -8.327725410461426, -7.3502655029296875, -6.372805595397949, -5.395346164703369, -4.417886257171631, -3.4404263496398926, -2.4629669189453125, -1.4855070114135742, -0.5080451965332031, 0.4694145917892456, 1.4468743801116943, 2.4243340492248535, 3.401793956756592, 4.37925386428833, 5.35671329498291, 6.334173202514648, 7.311633110046387, 8.289093017578125, 9.266552925109863, 10.244012832641602, 11.221471786499023, 12.198932647705078, 13.1763916015625, 14.153851509094238, 15.131311416625977, 16.1087703704834, 17.086231231689453, 18.063690185546875, 19.04115104675293, 20.01861000061035, 20.996070861816406, 21.973529815673828, 22.95098876953125, 23.928447723388672, 24.905908584594727, 25.88336753845215, 26.860828399658203, 27.838287353515625, 28.815746307373047, 29.7932071685791, 30.770668029785156]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 8.0, 13.0, 14.0, 19.0, 29.0, 29.0, 35.0, 32.0, 43.0, 52.0, 88.0, 220.0, 107.0, 61.0, 40.0, 36.0, 29.0, 19.0, 25.0, 15.0, 22.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.235137939453125, -3.10894775390625, -2.982757568359375, -2.8565673828125, -2.730377197265625, -2.60418701171875, -2.477996826171875, -2.351806640625, -2.225616455078125, -2.09942626953125, -1.973236083984375, -1.8470458984375, -1.720855712890625, -1.59466552734375, -1.468475341796875, -1.34228515625, -1.216094970703125, -1.08990478515625, -0.963714599609375, -0.8375244140625, -0.711334228515625, -0.58514404296875, -0.458953857421875, -0.332763671875, -0.206573486328125, -0.08038330078125, 0.045806884765625, 0.1719970703125, 0.298187255859375, 0.42437744140625, 0.550567626953125, 0.6767578125, 0.802947998046875, 0.92913818359375, 1.055328369140625, 1.1815185546875, 1.307708740234375, 1.43389892578125, 1.560089111328125, 1.686279296875, 1.812469482421875, 1.93865966796875, 2.064849853515625, 2.1910400390625, 2.317230224609375, 2.44342041015625, 2.569610595703125, 2.69580078125, 2.821990966796875, 2.94818115234375, 3.074371337890625, 3.2005615234375, 3.326751708984375, 3.45294189453125, 3.579132080078125, 3.705322265625, 3.831512451171875, 3.95770263671875, 4.083892822265625, 4.2100830078125, 4.336273193359375, 4.46246337890625, 4.588653564453125, 4.71484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 11.0, 13.0, 16.0, 37.0, 39.0, 72.0, 114.0, 248.0, 555.0, 1634.0, 5896.0, 59546.0, 8302411.0, 13253.0, 2926.0, 944.0, 384.0, 158.0, 73.0, 53.0, 41.0, 31.0, 26.0, 20.0, 8.0, 7.0, 12.0, 11.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 0.0, 1.0], "bins": [-23.040096282958984, -22.346797943115234, -21.653501510620117, -20.960203170776367, -20.266904830932617, -19.573606491088867, -18.88031005859375, -18.18701171875, -17.49371337890625, -16.8004150390625, -16.107118606567383, -15.413820266723633, -14.720521926879883, -14.02722454071045, -13.333927154541016, -12.640628814697266, -11.947331428527832, -11.254034042358398, -10.560735702514648, -9.867438316345215, -9.174139976501465, -8.480842590332031, -7.7875447273254395, -7.094246864318848, -6.400949001312256, -5.707651138305664, -5.014353275299072, -4.3210554122924805, -3.6277577877044678, -2.934459924697876, -2.2411623001098633, -1.5478644371032715, -0.8545665740966797, -0.16126877069473267, 0.5320290327072144, 1.2253267765045166, 1.9186246395111084, 2.6119225025177, 3.305220127105713, 3.9985179901123047, 4.6918158531188965, 5.385113716125488, 6.07841157913208, 6.771709442138672, 7.4650068283081055, 8.158305168151855, 8.851602554321289, 9.544900894165039, 10.238198280334473, 10.931495666503906, 11.624794006347656, 12.31809139251709, 13.01138973236084, 13.704687118530273, 14.397985458374023, 15.091282844543457, 15.78458023071289, 16.47787857055664, 17.171175003051758, 17.864473342895508, 18.557771682739258, 19.251070022583008, 19.944366455078125, 20.637664794921875, 21.330963134765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-37.35580062866211, -36.37879180908203, -35.40178298950195, -34.42477798461914, -33.44776916503906, -32.470760345458984, -31.493751525878906, -30.51674461364746, -29.539735794067383, -28.562726974487305, -27.58572006225586, -26.60871124267578, -25.631704330444336, -24.654695510864258, -23.677688598632812, -22.700679779052734, -21.723670959472656, -20.746662139892578, -19.769655227661133, -18.792646408081055, -17.81563949584961, -16.83863067626953, -15.86162281036377, -14.884614944458008, -13.907608032226562, -12.9306001663208, -11.953592300415039, -10.976583480834961, -9.9995756149292, -9.022567749023438, -8.045559883117676, -7.068551540374756, -6.091543197631836, -5.114535331726074, -4.137526988983154, -3.1605191230773926, -2.1835110187530518, -1.206502914428711, -0.22949504852294922, 0.7475132942199707, 1.7245211601257324, 2.7015292644500732, 3.678537368774414, 4.655545234680176, 5.6325531005859375, 6.609561443328857, 7.586569309234619, 8.563577651977539, 9.5405855178833, 10.517593383789062, 11.494601249694824, 12.471609115600586, 13.448617935180664, 14.425625801086426, 15.402633666992188, 16.379642486572266, 17.35664939880371, 18.33365821838379, 19.310665130615234, 20.287673950195312, 21.264680862426758, 22.241689682006836, 23.21869659423828, 24.19570541381836, 25.172714233398438]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 19.0, 16.0, 26.0, 34.0, 27.0, 45.0, 50.0, 56.0, 69.0, 65.0, 84.0, 61.0, 76.0, 54.0, 54.0, 52.0, 36.0, 37.0, 29.0, 24.0, 20.0, 12.0, 12.0, 12.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.942779541015625, -3.83477783203125, -3.726776123046875, -3.6187744140625, -3.510772705078125, -3.40277099609375, -3.294769287109375, -3.186767578125, -3.078765869140625, -2.97076416015625, -2.862762451171875, -2.7547607421875, -2.646759033203125, -2.53875732421875, -2.430755615234375, -2.32275390625, -2.214752197265625, -2.10675048828125, -1.998748779296875, -1.8907470703125, -1.782745361328125, -1.67474365234375, -1.566741943359375, -1.458740234375, -1.350738525390625, -1.24273681640625, -1.134735107421875, -1.0267333984375, -0.918731689453125, -0.81072998046875, -0.702728271484375, -0.5947265625, -0.486724853515625, -0.37872314453125, -0.270721435546875, -0.1627197265625, -0.054718017578125, 0.05328369140625, 0.161285400390625, 0.269287109375, 0.377288818359375, 0.48529052734375, 0.593292236328125, 0.7012939453125, 0.809295654296875, 0.91729736328125, 1.025299072265625, 1.13330078125, 1.241302490234375, 1.34930419921875, 1.457305908203125, 1.5653076171875, 1.673309326171875, 1.78131103515625, 1.889312744140625, 1.997314453125, 2.105316162109375, 2.21331787109375, 2.321319580078125, 2.4293212890625, 2.537322998046875, 2.64532470703125, 2.753326416015625, 2.861328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 6.0, 7.0, 19.0, 11.0, 26.0, 51.0, 77.0, 151.0, 297.0, 638.0, 1459.0, 3924.0, 11169.0, 35279.0, 114885.0, 211167.0, 98864.0, 30260.0, 9929.0, 3456.0, 1392.0, 586.0, 244.0, 142.0, 60.0, 47.0, 30.0, 21.0, 15.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.453125, -18.76904296875, -18.0849609375, -17.40087890625, -16.716796875, -16.03271484375, -15.3486328125, -14.66455078125, -13.98046875, -13.29638671875, -12.6123046875, -11.92822265625, -11.244140625, -10.56005859375, -9.8759765625, -9.19189453125, -8.5078125, -7.82373046875, -7.1396484375, -6.45556640625, -5.771484375, -5.08740234375, -4.4033203125, -3.71923828125, -3.03515625, -2.35107421875, -1.6669921875, -0.98291015625, -0.298828125, 0.38525390625, 1.0693359375, 1.75341796875, 2.4375, 3.12158203125, 3.8056640625, 4.48974609375, 5.173828125, 5.85791015625, 6.5419921875, 7.22607421875, 7.91015625, 8.59423828125, 9.2783203125, 9.96240234375, 10.646484375, 11.33056640625, 12.0146484375, 12.69873046875, 13.3828125, 14.06689453125, 14.7509765625, 15.43505859375, 16.119140625, 16.80322265625, 17.4873046875, 18.17138671875, 18.85546875, 19.53955078125, 20.2236328125, 20.90771484375, 21.591796875, 22.27587890625, 22.9599609375, 23.64404296875, 24.328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 8.0, 6.0, 11.0, 17.0, 28.0, 26.0, 37.0, 43.0, 58.0, 41.0, 60.0, 56.0, 60.0, 73.0, 63.0, 70.0, 55.0, 62.0, 34.0, 33.0, 34.0, 30.0, 22.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.452789306640625, -3.34893798828125, -3.245086669921875, -3.1412353515625, -3.037384033203125, -2.93353271484375, -2.829681396484375, -2.725830078125, -2.621978759765625, -2.51812744140625, -2.414276123046875, -2.3104248046875, -2.206573486328125, -2.10272216796875, -1.998870849609375, -1.89501953125, -1.791168212890625, -1.68731689453125, -1.583465576171875, -1.4796142578125, -1.375762939453125, -1.27191162109375, -1.168060302734375, -1.064208984375, -0.960357666015625, -0.85650634765625, -0.752655029296875, -0.6488037109375, -0.544952392578125, -0.44110107421875, -0.337249755859375, -0.2333984375, -0.129547119140625, -0.02569580078125, 0.078155517578125, 0.1820068359375, 0.285858154296875, 0.38970947265625, 0.493560791015625, 0.597412109375, 0.701263427734375, 0.80511474609375, 0.908966064453125, 1.0128173828125, 1.116668701171875, 1.22052001953125, 1.324371337890625, 1.42822265625, 1.532073974609375, 1.63592529296875, 1.739776611328125, 1.8436279296875, 1.947479248046875, 2.05133056640625, 2.155181884765625, 2.259033203125, 2.362884521484375, 2.46673583984375, 2.570587158203125, 2.6744384765625, 2.778289794921875, 2.88214111328125, 2.985992431640625, 3.08984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 7.0, 4.0, 6.0, 13.0, 17.0, 38.0, 75.0, 106.0, 96.0, 46.0, 25.0, 10.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.659618377685547, -29.742244720458984, -28.82486915588379, -27.907495498657227, -26.990121841430664, -26.07274627685547, -25.155372619628906, -24.237998962402344, -23.32062339782715, -22.403249740600586, -21.48587417602539, -20.568500518798828, -19.651126861572266, -18.73375129699707, -17.816377639770508, -16.899002075195312, -15.981629371643066, -15.064254760742188, -14.146881103515625, -13.229506492614746, -12.312131881713867, -11.394758224487305, -10.477383613586426, -9.560009002685547, -8.642635345458984, -7.725261211395264, -6.807886600494385, -5.890512466430664, -4.973137855529785, -4.0557637214660645, -3.1383895874023438, -2.221014976501465, -1.303640365600586, -0.3862660527229309, 0.5311082601547241, 1.4484825134277344, 2.365856885910034, 3.283231258392334, 4.200605392456055, 5.117980003356934, 6.035354137420654, 6.952728271484375, 7.870102882385254, 8.787477493286133, 9.704851150512695, 10.622225761413574, 11.539600372314453, 12.456974029541016, 13.374348640441895, 14.291723251342773, 15.209096908569336, 16.12647247314453, 17.043846130371094, 17.961219787597656, 18.87859344482422, 19.795969009399414, 20.713342666625977, 21.63071632385254, 22.548091888427734, 23.465465545654297, 24.38283920288086, 25.300214767456055, 26.217588424682617, 27.134963989257812, 28.052337646484375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 9.0, 2.0, 5.0, 27.0, 54.0, 132.0, 121.0, 59.0, 20.0, 8.0, 9.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.553199768066406, -24.54115104675293, -23.52910041809082, -22.517051696777344, -21.505001068115234, -20.492952346801758, -19.48090362548828, -18.468852996826172, -17.456804275512695, -16.44475555419922, -15.43270492553711, -14.420656204223633, -13.40860652923584, -12.396556854248047, -11.38450813293457, -10.372458457946777, -9.360408782958984, -8.348359107971191, -7.336309909820557, -6.324260711669922, -5.312211036682129, -4.300161361694336, -3.288112163543701, -2.2760629653930664, -1.2640132904052734, -0.25196385383605957, 0.7600855827331543, 1.7721350193023682, 2.784184455871582, 3.796234130859375, 4.80828332901001, 5.8203325271606445, 6.832378387451172, 7.844428062438965, 8.856477737426758, 9.868526458740234, 10.880576133728027, 11.89262580871582, 12.904674530029297, 13.91672420501709, 14.928773880004883, 15.940823554992676, 16.95287322998047, 17.964921951293945, 18.976970672607422, 19.98902130126953, 21.001070022583008, 22.013118743896484, 23.025169372558594, 24.03721809387207, 25.04926872253418, 26.061317443847656, 27.073368072509766, 28.085416793823242, 29.09746551513672, 30.109516143798828, 31.121564865112305, 32.13361358642578, 33.14566421508789, 34.15771484375, 35.169761657714844, 36.18181228637695, 37.19386291503906, 38.205909729003906, 39.217960357666016]}, "eval/loss": 1.8528554439544678, "eval/wer": 1.3865529551765172, "eval/runtime": 1072.1362, "eval/samples_per_second": 2.464, "eval/steps_per_second": 0.309, "train/train_runtime": 114528.9287, "train/train_samples_per_second": 4.984, "train/train_steps_per_second": 0.156, "train/total_flos": 0.0, "train/train_loss": 0.9826719127995244} \ No newline at end of file