{"train/loss": 4.2807, "train/learning_rate": 2.6640000000000002e-05, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6582, "_timestamp": 1646122716, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 11.0, 35.0, 125.0, 261.0, 319.0, 172.0, 66.0, 20.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.410669326782227, -19.659561157226562, -17.9084529876709, -16.157344818115234, -14.406237602233887, -12.655129432678223, -10.904022216796875, -9.152914047241211, -7.401805877685547, -5.650697708129883, -3.899590015411377, -2.148482322692871, -0.39737415313720703, 1.353734016418457, 3.1048412322998047, 4.855949401855469, 6.607057571411133, 8.358165740966797, 10.109273910522461, 11.860381126403809, 13.611489295959473, 15.362597465515137, 17.113704681396484, 18.86481285095215, 20.615921020507812, 22.367029190063477, 24.11813735961914, 25.869243621826172, 27.62035369873047, 29.3714599609375, 31.122568130493164, 32.87367630004883, 34.624786376953125, 36.375892639160156, 38.12700271606445, 39.878108978271484, 41.62921905517578, 43.38032531738281, 45.131431579589844, 46.88254165649414, 48.63365173339844, 50.38475799560547, 52.135868072509766, 53.8869743347168, 55.638084411621094, 57.389190673828125, 59.140296936035156, 60.89140701293945, 62.642513275146484, 64.39362335205078, 66.14472961425781, 67.89583587646484, 69.64694213867188, 71.39805603027344, 73.14916229248047, 74.9002685546875, 76.65137481689453, 78.40248107910156, 80.1535873413086, 81.90470123291016, 83.65580749511719, 85.40691375732422, 87.15802001953125, 88.90913391113281, 90.66024017333984]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 14.0, 11.0, 12.0, 13.0, 19.0, 24.0, 30.0, 28.0, 21.0, 33.0, 32.0, 38.0, 31.0, 49.0, 52.0, 42.0, 44.0, 48.0, 45.0, 27.0, 39.0, 39.0, 40.0, 36.0, 26.0, 44.0, 25.0, 14.0, 16.0, 13.0, 15.0, 10.0, 9.0, 15.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.66189193725586, -27.64937400817871, -26.636856079101562, -25.624338150024414, -24.611820220947266, -23.599300384521484, -22.586782455444336, -21.574264526367188, -20.56174659729004, -19.54922866821289, -18.536710739135742, -17.524192810058594, -16.511672973632812, -15.49915599822998, -14.486637115478516, -13.474119186401367, -12.461601257324219, -11.44908332824707, -10.436565399169922, -9.424046516418457, -8.411528587341309, -7.39901065826416, -6.3864922523498535, -5.373973846435547, -4.361455917358398, -3.348937749862671, -2.3364195823669434, -1.3239014148712158, -0.3113832473754883, 0.7011346817016602, 1.7136530876159668, 2.7261714935302734, 3.7386932373046875, 4.751211166381836, 5.763729572296143, 6.776247978210449, 7.788765907287598, 8.801283836364746, 9.813802719116211, 10.82632064819336, 11.838838577270508, 12.851356506347656, 13.863874435424805, 14.87639331817627, 15.888911247253418, 16.90142822265625, 17.91394805908203, 18.92646598815918, 19.938983917236328, 20.951501846313477, 21.964019775390625, 22.976537704467773, 23.989055633544922, 25.001575469970703, 26.01409339904785, 27.026611328125, 28.03912925720215, 29.051647186279297, 30.064165115356445, 31.076683044433594, 32.089202880859375, 33.10171890258789, 34.11423873901367, 35.12675476074219, 36.13927459716797]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 3.0, 4.0, 12.0, 18.0, 12.0, 6.0, 18.0, 22.0, 20.0, 17.0, 27.0, 25.0, 27.0, 41.0, 35.0, 34.0, 31.0, 36.0, 38.0, 49.0, 40.0, 50.0, 36.0, 35.0, 38.0, 41.0, 42.0, 44.0, 37.0, 18.0, 19.0, 25.0, 22.0, 22.0, 10.0, 10.0, 6.0, 8.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6298828125, -1.575836181640625, -1.52178955078125, -1.467742919921875, -1.4136962890625, -1.359649658203125, -1.30560302734375, -1.251556396484375, -1.197509765625, -1.143463134765625, -1.08941650390625, -1.035369873046875, -0.9813232421875, -0.927276611328125, -0.87322998046875, -0.819183349609375, -0.76513671875, -0.711090087890625, -0.65704345703125, -0.602996826171875, -0.5489501953125, -0.494903564453125, -0.44085693359375, -0.386810302734375, -0.332763671875, -0.278717041015625, -0.22467041015625, -0.170623779296875, -0.1165771484375, -0.062530517578125, -0.00848388671875, 0.045562744140625, 0.099609375, 0.153656005859375, 0.20770263671875, 0.261749267578125, 0.3157958984375, 0.369842529296875, 0.42388916015625, 0.477935791015625, 0.531982421875, 0.586029052734375, 0.64007568359375, 0.694122314453125, 0.7481689453125, 0.802215576171875, 0.85626220703125, 0.910308837890625, 0.96435546875, 1.018402099609375, 1.07244873046875, 1.126495361328125, 1.1805419921875, 1.234588623046875, 1.28863525390625, 1.342681884765625, 1.396728515625, 1.450775146484375, 1.50482177734375, 1.558868408203125, 1.6129150390625, 1.666961669921875, 1.72100830078125, 1.775054931640625, 1.8291015625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 4.0, 2.0, 11.0, 11.0, 16.0, 28.0, 38.0, 41.0, 72.0, 112.0, 143.0, 207.0, 359.0, 546.0, 842.0, 1496.0, 2486.0, 5125.0, 13058.0, 45985.0, 295568.0, 2373551.0, 1276554.0, 133378.0, 26846.0, 8912.0, 4004.0, 1956.0, 1093.0, 669.0, 372.0, 260.0, 176.0, 137.0, 74.0, 59.0, 22.0, 15.0, 21.0, 13.0, 6.0, 8.0, 2.0, 2.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.13250732421875, -4.9603271484375, -4.78814697265625, -4.615966796875, -4.44378662109375, -4.2716064453125, -4.09942626953125, -3.92724609375, -3.75506591796875, -3.5828857421875, -3.41070556640625, -3.238525390625, -3.06634521484375, -2.8941650390625, -2.72198486328125, -2.5498046875, -2.37762451171875, -2.2054443359375, -2.03326416015625, -1.861083984375, -1.68890380859375, -1.5167236328125, -1.34454345703125, -1.17236328125, -1.00018310546875, -0.8280029296875, -0.65582275390625, -0.483642578125, -0.31146240234375, -0.1392822265625, 0.03289794921875, 0.205078125, 0.37725830078125, 0.5494384765625, 0.72161865234375, 0.893798828125, 1.06597900390625, 1.2381591796875, 1.41033935546875, 1.58251953125, 1.75469970703125, 1.9268798828125, 2.09906005859375, 2.271240234375, 2.44342041015625, 2.6156005859375, 2.78778076171875, 2.9599609375, 3.13214111328125, 3.3043212890625, 3.47650146484375, 3.648681640625, 3.82086181640625, 3.9930419921875, 4.16522216796875, 4.33740234375, 4.50958251953125, 4.6817626953125, 4.85394287109375, 5.026123046875, 5.19830322265625, 5.3704833984375, 5.54266357421875, 5.71484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 17.0, 41.0, 101.0, 273.0, 754.0, 1464.0, 861.0, 341.0, 122.0, 48.0, 23.0, 13.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.355712890625, -17.77392578125, -17.192138671875, -16.6103515625, -16.028564453125, -15.44677734375, -14.864990234375, -14.283203125, -13.701416015625, -13.11962890625, -12.537841796875, -11.9560546875, -11.374267578125, -10.79248046875, -10.210693359375, -9.62890625, -9.047119140625, -8.46533203125, -7.883544921875, -7.3017578125, -6.719970703125, -6.13818359375, -5.556396484375, -4.974609375, -4.392822265625, -3.81103515625, -3.229248046875, -2.6474609375, -2.065673828125, -1.48388671875, -0.902099609375, -0.3203125, 0.261474609375, 0.84326171875, 1.425048828125, 2.0068359375, 2.588623046875, 3.17041015625, 3.752197265625, 4.333984375, 4.915771484375, 5.49755859375, 6.079345703125, 6.6611328125, 7.242919921875, 7.82470703125, 8.406494140625, 8.98828125, 9.570068359375, 10.15185546875, 10.733642578125, 11.3154296875, 11.897216796875, 12.47900390625, 13.060791015625, 13.642578125, 14.224365234375, 14.80615234375, 15.387939453125, 15.9697265625, 16.551513671875, 17.13330078125, 17.715087890625, 18.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 22.0, 34.0, 66.0, 188.0, 496.0, 1830.0, 20738.0, 4155250.0, 13254.0, 1630.0, 438.0, 162.0, 76.0, 34.0, 11.0, 10.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-53.84375, -52.1845703125, -50.525390625, -48.8662109375, -47.20703125, -45.5478515625, -43.888671875, -42.2294921875, -40.5703125, -38.9111328125, -37.251953125, -35.5927734375, -33.93359375, -32.2744140625, -30.615234375, -28.9560546875, -27.296875, -25.6376953125, -23.978515625, -22.3193359375, -20.66015625, -19.0009765625, -17.341796875, -15.6826171875, -14.0234375, -12.3642578125, -10.705078125, -9.0458984375, -7.38671875, -5.7275390625, -4.068359375, -2.4091796875, -0.75, 0.9091796875, 2.568359375, 4.2275390625, 5.88671875, 7.5458984375, 9.205078125, 10.8642578125, 12.5234375, 14.1826171875, 15.841796875, 17.5009765625, 19.16015625, 20.8193359375, 22.478515625, 24.1376953125, 25.796875, 27.4560546875, 29.115234375, 30.7744140625, 32.43359375, 34.0927734375, 35.751953125, 37.4111328125, 39.0703125, 40.7294921875, 42.388671875, 44.0478515625, 45.70703125, 47.3662109375, 49.025390625, 50.6845703125, 52.34375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 23.0, 158.0, 434.0, 331.0, 65.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.01431274414062, -68.62934875488281, -66.244384765625, -63.85941696166992, -61.474449157714844, -59.08948516845703, -56.70452117919922, -54.319557189941406, -51.93458938598633, -49.549625396728516, -47.16465759277344, -44.779693603515625, -42.39472961425781, -40.009761810302734, -37.62479782104492, -35.239830017089844, -32.85486602783203, -30.469900131225586, -28.08493423461914, -25.699970245361328, -23.315004348754883, -20.930038452148438, -18.545074462890625, -16.16010856628418, -13.775142669677734, -11.390176773071289, -9.00521183013916, -6.620246410369873, -4.235280990600586, -1.8503150939941406, 0.5346498489379883, 2.919614791870117, 5.304573059082031, 7.689538478851318, 10.074503898620605, 12.459468841552734, 14.84443473815918, 17.229400634765625, 19.614364624023438, 21.999330520629883, 24.384296417236328, 26.769262313842773, 29.15422821044922, 31.53919219970703, 33.924156188964844, 36.30912399291992, 38.694087982177734, 41.07905578613281, 43.464019775390625, 45.84898376464844, 48.233951568603516, 50.61891555786133, 53.003883361816406, 55.38884735107422, 57.77381134033203, 60.158775329589844, 62.54374313354492, 64.9287109375, 67.31367492675781, 69.69863891601562, 72.08360290527344, 74.46856689453125, 76.8535385131836, 79.2385025024414, 81.62346649169922]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 11.0, 6.0, 8.0, 11.0, 12.0, 19.0, 9.0, 21.0, 25.0, 33.0, 29.0, 27.0, 27.0, 44.0, 38.0, 38.0, 45.0, 39.0, 46.0, 53.0, 37.0, 42.0, 38.0, 46.0, 36.0, 40.0, 27.0, 40.0, 19.0, 21.0, 23.0, 25.0, 11.0, 13.0, 11.0, 7.0, 4.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.97994041442871, -24.260774612426758, -23.541608810424805, -22.822444915771484, -22.10327911376953, -21.384113311767578, -20.664947509765625, -19.945781707763672, -19.22661590576172, -18.507450103759766, -17.788284301757812, -17.06911849975586, -16.34995460510254, -15.630788803100586, -14.911623001098633, -14.19245719909668, -13.473292350769043, -12.75412654876709, -12.034961700439453, -11.3157958984375, -10.596630096435547, -9.877464294433594, -9.158299446105957, -8.439133644104004, -7.719968318939209, -7.000802993774414, -6.281637191772461, -5.562471866607666, -4.843306541442871, -4.124140739440918, -3.404975414276123, -2.68580961227417, -1.966644287109375, -1.247478723526001, -0.5283132791519165, 0.19085216522216797, 0.910017728805542, 1.629183292388916, 2.348348617553711, 3.067514419555664, 3.786679744720459, 4.505845069885254, 5.225010871887207, 5.944176197052002, 6.663341522216797, 7.38250732421875, 8.101673126220703, 8.820838928222656, 9.540003776550293, 10.259169578552246, 10.978334426879883, 11.697500228881836, 12.416666030883789, 13.135831832885742, 13.854996681213379, 14.574162483215332, 15.293327331542969, 16.012493133544922, 16.731658935546875, 17.450824737548828, 18.16998863220215, 18.8891544342041, 19.608320236206055, 20.327486038208008, 21.04665184020996]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 2.0, 6.0, 12.0, 7.0, 10.0, 17.0, 14.0, 14.0, 17.0, 27.0, 25.0, 28.0, 26.0, 34.0, 35.0, 29.0, 42.0, 39.0, 30.0, 45.0, 44.0, 39.0, 43.0, 28.0, 48.0, 34.0, 28.0, 43.0, 33.0, 30.0, 33.0, 30.0, 22.0, 18.0, 17.0, 10.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.5583953857421875, -1.505462646484375, -1.4525299072265625, -1.39959716796875, -1.3466644287109375, -1.293731689453125, -1.2407989501953125, -1.1878662109375, -1.1349334716796875, -1.082000732421875, -1.0290679931640625, -0.97613525390625, -0.9232025146484375, -0.870269775390625, -0.8173370361328125, -0.764404296875, -0.7114715576171875, -0.658538818359375, -0.6056060791015625, -0.55267333984375, -0.4997406005859375, -0.446807861328125, -0.3938751220703125, -0.3409423828125, -0.2880096435546875, -0.235076904296875, -0.1821441650390625, -0.12921142578125, -0.0762786865234375, -0.023345947265625, 0.0295867919921875, 0.08251953125, 0.1354522705078125, 0.188385009765625, 0.2413177490234375, 0.29425048828125, 0.3471832275390625, 0.400115966796875, 0.4530487060546875, 0.5059814453125, 0.5589141845703125, 0.611846923828125, 0.6647796630859375, 0.71771240234375, 0.7706451416015625, 0.823577880859375, 0.8765106201171875, 0.929443359375, 0.9823760986328125, 1.035308837890625, 1.0882415771484375, 1.14117431640625, 1.1941070556640625, 1.247039794921875, 1.2999725341796875, 1.3529052734375, 1.4058380126953125, 1.458770751953125, 1.5117034912109375, 1.56463623046875, 1.6175689697265625, 1.670501708984375, 1.7234344482421875, 1.7763671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 3.0, 5.0, 10.0, 12.0, 23.0, 30.0, 52.0, 75.0, 99.0, 177.0, 230.0, 320.0, 500.0, 746.0, 1109.0, 1826.0, 2745.0, 4138.0, 6615.0, 10063.0, 15863.0, 25082.0, 40020.0, 63716.0, 102553.0, 167471.0, 220871.0, 144348.0, 88877.0, 55330.0, 34384.0, 22165.0, 13848.0, 8902.0, 5715.0, 3796.0, 2380.0, 1521.0, 944.0, 681.0, 452.0, 289.0, 192.0, 131.0, 83.0, 55.0, 40.0, 29.0, 13.0, 8.0, 7.0, 8.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.1865234375, -0.1810932159423828, -0.17566299438476562, -0.17023277282714844, -0.16480255126953125, -0.15937232971191406, -0.15394210815429688, -0.1485118865966797, -0.1430816650390625, -0.1376514434814453, -0.13222122192382812, -0.12679100036621094, -0.12136077880859375, -0.11593055725097656, -0.11050033569335938, -0.10507011413574219, -0.099639892578125, -0.09420967102050781, -0.08877944946289062, -0.08334922790527344, -0.07791900634765625, -0.07248878479003906, -0.06705856323242188, -0.06162834167480469, -0.0561981201171875, -0.05076789855957031, -0.045337677001953125, -0.03990745544433594, -0.03447723388671875, -0.029047012329101562, -0.023616790771484375, -0.018186569213867188, -0.01275634765625, -0.0073261260986328125, -0.001895904541015625, 0.0035343170166015625, 0.00896453857421875, 0.014394760131835938, 0.019824981689453125, 0.025255203247070312, 0.0306854248046875, 0.03611564636230469, 0.041545867919921875, 0.04697608947753906, 0.05240631103515625, 0.05783653259277344, 0.06326675415039062, 0.06869697570800781, 0.074127197265625, 0.07955741882324219, 0.08498764038085938, 0.09041786193847656, 0.09584808349609375, 0.10127830505371094, 0.10670852661132812, 0.11213874816894531, 0.1175689697265625, 0.12299919128417969, 0.12842941284179688, 0.13385963439941406, 0.13928985595703125, 0.14472007751464844, 0.15015029907226562, 0.1555805206298828, 0.1610107421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 11.0, 9.0, 10.0, 14.0, 11.0, 11.0, 17.0, 23.0, 25.0, 32.0, 23.0, 40.0, 29.0, 39.0, 41.0, 41.0, 36.0, 44.0, 1064.0, 43.0, 48.0, 49.0, 29.0, 24.0, 36.0, 40.0, 28.0, 27.0, 31.0, 32.0, 23.0, 15.0, 9.0, 11.0, 6.0, 13.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0537109375, -1.0191802978515625, -0.984649658203125, -0.9501190185546875, -0.91558837890625, -0.8810577392578125, -0.846527099609375, -0.8119964599609375, -0.7774658203125, -0.7429351806640625, -0.708404541015625, -0.6738739013671875, -0.63934326171875, -0.6048126220703125, -0.570281982421875, -0.5357513427734375, -0.501220703125, -0.4666900634765625, -0.432159423828125, -0.3976287841796875, -0.36309814453125, -0.3285675048828125, -0.294036865234375, -0.2595062255859375, -0.2249755859375, -0.1904449462890625, -0.155914306640625, -0.1213836669921875, -0.08685302734375, -0.0523223876953125, -0.017791748046875, 0.0167388916015625, 0.05126953125, 0.0858001708984375, 0.120330810546875, 0.1548614501953125, 0.18939208984375, 0.2239227294921875, 0.258453369140625, 0.2929840087890625, 0.3275146484375, 0.3620452880859375, 0.396575927734375, 0.4311065673828125, 0.46563720703125, 0.5001678466796875, 0.534698486328125, 0.5692291259765625, 0.603759765625, 0.6382904052734375, 0.672821044921875, 0.7073516845703125, 0.74188232421875, 0.7764129638671875, 0.810943603515625, 0.8454742431640625, 0.8800048828125, 0.9145355224609375, 0.949066162109375, 0.9835968017578125, 1.01812744140625, 1.0526580810546875, 1.087188720703125, 1.1217193603515625, 1.15625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 13.0, 7.0, 14.0, 28.0, 42.0, 52.0, 81.0, 96.0, 148.0, 184.0, 307.0, 448.0, 629.0, 963.0, 1482.0, 2144.0, 3126.0, 4948.0, 7601.0, 11930.0, 19083.0, 30915.0, 52073.0, 89283.0, 153529.0, 1279273.0, 178715.0, 103196.0, 60702.0, 35743.0, 21909.0, 13518.0, 8493.0, 5523.0, 3628.0, 2401.0, 1539.0, 1054.0, 654.0, 478.0, 382.0, 245.0, 156.0, 105.0, 76.0, 64.0, 36.0, 29.0, 30.0, 24.0, 5.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0], "bins": [-0.1783447265625, -0.1728801727294922, -0.16741561889648438, -0.16195106506347656, -0.15648651123046875, -0.15102195739746094, -0.14555740356445312, -0.1400928497314453, -0.1346282958984375, -0.1291637420654297, -0.12369918823242188, -0.11823463439941406, -0.11277008056640625, -0.10730552673339844, -0.10184097290039062, -0.09637641906738281, -0.090911865234375, -0.08544731140136719, -0.07998275756835938, -0.07451820373535156, -0.06905364990234375, -0.06358909606933594, -0.058124542236328125, -0.05265998840332031, -0.0471954345703125, -0.04173088073730469, -0.036266326904296875, -0.030801773071289062, -0.02533721923828125, -0.019872665405273438, -0.014408111572265625, -0.008943557739257812, -0.00347900390625, 0.0019855499267578125, 0.007450103759765625, 0.012914657592773438, 0.01837921142578125, 0.023843765258789062, 0.029308319091796875, 0.03477287292480469, 0.0402374267578125, 0.04570198059082031, 0.051166534423828125, 0.05663108825683594, 0.06209564208984375, 0.06756019592285156, 0.07302474975585938, 0.07848930358886719, 0.083953857421875, 0.08941841125488281, 0.09488296508789062, 0.10034751892089844, 0.10581207275390625, 0.11127662658691406, 0.11674118041992188, 0.12220573425292969, 0.1276702880859375, 0.1331348419189453, 0.13859939575195312, 0.14406394958496094, 0.14952850341796875, 0.15499305725097656, 0.16045761108398438, 0.1659221649169922, 0.17138671875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 3.0, 3.0, 1.0, 7.0, 16.0, 14.0, 19.0, 28.0, 53.0, 73.0, 81.0, 102.0, 108.0, 113.0, 103.0, 70.0, 36.0, 38.0, 31.0, 19.0, 16.0, 7.0, 8.0, 4.0, 2.0, 2.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012884140014648438, -0.0012466013431549072, -0.0012047886848449707, -0.0011629760265350342, -0.0011211633682250977, -0.0010793507099151611, -0.0010375380516052246, -0.000995725393295288, -0.0009539127349853516, -0.000912100076675415, -0.0008702874183654785, -0.000828474760055542, -0.0007866621017456055, -0.0007448494434356689, -0.0007030367851257324, -0.0006612241268157959, -0.0006194114685058594, -0.0005775988101959229, -0.0005357861518859863, -0.0004939734935760498, -0.0004521608352661133, -0.00041034817695617676, -0.00036853551864624023, -0.0003267228603363037, -0.0002849102020263672, -0.00024309754371643066, -0.00020128488540649414, -0.00015947222709655762, -0.0001176595687866211, -7.584691047668457e-05, -3.403425216674805e-05, 7.778406143188477e-06, 4.9591064453125e-05, 9.140372276306152e-05, 0.00013321638107299805, 0.00017502903938293457, 0.0002168416976928711, 0.0002586543560028076, 0.00030046701431274414, 0.00034227967262268066, 0.0003840923309326172, 0.0004259049892425537, 0.00046771764755249023, 0.0005095303058624268, 0.0005513429641723633, 0.0005931556224822998, 0.0006349682807922363, 0.0006767809391021729, 0.0007185935974121094, 0.0007604062557220459, 0.0008022189140319824, 0.0008440315723419189, 0.0008858442306518555, 0.000927656888961792, 0.0009694695472717285, 0.001011282205581665, 0.0010530948638916016, 0.001094907522201538, 0.0011367201805114746, 0.0011785328388214111, 0.0012203454971313477, 0.0012621581554412842, 0.0013039708137512207, 0.0013457834720611572, 0.0013875961303710938]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 12.0, 18.0, 17.0, 13.0, 17.0, 19.0, 47.0, 52.0, 86.0, 132.0, 248.0, 352.0, 666.0, 6802.0, 1037121.0, 1485.0, 528.0, 294.0, 179.0, 108.0, 96.0, 53.0, 26.0, 22.0, 16.0, 13.0, 18.0, 15.0, 10.0, 16.0, 11.0, 0.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0225677490234375, -0.021823883056640625, -0.02108001708984375, -0.020336151123046875, -0.01959228515625, -0.018848419189453125, -0.01810455322265625, -0.017360687255859375, -0.0166168212890625, -0.015872955322265625, -0.01512908935546875, -0.014385223388671875, -0.013641357421875, -0.012897491455078125, -0.01215362548828125, -0.011409759521484375, -0.0106658935546875, -0.009922027587890625, -0.00917816162109375, -0.008434295654296875, -0.0076904296875, -0.006946563720703125, -0.00620269775390625, -0.005458831787109375, -0.0047149658203125, -0.003971099853515625, -0.00322723388671875, -0.002483367919921875, -0.001739501953125, -0.000995635986328125, -0.00025177001953125, 0.000492095947265625, 0.0012359619140625, 0.001979827880859375, 0.00272369384765625, 0.003467559814453125, 0.00421142578125, 0.004955291748046875, 0.00569915771484375, 0.006443023681640625, 0.0071868896484375, 0.007930755615234375, 0.00867462158203125, 0.009418487548828125, 0.010162353515625, 0.010906219482421875, 0.01165008544921875, 0.012393951416015625, 0.0131378173828125, 0.013881683349609375, 0.01462554931640625, 0.015369415283203125, 0.01611328125, 0.016857147216796875, 0.01760101318359375, 0.018344879150390625, 0.0190887451171875, 0.019832611083984375, 0.02057647705078125, 0.021320343017578125, 0.022064208984375, 0.022808074951171875, 0.02355194091796875, 0.024295806884765625, 0.0250396728515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 98.0, 791.0, 120.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005062459968030453, -0.00496419332921505, -0.0048659262247383595, -0.0047676595859229565, -0.0046693929471075535, -0.004571125842630863, -0.00447285920381546, -0.004374592565000057, -0.004276325460523367, -0.004178058821707964, -0.004079791717231274, -0.003981525078415871, -0.003883258206769824, -0.0037849913351237774, -0.0036867246963083744, -0.0035884578246623278, -0.0034901911858469248, -0.003391924314200878, -0.003293657675385475, -0.0031953908037394285, -0.003097123932093382, -0.002998857293277979, -0.0029005904216319323, -0.0028023235499858856, -0.0027040569111704826, -0.002605790039524436, -0.002507523400709033, -0.0024092565290629864, -0.0023109896574169397, -0.002212722785770893, -0.00211445614695549, -0.0020161892753094435, -0.0019179225200787187, -0.0018196557648479939, -0.0017213888932019472, -0.0016231221379712224, -0.0015248553827404976, -0.001426588511094451, -0.0013283217558637261, -0.0012300550006330013, -0.0011317881289869547, -0.0010335213737562299, -0.0009352545021101832, -0.0008369877468794584, -0.0007387209334410727, -0.000640454120002687, -0.0005421873647719622, -0.00044392055133357644, -0.0003456537378951907, -0.000247386924456805, -0.00014912014012224972, -5.0853355787694454e-05, 4.741345765069127e-05, 0.000145680271089077, 0.0002439470263198018, 0.00034221383975818753, 0.00044048065319657326, 0.000538747466634959, 0.0006370142800733447, 0.0007352810353040695, 0.0008335478487424552, 0.000931814662180841, 0.0010300814174115658, 0.0011283482890576124, 0.0012266150442883372]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 10.0, 7.0, 1.0, 9.0, 11.0, 17.0, 14.0, 16.0, 18.0, 24.0, 21.0, 27.0, 31.0, 27.0, 29.0, 32.0, 37.0, 31.0, 46.0, 37.0, 36.0, 32.0, 41.0, 63.0, 41.0, 41.0, 34.0, 28.0, 28.0, 26.0, 27.0, 17.0, 25.0, 15.0, 13.0, 13.0, 12.0, 7.0, 11.0, 11.0, 14.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0004799365997314453, -0.00046395137906074524, -0.00044796615839004517, -0.0004319809377193451, -0.000415995717048645, -0.00040001049637794495, -0.0003840252757072449, -0.0003680400550365448, -0.0003520548343658447, -0.00033606961369514465, -0.0003200843930244446, -0.0003040991723537445, -0.00028811395168304443, -0.00027212873101234436, -0.0002561435103416443, -0.00024015828967094421, -0.00022417306900024414, -0.00020818784832954407, -0.000192202627658844, -0.00017621740698814392, -0.00016023218631744385, -0.00014424696564674377, -0.0001282617449760437, -0.00011227652430534363, -9.629130363464355e-05, -8.030608296394348e-05, -6.432086229324341e-05, -4.8335641622543335e-05, -3.235042095184326e-05, -1.636520028114319e-05, -3.7997961044311523e-07, 1.5605241060256958e-05, 3.159046173095703e-05, 4.7575682401657104e-05, 6.356090307235718e-05, 7.954612374305725e-05, 9.553134441375732e-05, 0.0001115165650844574, 0.00012750178575515747, 0.00014348700642585754, 0.00015947222709655762, 0.0001754574477672577, 0.00019144266843795776, 0.00020742788910865784, 0.0002234131097793579, 0.00023939833045005798, 0.00025538355112075806, 0.00027136877179145813, 0.0002873539924621582, 0.0003033392131328583, 0.00031932443380355835, 0.0003353096544742584, 0.0003512948751449585, 0.00036728009581565857, 0.00038326531648635864, 0.0003992505371570587, 0.0004152357578277588, 0.00043122097849845886, 0.00044720619916915894, 0.000463191419839859, 0.0004791766405105591, 0.0004951618611812592, 0.0005111470818519592, 0.0005271323025226593, 0.0005431175231933594]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 2.0, 6.0, 12.0, 7.0, 10.0, 17.0, 14.0, 14.0, 17.0, 27.0, 25.0, 28.0, 26.0, 34.0, 35.0, 29.0, 42.0, 39.0, 30.0, 45.0, 44.0, 39.0, 43.0, 28.0, 48.0, 34.0, 28.0, 43.0, 33.0, 30.0, 33.0, 30.0, 22.0, 18.0, 17.0, 10.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.5583953857421875, -1.505462646484375, -1.4525299072265625, -1.39959716796875, -1.3466644287109375, -1.293731689453125, -1.2407989501953125, -1.1878662109375, -1.1349334716796875, -1.082000732421875, -1.0290679931640625, -0.97613525390625, -0.9232025146484375, -0.870269775390625, -0.8173370361328125, -0.764404296875, -0.7114715576171875, -0.658538818359375, -0.6056060791015625, -0.55267333984375, -0.4997406005859375, -0.446807861328125, -0.3938751220703125, -0.3409423828125, -0.2880096435546875, -0.235076904296875, -0.1821441650390625, -0.12921142578125, -0.0762786865234375, -0.023345947265625, 0.0295867919921875, 0.08251953125, 0.1354522705078125, 0.188385009765625, 0.2413177490234375, 0.29425048828125, 0.3471832275390625, 0.400115966796875, 0.4530487060546875, 0.5059814453125, 0.5589141845703125, 0.611846923828125, 0.6647796630859375, 0.71771240234375, 0.7706451416015625, 0.823577880859375, 0.8765106201171875, 0.929443359375, 0.9823760986328125, 1.035308837890625, 1.0882415771484375, 1.14117431640625, 1.1941070556640625, 1.247039794921875, 1.2999725341796875, 1.3529052734375, 1.4058380126953125, 1.458770751953125, 1.5117034912109375, 1.56463623046875, 1.6175689697265625, 1.670501708984375, 1.7234344482421875, 1.7763671875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 5.0, 15.0, 21.0, 19.0, 31.0, 49.0, 63.0, 95.0, 136.0, 153.0, 260.0, 384.0, 497.0, 685.0, 1095.0, 1521.0, 2333.0, 3751.0, 6376.0, 13172.0, 38648.0, 233837.0, 593993.0, 103578.0, 23757.0, 9549.0, 5119.0, 3038.0, 1931.0, 1313.0, 958.0, 639.0, 442.0, 341.0, 244.0, 132.0, 112.0, 63.0, 56.0, 38.0, 31.0, 18.0, 18.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.36041259765625, -6.1505126953125, -5.94061279296875, -5.730712890625, -5.52081298828125, -5.3109130859375, -5.10101318359375, -4.89111328125, -4.68121337890625, -4.4713134765625, -4.26141357421875, -4.051513671875, -3.84161376953125, -3.6317138671875, -3.42181396484375, -3.2119140625, -3.00201416015625, -2.7921142578125, -2.58221435546875, -2.372314453125, -2.16241455078125, -1.9525146484375, -1.74261474609375, -1.53271484375, -1.32281494140625, -1.1129150390625, -0.90301513671875, -0.693115234375, -0.48321533203125, -0.2733154296875, -0.06341552734375, 0.146484375, 0.35638427734375, 0.5662841796875, 0.77618408203125, 0.986083984375, 1.19598388671875, 1.4058837890625, 1.61578369140625, 1.82568359375, 2.03558349609375, 2.2454833984375, 2.45538330078125, 2.665283203125, 2.87518310546875, 3.0850830078125, 3.29498291015625, 3.5048828125, 3.71478271484375, 3.9246826171875, 4.13458251953125, 4.344482421875, 4.55438232421875, 4.7642822265625, 4.97418212890625, 5.18408203125, 5.39398193359375, 5.6038818359375, 5.81378173828125, 6.023681640625, 6.23358154296875, 6.4434814453125, 6.65338134765625, 6.86328125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 7.0, 11.0, 12.0, 10.0, 16.0, 19.0, 23.0, 27.0, 28.0, 27.0, 29.0, 39.0, 44.0, 54.0, 78.0, 72.0, 143.0, 235.0, 1323.0, 205.0, 131.0, 78.0, 68.0, 38.0, 33.0, 43.0, 36.0, 40.0, 28.0, 18.0, 17.0, 20.0, 14.0, 10.0, 7.0, 10.0, 5.0, 5.0, 5.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.8046875, -4.65643310546875, -4.5081787109375, -4.35992431640625, -4.211669921875, -4.06341552734375, -3.9151611328125, -3.76690673828125, -3.61865234375, -3.47039794921875, -3.3221435546875, -3.17388916015625, -3.025634765625, -2.87738037109375, -2.7291259765625, -2.58087158203125, -2.4326171875, -2.28436279296875, -2.1361083984375, -1.98785400390625, -1.839599609375, -1.69134521484375, -1.5430908203125, -1.39483642578125, -1.24658203125, -1.09832763671875, -0.9500732421875, -0.80181884765625, -0.653564453125, -0.50531005859375, -0.3570556640625, -0.20880126953125, -0.060546875, 0.08770751953125, 0.2359619140625, 0.38421630859375, 0.532470703125, 0.68072509765625, 0.8289794921875, 0.97723388671875, 1.12548828125, 1.27374267578125, 1.4219970703125, 1.57025146484375, 1.718505859375, 1.86676025390625, 2.0150146484375, 2.16326904296875, 2.3115234375, 2.45977783203125, 2.6080322265625, 2.75628662109375, 2.904541015625, 3.05279541015625, 3.2010498046875, 3.34930419921875, 3.49755859375, 3.64581298828125, 3.7940673828125, 3.94232177734375, 4.090576171875, 4.23883056640625, 4.3870849609375, 4.53533935546875, 4.68359375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 0.0, 3.0, 8.0, 1.0, 8.0, 6.0, 10.0, 13.0, 17.0, 24.0, 18.0, 26.0, 24.0, 33.0, 53.0, 50.0, 98.0, 189.0, 451.0, 1306.0, 11034.0, 2985521.0, 142693.0, 2600.0, 745.0, 268.0, 133.0, 75.0, 47.0, 47.0, 31.0, 25.0, 21.0, 17.0, 19.0, 13.0, 11.0, 15.0, 11.0, 10.0, 5.0, 2.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0], "bins": [-20.0625, -19.4677734375, -18.873046875, -18.2783203125, -17.68359375, -17.0888671875, -16.494140625, -15.8994140625, -15.3046875, -14.7099609375, -14.115234375, -13.5205078125, -12.92578125, -12.3310546875, -11.736328125, -11.1416015625, -10.546875, -9.9521484375, -9.357421875, -8.7626953125, -8.16796875, -7.5732421875, -6.978515625, -6.3837890625, -5.7890625, -5.1943359375, -4.599609375, -4.0048828125, -3.41015625, -2.8154296875, -2.220703125, -1.6259765625, -1.03125, -0.4365234375, 0.158203125, 0.7529296875, 1.34765625, 1.9423828125, 2.537109375, 3.1318359375, 3.7265625, 4.3212890625, 4.916015625, 5.5107421875, 6.10546875, 6.7001953125, 7.294921875, 7.8896484375, 8.484375, 9.0791015625, 9.673828125, 10.2685546875, 10.86328125, 11.4580078125, 12.052734375, 12.6474609375, 13.2421875, 13.8369140625, 14.431640625, 15.0263671875, 15.62109375, 16.2158203125, 16.810546875, 17.4052734375, 18.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 461.0, 547.0, 4.0, 1.0], "bins": [-180.85655212402344, -177.89210510253906, -174.92764282226562, -171.96319580078125, -168.9987335205078, -166.03428649902344, -163.06982421875, -160.10537719726562, -157.1409149169922, -154.1764678955078, -151.21200561523438, -148.24755859375, -145.28309631347656, -142.3186492919922, -139.35418701171875, -136.38973999023438, -133.42529296875, -130.46084594726562, -127.49638366699219, -124.53192901611328, -121.56747436523438, -118.60302734375, -115.63856506347656, -112.67411804199219, -109.70965576171875, -106.74520111083984, -103.78074645996094, -100.81629180908203, -97.85183715820312, -94.88739013671875, -91.92292785644531, -88.95848083496094, -85.99402618408203, -83.02957153320312, -80.06511688232422, -77.10066223144531, -74.1362075805664, -71.1717529296875, -68.20730590820312, -65.24285125732422, -62.27839660644531, -59.313941955566406, -56.3494873046875, -53.385032653808594, -50.42058181762695, -47.45612716674805, -44.49167251586914, -41.5272216796875, -38.562767028808594, -35.59831237792969, -32.63385772705078, -29.669404983520508, -26.704952239990234, -23.740497589111328, -20.776042938232422, -17.81159019470215, -14.847134590148926, -11.882680892944336, -8.91822624206543, -5.95377254486084, -2.98931884765625, -0.024865150451660156, 2.939589500427246, 5.9040422439575195, 8.868496894836426]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 6.0, 11.0, 6.0, 10.0, 9.0, 8.0, 16.0, 12.0, 27.0, 23.0, 26.0, 27.0, 30.0, 24.0, 40.0, 40.0, 42.0, 48.0, 36.0, 36.0, 33.0, 53.0, 36.0, 46.0, 33.0, 35.0, 37.0, 45.0, 44.0, 19.0, 25.0, 21.0, 14.0, 15.0, 13.0, 13.0, 6.0, 9.0, 7.0, 6.0, 5.0, 2.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.285415649414062, -17.76166343688965, -17.237911224365234, -16.714157104492188, -16.190404891967773, -15.66665267944336, -15.142900466918945, -14.619147300720215, -14.095394134521484, -13.57164192199707, -13.04788875579834, -12.524136543273926, -12.000383377075195, -11.476631164550781, -10.952878952026367, -10.429125785827637, -9.905373573303223, -9.381621360778809, -8.857868194580078, -8.334115982055664, -7.810362815856934, -7.2866106033325195, -6.762857913970947, -6.239105224609375, -5.715352535247803, -5.1915998458862305, -4.667847156524658, -4.144094467163086, -3.6203420162200928, -3.0965893268585205, -2.5728368759155273, -2.049084186553955, -1.5253314971923828, -1.0015788078308105, -0.47782623767852783, 0.04592633247375488, 0.5696790218353271, 1.0934317111968994, 1.6171841621398926, 2.140936851501465, 2.664689540863037, 3.1884422302246094, 3.7121949195861816, 4.235947608947754, 4.759699821472168, 5.283452987670898, 5.8072052001953125, 6.330957889556885, 6.854710578918457, 7.378463268280029, 7.902215957641602, 8.425968170166016, 8.949721336364746, 9.47347354888916, 9.99722671508789, 10.520978927612305, 11.044731140136719, 11.568483352661133, 12.092236518859863, 12.615988731384277, 13.139741897583008, 13.663494110107422, 14.187246322631836, 14.710999488830566, 15.234752655029297]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 8.0, 6.0, 11.0, 14.0, 16.0, 19.0, 30.0, 17.0, 20.0, 30.0, 28.0, 32.0, 33.0, 31.0, 30.0, 35.0, 32.0, 57.0, 47.0, 37.0, 37.0, 39.0, 35.0, 30.0, 35.0, 33.0, 35.0, 34.0, 23.0, 31.0, 21.0, 24.0, 18.0, 10.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8515625, -1.7961578369140625, -1.740753173828125, -1.6853485107421875, -1.62994384765625, -1.5745391845703125, -1.519134521484375, -1.4637298583984375, -1.4083251953125, -1.3529205322265625, -1.297515869140625, -1.2421112060546875, -1.18670654296875, -1.1313018798828125, -1.075897216796875, -1.0204925537109375, -0.965087890625, -0.9096832275390625, -0.854278564453125, -0.7988739013671875, -0.74346923828125, -0.6880645751953125, -0.632659912109375, -0.5772552490234375, -0.5218505859375, -0.4664459228515625, -0.411041259765625, -0.3556365966796875, -0.30023193359375, -0.2448272705078125, -0.189422607421875, -0.1340179443359375, -0.07861328125, -0.0232086181640625, 0.032196044921875, 0.0876007080078125, 0.14300537109375, 0.1984100341796875, 0.253814697265625, 0.3092193603515625, 0.3646240234375, 0.4200286865234375, 0.475433349609375, 0.5308380126953125, 0.58624267578125, 0.6416473388671875, 0.697052001953125, 0.7524566650390625, 0.807861328125, 0.8632659912109375, 0.918670654296875, 0.9740753173828125, 1.02947998046875, 1.0848846435546875, 1.140289306640625, 1.1956939697265625, 1.2510986328125, 1.3065032958984375, 1.361907958984375, 1.4173126220703125, 1.47271728515625, 1.5281219482421875, 1.583526611328125, 1.6389312744140625, 1.6943359375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 14.0, 14.0, 31.0, 36.0, 44.0, 58.0, 70.0, 107.0, 130.0, 185.0, 258.0, 381.0, 595.0, 1001.0, 1735.0, 3518.0, 7962.0, 21000.0, 77873.0, 569405.0, 2746134.0, 640373.0, 84381.0, 22451.0, 8280.0, 3610.0, 1735.0, 1010.0, 592.0, 385.0, 222.0, 171.0, 111.0, 80.0, 77.0, 66.0, 43.0, 26.0, 18.0, 16.0, 10.0, 10.0, 13.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.66796875, -6.46905517578125, -6.2701416015625, -6.07122802734375, -5.872314453125, -5.67340087890625, -5.4744873046875, -5.27557373046875, -5.07666015625, -4.87774658203125, -4.6788330078125, -4.47991943359375, -4.281005859375, -4.08209228515625, -3.8831787109375, -3.68426513671875, -3.4853515625, -3.28643798828125, -3.0875244140625, -2.88861083984375, -2.689697265625, -2.49078369140625, -2.2918701171875, -2.09295654296875, -1.89404296875, -1.69512939453125, -1.4962158203125, -1.29730224609375, -1.098388671875, -0.89947509765625, -0.7005615234375, -0.50164794921875, -0.302734375, -0.10382080078125, 0.0950927734375, 0.29400634765625, 0.492919921875, 0.69183349609375, 0.8907470703125, 1.08966064453125, 1.28857421875, 1.48748779296875, 1.6864013671875, 1.88531494140625, 2.084228515625, 2.28314208984375, 2.4820556640625, 2.68096923828125, 2.8798828125, 3.07879638671875, 3.2777099609375, 3.47662353515625, 3.675537109375, 3.87445068359375, 4.0733642578125, 4.27227783203125, 4.47119140625, 4.67010498046875, 4.8690185546875, 5.06793212890625, 5.266845703125, 5.46575927734375, 5.6646728515625, 5.86358642578125, 6.0625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 7.0, 4.0, 13.0, 26.0, 41.0, 64.0, 104.0, 166.0, 310.0, 550.0, 812.0, 746.0, 505.0, 327.0, 159.0, 103.0, 58.0, 37.0, 21.0, 10.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.03125, -15.65802001953125, -15.2847900390625, -14.91156005859375, -14.538330078125, -14.16510009765625, -13.7918701171875, -13.41864013671875, -13.04541015625, -12.67218017578125, -12.2989501953125, -11.92572021484375, -11.552490234375, -11.17926025390625, -10.8060302734375, -10.43280029296875, -10.0595703125, -9.68634033203125, -9.3131103515625, -8.93988037109375, -8.566650390625, -8.19342041015625, -7.8201904296875, -7.44696044921875, -7.07373046875, -6.70050048828125, -6.3272705078125, -5.95404052734375, -5.580810546875, -5.20758056640625, -4.8343505859375, -4.46112060546875, -4.087890625, -3.71466064453125, -3.3414306640625, -2.96820068359375, -2.594970703125, -2.22174072265625, -1.8485107421875, -1.47528076171875, -1.10205078125, -0.72882080078125, -0.3555908203125, 0.01763916015625, 0.390869140625, 0.76409912109375, 1.1373291015625, 1.51055908203125, 1.8837890625, 2.25701904296875, 2.6302490234375, 3.00347900390625, 3.376708984375, 3.74993896484375, 4.1231689453125, 4.49639892578125, 4.86962890625, 5.24285888671875, 5.6160888671875, 5.98931884765625, 6.362548828125, 6.73577880859375, 7.1090087890625, 7.48223876953125, 7.85546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 13.0, 17.0, 20.0, 30.0, 46.0, 62.0, 95.0, 148.0, 227.0, 456.0, 1033.0, 3164.0, 45106.0, 3675823.0, 456977.0, 7956.0, 1517.0, 646.0, 320.0, 180.0, 135.0, 76.0, 75.0, 31.0, 36.0, 27.0, 10.0, 5.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.88134765625, -19.1376953125, -18.39404296875, -17.650390625, -16.90673828125, -16.1630859375, -15.41943359375, -14.67578125, -13.93212890625, -13.1884765625, -12.44482421875, -11.701171875, -10.95751953125, -10.2138671875, -9.47021484375, -8.7265625, -7.98291015625, -7.2392578125, -6.49560546875, -5.751953125, -5.00830078125, -4.2646484375, -3.52099609375, -2.77734375, -2.03369140625, -1.2900390625, -0.54638671875, 0.197265625, 0.94091796875, 1.6845703125, 2.42822265625, 3.171875, 3.91552734375, 4.6591796875, 5.40283203125, 6.146484375, 6.89013671875, 7.6337890625, 8.37744140625, 9.12109375, 9.86474609375, 10.6083984375, 11.35205078125, 12.095703125, 12.83935546875, 13.5830078125, 14.32666015625, 15.0703125, 15.81396484375, 16.5576171875, 17.30126953125, 18.044921875, 18.78857421875, 19.5322265625, 20.27587890625, 21.01953125, 21.76318359375, 22.5068359375, 23.25048828125, 23.994140625, 24.73779296875, 25.4814453125, 26.22509765625, 26.96875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 15.0, 128.0, 419.0, 348.0, 93.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.20663452148438, -122.5921401977539, -119.97764587402344, -117.36315155029297, -114.7486572265625, -112.13416290283203, -109.51966857910156, -106.9051742553711, -104.29067993164062, -101.67618560791016, -99.06169128417969, -96.44719696044922, -93.83270263671875, -91.21820831298828, -88.60371398925781, -85.98921966552734, -83.37472534179688, -80.7602310180664, -78.14573669433594, -75.53124237060547, -72.916748046875, -70.30225372314453, -67.68775939941406, -65.0732650756836, -62.458778381347656, -59.84428405761719, -57.22978973388672, -54.61529541015625, -52.00080108642578, -49.38630676269531, -46.771812438964844, -44.157318115234375, -41.542823791503906, -38.92832946777344, -36.31383514404297, -33.6993408203125, -31.08484649658203, -28.470352172851562, -25.855859756469727, -23.241365432739258, -20.62687110900879, -18.01237678527832, -15.397882461547852, -12.7833890914917, -10.16889476776123, -7.554400444030762, -4.939907073974609, -2.3254127502441406, 0.2890815734863281, 2.9035756587982178, 5.518069744110107, 8.132563591003418, 10.747057914733887, 13.361552238464355, 15.976045608520508, 18.590539932250977, 21.205034255981445, 23.819528579711914, 26.434022903442383, 29.04851531982422, 31.663009643554688, 34.277503967285156, 36.891998291015625, 39.506492614746094, 42.12098693847656]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 2.0, 6.0, 5.0, 3.0, 8.0, 8.0, 20.0, 12.0, 15.0, 20.0, 17.0, 22.0, 20.0, 30.0, 30.0, 30.0, 21.0, 26.0, 26.0, 38.0, 43.0, 30.0, 43.0, 34.0, 42.0, 43.0, 38.0, 31.0, 29.0, 29.0, 31.0, 31.0, 30.0, 28.0, 21.0, 19.0, 20.0, 12.0, 11.0, 20.0, 14.0, 4.0, 6.0, 5.0, 5.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-19.546022415161133, -18.940147399902344, -18.334274291992188, -17.7283992767334, -17.12252426147461, -16.516651153564453, -15.910776138305664, -15.304901123046875, -14.699027061462402, -14.09315299987793, -13.48727798461914, -12.881403923034668, -12.275529861450195, -11.669654846191406, -11.063780784606934, -10.457906723022461, -9.852031707763672, -9.2461576461792, -8.64028263092041, -8.034408569335938, -7.428534030914307, -6.822659492492676, -6.216785430908203, -5.610910892486572, -5.005036354064941, -4.3991618156433105, -3.793287515640259, -3.187413215637207, -2.581538677215576, -1.9756641387939453, -1.3697898387908936, -0.7639155387878418, -0.15804100036621094, 0.44783341884613037, 1.0537078380584717, 1.659582257270813, 2.2654566764831543, 2.871331214904785, 3.477205514907837, 4.083079814910889, 4.6889543533325195, 5.29482889175415, 5.900703430175781, 6.506577491760254, 7.112452030181885, 7.718326568603516, 8.324200630187988, 8.930074691772461, 9.53594970703125, 10.141823768615723, 10.747698783874512, 11.353572845458984, 11.959447860717773, 12.565321922302246, 13.171195983886719, 13.777070999145508, 14.38294506072998, 14.988819122314453, 15.594694137573242, 16.20056915283203, 16.806442260742188, 17.412317276000977, 18.018192291259766, 18.624065399169922, 19.22994041442871]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 6.0, 8.0, 14.0, 5.0, 15.0, 14.0, 23.0, 22.0, 21.0, 36.0, 21.0, 24.0, 28.0, 36.0, 39.0, 41.0, 37.0, 54.0, 47.0, 50.0, 36.0, 33.0, 33.0, 39.0, 32.0, 27.0, 36.0, 33.0, 27.0, 21.0, 25.0, 18.0, 22.0, 17.0, 10.0, 6.0, 9.0, 4.0, 8.0, 4.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.7086029052734375, -1.651580810546875, -1.5945587158203125, -1.53753662109375, -1.4805145263671875, -1.423492431640625, -1.3664703369140625, -1.3094482421875, -1.2524261474609375, -1.195404052734375, -1.1383819580078125, -1.08135986328125, -1.0243377685546875, -0.967315673828125, -0.9102935791015625, -0.853271484375, -0.7962493896484375, -0.739227294921875, -0.6822052001953125, -0.62518310546875, -0.5681610107421875, -0.511138916015625, -0.4541168212890625, -0.3970947265625, -0.3400726318359375, -0.283050537109375, -0.2260284423828125, -0.16900634765625, -0.1119842529296875, -0.054962158203125, 0.0020599365234375, 0.05908203125, 0.1161041259765625, 0.173126220703125, 0.2301483154296875, 0.28717041015625, 0.3441925048828125, 0.401214599609375, 0.4582366943359375, 0.5152587890625, 0.5722808837890625, 0.629302978515625, 0.6863250732421875, 0.74334716796875, 0.8003692626953125, 0.857391357421875, 0.9144134521484375, 0.971435546875, 1.0284576416015625, 1.085479736328125, 1.1425018310546875, 1.19952392578125, 1.2565460205078125, 1.313568115234375, 1.3705902099609375, 1.4276123046875, 1.4846343994140625, 1.541656494140625, 1.5986785888671875, 1.65570068359375, 1.7127227783203125, 1.769744873046875, 1.8267669677734375, 1.8837890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 18.0, 34.0, 35.0, 53.0, 95.0, 123.0, 162.0, 242.0, 343.0, 485.0, 703.0, 982.0, 1342.0, 2046.0, 2951.0, 4046.0, 5863.0, 8603.0, 12257.0, 18097.0, 25922.0, 37961.0, 56120.0, 82040.0, 121085.0, 179530.0, 156154.0, 105044.0, 71146.0, 48567.0, 33044.0, 22677.0, 15613.0, 10739.0, 7465.0, 5314.0, 3536.0, 2429.0, 1707.0, 1210.0, 832.0, 554.0, 380.0, 338.0, 199.0, 117.0, 105.0, 75.0, 43.0, 47.0, 22.0, 27.0, 9.0, 8.0, 5.0, 1.0, 2.0], "bins": [-0.1602783203125, -0.1553936004638672, -0.15050888061523438, -0.14562416076660156, -0.14073944091796875, -0.13585472106933594, -0.13097000122070312, -0.1260852813720703, -0.1212005615234375, -0.11631584167480469, -0.11143112182617188, -0.10654640197753906, -0.10166168212890625, -0.09677696228027344, -0.09189224243164062, -0.08700752258300781, -0.082122802734375, -0.07723808288574219, -0.07235336303710938, -0.06746864318847656, -0.06258392333984375, -0.05769920349121094, -0.052814483642578125, -0.04792976379394531, -0.0430450439453125, -0.03816032409667969, -0.033275604248046875, -0.028390884399414062, -0.02350616455078125, -0.018621444702148438, -0.013736724853515625, -0.008852005004882812, -0.00396728515625, 0.0009174346923828125, 0.005802154541015625, 0.010686874389648438, 0.01557159423828125, 0.020456314086914062, 0.025341033935546875, 0.030225753784179688, 0.0351104736328125, 0.03999519348144531, 0.044879913330078125, 0.04976463317871094, 0.05464935302734375, 0.05953407287597656, 0.06441879272460938, 0.06930351257324219, 0.074188232421875, 0.07907295227050781, 0.08395767211914062, 0.08884239196777344, 0.09372711181640625, 0.09861183166503906, 0.10349655151367188, 0.10838127136230469, 0.1132659912109375, 0.11815071105957031, 0.12303543090820312, 0.12792015075683594, 0.13280487060546875, 0.13768959045410156, 0.14257431030273438, 0.1474590301513672, 0.15234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 5.0, 9.0, 12.0, 15.0, 16.0, 21.0, 25.0, 24.0, 30.0, 33.0, 32.0, 39.0, 40.0, 40.0, 51.0, 37.0, 41.0, 1066.0, 47.0, 43.0, 41.0, 36.0, 49.0, 37.0, 31.0, 41.0, 28.0, 31.0, 17.0, 22.0, 11.0, 8.0, 8.0, 6.0, 7.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.120361328125, -1.07958984375, -1.038818359375, -0.998046875, -0.957275390625, -0.91650390625, -0.875732421875, -0.8349609375, -0.794189453125, -0.75341796875, -0.712646484375, -0.671875, -0.631103515625, -0.59033203125, -0.549560546875, -0.5087890625, -0.468017578125, -0.42724609375, -0.386474609375, -0.345703125, -0.304931640625, -0.26416015625, -0.223388671875, -0.1826171875, -0.141845703125, -0.10107421875, -0.060302734375, -0.01953125, 0.021240234375, 0.06201171875, 0.102783203125, 0.1435546875, 0.184326171875, 0.22509765625, 0.265869140625, 0.306640625, 0.347412109375, 0.38818359375, 0.428955078125, 0.4697265625, 0.510498046875, 0.55126953125, 0.592041015625, 0.6328125, 0.673583984375, 0.71435546875, 0.755126953125, 0.7958984375, 0.836669921875, 0.87744140625, 0.918212890625, 0.958984375, 0.999755859375, 1.04052734375, 1.081298828125, 1.1220703125, 1.162841796875, 1.20361328125, 1.244384765625, 1.28515625, 1.325927734375, 1.36669921875, 1.407470703125, 1.4482421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 4.0, 11.0, 25.0, 21.0, 38.0, 66.0, 105.0, 125.0, 218.0, 343.0, 562.0, 824.0, 1291.0, 1957.0, 2962.0, 4584.0, 7175.0, 11399.0, 18602.0, 30291.0, 50752.0, 85862.0, 144124.0, 1273329.0, 185120.0, 110669.0, 65080.0, 38977.0, 23387.0, 14292.0, 8969.0, 5562.0, 3619.0, 2344.0, 1550.0, 993.0, 603.0, 467.0, 289.0, 196.0, 131.0, 85.0, 55.0, 31.0, 13.0, 17.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181884765625, -0.17596817016601562, -0.17005157470703125, -0.16413497924804688, -0.1582183837890625, -0.15230178833007812, -0.14638519287109375, -0.14046859741210938, -0.134552001953125, -0.12863540649414062, -0.12271881103515625, -0.11680221557617188, -0.1108856201171875, -0.10496902465820312, -0.09905242919921875, -0.09313583374023438, -0.08721923828125, -0.08130264282226562, -0.07538604736328125, -0.06946945190429688, -0.0635528564453125, -0.057636260986328125, -0.05171966552734375, -0.045803070068359375, -0.039886474609375, -0.033969879150390625, -0.02805328369140625, -0.022136688232421875, -0.0162200927734375, -0.010303497314453125, -0.00438690185546875, 0.001529693603515625, 0.0074462890625, 0.013362884521484375, 0.01927947998046875, 0.025196075439453125, 0.0311126708984375, 0.037029266357421875, 0.04294586181640625, 0.048862457275390625, 0.054779052734375, 0.060695648193359375, 0.06661224365234375, 0.07252883911132812, 0.0784454345703125, 0.08436203002929688, 0.09027862548828125, 0.09619522094726562, 0.10211181640625, 0.10802841186523438, 0.11394500732421875, 0.11986160278320312, 0.1257781982421875, 0.13169479370117188, 0.13761138916015625, 0.14352798461914062, 0.149444580078125, 0.15536117553710938, 0.16127777099609375, 0.16719436645507812, 0.1731109619140625, 0.17902755737304688, 0.18494415283203125, 0.19086074829101562, 0.19677734375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 12.0, 6.0, 16.0, 16.0, 22.0, 19.0, 28.0, 38.0, 40.0, 62.0, 69.0, 67.0, 79.0, 82.0, 70.0, 60.0, 64.0, 45.0, 36.0, 34.0, 24.0, 18.0, 19.0, 12.0, 12.0, 6.0, 7.0, 5.0, 6.0, 3.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008111000061035156, -0.0007812902331352234, -0.0007514804601669312, -0.0007216706871986389, -0.0006918609142303467, -0.0006620511412620544, -0.0006322413682937622, -0.00060243159532547, -0.0005726218223571777, -0.0005428120493888855, -0.0005130022764205933, -0.000483192503452301, -0.0004533827304840088, -0.00042357295751571655, -0.0003937631845474243, -0.0003639534115791321, -0.00033414363861083984, -0.0003043338656425476, -0.00027452409267425537, -0.00024471431970596313, -0.0002149045467376709, -0.00018509477376937866, -0.00015528500080108643, -0.0001254752278327942, -9.566545486450195e-05, -6.585568189620972e-05, -3.604590892791748e-05, -6.236135959625244e-06, 2.3573637008666992e-05, 5.338340997695923e-05, 8.319318294525146e-05, 0.0001130029559135437, 0.00014281272888183594, 0.00017262250185012817, 0.0002024322748184204, 0.00023224204778671265, 0.0002620518207550049, 0.0002918615937232971, 0.00032167136669158936, 0.0003514811396598816, 0.00038129091262817383, 0.00041110068559646606, 0.0004409104585647583, 0.00047072023153305054, 0.0005005300045013428, 0.000530339777469635, 0.0005601495504379272, 0.0005899593234062195, 0.0006197690963745117, 0.000649578869342804, 0.0006793886423110962, 0.0007091984152793884, 0.0007390081882476807, 0.0007688179612159729, 0.0007986277341842651, 0.0008284375071525574, 0.0008582472801208496, 0.0008880570530891418, 0.0009178668260574341, 0.0009476765990257263, 0.0009774863719940186, 0.0010072961449623108, 0.001037105917930603, 0.0010669156908988953, 0.0010967254638671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 8.0, 8.0, 5.0, 16.0, 18.0, 27.0, 42.0, 40.0, 68.0, 65.0, 93.0, 132.0, 233.0, 434.0, 961.0, 173823.0, 870042.0, 1250.0, 485.0, 270.0, 168.0, 88.0, 65.0, 56.0, 51.0, 27.0, 22.0, 15.0, 19.0, 6.0, 3.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.02181696891784668, -0.02115774154663086, -0.02049851417541504, -0.01983928680419922, -0.0191800594329834, -0.018520832061767578, -0.017861604690551758, -0.017202377319335938, -0.016543149948120117, -0.015883922576904297, -0.015224695205688477, -0.014565467834472656, -0.013906240463256836, -0.013247013092041016, -0.012587785720825195, -0.011928558349609375, -0.011269330978393555, -0.010610103607177734, -0.009950876235961914, -0.009291648864746094, -0.008632421493530273, -0.007973194122314453, -0.007313966751098633, -0.0066547393798828125, -0.005995512008666992, -0.005336284637451172, -0.0046770572662353516, -0.004017829895019531, -0.003358602523803711, -0.0026993751525878906, -0.0020401477813720703, -0.00138092041015625, -0.0007216930389404297, -6.246566772460938e-05, 0.0005967617034912109, 0.0012559890747070312, 0.0019152164459228516, 0.002574443817138672, 0.003233671188354492, 0.0038928985595703125, 0.004552125930786133, 0.005211353302001953, 0.0058705806732177734, 0.006529808044433594, 0.007189035415649414, 0.007848262786865234, 0.008507490158081055, 0.009166717529296875, 0.009825944900512695, 0.010485172271728516, 0.011144399642944336, 0.011803627014160156, 0.012462854385375977, 0.013122081756591797, 0.013781309127807617, 0.014440536499023438, 0.015099763870239258, 0.015758991241455078, 0.0164182186126709, 0.01707744598388672, 0.01773667335510254, 0.01839590072631836, 0.01905512809753418, 0.01971435546875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 44.0, 288.0, 473.0, 168.0, 36.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013142033712938428, -0.0012462243903428316, -0.0011782454093918204, -0.0011102664284408092, -0.00104228756390512, -0.0009743085247464478, -0.0009063296020030975, -0.0008383506210520864, -0.0007703716401010752, -0.000702392659150064, -0.0006344136781990528, -0.0005664347554557025, -0.0004984557745046914, -0.0004304767935536802, -0.00036249784170649946, -0.00029451888985931873, -0.00022653990890830755, -0.0001585609425092116, -9.058197611011565e-05, -2.2603009711019695e-05, 4.537595668807626e-05, 0.00011335493763908744, 0.00018133388948626816, 0.0002493128413334489, 0.00031729182228446007, 0.00038527080323547125, 0.00045324975508265197, 0.0005212287069298327, 0.0005892076878808439, 0.0006571866688318551, 0.0007251655915752053, 0.0007931445725262165, 0.0008611234370619059, 0.000929102418012917, 0.0009970813989639282, 0.0010650603799149394, 0.0011330393608659506, 0.00120101822540164, 0.0012689972063526511, 0.0013369761873036623, 0.0014049551682546735, 0.0014729341492056847, 0.0015409131301566958, 0.001608892111107707, 0.0016768709756433964, 0.0017448500730097294, 0.0018128289375454187, 0.00188080791849643, 0.001948786899447441, 0.0020167657639831305, 0.0020847448613494635, 0.002152723725885153, 0.002220702823251486, 0.002288681687787175, 0.002356660785153508, 0.0024246396496891975, 0.0024926187470555305, 0.00256059761159122, 0.002628576708957553, 0.0026965555734932423, 0.0027645346708595753, 0.0028325135353952646, 0.0029004926327615976, 0.002968471497297287, 0.0030364503618329763]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 11.0, 10.0, 14.0, 19.0, 14.0, 28.0, 27.0, 33.0, 27.0, 34.0, 42.0, 34.0, 38.0, 37.0, 51.0, 58.0, 50.0, 40.0, 34.0, 44.0, 37.0, 35.0, 41.0, 34.0, 36.0, 25.0, 18.0, 25.0, 22.0, 20.0, 12.0, 7.0, 11.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044536590576171875, -0.0004313727840781212, -0.0004173796623945236, -0.00040338654071092606, -0.0003893934190273285, -0.0003754002973437309, -0.00036140717566013336, -0.0003474140539765358, -0.00033342093229293823, -0.00031942781060934067, -0.0003054346889257431, -0.00029144156724214554, -0.000277448445558548, -0.0002634553238749504, -0.00024946220219135284, -0.00023546908050775528, -0.00022147595882415771, -0.00020748283714056015, -0.00019348971545696259, -0.00017949659377336502, -0.00016550347208976746, -0.0001515103504061699, -0.00013751722872257233, -0.00012352410703897476, -0.0001095309853553772, -9.553786367177963e-05, -8.154474198818207e-05, -6.75516203045845e-05, -5.355849862098694e-05, -3.9565376937389374e-05, -2.557225525379181e-05, -1.1579133570194244e-05, 2.4139881134033203e-06, 1.6407109797000885e-05, 3.040023148059845e-05, 4.4393353164196014e-05, 5.838647484779358e-05, 7.237959653139114e-05, 8.637271821498871e-05, 0.00010036583989858627, 0.00011435896158218384, 0.0001283520832657814, 0.00014234520494937897, 0.00015633832663297653, 0.0001703314483165741, 0.00018432457000017166, 0.00019831769168376923, 0.0002123108133673668, 0.00022630393505096436, 0.00024029705673456192, 0.0002542901784181595, 0.00026828330010175705, 0.0002822764217853546, 0.0002962695434689522, 0.00031026266515254974, 0.0003242557868361473, 0.0003382489085197449, 0.00035224203020334244, 0.00036623515188694, 0.00038022827357053757, 0.00039422139525413513, 0.0004082145169377327, 0.00042220763862133026, 0.0004362007603049278, 0.0004501938819885254]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 6.0, 8.0, 14.0, 5.0, 15.0, 14.0, 23.0, 22.0, 21.0, 36.0, 21.0, 24.0, 28.0, 36.0, 39.0, 41.0, 37.0, 54.0, 47.0, 50.0, 36.0, 33.0, 33.0, 39.0, 32.0, 27.0, 36.0, 33.0, 27.0, 21.0, 25.0, 18.0, 22.0, 17.0, 10.0, 6.0, 9.0, 4.0, 8.0, 4.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.7086029052734375, -1.651580810546875, -1.5945587158203125, -1.53753662109375, -1.4805145263671875, -1.423492431640625, -1.3664703369140625, -1.3094482421875, -1.2524261474609375, -1.195404052734375, -1.1383819580078125, -1.08135986328125, -1.0243377685546875, -0.967315673828125, -0.9102935791015625, -0.853271484375, -0.7962493896484375, -0.739227294921875, -0.6822052001953125, -0.62518310546875, -0.5681610107421875, -0.511138916015625, -0.4541168212890625, -0.3970947265625, -0.3400726318359375, -0.283050537109375, -0.2260284423828125, -0.16900634765625, -0.1119842529296875, -0.054962158203125, 0.0020599365234375, 0.05908203125, 0.1161041259765625, 0.173126220703125, 0.2301483154296875, 0.28717041015625, 0.3441925048828125, 0.401214599609375, 0.4582366943359375, 0.5152587890625, 0.5722808837890625, 0.629302978515625, 0.6863250732421875, 0.74334716796875, 0.8003692626953125, 0.857391357421875, 0.9144134521484375, 0.971435546875, 1.0284576416015625, 1.085479736328125, 1.1425018310546875, 1.19952392578125, 1.2565460205078125, 1.313568115234375, 1.3705902099609375, 1.4276123046875, 1.4846343994140625, 1.541656494140625, 1.5986785888671875, 1.65570068359375, 1.7127227783203125, 1.769744873046875, 1.8267669677734375, 1.8837890625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 7.0, 20.0, 16.0, 31.0, 41.0, 51.0, 72.0, 108.0, 186.0, 267.0, 403.0, 664.0, 1238.0, 2444.0, 5369.0, 13257.0, 35087.0, 100826.0, 274766.0, 361411.0, 161595.0, 55651.0, 20056.0, 7647.0, 3315.0, 1649.0, 900.0, 537.0, 293.0, 214.0, 123.0, 98.0, 51.0, 52.0, 34.0, 21.0, 11.0, 15.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.267578125, -2.189971923828125, -2.11236572265625, -2.034759521484375, -1.9571533203125, -1.879547119140625, -1.80194091796875, -1.724334716796875, -1.646728515625, -1.569122314453125, -1.49151611328125, -1.413909912109375, -1.3363037109375, -1.258697509765625, -1.18109130859375, -1.103485107421875, -1.02587890625, -0.948272705078125, -0.87066650390625, -0.793060302734375, -0.7154541015625, -0.637847900390625, -0.56024169921875, -0.482635498046875, -0.405029296875, -0.327423095703125, -0.24981689453125, -0.172210693359375, -0.0946044921875, -0.016998291015625, 0.06060791015625, 0.138214111328125, 0.2158203125, 0.293426513671875, 0.37103271484375, 0.448638916015625, 0.5262451171875, 0.603851318359375, 0.68145751953125, 0.759063720703125, 0.836669921875, 0.914276123046875, 0.99188232421875, 1.069488525390625, 1.1470947265625, 1.224700927734375, 1.30230712890625, 1.379913330078125, 1.45751953125, 1.535125732421875, 1.61273193359375, 1.690338134765625, 1.7679443359375, 1.845550537109375, 1.92315673828125, 2.000762939453125, 2.078369140625, 2.155975341796875, 2.23358154296875, 2.311187744140625, 2.3887939453125, 2.466400146484375, 2.54400634765625, 2.621612548828125, 2.69921875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 6.0, 7.0, 4.0, 16.0, 11.0, 15.0, 14.0, 21.0, 20.0, 22.0, 19.0, 30.0, 34.0, 33.0, 39.0, 46.0, 53.0, 73.0, 163.0, 355.0, 1380.0, 180.0, 97.0, 59.0, 48.0, 32.0, 26.0, 42.0, 25.0, 35.0, 18.0, 21.0, 13.0, 13.0, 14.0, 13.0, 10.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.37890625, -6.18603515625, -5.9931640625, -5.80029296875, -5.607421875, -5.41455078125, -5.2216796875, -5.02880859375, -4.8359375, -4.64306640625, -4.4501953125, -4.25732421875, -4.064453125, -3.87158203125, -3.6787109375, -3.48583984375, -3.29296875, -3.10009765625, -2.9072265625, -2.71435546875, -2.521484375, -2.32861328125, -2.1357421875, -1.94287109375, -1.75, -1.55712890625, -1.3642578125, -1.17138671875, -0.978515625, -0.78564453125, -0.5927734375, -0.39990234375, -0.20703125, -0.01416015625, 0.1787109375, 0.37158203125, 0.564453125, 0.75732421875, 0.9501953125, 1.14306640625, 1.3359375, 1.52880859375, 1.7216796875, 1.91455078125, 2.107421875, 2.30029296875, 2.4931640625, 2.68603515625, 2.87890625, 3.07177734375, 3.2646484375, 3.45751953125, 3.650390625, 3.84326171875, 4.0361328125, 4.22900390625, 4.421875, 4.61474609375, 4.8076171875, 5.00048828125, 5.193359375, 5.38623046875, 5.5791015625, 5.77197265625, 5.96484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 5.0, 11.0, 9.0, 15.0, 10.0, 11.0, 15.0, 12.0, 21.0, 37.0, 47.0, 45.0, 55.0, 94.0, 133.0, 308.0, 622.0, 2551.0, 58386.0, 2994003.0, 84910.0, 2867.0, 665.0, 298.0, 154.0, 96.0, 63.0, 47.0, 36.0, 26.0, 24.0, 20.0, 20.0, 12.0, 21.0, 11.0, 6.0, 7.0, 3.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.390625, -11.98486328125, -11.5791015625, -11.17333984375, -10.767578125, -10.36181640625, -9.9560546875, -9.55029296875, -9.14453125, -8.73876953125, -8.3330078125, -7.92724609375, -7.521484375, -7.11572265625, -6.7099609375, -6.30419921875, -5.8984375, -5.49267578125, -5.0869140625, -4.68115234375, -4.275390625, -3.86962890625, -3.4638671875, -3.05810546875, -2.65234375, -2.24658203125, -1.8408203125, -1.43505859375, -1.029296875, -0.62353515625, -0.2177734375, 0.18798828125, 0.59375, 0.99951171875, 1.4052734375, 1.81103515625, 2.216796875, 2.62255859375, 3.0283203125, 3.43408203125, 3.83984375, 4.24560546875, 4.6513671875, 5.05712890625, 5.462890625, 5.86865234375, 6.2744140625, 6.68017578125, 7.0859375, 7.49169921875, 7.8974609375, 8.30322265625, 8.708984375, 9.11474609375, 9.5205078125, 9.92626953125, 10.33203125, 10.73779296875, 11.1435546875, 11.54931640625, 11.955078125, 12.36083984375, 12.7666015625, 13.17236328125, 13.578125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 13.0, 91.0, 366.0, 417.0, 107.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.62337112426758, -49.66758728027344, -48.71180725097656, -47.75602340698242, -46.80023956298828, -45.84445571899414, -44.888671875, -43.932891845703125, -42.977108001708984, -42.021324157714844, -41.06554412841797, -40.10976028442383, -39.15397644042969, -38.19819259643555, -37.242408752441406, -36.28662872314453, -35.33084487915039, -34.37506103515625, -33.419281005859375, -32.463497161865234, -31.507713317871094, -30.551929473876953, -29.596147537231445, -28.640365600585938, -27.684581756591797, -26.728797912597656, -25.77301597595215, -24.81723403930664, -23.8614501953125, -22.90566635131836, -21.94988441467285, -20.994102478027344, -20.038318634033203, -19.082534790039062, -18.126752853393555, -17.170970916748047, -16.215187072753906, -15.259404182434082, -14.303621292114258, -13.347838401794434, -12.392054557800293, -11.436271667480469, -10.480488777160645, -9.52470588684082, -8.568922996520996, -7.613140106201172, -6.657357215881348, -5.701574325561523, -4.745791435241699, -3.790008544921875, -2.834225654602051, -1.8784427642822266, -0.9226598739624023, 0.033123016357421875, 0.9889059066772461, 1.9446887969970703, 2.9004716873168945, 3.8562545776367188, 4.812037467956543, 5.767820358276367, 6.723603248596191, 7.679386138916016, 8.63516902923584, 9.590951919555664, 10.546734809875488]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 6.0, 11.0, 8.0, 9.0, 15.0, 11.0, 20.0, 19.0, 22.0, 11.0, 21.0, 35.0, 31.0, 30.0, 45.0, 39.0, 32.0, 32.0, 45.0, 37.0, 43.0, 47.0, 42.0, 35.0, 33.0, 31.0, 32.0, 23.0, 36.0, 31.0, 22.0, 23.0, 17.0, 21.0, 15.0, 10.0, 14.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-18.093278884887695, -17.512300491333008, -16.931324005126953, -16.350345611572266, -15.769367218017578, -15.18838882446289, -14.60741138458252, -14.026433944702148, -13.445455551147461, -12.864477157592773, -12.283499717712402, -11.702522277832031, -11.121543884277344, -10.540565490722656, -9.959588050842285, -9.378610610961914, -8.797632217407227, -8.216653823852539, -7.635676383972168, -7.054698467254639, -6.473720550537109, -5.89274263381958, -5.311764717102051, -4.7307868003845215, -4.149808883666992, -3.568830966949463, -2.9878530502319336, -2.4068751335144043, -1.825897216796875, -1.2449193000793457, -0.6639413833618164, -0.08296346664428711, 0.4980144500732422, 1.0789923667907715, 1.6599702835083008, 2.24094820022583, 2.8219261169433594, 3.4029040336608887, 3.983881950378418, 4.564859867095947, 5.145837783813477, 5.726815700531006, 6.307793617248535, 6.8887715339660645, 7.469749450683594, 8.050727844238281, 8.631705284118652, 9.212682723999023, 9.793661117553711, 10.374639511108398, 10.95561695098877, 11.53659439086914, 12.117572784423828, 12.698551177978516, 13.279528617858887, 13.860506057739258, 14.441484451293945, 15.022462844848633, 15.603440284729004, 16.184417724609375, 16.765396118164062, 17.34637451171875, 17.927352905273438, 18.508329391479492, 19.08930778503418]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 12.0, 8.0, 12.0, 15.0, 24.0, 23.0, 30.0, 24.0, 22.0, 28.0, 26.0, 35.0, 36.0, 40.0, 42.0, 53.0, 46.0, 42.0, 45.0, 37.0, 27.0, 35.0, 37.0, 33.0, 34.0, 32.0, 25.0, 23.0, 25.0, 19.0, 14.0, 18.0, 14.0, 10.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.727783203125, -1.66845703125, -1.609130859375, -1.5498046875, -1.490478515625, -1.43115234375, -1.371826171875, -1.3125, -1.253173828125, -1.19384765625, -1.134521484375, -1.0751953125, -1.015869140625, -0.95654296875, -0.897216796875, -0.837890625, -0.778564453125, -0.71923828125, -0.659912109375, -0.6005859375, -0.541259765625, -0.48193359375, -0.422607421875, -0.36328125, -0.303955078125, -0.24462890625, -0.185302734375, -0.1259765625, -0.066650390625, -0.00732421875, 0.052001953125, 0.111328125, 0.170654296875, 0.22998046875, 0.289306640625, 0.3486328125, 0.407958984375, 0.46728515625, 0.526611328125, 0.5859375, 0.645263671875, 0.70458984375, 0.763916015625, 0.8232421875, 0.882568359375, 0.94189453125, 1.001220703125, 1.060546875, 1.119873046875, 1.17919921875, 1.238525390625, 1.2978515625, 1.357177734375, 1.41650390625, 1.475830078125, 1.53515625, 1.594482421875, 1.65380859375, 1.713134765625, 1.7724609375, 1.831787109375, 1.89111328125, 1.950439453125, 2.009765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 7.0, 8.0, 8.0, 13.0, 11.0, 24.0, 22.0, 32.0, 42.0, 48.0, 63.0, 123.0, 176.0, 297.0, 547.0, 1318.0, 4183.0, 19269.0, 140089.0, 1632175.0, 2155341.0, 206769.0, 25527.0, 5127.0, 1442.0, 634.0, 369.0, 193.0, 109.0, 70.0, 51.0, 42.0, 23.0, 25.0, 29.0, 14.0, 14.0, 8.0, 9.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.1875, -5.99462890625, -5.8017578125, -5.60888671875, -5.416015625, -5.22314453125, -5.0302734375, -4.83740234375, -4.64453125, -4.45166015625, -4.2587890625, -4.06591796875, -3.873046875, -3.68017578125, -3.4873046875, -3.29443359375, -3.1015625, -2.90869140625, -2.7158203125, -2.52294921875, -2.330078125, -2.13720703125, -1.9443359375, -1.75146484375, -1.55859375, -1.36572265625, -1.1728515625, -0.97998046875, -0.787109375, -0.59423828125, -0.4013671875, -0.20849609375, -0.015625, 0.17724609375, 0.3701171875, 0.56298828125, 0.755859375, 0.94873046875, 1.1416015625, 1.33447265625, 1.52734375, 1.72021484375, 1.9130859375, 2.10595703125, 2.298828125, 2.49169921875, 2.6845703125, 2.87744140625, 3.0703125, 3.26318359375, 3.4560546875, 3.64892578125, 3.841796875, 4.03466796875, 4.2275390625, 4.42041015625, 4.61328125, 4.80615234375, 4.9990234375, 5.19189453125, 5.384765625, 5.57763671875, 5.7705078125, 5.96337890625, 6.15625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 15.0, 7.0, 15.0, 35.0, 45.0, 53.0, 74.0, 114.0, 181.0, 232.0, 304.0, 409.0, 487.0, 535.0, 435.0, 302.0, 235.0, 168.0, 122.0, 77.0, 67.0, 52.0, 30.0, 24.0, 13.0, 12.0, 7.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.0, -8.7755126953125, -8.551025390625, -8.3265380859375, -8.10205078125, -7.8775634765625, -7.653076171875, -7.4285888671875, -7.2041015625, -6.9796142578125, -6.755126953125, -6.5306396484375, -6.30615234375, -6.0816650390625, -5.857177734375, -5.6326904296875, -5.408203125, -5.1837158203125, -4.959228515625, -4.7347412109375, -4.51025390625, -4.2857666015625, -4.061279296875, -3.8367919921875, -3.6123046875, -3.3878173828125, -3.163330078125, -2.9388427734375, -2.71435546875, -2.4898681640625, -2.265380859375, -2.0408935546875, -1.81640625, -1.5919189453125, -1.367431640625, -1.1429443359375, -0.91845703125, -0.6939697265625, -0.469482421875, -0.2449951171875, -0.0205078125, 0.2039794921875, 0.428466796875, 0.6529541015625, 0.87744140625, 1.1019287109375, 1.326416015625, 1.5509033203125, 1.775390625, 1.9998779296875, 2.224365234375, 2.4488525390625, 2.67333984375, 2.8978271484375, 3.122314453125, 3.3468017578125, 3.5712890625, 3.7957763671875, 4.020263671875, 4.2447509765625, 4.46923828125, 4.6937255859375, 4.918212890625, 5.1427001953125, 5.3671875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 17.0, 25.0, 28.0, 56.0, 60.0, 87.0, 155.0, 313.0, 605.0, 1612.0, 7136.0, 90538.0, 2529127.0, 1503705.0, 53298.0, 5003.0, 1203.0, 525.0, 270.0, 163.0, 109.0, 71.0, 32.0, 34.0, 29.0, 23.0, 11.0, 8.0, 0.0, 4.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.358154296875, -8.88818359375, -8.418212890625, -7.9482421875, -7.478271484375, -7.00830078125, -6.538330078125, -6.068359375, -5.598388671875, -5.12841796875, -4.658447265625, -4.1884765625, -3.718505859375, -3.24853515625, -2.778564453125, -2.30859375, -1.838623046875, -1.36865234375, -0.898681640625, -0.4287109375, 0.041259765625, 0.51123046875, 0.981201171875, 1.451171875, 1.921142578125, 2.39111328125, 2.861083984375, 3.3310546875, 3.801025390625, 4.27099609375, 4.740966796875, 5.2109375, 5.680908203125, 6.15087890625, 6.620849609375, 7.0908203125, 7.560791015625, 8.03076171875, 8.500732421875, 8.970703125, 9.440673828125, 9.91064453125, 10.380615234375, 10.8505859375, 11.320556640625, 11.79052734375, 12.260498046875, 12.73046875, 13.200439453125, 13.67041015625, 14.140380859375, 14.6103515625, 15.080322265625, 15.55029296875, 16.020263671875, 16.490234375, 16.960205078125, 17.43017578125, 17.900146484375, 18.3701171875, 18.840087890625, 19.31005859375, 19.780029296875, 20.25]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 23.0, 74.0, 175.0, 272.0, 239.0, 139.0, 68.0, 16.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.91654205322266, -82.16390991210938, -80.4112777709961, -78.65864562988281, -76.90602111816406, -75.15338897705078, -73.4007568359375, -71.64812469482422, -69.89549255371094, -68.14286041259766, -66.39022827148438, -64.6375961303711, -62.88496780395508, -61.13233947753906, -59.37970733642578, -57.6270751953125, -55.87444305419922, -54.12181091308594, -52.36918258666992, -50.61655044555664, -48.86391830444336, -47.111289978027344, -45.35865783691406, -43.60602569580078, -41.853397369384766, -40.100765228271484, -38.34813690185547, -36.59550476074219, -34.842872619628906, -33.090240478515625, -31.33761215209961, -29.584980010986328, -27.832347869873047, -26.0797176361084, -24.327085494995117, -22.57445526123047, -20.821823120117188, -19.06919288635254, -17.31656265258789, -15.56393051147461, -13.811299324035645, -12.05866813659668, -10.306036949157715, -8.55340576171875, -6.800775051116943, -5.048144340515137, -3.295513153076172, -1.542881965637207, 0.2097492218017578, 1.962380290031433, 3.7150113582611084, 5.467642307281494, 7.220273494720459, 8.972904205322266, 10.72553539276123, 12.478166580200195, 14.23079776763916, 15.983428955078125, 17.736059188842773, 19.488691329956055, 21.241321563720703, 22.993953704833984, 24.746583938598633, 26.49921417236328, 28.251846313476562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 5.0, 13.0, 12.0, 16.0, 14.0, 20.0, 20.0, 26.0, 22.0, 25.0, 23.0, 36.0, 39.0, 37.0, 28.0, 40.0, 34.0, 35.0, 46.0, 30.0, 47.0, 30.0, 38.0, 44.0, 33.0, 30.0, 28.0, 22.0, 29.0, 27.0, 17.0, 25.0, 11.0, 17.0, 9.0, 14.0, 8.0, 8.0, 9.0, 11.0, 4.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.723770141601562, -19.109909057617188, -18.49604606628418, -17.882183074951172, -17.268321990966797, -16.654460906982422, -16.040597915649414, -15.426735877990723, -14.812873840332031, -14.19901180267334, -13.585149765014648, -12.971287727355957, -12.357425689697266, -11.743563652038574, -11.129701614379883, -10.515839576721191, -9.9019775390625, -9.288115501403809, -8.674253463745117, -8.060391426086426, -7.446529388427734, -6.832667350769043, -6.218805313110352, -5.60494327545166, -4.991081237792969, -4.377219200134277, -3.763357162475586, -3.1494951248168945, -2.535633087158203, -1.9217710494995117, -1.3079090118408203, -0.6940469741821289, -0.08018302917480469, 0.5336790084838867, 1.1475410461425781, 1.7614030838012695, 2.375265121459961, 2.9891271591186523, 3.6029891967773438, 4.216851234436035, 4.830713272094727, 5.444575309753418, 6.058437347412109, 6.672299385070801, 7.286161422729492, 7.900023460388184, 8.513885498046875, 9.127747535705566, 9.741609573364258, 10.35547161102295, 10.96933364868164, 11.583195686340332, 12.197057723999023, 12.810919761657715, 13.424781799316406, 14.038643836975098, 14.652505874633789, 15.26636791229248, 15.880229949951172, 16.494091033935547, 17.107954025268555, 17.721817016601562, 18.335678100585938, 18.949539184570312, 19.56340217590332]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 6.0, 13.0, 13.0, 16.0, 18.0, 16.0, 27.0, 20.0, 24.0, 26.0, 28.0, 28.0, 30.0, 32.0, 33.0, 39.0, 38.0, 45.0, 39.0, 45.0, 42.0, 34.0, 37.0, 30.0, 38.0, 28.0, 25.0, 25.0, 34.0, 20.0, 23.0, 17.0, 17.0, 18.0, 14.0, 9.0, 5.0, 9.0, 12.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662109375, -1.60418701171875, -1.5462646484375, -1.48834228515625, -1.430419921875, -1.37249755859375, -1.3145751953125, -1.25665283203125, -1.19873046875, -1.14080810546875, -1.0828857421875, -1.02496337890625, -0.967041015625, -0.90911865234375, -0.8511962890625, -0.79327392578125, -0.7353515625, -0.67742919921875, -0.6195068359375, -0.56158447265625, -0.503662109375, -0.44573974609375, -0.3878173828125, -0.32989501953125, -0.27197265625, -0.21405029296875, -0.1561279296875, -0.09820556640625, -0.040283203125, 0.01763916015625, 0.0755615234375, 0.13348388671875, 0.19140625, 0.24932861328125, 0.3072509765625, 0.36517333984375, 0.423095703125, 0.48101806640625, 0.5389404296875, 0.59686279296875, 0.65478515625, 0.71270751953125, 0.7706298828125, 0.82855224609375, 0.886474609375, 0.94439697265625, 1.0023193359375, 1.06024169921875, 1.1181640625, 1.17608642578125, 1.2340087890625, 1.29193115234375, 1.349853515625, 1.40777587890625, 1.4656982421875, 1.52362060546875, 1.58154296875, 1.63946533203125, 1.6973876953125, 1.75531005859375, 1.813232421875, 1.87115478515625, 1.9290771484375, 1.98699951171875, 2.044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 13.0, 12.0, 9.0, 18.0, 29.0, 43.0, 42.0, 97.0, 107.0, 152.0, 258.0, 358.0, 556.0, 746.0, 1041.0, 1593.0, 2387.0, 3478.0, 5201.0, 7766.0, 11804.0, 17881.0, 26873.0, 41495.0, 62686.0, 95654.0, 148832.0, 196063.0, 146643.0, 94225.0, 62085.0, 40547.0, 26608.0, 17796.0, 11680.0, 7799.0, 5253.0, 3384.0, 2386.0, 1641.0, 1069.0, 764.0, 479.0, 352.0, 201.0, 149.0, 98.0, 73.0, 46.0, 30.0, 26.0, 17.0, 12.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.175537109375, -0.16977882385253906, -0.16402053833007812, -0.1582622528076172, -0.15250396728515625, -0.1467456817626953, -0.14098739624023438, -0.13522911071777344, -0.1294708251953125, -0.12371253967285156, -0.11795425415039062, -0.11219596862792969, -0.10643768310546875, -0.10067939758300781, -0.09492111206054688, -0.08916282653808594, -0.083404541015625, -0.07764625549316406, -0.07188796997070312, -0.06612968444824219, -0.06037139892578125, -0.05461311340332031, -0.048854827880859375, -0.04309654235839844, -0.0373382568359375, -0.03157997131347656, -0.025821685791015625, -0.020063400268554688, -0.01430511474609375, -0.008546829223632812, -0.002788543701171875, 0.0029697418212890625, 0.00872802734375, 0.014486312866210938, 0.020244598388671875, 0.026002883911132812, 0.03176116943359375, 0.03751945495605469, 0.043277740478515625, 0.04903602600097656, 0.0547943115234375, 0.06055259704589844, 0.06631088256835938, 0.07206916809082031, 0.07782745361328125, 0.08358573913574219, 0.08934402465820312, 0.09510231018066406, 0.100860595703125, 0.10661888122558594, 0.11237716674804688, 0.11813545227050781, 0.12389373779296875, 0.1296520233154297, 0.13541030883789062, 0.14116859436035156, 0.1469268798828125, 0.15268516540527344, 0.15844345092773438, 0.1642017364501953, 0.16996002197265625, 0.1757183074951172, 0.18147659301757812, 0.18723487854003906, 0.1929931640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 2.0, 8.0, 7.0, 10.0, 19.0, 17.0, 14.0, 20.0, 32.0, 22.0, 30.0, 31.0, 31.0, 29.0, 31.0, 42.0, 36.0, 40.0, 47.0, 1064.0, 45.0, 46.0, 38.0, 47.0, 28.0, 28.0, 37.0, 30.0, 31.0, 30.0, 22.0, 15.0, 16.0, 15.0, 10.0, 14.0, 12.0, 9.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.1314697265625, -1.092041015625, -1.0526123046875, -1.01318359375, -0.9737548828125, -0.934326171875, -0.8948974609375, -0.85546875, -0.8160400390625, -0.776611328125, -0.7371826171875, -0.69775390625, -0.6583251953125, -0.618896484375, -0.5794677734375, -0.5400390625, -0.5006103515625, -0.461181640625, -0.4217529296875, -0.38232421875, -0.3428955078125, -0.303466796875, -0.2640380859375, -0.224609375, -0.1851806640625, -0.145751953125, -0.1063232421875, -0.06689453125, -0.0274658203125, 0.011962890625, 0.0513916015625, 0.0908203125, 0.1302490234375, 0.169677734375, 0.2091064453125, 0.24853515625, 0.2879638671875, 0.327392578125, 0.3668212890625, 0.40625, 0.4456787109375, 0.485107421875, 0.5245361328125, 0.56396484375, 0.6033935546875, 0.642822265625, 0.6822509765625, 0.7216796875, 0.7611083984375, 0.800537109375, 0.8399658203125, 0.87939453125, 0.9188232421875, 0.958251953125, 0.9976806640625, 1.037109375, 1.0765380859375, 1.115966796875, 1.1553955078125, 1.19482421875, 1.2342529296875, 1.273681640625, 1.3131103515625, 1.3525390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 7.0, 7.0, 10.0, 18.0, 31.0, 39.0, 53.0, 75.0, 128.0, 168.0, 254.0, 376.0, 477.0, 709.0, 942.0, 1355.0, 1914.0, 2872.0, 3976.0, 5884.0, 8510.0, 12806.0, 19617.0, 30322.0, 47661.0, 76893.0, 124962.0, 1164862.0, 268444.0, 119262.0, 72173.0, 45626.0, 28691.0, 18897.0, 12287.0, 8349.0, 5647.0, 3778.0, 2636.0, 1884.0, 1383.0, 866.0, 702.0, 473.0, 345.0, 229.0, 158.0, 118.0, 87.0, 67.0, 34.0, 29.0, 15.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1689453125, -0.16348648071289062, -0.15802764892578125, -0.15256881713867188, -0.1471099853515625, -0.14165115356445312, -0.13619232177734375, -0.13073348999023438, -0.125274658203125, -0.11981582641601562, -0.11435699462890625, -0.10889816284179688, -0.1034393310546875, -0.09798049926757812, -0.09252166748046875, -0.08706283569335938, -0.08160400390625, -0.07614517211914062, -0.07068634033203125, -0.06522750854492188, -0.0597686767578125, -0.054309844970703125, -0.04885101318359375, -0.043392181396484375, -0.037933349609375, -0.032474517822265625, -0.02701568603515625, -0.021556854248046875, -0.0160980224609375, -0.010639190673828125, -0.00518035888671875, 0.000278472900390625, 0.0057373046875, 0.011196136474609375, 0.01665496826171875, 0.022113800048828125, 0.0275726318359375, 0.033031463623046875, 0.03849029541015625, 0.043949127197265625, 0.049407958984375, 0.054866790771484375, 0.06032562255859375, 0.06578445434570312, 0.0712432861328125, 0.07670211791992188, 0.08216094970703125, 0.08761978149414062, 0.09307861328125, 0.09853744506835938, 0.10399627685546875, 0.10945510864257812, 0.1149139404296875, 0.12037277221679688, 0.12583160400390625, 0.13129043579101562, 0.136749267578125, 0.14220809936523438, 0.14766693115234375, 0.15312576293945312, 0.1585845947265625, 0.16404342651367188, 0.16950225830078125, 0.17496109008789062, 0.180419921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 10.0, 5.0, 6.0, 6.0, 10.0, 11.0, 17.0, 15.0, 13.0, 22.0, 29.0, 38.0, 44.0, 53.0, 60.0, 57.0, 75.0, 84.0, 67.0, 61.0, 51.0, 47.0, 38.0, 38.0, 28.0, 24.0, 24.0, 19.0, 10.0, 9.0, 4.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.0009960532188415527, -0.000964045524597168, -0.0009320378303527832, -0.0009000301361083984, -0.0008680224418640137, -0.0008360147476196289, -0.0008040070533752441, -0.0007719993591308594, -0.0007399916648864746, -0.0007079839706420898, -0.0006759762763977051, -0.0006439685821533203, -0.0006119608879089355, -0.0005799531936645508, -0.000547945499420166, -0.0005159378051757812, -0.0004839301109313965, -0.0004519224166870117, -0.00041991472244262695, -0.0003879070281982422, -0.0003558993339538574, -0.00032389163970947266, -0.0002918839454650879, -0.0002598762512207031, -0.00022786855697631836, -0.0001958608627319336, -0.00016385316848754883, -0.00013184547424316406, -9.98377799987793e-05, -6.783008575439453e-05, -3.5822391510009766e-05, -3.814697265625e-06, 2.8192996978759766e-05, 6.020069122314453e-05, 9.22083854675293e-05, 0.00012421607971191406, 0.00015622377395629883, 0.0001882314682006836, 0.00022023916244506836, 0.0002522468566894531, 0.0002842545509338379, 0.00031626224517822266, 0.0003482699394226074, 0.0003802776336669922, 0.00041228532791137695, 0.0004442930221557617, 0.0004763007164001465, 0.0005083084106445312, 0.000540316104888916, 0.0005723237991333008, 0.0006043314933776855, 0.0006363391876220703, 0.0006683468818664551, 0.0007003545761108398, 0.0007323622703552246, 0.0007643699645996094, 0.0007963776588439941, 0.0008283853530883789, 0.0008603930473327637, 0.0008924007415771484, 0.0009244084358215332, 0.000956416130065918, 0.0009884238243103027, 0.0010204315185546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 0.0, 5.0, 2.0, 8.0, 11.0, 12.0, 10.0, 17.0, 27.0, 41.0, 59.0, 95.0, 101.0, 163.0, 261.0, 474.0, 5148.0, 1025686.0, 14909.0, 589.0, 297.0, 208.0, 115.0, 102.0, 57.0, 27.0, 40.0, 23.0, 21.0, 9.0, 9.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0249786376953125, -0.024256467819213867, -0.023534297943115234, -0.0228121280670166, -0.02208995819091797, -0.021367788314819336, -0.020645618438720703, -0.01992344856262207, -0.019201278686523438, -0.018479108810424805, -0.017756938934326172, -0.01703476905822754, -0.016312599182128906, -0.015590429306030273, -0.01486825942993164, -0.014146089553833008, -0.013423919677734375, -0.012701749801635742, -0.01197957992553711, -0.011257410049438477, -0.010535240173339844, -0.009813070297241211, -0.009090900421142578, -0.008368730545043945, -0.0076465606689453125, -0.00692439079284668, -0.006202220916748047, -0.005480051040649414, -0.004757881164550781, -0.0040357112884521484, -0.0033135414123535156, -0.002591371536254883, -0.00186920166015625, -0.0011470317840576172, -0.0004248619079589844, 0.00029730796813964844, 0.0010194778442382812, 0.001741647720336914, 0.002463817596435547, 0.0031859874725341797, 0.0039081573486328125, 0.004630327224731445, 0.005352497100830078, 0.006074666976928711, 0.006796836853027344, 0.0075190067291259766, 0.00824117660522461, 0.008963346481323242, 0.009685516357421875, 0.010407686233520508, 0.01112985610961914, 0.011852025985717773, 0.012574195861816406, 0.013296365737915039, 0.014018535614013672, 0.014740705490112305, 0.015462875366210938, 0.01618504524230957, 0.016907215118408203, 0.017629384994506836, 0.01835155487060547, 0.0190737247467041, 0.019795894622802734, 0.020518064498901367, 0.021240234375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 9.0, 14.0, 24.0, 37.0, 68.0, 109.0, 121.0, 147.0, 134.0, 109.0, 92.0, 58.0, 42.0, 18.0, 15.0, 4.0, 5.0, 5.0, 3.0], "bins": [-0.0011978396214544773, -0.0011752607533708215, -0.0011526820017024875, -0.0011301031336188316, -0.0011075242655351758, -0.0010849455138668418, -0.001062366645783186, -0.0010397877776995301, -0.0010172090260311961, -0.0009946301579475403, -0.0009720513480715454, -0.0009494725381955504, -0.0009268937283195555, -0.0009043149184435606, -0.0008817360503599048, -0.0008591572404839098, -0.000836578372400254, -0.0008139995625242591, -0.0007914206944406033, -0.0007688418845646083, -0.0007462630746886134, -0.0007236842066049576, -0.0007011053967289627, -0.0006785265868529677, -0.0006559477187693119, -0.000633368908893317, -0.0006107900408096611, -0.0005882112309336662, -0.0005656324210576713, -0.0005430536111816764, -0.0005204747430980206, -0.0004978959332220256, -0.0004753171233460307, -0.00045273828436620533, -0.0004301594744902104, -0.00040758063551038504, -0.0003850018256343901, -0.00036242298665456474, -0.00033984414767473936, -0.00031726533779874444, -0.00029468649881891906, -0.0002721076598390937, -0.00024952884996309876, -0.0002269500109832734, -0.00020437118655536324, -0.0001817923621274531, -0.0001592135231476277, -0.00013663469871971756, -0.00011405587429180741, -9.147704986389726e-05, -6.88982181600295e-05, -4.631938645616174e-05, -2.374056202825159e-05, -1.1617376003414392e-06, 2.1417101379483938e-05, 4.399592580739409e-05, 6.657475023530424e-05, 8.915357466321439e-05, 0.00011173240636708215, 0.0001343112380709499, 0.00015689006249886006, 0.0001794688869267702, 0.0002020477259065956, 0.00022462655033450574, 0.0002472053747624159]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 10.0, 12.0, 12.0, 15.0, 9.0, 20.0, 23.0, 17.0, 16.0, 27.0, 33.0, 20.0, 34.0, 40.0, 47.0, 45.0, 40.0, 33.0, 44.0, 51.0, 43.0, 37.0, 24.0, 48.0, 37.0, 32.0, 27.0, 33.0, 36.0, 20.0, 14.0, 25.0, 18.0, 11.0, 9.0, 7.0, 4.0, 5.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004337430000305176, -0.00041815266013145447, -0.00040256232023239136, -0.00038697198033332825, -0.00037138164043426514, -0.000355791300535202, -0.0003402009606361389, -0.0003246106207370758, -0.0003090202808380127, -0.0002934299409389496, -0.0002778396010398865, -0.00026224926114082336, -0.00024665892124176025, -0.00023106858134269714, -0.00021547824144363403, -0.00019988790154457092, -0.0001842975616455078, -0.0001687072217464447, -0.0001531168818473816, -0.00013752654194831848, -0.00012193620204925537, -0.00010634586215019226, -9.075552225112915e-05, -7.516518235206604e-05, -5.957484245300293e-05, -4.398450255393982e-05, -2.839416265487671e-05, -1.2803822755813599e-05, 2.7865171432495117e-06, 1.8376857042312622e-05, 3.396719694137573e-05, 4.955753684043884e-05, 6.514787673950195e-05, 8.073821663856506e-05, 9.632855653762817e-05, 0.00011191889643669128, 0.0001275092363357544, 0.0001430995762348175, 0.00015868991613388062, 0.00017428025603294373, 0.00018987059593200684, 0.00020546093583106995, 0.00022105127573013306, 0.00023664161562919617, 0.0002522319555282593, 0.0002678222954273224, 0.0002834126353263855, 0.0002990029752254486, 0.0003145933151245117, 0.00033018365502357483, 0.00034577399492263794, 0.00036136433482170105, 0.00037695467472076416, 0.00039254501461982727, 0.0004081353545188904, 0.0004237256944179535, 0.0004393160343170166, 0.0004549063742160797, 0.0004704967141151428, 0.00048608705401420593, 0.000501677393913269, 0.0005172677338123322, 0.0005328580737113953, 0.0005484484136104584, 0.0005640387535095215]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 6.0, 13.0, 13.0, 16.0, 18.0, 16.0, 27.0, 20.0, 24.0, 26.0, 28.0, 28.0, 30.0, 32.0, 33.0, 39.0, 38.0, 45.0, 39.0, 45.0, 42.0, 34.0, 37.0, 30.0, 38.0, 28.0, 25.0, 25.0, 34.0, 20.0, 23.0, 17.0, 17.0, 18.0, 14.0, 9.0, 5.0, 9.0, 12.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662109375, -1.60418701171875, -1.5462646484375, -1.48834228515625, -1.430419921875, -1.37249755859375, -1.3145751953125, -1.25665283203125, -1.19873046875, -1.14080810546875, -1.0828857421875, -1.02496337890625, -0.967041015625, -0.90911865234375, -0.8511962890625, -0.79327392578125, -0.7353515625, -0.67742919921875, -0.6195068359375, -0.56158447265625, -0.503662109375, -0.44573974609375, -0.3878173828125, -0.32989501953125, -0.27197265625, -0.21405029296875, -0.1561279296875, -0.09820556640625, -0.040283203125, 0.01763916015625, 0.0755615234375, 0.13348388671875, 0.19140625, 0.24932861328125, 0.3072509765625, 0.36517333984375, 0.423095703125, 0.48101806640625, 0.5389404296875, 0.59686279296875, 0.65478515625, 0.71270751953125, 0.7706298828125, 0.82855224609375, 0.886474609375, 0.94439697265625, 1.0023193359375, 1.06024169921875, 1.1181640625, 1.17608642578125, 1.2340087890625, 1.29193115234375, 1.349853515625, 1.40777587890625, 1.4656982421875, 1.52362060546875, 1.58154296875, 1.63946533203125, 1.6973876953125, 1.75531005859375, 1.813232421875, 1.87115478515625, 1.9290771484375, 1.98699951171875, 2.044921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 6.0, 6.0, 10.0, 19.0, 25.0, 25.0, 52.0, 49.0, 73.0, 94.0, 125.0, 206.0, 308.0, 502.0, 751.0, 1335.0, 2354.0, 4568.0, 8633.0, 17679.0, 39992.0, 109701.0, 348455.0, 333939.0, 104718.0, 39183.0, 17101.0, 8295.0, 4372.0, 2352.0, 1317.0, 821.0, 450.0, 302.0, 212.0, 155.0, 106.0, 78.0, 54.0, 25.0, 33.0, 34.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.48046875, -2.407470703125, -2.33447265625, -2.261474609375, -2.1884765625, -2.115478515625, -2.04248046875, -1.969482421875, -1.896484375, -1.823486328125, -1.75048828125, -1.677490234375, -1.6044921875, -1.531494140625, -1.45849609375, -1.385498046875, -1.3125, -1.239501953125, -1.16650390625, -1.093505859375, -1.0205078125, -0.947509765625, -0.87451171875, -0.801513671875, -0.728515625, -0.655517578125, -0.58251953125, -0.509521484375, -0.4365234375, -0.363525390625, -0.29052734375, -0.217529296875, -0.14453125, -0.071533203125, 0.00146484375, 0.074462890625, 0.1474609375, 0.220458984375, 0.29345703125, 0.366455078125, 0.439453125, 0.512451171875, 0.58544921875, 0.658447265625, 0.7314453125, 0.804443359375, 0.87744140625, 0.950439453125, 1.0234375, 1.096435546875, 1.16943359375, 1.242431640625, 1.3154296875, 1.388427734375, 1.46142578125, 1.534423828125, 1.607421875, 1.680419921875, 1.75341796875, 1.826416015625, 1.8994140625, 1.972412109375, 2.04541015625, 2.118408203125, 2.19140625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 9.0, 2.0, 6.0, 11.0, 9.0, 11.0, 19.0, 31.0, 24.0, 29.0, 45.0, 39.0, 46.0, 63.0, 66.0, 124.0, 401.0, 1506.0, 144.0, 75.0, 64.0, 39.0, 47.0, 48.0, 41.0, 27.0, 23.0, 15.0, 23.0, 13.0, 11.0, 8.0, 11.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.42816162109375, -7.1727294921875, -6.91729736328125, -6.661865234375, -6.40643310546875, -6.1510009765625, -5.89556884765625, -5.64013671875, -5.38470458984375, -5.1292724609375, -4.87384033203125, -4.618408203125, -4.36297607421875, -4.1075439453125, -3.85211181640625, -3.5966796875, -3.34124755859375, -3.0858154296875, -2.83038330078125, -2.574951171875, -2.31951904296875, -2.0640869140625, -1.80865478515625, -1.55322265625, -1.29779052734375, -1.0423583984375, -0.78692626953125, -0.531494140625, -0.27606201171875, -0.0206298828125, 0.23480224609375, 0.490234375, 0.74566650390625, 1.0010986328125, 1.25653076171875, 1.511962890625, 1.76739501953125, 2.0228271484375, 2.27825927734375, 2.53369140625, 2.78912353515625, 3.0445556640625, 3.29998779296875, 3.555419921875, 3.81085205078125, 4.0662841796875, 4.32171630859375, 4.5771484375, 4.83258056640625, 5.0880126953125, 5.34344482421875, 5.598876953125, 5.85430908203125, 6.1097412109375, 6.36517333984375, 6.62060546875, 6.87603759765625, 7.1314697265625, 7.38690185546875, 7.642333984375, 7.89776611328125, 8.1531982421875, 8.40863037109375, 8.6640625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 3.0, 8.0, 8.0, 4.0, 12.0, 8.0, 18.0, 22.0, 34.0, 32.0, 46.0, 58.0, 94.0, 133.0, 176.0, 378.0, 1135.0, 9408.0, 472220.0, 2637223.0, 21649.0, 1865.0, 492.0, 229.0, 130.0, 79.0, 50.0, 50.0, 30.0, 25.0, 14.0, 15.0, 11.0, 16.0, 2.0, 12.0, 4.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.5018310546875, -13.081787109375, -12.6617431640625, -12.24169921875, -11.8216552734375, -11.401611328125, -10.9815673828125, -10.5615234375, -10.1414794921875, -9.721435546875, -9.3013916015625, -8.88134765625, -8.4613037109375, -8.041259765625, -7.6212158203125, -7.201171875, -6.7811279296875, -6.361083984375, -5.9410400390625, -5.52099609375, -5.1009521484375, -4.680908203125, -4.2608642578125, -3.8408203125, -3.4207763671875, -3.000732421875, -2.5806884765625, -2.16064453125, -1.7406005859375, -1.320556640625, -0.9005126953125, -0.48046875, -0.0604248046875, 0.359619140625, 0.7796630859375, 1.19970703125, 1.6197509765625, 2.039794921875, 2.4598388671875, 2.8798828125, 3.2999267578125, 3.719970703125, 4.1400146484375, 4.56005859375, 4.9801025390625, 5.400146484375, 5.8201904296875, 6.240234375, 6.6602783203125, 7.080322265625, 7.5003662109375, 7.92041015625, 8.3404541015625, 8.760498046875, 9.1805419921875, 9.6005859375, 10.0206298828125, 10.440673828125, 10.8607177734375, 11.28076171875, 11.7008056640625, 12.120849609375, 12.5408935546875, 12.9609375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 12.0, 19.0, 31.0, 61.0, 89.0, 139.0, 154.0, 141.0, 144.0, 105.0, 52.0, 33.0, 12.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.281735420227051, -5.884679794311523, -5.487624645233154, -5.090569496154785, -4.693513870239258, -4.2964582443237305, -3.8994030952453613, -3.502347707748413, -3.105292320251465, -2.7082369327545166, -2.3111815452575684, -1.9141261577606201, -1.5170707702636719, -1.1200153827667236, -0.7229599952697754, -0.32590460777282715, 0.0711507797241211, 0.46820616722106934, 0.8652615547180176, 1.2623169422149658, 1.659372329711914, 2.0564277172088623, 2.4534831047058105, 2.850538492202759, 3.247593879699707, 3.6446492671966553, 4.0417046546936035, 4.438759803771973, 4.8358154296875, 5.232871055603027, 5.6299262046813965, 6.026981353759766, 6.424036026000977, 6.821091651916504, 7.218146800994873, 7.615201950073242, 8.01225757598877, 8.409313201904297, 8.806367874145508, 9.203423500061035, 9.600479125976562, 9.99753475189209, 10.394590377807617, 10.791645050048828, 11.188700675964355, 11.585756301879883, 11.982810974121094, 12.379866600036621, 12.776922225952148, 13.173977851867676, 13.571033477783203, 13.968088150024414, 14.365143775939941, 14.762199401855469, 15.15925407409668, 15.556309700012207, 15.953365325927734, 16.350419998168945, 16.74747657775879, 17.14453125, 17.541587829589844, 17.938642501831055, 18.335697174072266, 18.73275375366211, 19.12980842590332]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 7.0, 7.0, 6.0, 10.0, 9.0, 11.0, 18.0, 19.0, 13.0, 23.0, 20.0, 27.0, 31.0, 18.0, 33.0, 39.0, 44.0, 32.0, 44.0, 48.0, 47.0, 40.0, 43.0, 24.0, 37.0, 30.0, 42.0, 27.0, 31.0, 22.0, 34.0, 19.0, 18.0, 22.0, 20.0, 15.0, 10.0, 13.0, 16.0, 4.0, 6.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.8933048248291, -21.236045837402344, -20.578786849975586, -19.921527862548828, -19.26426887512207, -18.607009887695312, -17.949750900268555, -17.292491912841797, -16.63523292541504, -15.977973937988281, -15.320714950561523, -14.663455963134766, -14.006196975708008, -13.34893798828125, -12.691679000854492, -12.034420013427734, -11.377161026000977, -10.719902038574219, -10.062643051147461, -9.405384063720703, -8.748125076293945, -8.090866088867188, -7.43360710144043, -6.776348114013672, -6.119089126586914, -5.461830139160156, -4.804571151733398, -4.147312164306641, -3.490053176879883, -2.832794189453125, -2.175535202026367, -1.5182762145996094, -0.8610153198242188, -0.20375633239746094, 0.4535026550292969, 1.1107616424560547, 1.7680206298828125, 2.4252796173095703, 3.082538604736328, 3.739797592163086, 4.397056579589844, 5.054315567016602, 5.711574554443359, 6.368833541870117, 7.026092529296875, 7.683351516723633, 8.34061050415039, 8.997869491577148, 9.655128479003906, 10.312387466430664, 10.969646453857422, 11.62690544128418, 12.284164428710938, 12.941423416137695, 13.598682403564453, 14.255941390991211, 14.913200378417969, 15.570459365844727, 16.227718353271484, 16.884977340698242, 17.542236328125, 18.199495315551758, 18.856754302978516, 19.514013290405273, 20.17127227783203]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 12.0, 12.0, 10.0, 19.0, 19.0, 16.0, 24.0, 21.0, 29.0, 23.0, 15.0, 27.0, 33.0, 45.0, 32.0, 39.0, 39.0, 44.0, 41.0, 42.0, 36.0, 39.0, 39.0, 42.0, 26.0, 30.0, 20.0, 30.0, 22.0, 20.0, 26.0, 21.0, 18.0, 15.0, 6.0, 12.0, 11.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7501678466796875, -1.688812255859375, -1.6274566650390625, -1.56610107421875, -1.5047454833984375, -1.443389892578125, -1.3820343017578125, -1.3206787109375, -1.2593231201171875, -1.197967529296875, -1.1366119384765625, -1.07525634765625, -1.0139007568359375, -0.952545166015625, -0.8911895751953125, -0.829833984375, -0.7684783935546875, -0.707122802734375, -0.6457672119140625, -0.58441162109375, -0.5230560302734375, -0.461700439453125, -0.4003448486328125, -0.3389892578125, -0.2776336669921875, -0.216278076171875, -0.1549224853515625, -0.09356689453125, -0.0322113037109375, 0.029144287109375, 0.0904998779296875, 0.15185546875, 0.2132110595703125, 0.274566650390625, 0.3359222412109375, 0.39727783203125, 0.4586334228515625, 0.519989013671875, 0.5813446044921875, 0.6427001953125, 0.7040557861328125, 0.765411376953125, 0.8267669677734375, 0.88812255859375, 0.9494781494140625, 1.010833740234375, 1.0721893310546875, 1.133544921875, 1.1949005126953125, 1.256256103515625, 1.3176116943359375, 1.37896728515625, 1.4403228759765625, 1.501678466796875, 1.5630340576171875, 1.6243896484375, 1.6857452392578125, 1.747100830078125, 1.8084564208984375, 1.86981201171875, 1.9311676025390625, 1.992523193359375, 2.0538787841796875, 2.115234375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 1.0, 5.0, 8.0, 11.0, 10.0, 14.0, 18.0, 24.0, 14.0, 32.0, 21.0, 29.0, 32.0, 42.0, 85.0, 159.0, 459.0, 1918.0, 16251.0, 440741.0, 3485301.0, 235924.0, 10850.0, 1477.0, 366.0, 137.0, 68.0, 52.0, 31.0, 35.0, 17.0, 24.0, 14.0, 26.0, 16.0, 9.0, 14.0, 8.0, 5.0, 8.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.439697265625, -9.12939453125, -8.819091796875, -8.5087890625, -8.198486328125, -7.88818359375, -7.577880859375, -7.267578125, -6.957275390625, -6.64697265625, -6.336669921875, -6.0263671875, -5.716064453125, -5.40576171875, -5.095458984375, -4.78515625, -4.474853515625, -4.16455078125, -3.854248046875, -3.5439453125, -3.233642578125, -2.92333984375, -2.613037109375, -2.302734375, -1.992431640625, -1.68212890625, -1.371826171875, -1.0615234375, -0.751220703125, -0.44091796875, -0.130615234375, 0.1796875, 0.489990234375, 0.80029296875, 1.110595703125, 1.4208984375, 1.731201171875, 2.04150390625, 2.351806640625, 2.662109375, 2.972412109375, 3.28271484375, 3.593017578125, 3.9033203125, 4.213623046875, 4.52392578125, 4.834228515625, 5.14453125, 5.454833984375, 5.76513671875, 6.075439453125, 6.3857421875, 6.696044921875, 7.00634765625, 7.316650390625, 7.626953125, 7.937255859375, 8.24755859375, 8.557861328125, 8.8681640625, 9.178466796875, 9.48876953125, 9.799072265625, 10.109375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 14.0, 11.0, 24.0, 28.0, 43.0, 47.0, 50.0, 68.0, 107.0, 109.0, 165.0, 225.0, 260.0, 353.0, 395.0, 381.0, 400.0, 308.0, 256.0, 218.0, 137.0, 114.0, 90.0, 60.0, 43.0, 29.0, 24.0, 31.0, 11.0, 11.0, 10.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.19921875, -5.02740478515625, -4.8555908203125, -4.68377685546875, -4.511962890625, -4.34014892578125, -4.1683349609375, -3.99652099609375, -3.82470703125, -3.65289306640625, -3.4810791015625, -3.30926513671875, -3.137451171875, -2.96563720703125, -2.7938232421875, -2.62200927734375, -2.4501953125, -2.27838134765625, -2.1065673828125, -1.93475341796875, -1.762939453125, -1.59112548828125, -1.4193115234375, -1.24749755859375, -1.07568359375, -0.90386962890625, -0.7320556640625, -0.56024169921875, -0.388427734375, -0.21661376953125, -0.0447998046875, 0.12701416015625, 0.298828125, 0.47064208984375, 0.6424560546875, 0.81427001953125, 0.986083984375, 1.15789794921875, 1.3297119140625, 1.50152587890625, 1.67333984375, 1.84515380859375, 2.0169677734375, 2.18878173828125, 2.360595703125, 2.53240966796875, 2.7042236328125, 2.87603759765625, 3.0478515625, 3.21966552734375, 3.3914794921875, 3.56329345703125, 3.735107421875, 3.90692138671875, 4.0787353515625, 4.25054931640625, 4.42236328125, 4.59417724609375, 4.7659912109375, 4.93780517578125, 5.109619140625, 5.28143310546875, 5.4532470703125, 5.62506103515625, 5.796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 10.0, 13.0, 18.0, 19.0, 46.0, 55.0, 79.0, 125.0, 208.0, 433.0, 1439.0, 11006.0, 442533.0, 3623693.0, 108042.0, 4805.0, 861.0, 335.0, 185.0, 129.0, 89.0, 45.0, 32.0, 27.0, 18.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7578125, -15.1358642578125, -14.513916015625, -13.8919677734375, -13.27001953125, -12.6480712890625, -12.026123046875, -11.4041748046875, -10.7822265625, -10.1602783203125, -9.538330078125, -8.9163818359375, -8.29443359375, -7.6724853515625, -7.050537109375, -6.4285888671875, -5.806640625, -5.1846923828125, -4.562744140625, -3.9407958984375, -3.31884765625, -2.6968994140625, -2.074951171875, -1.4530029296875, -0.8310546875, -0.2091064453125, 0.412841796875, 1.0347900390625, 1.65673828125, 2.2786865234375, 2.900634765625, 3.5225830078125, 4.14453125, 4.7664794921875, 5.388427734375, 6.0103759765625, 6.63232421875, 7.2542724609375, 7.876220703125, 8.4981689453125, 9.1201171875, 9.7420654296875, 10.364013671875, 10.9859619140625, 11.60791015625, 12.2298583984375, 12.851806640625, 13.4737548828125, 14.095703125, 14.7176513671875, 15.339599609375, 15.9615478515625, 16.58349609375, 17.2054443359375, 17.827392578125, 18.4493408203125, 19.0712890625, 19.6932373046875, 20.315185546875, 20.9371337890625, 21.55908203125, 22.1810302734375, 22.802978515625, 23.4249267578125, 24.046875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 18.0, 49.0, 114.0, 207.0, 263.0, 196.0, 112.0, 42.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.81116485595703, -95.94668579101562, -94.08219909667969, -92.21772003173828, -90.35323333740234, -88.48875427246094, -86.624267578125, -84.7597885131836, -82.89530181884766, -81.03082275390625, -79.16633605957031, -77.3018569946289, -75.43737030029297, -73.57289123535156, -71.70840454101562, -69.84392547607422, -67.97943878173828, -66.11495971679688, -64.25047302246094, -62.385990142822266, -60.521507263183594, -58.65702438354492, -56.79254150390625, -54.92805862426758, -53.06357955932617, -51.1990966796875, -49.33461380004883, -47.470130920410156, -45.605648040771484, -43.74116516113281, -41.87668228149414, -40.01219940185547, -38.1477165222168, -36.283233642578125, -34.41875076293945, -32.55426788330078, -30.68978500366211, -28.825302124023438, -26.960819244384766, -25.096336364746094, -23.231853485107422, -21.36737060546875, -19.502887725830078, -17.638404846191406, -15.773921966552734, -13.909440040588379, -12.044957160949707, -10.180474281311035, -8.31599235534668, -6.451509475708008, -4.587026596069336, -2.7225441932678223, -0.8580613136291504, 1.0064210891723633, 2.870903968811035, 4.735386848449707, 6.599869728088379, 8.46435260772705, 10.328835487365723, 12.193317413330078, 14.05780029296875, 15.922283172607422, 17.786766052246094, 19.651248931884766, 21.515731811523438]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 4.0, 10.0, 7.0, 13.0, 13.0, 23.0, 21.0, 27.0, 19.0, 18.0, 29.0, 27.0, 37.0, 28.0, 36.0, 37.0, 37.0, 39.0, 35.0, 53.0, 36.0, 53.0, 35.0, 39.0, 32.0, 35.0, 40.0, 27.0, 30.0, 17.0, 21.0, 23.0, 17.0, 13.0, 11.0, 10.0, 8.0, 6.0, 5.0, 5.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.533710479736328, -16.919811248779297, -16.305910110473633, -15.692010879516602, -15.07811164855957, -14.464211463928223, -13.850311279296875, -13.236412048339844, -12.622512817382812, -12.008612632751465, -11.394713401794434, -10.780813217163086, -10.166913986206055, -9.553013801574707, -8.93911361694336, -8.325214385986328, -7.7113142013549805, -7.097414493560791, -6.483514785766602, -5.869614601135254, -5.255715370178223, -4.641815185546875, -4.0279154777526855, -3.414015769958496, -2.8001160621643066, -2.186216354370117, -1.5723165273666382, -0.9584167003631592, -0.3445169925689697, 0.2693827152252197, 0.8832826614379883, 1.4971823692321777, 2.111082077026367, 2.7249817848205566, 3.338881492614746, 3.9527814388275146, 4.566680908203125, 5.180581092834473, 5.794480800628662, 6.408380508422852, 7.022280216217041, 7.6361799240112305, 8.250080108642578, 8.86397933959961, 9.477879524230957, 10.091778755187988, 10.705678939819336, 11.319578170776367, 11.933478355407715, 12.547378540039062, 13.161277770996094, 13.775177955627441, 14.389077186584473, 15.00297737121582, 15.616876602172852, 16.230777740478516, 16.844676971435547, 17.458576202392578, 18.072477340698242, 18.686376571655273, 19.300275802612305, 19.914175033569336, 20.528076171875, 21.14197540283203, 21.755874633789062]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 9.0, 12.0, 7.0, 21.0, 21.0, 21.0, 22.0, 19.0, 33.0, 31.0, 38.0, 27.0, 30.0, 39.0, 38.0, 42.0, 35.0, 34.0, 41.0, 45.0, 34.0, 28.0, 25.0, 35.0, 39.0, 23.0, 24.0, 26.0, 19.0, 29.0, 17.0, 16.0, 15.0, 16.0, 9.0, 7.0, 11.0, 12.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8544921875, -1.7937164306640625, -1.732940673828125, -1.6721649169921875, -1.61138916015625, -1.5506134033203125, -1.489837646484375, -1.4290618896484375, -1.3682861328125, -1.3075103759765625, -1.246734619140625, -1.1859588623046875, -1.12518310546875, -1.0644073486328125, -1.003631591796875, -0.9428558349609375, -0.882080078125, -0.8213043212890625, -0.760528564453125, -0.6997528076171875, -0.63897705078125, -0.5782012939453125, -0.517425537109375, -0.4566497802734375, -0.3958740234375, -0.3350982666015625, -0.274322509765625, -0.2135467529296875, -0.15277099609375, -0.0919952392578125, -0.031219482421875, 0.0295562744140625, 0.09033203125, 0.1511077880859375, 0.211883544921875, 0.2726593017578125, 0.33343505859375, 0.3942108154296875, 0.454986572265625, 0.5157623291015625, 0.5765380859375, 0.6373138427734375, 0.698089599609375, 0.7588653564453125, 0.81964111328125, 0.8804168701171875, 0.941192626953125, 1.0019683837890625, 1.062744140625, 1.1235198974609375, 1.184295654296875, 1.2450714111328125, 1.30584716796875, 1.3666229248046875, 1.427398681640625, 1.4881744384765625, 1.5489501953125, 1.6097259521484375, 1.670501708984375, 1.7312774658203125, 1.79205322265625, 1.8528289794921875, 1.913604736328125, 1.9743804931640625, 2.03515625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 13.0, 27.0, 29.0, 38.0, 37.0, 63.0, 122.0, 192.0, 298.0, 419.0, 654.0, 1090.0, 1666.0, 2612.0, 4203.0, 6779.0, 11298.0, 19184.0, 32822.0, 56214.0, 96418.0, 166500.0, 247628.0, 166340.0, 95761.0, 56247.0, 33175.0, 18977.0, 11334.0, 7010.0, 4235.0, 2573.0, 1609.0, 1078.0, 672.0, 417.0, 274.0, 212.0, 103.0, 74.0, 45.0, 47.0, 28.0, 13.0, 10.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.22900390625, -0.22124099731445312, -0.21347808837890625, -0.20571517944335938, -0.1979522705078125, -0.19018936157226562, -0.18242645263671875, -0.17466354370117188, -0.166900634765625, -0.15913772583007812, -0.15137481689453125, -0.14361190795898438, -0.1358489990234375, -0.12808609008789062, -0.12032318115234375, -0.11256027221679688, -0.10479736328125, -0.09703445434570312, -0.08927154541015625, -0.08150863647460938, -0.0737457275390625, -0.06598281860351562, -0.05821990966796875, -0.050457000732421875, -0.042694091796875, -0.034931182861328125, -0.02716827392578125, -0.019405364990234375, -0.0116424560546875, -0.003879547119140625, 0.00388336181640625, 0.011646270751953125, 0.0194091796875, 0.027172088623046875, 0.03493499755859375, 0.042697906494140625, 0.0504608154296875, 0.058223724365234375, 0.06598663330078125, 0.07374954223632812, 0.081512451171875, 0.08927536010742188, 0.09703826904296875, 0.10480117797851562, 0.1125640869140625, 0.12032699584960938, 0.12808990478515625, 0.13585281372070312, 0.14361572265625, 0.15137863159179688, 0.15914154052734375, 0.16690444946289062, 0.1746673583984375, 0.18243026733398438, 0.19019317626953125, 0.19795608520507812, 0.205718994140625, 0.21348190307617188, 0.22124481201171875, 0.22900772094726562, 0.2367706298828125, 0.24453353881835938, 0.25229644775390625, 0.2600593566894531, 0.267822265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 3.0, 6.0, 9.0, 9.0, 14.0, 14.0, 16.0, 18.0, 10.0, 21.0, 25.0, 27.0, 28.0, 30.0, 33.0, 33.0, 38.0, 36.0, 41.0, 37.0, 47.0, 1069.0, 37.0, 41.0, 33.0, 36.0, 33.0, 28.0, 38.0, 20.0, 21.0, 21.0, 22.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 9.0, 9.0, 11.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2265625, -1.188690185546875, -1.15081787109375, -1.112945556640625, -1.0750732421875, -1.037200927734375, -0.99932861328125, -0.961456298828125, -0.923583984375, -0.885711669921875, -0.84783935546875, -0.809967041015625, -0.7720947265625, -0.734222412109375, -0.69635009765625, -0.658477783203125, -0.62060546875, -0.582733154296875, -0.54486083984375, -0.506988525390625, -0.4691162109375, -0.431243896484375, -0.39337158203125, -0.355499267578125, -0.317626953125, -0.279754638671875, -0.24188232421875, -0.204010009765625, -0.1661376953125, -0.128265380859375, -0.09039306640625, -0.052520751953125, -0.0146484375, 0.023223876953125, 0.06109619140625, 0.098968505859375, 0.1368408203125, 0.174713134765625, 0.21258544921875, 0.250457763671875, 0.288330078125, 0.326202392578125, 0.36407470703125, 0.401947021484375, 0.4398193359375, 0.477691650390625, 0.51556396484375, 0.553436279296875, 0.59130859375, 0.629180908203125, 0.66705322265625, 0.704925537109375, 0.7427978515625, 0.780670166015625, 0.81854248046875, 0.856414794921875, 0.894287109375, 0.932159423828125, 0.97003173828125, 1.007904052734375, 1.0457763671875, 1.083648681640625, 1.12152099609375, 1.159393310546875, 1.197265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 7.0, 19.0, 39.0, 44.0, 66.0, 105.0, 148.0, 234.0, 301.0, 465.0, 634.0, 967.0, 1415.0, 1973.0, 2970.0, 4168.0, 6246.0, 9400.0, 14030.0, 21188.0, 33177.0, 51680.0, 81746.0, 131119.0, 1237934.0, 185793.0, 111765.0, 70391.0, 44180.0, 28403.0, 18530.0, 12058.0, 8241.0, 5506.0, 3863.0, 2505.0, 1845.0, 1324.0, 794.0, 579.0, 414.0, 300.0, 218.0, 120.0, 85.0, 60.0, 31.0, 18.0, 12.0, 8.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.189697265625, -0.18391990661621094, -0.17814254760742188, -0.1723651885986328, -0.16658782958984375, -0.1608104705810547, -0.15503311157226562, -0.14925575256347656, -0.1434783935546875, -0.13770103454589844, -0.13192367553710938, -0.1261463165283203, -0.12036895751953125, -0.11459159851074219, -0.10881423950195312, -0.10303688049316406, -0.097259521484375, -0.09148216247558594, -0.08570480346679688, -0.07992744445800781, -0.07415008544921875, -0.06837272644042969, -0.06259536743164062, -0.05681800842285156, -0.0510406494140625, -0.04526329040527344, -0.039485931396484375, -0.03370857238769531, -0.02793121337890625, -0.022153854370117188, -0.016376495361328125, -0.010599136352539062, -0.00482177734375, 0.0009555816650390625, 0.006732940673828125, 0.012510299682617188, 0.01828765869140625, 0.024065017700195312, 0.029842376708984375, 0.03561973571777344, 0.0413970947265625, 0.04717445373535156, 0.052951812744140625, 0.05872917175292969, 0.06450653076171875, 0.07028388977050781, 0.07606124877929688, 0.08183860778808594, 0.087615966796875, 0.09339332580566406, 0.09917068481445312, 0.10494804382324219, 0.11072540283203125, 0.11650276184082031, 0.12228012084960938, 0.12805747985839844, 0.1338348388671875, 0.13961219787597656, 0.14538955688476562, 0.1511669158935547, 0.15694427490234375, 0.1627216339111328, 0.16849899291992188, 0.17427635192871094, 0.1800537109375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 6.0, 11.0, 14.0, 17.0, 14.0, 37.0, 57.0, 92.0, 132.0, 173.0, 155.0, 102.0, 49.0, 30.0, 23.0, 20.0, 17.0, 5.0, 7.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024738311767578125, -0.0024022161960601807, -0.002330601215362549, -0.002258986234664917, -0.002187371253967285, -0.0021157562732696533, -0.0020441412925720215, -0.0019725263118743896, -0.0019009113311767578, -0.001829296350479126, -0.0017576813697814941, -0.0016860663890838623, -0.0016144514083862305, -0.0015428364276885986, -0.0014712214469909668, -0.001399606466293335, -0.0013279914855957031, -0.0012563765048980713, -0.0011847615242004395, -0.0011131465435028076, -0.0010415315628051758, -0.0009699165821075439, -0.0008983016014099121, -0.0008266866207122803, -0.0007550716400146484, -0.0006834566593170166, -0.0006118416786193848, -0.0005402266979217529, -0.0004686117172241211, -0.00039699673652648926, -0.0003253817558288574, -0.0002537667751312256, -0.00018215179443359375, -0.00011053681373596191, -3.892183303833008e-05, 3.269314765930176e-05, 0.0001043081283569336, 0.00017592310905456543, 0.00024753808975219727, 0.0003191530704498291, 0.00039076805114746094, 0.0004623830318450928, 0.0005339980125427246, 0.0006056129932403564, 0.0006772279739379883, 0.0007488429546356201, 0.000820457935333252, 0.0008920729160308838, 0.0009636878967285156, 0.0010353028774261475, 0.0011069178581237793, 0.0011785328388214111, 0.001250147819519043, 0.0013217628002166748, 0.0013933777809143066, 0.0014649927616119385, 0.0015366077423095703, 0.0016082227230072021, 0.001679837703704834, 0.0017514526844024658, 0.0018230676651000977, 0.0018946826457977295, 0.0019662976264953613, 0.002037912607192993, 0.002109527587890625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 8.0, 6.0, 7.0, 8.0, 13.0, 16.0, 24.0, 35.0, 48.0, 70.0, 110.0, 198.0, 370.0, 1082.0, 630878.0, 413768.0, 999.0, 387.0, 173.0, 102.0, 62.0, 44.0, 35.0, 21.0, 18.0, 12.0, 13.0, 10.0, 8.0, 7.0, 2.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.03765869140625, -0.03655052185058594, -0.035442352294921875, -0.03433418273925781, -0.03322601318359375, -0.03211784362792969, -0.031009674072265625, -0.029901504516601562, -0.0287933349609375, -0.027685165405273438, -0.026576995849609375, -0.025468826293945312, -0.02436065673828125, -0.023252487182617188, -0.022144317626953125, -0.021036148071289062, -0.019927978515625, -0.018819808959960938, -0.017711639404296875, -0.016603469848632812, -0.01549530029296875, -0.014387130737304688, -0.013278961181640625, -0.012170791625976562, -0.0110626220703125, -0.009954452514648438, -0.008846282958984375, -0.0077381134033203125, -0.00662994384765625, -0.0055217742919921875, -0.004413604736328125, -0.0033054351806640625, -0.002197265625, -0.0010890960693359375, 1.9073486328125e-05, 0.0011272430419921875, 0.00223541259765625, 0.0033435821533203125, 0.004451751708984375, 0.0055599212646484375, 0.0066680908203125, 0.0077762603759765625, 0.008884429931640625, 0.009992599487304688, 0.01110076904296875, 0.012208938598632812, 0.013317108154296875, 0.014425277709960938, 0.015533447265625, 0.016641616821289062, 0.017749786376953125, 0.018857955932617188, 0.01996612548828125, 0.021074295043945312, 0.022182464599609375, 0.023290634155273438, 0.0243988037109375, 0.025506973266601562, 0.026615142822265625, 0.027723312377929688, 0.02883148193359375, 0.029939651489257812, 0.031047821044921875, 0.03215599060058594, 0.03326416015625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 20.0, 77.0, 254.0, 390.0, 195.0, 56.0, 13.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014005162520334125, -0.0013281760038807988, -0.0012558357557281852, -0.0011834955075755715, -0.001111155259422958, -0.0010388150112703443, -0.0009664747631177306, -0.000894134514965117, -0.0008217942668125033, -0.0007494540186598897, -0.0006771137705072761, -0.0006047735223546624, -0.0005324332742020488, -0.00046009302604943514, -0.0003877527778968215, -0.00031541252974420786, -0.00024307228159159422, -0.00017073203343898058, -9.839178528636694e-05, -2.60515371337533e-05, 4.628871101886034e-05, 0.00011862895917147398, 0.00019096920732408762, 0.00026330945547670126, 0.0003356497036293149, 0.00040798995178192854, 0.0004803301999345422, 0.0005526704480871558, 0.0006250106962397695, 0.0006973509443923831, 0.0007696911925449967, 0.0008420314406976104, 0.0009143715724349022, 0.0009867118205875158, 0.0010590520687401295, 0.0011313923168927431, 0.0012037325650453568, 0.0012760728131979704, 0.001348413061350584, 0.0014207533095031977, 0.0014930935576558113, 0.001565433805808425, 0.0016377740539610386, 0.0017101143021136522, 0.0017824545502662659, 0.0018547947984188795, 0.0019271350465714931, 0.001999475294724107, 0.0020718155428767204, 0.002144155791029334, 0.0022164960391819477, 0.0022888362873345613, 0.002361176535487175, 0.0024335167836397886, 0.0025058570317924023, 0.002578197279945016, 0.0026505375280976295, 0.002722877776250243, 0.002795218024402857, 0.0028675582725554705, 0.002939898520708084, 0.0030122387688606977, 0.0030845790170133114, 0.003156919265165925, 0.0032292595133185387]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 9.0, 19.0, 12.0, 11.0, 20.0, 16.0, 15.0, 34.0, 38.0, 35.0, 31.0, 33.0, 48.0, 31.0, 32.0, 40.0, 34.0, 51.0, 34.0, 37.0, 47.0, 32.0, 26.0, 40.0, 29.0, 32.0, 20.0, 27.0, 26.0, 28.0, 19.0, 17.0, 16.0, 10.0, 6.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0006836652755737305, -0.0006627347320318222, -0.0006418041884899139, -0.0006208736449480057, -0.0005999431014060974, -0.0005790125578641891, -0.0005580820143222809, -0.0005371514707803726, -0.0005162209272384644, -0.0004952903836965561, -0.00047435984015464783, -0.00045342929661273956, -0.0004324987530708313, -0.00041156820952892303, -0.00039063766598701477, -0.0003697071224451065, -0.00034877657890319824, -0.00032784603536129, -0.0003069154918193817, -0.00028598494827747345, -0.0002650544047355652, -0.00024412386119365692, -0.00022319331765174866, -0.0002022627741098404, -0.00018133223056793213, -0.00016040168702602386, -0.0001394711434841156, -0.00011854059994220734, -9.761005640029907e-05, -7.667951285839081e-05, -5.5748969316482544e-05, -3.481842577457428e-05, -1.3887882232666016e-05, 7.0426613092422485e-06, 2.7973204851150513e-05, 4.890374839305878e-05, 6.983429193496704e-05, 9.07648354768753e-05, 0.00011169537901878357, 0.00013262592256069183, 0.0001535564661026001, 0.00017448700964450836, 0.00019541755318641663, 0.0002163480967283249, 0.00023727864027023315, 0.0002582091838121414, 0.0002791397273540497, 0.00030007027089595795, 0.0003210008144378662, 0.0003419313579797745, 0.00036286190152168274, 0.000383792445063591, 0.00040472298860549927, 0.00042565353214740753, 0.0004465840756893158, 0.00046751461923122406, 0.0004884451627731323, 0.0005093757063150406, 0.0005303062498569489, 0.0005512367933988571, 0.0005721673369407654, 0.0005930978804826736, 0.0006140284240245819, 0.0006349589675664902, 0.0006558895111083984]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 9.0, 12.0, 7.0, 21.0, 21.0, 21.0, 22.0, 19.0, 33.0, 31.0, 38.0, 27.0, 30.0, 39.0, 38.0, 42.0, 35.0, 34.0, 41.0, 45.0, 34.0, 28.0, 25.0, 35.0, 40.0, 22.0, 24.0, 26.0, 19.0, 29.0, 17.0, 16.0, 15.0, 16.0, 9.0, 7.0, 11.0, 12.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8544921875, -1.7937164306640625, -1.732940673828125, -1.6721649169921875, -1.61138916015625, -1.5506134033203125, -1.489837646484375, -1.4290618896484375, -1.3682861328125, -1.3075103759765625, -1.246734619140625, -1.1859588623046875, -1.12518310546875, -1.0644073486328125, -1.003631591796875, -0.9428558349609375, -0.882080078125, -0.8213043212890625, -0.760528564453125, -0.6997528076171875, -0.63897705078125, -0.5782012939453125, -0.517425537109375, -0.4566497802734375, -0.3958740234375, -0.3350982666015625, -0.274322509765625, -0.2135467529296875, -0.15277099609375, -0.0919952392578125, -0.031219482421875, 0.0295562744140625, 0.09033203125, 0.1511077880859375, 0.211883544921875, 0.2726593017578125, 0.33343505859375, 0.3942108154296875, 0.454986572265625, 0.5157623291015625, 0.5765380859375, 0.6373138427734375, 0.698089599609375, 0.7588653564453125, 0.81964111328125, 0.8804168701171875, 0.941192626953125, 1.0019683837890625, 1.062744140625, 1.1235198974609375, 1.184295654296875, 1.2450714111328125, 1.30584716796875, 1.3666229248046875, 1.427398681640625, 1.4881744384765625, 1.5489501953125, 1.6097259521484375, 1.670501708984375, 1.7312774658203125, 1.79205322265625, 1.8528289794921875, 1.913604736328125, 1.9743804931640625, 2.03515625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 14.0, 13.0, 15.0, 19.0, 25.0, 35.0, 37.0, 59.0, 68.0, 110.0, 142.0, 231.0, 327.0, 570.0, 907.0, 1570.0, 3038.0, 6737.0, 17028.0, 49117.0, 169982.0, 429412.0, 254325.0, 73349.0, 23579.0, 9038.0, 4025.0, 1910.0, 1035.0, 608.0, 331.0, 285.0, 157.0, 117.0, 82.0, 61.0, 38.0, 39.0, 31.0, 23.0, 12.0, 10.0, 13.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.423828125, -2.34478759765625, -2.2657470703125, -2.18670654296875, -2.107666015625, -2.02862548828125, -1.9495849609375, -1.87054443359375, -1.79150390625, -1.71246337890625, -1.6334228515625, -1.55438232421875, -1.475341796875, -1.39630126953125, -1.3172607421875, -1.23822021484375, -1.1591796875, -1.08013916015625, -1.0010986328125, -0.92205810546875, -0.843017578125, -0.76397705078125, -0.6849365234375, -0.60589599609375, -0.52685546875, -0.44781494140625, -0.3687744140625, -0.28973388671875, -0.210693359375, -0.13165283203125, -0.0526123046875, 0.02642822265625, 0.10546875, 0.18450927734375, 0.2635498046875, 0.34259033203125, 0.421630859375, 0.50067138671875, 0.5797119140625, 0.65875244140625, 0.73779296875, 0.81683349609375, 0.8958740234375, 0.97491455078125, 1.053955078125, 1.13299560546875, 1.2120361328125, 1.29107666015625, 1.3701171875, 1.44915771484375, 1.5281982421875, 1.60723876953125, 1.686279296875, 1.76531982421875, 1.8443603515625, 1.92340087890625, 2.00244140625, 2.08148193359375, 2.1605224609375, 2.23956298828125, 2.318603515625, 2.39764404296875, 2.4766845703125, 2.55572509765625, 2.634765625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 4.0, 4.0, 4.0, 8.0, 8.0, 15.0, 15.0, 18.0, 19.0, 15.0, 31.0, 32.0, 36.0, 48.0, 53.0, 49.0, 77.0, 154.0, 1547.0, 348.0, 99.0, 64.0, 49.0, 55.0, 43.0, 40.0, 38.0, 27.0, 28.0, 24.0, 13.0, 16.0, 14.0, 10.0, 7.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.8359375, -8.58233642578125, -8.3287353515625, -8.07513427734375, -7.821533203125, -7.56793212890625, -7.3143310546875, -7.06072998046875, -6.80712890625, -6.55352783203125, -6.2999267578125, -6.04632568359375, -5.792724609375, -5.53912353515625, -5.2855224609375, -5.03192138671875, -4.7783203125, -4.52471923828125, -4.2711181640625, -4.01751708984375, -3.763916015625, -3.51031494140625, -3.2567138671875, -3.00311279296875, -2.74951171875, -2.49591064453125, -2.2423095703125, -1.98870849609375, -1.735107421875, -1.48150634765625, -1.2279052734375, -0.97430419921875, -0.720703125, -0.46710205078125, -0.2135009765625, 0.04010009765625, 0.293701171875, 0.54730224609375, 0.8009033203125, 1.05450439453125, 1.30810546875, 1.56170654296875, 1.8153076171875, 2.06890869140625, 2.322509765625, 2.57611083984375, 2.8297119140625, 3.08331298828125, 3.3369140625, 3.59051513671875, 3.8441162109375, 4.09771728515625, 4.351318359375, 4.60491943359375, 4.8585205078125, 5.11212158203125, 5.36572265625, 5.61932373046875, 5.8729248046875, 6.12652587890625, 6.380126953125, 6.63372802734375, 6.8873291015625, 7.14093017578125, 7.39453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 12.0, 21.0, 20.0, 26.0, 36.0, 34.0, 55.0, 86.0, 105.0, 155.0, 270.0, 706.0, 3012.0, 45205.0, 2991689.0, 97838.0, 4602.0, 887.0, 324.0, 162.0, 112.0, 64.0, 56.0, 26.0, 28.0, 26.0, 23.0, 16.0, 13.0, 13.0, 7.0, 6.0, 9.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7890625, -12.38427734375, -11.9794921875, -11.57470703125, -11.169921875, -10.76513671875, -10.3603515625, -9.95556640625, -9.55078125, -9.14599609375, -8.7412109375, -8.33642578125, -7.931640625, -7.52685546875, -7.1220703125, -6.71728515625, -6.3125, -5.90771484375, -5.5029296875, -5.09814453125, -4.693359375, -4.28857421875, -3.8837890625, -3.47900390625, -3.07421875, -2.66943359375, -2.2646484375, -1.85986328125, -1.455078125, -1.05029296875, -0.6455078125, -0.24072265625, 0.1640625, 0.56884765625, 0.9736328125, 1.37841796875, 1.783203125, 2.18798828125, 2.5927734375, 2.99755859375, 3.40234375, 3.80712890625, 4.2119140625, 4.61669921875, 5.021484375, 5.42626953125, 5.8310546875, 6.23583984375, 6.640625, 7.04541015625, 7.4501953125, 7.85498046875, 8.259765625, 8.66455078125, 9.0693359375, 9.47412109375, 9.87890625, 10.28369140625, 10.6884765625, 11.09326171875, 11.498046875, 11.90283203125, 12.3076171875, 12.71240234375, 13.1171875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [11.0, 981.0, 25.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390697479248047, -3.1935367584228516, 2.0036239624023438, 7.200784683227539, 12.397945404052734, 17.59510612487793, 22.792266845703125, 27.989429473876953, 33.186588287353516, 38.383750915527344, 43.580909729003906, 48.77806854248047, 53.9752311706543, 59.172393798828125, 64.36955261230469, 69.56671142578125, 74.76387023925781, 79.96102905273438, 85.15818786621094, 90.35535430908203, 95.5525131225586, 100.74967193603516, 105.94683837890625, 111.14399719238281, 116.34115600585938, 121.53831481933594, 126.7354736328125, 131.93263244628906, 137.12979125976562, 142.32696533203125, 147.5241241455078, 152.72128295898438, 157.91845703125, 163.11561584472656, 168.31277465820312, 173.5099334716797, 178.70709228515625, 183.90426635742188, 189.10142517089844, 194.298583984375, 199.49574279785156, 204.69290161132812, 209.8900604248047, 215.08721923828125, 220.28439331054688, 225.48155212402344, 230.6787109375, 235.87586975097656, 241.07302856445312, 246.2701873779297, 251.46734619140625, 256.6645202636719, 261.8616638183594, 267.058837890625, 272.2559814453125, 277.4531555175781, 282.65032958984375, 287.8475036621094, 293.0446472167969, 298.2418212890625, 303.43896484375, 308.6361389160156, 313.8332824707031, 319.03045654296875, 324.22760009765625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 9.0, 12.0, 10.0, 12.0, 16.0, 13.0, 16.0, 19.0, 27.0, 26.0, 43.0, 31.0, 30.0, 36.0, 37.0, 46.0, 46.0, 36.0, 53.0, 40.0, 42.0, 45.0, 31.0, 44.0, 49.0, 24.0, 33.0, 26.0, 20.0, 25.0, 17.0, 12.0, 16.0, 13.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.9840030670166, -25.197519302368164, -24.411033630371094, -23.624549865722656, -22.83806610107422, -22.05158233642578, -21.265098571777344, -20.478612899780273, -19.692129135131836, -18.9056453704834, -18.119159698486328, -17.33267593383789, -16.546192169189453, -15.759708404541016, -14.973223686218262, -14.186738967895508, -13.40025520324707, -12.613771438598633, -11.827286720275879, -11.040802001953125, -10.254318237304688, -9.46783447265625, -8.681349754333496, -7.8948655128479, -7.108381271362305, -6.321897029876709, -5.535412788391113, -4.748928546905518, -3.962444305419922, -3.175960063934326, -2.3894758224487305, -1.6029915809631348, -0.8165092468261719, -0.030025005340576172, 0.7564592361450195, 1.5429434776306152, 2.329427719116211, 3.1159119606018066, 3.9023962020874023, 4.688880443572998, 5.475364685058594, 6.2618489265441895, 7.048333168029785, 7.834817409515381, 8.621301651000977, 9.407785415649414, 10.194270133972168, 10.980754852294922, 11.76723861694336, 12.553722381591797, 13.34020709991455, 14.126691818237305, 14.913175582885742, 15.69965934753418, 16.48614501953125, 17.272628784179688, 18.059112548828125, 18.845596313476562, 19.632080078125, 20.41856575012207, 21.205049514770508, 21.991533279418945, 22.778018951416016, 23.564502716064453, 24.35098648071289]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 7.0, 6.0, 5.0, 4.0, 9.0, 6.0, 14.0, 6.0, 15.0, 12.0, 20.0, 27.0, 22.0, 16.0, 36.0, 30.0, 35.0, 33.0, 34.0, 48.0, 40.0, 46.0, 41.0, 44.0, 26.0, 29.0, 51.0, 30.0, 39.0, 21.0, 28.0, 22.0, 18.0, 31.0, 25.0, 23.0, 19.0, 18.0, 11.0, 10.0, 13.0, 14.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.854034423828125, -1.78814697265625, -1.722259521484375, -1.6563720703125, -1.590484619140625, -1.52459716796875, -1.458709716796875, -1.392822265625, -1.326934814453125, -1.26104736328125, -1.195159912109375, -1.1292724609375, -1.063385009765625, -0.99749755859375, -0.931610107421875, -0.86572265625, -0.799835205078125, -0.73394775390625, -0.668060302734375, -0.6021728515625, -0.536285400390625, -0.47039794921875, -0.404510498046875, -0.338623046875, -0.272735595703125, -0.20684814453125, -0.140960693359375, -0.0750732421875, -0.009185791015625, 0.05670166015625, 0.122589111328125, 0.1884765625, 0.254364013671875, 0.32025146484375, 0.386138916015625, 0.4520263671875, 0.517913818359375, 0.58380126953125, 0.649688720703125, 0.715576171875, 0.781463623046875, 0.84735107421875, 0.913238525390625, 0.9791259765625, 1.045013427734375, 1.11090087890625, 1.176788330078125, 1.24267578125, 1.308563232421875, 1.37445068359375, 1.440338134765625, 1.5062255859375, 1.572113037109375, 1.63800048828125, 1.703887939453125, 1.769775390625, 1.835662841796875, 1.90155029296875, 1.967437744140625, 2.0333251953125, 2.099212646484375, 2.16510009765625, 2.230987548828125, 2.296875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 12.0, 14.0, 12.0, 19.0, 24.0, 52.0, 49.0, 86.0, 105.0, 218.0, 345.0, 798.0, 1865.0, 5663.0, 19621.0, 82530.0, 484892.0, 1960910.0, 1335644.0, 237675.0, 45400.0, 11886.0, 3715.0, 1350.0, 555.0, 283.0, 180.0, 95.0, 55.0, 50.0, 41.0, 22.0, 20.0, 14.0, 13.0, 14.0, 5.0, 9.0, 6.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08099365234375, -3.9393310546875, -3.79766845703125, -3.656005859375, -3.51434326171875, -3.3726806640625, -3.23101806640625, -3.08935546875, -2.94769287109375, -2.8060302734375, -2.66436767578125, -2.522705078125, -2.38104248046875, -2.2393798828125, -2.09771728515625, -1.9560546875, -1.81439208984375, -1.6727294921875, -1.53106689453125, -1.389404296875, -1.24774169921875, -1.1060791015625, -0.96441650390625, -0.82275390625, -0.68109130859375, -0.5394287109375, -0.39776611328125, -0.256103515625, -0.11444091796875, 0.0272216796875, 0.16888427734375, 0.310546875, 0.45220947265625, 0.5938720703125, 0.73553466796875, 0.877197265625, 1.01885986328125, 1.1605224609375, 1.30218505859375, 1.44384765625, 1.58551025390625, 1.7271728515625, 1.86883544921875, 2.010498046875, 2.15216064453125, 2.2938232421875, 2.43548583984375, 2.5771484375, 2.71881103515625, 2.8604736328125, 3.00213623046875, 3.143798828125, 3.28546142578125, 3.4271240234375, 3.56878662109375, 3.71044921875, 3.85211181640625, 3.9937744140625, 4.13543701171875, 4.277099609375, 4.41876220703125, 4.5604248046875, 4.70208740234375, 4.84375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 15.0, 13.0, 22.0, 35.0, 42.0, 66.0, 85.0, 108.0, 163.0, 216.0, 266.0, 343.0, 465.0, 459.0, 431.0, 300.0, 266.0, 208.0, 132.0, 116.0, 64.0, 57.0, 53.0, 31.0, 28.0, 18.0, 13.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.39453125, -7.20159912109375, -7.0086669921875, -6.81573486328125, -6.622802734375, -6.42987060546875, -6.2369384765625, -6.04400634765625, -5.85107421875, -5.65814208984375, -5.4652099609375, -5.27227783203125, -5.079345703125, -4.88641357421875, -4.6934814453125, -4.50054931640625, -4.3076171875, -4.11468505859375, -3.9217529296875, -3.72882080078125, -3.535888671875, -3.34295654296875, -3.1500244140625, -2.95709228515625, -2.76416015625, -2.57122802734375, -2.3782958984375, -2.18536376953125, -1.992431640625, -1.79949951171875, -1.6065673828125, -1.41363525390625, -1.220703125, -1.02777099609375, -0.8348388671875, -0.64190673828125, -0.448974609375, -0.25604248046875, -0.0631103515625, 0.12982177734375, 0.32275390625, 0.51568603515625, 0.7086181640625, 0.90155029296875, 1.094482421875, 1.28741455078125, 1.4803466796875, 1.67327880859375, 1.8662109375, 2.05914306640625, 2.2520751953125, 2.44500732421875, 2.637939453125, 2.83087158203125, 3.0238037109375, 3.21673583984375, 3.40966796875, 3.60260009765625, 3.7955322265625, 3.98846435546875, 4.181396484375, 4.37432861328125, 4.5672607421875, 4.76019287109375, 4.953125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 8.0, 10.0, 8.0, 23.0, 15.0, 45.0, 48.0, 83.0, 149.0, 288.0, 712.0, 2809.0, 30517.0, 1463629.0, 2636207.0, 54364.0, 3717.0, 818.0, 385.0, 161.0, 85.0, 63.0, 49.0, 18.0, 19.0, 9.0, 10.0, 11.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4140625, -13.8394775390625, -13.264892578125, -12.6903076171875, -12.11572265625, -11.5411376953125, -10.966552734375, -10.3919677734375, -9.8173828125, -9.2427978515625, -8.668212890625, -8.0936279296875, -7.51904296875, -6.9444580078125, -6.369873046875, -5.7952880859375, -5.220703125, -4.6461181640625, -4.071533203125, -3.4969482421875, -2.92236328125, -2.3477783203125, -1.773193359375, -1.1986083984375, -0.6240234375, -0.0494384765625, 0.525146484375, 1.0997314453125, 1.67431640625, 2.2489013671875, 2.823486328125, 3.3980712890625, 3.97265625, 4.5472412109375, 5.121826171875, 5.6964111328125, 6.27099609375, 6.8455810546875, 7.420166015625, 7.9947509765625, 8.5693359375, 9.1439208984375, 9.718505859375, 10.2930908203125, 10.86767578125, 11.4422607421875, 12.016845703125, 12.5914306640625, 13.166015625, 13.7406005859375, 14.315185546875, 14.8897705078125, 15.46435546875, 16.0389404296875, 16.613525390625, 17.1881103515625, 17.7626953125, 18.3372802734375, 18.911865234375, 19.4864501953125, 20.06103515625, 20.6356201171875, 21.210205078125, 21.7847900390625, 22.359375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 29.0, 110.0, 214.0, 296.0, 219.0, 92.0, 31.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.41461944580078, -89.15377807617188, -86.89293670654297, -84.63209533691406, -82.37126159667969, -80.11042022705078, -77.84957885742188, -75.58873748779297, -73.32789611816406, -71.06705474853516, -68.80621337890625, -66.54537963867188, -64.28453826904297, -62.02369689941406, -59.762855529785156, -57.50201416015625, -55.24117660522461, -52.9803352355957, -50.71949768066406, -48.458656311035156, -46.19781494140625, -43.936973571777344, -41.6761360168457, -39.4152946472168, -37.154457092285156, -34.89361572265625, -32.63277816772461, -30.371936798095703, -28.111095428466797, -25.850255966186523, -23.58941650390625, -21.328575134277344, -19.067733764648438, -16.806894302368164, -14.546052932739258, -12.285213470458984, -10.024373054504395, -7.763532638549805, -5.502693176269531, -3.2418527603149414, -0.9810123443603516, 1.2798278331756592, 3.54066801071167, 5.801507949829102, 8.062348365783691, 10.323188781738281, 12.584028244018555, 14.844868659973145, 17.105709075927734, 19.366548538208008, 21.627389907836914, 23.888229370117188, 26.149070739746094, 28.409910202026367, 30.67074966430664, 32.93159103393555, 35.19242858886719, 37.453269958496094, 39.714107513427734, 41.97494888305664, 44.23579025268555, 46.49662780761719, 48.757469177246094, 51.018310546875, 53.279151916503906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 13.0, 9.0, 11.0, 20.0, 14.0, 16.0, 22.0, 12.0, 22.0, 27.0, 32.0, 25.0, 34.0, 43.0, 40.0, 40.0, 50.0, 30.0, 50.0, 42.0, 40.0, 37.0, 46.0, 33.0, 30.0, 45.0, 29.0, 30.0, 24.0, 21.0, 23.0, 11.0, 14.0, 14.0, 11.0, 7.0, 3.0, 4.0, 11.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-23.927833557128906, -23.265535354614258, -22.603235244750977, -21.940937042236328, -21.278636932373047, -20.6163387298584, -19.95404052734375, -19.29174041748047, -18.62944221496582, -17.967144012451172, -17.30484390258789, -16.642545700073242, -15.980246543884277, -15.317947387695312, -14.655649185180664, -13.9933500289917, -13.331050872802734, -12.66875171661377, -12.006452560424805, -11.344154357910156, -10.681855201721191, -10.019556045532227, -9.357257843017578, -8.694958686828613, -8.032659530639648, -7.370360374450684, -6.708061695098877, -6.04576301574707, -5.3834638595581055, -4.721164703369141, -4.058866024017334, -3.3965673446655273, -2.7342681884765625, -2.0719692707061768, -1.409670352935791, -0.7473714351654053, -0.08507251739501953, 0.5772264003753662, 1.239525318145752, 1.9018239974975586, 2.5641231536865234, 3.226422071456909, 3.888720989227295, 4.551019668579102, 5.213318824768066, 5.875617980957031, 6.537916660308838, 7.2002153396606445, 7.862514495849609, 8.524813652038574, 9.187112808227539, 9.849411010742188, 10.511710166931152, 11.174009323120117, 11.836307525634766, 12.49860668182373, 13.160905838012695, 13.82320499420166, 14.485504150390625, 15.147802352905273, 15.810101509094238, 16.472400665283203, 17.13469886779785, 17.7969970703125, 18.45929718017578]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 7.0, 8.0, 15.0, 12.0, 14.0, 14.0, 21.0, 16.0, 23.0, 18.0, 29.0, 37.0, 34.0, 29.0, 33.0, 41.0, 47.0, 32.0, 39.0, 56.0, 36.0, 34.0, 37.0, 33.0, 32.0, 32.0, 25.0, 31.0, 33.0, 27.0, 17.0, 21.0, 17.0, 13.0, 16.0, 13.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296875, -1.86004638671875, -1.7904052734375, -1.72076416015625, -1.651123046875, -1.58148193359375, -1.5118408203125, -1.44219970703125, -1.37255859375, -1.30291748046875, -1.2332763671875, -1.16363525390625, -1.093994140625, -1.02435302734375, -0.9547119140625, -0.88507080078125, -0.8154296875, -0.74578857421875, -0.6761474609375, -0.60650634765625, -0.536865234375, -0.46722412109375, -0.3975830078125, -0.32794189453125, -0.25830078125, -0.18865966796875, -0.1190185546875, -0.04937744140625, 0.020263671875, 0.08990478515625, 0.1595458984375, 0.22918701171875, 0.298828125, 0.36846923828125, 0.4381103515625, 0.50775146484375, 0.577392578125, 0.64703369140625, 0.7166748046875, 0.78631591796875, 0.85595703125, 0.92559814453125, 0.9952392578125, 1.06488037109375, 1.134521484375, 1.20416259765625, 1.2738037109375, 1.34344482421875, 1.4130859375, 1.48272705078125, 1.5523681640625, 1.62200927734375, 1.691650390625, 1.76129150390625, 1.8309326171875, 1.90057373046875, 1.97021484375, 2.03985595703125, 2.1094970703125, 2.17913818359375, 2.248779296875, 2.31842041015625, 2.3880615234375, 2.45770263671875, 2.52734375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 5.0, 8.0, 8.0, 19.0, 26.0, 31.0, 46.0, 74.0, 92.0, 156.0, 214.0, 290.0, 444.0, 748.0, 1048.0, 1631.0, 2300.0, 3520.0, 5345.0, 8103.0, 12338.0, 18475.0, 27925.0, 41769.0, 64570.0, 99117.0, 150191.0, 192042.0, 144120.0, 93983.0, 60920.0, 40182.0, 26500.0, 17687.0, 11571.0, 7743.0, 5166.0, 3359.0, 2247.0, 1486.0, 1032.0, 639.0, 448.0, 325.0, 199.0, 126.0, 104.0, 56.0, 53.0, 31.0, 12.0, 14.0, 10.0, 2.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.21923828125, -0.2122650146484375, -0.205291748046875, -0.1983184814453125, -0.19134521484375, -0.1843719482421875, -0.177398681640625, -0.1704254150390625, -0.1634521484375, -0.1564788818359375, -0.149505615234375, -0.1425323486328125, -0.13555908203125, -0.1285858154296875, -0.121612548828125, -0.1146392822265625, -0.107666015625, -0.1006927490234375, -0.093719482421875, -0.0867462158203125, -0.07977294921875, -0.0727996826171875, -0.065826416015625, -0.0588531494140625, -0.0518798828125, -0.0449066162109375, -0.037933349609375, -0.0309600830078125, -0.02398681640625, -0.0170135498046875, -0.010040283203125, -0.0030670166015625, 0.00390625, 0.0108795166015625, 0.017852783203125, 0.0248260498046875, 0.03179931640625, 0.0387725830078125, 0.045745849609375, 0.0527191162109375, 0.0596923828125, 0.0666656494140625, 0.073638916015625, 0.0806121826171875, 0.08758544921875, 0.0945587158203125, 0.101531982421875, 0.1085052490234375, 0.115478515625, 0.1224517822265625, 0.129425048828125, 0.1363983154296875, 0.14337158203125, 0.1503448486328125, 0.157318115234375, 0.1642913818359375, 0.1712646484375, 0.1782379150390625, 0.185211181640625, 0.1921844482421875, 0.19915771484375, 0.2061309814453125, 0.213104248046875, 0.2200775146484375, 0.22705078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 10.0, 7.0, 10.0, 8.0, 9.0, 18.0, 22.0, 18.0, 22.0, 24.0, 27.0, 32.0, 22.0, 31.0, 29.0, 29.0, 40.0, 32.0, 36.0, 28.0, 1061.0, 31.0, 30.0, 31.0, 35.0, 38.0, 37.0, 24.0, 25.0, 25.0, 25.0, 27.0, 19.0, 25.0, 15.0, 22.0, 17.0, 9.0, 10.0, 5.0, 8.0, 10.0, 4.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.32421875, -1.2828216552734375, -1.241424560546875, -1.2000274658203125, -1.15863037109375, -1.1172332763671875, -1.075836181640625, -1.0344390869140625, -0.9930419921875, -0.9516448974609375, -0.910247802734375, -0.8688507080078125, -0.82745361328125, -0.7860565185546875, -0.744659423828125, -0.7032623291015625, -0.661865234375, -0.6204681396484375, -0.579071044921875, -0.5376739501953125, -0.49627685546875, -0.4548797607421875, -0.413482666015625, -0.3720855712890625, -0.3306884765625, -0.2892913818359375, -0.247894287109375, -0.2064971923828125, -0.16510009765625, -0.1237030029296875, -0.082305908203125, -0.0409088134765625, 0.00048828125, 0.0418853759765625, 0.083282470703125, 0.1246795654296875, 0.16607666015625, 0.2074737548828125, 0.248870849609375, 0.2902679443359375, 0.3316650390625, 0.3730621337890625, 0.414459228515625, 0.4558563232421875, 0.49725341796875, 0.5386505126953125, 0.580047607421875, 0.6214447021484375, 0.662841796875, 0.7042388916015625, 0.745635986328125, 0.7870330810546875, 0.82843017578125, 0.8698272705078125, 0.911224365234375, 0.9526214599609375, 0.9940185546875, 1.0354156494140625, 1.076812744140625, 1.1182098388671875, 1.15960693359375, 1.2010040283203125, 1.242401123046875, 1.2837982177734375, 1.3251953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 7.0, 17.0, 22.0, 28.0, 50.0, 69.0, 96.0, 150.0, 196.0, 338.0, 450.0, 658.0, 971.0, 1483.0, 2224.0, 3291.0, 4896.0, 7458.0, 11547.0, 18179.0, 28505.0, 45738.0, 74646.0, 122290.0, 408375.0, 1036100.0, 125122.0, 75706.0, 46598.0, 29120.0, 18254.0, 11724.0, 7684.0, 4935.0, 3222.0, 2259.0, 1508.0, 1024.0, 694.0, 490.0, 320.0, 203.0, 147.0, 103.0, 79.0, 50.0, 42.0, 32.0, 12.0, 8.0, 0.0, 4.0, 4.0, 2.0], "bins": [-0.252685546875, -0.2454700469970703, -0.23825454711914062, -0.23103904724121094, -0.22382354736328125, -0.21660804748535156, -0.20939254760742188, -0.2021770477294922, -0.1949615478515625, -0.1877460479736328, -0.18053054809570312, -0.17331504821777344, -0.16609954833984375, -0.15888404846191406, -0.15166854858398438, -0.1444530487060547, -0.137237548828125, -0.1300220489501953, -0.12280654907226562, -0.11559104919433594, -0.10837554931640625, -0.10116004943847656, -0.09394454956054688, -0.08672904968261719, -0.0795135498046875, -0.07229804992675781, -0.06508255004882812, -0.05786705017089844, -0.05065155029296875, -0.04343605041503906, -0.036220550537109375, -0.029005050659179688, -0.02178955078125, -0.014574050903320312, -0.007358551025390625, -0.0001430511474609375, 0.00707244873046875, 0.014287948608398438, 0.021503448486328125, 0.028718948364257812, 0.0359344482421875, 0.04314994812011719, 0.050365447998046875, 0.05758094787597656, 0.06479644775390625, 0.07201194763183594, 0.07922744750976562, 0.08644294738769531, 0.093658447265625, 0.10087394714355469, 0.10808944702148438, 0.11530494689941406, 0.12252044677734375, 0.12973594665527344, 0.13695144653320312, 0.1441669464111328, 0.1513824462890625, 0.1585979461669922, 0.16581344604492188, 0.17302894592285156, 0.18024444580078125, 0.18745994567871094, 0.19467544555664062, 0.2018909454345703, 0.2091064453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 0.0, 8.0, 4.0, 4.0, 4.0, 9.0, 6.0, 13.0, 11.0, 15.0, 22.0, 27.0, 29.0, 57.0, 57.0, 76.0, 100.0, 105.0, 101.0, 85.0, 59.0, 43.0, 32.0, 29.0, 16.0, 14.0, 13.0, 10.0, 10.0, 9.0, 3.0, 2.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016088485717773438, -0.0015596002340316772, -0.0015103518962860107, -0.0014611035585403442, -0.0014118552207946777, -0.0013626068830490112, -0.0013133585453033447, -0.0012641102075576782, -0.0012148618698120117, -0.0011656135320663452, -0.0011163651943206787, -0.0010671168565750122, -0.0010178685188293457, -0.0009686201810836792, -0.0009193718433380127, -0.0008701235055923462, -0.0008208751678466797, -0.0007716268301010132, -0.0007223784923553467, -0.0006731301546096802, -0.0006238818168640137, -0.0005746334791183472, -0.0005253851413726807, -0.00047613680362701416, -0.00042688846588134766, -0.00037764012813568115, -0.00032839179039001465, -0.00027914345264434814, -0.00022989511489868164, -0.00018064677715301514, -0.00013139843940734863, -8.215010166168213e-05, -3.2901763916015625e-05, 1.634657382965088e-05, 6.559491157531738e-05, 0.00011484324932098389, 0.0001640915870666504, 0.0002133399248123169, 0.0002625882625579834, 0.0003118366003036499, 0.0003610849380493164, 0.0004103332757949829, 0.0004595816135406494, 0.0005088299512863159, 0.0005580782890319824, 0.0006073266267776489, 0.0006565749645233154, 0.0007058233022689819, 0.0007550716400146484, 0.0008043199777603149, 0.0008535683155059814, 0.000902816653251648, 0.0009520649909973145, 0.001001313328742981, 0.0010505616664886475, 0.001099810004234314, 0.0011490583419799805, 0.001198306679725647, 0.0012475550174713135, 0.00129680335521698, 0.0013460516929626465, 0.001395300030708313, 0.0014445483684539795, 0.001493796706199646, 0.0015430450439453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 5.0, 10.0, 5.0, 15.0, 23.0, 22.0, 34.0, 40.0, 49.0, 82.0, 132.0, 176.0, 341.0, 874.0, 129775.0, 914297.0, 1578.0, 420.0, 219.0, 127.0, 94.0, 71.0, 43.0, 29.0, 13.0, 13.0, 16.0, 14.0, 11.0, 6.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03076171875, -0.029773712158203125, -0.02878570556640625, -0.027797698974609375, -0.0268096923828125, -0.025821685791015625, -0.02483367919921875, -0.023845672607421875, -0.022857666015625, -0.021869659423828125, -0.02088165283203125, -0.019893646240234375, -0.0189056396484375, -0.017917633056640625, -0.01692962646484375, -0.015941619873046875, -0.01495361328125, -0.013965606689453125, -0.01297760009765625, -0.011989593505859375, -0.0110015869140625, -0.010013580322265625, -0.00902557373046875, -0.008037567138671875, -0.007049560546875, -0.006061553955078125, -0.00507354736328125, -0.004085540771484375, -0.0030975341796875, -0.002109527587890625, -0.00112152099609375, -0.000133514404296875, 0.0008544921875, 0.001842498779296875, 0.00283050537109375, 0.003818511962890625, 0.0048065185546875, 0.005794525146484375, 0.00678253173828125, 0.007770538330078125, 0.008758544921875, 0.009746551513671875, 0.01073455810546875, 0.011722564697265625, 0.0127105712890625, 0.013698577880859375, 0.01468658447265625, 0.015674591064453125, 0.01666259765625, 0.017650604248046875, 0.01863861083984375, 0.019626617431640625, 0.0206146240234375, 0.021602630615234375, 0.02259063720703125, 0.023578643798828125, 0.024566650390625, 0.025554656982421875, 0.02654266357421875, 0.027530670166015625, 0.0285186767578125, 0.029506683349609375, 0.03049468994140625, 0.031482696533203125, 0.032470703125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 20.0, 251.0, 579.0, 151.0, 16.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036342907696962357, -0.0034852419048547745, -0.0033361930400133133, -0.003187144175171852, -0.0030380955431610346, -0.0028890466783195734, -0.0027399978134781122, -0.0025909491814672947, -0.0024419003166258335, -0.0022928514517843723, -0.002143802586942911, -0.00199475372210145, -0.0018457050900906324, -0.0016966562252491713, -0.00154760736040771, -0.0013985586119815707, -0.0012495096307247877, -0.0011004607658833265, -0.0009514120174571872, -0.000802363152615726, -0.0006533143459819257, -0.0005042655393481255, -0.0003552166745066643, -0.00020616792608052492, -5.711906123906374e-05, 9.192975994665176e-05, 0.00024097858113236725, 0.000390027416869998, 0.0005390762235037982, 0.0006881250301375985, 0.0008371738949790597, 0.000986222643405199, 0.0011352715082466602, 0.0012843203730881214, 0.0014333691215142608, 0.001582417986355722, 0.0017314667347818613, 0.0018805155996233225, 0.0020295644644647837, 0.002178613096475601, 0.0023276619613170624, 0.0024767108261585236, 0.0026257596909999847, 0.002774808555841446, 0.0029238571878522635, 0.0030729060526937246, 0.003221954917535186, 0.0033710035495460033, 0.003520052647218108, 0.0036691015120595694, 0.0038181503769010305, 0.003967199008911848, 0.004116247873753309, 0.00426529673859477, 0.004414345603436232, 0.004563394468277693, 0.004712443333119154, 0.004861492197960615, 0.005010541062802076, 0.0051595899276435375, 0.005308638792484999, 0.005457687191665173, 0.005606736056506634, 0.005755784921348095, 0.005904833786189556]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 11.0, 14.0, 17.0, 17.0, 17.0, 25.0, 27.0, 31.0, 33.0, 34.0, 49.0, 43.0, 53.0, 46.0, 43.0, 51.0, 52.0, 46.0, 52.0, 39.0, 55.0, 45.0, 36.0, 27.0, 25.0, 20.0, 19.0, 13.0, 18.0, 9.0, 4.0, 8.0, 7.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008789896965026855, -0.0008522868156433105, -0.0008255839347839355, -0.0007988810539245605, -0.0007721781730651855, -0.0007454752922058105, -0.0007187724113464355, -0.0006920695304870605, -0.0006653666496276855, -0.0006386637687683105, -0.0006119608879089355, -0.0005852580070495605, -0.0005585551261901855, -0.0005318522453308105, -0.0005051493644714355, -0.00047844648361206055, -0.00045174360275268555, -0.00042504072189331055, -0.00039833784103393555, -0.00037163496017456055, -0.00034493207931518555, -0.00031822919845581055, -0.00029152631759643555, -0.00026482343673706055, -0.00023812055587768555, -0.00021141767501831055, -0.00018471479415893555, -0.00015801191329956055, -0.00013130903244018555, -0.00010460615158081055, -7.790327072143555e-05, -5.120038986206055e-05, -2.4497509002685547e-05, 2.205371856689453e-06, 2.8908252716064453e-05, 5.561113357543945e-05, 8.231401443481445e-05, 0.00010901689529418945, 0.00013571977615356445, 0.00016242265701293945, 0.00018912553787231445, 0.00021582841873168945, 0.00024253129959106445, 0.00026923418045043945, 0.00029593706130981445, 0.00032263994216918945, 0.00034934282302856445, 0.00037604570388793945, 0.00040274858474731445, 0.00042945146560668945, 0.00045615434646606445, 0.00048285722732543945, 0.0005095601081848145, 0.0005362629890441895, 0.0005629658699035645, 0.0005896687507629395, 0.0006163716316223145, 0.0006430745124816895, 0.0006697773933410645, 0.0006964802742004395, 0.0007231831550598145, 0.0007498860359191895, 0.0007765889167785645, 0.0008032917976379395, 0.0008299946784973145]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 7.0, 8.0, 15.0, 12.0, 14.0, 14.0, 21.0, 16.0, 23.0, 18.0, 29.0, 37.0, 34.0, 29.0, 33.0, 41.0, 47.0, 32.0, 39.0, 56.0, 36.0, 34.0, 37.0, 33.0, 32.0, 32.0, 25.0, 31.0, 33.0, 27.0, 17.0, 21.0, 17.0, 13.0, 16.0, 13.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296875, -1.86004638671875, -1.7904052734375, -1.72076416015625, -1.651123046875, -1.58148193359375, -1.5118408203125, -1.44219970703125, -1.37255859375, -1.30291748046875, -1.2332763671875, -1.16363525390625, -1.093994140625, -1.02435302734375, -0.9547119140625, -0.88507080078125, -0.8154296875, -0.74578857421875, -0.6761474609375, -0.60650634765625, -0.536865234375, -0.46722412109375, -0.3975830078125, -0.32794189453125, -0.25830078125, -0.18865966796875, -0.1190185546875, -0.04937744140625, 0.020263671875, 0.08990478515625, 0.1595458984375, 0.22918701171875, 0.298828125, 0.36846923828125, 0.4381103515625, 0.50775146484375, 0.577392578125, 0.64703369140625, 0.7166748046875, 0.78631591796875, 0.85595703125, 0.92559814453125, 0.9952392578125, 1.06488037109375, 1.134521484375, 1.20416259765625, 1.2738037109375, 1.34344482421875, 1.4130859375, 1.48272705078125, 1.5523681640625, 1.62200927734375, 1.691650390625, 1.76129150390625, 1.8309326171875, 1.90057373046875, 1.97021484375, 2.03985595703125, 2.1094970703125, 2.17913818359375, 2.248779296875, 2.31842041015625, 2.3880615234375, 2.45770263671875, 2.52734375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 13.0, 25.0, 17.0, 31.0, 60.0, 92.0, 155.0, 234.0, 391.0, 652.0, 1232.0, 2059.0, 3869.0, 7185.0, 14630.0, 30972.0, 67707.0, 148780.0, 270630.0, 253502.0, 132457.0, 59066.0, 27256.0, 13060.0, 6507.0, 3484.0, 1884.0, 1054.0, 621.0, 341.0, 210.0, 129.0, 88.0, 47.0, 29.0, 22.0, 13.0, 7.0, 11.0, 9.0, 4.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7451171875, -1.6886749267578125, -1.632232666015625, -1.5757904052734375, -1.51934814453125, -1.4629058837890625, -1.406463623046875, -1.3500213623046875, -1.2935791015625, -1.2371368408203125, -1.180694580078125, -1.1242523193359375, -1.06781005859375, -1.0113677978515625, -0.954925537109375, -0.8984832763671875, -0.842041015625, -0.7855987548828125, -0.729156494140625, -0.6727142333984375, -0.61627197265625, -0.5598297119140625, -0.503387451171875, -0.4469451904296875, -0.3905029296875, -0.3340606689453125, -0.277618408203125, -0.2211761474609375, -0.16473388671875, -0.1082916259765625, -0.051849365234375, 0.0045928955078125, 0.06103515625, 0.1174774169921875, 0.173919677734375, 0.2303619384765625, 0.28680419921875, 0.3432464599609375, 0.399688720703125, 0.4561309814453125, 0.5125732421875, 0.5690155029296875, 0.625457763671875, 0.6819000244140625, 0.73834228515625, 0.7947845458984375, 0.851226806640625, 0.9076690673828125, 0.964111328125, 1.0205535888671875, 1.076995849609375, 1.1334381103515625, 1.18988037109375, 1.2463226318359375, 1.302764892578125, 1.3592071533203125, 1.4156494140625, 1.4720916748046875, 1.528533935546875, 1.5849761962890625, 1.64141845703125, 1.6978607177734375, 1.754302978515625, 1.8107452392578125, 1.8671875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 10.0, 14.0, 15.0, 19.0, 28.0, 26.0, 27.0, 45.0, 48.0, 46.0, 50.0, 66.0, 91.0, 241.0, 1497.0, 256.0, 116.0, 53.0, 49.0, 40.0, 30.0, 32.0, 30.0, 41.0, 24.0, 17.0, 21.0, 17.0, 17.0, 12.0, 9.0, 7.0, 2.0, 6.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.578125, -8.3150634765625, -8.052001953125, -7.7889404296875, -7.52587890625, -7.2628173828125, -6.999755859375, -6.7366943359375, -6.4736328125, -6.2105712890625, -5.947509765625, -5.6844482421875, -5.42138671875, -5.1583251953125, -4.895263671875, -4.6322021484375, -4.369140625, -4.1060791015625, -3.843017578125, -3.5799560546875, -3.31689453125, -3.0538330078125, -2.790771484375, -2.5277099609375, -2.2646484375, -2.0015869140625, -1.738525390625, -1.4754638671875, -1.21240234375, -0.9493408203125, -0.686279296875, -0.4232177734375, -0.16015625, 0.1029052734375, 0.365966796875, 0.6290283203125, 0.89208984375, 1.1551513671875, 1.418212890625, 1.6812744140625, 1.9443359375, 2.2073974609375, 2.470458984375, 2.7335205078125, 2.99658203125, 3.2596435546875, 3.522705078125, 3.7857666015625, 4.048828125, 4.3118896484375, 4.574951171875, 4.8380126953125, 5.10107421875, 5.3641357421875, 5.627197265625, 5.8902587890625, 6.1533203125, 6.4163818359375, 6.679443359375, 6.9425048828125, 7.20556640625, 7.4686279296875, 7.731689453125, 7.9947509765625, 8.2578125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 11.0, 7.0, 10.0, 19.0, 25.0, 25.0, 27.0, 44.0, 59.0, 86.0, 141.0, 196.0, 380.0, 1190.0, 11629.0, 2662163.0, 462974.0, 5020.0, 813.0, 290.0, 207.0, 107.0, 69.0, 60.0, 32.0, 35.0, 18.0, 13.0, 8.0, 5.0, 10.0, 5.0, 11.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.109375, -19.5638427734375, -19.018310546875, -18.4727783203125, -17.92724609375, -17.3817138671875, -16.836181640625, -16.2906494140625, -15.7451171875, -15.1995849609375, -14.654052734375, -14.1085205078125, -13.56298828125, -13.0174560546875, -12.471923828125, -11.9263916015625, -11.380859375, -10.8353271484375, -10.289794921875, -9.7442626953125, -9.19873046875, -8.6531982421875, -8.107666015625, -7.5621337890625, -7.0166015625, -6.4710693359375, -5.925537109375, -5.3800048828125, -4.83447265625, -4.2889404296875, -3.743408203125, -3.1978759765625, -2.65234375, -2.1068115234375, -1.561279296875, -1.0157470703125, -0.47021484375, 0.0753173828125, 0.620849609375, 1.1663818359375, 1.7119140625, 2.2574462890625, 2.802978515625, 3.3485107421875, 3.89404296875, 4.4395751953125, 4.985107421875, 5.5306396484375, 6.076171875, 6.6217041015625, 7.167236328125, 7.7127685546875, 8.25830078125, 8.8038330078125, 9.349365234375, 9.8948974609375, 10.4404296875, 10.9859619140625, 11.531494140625, 12.0770263671875, 12.62255859375, 13.1680908203125, 13.713623046875, 14.2591552734375, 14.8046875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 61.0, 406.0, 463.0, 74.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.217530250549316, -13.325004577636719, -11.432479858398438, -9.53995418548584, -7.647428512573242, -5.7549028396606445, -3.8623781204223633, -1.9698524475097656, -0.07732677459716797, 1.8151986598968506, 3.707724094390869, 5.600249290466309, 7.492774963378906, 9.385300636291504, 11.277825355529785, 13.170351028442383, 15.06287670135498, 16.955402374267578, 18.84792709350586, 20.74045181274414, 22.632978439331055, 24.52550506591797, 26.41802978515625, 28.31055450439453, 30.203079223632812, 32.095603942871094, 33.988128662109375, 35.880653381347656, 37.7731819152832, 39.665706634521484, 41.558231353759766, 43.45075607299805, 45.343284606933594, 47.235809326171875, 49.128334045410156, 51.02085876464844, 52.913387298583984, 54.805912017822266, 56.69843673706055, 58.59096145629883, 60.483489990234375, 62.376014709472656, 64.26853942871094, 66.16106414794922, 68.0535888671875, 69.94612121582031, 71.83863830566406, 73.73117065429688, 75.62368774414062, 77.5162124633789, 79.40873718261719, 81.30126190185547, 83.19378662109375, 85.08631896972656, 86.97883605957031, 88.87136840820312, 90.7638931274414, 92.65641784667969, 94.54894256591797, 96.44146728515625, 98.33399200439453, 100.22651672363281, 102.11904907226562, 104.0115737915039, 105.90409851074219]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 7.0, 5.0, 6.0, 5.0, 5.0, 18.0, 16.0, 12.0, 17.0, 26.0, 29.0, 12.0, 31.0, 30.0, 31.0, 39.0, 43.0, 31.0, 44.0, 40.0, 48.0, 53.0, 48.0, 40.0, 40.0, 36.0, 22.0, 42.0, 29.0, 26.0, 29.0, 24.0, 18.0, 19.0, 21.0, 9.0, 10.0, 10.0, 2.0, 5.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.084693908691406, -28.240005493164062, -27.395315170288086, -26.550626754760742, -25.705936431884766, -24.861248016357422, -24.016559600830078, -23.1718692779541, -22.327178955078125, -21.48249053955078, -20.637800216674805, -19.79311180114746, -18.948421478271484, -18.10373306274414, -17.259044647216797, -16.41435432434082, -15.569665908813477, -14.724976539611816, -13.880287170410156, -13.035598754882812, -12.190908432006836, -11.346220016479492, -10.501530647277832, -9.656841278076172, -8.812151908874512, -7.967462539672852, -7.122773170471191, -6.2780842781066895, -5.433394908905029, -4.588705539703369, -3.744016647338867, -2.899327278137207, -2.0546398162841797, -1.209950566291809, -0.3652613162994385, 0.4794278144836426, 1.3241171836853027, 2.168806552886963, 3.013495445251465, 3.858184814453125, 4.702874183654785, 5.547563552856445, 6.3922529220581055, 7.236941814422607, 8.08163070678711, 8.926321029663086, 9.77100944519043, 10.61569881439209, 11.46038818359375, 12.30507755279541, 13.14976692199707, 13.994455337524414, 14.83914566040039, 15.683834075927734, 16.528522491455078, 17.373212814331055, 18.21790313720703, 19.062591552734375, 19.90728187561035, 20.751970291137695, 21.596660614013672, 22.441349029541016, 23.28603744506836, 24.130727767944336, 24.97541618347168]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 8.0, 8.0, 9.0, 10.0, 17.0, 14.0, 20.0, 17.0, 18.0, 21.0, 31.0, 29.0, 36.0, 36.0, 38.0, 31.0, 52.0, 39.0, 39.0, 47.0, 38.0, 34.0, 43.0, 33.0, 36.0, 35.0, 32.0, 24.0, 33.0, 27.0, 24.0, 20.0, 15.0, 21.0, 14.0, 8.0, 12.0, 8.0, 6.0, 5.0, 3.0, 6.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.00244140625, -1.9248046875, -1.84716796875, -1.76953125, -1.69189453125, -1.6142578125, -1.53662109375, -1.458984375, -1.38134765625, -1.3037109375, -1.22607421875, -1.1484375, -1.07080078125, -0.9931640625, -0.91552734375, -0.837890625, -0.76025390625, -0.6826171875, -0.60498046875, -0.52734375, -0.44970703125, -0.3720703125, -0.29443359375, -0.216796875, -0.13916015625, -0.0615234375, 0.01611328125, 0.09375, 0.17138671875, 0.2490234375, 0.32666015625, 0.404296875, 0.48193359375, 0.5595703125, 0.63720703125, 0.71484375, 0.79248046875, 0.8701171875, 0.94775390625, 1.025390625, 1.10302734375, 1.1806640625, 1.25830078125, 1.3359375, 1.41357421875, 1.4912109375, 1.56884765625, 1.646484375, 1.72412109375, 1.8017578125, 1.87939453125, 1.95703125, 2.03466796875, 2.1123046875, 2.18994140625, 2.267578125, 2.34521484375, 2.4228515625, 2.50048828125, 2.578125, 2.65576171875, 2.7333984375, 2.81103515625, 2.888671875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 3.0, 7.0, 12.0, 11.0, 12.0, 12.0, 16.0, 20.0, 31.0, 31.0, 70.0, 91.0, 129.0, 215.0, 450.0, 1125.0, 3890.0, 19570.0, 141423.0, 1296716.0, 2306177.0, 370597.0, 42720.0, 7506.0, 1898.0, 673.0, 293.0, 153.0, 118.0, 69.0, 60.0, 44.0, 23.0, 20.0, 18.0, 12.0, 17.0, 14.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.4173583984375, -5.225341796875, -5.0333251953125, -4.84130859375, -4.6492919921875, -4.457275390625, -4.2652587890625, -4.0732421875, -3.8812255859375, -3.689208984375, -3.4971923828125, -3.30517578125, -3.1131591796875, -2.921142578125, -2.7291259765625, -2.537109375, -2.3450927734375, -2.153076171875, -1.9610595703125, -1.76904296875, -1.5770263671875, -1.385009765625, -1.1929931640625, -1.0009765625, -0.8089599609375, -0.616943359375, -0.4249267578125, -0.23291015625, -0.0408935546875, 0.151123046875, 0.3431396484375, 0.53515625, 0.7271728515625, 0.919189453125, 1.1112060546875, 1.30322265625, 1.4952392578125, 1.687255859375, 1.8792724609375, 2.0712890625, 2.2633056640625, 2.455322265625, 2.6473388671875, 2.83935546875, 3.0313720703125, 3.223388671875, 3.4154052734375, 3.607421875, 3.7994384765625, 3.991455078125, 4.1834716796875, 4.37548828125, 4.5675048828125, 4.759521484375, 4.9515380859375, 5.1435546875, 5.3355712890625, 5.527587890625, 5.7196044921875, 5.91162109375, 6.1036376953125, 6.295654296875, 6.4876708984375, 6.6796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 16.0, 21.0, 33.0, 56.0, 53.0, 87.0, 144.0, 182.0, 250.0, 340.0, 443.0, 549.0, 508.0, 401.0, 286.0, 201.0, 141.0, 103.0, 86.0, 55.0, 30.0, 24.0, 13.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.34375, -9.10247802734375, -8.8612060546875, -8.61993408203125, -8.378662109375, -8.13739013671875, -7.8961181640625, -7.65484619140625, -7.41357421875, -7.17230224609375, -6.9310302734375, -6.68975830078125, -6.448486328125, -6.20721435546875, -5.9659423828125, -5.72467041015625, -5.4833984375, -5.24212646484375, -5.0008544921875, -4.75958251953125, -4.518310546875, -4.27703857421875, -4.0357666015625, -3.79449462890625, -3.55322265625, -3.31195068359375, -3.0706787109375, -2.82940673828125, -2.588134765625, -2.34686279296875, -2.1055908203125, -1.86431884765625, -1.623046875, -1.38177490234375, -1.1405029296875, -0.89923095703125, -0.657958984375, -0.41668701171875, -0.1754150390625, 0.06585693359375, 0.30712890625, 0.54840087890625, 0.7896728515625, 1.03094482421875, 1.272216796875, 1.51348876953125, 1.7547607421875, 1.99603271484375, 2.2373046875, 2.47857666015625, 2.7198486328125, 2.96112060546875, 3.202392578125, 3.44366455078125, 3.6849365234375, 3.92620849609375, 4.16748046875, 4.40875244140625, 4.6500244140625, 4.89129638671875, 5.132568359375, 5.37384033203125, 5.6151123046875, 5.85638427734375, 6.09765625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 11.0, 28.0, 20.0, 56.0, 55.0, 118.0, 176.0, 292.0, 675.0, 1677.0, 8194.0, 147196.0, 3351902.0, 657754.0, 21405.0, 2713.0, 938.0, 407.0, 242.0, 136.0, 79.0, 56.0, 44.0, 35.0, 23.0, 10.0, 8.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9921875, -15.4537353515625, -14.915283203125, -14.3768310546875, -13.83837890625, -13.2999267578125, -12.761474609375, -12.2230224609375, -11.6845703125, -11.1461181640625, -10.607666015625, -10.0692138671875, -9.53076171875, -8.9923095703125, -8.453857421875, -7.9154052734375, -7.376953125, -6.8385009765625, -6.300048828125, -5.7615966796875, -5.22314453125, -4.6846923828125, -4.146240234375, -3.6077880859375, -3.0693359375, -2.5308837890625, -1.992431640625, -1.4539794921875, -0.91552734375, -0.3770751953125, 0.161376953125, 0.6998291015625, 1.23828125, 1.7767333984375, 2.315185546875, 2.8536376953125, 3.39208984375, 3.9305419921875, 4.468994140625, 5.0074462890625, 5.5458984375, 6.0843505859375, 6.622802734375, 7.1612548828125, 7.69970703125, 8.2381591796875, 8.776611328125, 9.3150634765625, 9.853515625, 10.3919677734375, 10.930419921875, 11.4688720703125, 12.00732421875, 12.5457763671875, 13.084228515625, 13.6226806640625, 14.1611328125, 14.6995849609375, 15.238037109375, 15.7764892578125, 16.31494140625, 16.8533935546875, 17.391845703125, 17.9302978515625, 18.46875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 22.0, 126.0, 300.0, 312.0, 182.0, 52.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.18247985839844, -63.20735549926758, -60.23222732543945, -57.257102966308594, -54.28197479248047, -51.30685043334961, -48.33172607421875, -45.356597900390625, -42.3814697265625, -39.40634536743164, -36.431217193603516, -33.456092834472656, -30.48096466064453, -27.505840301513672, -24.53071403503418, -21.555587768554688, -18.580463409423828, -15.605337142944336, -12.630210876464844, -9.655085563659668, -6.679959297180176, -3.7048330307006836, -0.7297077178955078, 2.2454185485839844, 5.220544815063477, 8.195671081542969, 11.170797348022461, 14.145922660827637, 17.121047973632812, 20.096176147460938, 23.071300506591797, 26.04642677307129, 29.02155303955078, 31.996679306030273, 34.971805572509766, 37.946929931640625, 40.92205810546875, 43.89718246459961, 46.87230682373047, 49.847434997558594, 52.82256317138672, 55.79768753051758, 58.7728157043457, 61.74794006347656, 64.72306823730469, 67.69819641113281, 70.6733169555664, 73.64844512939453, 76.62356567382812, 79.59869384765625, 82.57381439208984, 85.54894256591797, 88.5240707397461, 91.49919891357422, 94.47431945800781, 97.44944763183594, 100.42457580566406, 103.39970397949219, 106.37482452392578, 109.3499526977539, 112.32508087158203, 115.30020904541016, 118.27532958984375, 121.25045776367188, 124.2255859375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 2.0, 3.0, 8.0, 14.0, 12.0, 8.0, 14.0, 14.0, 21.0, 22.0, 31.0, 21.0, 29.0, 32.0, 48.0, 36.0, 31.0, 41.0, 42.0, 58.0, 34.0, 44.0, 39.0, 39.0, 36.0, 41.0, 35.0, 34.0, 21.0, 32.0, 21.0, 21.0, 17.0, 22.0, 11.0, 16.0, 6.0, 10.0, 5.0, 8.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.872852325439453, -22.115867614746094, -21.358884811401367, -20.601900100708008, -19.84491539001465, -19.087932586669922, -18.330947875976562, -17.573963165283203, -16.816980361938477, -16.059995651245117, -15.303011894226074, -14.546028137207031, -13.789044380187988, -13.032060623168945, -12.275075912475586, -11.518092155456543, -10.761107444763184, -10.00412368774414, -9.247138977050781, -8.490155220031738, -7.733171463012695, -6.976187229156494, -6.219202995300293, -5.46221923828125, -4.705235004425049, -3.9482510089874268, -3.1912670135498047, -2.4342827796936035, -1.6772987842559814, -0.9203147888183594, -0.1633305549621582, 0.5936532020568848, 1.350637435913086, 2.107621431350708, 2.86460542678833, 3.6215896606445312, 4.378573417663574, 5.135557651519775, 5.892541885375977, 6.6495256423950195, 7.406509876251221, 8.163494110107422, 8.920477867126465, 9.677461624145508, 10.434446334838867, 11.19143009185791, 11.948413848876953, 12.705398559570312, 13.462382316589355, 14.219366073608398, 14.976350784301758, 15.7333345413208, 16.490318298339844, 17.247303009033203, 18.004287719726562, 18.76127052307129, 19.51825523376465, 20.275239944458008, 21.032222747802734, 21.789207458496094, 22.546192169189453, 23.30317497253418, 24.06015968322754, 24.817142486572266, 25.574127197265625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 8.0, 15.0, 14.0, 15.0, 13.0, 15.0, 24.0, 20.0, 30.0, 20.0, 28.0, 26.0, 35.0, 37.0, 43.0, 31.0, 38.0, 33.0, 40.0, 35.0, 32.0, 50.0, 41.0, 32.0, 29.0, 24.0, 37.0, 22.0, 31.0, 13.0, 24.0, 24.0, 24.0, 14.0, 13.0, 8.0, 11.0, 10.0, 9.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.234375, -2.159576416015625, -2.08477783203125, -2.009979248046875, -1.9351806640625, -1.860382080078125, -1.78558349609375, -1.710784912109375, -1.635986328125, -1.561187744140625, -1.48638916015625, -1.411590576171875, -1.3367919921875, -1.261993408203125, -1.18719482421875, -1.112396240234375, -1.03759765625, -0.962799072265625, -0.88800048828125, -0.813201904296875, -0.7384033203125, -0.663604736328125, -0.58880615234375, -0.514007568359375, -0.439208984375, -0.364410400390625, -0.28961181640625, -0.214813232421875, -0.1400146484375, -0.065216064453125, 0.00958251953125, 0.084381103515625, 0.1591796875, 0.233978271484375, 0.30877685546875, 0.383575439453125, 0.4583740234375, 0.533172607421875, 0.60797119140625, 0.682769775390625, 0.757568359375, 0.832366943359375, 0.90716552734375, 0.981964111328125, 1.0567626953125, 1.131561279296875, 1.20635986328125, 1.281158447265625, 1.35595703125, 1.430755615234375, 1.50555419921875, 1.580352783203125, 1.6551513671875, 1.729949951171875, 1.80474853515625, 1.879547119140625, 1.954345703125, 2.029144287109375, 2.10394287109375, 2.178741455078125, 2.2535400390625, 2.328338623046875, 2.40313720703125, 2.477935791015625, 2.552734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 27.0, 39.0, 49.0, 66.0, 125.0, 211.0, 272.0, 392.0, 569.0, 828.0, 1269.0, 1840.0, 2742.0, 4075.0, 6222.0, 9269.0, 13524.0, 20200.0, 30049.0, 44472.0, 65026.0, 99822.0, 153494.0, 189621.0, 135362.0, 88737.0, 58884.0, 39259.0, 26447.0, 18304.0, 12427.0, 8145.0, 5549.0, 3718.0, 2451.0, 1680.0, 1097.0, 755.0, 498.0, 333.0, 228.0, 141.0, 99.0, 75.0, 50.0, 26.0, 27.0, 17.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.20953750610351562, -0.20240020751953125, -0.19526290893554688, -0.1881256103515625, -0.18098831176757812, -0.17385101318359375, -0.16671371459960938, -0.159576416015625, -0.15243911743164062, -0.14530181884765625, -0.13816452026367188, -0.1310272216796875, -0.12388992309570312, -0.11675262451171875, -0.10961532592773438, -0.10247802734375, -0.09534072875976562, -0.08820343017578125, -0.08106613159179688, -0.0739288330078125, -0.06679153442382812, -0.05965423583984375, -0.052516937255859375, -0.045379638671875, -0.038242340087890625, -0.03110504150390625, -0.023967742919921875, -0.0168304443359375, -0.009693145751953125, -0.00255584716796875, 0.004581451416015625, 0.01171875, 0.018856048583984375, 0.02599334716796875, 0.033130645751953125, 0.0402679443359375, 0.047405242919921875, 0.05454254150390625, 0.061679840087890625, 0.068817138671875, 0.07595443725585938, 0.08309173583984375, 0.09022903442382812, 0.0973663330078125, 0.10450363159179688, 0.11164093017578125, 0.11877822875976562, 0.12591552734375, 0.13305282592773438, 0.14019012451171875, 0.14732742309570312, 0.1544647216796875, 0.16160202026367188, 0.16873931884765625, 0.17587661743164062, 0.183013916015625, 0.19015121459960938, 0.19728851318359375, 0.20442581176757812, 0.2115631103515625, 0.21870040893554688, 0.22583770751953125, 0.23297500610351562, 0.2401123046875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 5.0, 16.0, 6.0, 10.0, 14.0, 11.0, 12.0, 17.0, 32.0, 27.0, 28.0, 33.0, 25.0, 29.0, 40.0, 30.0, 44.0, 28.0, 39.0, 31.0, 1066.0, 42.0, 40.0, 38.0, 35.0, 25.0, 23.0, 32.0, 28.0, 25.0, 19.0, 19.0, 19.0, 23.0, 17.0, 22.0, 5.0, 9.0, 11.0, 6.0, 11.0, 4.0, 12.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.5537109375, -1.507781982421875, -1.46185302734375, -1.415924072265625, -1.3699951171875, -1.324066162109375, -1.27813720703125, -1.232208251953125, -1.186279296875, -1.140350341796875, -1.09442138671875, -1.048492431640625, -1.0025634765625, -0.956634521484375, -0.91070556640625, -0.864776611328125, -0.81884765625, -0.772918701171875, -0.72698974609375, -0.681060791015625, -0.6351318359375, -0.589202880859375, -0.54327392578125, -0.497344970703125, -0.451416015625, -0.405487060546875, -0.35955810546875, -0.313629150390625, -0.2677001953125, -0.221771240234375, -0.17584228515625, -0.129913330078125, -0.083984375, -0.038055419921875, 0.00787353515625, 0.053802490234375, 0.0997314453125, 0.145660400390625, 0.19158935546875, 0.237518310546875, 0.283447265625, 0.329376220703125, 0.37530517578125, 0.421234130859375, 0.4671630859375, 0.513092041015625, 0.55902099609375, 0.604949951171875, 0.65087890625, 0.696807861328125, 0.74273681640625, 0.788665771484375, 0.8345947265625, 0.880523681640625, 0.92645263671875, 0.972381591796875, 1.018310546875, 1.064239501953125, 1.11016845703125, 1.156097412109375, 1.2020263671875, 1.247955322265625, 1.29388427734375, 1.339813232421875, 1.3857421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 8.0, 13.0, 11.0, 21.0, 23.0, 31.0, 49.0, 62.0, 82.0, 120.0, 201.0, 274.0, 401.0, 569.0, 814.0, 1149.0, 1771.0, 2672.0, 3740.0, 5781.0, 8755.0, 13383.0, 20809.0, 33249.0, 53641.0, 87710.0, 146715.0, 1267825.0, 172901.0, 103631.0, 62424.0, 38514.0, 24090.0, 15350.0, 10019.0, 6612.0, 4353.0, 2989.0, 2050.0, 1356.0, 915.0, 616.0, 436.0, 286.0, 197.0, 149.0, 115.0, 81.0, 56.0, 43.0, 23.0, 20.0, 12.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2269287109375, -0.2195281982421875, -0.212127685546875, -0.2047271728515625, -0.19732666015625, -0.1899261474609375, -0.182525634765625, -0.1751251220703125, -0.167724609375, -0.1603240966796875, -0.152923583984375, -0.1455230712890625, -0.13812255859375, -0.1307220458984375, -0.123321533203125, -0.1159210205078125, -0.1085205078125, -0.1011199951171875, -0.093719482421875, -0.0863189697265625, -0.07891845703125, -0.0715179443359375, -0.064117431640625, -0.0567169189453125, -0.04931640625, -0.0419158935546875, -0.034515380859375, -0.0271148681640625, -0.01971435546875, -0.0123138427734375, -0.004913330078125, 0.0024871826171875, 0.0098876953125, 0.0172882080078125, 0.024688720703125, 0.0320892333984375, 0.03948974609375, 0.0468902587890625, 0.054290771484375, 0.0616912841796875, 0.069091796875, 0.0764923095703125, 0.083892822265625, 0.0912933349609375, 0.09869384765625, 0.1060943603515625, 0.113494873046875, 0.1208953857421875, 0.1282958984375, 0.1356964111328125, 0.143096923828125, 0.1504974365234375, 0.15789794921875, 0.1652984619140625, 0.172698974609375, 0.1800994873046875, 0.1875, 0.1949005126953125, 0.202301025390625, 0.2097015380859375, 0.21710205078125, 0.2245025634765625, 0.231903076171875, 0.2393035888671875, 0.2467041015625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 10.0, 7.0, 4.0, 9.0, 13.0, 11.0, 23.0, 23.0, 28.0, 40.0, 50.0, 57.0, 83.0, 85.0, 71.0, 91.0, 85.0, 67.0, 54.0, 34.0, 29.0, 21.0, 14.0, 17.0, 12.0, 20.0, 7.0, 8.0, 5.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001476287841796875, -0.0014338046312332153, -0.0013913214206695557, -0.001348838210105896, -0.0013063549995422363, -0.0012638717889785767, -0.001221388578414917, -0.0011789053678512573, -0.0011364221572875977, -0.001093938946723938, -0.0010514557361602783, -0.0010089725255966187, -0.000966489315032959, -0.0009240061044692993, -0.0008815228939056396, -0.00083903968334198, -0.0007965564727783203, -0.0007540732622146606, -0.000711590051651001, -0.0006691068410873413, -0.0006266236305236816, -0.000584140419960022, -0.0005416572093963623, -0.0004991739988327026, -0.00045669078826904297, -0.0004142075777053833, -0.00037172436714172363, -0.00032924115657806396, -0.0002867579460144043, -0.00024427473545074463, -0.00020179152488708496, -0.0001593083143234253, -0.00011682510375976562, -7.434189319610596e-05, -3.185868263244629e-05, 1.0624527931213379e-05, 5.310773849487305e-05, 9.559094905853271e-05, 0.00013807415962219238, 0.00018055737018585205, 0.00022304058074951172, 0.0002655237913131714, 0.00030800700187683105, 0.0003504902124404907, 0.0003929734230041504, 0.00043545663356781006, 0.0004779398441314697, 0.0005204230546951294, 0.0005629062652587891, 0.0006053894758224487, 0.0006478726863861084, 0.0006903558969497681, 0.0007328391075134277, 0.0007753223180770874, 0.0008178055286407471, 0.0008602887392044067, 0.0009027719497680664, 0.0009452551603317261, 0.0009877383708953857, 0.0010302215814590454, 0.001072704792022705, 0.0011151880025863647, 0.0011576712131500244, 0.001200154423713684, 0.0012426376342773438]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 13.0, 5.0, 6.0, 17.0, 17.0, 24.0, 23.0, 44.0, 58.0, 76.0, 133.0, 172.0, 296.0, 574.0, 4273.0, 907551.0, 132652.0, 1430.0, 428.0, 225.0, 153.0, 104.0, 81.0, 59.0, 40.0, 28.0, 16.0, 12.0, 15.0, 10.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023834228515625, -0.02300739288330078, -0.022180557250976562, -0.021353721618652344, -0.020526885986328125, -0.019700050354003906, -0.018873214721679688, -0.01804637908935547, -0.01721954345703125, -0.01639270782470703, -0.015565872192382812, -0.014739036560058594, -0.013912200927734375, -0.013085365295410156, -0.012258529663085938, -0.011431694030761719, -0.0106048583984375, -0.009778022766113281, -0.008951187133789062, -0.008124351501464844, -0.007297515869140625, -0.006470680236816406, -0.0056438446044921875, -0.004817008972167969, -0.00399017333984375, -0.0031633377075195312, -0.0023365020751953125, -0.0015096664428710938, -0.000682830810546875, 0.00014400482177734375, 0.0009708404541015625, 0.0017976760864257812, 0.00262451171875, 0.0034513473510742188, 0.0042781829833984375, 0.005105018615722656, 0.005931854248046875, 0.006758689880371094, 0.0075855255126953125, 0.008412361145019531, 0.00923919677734375, 0.010066032409667969, 0.010892868041992188, 0.011719703674316406, 0.012546539306640625, 0.013373374938964844, 0.014200210571289062, 0.015027046203613281, 0.0158538818359375, 0.01668071746826172, 0.017507553100585938, 0.018334388732910156, 0.019161224365234375, 0.019988059997558594, 0.020814895629882812, 0.02164173126220703, 0.02246856689453125, 0.02329540252685547, 0.024122238159179688, 0.024949073791503906, 0.025775909423828125, 0.026602745056152344, 0.027429580688476562, 0.02825641632080078, 0.029083251953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 49.0, 127.0, 281.0, 283.0, 171.0, 63.0, 16.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039117899723351, -0.0038353886920958757, -0.0037589874118566513, -0.003682586131617427, -0.0036061848513782024, -0.003529783571138978, -0.0034533822908997536, -0.003376981243491173, -0.0033005797304213047, -0.0032241784501820803, -0.003147777169942856, -0.0030713758897036314, -0.002994974609464407, -0.0029185733292251825, -0.002842172048985958, -0.0027657710015773773, -0.002689369721338153, -0.0026129684410989285, -0.002536567160859704, -0.0024601658806204796, -0.002383764600381255, -0.0023073633201420307, -0.0022309620399028063, -0.002154560759663582, -0.002078159712255001, -0.0020017584320157766, -0.0019253571517765522, -0.0018489558715373278, -0.0017725545912981033, -0.001696153311058879, -0.0016197521472349763, -0.0015433508669957519, -0.001466949237510562, -0.0013905479572713375, -0.001314146677032113, -0.0012377453967928886, -0.0011613441165536642, -0.0010849428363144398, -0.0010085416724905372, -0.0009321403922513127, -0.0008557391120120883, -0.0007793378317728639, -0.0007029365515336394, -0.0006265353295020759, -0.0005501340492628515, -0.00047373276902362704, -0.00039733151788823307, -0.0003209302667528391, -0.00024452898651361465, -0.00016812772082630545, -9.172645513899624e-05, -1.5325189451687038e-05, 6.107607623562217e-05, 0.0001374773564748466, 0.00021387860761024058, 0.00029027985874563456, 0.000366681138984859, 0.0004430824192240834, 0.0005194836994633079, 0.0005958849214948714, 0.0006722862017340958, 0.0007486874819733202, 0.0008250887040048838, 0.0009014899842441082, 0.0009778912644833326]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 1.0, 10.0, 10.0, 12.0, 16.0, 20.0, 10.0, 15.0, 21.0, 24.0, 29.0, 28.0, 28.0, 41.0, 38.0, 37.0, 48.0, 47.0, 40.0, 39.0, 39.0, 45.0, 47.0, 36.0, 45.0, 40.0, 26.0, 22.0, 37.0, 26.0, 15.0, 27.0, 10.0, 15.0, 10.0, 12.0, 2.0, 4.0, 7.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0006422996520996094, -0.0006229588761925697, -0.0006036181002855301, -0.0005842773243784904, -0.0005649365484714508, -0.0005455957725644112, -0.0005262549966573715, -0.0005069142207503319, -0.00048757344484329224, -0.0004682326689362526, -0.00044889189302921295, -0.0004295511171221733, -0.00041021034121513367, -0.000390869565308094, -0.0003715287894010544, -0.00035218801349401474, -0.0003328472375869751, -0.00031350646167993546, -0.0002941656857728958, -0.00027482490986585617, -0.00025548413395881653, -0.00023614335805177689, -0.00021680258214473724, -0.0001974618062376976, -0.00017812103033065796, -0.00015878025442361832, -0.00013943947851657867, -0.00012009870260953903, -0.00010075792670249939, -8.141715079545975e-05, -6.20763748884201e-05, -4.273559898138046e-05, -2.339482307434082e-05, -4.054047167301178e-06, 1.5286728739738464e-05, 3.462750464677811e-05, 5.396828055381775e-05, 7.330905646085739e-05, 9.264983236789703e-05, 0.00011199060827493668, 0.00013133138418197632, 0.00015067216008901596, 0.0001700129359960556, 0.00018935371190309525, 0.0002086944878101349, 0.00022803526371717453, 0.00024737603962421417, 0.0002667168155312538, 0.00028605759143829346, 0.0003053983673453331, 0.00032473914325237274, 0.0003440799191594124, 0.000363420695066452, 0.00038276147097349167, 0.0004021022468805313, 0.00042144302278757095, 0.0004407837986946106, 0.00046012457460165024, 0.0004794653505086899, 0.0004988061264157295, 0.0005181469023227692, 0.0005374876782298088, 0.0005568284541368484, 0.0005761692300438881, 0.0005955100059509277]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 8.0, 15.0, 14.0, 15.0, 13.0, 15.0, 24.0, 20.0, 30.0, 20.0, 28.0, 26.0, 35.0, 37.0, 43.0, 31.0, 38.0, 33.0, 40.0, 35.0, 32.0, 50.0, 41.0, 32.0, 29.0, 24.0, 37.0, 22.0, 31.0, 13.0, 24.0, 24.0, 24.0, 14.0, 13.0, 8.0, 11.0, 10.0, 9.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.234375, -2.159576416015625, -2.08477783203125, -2.009979248046875, -1.9351806640625, -1.860382080078125, -1.78558349609375, -1.710784912109375, -1.635986328125, -1.561187744140625, -1.48638916015625, -1.411590576171875, -1.3367919921875, -1.261993408203125, -1.18719482421875, -1.112396240234375, -1.03759765625, -0.962799072265625, -0.88800048828125, -0.813201904296875, -0.7384033203125, -0.663604736328125, -0.58880615234375, -0.514007568359375, -0.439208984375, -0.364410400390625, -0.28961181640625, -0.214813232421875, -0.1400146484375, -0.065216064453125, 0.00958251953125, 0.084381103515625, 0.1591796875, 0.233978271484375, 0.30877685546875, 0.383575439453125, 0.4583740234375, 0.533172607421875, 0.60797119140625, 0.682769775390625, 0.757568359375, 0.832366943359375, 0.90716552734375, 0.981964111328125, 1.0567626953125, 1.131561279296875, 1.20635986328125, 1.281158447265625, 1.35595703125, 1.430755615234375, 1.50555419921875, 1.580352783203125, 1.6551513671875, 1.729949951171875, 1.80474853515625, 1.879547119140625, 1.954345703125, 2.029144287109375, 2.10394287109375, 2.178741455078125, 2.2535400390625, 2.328338623046875, 2.40313720703125, 2.477935791015625, 2.552734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 11.0, 26.0, 22.0, 25.0, 37.0, 60.0, 77.0, 100.0, 163.0, 215.0, 306.0, 462.0, 671.0, 1108.0, 1777.0, 2714.0, 4436.0, 7729.0, 14529.0, 29664.0, 69879.0, 202312.0, 422409.0, 170627.0, 61221.0, 26119.0, 13220.0, 7110.0, 4142.0, 2624.0, 1607.0, 1025.0, 631.0, 448.0, 301.0, 197.0, 160.0, 88.0, 84.0, 50.0, 34.0, 30.0, 35.0, 15.0, 12.0, 11.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.048828125, -2.954803466796875, -2.86077880859375, -2.766754150390625, -2.6727294921875, -2.578704833984375, -2.48468017578125, -2.390655517578125, -2.296630859375, -2.202606201171875, -2.10858154296875, -2.014556884765625, -1.9205322265625, -1.826507568359375, -1.73248291015625, -1.638458251953125, -1.54443359375, -1.450408935546875, -1.35638427734375, -1.262359619140625, -1.1683349609375, -1.074310302734375, -0.98028564453125, -0.886260986328125, -0.792236328125, -0.698211669921875, -0.60418701171875, -0.510162353515625, -0.4161376953125, -0.322113037109375, -0.22808837890625, -0.134063720703125, -0.0400390625, 0.053985595703125, 0.14801025390625, 0.242034912109375, 0.3360595703125, 0.430084228515625, 0.52410888671875, 0.618133544921875, 0.712158203125, 0.806182861328125, 0.90020751953125, 0.994232177734375, 1.0882568359375, 1.182281494140625, 1.27630615234375, 1.370330810546875, 1.46435546875, 1.558380126953125, 1.65240478515625, 1.746429443359375, 1.8404541015625, 1.934478759765625, 2.02850341796875, 2.122528076171875, 2.216552734375, 2.310577392578125, 2.40460205078125, 2.498626708984375, 2.5926513671875, 2.686676025390625, 2.78070068359375, 2.874725341796875, 2.96875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 19.0, 21.0, 16.0, 19.0, 30.0, 25.0, 21.0, 27.0, 30.0, 45.0, 37.0, 42.0, 55.0, 76.0, 188.0, 1484.0, 323.0, 118.0, 67.0, 43.0, 49.0, 33.0, 31.0, 29.0, 36.0, 36.0, 24.0, 14.0, 20.0, 10.0, 7.0, 10.0, 10.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.015625, -8.732421875, -8.44921875, -8.166015625, -7.8828125, -7.599609375, -7.31640625, -7.033203125, -6.75, -6.466796875, -6.18359375, -5.900390625, -5.6171875, -5.333984375, -5.05078125, -4.767578125, -4.484375, -4.201171875, -3.91796875, -3.634765625, -3.3515625, -3.068359375, -2.78515625, -2.501953125, -2.21875, -1.935546875, -1.65234375, -1.369140625, -1.0859375, -0.802734375, -0.51953125, -0.236328125, 0.046875, 0.330078125, 0.61328125, 0.896484375, 1.1796875, 1.462890625, 1.74609375, 2.029296875, 2.3125, 2.595703125, 2.87890625, 3.162109375, 3.4453125, 3.728515625, 4.01171875, 4.294921875, 4.578125, 4.861328125, 5.14453125, 5.427734375, 5.7109375, 5.994140625, 6.27734375, 6.560546875, 6.84375, 7.126953125, 7.41015625, 7.693359375, 7.9765625, 8.259765625, 8.54296875, 8.826171875, 9.109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 16.0, 25.0, 20.0, 34.0, 47.0, 52.0, 95.0, 181.0, 235.0, 503.0, 2671.0, 82360.0, 3029781.0, 26883.0, 1592.0, 486.0, 217.0, 122.0, 83.0, 65.0, 49.0, 40.0, 22.0, 15.0, 17.0, 17.0, 3.0, 11.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.0, -22.217041015625, -21.43408203125, -20.651123046875, -19.8681640625, -19.085205078125, -18.30224609375, -17.519287109375, -16.736328125, -15.953369140625, -15.17041015625, -14.387451171875, -13.6044921875, -12.821533203125, -12.03857421875, -11.255615234375, -10.47265625, -9.689697265625, -8.90673828125, -8.123779296875, -7.3408203125, -6.557861328125, -5.77490234375, -4.991943359375, -4.208984375, -3.426025390625, -2.64306640625, -1.860107421875, -1.0771484375, -0.294189453125, 0.48876953125, 1.271728515625, 2.0546875, 2.837646484375, 3.62060546875, 4.403564453125, 5.1865234375, 5.969482421875, 6.75244140625, 7.535400390625, 8.318359375, 9.101318359375, 9.88427734375, 10.667236328125, 11.4501953125, 12.233154296875, 13.01611328125, 13.799072265625, 14.58203125, 15.364990234375, 16.14794921875, 16.930908203125, 17.7138671875, 18.496826171875, 19.27978515625, 20.062744140625, 20.845703125, 21.628662109375, 22.41162109375, 23.194580078125, 23.9775390625, 24.760498046875, 25.54345703125, 26.326416015625, 27.109375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 192.0, 666.0, 142.0, 3.0, 1.0, 1.0, 1.0], "bins": [-183.06349182128906, -179.92803955078125, -176.7926025390625, -173.6571502685547, -170.52171325683594, -167.38626098632812, -164.25082397460938, -161.11537170410156, -157.97991943359375, -154.84446716308594, -151.7090301513672, -148.57357788085938, -145.43814086914062, -142.3026885986328, -139.167236328125, -136.03179931640625, -132.8963623046875, -129.7609100341797, -126.62547302246094, -123.49002075195312, -120.35457611083984, -117.21913146972656, -114.08368682861328, -110.9482421875, -107.81278991699219, -104.6773452758789, -101.54190063476562, -98.40644836425781, -95.27100372314453, -92.13555908203125, -89.00011444091797, -85.86466979980469, -82.7292251586914, -79.59378051757812, -76.45833587646484, -73.32289123535156, -70.18743896484375, -67.05199432373047, -63.91654968261719, -60.781105041503906, -57.64565658569336, -54.51021194458008, -51.37476348876953, -48.23931884765625, -45.10387420654297, -41.96842956542969, -38.83298110961914, -35.69753646850586, -32.56208801269531, -29.4266414642334, -26.291196823120117, -23.155750274658203, -20.020305633544922, -16.884859085083008, -13.749412536621094, -10.613967895507812, -7.478523254394531, -4.343077659606934, -1.2076315879821777, 1.9278144836425781, 5.063260078430176, 8.198705673217773, 11.334152221679688, 14.469596862792969, 17.605043411254883]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 5.0, 6.0, 6.0, 8.0, 16.0, 8.0, 21.0, 20.0, 20.0, 31.0, 30.0, 33.0, 32.0, 46.0, 34.0, 44.0, 37.0, 39.0, 47.0, 42.0, 44.0, 46.0, 48.0, 46.0, 29.0, 23.0, 23.0, 31.0, 32.0, 24.0, 19.0, 22.0, 15.0, 18.0, 9.0, 9.0, 4.0, 4.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.365337371826172, -30.490711212158203, -29.616085052490234, -28.7414608001709, -27.86683464050293, -26.99220848083496, -26.117582321166992, -25.242958068847656, -24.368331909179688, -23.49370574951172, -22.61907958984375, -21.744455337524414, -20.869829177856445, -19.995203018188477, -19.120576858520508, -18.245952606201172, -17.371326446533203, -16.496700286865234, -15.622075080871582, -14.747448921203613, -13.872823715209961, -12.998197555541992, -12.123571395874023, -11.248946189880371, -10.374319076538086, -9.499692916870117, -8.625067710876465, -7.750441551208496, -6.875816345214844, -6.001190185546875, -5.1265645027160645, -4.251938819885254, -3.3773136138916016, -2.502687931060791, -1.628062129020691, -0.7534363269805908, 0.12118935585021973, 0.9958152770996094, 1.87044095993042, 2.7450666427612305, 3.619692325592041, 4.494318008422852, 5.368943691253662, 6.243569374084473, 7.118195533752441, 7.992821216583252, 8.867446899414062, 9.742073059082031, 10.616698265075684, 11.491324424743652, 12.365949630737305, 13.240575790405273, 14.115200996398926, 14.989827156066895, 15.864452362060547, 16.739078521728516, 17.613704681396484, 18.488330841064453, 19.362957000732422, 20.237581253051758, 21.112207412719727, 21.986833572387695, 22.861459732055664, 23.736083984375, 24.61071014404297]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 8.0, 3.0, 10.0, 8.0, 14.0, 18.0, 14.0, 11.0, 14.0, 22.0, 22.0, 26.0, 38.0, 28.0, 31.0, 38.0, 33.0, 31.0, 40.0, 34.0, 36.0, 29.0, 45.0, 43.0, 35.0, 45.0, 32.0, 34.0, 23.0, 28.0, 28.0, 22.0, 28.0, 20.0, 22.0, 14.0, 15.0, 14.0, 8.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.21484375, -2.1343994140625, -2.053955078125, -1.9735107421875, -1.89306640625, -1.8126220703125, -1.732177734375, -1.6517333984375, -1.5712890625, -1.4908447265625, -1.410400390625, -1.3299560546875, -1.24951171875, -1.1690673828125, -1.088623046875, -1.0081787109375, -0.927734375, -0.8472900390625, -0.766845703125, -0.6864013671875, -0.60595703125, -0.5255126953125, -0.445068359375, -0.3646240234375, -0.2841796875, -0.2037353515625, -0.123291015625, -0.0428466796875, 0.03759765625, 0.1180419921875, 0.198486328125, 0.2789306640625, 0.359375, 0.4398193359375, 0.520263671875, 0.6007080078125, 0.68115234375, 0.7615966796875, 0.842041015625, 0.9224853515625, 1.0029296875, 1.0833740234375, 1.163818359375, 1.2442626953125, 1.32470703125, 1.4051513671875, 1.485595703125, 1.5660400390625, 1.646484375, 1.7269287109375, 1.807373046875, 1.8878173828125, 1.96826171875, 2.0487060546875, 2.129150390625, 2.2095947265625, 2.2900390625, 2.3704833984375, 2.450927734375, 2.5313720703125, 2.61181640625, 2.6922607421875, 2.772705078125, 2.8531494140625, 2.93359375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 17.0, 17.0, 20.0, 27.0, 27.0, 55.0, 76.0, 96.0, 159.0, 276.0, 458.0, 972.0, 1933.0, 4414.0, 11491.0, 34145.0, 113811.0, 404255.0, 1139432.0, 1477528.0, 711784.0, 203842.0, 57795.0, 18692.0, 6995.0, 2865.0, 1345.0, 685.0, 391.0, 203.0, 134.0, 101.0, 64.0, 43.0, 38.0, 20.0, 14.0, 17.0, 7.0, 8.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.48046875, -3.369049072265625, -3.25762939453125, -3.146209716796875, -3.0347900390625, -2.923370361328125, -2.81195068359375, -2.700531005859375, -2.589111328125, -2.477691650390625, -2.36627197265625, -2.254852294921875, -2.1434326171875, -2.032012939453125, -1.92059326171875, -1.809173583984375, -1.69775390625, -1.586334228515625, -1.47491455078125, -1.363494873046875, -1.2520751953125, -1.140655517578125, -1.02923583984375, -0.917816162109375, -0.806396484375, -0.694976806640625, -0.58355712890625, -0.472137451171875, -0.3607177734375, -0.249298095703125, -0.13787841796875, -0.026458740234375, 0.0849609375, 0.196380615234375, 0.30780029296875, 0.419219970703125, 0.5306396484375, 0.642059326171875, 0.75347900390625, 0.864898681640625, 0.976318359375, 1.087738037109375, 1.19915771484375, 1.310577392578125, 1.4219970703125, 1.533416748046875, 1.64483642578125, 1.756256103515625, 1.86767578125, 1.979095458984375, 2.09051513671875, 2.201934814453125, 2.3133544921875, 2.424774169921875, 2.53619384765625, 2.647613525390625, 2.759033203125, 2.870452880859375, 2.98187255859375, 3.093292236328125, 3.2047119140625, 3.316131591796875, 3.42755126953125, 3.538970947265625, 3.650390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 14.0, 23.0, 42.0, 47.0, 67.0, 115.0, 150.0, 224.0, 339.0, 457.0, 547.0, 557.0, 464.0, 315.0, 220.0, 170.0, 108.0, 59.0, 44.0, 42.0, 20.0, 14.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-12.1953125, -11.91094970703125, -11.6265869140625, -11.34222412109375, -11.057861328125, -10.77349853515625, -10.4891357421875, -10.20477294921875, -9.92041015625, -9.63604736328125, -9.3516845703125, -9.06732177734375, -8.782958984375, -8.49859619140625, -8.2142333984375, -7.92987060546875, -7.6455078125, -7.36114501953125, -7.0767822265625, -6.79241943359375, -6.508056640625, -6.22369384765625, -5.9393310546875, -5.65496826171875, -5.37060546875, -5.08624267578125, -4.8018798828125, -4.51751708984375, -4.233154296875, -3.94879150390625, -3.6644287109375, -3.38006591796875, -3.095703125, -2.81134033203125, -2.5269775390625, -2.24261474609375, -1.958251953125, -1.67388916015625, -1.3895263671875, -1.10516357421875, -0.82080078125, -0.53643798828125, -0.2520751953125, 0.03228759765625, 0.316650390625, 0.60101318359375, 0.8853759765625, 1.16973876953125, 1.4541015625, 1.73846435546875, 2.0228271484375, 2.30718994140625, 2.591552734375, 2.87591552734375, 3.1602783203125, 3.44464111328125, 3.72900390625, 4.01336669921875, 4.2977294921875, 4.58209228515625, 4.866455078125, 5.15081787109375, 5.4351806640625, 5.71954345703125, 6.00390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 17.0, 14.0, 15.0, 34.0, 40.0, 67.0, 108.0, 198.0, 409.0, 1128.0, 5603.0, 133794.0, 3537832.0, 499765.0, 12597.0, 1499.0, 530.0, 252.0, 148.0, 67.0, 51.0, 21.0, 25.0, 19.0, 13.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3671875, -14.7440185546875, -14.120849609375, -13.4976806640625, -12.87451171875, -12.2513427734375, -11.628173828125, -11.0050048828125, -10.3818359375, -9.7586669921875, -9.135498046875, -8.5123291015625, -7.88916015625, -7.2659912109375, -6.642822265625, -6.0196533203125, -5.396484375, -4.7733154296875, -4.150146484375, -3.5269775390625, -2.90380859375, -2.2806396484375, -1.657470703125, -1.0343017578125, -0.4111328125, 0.2120361328125, 0.835205078125, 1.4583740234375, 2.08154296875, 2.7047119140625, 3.327880859375, 3.9510498046875, 4.57421875, 5.1973876953125, 5.820556640625, 6.4437255859375, 7.06689453125, 7.6900634765625, 8.313232421875, 8.9364013671875, 9.5595703125, 10.1827392578125, 10.805908203125, 11.4290771484375, 12.05224609375, 12.6754150390625, 13.298583984375, 13.9217529296875, 14.544921875, 15.1680908203125, 15.791259765625, 16.4144287109375, 17.03759765625, 17.6607666015625, 18.283935546875, 18.9071044921875, 19.5302734375, 20.1534423828125, 20.776611328125, 21.3997802734375, 22.02294921875, 22.6461181640625, 23.269287109375, 23.8924560546875, 24.515625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 17.0, 25.0, 33.0, 68.0, 93.0, 114.0, 129.0, 118.0, 134.0, 96.0, 56.0, 46.0, 32.0, 18.0, 7.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.169708251953125, -35.07180404663086, -33.973899841308594, -32.87599563598633, -31.778091430664062, -30.680187225341797, -29.582284927368164, -28.4843807220459, -27.386476516723633, -26.288572311401367, -25.1906681060791, -24.092763900756836, -22.994861602783203, -21.896957397460938, -20.799053192138672, -19.701148986816406, -18.60324478149414, -17.505340576171875, -16.40743637084961, -15.30953311920166, -14.211628913879395, -13.113724708557129, -12.01582145690918, -10.917917251586914, -9.820013046264648, -8.722108840942383, -7.624205112457275, -6.526301383972168, -5.428397178649902, -4.330492973327637, -3.2325892448425293, -2.134685516357422, -1.0367813110351562, 0.06112265586853027, 1.1590266227722168, 2.2569305896759033, 3.35483455657959, 4.4527387619018555, 5.550642490386963, 6.64854621887207, 7.746450424194336, 8.844354629516602, 9.942258834838867, 11.040162086486816, 12.138066291809082, 13.235970497131348, 14.333873748779297, 15.431777954101562, 16.529682159423828, 17.627586364746094, 18.72549057006836, 19.823394775390625, 20.92129898071289, 22.019203186035156, 23.11710548400879, 24.215009689331055, 25.31291389465332, 26.410818099975586, 27.50872230529785, 28.606626510620117, 29.70452880859375, 30.802433013916016, 31.90033721923828, 32.99824142456055, 34.09614562988281]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 5.0, 9.0, 5.0, 9.0, 14.0, 15.0, 13.0, 13.0, 19.0, 24.0, 17.0, 29.0, 32.0, 32.0, 36.0, 46.0, 30.0, 39.0, 45.0, 49.0, 35.0, 34.0, 36.0, 39.0, 45.0, 46.0, 35.0, 36.0, 30.0, 32.0, 20.0, 19.0, 16.0, 25.0, 12.0, 12.0, 8.0, 12.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.199748992919922, -22.46312141418457, -21.72649383544922, -20.989866256713867, -20.253238677978516, -19.51660919189453, -18.779983520507812, -18.043354034423828, -17.306726455688477, -16.570098876953125, -15.833471298217773, -15.096843719482422, -14.360215187072754, -13.623587608337402, -12.88696002960205, -12.150331497192383, -11.413704872131348, -10.677077293395996, -9.940449714660645, -9.203821182250977, -8.467193603515625, -7.730566024780273, -6.993938446044922, -6.257310390472412, -5.5206828117370605, -4.784055233001709, -4.047427177429199, -3.3107995986938477, -2.574171781539917, -1.8375439643859863, -1.1009163856506348, -0.364288330078125, 0.37233924865722656, 1.1089670658111572, 1.8455947637557983, 2.5822224617004395, 3.31885027885437, 4.055478096008301, 4.792105674743652, 5.528733730316162, 6.265361309051514, 7.001988887786865, 7.738616943359375, 8.475244522094727, 9.211872100830078, 9.94849967956543, 10.685127258300781, 11.42175579071045, 12.1583833694458, 12.895010948181152, 13.631638526916504, 14.368267059326172, 15.104894638061523, 15.841522216796875, 16.578149795532227, 17.314777374267578, 18.05140495300293, 18.78803253173828, 19.524660110473633, 20.261287689208984, 20.997915267944336, 21.734542846679688, 22.471172332763672, 23.207799911499023, 23.944427490234375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 4.0, 18.0, 21.0, 17.0, 22.0, 8.0, 24.0, 26.0, 18.0, 40.0, 31.0, 37.0, 45.0, 35.0, 31.0, 39.0, 45.0, 47.0, 44.0, 38.0, 31.0, 37.0, 31.0, 35.0, 31.0, 35.0, 34.0, 24.0, 23.0, 17.0, 6.0, 20.0, 19.0, 7.0, 10.0, 6.0, 6.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.759765625, -2.6722412109375, -2.584716796875, -2.4971923828125, -2.40966796875, -2.3221435546875, -2.234619140625, -2.1470947265625, -2.0595703125, -1.9720458984375, -1.884521484375, -1.7969970703125, -1.70947265625, -1.6219482421875, -1.534423828125, -1.4468994140625, -1.359375, -1.2718505859375, -1.184326171875, -1.0968017578125, -1.00927734375, -0.9217529296875, -0.834228515625, -0.7467041015625, -0.6591796875, -0.5716552734375, -0.484130859375, -0.3966064453125, -0.30908203125, -0.2215576171875, -0.134033203125, -0.0465087890625, 0.041015625, 0.1285400390625, 0.216064453125, 0.3035888671875, 0.39111328125, 0.4786376953125, 0.566162109375, 0.6536865234375, 0.7412109375, 0.8287353515625, 0.916259765625, 1.0037841796875, 1.09130859375, 1.1788330078125, 1.266357421875, 1.3538818359375, 1.44140625, 1.5289306640625, 1.616455078125, 1.7039794921875, 1.79150390625, 1.8790283203125, 1.966552734375, 2.0540771484375, 2.1416015625, 2.2291259765625, 2.316650390625, 2.4041748046875, 2.49169921875, 2.5792236328125, 2.666748046875, 2.7542724609375, 2.841796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 14.0, 25.0, 42.0, 55.0, 64.0, 94.0, 161.0, 211.0, 360.0, 536.0, 762.0, 1132.0, 1628.0, 2493.0, 3842.0, 5676.0, 8308.0, 12487.0, 18469.0, 28278.0, 42593.0, 65348.0, 101909.0, 158050.0, 200871.0, 137036.0, 88221.0, 57354.0, 37451.0, 24932.0, 16577.0, 10961.0, 7540.0, 4912.0, 3335.0, 2250.0, 1540.0, 978.0, 664.0, 502.0, 301.0, 189.0, 147.0, 95.0, 63.0, 36.0, 29.0, 20.0, 6.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2744140625, -0.26593017578125, -0.2574462890625, -0.24896240234375, -0.240478515625, -0.23199462890625, -0.2235107421875, -0.21502685546875, -0.20654296875, -0.19805908203125, -0.1895751953125, -0.18109130859375, -0.172607421875, -0.16412353515625, -0.1556396484375, -0.14715576171875, -0.138671875, -0.13018798828125, -0.1217041015625, -0.11322021484375, -0.104736328125, -0.09625244140625, -0.0877685546875, -0.07928466796875, -0.07080078125, -0.06231689453125, -0.0538330078125, -0.04534912109375, -0.036865234375, -0.02838134765625, -0.0198974609375, -0.01141357421875, -0.0029296875, 0.00555419921875, 0.0140380859375, 0.02252197265625, 0.031005859375, 0.03948974609375, 0.0479736328125, 0.05645751953125, 0.06494140625, 0.07342529296875, 0.0819091796875, 0.09039306640625, 0.098876953125, 0.10736083984375, 0.1158447265625, 0.12432861328125, 0.1328125, 0.14129638671875, 0.1497802734375, 0.15826416015625, 0.166748046875, 0.17523193359375, 0.1837158203125, 0.19219970703125, 0.20068359375, 0.20916748046875, 0.2176513671875, 0.22613525390625, 0.234619140625, 0.24310302734375, 0.2515869140625, 0.26007080078125, 0.2685546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 2.0, 5.0, 9.0, 13.0, 12.0, 19.0, 22.0, 17.0, 25.0, 18.0, 28.0, 20.0, 29.0, 41.0, 31.0, 37.0, 53.0, 36.0, 50.0, 1070.0, 50.0, 59.0, 40.0, 39.0, 38.0, 26.0, 28.0, 38.0, 22.0, 27.0, 24.0, 18.0, 16.0, 14.0, 8.0, 4.0, 4.0, 8.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6376953125, -1.5794830322265625, -1.521270751953125, -1.4630584716796875, -1.40484619140625, -1.3466339111328125, -1.288421630859375, -1.2302093505859375, -1.1719970703125, -1.1137847900390625, -1.055572509765625, -0.9973602294921875, -0.93914794921875, -0.8809356689453125, -0.822723388671875, -0.7645111083984375, -0.706298828125, -0.6480865478515625, -0.589874267578125, -0.5316619873046875, -0.47344970703125, -0.4152374267578125, -0.357025146484375, -0.2988128662109375, -0.2406005859375, -0.1823883056640625, -0.124176025390625, -0.0659637451171875, -0.00775146484375, 0.0504608154296875, 0.108673095703125, 0.1668853759765625, 0.22509765625, 0.2833099365234375, 0.341522216796875, 0.3997344970703125, 0.45794677734375, 0.5161590576171875, 0.574371337890625, 0.6325836181640625, 0.6907958984375, 0.7490081787109375, 0.807220458984375, 0.8654327392578125, 0.92364501953125, 0.9818572998046875, 1.040069580078125, 1.0982818603515625, 1.156494140625, 1.2147064208984375, 1.272918701171875, 1.3311309814453125, 1.38934326171875, 1.4475555419921875, 1.505767822265625, 1.5639801025390625, 1.6221923828125, 1.6804046630859375, 1.738616943359375, 1.7968292236328125, 1.85504150390625, 1.9132537841796875, 1.971466064453125, 2.0296783447265625, 2.087890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 4.0, 9.0, 15.0, 32.0, 28.0, 58.0, 90.0, 126.0, 200.0, 338.0, 544.0, 830.0, 1318.0, 2147.0, 3442.0, 5612.0, 9343.0, 15765.0, 27172.0, 47255.0, 84393.0, 153472.0, 1302443.0, 194743.0, 106454.0, 59080.0, 33362.0, 19325.0, 11520.0, 6863.0, 4114.0, 2619.0, 1636.0, 1056.0, 651.0, 360.0, 249.0, 158.0, 98.0, 83.0, 45.0, 23.0, 18.0, 14.0, 5.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.328125, -0.3180885314941406, -0.30805206298828125, -0.2980155944824219, -0.2879791259765625, -0.2779426574707031, -0.26790618896484375, -0.2578697204589844, -0.247833251953125, -0.23779678344726562, -0.22776031494140625, -0.21772384643554688, -0.2076873779296875, -0.19765090942382812, -0.18761444091796875, -0.17757797241210938, -0.16754150390625, -0.15750503540039062, -0.14746856689453125, -0.13743209838867188, -0.1273956298828125, -0.11735916137695312, -0.10732269287109375, -0.09728622436523438, -0.087249755859375, -0.07721328735351562, -0.06717681884765625, -0.057140350341796875, -0.0471038818359375, -0.037067413330078125, -0.02703094482421875, -0.016994476318359375, -0.0069580078125, 0.003078460693359375, 0.01311492919921875, 0.023151397705078125, 0.0331878662109375, 0.043224334716796875, 0.05326080322265625, 0.06329727172851562, 0.073333740234375, 0.08337020874023438, 0.09340667724609375, 0.10344314575195312, 0.1134796142578125, 0.12351608276367188, 0.13355255126953125, 0.14358901977539062, 0.15362548828125, 0.16366195678710938, 0.17369842529296875, 0.18373489379882812, 0.1937713623046875, 0.20380783081054688, 0.21384429931640625, 0.22388076782226562, 0.233917236328125, 0.24395370483398438, 0.25399017333984375, 0.2640266418457031, 0.2740631103515625, 0.2840995788574219, 0.29413604736328125, 0.3041725158691406, 0.314208984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 13.0, 22.0, 17.0, 43.0, 65.0, 66.0, 86.0, 111.0, 105.0, 128.0, 83.0, 54.0, 34.0, 30.0, 15.0, 18.0, 18.0, 10.0, 7.0, 8.0, 4.0, 3.0, 8.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015316009521484375, -0.0014852136373519897, -0.001438826322555542, -0.0013924390077590942, -0.0013460516929626465, -0.0012996643781661987, -0.001253277063369751, -0.0012068897485733032, -0.0011605024337768555, -0.0011141151189804077, -0.00106772780418396, -0.0010213404893875122, -0.0009749531745910645, -0.0009285658597946167, -0.0008821785449981689, -0.0008357912302017212, -0.0007894039154052734, -0.0007430166006088257, -0.0006966292858123779, -0.0006502419710159302, -0.0006038546562194824, -0.0005574673414230347, -0.0005110800266265869, -0.00046469271183013916, -0.0004183053970336914, -0.00037191808223724365, -0.0003255307674407959, -0.00027914345264434814, -0.0002327561378479004, -0.00018636882305145264, -0.00013998150825500488, -9.359419345855713e-05, -4.7206878662109375e-05, -8.195638656616211e-07, 4.556775093078613e-05, 9.195506572723389e-05, 0.00013834238052368164, 0.0001847296953201294, 0.00023111701011657715, 0.0002775043249130249, 0.00032389163970947266, 0.0003702789545059204, 0.00041666626930236816, 0.0004630535840988159, 0.0005094408988952637, 0.0005558282136917114, 0.0006022155284881592, 0.0006486028432846069, 0.0006949901580810547, 0.0007413774728775024, 0.0007877647876739502, 0.000834152102470398, 0.0008805394172668457, 0.0009269267320632935, 0.0009733140468597412, 0.001019701361656189, 0.0010660886764526367, 0.0011124759912490845, 0.0011588633060455322, 0.00120525062084198, 0.0012516379356384277, 0.0012980252504348755, 0.0013444125652313232, 0.001390799880027771, 0.0014371871948242188]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 8.0, 9.0, 11.0, 20.0, 23.0, 41.0, 55.0, 96.0, 179.0, 320.0, 838.0, 25475.0, 1011154.0, 8927.0, 642.0, 292.0, 178.0, 77.0, 71.0, 36.0, 21.0, 14.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0287017822265625, -0.027757883071899414, -0.026813983917236328, -0.025870084762573242, -0.024926185607910156, -0.02398228645324707, -0.023038387298583984, -0.0220944881439209, -0.021150588989257812, -0.020206689834594727, -0.01926279067993164, -0.018318891525268555, -0.01737499237060547, -0.016431093215942383, -0.015487194061279297, -0.014543294906616211, -0.013599395751953125, -0.012655496597290039, -0.011711597442626953, -0.010767698287963867, -0.009823799133300781, -0.008879899978637695, -0.00793600082397461, -0.0069921016693115234, -0.0060482025146484375, -0.0051043033599853516, -0.004160404205322266, -0.0032165050506591797, -0.0022726058959960938, -0.0013287067413330078, -0.0003848075866699219, 0.0005590915679931641, 0.00150299072265625, 0.002446889877319336, 0.003390789031982422, 0.004334688186645508, 0.005278587341308594, 0.00622248649597168, 0.007166385650634766, 0.008110284805297852, 0.009054183959960938, 0.009998083114624023, 0.01094198226928711, 0.011885881423950195, 0.012829780578613281, 0.013773679733276367, 0.014717578887939453, 0.01566147804260254, 0.016605377197265625, 0.01754927635192871, 0.018493175506591797, 0.019437074661254883, 0.02038097381591797, 0.021324872970581055, 0.02226877212524414, 0.023212671279907227, 0.024156570434570312, 0.0251004695892334, 0.026044368743896484, 0.02698826789855957, 0.027932167053222656, 0.028876066207885742, 0.029819965362548828, 0.030763864517211914, 0.031707763671875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 20.0, 56.0, 96.0, 179.0, 223.0, 210.0, 114.0, 78.0, 21.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012218608753755689, -0.0011628605425357819, -0.0011038602096959949, -0.0010448598768562078, -0.000985859427601099, -0.0009268591529689729, -0.000867858761921525, -0.000808858429081738, -0.000749858096241951, -0.000690857763402164, -0.000631857430562377, -0.0005728570395149291, -0.000513856706675142, -0.00045485637383535504, -0.0003958560118917376, -0.0003368556499481201, -0.0002778553171083331, -0.00021885496971663088, -0.00015985462232492864, -0.0001008542749332264, -4.185392754152417e-05, 1.7146405298262835e-05, 7.61467672418803e-05, 0.00013514712918549776, 0.00019414746202528477, 0.0002531477948650718, 0.00031214815680868924, 0.0003711485187523067, 0.0004301488515920937, 0.0004891491844318807, 0.0005481495754793286, 0.0006071499083191156, 0.0006661501247435808, 0.0007251504575833678, 0.0007841507904231548, 0.0008431511814706028, 0.0009021515143103898, 0.0009611518471501768, 0.0010201522381976247, 0.0010791525710374117, 0.0011381529038771987, 0.0011971532367169857, 0.0012561535695567727, 0.0013151539023965597, 0.0013741543516516685, 0.0014331545680761337, 0.0014921550173312426, 0.0015511553501710296, 0.0016101556830108166, 0.0016691560158506036, 0.0017281563486903906, 0.0017871566815301776, 0.0018461570143699646, 0.0019051574636250734, 0.0019641576800495386, 0.0020231581293046474, 0.0020821583457291126, 0.0021411587949842215, 0.0022001590114086866, 0.0022591594606637955, 0.0023181596770882607, 0.0023771601263433695, 0.0024361603427678347, 0.0024951607920229435, 0.0025541612412780523]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 3.0, 5.0, 8.0, 9.0, 8.0, 13.0, 16.0, 20.0, 19.0, 23.0, 20.0, 29.0, 28.0, 32.0, 24.0, 30.0, 29.0, 36.0, 37.0, 48.0, 41.0, 37.0, 32.0, 40.0, 26.0, 31.0, 43.0, 26.0, 30.0, 29.0, 20.0, 30.0, 26.0, 33.0, 22.0, 18.0, 14.0, 11.0, 15.0, 10.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.0005614757537841797, -0.0005443431437015533, -0.000527210533618927, -0.0005100779235363007, -0.0004929453134536743, -0.000475812703371048, -0.00045868009328842163, -0.0004415474832057953, -0.00042441487312316895, -0.0004072822630405426, -0.00039014965295791626, -0.0003730170428752899, -0.0003558844327926636, -0.00033875182271003723, -0.0003216192126274109, -0.00030448660254478455, -0.0002873539924621582, -0.00027022138237953186, -0.0002530887722969055, -0.00023595616221427917, -0.00021882355213165283, -0.0002016909420490265, -0.00018455833196640015, -0.0001674257218837738, -0.00015029311180114746, -0.00013316050171852112, -0.00011602789163589478, -9.889528155326843e-05, -8.176267147064209e-05, -6.463006138801575e-05, -4.7497451305389404e-05, -3.036484122276306e-05, -1.3232231140136719e-05, 3.900378942489624e-06, 2.1032989025115967e-05, 3.816559910774231e-05, 5.529820919036865e-05, 7.2430819272995e-05, 8.956342935562134e-05, 0.00010669603943824768, 0.00012382864952087402, 0.00014096125960350037, 0.0001580938696861267, 0.00017522647976875305, 0.0001923590898513794, 0.00020949169993400574, 0.00022662431001663208, 0.00024375692009925842, 0.00026088953018188477, 0.0002780221402645111, 0.00029515475034713745, 0.0003122873604297638, 0.00032941997051239014, 0.0003465525805950165, 0.0003636851906776428, 0.00038081780076026917, 0.0003979504108428955, 0.00041508302092552185, 0.0004322156310081482, 0.00044934824109077454, 0.0004664808511734009, 0.0004836134612560272, 0.0005007460713386536, 0.0005178786814212799, 0.0005350112915039062]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 4.0, 18.0, 21.0, 17.0, 22.0, 8.0, 24.0, 26.0, 18.0, 40.0, 31.0, 37.0, 45.0, 35.0, 31.0, 39.0, 45.0, 47.0, 44.0, 38.0, 31.0, 37.0, 31.0, 35.0, 31.0, 35.0, 34.0, 24.0, 23.0, 17.0, 6.0, 20.0, 19.0, 7.0, 10.0, 6.0, 6.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.759765625, -2.6722412109375, -2.584716796875, -2.4971923828125, -2.40966796875, -2.3221435546875, -2.234619140625, -2.1470947265625, -2.0595703125, -1.9720458984375, -1.884521484375, -1.7969970703125, -1.70947265625, -1.6219482421875, -1.534423828125, -1.4468994140625, -1.359375, -1.2718505859375, -1.184326171875, -1.0968017578125, -1.00927734375, -0.9217529296875, -0.834228515625, -0.7467041015625, -0.6591796875, -0.5716552734375, -0.484130859375, -0.3966064453125, -0.30908203125, -0.2215576171875, -0.134033203125, -0.0465087890625, 0.041015625, 0.1285400390625, 0.216064453125, 0.3035888671875, 0.39111328125, 0.4786376953125, 0.566162109375, 0.6536865234375, 0.7412109375, 0.8287353515625, 0.916259765625, 1.0037841796875, 1.09130859375, 1.1788330078125, 1.266357421875, 1.3538818359375, 1.44140625, 1.5289306640625, 1.616455078125, 1.7039794921875, 1.79150390625, 1.8790283203125, 1.966552734375, 2.0540771484375, 2.1416015625, 2.2291259765625, 2.316650390625, 2.4041748046875, 2.49169921875, 2.5792236328125, 2.666748046875, 2.7542724609375, 2.841796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 7.0, 7.0, 12.0, 20.0, 25.0, 31.0, 38.0, 85.0, 111.0, 181.0, 313.0, 501.0, 837.0, 1418.0, 2685.0, 4725.0, 8933.0, 17367.0, 36787.0, 93347.0, 255958.0, 363396.0, 153698.0, 57029.0, 24403.0, 12152.0, 6353.0, 3387.0, 1931.0, 1077.0, 648.0, 385.0, 261.0, 158.0, 90.0, 51.0, 25.0, 37.0, 21.0, 15.0, 14.0, 10.0, 6.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.85546875, -2.76104736328125, -2.6666259765625, -2.57220458984375, -2.477783203125, -2.38336181640625, -2.2889404296875, -2.19451904296875, -2.10009765625, -2.00567626953125, -1.9112548828125, -1.81683349609375, -1.722412109375, -1.62799072265625, -1.5335693359375, -1.43914794921875, -1.3447265625, -1.25030517578125, -1.1558837890625, -1.06146240234375, -0.967041015625, -0.87261962890625, -0.7781982421875, -0.68377685546875, -0.58935546875, -0.49493408203125, -0.4005126953125, -0.30609130859375, -0.211669921875, -0.11724853515625, -0.0228271484375, 0.07159423828125, 0.166015625, 0.26043701171875, 0.3548583984375, 0.44927978515625, 0.543701171875, 0.63812255859375, 0.7325439453125, 0.82696533203125, 0.92138671875, 1.01580810546875, 1.1102294921875, 1.20465087890625, 1.299072265625, 1.39349365234375, 1.4879150390625, 1.58233642578125, 1.6767578125, 1.77117919921875, 1.8656005859375, 1.96002197265625, 2.054443359375, 2.14886474609375, 2.2432861328125, 2.33770751953125, 2.43212890625, 2.52655029296875, 2.6209716796875, 2.71539306640625, 2.809814453125, 2.90423583984375, 2.9986572265625, 3.09307861328125, 3.1875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 11.0, 15.0, 11.0, 28.0, 25.0, 22.0, 28.0, 31.0, 30.0, 55.0, 63.0, 75.0, 139.0, 316.0, 1496.0, 198.0, 88.0, 69.0, 53.0, 49.0, 39.0, 37.0, 34.0, 23.0, 28.0, 20.0, 8.0, 13.0, 10.0, 4.0, 7.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.9322509765625, -10.544189453125, -10.1561279296875, -9.76806640625, -9.3800048828125, -8.991943359375, -8.6038818359375, -8.2158203125, -7.8277587890625, -7.439697265625, -7.0516357421875, -6.66357421875, -6.2755126953125, -5.887451171875, -5.4993896484375, -5.111328125, -4.7232666015625, -4.335205078125, -3.9471435546875, -3.55908203125, -3.1710205078125, -2.782958984375, -2.3948974609375, -2.0068359375, -1.6187744140625, -1.230712890625, -0.8426513671875, -0.45458984375, -0.0665283203125, 0.321533203125, 0.7095947265625, 1.09765625, 1.4857177734375, 1.873779296875, 2.2618408203125, 2.64990234375, 3.0379638671875, 3.426025390625, 3.8140869140625, 4.2021484375, 4.5902099609375, 4.978271484375, 5.3663330078125, 5.75439453125, 6.1424560546875, 6.530517578125, 6.9185791015625, 7.306640625, 7.6947021484375, 8.082763671875, 8.4708251953125, 8.85888671875, 9.2469482421875, 9.635009765625, 10.0230712890625, 10.4111328125, 10.7991943359375, 11.187255859375, 11.5753173828125, 11.96337890625, 12.3514404296875, 12.739501953125, 13.1275634765625, 13.515625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 8.0, 12.0, 20.0, 35.0, 39.0, 59.0, 99.0, 159.0, 291.0, 683.0, 5708.0, 3100197.0, 36599.0, 974.0, 319.0, 184.0, 100.0, 67.0, 55.0, 27.0, 20.0, 16.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.30908203125, -42.9931640625, -41.67724609375, -40.361328125, -39.04541015625, -37.7294921875, -36.41357421875, -35.09765625, -33.78173828125, -32.4658203125, -31.14990234375, -29.833984375, -28.51806640625, -27.2021484375, -25.88623046875, -24.5703125, -23.25439453125, -21.9384765625, -20.62255859375, -19.306640625, -17.99072265625, -16.6748046875, -15.35888671875, -14.04296875, -12.72705078125, -11.4111328125, -10.09521484375, -8.779296875, -7.46337890625, -6.1474609375, -4.83154296875, -3.515625, -2.19970703125, -0.8837890625, 0.43212890625, 1.748046875, 3.06396484375, 4.3798828125, 5.69580078125, 7.01171875, 8.32763671875, 9.6435546875, 10.95947265625, 12.275390625, 13.59130859375, 14.9072265625, 16.22314453125, 17.5390625, 18.85498046875, 20.1708984375, 21.48681640625, 22.802734375, 24.11865234375, 25.4345703125, 26.75048828125, 28.06640625, 29.38232421875, 30.6982421875, 32.01416015625, 33.330078125, 34.64599609375, 35.9619140625, 37.27783203125, 38.59375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 828.0, 186.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.70010375976562, -72.34761047363281, -64.9951171875, -57.642616271972656, -50.290122985839844, -42.93762969970703, -35.58513259887695, -28.232635498046875, -20.880142211914062, -13.527647018432617, -6.175151824951172, 1.1773433685302734, 8.529838562011719, 15.882331848144531, 23.23482894897461, 30.587326049804688, 37.9398193359375, 45.29231262207031, 52.64480972290039, 59.99730682373047, 67.34980010986328, 74.7022933959961, 82.05479431152344, 89.40728759765625, 96.75978088378906, 104.11227416992188, 111.46476745605469, 118.81726837158203, 126.16976165771484, 133.52224731445312, 140.874755859375, 148.2272491455078, 155.57974243164062, 162.93223571777344, 170.28472900390625, 177.63722229003906, 184.98971557617188, 192.34222412109375, 199.69471740722656, 207.04721069335938, 214.3997039794922, 221.752197265625, 229.1046905517578, 236.45718383789062, 243.8096923828125, 251.16217041015625, 258.5146789550781, 265.8671875, 273.21966552734375, 280.5721740722656, 287.9246520996094, 295.27716064453125, 302.629638671875, 309.9821472167969, 317.3346252441406, 324.6871337890625, 332.03961181640625, 339.3921203613281, 346.7445983886719, 354.09710693359375, 361.4495849609375, 368.8020935058594, 376.1545715332031, 383.507080078125, 390.8595886230469]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 12.0, 9.0, 19.0, 20.0, 21.0, 15.0, 28.0, 30.0, 22.0, 31.0, 34.0, 41.0, 44.0, 39.0, 50.0, 56.0, 43.0, 37.0, 43.0, 38.0, 35.0, 48.0, 52.0, 33.0, 34.0, 22.0, 20.0, 21.0, 14.0, 17.0, 11.0, 10.0, 6.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.21792984008789, -20.378402709960938, -19.538875579833984, -18.6993465423584, -17.859819412231445, -17.020292282104492, -16.18076515197754, -15.34123706817627, -14.501708984375, -13.662181854248047, -12.822653770446777, -11.983126640319824, -11.143598556518555, -10.304071426391602, -9.464544296264648, -8.625016212463379, -7.785489082336426, -6.9459614753723145, -6.106433868408203, -5.26690673828125, -4.4273786544799805, -3.5878515243530273, -2.748323917388916, -1.9087963104248047, -1.0692687034606934, -0.2297411561012268, 0.6097863912582397, 1.4493138790130615, 2.288841485977173, 3.128368854522705, 3.9678964614868164, 4.807424068450928, 5.646951675415039, 6.48647928237915, 7.326006889343262, 8.165534019470215, 9.005062103271484, 9.844589233398438, 10.68411636352539, 11.52364444732666, 12.36317253112793, 13.202699661254883, 14.042227745056152, 14.881754875183105, 15.721282958984375, 16.560810089111328, 17.40033721923828, 18.239864349365234, 19.079391479492188, 19.91891860961914, 20.758445739746094, 21.59797477722168, 22.437501907348633, 23.277029037475586, 24.11655616760254, 24.956085205078125, 25.795612335205078, 26.63513946533203, 27.474666595458984, 28.31419563293457, 29.153722763061523, 29.993249893188477, 30.83277702331543, 31.672306060791016, 32.51183319091797]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 14.0, 14.0, 15.0, 22.0, 19.0, 16.0, 21.0, 26.0, 32.0, 35.0, 35.0, 48.0, 47.0, 37.0, 42.0, 42.0, 41.0, 34.0, 36.0, 33.0, 42.0, 37.0, 50.0, 28.0, 37.0, 23.0, 22.0, 23.0, 22.0, 12.0, 15.0, 7.0, 11.0, 6.0, 9.0, 10.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.873382568359375, -2.77606201171875, -2.678741455078125, -2.5814208984375, -2.484100341796875, -2.38677978515625, -2.289459228515625, -2.192138671875, -2.094818115234375, -1.99749755859375, -1.900177001953125, -1.8028564453125, -1.705535888671875, -1.60821533203125, -1.510894775390625, -1.41357421875, -1.316253662109375, -1.21893310546875, -1.121612548828125, -1.0242919921875, -0.926971435546875, -0.82965087890625, -0.732330322265625, -0.635009765625, -0.537689208984375, -0.44036865234375, -0.343048095703125, -0.2457275390625, -0.148406982421875, -0.05108642578125, 0.046234130859375, 0.1435546875, 0.240875244140625, 0.33819580078125, 0.435516357421875, 0.5328369140625, 0.630157470703125, 0.72747802734375, 0.824798583984375, 0.922119140625, 1.019439697265625, 1.11676025390625, 1.214080810546875, 1.3114013671875, 1.408721923828125, 1.50604248046875, 1.603363037109375, 1.70068359375, 1.798004150390625, 1.89532470703125, 1.992645263671875, 2.0899658203125, 2.187286376953125, 2.28460693359375, 2.381927490234375, 2.479248046875, 2.576568603515625, 2.67388916015625, 2.771209716796875, 2.8685302734375, 2.965850830078125, 3.06317138671875, 3.160491943359375, 3.2578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 15.0, 14.0, 24.0, 15.0, 27.0, 24.0, 42.0, 60.0, 55.0, 63.0, 72.0, 139.0, 191.0, 418.0, 2102.0, 54884.0, 3045269.0, 1075210.0, 13560.0, 1076.0, 330.0, 155.0, 116.0, 82.0, 70.0, 50.0, 43.0, 27.0, 36.0, 16.0, 20.0, 10.0, 10.0, 12.0, 8.0, 7.0, 5.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.802734375, -13.33984375, -12.876953125, -12.4140625, -11.951171875, -11.48828125, -11.025390625, -10.5625, -10.099609375, -9.63671875, -9.173828125, -8.7109375, -8.248046875, -7.78515625, -7.322265625, -6.859375, -6.396484375, -5.93359375, -5.470703125, -5.0078125, -4.544921875, -4.08203125, -3.619140625, -3.15625, -2.693359375, -2.23046875, -1.767578125, -1.3046875, -0.841796875, -0.37890625, 0.083984375, 0.546875, 1.009765625, 1.47265625, 1.935546875, 2.3984375, 2.861328125, 3.32421875, 3.787109375, 4.25, 4.712890625, 5.17578125, 5.638671875, 6.1015625, 6.564453125, 7.02734375, 7.490234375, 7.953125, 8.416015625, 8.87890625, 9.341796875, 9.8046875, 10.267578125, 10.73046875, 11.193359375, 11.65625, 12.119140625, 12.58203125, 13.044921875, 13.5078125, 13.970703125, 14.43359375, 14.896484375, 15.359375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 10.0, 15.0, 27.0, 28.0, 59.0, 93.0, 148.0, 220.0, 338.0, 555.0, 602.0, 604.0, 482.0, 308.0, 197.0, 129.0, 103.0, 48.0, 31.0, 23.0, 14.0, 9.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.25, -13.9173583984375, -13.584716796875, -13.2520751953125, -12.91943359375, -12.5867919921875, -12.254150390625, -11.9215087890625, -11.5888671875, -11.2562255859375, -10.923583984375, -10.5909423828125, -10.25830078125, -9.9256591796875, -9.593017578125, -9.2603759765625, -8.927734375, -8.5950927734375, -8.262451171875, -7.9298095703125, -7.59716796875, -7.2645263671875, -6.931884765625, -6.5992431640625, -6.2666015625, -5.9339599609375, -5.601318359375, -5.2686767578125, -4.93603515625, -4.6033935546875, -4.270751953125, -3.9381103515625, -3.60546875, -3.2728271484375, -2.940185546875, -2.6075439453125, -2.27490234375, -1.9422607421875, -1.609619140625, -1.2769775390625, -0.9443359375, -0.6116943359375, -0.279052734375, 0.0535888671875, 0.38623046875, 0.7188720703125, 1.051513671875, 1.3841552734375, 1.716796875, 2.0494384765625, 2.382080078125, 2.7147216796875, 3.04736328125, 3.3800048828125, 3.712646484375, 4.0452880859375, 4.3779296875, 4.7105712890625, 5.043212890625, 5.3758544921875, 5.70849609375, 6.0411376953125, 6.373779296875, 6.7064208984375, 7.0390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 11.0, 7.0, 27.0, 37.0, 64.0, 116.0, 171.0, 310.0, 494.0, 1632.0, 34258.0, 3882113.0, 270273.0, 3327.0, 640.0, 307.0, 194.0, 114.0, 59.0, 53.0, 26.0, 18.0, 8.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.35986328125, -18.3759765625, -17.39208984375, -16.408203125, -15.42431640625, -14.4404296875, -13.45654296875, -12.47265625, -11.48876953125, -10.5048828125, -9.52099609375, -8.537109375, -7.55322265625, -6.5693359375, -5.58544921875, -4.6015625, -3.61767578125, -2.6337890625, -1.64990234375, -0.666015625, 0.31787109375, 1.3017578125, 2.28564453125, 3.26953125, 4.25341796875, 5.2373046875, 6.22119140625, 7.205078125, 8.18896484375, 9.1728515625, 10.15673828125, 11.140625, 12.12451171875, 13.1083984375, 14.09228515625, 15.076171875, 16.06005859375, 17.0439453125, 18.02783203125, 19.01171875, 19.99560546875, 20.9794921875, 21.96337890625, 22.947265625, 23.93115234375, 24.9150390625, 25.89892578125, 26.8828125, 27.86669921875, 28.8505859375, 29.83447265625, 30.818359375, 31.80224609375, 32.7861328125, 33.77001953125, 34.75390625, 35.73779296875, 36.7216796875, 37.70556640625, 38.689453125, 39.67333984375, 40.6572265625, 41.64111328125, 42.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 12.0, 30.0, 41.0, 78.0, 93.0, 149.0, 137.0, 161.0, 120.0, 83.0, 45.0, 24.0, 17.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21330642700195, -41.70648956298828, -40.199668884277344, -38.69285202026367, -37.186031341552734, -35.67921447753906, -34.172393798828125, -32.66557693481445, -31.15875816345215, -29.651939392089844, -28.14512062072754, -26.638301849365234, -25.131484985351562, -23.624664306640625, -22.117847442626953, -20.61102867126465, -19.104209899902344, -17.59739112854004, -16.090572357177734, -14.583754539489746, -13.076935768127441, -11.570116996765137, -10.063299179077148, -8.556480407714844, -7.049661636352539, -5.542842864990234, -4.036024570465088, -2.5292062759399414, -1.0223875045776367, 0.48443126678466797, 1.9912490844726562, 3.498067855834961, 5.004886627197266, 6.51170539855957, 8.018524169921875, 9.525341987609863, 11.032160758972168, 12.538979530334473, 14.045797348022461, 15.552616119384766, 17.05943489074707, 18.566253662109375, 20.07307243347168, 21.579891204833984, 23.086708068847656, 24.593528747558594, 26.100345611572266, 27.60716438293457, 29.113983154296875, 30.62080192565918, 32.127620697021484, 33.634437561035156, 35.141258239746094, 36.648075103759766, 38.15489196777344, 39.661712646484375, 41.16853332519531, 42.675350189208984, 44.18217086791992, 45.688987731933594, 47.19580841064453, 48.7026252746582, 50.209442138671875, 51.71626281738281, 53.223079681396484]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 18.0, 10.0, 11.0, 18.0, 23.0, 24.0, 27.0, 30.0, 27.0, 29.0, 24.0, 31.0, 35.0, 39.0, 40.0, 52.0, 30.0, 40.0, 45.0, 31.0, 39.0, 44.0, 33.0, 20.0, 30.0, 29.0, 28.0, 20.0, 23.0, 17.0, 15.0, 13.0, 16.0, 9.0, 13.0, 8.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-22.744861602783203, -22.04392433166504, -21.342987060546875, -20.642047882080078, -19.941110610961914, -19.24017333984375, -18.539236068725586, -17.838298797607422, -17.137361526489258, -16.436424255371094, -15.735486030578613, -15.03454875946045, -14.333611488342285, -13.632673263549805, -12.93173599243164, -12.230798721313477, -11.529860496520996, -10.828923225402832, -10.127985000610352, -9.427047729492188, -8.726110458374023, -8.02517318725586, -7.324234962463379, -6.623297691345215, -5.922359943389893, -5.22142219543457, -4.520484924316406, -3.819547176361084, -3.118609666824341, -2.4176721572875977, -1.7167344093322754, -1.0157971382141113, -0.31485939025878906, 0.3860781788825989, 1.0870157480239868, 1.7879533767700195, 2.4888908863067627, 3.189828395843506, 3.890766143798828, 4.591703414916992, 5.2926411628723145, 5.993578910827637, 6.694516181945801, 7.395453929901123, 8.096391677856445, 8.79732894897461, 9.498266220092773, 10.199203491210938, 10.900141716003418, 11.601078987121582, 12.302017211914062, 13.002954483032227, 13.70389175415039, 14.404829025268555, 15.105767250061035, 15.8067045211792, 16.50764274597168, 17.208580017089844, 17.909517288208008, 18.610454559326172, 19.31139373779297, 20.012331008911133, 20.713268280029297, 21.41420555114746, 22.115142822265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 16.0, 15.0, 14.0, 22.0, 23.0, 23.0, 20.0, 40.0, 31.0, 36.0, 39.0, 41.0, 38.0, 48.0, 42.0, 45.0, 43.0, 36.0, 39.0, 39.0, 29.0, 35.0, 40.0, 37.0, 30.0, 27.0, 20.0, 17.0, 19.0, 15.0, 10.0, 6.0, 3.0, 8.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.193359375, -3.095428466796875, -2.99749755859375, -2.899566650390625, -2.8016357421875, -2.703704833984375, -2.60577392578125, -2.507843017578125, -2.409912109375, -2.311981201171875, -2.21405029296875, -2.116119384765625, -2.0181884765625, -1.920257568359375, -1.82232666015625, -1.724395751953125, -1.62646484375, -1.528533935546875, -1.43060302734375, -1.332672119140625, -1.2347412109375, -1.136810302734375, -1.03887939453125, -0.940948486328125, -0.843017578125, -0.745086669921875, -0.64715576171875, -0.549224853515625, -0.4512939453125, -0.353363037109375, -0.25543212890625, -0.157501220703125, -0.0595703125, 0.038360595703125, 0.13629150390625, 0.234222412109375, 0.3321533203125, 0.430084228515625, 0.52801513671875, 0.625946044921875, 0.723876953125, 0.821807861328125, 0.91973876953125, 1.017669677734375, 1.1156005859375, 1.213531494140625, 1.31146240234375, 1.409393310546875, 1.50732421875, 1.605255126953125, 1.70318603515625, 1.801116943359375, 1.8990478515625, 1.996978759765625, 2.09490966796875, 2.192840576171875, 2.290771484375, 2.388702392578125, 2.48663330078125, 2.584564208984375, 2.6824951171875, 2.780426025390625, 2.87835693359375, 2.976287841796875, 3.07421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 27.0, 28.0, 50.0, 88.0, 120.0, 182.0, 265.0, 418.0, 631.0, 945.0, 1400.0, 2281.0, 3449.0, 5453.0, 8270.0, 12967.0, 20200.0, 31576.0, 50334.0, 81974.0, 133696.0, 205039.0, 183302.0, 114683.0, 70591.0, 43655.0, 27533.0, 17537.0, 11112.0, 7283.0, 4693.0, 3076.0, 2012.0, 1256.0, 821.0, 572.0, 359.0, 232.0, 151.0, 111.0, 60.0, 43.0, 25.0, 19.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.3184318542480469, -0.30776214599609375, -0.2970924377441406, -0.2864227294921875, -0.2757530212402344, -0.26508331298828125, -0.2544136047363281, -0.243743896484375, -0.23307418823242188, -0.22240447998046875, -0.21173477172851562, -0.2010650634765625, -0.19039535522460938, -0.17972564697265625, -0.16905593872070312, -0.15838623046875, -0.14771652221679688, -0.13704681396484375, -0.12637710571289062, -0.1157073974609375, -0.10503768920898438, -0.09436798095703125, -0.08369827270507812, -0.073028564453125, -0.062358856201171875, -0.05168914794921875, -0.041019439697265625, -0.0303497314453125, -0.019680023193359375, -0.00901031494140625, 0.001659393310546875, 0.0123291015625, 0.022998809814453125, 0.03366851806640625, 0.044338226318359375, 0.0550079345703125, 0.06567764282226562, 0.07634735107421875, 0.08701705932617188, 0.097686767578125, 0.10835647583007812, 0.11902618408203125, 0.12969589233398438, 0.1403656005859375, 0.15103530883789062, 0.16170501708984375, 0.17237472534179688, 0.18304443359375, 0.19371414184570312, 0.20438385009765625, 0.21505355834960938, 0.2257232666015625, 0.23639297485351562, 0.24706268310546875, 0.2577323913574219, 0.268402099609375, 0.2790718078613281, 0.28974151611328125, 0.3004112243652344, 0.3110809326171875, 0.3217506408691406, 0.33242034912109375, 0.3430900573730469, 0.353759765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 7.0, 8.0, 13.0, 5.0, 15.0, 15.0, 13.0, 23.0, 25.0, 19.0, 21.0, 33.0, 33.0, 43.0, 35.0, 44.0, 43.0, 43.0, 1059.0, 39.0, 43.0, 38.0, 47.0, 45.0, 31.0, 27.0, 36.0, 30.0, 29.0, 29.0, 22.0, 16.0, 22.0, 15.0, 7.0, 9.0, 10.0, 5.0, 2.0, 3.0, 0.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7642822265625, -1.705322265625, -1.6463623046875, -1.58740234375, -1.5284423828125, -1.469482421875, -1.4105224609375, -1.3515625, -1.2926025390625, -1.233642578125, -1.1746826171875, -1.11572265625, -1.0567626953125, -0.997802734375, -0.9388427734375, -0.8798828125, -0.8209228515625, -0.761962890625, -0.7030029296875, -0.64404296875, -0.5850830078125, -0.526123046875, -0.4671630859375, -0.408203125, -0.3492431640625, -0.290283203125, -0.2313232421875, -0.17236328125, -0.1134033203125, -0.054443359375, 0.0045166015625, 0.0634765625, 0.1224365234375, 0.181396484375, 0.2403564453125, 0.29931640625, 0.3582763671875, 0.417236328125, 0.4761962890625, 0.53515625, 0.5941162109375, 0.653076171875, 0.7120361328125, 0.77099609375, 0.8299560546875, 0.888916015625, 0.9478759765625, 1.0068359375, 1.0657958984375, 1.124755859375, 1.1837158203125, 1.24267578125, 1.3016357421875, 1.360595703125, 1.4195556640625, 1.478515625, 1.5374755859375, 1.596435546875, 1.6553955078125, 1.71435546875, 1.7733154296875, 1.832275390625, 1.8912353515625, 1.9501953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 7.0, 13.0, 13.0, 25.0, 29.0, 44.0, 57.0, 90.0, 144.0, 174.0, 243.0, 324.0, 451.0, 713.0, 1012.0, 1432.0, 1969.0, 2969.0, 4214.0, 6059.0, 9102.0, 13465.0, 20646.0, 32420.0, 50974.0, 80691.0, 131554.0, 1246279.0, 183056.0, 112274.0, 69482.0, 43705.0, 28059.0, 18074.0, 11915.0, 7774.0, 5411.0, 3671.0, 2601.0, 1678.0, 1213.0, 851.0, 668.0, 463.0, 346.0, 230.0, 157.0, 121.0, 90.0, 57.0, 57.0, 24.0, 12.0, 17.0, 9.0, 3.0, 6.0, 2.0], "bins": [-0.3017578125, -0.29283905029296875, -0.2839202880859375, -0.27500152587890625, -0.266082763671875, -0.25716400146484375, -0.2482452392578125, -0.23932647705078125, -0.23040771484375, -0.22148895263671875, -0.2125701904296875, -0.20365142822265625, -0.194732666015625, -0.18581390380859375, -0.1768951416015625, -0.16797637939453125, -0.1590576171875, -0.15013885498046875, -0.1412200927734375, -0.13230133056640625, -0.123382568359375, -0.11446380615234375, -0.1055450439453125, -0.09662628173828125, -0.08770751953125, -0.07878875732421875, -0.0698699951171875, -0.06095123291015625, -0.052032470703125, -0.04311370849609375, -0.0341949462890625, -0.02527618408203125, -0.016357421875, -0.00743865966796875, 0.0014801025390625, 0.01039886474609375, 0.019317626953125, 0.02823638916015625, 0.0371551513671875, 0.04607391357421875, 0.05499267578125, 0.06391143798828125, 0.0728302001953125, 0.08174896240234375, 0.090667724609375, 0.09958648681640625, 0.1085052490234375, 0.11742401123046875, 0.1263427734375, 0.13526153564453125, 0.1441802978515625, 0.15309906005859375, 0.162017822265625, 0.17093658447265625, 0.1798553466796875, 0.18877410888671875, 0.19769287109375, 0.20661163330078125, 0.2155303955078125, 0.22444915771484375, 0.233367919921875, 0.24228668212890625, 0.2512054443359375, 0.26012420654296875, 0.26904296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 9.0, 5.0, 18.0, 26.0, 21.0, 27.0, 41.0, 32.0, 47.0, 68.0, 68.0, 88.0, 94.0, 88.0, 60.0, 54.0, 48.0, 36.0, 30.0, 26.0, 15.0, 16.0, 14.0, 11.0, 8.0, 8.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.002044677734375, -0.0019882917404174805, -0.001931905746459961, -0.0018755197525024414, -0.0018191337585449219, -0.0017627477645874023, -0.0017063617706298828, -0.0016499757766723633, -0.0015935897827148438, -0.0015372037887573242, -0.0014808177947998047, -0.0014244318008422852, -0.0013680458068847656, -0.001311659812927246, -0.0012552738189697266, -0.001198887825012207, -0.0011425018310546875, -0.001086115837097168, -0.0010297298431396484, -0.0009733438491821289, -0.0009169578552246094, -0.0008605718612670898, -0.0008041858673095703, -0.0007477998733520508, -0.0006914138793945312, -0.0006350278854370117, -0.0005786418914794922, -0.0005222558975219727, -0.0004658699035644531, -0.0004094839096069336, -0.00035309791564941406, -0.00029671192169189453, -0.000240325927734375, -0.00018393993377685547, -0.00012755393981933594, -7.11679458618164e-05, -1.4781951904296875e-05, 4.1604042053222656e-05, 9.799003601074219e-05, 0.00015437602996826172, 0.00021076202392578125, 0.0002671480178833008, 0.0003235340118408203, 0.00037992000579833984, 0.0004363059997558594, 0.0004926919937133789, 0.0005490779876708984, 0.000605463981628418, 0.0006618499755859375, 0.000718235969543457, 0.0007746219635009766, 0.0008310079574584961, 0.0008873939514160156, 0.0009437799453735352, 0.0010001659393310547, 0.0010565519332885742, 0.0011129379272460938, 0.0011693239212036133, 0.0012257099151611328, 0.0012820959091186523, 0.0013384819030761719, 0.0013948678970336914, 0.001451253890991211, 0.0015076398849487305, 0.00156402587890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 10.0, 5.0, 18.0, 21.0, 23.0, 40.0, 59.0, 76.0, 152.0, 220.0, 432.0, 1115.0, 188211.0, 854982.0, 1969.0, 484.0, 285.0, 150.0, 87.0, 61.0, 46.0, 30.0, 17.0, 8.0, 8.0, 9.0, 5.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.033203125, -0.03202199935913086, -0.03084087371826172, -0.029659748077392578, -0.028478622436523438, -0.027297496795654297, -0.026116371154785156, -0.024935245513916016, -0.023754119873046875, -0.022572994232177734, -0.021391868591308594, -0.020210742950439453, -0.019029617309570312, -0.017848491668701172, -0.01666736602783203, -0.01548624038696289, -0.01430511474609375, -0.01312398910522461, -0.011942863464355469, -0.010761737823486328, -0.009580612182617188, -0.008399486541748047, -0.007218360900878906, -0.006037235260009766, -0.004856109619140625, -0.0036749839782714844, -0.0024938583374023438, -0.0013127326965332031, -0.0001316070556640625, 0.0010495185852050781, 0.0022306442260742188, 0.0034117698669433594, 0.0045928955078125, 0.005774021148681641, 0.006955146789550781, 0.008136272430419922, 0.009317398071289062, 0.010498523712158203, 0.011679649353027344, 0.012860774993896484, 0.014041900634765625, 0.015223026275634766, 0.016404151916503906, 0.017585277557373047, 0.018766403198242188, 0.019947528839111328, 0.02112865447998047, 0.02230978012084961, 0.02349090576171875, 0.02467203140258789, 0.02585315704345703, 0.027034282684326172, 0.028215408325195312, 0.029396533966064453, 0.030577659606933594, 0.031758785247802734, 0.032939910888671875, 0.034121036529541016, 0.035302162170410156, 0.0364832878112793, 0.03766441345214844, 0.03884553909301758, 0.04002666473388672, 0.04120779037475586, 0.042388916015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 48.0, 177.0, 318.0, 304.0, 127.0, 33.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004963819868862629, -0.004850596189498901, -0.004737372975796461, -0.0046241492964327335, -0.004510926082730293, -0.004397702403366566, -0.0042844791896641254, -0.004171255510300398, -0.004058032296597958, -0.00394480861723423, -0.0038315854035317898, -0.003718361956998706, -0.003605138510465622, -0.0034919148311018944, -0.0033786913845688105, -0.0032654679380357265, -0.003152244258671999, -0.003039020812138915, -0.002925797365605831, -0.0028125739190727472, -0.0026993504725396633, -0.0025861267931759357, -0.002472903346642852, -0.002359679900109768, -0.002246456453576684, -0.0021332330070436, -0.002020009560510516, -0.0019067859975621104, -0.0017935625510290265, -0.0016803391044959426, -0.0015671155415475368, -0.001453892095014453, -0.0013406688813120127, -0.0012274454347789288, -0.0011142219882458448, -0.001000998425297439, -0.0008877749787643552, -0.0007745515322312713, -0.0006613280274905264, -0.0005481045227497816, -0.0004348810762166977, -0.0003216576005797833, -0.00020843412494286895, -9.521064930595458e-05, 1.8012826330959797e-05, 0.0001312362728640437, 0.00024445977760478854, 0.00035768328234553337, 0.0004709067288786173, 0.0005841301754117012, 0.000697353680152446, 0.0008105771848931909, 0.0009238006314262748, 0.0010370240779593587, 0.0011502476409077644, 0.0012634710874408484, 0.0013766945339739323, 0.0014899179805070162, 0.0016031414270401, 0.0017163649899885058, 0.0018295884365215898, 0.0019428118830546737, 0.0020560354460030794, 0.0021692588925361633, 0.0022824823390692472]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 6.0, 6.0, 6.0, 8.0, 13.0, 14.0, 12.0, 22.0, 16.0, 24.0, 33.0, 26.0, 27.0, 25.0, 40.0, 46.0, 40.0, 36.0, 45.0, 43.0, 48.0, 49.0, 39.0, 35.0, 41.0, 35.0, 37.0, 31.0, 24.0, 32.0, 19.0, 27.0, 12.0, 20.0, 13.0, 14.0, 11.0, 4.0, 5.0, 3.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007690191268920898, -0.0007430091500282288, -0.0007169991731643677, -0.0006909891963005066, -0.0006649792194366455, -0.0006389692425727844, -0.0006129592657089233, -0.0005869492888450623, -0.0005609393119812012, -0.0005349293351173401, -0.000508919358253479, -0.0004829093813896179, -0.00045689940452575684, -0.00043088942766189575, -0.00040487945079803467, -0.0003788694739341736, -0.0003528594970703125, -0.0003268495202064514, -0.00030083954334259033, -0.00027482956647872925, -0.00024881958961486816, -0.00022280961275100708, -0.000196799635887146, -0.0001707896590232849, -0.00014477968215942383, -0.00011876970529556274, -9.275972843170166e-05, -6.674975156784058e-05, -4.073977470397949e-05, -1.4729797840118408e-05, 1.1280179023742676e-05, 3.729015588760376e-05, 6.330013275146484e-05, 8.931010961532593e-05, 0.00011532008647918701, 0.0001413300633430481, 0.00016734004020690918, 0.00019335001707077026, 0.00021935999393463135, 0.00024536997079849243, 0.0002713799476623535, 0.0002973899245262146, 0.0003233999013900757, 0.00034940987825393677, 0.00037541985511779785, 0.00040142983198165894, 0.00042743980884552, 0.0004534497857093811, 0.0004794597625732422, 0.0005054697394371033, 0.0005314797163009644, 0.0005574896931648254, 0.0005834996700286865, 0.0006095096468925476, 0.0006355196237564087, 0.0006615296006202698, 0.0006875395774841309, 0.0007135495543479919, 0.000739559531211853, 0.0007655695080757141, 0.0007915794849395752, 0.0008175894618034363, 0.0008435994386672974, 0.0008696094155311584, 0.0008956193923950195]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 16.0, 15.0, 14.0, 22.0, 23.0, 23.0, 20.0, 40.0, 31.0, 36.0, 39.0, 41.0, 38.0, 48.0, 42.0, 45.0, 43.0, 36.0, 39.0, 39.0, 29.0, 35.0, 40.0, 37.0, 30.0, 27.0, 20.0, 18.0, 18.0, 15.0, 10.0, 6.0, 3.0, 8.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.193359375, -3.095428466796875, -2.99749755859375, -2.899566650390625, -2.8016357421875, -2.703704833984375, -2.60577392578125, -2.507843017578125, -2.409912109375, -2.311981201171875, -2.21405029296875, -2.116119384765625, -2.0181884765625, -1.920257568359375, -1.82232666015625, -1.724395751953125, -1.62646484375, -1.528533935546875, -1.43060302734375, -1.332672119140625, -1.2347412109375, -1.136810302734375, -1.03887939453125, -0.940948486328125, -0.843017578125, -0.745086669921875, -0.64715576171875, -0.549224853515625, -0.4512939453125, -0.353363037109375, -0.25543212890625, -0.157501220703125, -0.0595703125, 0.038360595703125, 0.13629150390625, 0.234222412109375, 0.3321533203125, 0.430084228515625, 0.52801513671875, 0.625946044921875, 0.723876953125, 0.821807861328125, 0.91973876953125, 1.017669677734375, 1.1156005859375, 1.213531494140625, 1.31146240234375, 1.409393310546875, 1.50732421875, 1.605255126953125, 1.70318603515625, 1.801116943359375, 1.8990478515625, 1.996978759765625, 2.09490966796875, 2.192840576171875, 2.290771484375, 2.388702392578125, 2.48663330078125, 2.584564208984375, 2.6824951171875, 2.780426025390625, 2.87835693359375, 2.976287841796875, 3.07421875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 12.0, 11.0, 24.0, 21.0, 24.0, 36.0, 52.0, 80.0, 123.0, 233.0, 397.0, 612.0, 1089.0, 2052.0, 3617.0, 6776.0, 12448.0, 22154.0, 40475.0, 79576.0, 183980.0, 335620.0, 186558.0, 80849.0, 41231.0, 22403.0, 12612.0, 6942.0, 3808.0, 2014.0, 1081.0, 633.0, 374.0, 217.0, 138.0, 78.0, 63.0, 41.0, 22.0, 17.0, 11.0, 9.0, 12.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.451171875, -2.373382568359375, -2.29559326171875, -2.217803955078125, -2.1400146484375, -2.062225341796875, -1.98443603515625, -1.906646728515625, -1.828857421875, -1.751068115234375, -1.67327880859375, -1.595489501953125, -1.5177001953125, -1.439910888671875, -1.36212158203125, -1.284332275390625, -1.20654296875, -1.128753662109375, -1.05096435546875, -0.973175048828125, -0.8953857421875, -0.817596435546875, -0.73980712890625, -0.662017822265625, -0.584228515625, -0.506439208984375, -0.42864990234375, -0.350860595703125, -0.2730712890625, -0.195281982421875, -0.11749267578125, -0.039703369140625, 0.0380859375, 0.115875244140625, 0.19366455078125, 0.271453857421875, 0.3492431640625, 0.427032470703125, 0.50482177734375, 0.582611083984375, 0.660400390625, 0.738189697265625, 0.81597900390625, 0.893768310546875, 0.9715576171875, 1.049346923828125, 1.12713623046875, 1.204925537109375, 1.28271484375, 1.360504150390625, 1.43829345703125, 1.516082763671875, 1.5938720703125, 1.671661376953125, 1.74945068359375, 1.827239990234375, 1.905029296875, 1.982818603515625, 2.06060791015625, 2.138397216796875, 2.2161865234375, 2.293975830078125, 2.37176513671875, 2.449554443359375, 2.52734375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 7.0, 5.0, 8.0, 11.0, 10.0, 18.0, 22.0, 14.0, 20.0, 28.0, 30.0, 30.0, 34.0, 41.0, 44.0, 41.0, 63.0, 92.0, 191.0, 1563.0, 200.0, 103.0, 69.0, 51.0, 49.0, 32.0, 36.0, 29.0, 27.0, 24.0, 20.0, 19.0, 22.0, 20.0, 15.0, 7.0, 5.0, 11.0, 3.0, 3.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.1640625, -10.8310546875, -10.498046875, -10.1650390625, -9.83203125, -9.4990234375, -9.166015625, -8.8330078125, -8.5, -8.1669921875, -7.833984375, -7.5009765625, -7.16796875, -6.8349609375, -6.501953125, -6.1689453125, -5.8359375, -5.5029296875, -5.169921875, -4.8369140625, -4.50390625, -4.1708984375, -3.837890625, -3.5048828125, -3.171875, -2.8388671875, -2.505859375, -2.1728515625, -1.83984375, -1.5068359375, -1.173828125, -0.8408203125, -0.5078125, -0.1748046875, 0.158203125, 0.4912109375, 0.82421875, 1.1572265625, 1.490234375, 1.8232421875, 2.15625, 2.4892578125, 2.822265625, 3.1552734375, 3.48828125, 3.8212890625, 4.154296875, 4.4873046875, 4.8203125, 5.1533203125, 5.486328125, 5.8193359375, 6.15234375, 6.4853515625, 6.818359375, 7.1513671875, 7.484375, 7.8173828125, 8.150390625, 8.4833984375, 8.81640625, 9.1494140625, 9.482421875, 9.8154296875, 10.1484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 3.0, 13.0, 9.0, 33.0, 25.0, 42.0, 65.0, 111.0, 210.0, 386.0, 1586.0, 2626630.0, 514499.0, 1162.0, 388.0, 194.0, 112.0, 64.0, 45.0, 29.0, 27.0, 14.0, 8.0, 11.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.5, -63.77392578125, -62.0478515625, -60.32177734375, -58.595703125, -56.86962890625, -55.1435546875, -53.41748046875, -51.69140625, -49.96533203125, -48.2392578125, -46.51318359375, -44.787109375, -43.06103515625, -41.3349609375, -39.60888671875, -37.8828125, -36.15673828125, -34.4306640625, -32.70458984375, -30.978515625, -29.25244140625, -27.5263671875, -25.80029296875, -24.07421875, -22.34814453125, -20.6220703125, -18.89599609375, -17.169921875, -15.44384765625, -13.7177734375, -11.99169921875, -10.265625, -8.53955078125, -6.8134765625, -5.08740234375, -3.361328125, -1.63525390625, 0.0908203125, 1.81689453125, 3.54296875, 5.26904296875, 6.9951171875, 8.72119140625, 10.447265625, 12.17333984375, 13.8994140625, 15.62548828125, 17.3515625, 19.07763671875, 20.8037109375, 22.52978515625, 24.255859375, 25.98193359375, 27.7080078125, 29.43408203125, 31.16015625, 32.88623046875, 34.6123046875, 36.33837890625, 38.064453125, 39.79052734375, 41.5166015625, 43.24267578125, 44.96875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 47.0, 823.0, 144.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.200401306152344, -31.43024253845215, -26.660083770751953, -21.889925003051758, -17.119766235351562, -12.349607467651367, -7.579448699951172, -2.8092880249023438, 1.9608688354492188, 6.731027603149414, 11.50118637084961, 16.271345138549805, 21.04150390625, 25.811662673950195, 30.58182144165039, 35.35198211669922, 40.12213897705078, 44.892295837402344, 49.66245651245117, 54.4326171875, 59.20277404785156, 63.972930908203125, 68.74308776855469, 73.51325225830078, 78.28340911865234, 83.0535659790039, 87.82373046875, 92.59388732910156, 97.36404418945312, 102.13420104980469, 106.90435791015625, 111.67452239990234, 116.44467163085938, 121.21482849121094, 125.9849853515625, 130.75514221191406, 135.52529907226562, 140.29547119140625, 145.0656280517578, 149.83578491210938, 154.60594177246094, 159.3760986328125, 164.14625549316406, 168.91641235351562, 173.68658447265625, 178.4567413330078, 183.22689819335938, 187.99705505371094, 192.7672119140625, 197.53736877441406, 202.30752563476562, 207.0776824951172, 211.84783935546875, 216.61801147460938, 221.38816833496094, 226.1583251953125, 230.92848205566406, 235.69863891601562, 240.4687957763672, 245.23895263671875, 250.00912475585938, 254.77928161621094, 259.5494384765625, 264.319580078125, 269.0897521972656]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 7.0, 11.0, 6.0, 14.0, 18.0, 27.0, 20.0, 15.0, 24.0, 20.0, 32.0, 42.0, 34.0, 28.0, 33.0, 37.0, 47.0, 43.0, 31.0, 47.0, 40.0, 48.0, 39.0, 41.0, 31.0, 40.0, 33.0, 23.0, 18.0, 22.0, 22.0, 17.0, 8.0, 12.0, 14.0, 8.0, 12.0, 14.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.5570182800293, -31.543825149536133, -30.53063201904297, -29.517438888549805, -28.50424575805664, -27.491050720214844, -26.47785758972168, -25.464664459228516, -24.45147132873535, -23.438278198242188, -22.425085067749023, -21.41189193725586, -20.398696899414062, -19.38550567626953, -18.372310638427734, -17.35911750793457, -16.345924377441406, -15.332731246948242, -14.319538116455078, -13.306344032287598, -12.293150901794434, -11.27995777130127, -10.266763687133789, -9.253570556640625, -8.240377426147461, -7.227184295654297, -6.213990688323975, -5.200797080993652, -4.187603950500488, -3.174410820007324, -2.161217212677002, -1.1480236053466797, -0.13482666015625, 0.8783667087554932, 1.8915600776672363, 2.9047534465789795, 3.9179468154907227, 4.931139945983887, 5.944333553314209, 6.957527160644531, 7.970720291137695, 8.98391342163086, 9.997106552124023, 11.010300636291504, 12.023493766784668, 13.036686897277832, 14.049880981445312, 15.063074111938477, 16.07626724243164, 17.089460372924805, 18.10265350341797, 19.115846633911133, 20.129039764404297, 21.142234802246094, 22.155427932739258, 23.168621063232422, 24.181814193725586, 25.19500732421875, 26.208200454711914, 27.221393585205078, 28.234588623046875, 29.247779846191406, 30.260974884033203, 31.274168014526367, 32.28736114501953]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 10.0, 8.0, 8.0, 13.0, 10.0, 14.0, 17.0, 20.0, 31.0, 23.0, 38.0, 33.0, 32.0, 35.0, 47.0, 41.0, 32.0, 37.0, 37.0, 42.0, 46.0, 44.0, 34.0, 38.0, 39.0, 39.0, 28.0, 33.0, 29.0, 20.0, 17.0, 21.0, 17.0, 16.0, 4.0, 8.0, 10.0, 8.0, 4.0, 14.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.779296875, -3.671478271484375, -3.56365966796875, -3.455841064453125, -3.3480224609375, -3.240203857421875, -3.13238525390625, -3.024566650390625, -2.916748046875, -2.808929443359375, -2.70111083984375, -2.593292236328125, -2.4854736328125, -2.377655029296875, -2.26983642578125, -2.162017822265625, -2.05419921875, -1.946380615234375, -1.83856201171875, -1.730743408203125, -1.6229248046875, -1.515106201171875, -1.40728759765625, -1.299468994140625, -1.191650390625, -1.083831787109375, -0.97601318359375, -0.868194580078125, -0.7603759765625, -0.652557373046875, -0.54473876953125, -0.436920166015625, -0.3291015625, -0.221282958984375, -0.11346435546875, -0.005645751953125, 0.1021728515625, 0.209991455078125, 0.31781005859375, 0.425628662109375, 0.533447265625, 0.641265869140625, 0.74908447265625, 0.856903076171875, 0.9647216796875, 1.072540283203125, 1.18035888671875, 1.288177490234375, 1.39599609375, 1.503814697265625, 1.61163330078125, 1.719451904296875, 1.8272705078125, 1.935089111328125, 2.04290771484375, 2.150726318359375, 2.258544921875, 2.366363525390625, 2.47418212890625, 2.582000732421875, 2.6898193359375, 2.797637939453125, 2.90545654296875, 3.013275146484375, 3.12109375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 16.0, 8.0, 15.0, 25.0, 21.0, 41.0, 46.0, 62.0, 95.0, 147.0, 213.0, 333.0, 662.0, 1781.0, 5426.0, 21600.0, 109079.0, 616661.0, 1771053.0, 1294012.0, 301703.0, 53484.0, 11763.0, 3253.0, 1186.0, 574.0, 309.0, 202.0, 140.0, 88.0, 70.0, 50.0, 34.0, 19.0, 21.0, 11.0, 16.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.76171875, -5.5911865234375, -5.420654296875, -5.2501220703125, -5.07958984375, -4.9090576171875, -4.738525390625, -4.5679931640625, -4.3974609375, -4.2269287109375, -4.056396484375, -3.8858642578125, -3.71533203125, -3.5447998046875, -3.374267578125, -3.2037353515625, -3.033203125, -2.8626708984375, -2.692138671875, -2.5216064453125, -2.35107421875, -2.1805419921875, -2.010009765625, -1.8394775390625, -1.6689453125, -1.4984130859375, -1.327880859375, -1.1573486328125, -0.98681640625, -0.8162841796875, -0.645751953125, -0.4752197265625, -0.3046875, -0.1341552734375, 0.036376953125, 0.2069091796875, 0.37744140625, 0.5479736328125, 0.718505859375, 0.8890380859375, 1.0595703125, 1.2301025390625, 1.400634765625, 1.5711669921875, 1.74169921875, 1.9122314453125, 2.082763671875, 2.2532958984375, 2.423828125, 2.5943603515625, 2.764892578125, 2.9354248046875, 3.10595703125, 3.2764892578125, 3.447021484375, 3.6175537109375, 3.7880859375, 3.9586181640625, 4.129150390625, 4.2996826171875, 4.47021484375, 4.6407470703125, 4.811279296875, 4.9818115234375, 5.15234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 13.0, 16.0, 24.0, 29.0, 69.0, 86.0, 144.0, 204.0, 337.0, 495.0, 599.0, 582.0, 456.0, 332.0, 224.0, 150.0, 109.0, 80.0, 40.0, 29.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -11.0233154296875, -10.679443359375, -10.3355712890625, -9.99169921875, -9.6478271484375, -9.303955078125, -8.9600830078125, -8.6162109375, -8.2723388671875, -7.928466796875, -7.5845947265625, -7.24072265625, -6.8968505859375, -6.552978515625, -6.2091064453125, -5.865234375, -5.5213623046875, -5.177490234375, -4.8336181640625, -4.48974609375, -4.1458740234375, -3.802001953125, -3.4581298828125, -3.1142578125, -2.7703857421875, -2.426513671875, -2.0826416015625, -1.73876953125, -1.3948974609375, -1.051025390625, -0.7071533203125, -0.36328125, -0.0194091796875, 0.324462890625, 0.6683349609375, 1.01220703125, 1.3560791015625, 1.699951171875, 2.0438232421875, 2.3876953125, 2.7315673828125, 3.075439453125, 3.4193115234375, 3.76318359375, 4.1070556640625, 4.450927734375, 4.7947998046875, 5.138671875, 5.4825439453125, 5.826416015625, 6.1702880859375, 6.51416015625, 6.8580322265625, 7.201904296875, 7.5457763671875, 7.8896484375, 8.2335205078125, 8.577392578125, 8.9212646484375, 9.26513671875, 9.6090087890625, 9.952880859375, 10.2967529296875, 10.640625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 8.0, 9.0, 12.0, 24.0, 21.0, 38.0, 40.0, 78.0, 107.0, 145.0, 239.0, 438.0, 1033.0, 5384.0, 155182.0, 3577488.0, 440917.0, 10504.0, 1335.0, 506.0, 279.0, 149.0, 116.0, 63.0, 44.0, 41.0, 20.0, 25.0, 12.0, 11.0, 4.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.609375, -17.959228515625, -17.30908203125, -16.658935546875, -16.0087890625, -15.358642578125, -14.70849609375, -14.058349609375, -13.408203125, -12.758056640625, -12.10791015625, -11.457763671875, -10.8076171875, -10.157470703125, -9.50732421875, -8.857177734375, -8.20703125, -7.556884765625, -6.90673828125, -6.256591796875, -5.6064453125, -4.956298828125, -4.30615234375, -3.656005859375, -3.005859375, -2.355712890625, -1.70556640625, -1.055419921875, -0.4052734375, 0.244873046875, 0.89501953125, 1.545166015625, 2.1953125, 2.845458984375, 3.49560546875, 4.145751953125, 4.7958984375, 5.446044921875, 6.09619140625, 6.746337890625, 7.396484375, 8.046630859375, 8.69677734375, 9.346923828125, 9.9970703125, 10.647216796875, 11.29736328125, 11.947509765625, 12.59765625, 13.247802734375, 13.89794921875, 14.548095703125, 15.1982421875, 15.848388671875, 16.49853515625, 17.148681640625, 17.798828125, 18.448974609375, 19.09912109375, 19.749267578125, 20.3994140625, 21.049560546875, 21.69970703125, 22.349853515625, 23.0]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 44.0, 203.0, 370.0, 289.0, 82.0, 20.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.44813537597656, -76.74613189697266, -73.04412841796875, -69.34211730957031, -65.6401138305664, -61.9381103515625, -58.236106872558594, -54.53410339355469, -50.832096099853516, -47.13009262084961, -43.42808532714844, -39.72608184814453, -36.024078369140625, -32.32207107543945, -28.620067596435547, -24.918062210083008, -21.21605682373047, -17.51405143737793, -13.812047004699707, -10.110042572021484, -6.408037185668945, -2.7060317993164062, 0.9959716796875, 4.697977066040039, 8.399982452392578, 12.101987838745117, 15.80399227142334, 19.505996704101562, 23.2080020904541, 26.91000747680664, 30.612010955810547, 34.31401824951172, 38.016021728515625, 41.71802520751953, 45.4200325012207, 49.12203598022461, 52.82404327392578, 56.52604675292969, 60.228050231933594, 63.9300537109375, 67.63206481933594, 71.33406829833984, 75.03607177734375, 78.73808288574219, 82.4400863647461, 86.14208984375, 89.8440933227539, 93.54609680175781, 97.24810028076172, 100.95010375976562, 104.65210723876953, 108.35411071777344, 112.05612182617188, 115.75812530517578, 119.46012878417969, 123.1621322631836, 126.8641357421875, 130.56614685058594, 134.2681427001953, 137.97015380859375, 141.67214965820312, 145.37416076660156, 149.076171875, 152.77816772460938, 156.4801788330078]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 12.0, 12.0, 12.0, 21.0, 8.0, 18.0, 22.0, 25.0, 33.0, 34.0, 25.0, 48.0, 41.0, 40.0, 50.0, 46.0, 60.0, 39.0, 41.0, 43.0, 37.0, 33.0, 32.0, 37.0, 26.0, 25.0, 21.0, 22.0, 19.0, 20.0, 7.0, 11.0, 14.0, 6.0, 11.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.126510620117188, -27.277698516845703, -26.428884506225586, -25.5800724029541, -24.731260299682617, -23.8824462890625, -23.033634185791016, -22.18482208251953, -21.336009979248047, -20.487197875976562, -19.638383865356445, -18.78957176208496, -17.940759658813477, -17.09194564819336, -16.243133544921875, -15.39432144165039, -14.545507431030273, -13.696694374084473, -12.847882270812988, -11.999069213867188, -11.150257110595703, -10.301444053649902, -9.452630996704102, -8.603818893432617, -7.755005836486816, -6.906193256378174, -6.057380676269531, -5.2085676193237305, -4.359755039215088, -3.5109424591064453, -2.6621294021606445, -1.813316822052002, -0.9645042419433594, -0.11569154262542725, 0.7331211566925049, 1.5819339752197266, 2.430746555328369, 3.2795591354370117, 4.1283721923828125, 4.977184772491455, 5.825997352600098, 6.67480993270874, 7.523622512817383, 8.372435569763184, 9.221248626708984, 10.070060729980469, 10.91887378692627, 11.76768684387207, 12.616498947143555, 13.465312004089355, 14.31412410736084, 15.16293716430664, 16.011749267578125, 16.86056137084961, 17.709375381469727, 18.55818748474121, 19.407001495361328, 20.255813598632812, 21.10462760925293, 21.953439712524414, 22.8022518157959, 23.651065826416016, 24.4998779296875, 25.348690032958984, 26.19750213623047]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 9.0, 5.0, 11.0, 8.0, 11.0, 7.0, 12.0, 18.0, 17.0, 19.0, 23.0, 21.0, 32.0, 38.0, 30.0, 44.0, 30.0, 42.0, 32.0, 37.0, 43.0, 51.0, 52.0, 39.0, 40.0, 39.0, 35.0, 27.0, 35.0, 35.0, 29.0, 20.0, 23.0, 13.0, 14.0, 9.0, 10.0, 9.0, 11.0, 8.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.724609375, -3.617431640625, -3.51025390625, -3.403076171875, -3.2958984375, -3.188720703125, -3.08154296875, -2.974365234375, -2.8671875, -2.760009765625, -2.65283203125, -2.545654296875, -2.4384765625, -2.331298828125, -2.22412109375, -2.116943359375, -2.009765625, -1.902587890625, -1.79541015625, -1.688232421875, -1.5810546875, -1.473876953125, -1.36669921875, -1.259521484375, -1.15234375, -1.045166015625, -0.93798828125, -0.830810546875, -0.7236328125, -0.616455078125, -0.50927734375, -0.402099609375, -0.294921875, -0.187744140625, -0.08056640625, 0.026611328125, 0.1337890625, 0.240966796875, 0.34814453125, 0.455322265625, 0.5625, 0.669677734375, 0.77685546875, 0.884033203125, 0.9912109375, 1.098388671875, 1.20556640625, 1.312744140625, 1.419921875, 1.527099609375, 1.63427734375, 1.741455078125, 1.8486328125, 1.955810546875, 2.06298828125, 2.170166015625, 2.27734375, 2.384521484375, 2.49169921875, 2.598876953125, 2.7060546875, 2.813232421875, 2.92041015625, 3.027587890625, 3.134765625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 10.0, 10.0, 22.0, 37.0, 49.0, 91.0, 131.0, 195.0, 320.0, 553.0, 874.0, 1414.0, 2215.0, 3847.0, 6213.0, 10393.0, 17410.0, 28850.0, 49348.0, 85440.0, 152846.0, 256442.0, 185547.0, 102455.0, 58757.0, 33912.0, 20332.0, 12224.0, 7349.0, 4380.0, 2695.0, 1626.0, 913.0, 626.0, 349.0, 239.0, 153.0, 95.0, 58.0, 35.0, 33.0, 20.0, 14.0, 11.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.42626953125, -0.4123649597167969, -0.39846038818359375, -0.3845558166503906, -0.3706512451171875, -0.3567466735839844, -0.34284210205078125, -0.3289375305175781, -0.315032958984375, -0.3011283874511719, -0.28722381591796875, -0.2733192443847656, -0.2594146728515625, -0.24551010131835938, -0.23160552978515625, -0.21770095825195312, -0.20379638671875, -0.18989181518554688, -0.17598724365234375, -0.16208267211914062, -0.1481781005859375, -0.13427352905273438, -0.12036895751953125, -0.10646438598632812, -0.092559814453125, -0.07865524291992188, -0.06475067138671875, -0.050846099853515625, -0.0369415283203125, -0.023036956787109375, -0.00913238525390625, 0.004772186279296875, 0.0186767578125, 0.032581329345703125, 0.04648590087890625, 0.060390472412109375, 0.0742950439453125, 0.08819961547851562, 0.10210418701171875, 0.11600875854492188, 0.129913330078125, 0.14381790161132812, 0.15772247314453125, 0.17162704467773438, 0.1855316162109375, 0.19943618774414062, 0.21334075927734375, 0.22724533081054688, 0.24114990234375, 0.2550544738769531, 0.26895904541015625, 0.2828636169433594, 0.2967681884765625, 0.3106727600097656, 0.32457733154296875, 0.3384819030761719, 0.352386474609375, 0.3662910461425781, 0.38019561767578125, 0.3941001892089844, 0.4080047607421875, 0.4219093322753906, 0.43581390380859375, 0.4497184753417969, 0.463623046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 6.0, 13.0, 12.0, 13.0, 17.0, 13.0, 15.0, 23.0, 34.0, 17.0, 32.0, 23.0, 32.0, 31.0, 48.0, 45.0, 38.0, 43.0, 35.0, 1076.0, 47.0, 36.0, 42.0, 41.0, 30.0, 31.0, 38.0, 23.0, 22.0, 24.0, 23.0, 21.0, 12.0, 14.0, 11.0, 9.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.982421875, -1.914154052734375, -1.84588623046875, -1.777618408203125, -1.7093505859375, -1.641082763671875, -1.57281494140625, -1.504547119140625, -1.436279296875, -1.368011474609375, -1.29974365234375, -1.231475830078125, -1.1632080078125, -1.094940185546875, -1.02667236328125, -0.958404541015625, -0.89013671875, -0.821868896484375, -0.75360107421875, -0.685333251953125, -0.6170654296875, -0.548797607421875, -0.48052978515625, -0.412261962890625, -0.343994140625, -0.275726318359375, -0.20745849609375, -0.139190673828125, -0.0709228515625, -0.002655029296875, 0.06561279296875, 0.133880615234375, 0.2021484375, 0.270416259765625, 0.33868408203125, 0.406951904296875, 0.4752197265625, 0.543487548828125, 0.61175537109375, 0.680023193359375, 0.748291015625, 0.816558837890625, 0.88482666015625, 0.953094482421875, 1.0213623046875, 1.089630126953125, 1.15789794921875, 1.226165771484375, 1.29443359375, 1.362701416015625, 1.43096923828125, 1.499237060546875, 1.5675048828125, 1.635772705078125, 1.70404052734375, 1.772308349609375, 1.840576171875, 1.908843994140625, 1.97711181640625, 2.045379638671875, 2.1136474609375, 2.181915283203125, 2.25018310546875, 2.318450927734375, 2.38671875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 10.0, 10.0, 4.0, 18.0, 23.0, 34.0, 46.0, 82.0, 140.0, 234.0, 354.0, 534.0, 790.0, 1251.0, 1957.0, 3139.0, 4879.0, 8062.0, 13300.0, 22163.0, 38362.0, 67555.0, 123562.0, 258786.0, 1243028.0, 133752.0, 73009.0, 41287.0, 23910.0, 14146.0, 8487.0, 5232.0, 3250.0, 2079.0, 1285.0, 823.0, 531.0, 371.0, 224.0, 145.0, 110.0, 62.0, 39.0, 35.0, 11.0, 8.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3583984375, -0.3460693359375, -0.333740234375, -0.3214111328125, -0.30908203125, -0.2967529296875, -0.284423828125, -0.2720947265625, -0.259765625, -0.2474365234375, -0.235107421875, -0.2227783203125, -0.21044921875, -0.1981201171875, -0.185791015625, -0.1734619140625, -0.1611328125, -0.1488037109375, -0.136474609375, -0.1241455078125, -0.11181640625, -0.0994873046875, -0.087158203125, -0.0748291015625, -0.0625, -0.0501708984375, -0.037841796875, -0.0255126953125, -0.01318359375, -0.0008544921875, 0.011474609375, 0.0238037109375, 0.0361328125, 0.0484619140625, 0.060791015625, 0.0731201171875, 0.08544921875, 0.0977783203125, 0.110107421875, 0.1224365234375, 0.134765625, 0.1470947265625, 0.159423828125, 0.1717529296875, 0.18408203125, 0.1964111328125, 0.208740234375, 0.2210693359375, 0.2333984375, 0.2457275390625, 0.258056640625, 0.2703857421875, 0.28271484375, 0.2950439453125, 0.307373046875, 0.3197021484375, 0.33203125, 0.3443603515625, 0.356689453125, 0.3690185546875, 0.38134765625, 0.3936767578125, 0.406005859375, 0.4183349609375, 0.4306640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 7.0, 11.0, 12.0, 24.0, 11.0, 25.0, 39.0, 42.0, 52.0, 74.0, 87.0, 91.0, 109.0, 85.0, 66.0, 56.0, 44.0, 36.0, 21.0, 22.0, 9.0, 13.0, 12.0, 9.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020294189453125, -0.001941591501235962, -0.0018537640571594238, -0.0017659366130828857, -0.0016781091690063477, -0.0015902817249298096, -0.0015024542808532715, -0.0014146268367767334, -0.0013267993927001953, -0.0012389719486236572, -0.0011511445045471191, -0.001063317060470581, -0.000975489616394043, -0.0008876621723175049, -0.0007998347282409668, -0.0007120072841644287, -0.0006241798400878906, -0.0005363523960113525, -0.00044852495193481445, -0.00036069750785827637, -0.0002728700637817383, -0.0001850426197052002, -9.721517562866211e-05, -9.387731552124023e-06, 7.843971252441406e-05, 0.00016626715660095215, 0.00025409460067749023, 0.0003419220447540283, 0.0004297494888305664, 0.0005175769329071045, 0.0006054043769836426, 0.0006932318210601807, 0.0007810592651367188, 0.0008688867092132568, 0.0009567141532897949, 0.001044541597366333, 0.001132369041442871, 0.0012201964855194092, 0.0013080239295959473, 0.0013958513736724854, 0.0014836788177490234, 0.0015715062618255615, 0.0016593337059020996, 0.0017471611499786377, 0.0018349885940551758, 0.0019228160381317139, 0.002010643482208252, 0.00209847092628479, 0.002186298370361328, 0.002274125814437866, 0.0023619532585144043, 0.0024497807025909424, 0.0025376081466674805, 0.0026254355907440186, 0.0027132630348205566, 0.0028010904788970947, 0.002888917922973633, 0.002976745367050171, 0.003064572811126709, 0.003152400255203247, 0.003240227699279785, 0.0033280551433563232, 0.0034158825874328613, 0.0035037100315093994, 0.0035915374755859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 2.0, 5.0, 4.0, 7.0, 10.0, 8.0, 18.0, 23.0, 38.0, 41.0, 72.0, 116.0, 226.0, 418.0, 952.0, 130499.0, 913457.0, 1509.0, 479.0, 239.0, 147.0, 90.0, 59.0, 38.0, 35.0, 16.0, 14.0, 6.0, 7.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0738525390625, -0.07205677032470703, -0.07026100158691406, -0.0684652328491211, -0.06666946411132812, -0.06487369537353516, -0.06307792663574219, -0.06128215789794922, -0.05948638916015625, -0.05769062042236328, -0.05589485168457031, -0.054099082946777344, -0.052303314208984375, -0.050507545471191406, -0.04871177673339844, -0.04691600799560547, -0.0451202392578125, -0.04332447052001953, -0.04152870178222656, -0.039732933044433594, -0.037937164306640625, -0.036141395568847656, -0.03434562683105469, -0.03254985809326172, -0.03075408935546875, -0.02895832061767578, -0.027162551879882812, -0.025366783142089844, -0.023571014404296875, -0.021775245666503906, -0.019979476928710938, -0.01818370819091797, -0.016387939453125, -0.014592170715332031, -0.012796401977539062, -0.011000633239746094, -0.009204864501953125, -0.007409095764160156, -0.0056133270263671875, -0.0038175582885742188, -0.00202178955078125, -0.00022602081298828125, 0.0015697479248046875, 0.0033655166625976562, 0.005161285400390625, 0.006957054138183594, 0.008752822875976562, 0.010548591613769531, 0.0123443603515625, 0.014140129089355469, 0.015935897827148438, 0.017731666564941406, 0.019527435302734375, 0.021323204040527344, 0.023118972778320312, 0.02491474151611328, 0.02671051025390625, 0.02850627899169922, 0.030302047729492188, 0.032097816467285156, 0.033893585205078125, 0.035689353942871094, 0.03748512268066406, 0.03928089141845703, 0.04107666015625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 45.0, 163.0, 382.0, 264.0, 114.0, 29.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034184956457465887, -0.003280651057139039, -0.0031428064685314894, -0.003004961647093296, -0.0028671170584857464, -0.0027292724698781967, -0.002591427881270647, -0.0024535832926630974, -0.0023157387040555477, -0.002177894115447998, -0.0020400495268404484, -0.0019022048218175769, -0.0017643601167947054, -0.0016265155281871557, -0.001488670939579606, -0.0013508263509720564, -0.001212981529533863, -0.0010751369409263134, -0.0009372922359034419, -0.0007994476472958922, -0.0006616030004806817, -0.0005237583536654711, -0.0003859137650579214, -0.00024806911824271083, -0.00011022447142750025, 2.7620160835795105e-05, 0.00016546479309909046, 0.0003033094108104706, 0.00044115405762568116, 0.0005789987044408917, 0.0007168432930484414, 0.000854687939863652, 0.000992532353848219, 0.0011303769424557686, 0.00126822164747864, 0.0014060662360861897, 0.0015439109411090612, 0.001681755529716611, 0.0018196001183241606, 0.0019574447069317102, 0.0020952895283699036, 0.0022331341169774532, 0.002370978705585003, 0.0025088232941925526, 0.002646668115630746, 0.0027845127042382956, 0.0029223572928458452, 0.003060201881453395, 0.0031980464700609446, 0.0033358910586684942, 0.003473735647276044, 0.003611580468714237, 0.003749425057321787, 0.0038872696459293365, 0.004025114234536886, 0.004162958823144436, 0.0043008034117519855, 0.004438648000359535, 0.004576492588967085, 0.0047143371775746346, 0.004852181766182184, 0.004990026354789734, 0.005127871409058571, 0.0052657159976661205, 0.00540356058627367]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 9.0, 6.0, 14.0, 12.0, 10.0, 19.0, 25.0, 18.0, 28.0, 28.0, 25.0, 34.0, 35.0, 42.0, 52.0, 35.0, 45.0, 37.0, 37.0, 40.0, 40.0, 35.0, 45.0, 33.0, 30.0, 35.0, 31.0, 29.0, 26.0, 24.0, 30.0, 15.0, 12.0, 15.0, 9.0, 9.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011664032936096191, -0.001130513846874237, -0.001094624400138855, -0.001058734953403473, -0.0010228455066680908, -0.0009869560599327087, -0.0009510666131973267, -0.0009151771664619446, -0.0008792877197265625, -0.0008433982729911804, -0.0008075088262557983, -0.0007716193795204163, -0.0007357299327850342, -0.0006998404860496521, -0.00066395103931427, -0.0006280615925788879, -0.0005921721458435059, -0.0005562826991081238, -0.0005203932523727417, -0.0004845038056373596, -0.00044861435890197754, -0.00041272491216659546, -0.0003768354654312134, -0.0003409460186958313, -0.0003050565719604492, -0.00026916712522506714, -0.00023327767848968506, -0.00019738823175430298, -0.0001614987850189209, -0.00012560933828353882, -8.971989154815674e-05, -5.383044481277466e-05, -1.7940998077392578e-05, 1.7948448657989502e-05, 5.383789539337158e-05, 8.972734212875366e-05, 0.00012561678886413574, 0.00016150623559951782, 0.0001973956823348999, 0.00023328512907028198, 0.00026917457580566406, 0.00030506402254104614, 0.0003409534692764282, 0.0003768429160118103, 0.0004127323627471924, 0.00044862180948257446, 0.00048451125621795654, 0.0005204007029533386, 0.0005562901496887207, 0.0005921795964241028, 0.0006280690431594849, 0.0006639584898948669, 0.000699847936630249, 0.0007357373833656311, 0.0007716268301010132, 0.0008075162768363953, 0.0008434057235717773, 0.0008792951703071594, 0.0009151846170425415, 0.0009510740637779236, 0.0009869635105133057, 0.0010228529572486877, 0.0010587424039840698, 0.001094631850719452, 0.001130521297454834]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 9.0, 5.0, 11.0, 8.0, 11.0, 7.0, 12.0, 18.0, 17.0, 19.0, 24.0, 20.0, 32.0, 39.0, 29.0, 44.0, 30.0, 42.0, 32.0, 37.0, 43.0, 50.0, 53.0, 39.0, 40.0, 39.0, 36.0, 26.0, 35.0, 35.0, 29.0, 20.0, 23.0, 13.0, 14.0, 9.0, 10.0, 9.0, 11.0, 8.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.724609375, -3.617431640625, -3.51025390625, -3.403076171875, -3.2958984375, -3.188720703125, -3.08154296875, -2.974365234375, -2.8671875, -2.760009765625, -2.65283203125, -2.545654296875, -2.4384765625, -2.331298828125, -2.22412109375, -2.116943359375, -2.009765625, -1.902587890625, -1.79541015625, -1.688232421875, -1.5810546875, -1.473876953125, -1.36669921875, -1.259521484375, -1.15234375, -1.045166015625, -0.93798828125, -0.830810546875, -0.7236328125, -0.616455078125, -0.50927734375, -0.402099609375, -0.294921875, -0.187744140625, -0.08056640625, 0.026611328125, 0.1337890625, 0.240966796875, 0.34814453125, 0.455322265625, 0.5625, 0.669677734375, 0.77685546875, 0.884033203125, 0.9912109375, 1.098388671875, 1.20556640625, 1.312744140625, 1.419921875, 1.527099609375, 1.63427734375, 1.741455078125, 1.8486328125, 1.955810546875, 2.06298828125, 2.170166015625, 2.27734375, 2.384521484375, 2.49169921875, 2.598876953125, 2.7060546875, 2.813232421875, 2.92041015625, 3.027587890625, 3.134765625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 12.0, 20.0, 20.0, 33.0, 55.0, 68.0, 95.0, 148.0, 207.0, 286.0, 515.0, 785.0, 1395.0, 2496.0, 4726.0, 8663.0, 16338.0, 30387.0, 58109.0, 112734.0, 210943.0, 258550.0, 163249.0, 84544.0, 43542.0, 23019.0, 12360.0, 6686.0, 3615.0, 1984.0, 1093.0, 648.0, 408.0, 236.0, 185.0, 130.0, 74.0, 63.0, 52.0, 27.0, 17.0, 14.0, 10.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6796875, -2.594024658203125, -2.50836181640625, -2.422698974609375, -2.3370361328125, -2.251373291015625, -2.16571044921875, -2.080047607421875, -1.994384765625, -1.908721923828125, -1.82305908203125, -1.737396240234375, -1.6517333984375, -1.566070556640625, -1.48040771484375, -1.394744873046875, -1.30908203125, -1.223419189453125, -1.13775634765625, -1.052093505859375, -0.9664306640625, -0.880767822265625, -0.79510498046875, -0.709442138671875, -0.623779296875, -0.538116455078125, -0.45245361328125, -0.366790771484375, -0.2811279296875, -0.195465087890625, -0.10980224609375, -0.024139404296875, 0.0615234375, 0.147186279296875, 0.23284912109375, 0.318511962890625, 0.4041748046875, 0.489837646484375, 0.57550048828125, 0.661163330078125, 0.746826171875, 0.832489013671875, 0.91815185546875, 1.003814697265625, 1.0894775390625, 1.175140380859375, 1.26080322265625, 1.346466064453125, 1.43212890625, 1.517791748046875, 1.60345458984375, 1.689117431640625, 1.7747802734375, 1.860443115234375, 1.94610595703125, 2.031768798828125, 2.117431640625, 2.203094482421875, 2.28875732421875, 2.374420166015625, 2.4600830078125, 2.545745849609375, 2.63140869140625, 2.717071533203125, 2.802734375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 6.0, 2.0, 4.0, 10.0, 12.0, 11.0, 12.0, 13.0, 17.0, 29.0, 32.0, 33.0, 28.0, 41.0, 51.0, 56.0, 69.0, 106.0, 187.0, 1422.0, 293.0, 117.0, 86.0, 59.0, 53.0, 49.0, 47.0, 43.0, 26.0, 21.0, 18.0, 14.0, 24.0, 13.0, 7.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0078125, -12.5706787109375, -12.133544921875, -11.6964111328125, -11.25927734375, -10.8221435546875, -10.385009765625, -9.9478759765625, -9.5107421875, -9.0736083984375, -8.636474609375, -8.1993408203125, -7.76220703125, -7.3250732421875, -6.887939453125, -6.4508056640625, -6.013671875, -5.5765380859375, -5.139404296875, -4.7022705078125, -4.26513671875, -3.8280029296875, -3.390869140625, -2.9537353515625, -2.5166015625, -2.0794677734375, -1.642333984375, -1.2052001953125, -0.76806640625, -0.3309326171875, 0.106201171875, 0.5433349609375, 0.98046875, 1.4176025390625, 1.854736328125, 2.2918701171875, 2.72900390625, 3.1661376953125, 3.603271484375, 4.0404052734375, 4.4775390625, 4.9146728515625, 5.351806640625, 5.7889404296875, 6.22607421875, 6.6632080078125, 7.100341796875, 7.5374755859375, 7.974609375, 8.4117431640625, 8.848876953125, 9.2860107421875, 9.72314453125, 10.1602783203125, 10.597412109375, 11.0345458984375, 11.4716796875, 11.9088134765625, 12.345947265625, 12.7830810546875, 13.22021484375, 13.6573486328125, 14.094482421875, 14.5316162109375, 14.96875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 7.0, 13.0, 15.0, 33.0, 56.0, 79.0, 113.0, 194.0, 348.0, 954.0, 65337.0, 3075128.0, 2237.0, 543.0, 238.0, 145.0, 104.0, 51.0, 39.0, 18.0, 20.0, 14.0, 5.0, 5.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.1875, -56.125, -54.0625, -52.0, -49.9375, -47.875, -45.8125, -43.75, -41.6875, -39.625, -37.5625, -35.5, -33.4375, -31.375, -29.3125, -27.25, -25.1875, -23.125, -21.0625, -19.0, -16.9375, -14.875, -12.8125, -10.75, -8.6875, -6.625, -4.5625, -2.5, -0.4375, 1.625, 3.6875, 5.75, 7.8125, 9.875, 11.9375, 14.0, 16.0625, 18.125, 20.1875, 22.25, 24.3125, 26.375, 28.4375, 30.5, 32.5625, 34.625, 36.6875, 38.75, 40.8125, 42.875, 44.9375, 47.0, 49.0625, 51.125, 53.1875, 55.25, 57.3125, 59.375, 61.4375, 63.5, 65.5625, 67.625, 69.6875, 71.75, 73.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 442.0, 575.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.76115417480469, -58.14368438720703, -48.52621841430664, -38.90875244140625, -29.291282653808594, -19.673812866210938, -10.056346893310547, -0.43888092041015625, 9.1785888671875, 18.796056747436523, 28.413524627685547, 38.03099060058594, 47.648460388183594, 57.26593017578125, 66.88339233398438, 76.50086212158203, 86.11833190917969, 95.73580169677734, 105.353271484375, 114.97073364257812, 124.58820343017578, 134.20567321777344, 143.82313537597656, 153.44061279296875, 163.05807495117188, 172.675537109375, 182.2930145263672, 191.9104766845703, 201.5279541015625, 211.14541625976562, 220.76287841796875, 230.38034057617188, 239.997802734375, 249.61526489257812, 259.23272705078125, 268.8502197265625, 278.4676818847656, 288.08514404296875, 297.7026062011719, 307.320068359375, 316.93756103515625, 326.5550231933594, 336.1724853515625, 345.78997802734375, 355.4074401855469, 365.02490234375, 374.6423645019531, 384.25982666015625, 393.8772888183594, 403.4947509765625, 413.1122131347656, 422.7297058105469, 432.34716796875, 441.9646301269531, 451.58209228515625, 461.1995544433594, 470.8170166015625, 480.4344787597656, 490.05194091796875, 499.66943359375, 509.2868957519531, 518.9043579101562, 528.5218505859375, 538.1392822265625, 547.7567749023438]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 18.0, 18.0, 14.0, 22.0, 24.0, 30.0, 33.0, 24.0, 35.0, 38.0, 43.0, 32.0, 41.0, 37.0, 51.0, 41.0, 29.0, 47.0, 40.0, 36.0, 36.0, 27.0, 40.0, 26.0, 25.0, 22.0, 23.0, 18.0, 14.0, 9.0, 14.0, 14.0, 11.0, 7.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.858814239501953, -30.87700653076172, -29.895200729370117, -28.913393020629883, -27.93158531188965, -26.949779510498047, -25.967971801757812, -24.986164093017578, -24.004356384277344, -23.02254867553711, -22.040742874145508, -21.058935165405273, -20.07712745666504, -19.095321655273438, -18.113513946533203, -17.13170623779297, -16.149898529052734, -15.168091773986816, -14.186284065246582, -13.204477310180664, -12.22266960144043, -11.240862846374512, -10.259056091308594, -9.27724838256836, -8.295442581176758, -7.313635349273682, -6.3318281173706055, -5.3500213623046875, -4.368213653564453, -3.386406898498535, -2.404599666595459, -1.4227924346923828, -0.44098472595214844, 0.540822446346283, 1.5226296186447144, 2.504436731338501, 3.486243963241577, 4.468050956726074, 5.44985818862915, 6.431665420532227, 7.413472652435303, 8.395279884338379, 9.377086639404297, 10.358894348144531, 11.34070110321045, 12.322507858276367, 13.304315567016602, 14.286123275756836, 15.267930030822754, 16.249736785888672, 17.231544494628906, 18.21335220336914, 19.195158004760742, 20.176965713500977, 21.15877342224121, 22.140579223632812, 23.122386932373047, 24.10419464111328, 25.086000442504883, 26.067808151245117, 27.04961585998535, 28.031421661376953, 29.013229370117188, 29.995037078857422, 30.976844787597656]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 7.0, 7.0, 9.0, 8.0, 13.0, 10.0, 12.0, 19.0, 19.0, 16.0, 16.0, 26.0, 28.0, 30.0, 40.0, 28.0, 40.0, 36.0, 30.0, 42.0, 44.0, 36.0, 36.0, 40.0, 40.0, 44.0, 32.0, 25.0, 33.0, 33.0, 27.0, 26.0, 20.0, 21.0, 12.0, 15.0, 14.0, 12.0, 14.0, 9.0, 10.0, 4.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.814453125, -3.70263671875, -3.5908203125, -3.47900390625, -3.3671875, -3.25537109375, -3.1435546875, -3.03173828125, -2.919921875, -2.80810546875, -2.6962890625, -2.58447265625, -2.47265625, -2.36083984375, -2.2490234375, -2.13720703125, -2.025390625, -1.91357421875, -1.8017578125, -1.68994140625, -1.578125, -1.46630859375, -1.3544921875, -1.24267578125, -1.130859375, -1.01904296875, -0.9072265625, -0.79541015625, -0.68359375, -0.57177734375, -0.4599609375, -0.34814453125, -0.236328125, -0.12451171875, -0.0126953125, 0.09912109375, 0.2109375, 0.32275390625, 0.4345703125, 0.54638671875, 0.658203125, 0.77001953125, 0.8818359375, 0.99365234375, 1.10546875, 1.21728515625, 1.3291015625, 1.44091796875, 1.552734375, 1.66455078125, 1.7763671875, 1.88818359375, 2.0, 2.11181640625, 2.2236328125, 2.33544921875, 2.447265625, 2.55908203125, 2.6708984375, 2.78271484375, 2.89453125, 3.00634765625, 3.1181640625, 3.22998046875, 3.341796875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 17.0, 11.0, 5.0, 13.0, 17.0, 12.0, 19.0, 24.0, 21.0, 25.0, 40.0, 41.0, 67.0, 91.0, 247.0, 837.0, 5528.0, 173750.0, 3146953.0, 846249.0, 17489.0, 1711.0, 486.0, 195.0, 102.0, 60.0, 40.0, 37.0, 30.0, 30.0, 20.0, 15.0, 19.0, 13.0, 14.0, 11.0, 10.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.6875, -15.260009765625, -14.83251953125, -14.405029296875, -13.9775390625, -13.550048828125, -13.12255859375, -12.695068359375, -12.267578125, -11.840087890625, -11.41259765625, -10.985107421875, -10.5576171875, -10.130126953125, -9.70263671875, -9.275146484375, -8.84765625, -8.420166015625, -7.99267578125, -7.565185546875, -7.1376953125, -6.710205078125, -6.28271484375, -5.855224609375, -5.427734375, -5.000244140625, -4.57275390625, -4.145263671875, -3.7177734375, -3.290283203125, -2.86279296875, -2.435302734375, -2.0078125, -1.580322265625, -1.15283203125, -0.725341796875, -0.2978515625, 0.129638671875, 0.55712890625, 0.984619140625, 1.412109375, 1.839599609375, 2.26708984375, 2.694580078125, 3.1220703125, 3.549560546875, 3.97705078125, 4.404541015625, 4.83203125, 5.259521484375, 5.68701171875, 6.114501953125, 6.5419921875, 6.969482421875, 7.39697265625, 7.824462890625, 8.251953125, 8.679443359375, 9.10693359375, 9.534423828125, 9.9619140625, 10.389404296875, 10.81689453125, 11.244384765625, 11.671875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 15.0, 19.0, 32.0, 44.0, 53.0, 95.0, 154.0, 201.0, 326.0, 450.0, 571.0, 561.0, 465.0, 320.0, 252.0, 158.0, 111.0, 87.0, 46.0, 34.0, 18.0, 21.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3465576171875, -8.013427734375, -7.6802978515625, -7.34716796875, -7.0140380859375, -6.680908203125, -6.3477783203125, -6.0146484375, -5.6815185546875, -5.348388671875, -5.0152587890625, -4.68212890625, -4.3489990234375, -4.015869140625, -3.6827392578125, -3.349609375, -3.0164794921875, -2.683349609375, -2.3502197265625, -2.01708984375, -1.6839599609375, -1.350830078125, -1.0177001953125, -0.6845703125, -0.3514404296875, -0.018310546875, 0.3148193359375, 0.64794921875, 0.9810791015625, 1.314208984375, 1.6473388671875, 1.98046875, 2.3135986328125, 2.646728515625, 2.9798583984375, 3.31298828125, 3.6461181640625, 3.979248046875, 4.3123779296875, 4.6455078125, 4.9786376953125, 5.311767578125, 5.6448974609375, 5.97802734375, 6.3111572265625, 6.644287109375, 6.9774169921875, 7.310546875, 7.6436767578125, 7.976806640625, 8.3099365234375, 8.64306640625, 8.9761962890625, 9.309326171875, 9.6424560546875, 9.9755859375, 10.3087158203125, 10.641845703125, 10.9749755859375, 11.30810546875, 11.6412353515625, 11.974365234375, 12.3074951171875, 12.640625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 21.0, 31.0, 52.0, 78.0, 93.0, 158.0, 203.0, 427.0, 1013.0, 10328.0, 1770482.0, 2395644.0, 13577.0, 1097.0, 439.0, 206.0, 136.0, 90.0, 66.0, 38.0, 23.0, 16.0, 19.0, 6.0, 10.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.9375, -28.0615234375, -27.185546875, -26.3095703125, -25.43359375, -24.5576171875, -23.681640625, -22.8056640625, -21.9296875, -21.0537109375, -20.177734375, -19.3017578125, -18.42578125, -17.5498046875, -16.673828125, -15.7978515625, -14.921875, -14.0458984375, -13.169921875, -12.2939453125, -11.41796875, -10.5419921875, -9.666015625, -8.7900390625, -7.9140625, -7.0380859375, -6.162109375, -5.2861328125, -4.41015625, -3.5341796875, -2.658203125, -1.7822265625, -0.90625, -0.0302734375, 0.845703125, 1.7216796875, 2.59765625, 3.4736328125, 4.349609375, 5.2255859375, 6.1015625, 6.9775390625, 7.853515625, 8.7294921875, 9.60546875, 10.4814453125, 11.357421875, 12.2333984375, 13.109375, 13.9853515625, 14.861328125, 15.7373046875, 16.61328125, 17.4892578125, 18.365234375, 19.2412109375, 20.1171875, 20.9931640625, 21.869140625, 22.7451171875, 23.62109375, 24.4970703125, 25.373046875, 26.2490234375, 27.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 64.0, 143.0, 281.0, 278.0, 172.0, 49.0, 14.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.681861877441406, -42.80763244628906, -39.93340301513672, -37.05916976928711, -34.184940338134766, -31.310710906982422, -28.436479568481445, -25.56224822998047, -22.688018798828125, -19.81378936767578, -16.939558029174805, -14.065327644348145, -11.191097259521484, -8.316866874694824, -5.442636489868164, -2.5684051513671875, 0.30582427978515625, 3.1800546646118164, 6.054285049438477, 8.928515434265137, 11.802745819091797, 14.676976203918457, 17.551206588745117, 20.425437927246094, 23.299667358398438, 26.17389678955078, 29.048128128051758, 31.922359466552734, 34.79658889770508, 37.67081832885742, 40.54505157470703, 43.419281005859375, 46.29350280761719, 49.16773223876953, 52.041961669921875, 54.916194915771484, 57.79042434692383, 60.66465377807617, 63.53888702392578, 66.41311645507812, 69.28734588623047, 72.16157531738281, 75.03580474853516, 77.9100341796875, 80.78427124023438, 83.65850067138672, 86.53273010253906, 89.4069595336914, 92.28118896484375, 95.1554183959961, 98.02964782714844, 100.90387725830078, 103.77810668945312, 106.65234375, 109.52657318115234, 112.40080261230469, 115.27503204345703, 118.14926147460938, 121.02349090576172, 123.89772033691406, 126.77195739746094, 129.64617919921875, 132.52041625976562, 135.3946533203125, 138.2688751220703]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 8.0, 6.0, 11.0, 15.0, 21.0, 19.0, 26.0, 42.0, 29.0, 20.0, 40.0, 25.0, 40.0, 37.0, 38.0, 53.0, 37.0, 43.0, 34.0, 39.0, 34.0, 37.0, 44.0, 28.0, 32.0, 28.0, 26.0, 22.0, 20.0, 22.0, 22.0, 13.0, 15.0, 12.0, 7.0, 5.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.70192527770996, -24.874488830566406, -24.047054290771484, -23.21961784362793, -22.392181396484375, -21.564746856689453, -20.7373104095459, -19.909873962402344, -19.082439422607422, -18.255002975463867, -17.427568435668945, -16.60013198852539, -15.772695541381836, -14.945260047912598, -14.11782455444336, -13.290388107299805, -12.46295166015625, -11.635516166687012, -10.808079719543457, -9.980644226074219, -9.153207778930664, -8.325772285461426, -7.4983367919921875, -6.670900821685791, -5.8434648513793945, -5.016028881072998, -4.188592910766602, -3.3611574172973633, -2.533721446990967, -1.7062854766845703, -0.878849983215332, -0.05141401290893555, 0.7760200500488281, 1.603455901145935, 2.430891752243042, 3.2583274841308594, 4.085763454437256, 4.913199424743652, 5.740634918212891, 6.568070888519287, 7.395506858825684, 8.222942352294922, 9.050378799438477, 9.877814292907715, 10.705249786376953, 11.532686233520508, 12.360121726989746, 13.187557220458984, 14.014993667602539, 14.842429161071777, 15.669865608215332, 16.49730110168457, 17.324737548828125, 18.152172088623047, 18.9796085357666, 19.807044982910156, 20.634479522705078, 21.461915969848633, 22.289350509643555, 23.11678695678711, 23.944223403930664, 24.77165985107422, 25.59909439086914, 26.426530838012695, 27.25396728515625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 12.0, 11.0, 12.0, 8.0, 14.0, 13.0, 24.0, 21.0, 24.0, 23.0, 26.0, 22.0, 38.0, 28.0, 28.0, 40.0, 28.0, 38.0, 48.0, 37.0, 49.0, 61.0, 43.0, 32.0, 28.0, 28.0, 36.0, 27.0, 30.0, 33.0, 14.0, 16.0, 14.0, 9.0, 16.0, 14.0, 5.0, 7.0, 7.0, 9.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.890625, -3.779571533203125, -3.66851806640625, -3.557464599609375, -3.4464111328125, -3.335357666015625, -3.22430419921875, -3.113250732421875, -3.002197265625, -2.891143798828125, -2.78009033203125, -2.669036865234375, -2.5579833984375, -2.446929931640625, -2.33587646484375, -2.224822998046875, -2.11376953125, -2.002716064453125, -1.89166259765625, -1.780609130859375, -1.6695556640625, -1.558502197265625, -1.44744873046875, -1.336395263671875, -1.225341796875, -1.114288330078125, -1.00323486328125, -0.892181396484375, -0.7811279296875, -0.670074462890625, -0.55902099609375, -0.447967529296875, -0.3369140625, -0.225860595703125, -0.11480712890625, -0.003753662109375, 0.1072998046875, 0.218353271484375, 0.32940673828125, 0.440460205078125, 0.551513671875, 0.662567138671875, 0.77362060546875, 0.884674072265625, 0.9957275390625, 1.106781005859375, 1.21783447265625, 1.328887939453125, 1.43994140625, 1.550994873046875, 1.66204833984375, 1.773101806640625, 1.8841552734375, 1.995208740234375, 2.10626220703125, 2.217315673828125, 2.328369140625, 2.439422607421875, 2.55047607421875, 2.661529541015625, 2.7725830078125, 2.883636474609375, 2.99468994140625, 3.105743408203125, 3.216796875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 6.0, 5.0, 9.0, 16.0, 26.0, 27.0, 48.0, 67.0, 105.0, 171.0, 231.0, 335.0, 512.0, 730.0, 1065.0, 1527.0, 2282.0, 3354.0, 4920.0, 7187.0, 10484.0, 15231.0, 22685.0, 33500.0, 50234.0, 75322.0, 114351.0, 175476.0, 178788.0, 115820.0, 76779.0, 50952.0, 34078.0, 22794.0, 15550.0, 10663.0, 7448.0, 5065.0, 3279.0, 2458.0, 1601.0, 1085.0, 748.0, 450.0, 339.0, 246.0, 152.0, 118.0, 71.0, 65.0, 41.0, 26.0, 16.0, 8.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.36328125, -0.35193634033203125, -0.3405914306640625, -0.32924652099609375, -0.317901611328125, -0.30655670166015625, -0.2952117919921875, -0.28386688232421875, -0.27252197265625, -0.26117706298828125, -0.2498321533203125, -0.23848724365234375, -0.227142333984375, -0.21579742431640625, -0.2044525146484375, -0.19310760498046875, -0.1817626953125, -0.17041778564453125, -0.1590728759765625, -0.14772796630859375, -0.136383056640625, -0.12503814697265625, -0.1136932373046875, -0.10234832763671875, -0.09100341796875, -0.07965850830078125, -0.0683135986328125, -0.05696868896484375, -0.045623779296875, -0.03427886962890625, -0.0229339599609375, -0.01158905029296875, -0.000244140625, 0.01110076904296875, 0.0224456787109375, 0.03379058837890625, 0.045135498046875, 0.05648040771484375, 0.0678253173828125, 0.07917022705078125, 0.09051513671875, 0.10186004638671875, 0.1132049560546875, 0.12454986572265625, 0.135894775390625, 0.14723968505859375, 0.1585845947265625, 0.16992950439453125, 0.1812744140625, 0.19261932373046875, 0.2039642333984375, 0.21530914306640625, 0.226654052734375, 0.23799896240234375, 0.2493438720703125, 0.26068878173828125, 0.27203369140625, 0.28337860107421875, 0.2947235107421875, 0.30606842041015625, 0.317413330078125, 0.32875823974609375, 0.3401031494140625, 0.35144805908203125, 0.36279296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 5.0, 19.0, 14.0, 18.0, 13.0, 12.0, 25.0, 18.0, 18.0, 28.0, 15.0, 31.0, 35.0, 29.0, 32.0, 43.0, 28.0, 39.0, 25.0, 1071.0, 32.0, 47.0, 30.0, 37.0, 30.0, 33.0, 36.0, 32.0, 23.0, 30.0, 26.0, 22.0, 11.0, 14.0, 10.0, 11.0, 15.0, 10.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0], "bins": [-2.33984375, -2.2739105224609375, -2.207977294921875, -2.1420440673828125, -2.07611083984375, -2.0101776123046875, -1.944244384765625, -1.8783111572265625, -1.8123779296875, -1.7464447021484375, -1.680511474609375, -1.6145782470703125, -1.54864501953125, -1.4827117919921875, -1.416778564453125, -1.3508453369140625, -1.284912109375, -1.2189788818359375, -1.153045654296875, -1.0871124267578125, -1.02117919921875, -0.9552459716796875, -0.889312744140625, -0.8233795166015625, -0.7574462890625, -0.6915130615234375, -0.625579833984375, -0.5596466064453125, -0.49371337890625, -0.4277801513671875, -0.361846923828125, -0.2959136962890625, -0.22998046875, -0.1640472412109375, -0.098114013671875, -0.0321807861328125, 0.03375244140625, 0.0996856689453125, 0.165618896484375, 0.2315521240234375, 0.2974853515625, 0.3634185791015625, 0.429351806640625, 0.4952850341796875, 0.56121826171875, 0.6271514892578125, 0.693084716796875, 0.7590179443359375, 0.824951171875, 0.8908843994140625, 0.956817626953125, 1.0227508544921875, 1.08868408203125, 1.1546173095703125, 1.220550537109375, 1.2864837646484375, 1.3524169921875, 1.4183502197265625, 1.484283447265625, 1.5502166748046875, 1.61614990234375, 1.6820831298828125, 1.748016357421875, 1.8139495849609375, 1.8798828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 9.0, 15.0, 24.0, 30.0, 41.0, 64.0, 84.0, 124.0, 157.0, 268.0, 368.0, 522.0, 811.0, 1169.0, 1761.0, 2558.0, 3863.0, 5939.0, 9002.0, 14188.0, 21926.0, 35520.0, 57223.0, 94580.0, 156572.0, 1268696.0, 163113.0, 97793.0, 59410.0, 36603.0, 23103.0, 14281.0, 9104.0, 6028.0, 4028.0, 2614.0, 1759.0, 1121.0, 842.0, 521.0, 375.0, 277.0, 211.0, 131.0, 102.0, 66.0, 33.0, 33.0, 18.0, 22.0, 9.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0], "bins": [-0.385009765625, -0.37317657470703125, -0.3613433837890625, -0.34951019287109375, -0.337677001953125, -0.32584381103515625, -0.3140106201171875, -0.30217742919921875, -0.29034423828125, -0.27851104736328125, -0.2666778564453125, -0.25484466552734375, -0.243011474609375, -0.23117828369140625, -0.2193450927734375, -0.20751190185546875, -0.1956787109375, -0.18384552001953125, -0.1720123291015625, -0.16017913818359375, -0.148345947265625, -0.13651275634765625, -0.1246795654296875, -0.11284637451171875, -0.10101318359375, -0.08917999267578125, -0.0773468017578125, -0.06551361083984375, -0.053680419921875, -0.04184722900390625, -0.0300140380859375, -0.01818084716796875, -0.00634765625, 0.00548553466796875, 0.0173187255859375, 0.02915191650390625, 0.040985107421875, 0.05281829833984375, 0.0646514892578125, 0.07648468017578125, 0.08831787109375, 0.10015106201171875, 0.1119842529296875, 0.12381744384765625, 0.135650634765625, 0.14748382568359375, 0.1593170166015625, 0.17115020751953125, 0.1829833984375, 0.19481658935546875, 0.2066497802734375, 0.21848297119140625, 0.230316162109375, 0.24214935302734375, 0.2539825439453125, 0.26581573486328125, 0.27764892578125, 0.28948211669921875, 0.3013153076171875, 0.31314849853515625, 0.324981689453125, 0.33681488037109375, 0.3486480712890625, 0.36048126220703125, 0.372314453125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 14.0, 14.0, 7.0, 13.0, 19.0, 16.0, 27.0, 36.0, 59.0, 107.0, 177.0, 199.0, 87.0, 52.0, 24.0, 22.0, 25.0, 15.0, 15.0, 10.0, 10.0, 6.0, 7.0, 5.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.006381988525390625, -0.006204843521118164, -0.006027698516845703, -0.005850553512573242, -0.005673408508300781, -0.00549626350402832, -0.005319118499755859, -0.0051419734954833984, -0.0049648284912109375, -0.0047876834869384766, -0.004610538482666016, -0.004433393478393555, -0.004256248474121094, -0.004079103469848633, -0.003901958465576172, -0.003724813461303711, -0.00354766845703125, -0.003370523452758789, -0.003193378448486328, -0.003016233444213867, -0.0028390884399414062, -0.0026619434356689453, -0.0024847984313964844, -0.0023076534271240234, -0.0021305084228515625, -0.0019533634185791016, -0.0017762184143066406, -0.0015990734100341797, -0.0014219284057617188, -0.0012447834014892578, -0.0010676383972167969, -0.0008904933929443359, -0.000713348388671875, -0.0005362033843994141, -0.0003590583801269531, -0.0001819133758544922, -4.76837158203125e-06, 0.0001723766326904297, 0.0003495216369628906, 0.0005266666412353516, 0.0007038116455078125, 0.0008809566497802734, 0.0010581016540527344, 0.0012352466583251953, 0.0014123916625976562, 0.0015895366668701172, 0.0017666816711425781, 0.001943826675415039, 0.0021209716796875, 0.002298116683959961, 0.002475261688232422, 0.002652406692504883, 0.0028295516967773438, 0.0030066967010498047, 0.0031838417053222656, 0.0033609867095947266, 0.0035381317138671875, 0.0037152767181396484, 0.0038924217224121094, 0.00406956672668457, 0.004246711730957031, 0.004423856735229492, 0.004601001739501953, 0.004778146743774414, 0.004955291748046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 6.0, 8.0, 12.0, 11.0, 25.0, 27.0, 35.0, 52.0, 86.0, 183.0, 356.0, 939.0, 973298.0, 72041.0, 715.0, 315.0, 152.0, 93.0, 34.0, 46.0, 29.0, 21.0, 17.0, 10.0, 7.0, 6.0, 8.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09967041015625, -0.09609699249267578, -0.09252357482910156, -0.08895015716552734, -0.08537673950195312, -0.0818033218383789, -0.07822990417480469, -0.07465648651123047, -0.07108306884765625, -0.06750965118408203, -0.06393623352050781, -0.060362815856933594, -0.056789398193359375, -0.053215980529785156, -0.04964256286621094, -0.04606914520263672, -0.0424957275390625, -0.03892230987548828, -0.03534889221191406, -0.031775474548339844, -0.028202056884765625, -0.024628639221191406, -0.021055221557617188, -0.01748180389404297, -0.01390838623046875, -0.010334968566894531, -0.0067615509033203125, -0.0031881332397460938, 0.000385284423828125, 0.003958702087402344, 0.0075321197509765625, 0.011105537414550781, 0.014678955078125, 0.01825237274169922, 0.021825790405273438, 0.025399208068847656, 0.028972625732421875, 0.032546043395996094, 0.03611946105957031, 0.03969287872314453, 0.04326629638671875, 0.04683971405029297, 0.05041313171386719, 0.053986549377441406, 0.057559967041015625, 0.061133384704589844, 0.06470680236816406, 0.06828022003173828, 0.0718536376953125, 0.07542705535888672, 0.07900047302246094, 0.08257389068603516, 0.08614730834960938, 0.0897207260131836, 0.09329414367675781, 0.09686756134033203, 0.10044097900390625, 0.10401439666748047, 0.10758781433105469, 0.1111612319946289, 0.11473464965820312, 0.11830806732177734, 0.12188148498535156, 0.12545490264892578, 0.1290283203125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [715.0, 303.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012395386584103107, 8.418771903961897e-05, 0.0014079140964895487, 0.0027316403575241566, 0.004055366851389408, 0.00537909334525466, 0.006702819373458624, 0.008026545867323875, 0.00935027189552784, 0.010673997923731804, 0.011997724883258343, 0.013321450911462307, 0.014645177870988846, 0.01596890389919281, 0.017292629927396774, 0.01861635595560074, 0.019940083846449852, 0.021263809874653816, 0.02258753590285778, 0.023911263793706894, 0.025234989821910858, 0.026558715850114822, 0.027882441878318787, 0.02920616790652275, 0.030529893934726715, 0.03185361996293068, 0.033177345991134644, 0.03450107201933861, 0.03582479804754257, 0.037148527801036835, 0.0384722501039505, 0.03979597985744476, 0.04111970588564873, 0.04244343191385269, 0.043767157942056656, 0.04509088397026062, 0.046414609998464584, 0.04773833602666855, 0.04906206578016281, 0.050385791808366776, 0.05170951783657074, 0.053033243864774704, 0.05435696989297867, 0.05568069592118263, 0.0570044219493866, 0.05832815170288086, 0.059651874005794525, 0.06097560375928879, 0.062299326062202454, 0.06362305581569672, 0.06494677811861038, 0.06627050787210464, 0.06759423017501831, 0.06891795992851257, 0.07024168223142624, 0.0715654119849205, 0.07288914173841476, 0.07421287149190903, 0.07553659379482269, 0.07686032354831696, 0.07818404585123062, 0.07950777560472488, 0.08083149790763855, 0.08215522766113281, 0.08347894996404648]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 13.0, 12.0, 15.0, 21.0, 28.0, 22.0, 40.0, 41.0, 41.0, 53.0, 71.0, 64.0, 61.0, 68.0, 45.0, 69.0, 49.0, 54.0, 48.0, 43.0, 33.0, 27.0, 17.0, 16.0, 14.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00421518087387085, -0.004117949865758419, -0.0040207188576459885, -0.003923487849533558, -0.0038262568414211273, -0.0037290258333086967, -0.003631794825196266, -0.0035345638170838356, -0.003437332808971405, -0.0033401018008589745, -0.003242870792746544, -0.0031456397846341133, -0.0030484087765216827, -0.002951177768409252, -0.0028539467602968216, -0.002756715752184391, -0.0026594847440719604, -0.00256225373595953, -0.0024650227278470993, -0.0023677917197346687, -0.002270560711622238, -0.0021733297035098076, -0.002076098695397377, -0.0019788676872849464, -0.0018816366791725159, -0.0017844056710600853, -0.0016871746629476547, -0.0015899436548352242, -0.0014927126467227936, -0.001395481638610363, -0.0012982506304979324, -0.0012010196223855019, -0.0011037886142730713, -0.0010065576061606407, -0.0009093265980482101, -0.0008120955899357796, -0.000714864581823349, -0.0006176335737109184, -0.0005204025655984879, -0.0004231715574860573, -0.0003259405493736267, -0.00022870954126119614, -0.00013147853314876556, -3.424752503633499e-05, 6.298348307609558e-05, 0.00016021449118852615, 0.0002574454993009567, 0.0003546765074133873, 0.00045190751552581787, 0.0005491385236382484, 0.000646369531750679, 0.0007436005398631096, 0.0008408315479755402, 0.0009380625560879707, 0.0010352935642004013, 0.0011325245723128319, 0.0012297555804252625, 0.001326986588537693, 0.0014242175966501236, 0.0015214486047625542, 0.0016186796128749847, 0.0017159106209874153, 0.0018131416290998459, 0.0019103726372122765, 0.002007603645324707]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 12.0, 11.0, 12.0, 8.0, 14.0, 13.0, 24.0, 21.0, 24.0, 23.0, 26.0, 22.0, 38.0, 28.0, 28.0, 40.0, 28.0, 38.0, 48.0, 37.0, 49.0, 61.0, 43.0, 32.0, 28.0, 28.0, 36.0, 27.0, 30.0, 33.0, 14.0, 16.0, 14.0, 9.0, 16.0, 14.0, 5.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.890625, -3.779571533203125, -3.66851806640625, -3.557464599609375, -3.4464111328125, -3.335357666015625, -3.22430419921875, -3.113250732421875, -3.002197265625, -2.891143798828125, -2.78009033203125, -2.669036865234375, -2.5579833984375, -2.446929931640625, -2.33587646484375, -2.224822998046875, -2.11376953125, -2.002716064453125, -1.89166259765625, -1.780609130859375, -1.6695556640625, -1.558502197265625, -1.44744873046875, -1.336395263671875, -1.225341796875, -1.114288330078125, -1.00323486328125, -0.892181396484375, -0.7811279296875, -0.670074462890625, -0.55902099609375, -0.447967529296875, -0.3369140625, -0.225860595703125, -0.11480712890625, -0.003753662109375, 0.1072998046875, 0.218353271484375, 0.32940673828125, 0.440460205078125, 0.551513671875, 0.662567138671875, 0.77362060546875, 0.884674072265625, 0.9957275390625, 1.106781005859375, 1.21783447265625, 1.328887939453125, 1.43994140625, 1.550994873046875, 1.66204833984375, 1.773101806640625, 1.8841552734375, 1.995208740234375, 2.10626220703125, 2.217315673828125, 2.328369140625, 2.439422607421875, 2.55047607421875, 2.661529541015625, 2.7725830078125, 2.883636474609375, 2.99468994140625, 3.105743408203125, 3.216796875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 6.0, 10.0, 14.0, 24.0, 29.0, 36.0, 44.0, 78.0, 113.0, 154.0, 256.0, 441.0, 799.0, 1513.0, 3359.0, 7300.0, 15929.0, 35322.0, 77800.0, 172288.0, 342330.0, 214142.0, 95401.0, 43776.0, 19974.0, 8910.0, 4065.0, 1978.0, 958.0, 568.0, 321.0, 209.0, 109.0, 82.0, 52.0, 46.0, 32.0, 25.0, 12.0, 17.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.87890625, -3.763580322265625, -3.64825439453125, -3.532928466796875, -3.4176025390625, -3.302276611328125, -3.18695068359375, -3.071624755859375, -2.956298828125, -2.840972900390625, -2.72564697265625, -2.610321044921875, -2.4949951171875, -2.379669189453125, -2.26434326171875, -2.149017333984375, -2.03369140625, -1.918365478515625, -1.80303955078125, -1.687713623046875, -1.5723876953125, -1.457061767578125, -1.34173583984375, -1.226409912109375, -1.111083984375, -0.995758056640625, -0.88043212890625, -0.765106201171875, -0.6497802734375, -0.534454345703125, -0.41912841796875, -0.303802490234375, -0.1884765625, -0.073150634765625, 0.04217529296875, 0.157501220703125, 0.2728271484375, 0.388153076171875, 0.50347900390625, 0.618804931640625, 0.734130859375, 0.849456787109375, 0.96478271484375, 1.080108642578125, 1.1954345703125, 1.310760498046875, 1.42608642578125, 1.541412353515625, 1.65673828125, 1.772064208984375, 1.88739013671875, 2.002716064453125, 2.1180419921875, 2.233367919921875, 2.34869384765625, 2.464019775390625, 2.579345703125, 2.694671630859375, 2.80999755859375, 2.925323486328125, 3.0406494140625, 3.155975341796875, 3.27130126953125, 3.386627197265625, 3.501953125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 13.0, 16.0, 8.0, 19.0, 16.0, 24.0, 31.0, 34.0, 39.0, 42.0, 50.0, 60.0, 92.0, 152.0, 1464.0, 342.0, 138.0, 80.0, 59.0, 45.0, 50.0, 53.0, 34.0, 30.0, 27.0, 24.0, 16.0, 13.0, 9.0, 16.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.90625, -13.46923828125, -13.0322265625, -12.59521484375, -12.158203125, -11.72119140625, -11.2841796875, -10.84716796875, -10.41015625, -9.97314453125, -9.5361328125, -9.09912109375, -8.662109375, -8.22509765625, -7.7880859375, -7.35107421875, -6.9140625, -6.47705078125, -6.0400390625, -5.60302734375, -5.166015625, -4.72900390625, -4.2919921875, -3.85498046875, -3.41796875, -2.98095703125, -2.5439453125, -2.10693359375, -1.669921875, -1.23291015625, -0.7958984375, -0.35888671875, 0.078125, 0.51513671875, 0.9521484375, 1.38916015625, 1.826171875, 2.26318359375, 2.7001953125, 3.13720703125, 3.57421875, 4.01123046875, 4.4482421875, 4.88525390625, 5.322265625, 5.75927734375, 6.1962890625, 6.63330078125, 7.0703125, 7.50732421875, 7.9443359375, 8.38134765625, 8.818359375, 9.25537109375, 9.6923828125, 10.12939453125, 10.56640625, 11.00341796875, 11.4404296875, 11.87744140625, 12.314453125, 12.75146484375, 13.1884765625, 13.62548828125, 14.0625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 5.0, 11.0, 12.0, 15.0, 27.0, 38.0, 70.0, 81.0, 128.0, 231.0, 536.0, 1955.0, 3084782.0, 56152.0, 860.0, 329.0, 150.0, 103.0, 65.0, 44.0, 30.0, 26.0, 16.0, 12.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -30.70361328125, -28.6259765625, -26.54833984375, -24.470703125, -22.39306640625, -20.3154296875, -18.23779296875, -16.16015625, -14.08251953125, -12.0048828125, -9.92724609375, -7.849609375, -5.77197265625, -3.6943359375, -1.61669921875, 0.4609375, 2.53857421875, 4.6162109375, 6.69384765625, 8.771484375, 10.84912109375, 12.9267578125, 15.00439453125, 17.08203125, 19.15966796875, 21.2373046875, 23.31494140625, 25.392578125, 27.47021484375, 29.5478515625, 31.62548828125, 33.703125, 35.78076171875, 37.8583984375, 39.93603515625, 42.013671875, 44.09130859375, 46.1689453125, 48.24658203125, 50.32421875, 52.40185546875, 54.4794921875, 56.55712890625, 58.634765625, 60.71240234375, 62.7900390625, 64.86767578125, 66.9453125, 69.02294921875, 71.1005859375, 73.17822265625, 75.255859375, 77.33349609375, 79.4111328125, 81.48876953125, 83.56640625, 85.64404296875, 87.7216796875, 89.79931640625, 91.876953125, 93.95458984375, 96.0322265625, 98.10986328125, 100.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 15.0, 31.0, 68.0, 113.0, 140.0, 194.0, 171.0, 122.0, 81.0, 38.0, 22.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.78023147583008, -38.822933197021484, -37.865631103515625, -36.90833282470703, -35.95103073120117, -34.99373245239258, -34.03643035888672, -33.079132080078125, -32.121829986572266, -31.16452980041504, -30.207229614257812, -29.249929428100586, -28.29262924194336, -27.335330963134766, -26.378028869628906, -25.420730590820312, -24.46343231201172, -23.506132125854492, -22.548831939697266, -21.59153175354004, -20.634231567382812, -19.67693328857422, -18.71963119506836, -17.762332916259766, -16.805030822753906, -15.84773063659668, -14.890430450439453, -13.933130264282227, -12.975831031799316, -12.01853084564209, -11.061230659484863, -10.103931427001953, -9.146631240844727, -8.1893310546875, -7.232031345367432, -6.274731159210205, -5.317431449890137, -4.36013126373291, -3.4028310775756836, -2.4455313682556152, -1.4882311820983887, -0.5309311747550964, 0.4263688325881958, 1.3836688995361328, 2.3409688472747803, 3.2982687950134277, 4.255568981170654, 5.212868690490723, 6.170168876647949, 7.127469062805176, 8.084769248962402, 9.042068481445312, 9.999368667602539, 10.956668853759766, 11.913969039916992, 12.871269226074219, 13.828569412231445, 14.785869598388672, 15.743169784545898, 16.700469970703125, 17.65777015686035, 18.615070343017578, 19.572368621826172, 20.5296688079834, 21.486968994140625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 7.0, 6.0, 6.0, 4.0, 14.0, 7.0, 13.0, 16.0, 16.0, 23.0, 27.0, 32.0, 30.0, 42.0, 31.0, 25.0, 48.0, 29.0, 40.0, 57.0, 42.0, 26.0, 41.0, 47.0, 41.0, 32.0, 33.0, 29.0, 31.0, 19.0, 25.0, 26.0, 19.0, 25.0, 20.0, 11.0, 11.0, 14.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-40.60022735595703, -39.471412658691406, -38.34259796142578, -37.213783264160156, -36.08496856689453, -34.95615768432617, -33.82734298706055, -32.69852828979492, -31.569713592529297, -30.440898895263672, -29.312084197998047, -28.183271408081055, -27.05445671081543, -25.925642013549805, -24.796829223632812, -23.668014526367188, -22.539199829101562, -21.410385131835938, -20.281570434570312, -19.15275764465332, -18.023942947387695, -16.89512825012207, -15.766314506530762, -14.637500762939453, -13.508686065673828, -12.379871368408203, -11.251057624816895, -10.122243881225586, -8.993429183959961, -7.864614963531494, -6.735800743103027, -5.6069865226745605, -4.478176116943359, -3.3493618965148926, -2.220547676086426, -1.091733455657959, 0.03708076477050781, 1.1658949851989746, 2.2947092056274414, 3.423523426055908, 4.552337646484375, 5.681151866912842, 6.809966087341309, 7.938780307769775, 9.067594528198242, 10.196409225463867, 11.325222969055176, 12.454036712646484, 13.58285140991211, 14.711666107177734, 15.840479850769043, 16.96929359436035, 18.098108291625977, 19.2269229888916, 20.355735778808594, 21.48455047607422, 22.613365173339844, 23.74217987060547, 24.870994567871094, 25.999807357788086, 27.12862205505371, 28.257436752319336, 29.386249542236328, 30.515064239501953, 31.643878936767578]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 13.0, 11.0, 10.0, 12.0, 19.0, 10.0, 17.0, 10.0, 23.0, 20.0, 23.0, 28.0, 26.0, 27.0, 29.0, 27.0, 35.0, 29.0, 46.0, 34.0, 48.0, 37.0, 29.0, 45.0, 42.0, 43.0, 34.0, 30.0, 18.0, 25.0, 19.0, 21.0, 25.0, 17.0, 17.0, 17.0, 9.0, 10.0, 9.0, 8.0, 8.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-4.0625, -3.944122314453125, -3.82574462890625, -3.707366943359375, -3.5889892578125, -3.470611572265625, -3.35223388671875, -3.233856201171875, -3.115478515625, -2.997100830078125, -2.87872314453125, -2.760345458984375, -2.6419677734375, -2.523590087890625, -2.40521240234375, -2.286834716796875, -2.16845703125, -2.050079345703125, -1.93170166015625, -1.813323974609375, -1.6949462890625, -1.576568603515625, -1.45819091796875, -1.339813232421875, -1.221435546875, -1.103057861328125, -0.98468017578125, -0.866302490234375, -0.7479248046875, -0.629547119140625, -0.51116943359375, -0.392791748046875, -0.2744140625, -0.156036376953125, -0.03765869140625, 0.080718994140625, 0.1990966796875, 0.317474365234375, 0.43585205078125, 0.554229736328125, 0.672607421875, 0.790985107421875, 0.90936279296875, 1.027740478515625, 1.1461181640625, 1.264495849609375, 1.38287353515625, 1.501251220703125, 1.61962890625, 1.738006591796875, 1.85638427734375, 1.974761962890625, 2.0931396484375, 2.211517333984375, 2.32989501953125, 2.448272705078125, 2.566650390625, 2.685028076171875, 2.80340576171875, 2.921783447265625, 3.0401611328125, 3.158538818359375, 3.27691650390625, 3.395294189453125, 3.513671875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 11.0, 14.0, 7.0, 15.0, 17.0, 26.0, 13.0, 22.0, 27.0, 32.0, 38.0, 46.0, 97.0, 153.0, 448.0, 1459.0, 10834.0, 380576.0, 3203401.0, 579285.0, 14763.0, 1789.0, 534.0, 214.0, 103.0, 71.0, 44.0, 40.0, 28.0, 21.0, 25.0, 21.0, 13.0, 14.0, 11.0, 6.0, 13.0, 7.0, 5.0, 10.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.40625, -13.9769287109375, -13.547607421875, -13.1182861328125, -12.68896484375, -12.2596435546875, -11.830322265625, -11.4010009765625, -10.9716796875, -10.5423583984375, -10.113037109375, -9.6837158203125, -9.25439453125, -8.8250732421875, -8.395751953125, -7.9664306640625, -7.537109375, -7.1077880859375, -6.678466796875, -6.2491455078125, -5.81982421875, -5.3905029296875, -4.961181640625, -4.5318603515625, -4.1025390625, -3.6732177734375, -3.243896484375, -2.8145751953125, -2.38525390625, -1.9559326171875, -1.526611328125, -1.0972900390625, -0.66796875, -0.2386474609375, 0.190673828125, 0.6199951171875, 1.04931640625, 1.4786376953125, 1.907958984375, 2.3372802734375, 2.7666015625, 3.1959228515625, 3.625244140625, 4.0545654296875, 4.48388671875, 4.9132080078125, 5.342529296875, 5.7718505859375, 6.201171875, 6.6304931640625, 7.059814453125, 7.4891357421875, 7.91845703125, 8.3477783203125, 8.777099609375, 9.2064208984375, 9.6357421875, 10.0650634765625, 10.494384765625, 10.9237060546875, 11.35302734375, 11.7823486328125, 12.211669921875, 12.6409912109375, 13.0703125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 1.0, 8.0, 11.0, 6.0, 13.0, 16.0, 23.0, 33.0, 51.0, 44.0, 72.0, 106.0, 132.0, 142.0, 215.0, 280.0, 335.0, 406.0, 413.0, 397.0, 317.0, 248.0, 198.0, 135.0, 118.0, 86.0, 61.0, 61.0, 31.0, 30.0, 17.0, 22.0, 11.0, 9.0, 9.0, 2.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.34698486328125, -7.0963134765625, -6.84564208984375, -6.594970703125, -6.34429931640625, -6.0936279296875, -5.84295654296875, -5.59228515625, -5.34161376953125, -5.0909423828125, -4.84027099609375, -4.589599609375, -4.33892822265625, -4.0882568359375, -3.83758544921875, -3.5869140625, -3.33624267578125, -3.0855712890625, -2.83489990234375, -2.584228515625, -2.33355712890625, -2.0828857421875, -1.83221435546875, -1.58154296875, -1.33087158203125, -1.0802001953125, -0.82952880859375, -0.578857421875, -0.32818603515625, -0.0775146484375, 0.17315673828125, 0.423828125, 0.67449951171875, 0.9251708984375, 1.17584228515625, 1.426513671875, 1.67718505859375, 1.9278564453125, 2.17852783203125, 2.42919921875, 2.67987060546875, 2.9305419921875, 3.18121337890625, 3.431884765625, 3.68255615234375, 3.9332275390625, 4.18389892578125, 4.4345703125, 4.68524169921875, 4.9359130859375, 5.18658447265625, 5.437255859375, 5.68792724609375, 5.9385986328125, 6.18927001953125, 6.43994140625, 6.69061279296875, 6.9412841796875, 7.19195556640625, 7.442626953125, 7.69329833984375, 7.9439697265625, 8.19464111328125, 8.4453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 2.0, 4.0, 5.0, 17.0, 13.0, 24.0, 27.0, 46.0, 46.0, 68.0, 83.0, 143.0, 174.0, 218.0, 304.0, 648.0, 2898.0, 155012.0, 3904347.0, 125816.0, 2588.0, 600.0, 328.0, 206.0, 171.0, 129.0, 111.0, 61.0, 61.0, 29.0, 32.0, 16.0, 15.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-30.296875, -29.418212890625, -28.53955078125, -27.660888671875, -26.7822265625, -25.903564453125, -25.02490234375, -24.146240234375, -23.267578125, -22.388916015625, -21.51025390625, -20.631591796875, -19.7529296875, -18.874267578125, -17.99560546875, -17.116943359375, -16.23828125, -15.359619140625, -14.48095703125, -13.602294921875, -12.7236328125, -11.844970703125, -10.96630859375, -10.087646484375, -9.208984375, -8.330322265625, -7.45166015625, -6.572998046875, -5.6943359375, -4.815673828125, -3.93701171875, -3.058349609375, -2.1796875, -1.301025390625, -0.42236328125, 0.456298828125, 1.3349609375, 2.213623046875, 3.09228515625, 3.970947265625, 4.849609375, 5.728271484375, 6.60693359375, 7.485595703125, 8.3642578125, 9.242919921875, 10.12158203125, 11.000244140625, 11.87890625, 12.757568359375, 13.63623046875, 14.514892578125, 15.3935546875, 16.272216796875, 17.15087890625, 18.029541015625, 18.908203125, 19.786865234375, 20.66552734375, 21.544189453125, 22.4228515625, 23.301513671875, 24.18017578125, 25.058837890625, 25.9375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 28.0, 148.0, 310.0, 348.0, 143.0, 32.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.7931671142578, -169.27244567871094, -165.751708984375, -162.23098754882812, -158.71026611328125, -155.18954467773438, -151.66880798339844, -148.14808654785156, -144.6273651123047, -141.1066436767578, -137.58590698242188, -134.065185546875, -130.54446411132812, -127.02373504638672, -123.50300598144531, -119.98228454589844, -116.46155548095703, -112.94082641601562, -109.42010498046875, -105.89937591552734, -102.37865447998047, -98.85792541503906, -95.33720397949219, -91.81647491455078, -88.29574584960938, -84.77501678466797, -81.2542953491211, -77.73356628417969, -74.21284484863281, -70.6921157836914, -67.17138671875, -63.650665283203125, -60.12993621826172, -56.60921096801758, -53.08848571777344, -49.56775665283203, -46.047035217285156, -42.52630615234375, -39.00558090209961, -35.48485565185547, -31.964130401611328, -28.443405151367188, -24.922679901123047, -21.401952743530273, -17.881227493286133, -14.360502243041992, -10.839775085449219, -7.319049835205078, -3.7983245849609375, -0.27759885787963867, 3.24312686920166, 6.763853073120117, 10.284578323364258, 13.805303573608398, 17.326030731201172, 20.846755981445312, 24.367481231689453, 27.888206481933594, 31.408931732177734, 34.929656982421875, 38.45038604736328, 41.971107482910156, 45.49183654785156, 49.0125617980957, 52.533287048339844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 3.0, 8.0, 10.0, 8.0, 11.0, 9.0, 17.0, 25.0, 22.0, 21.0, 16.0, 27.0, 30.0, 28.0, 34.0, 36.0, 25.0, 49.0, 37.0, 42.0, 43.0, 34.0, 38.0, 47.0, 33.0, 41.0, 39.0, 29.0, 27.0, 30.0, 21.0, 18.0, 20.0, 24.0, 20.0, 12.0, 16.0, 8.0, 12.0, 4.0, 4.0, 6.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.174842834472656, -22.32456398010254, -21.474285125732422, -20.624006271362305, -19.773727416992188, -18.92344856262207, -18.073169708251953, -17.222888946533203, -16.37261199951172, -15.522333145141602, -14.672054290771484, -13.821775436401367, -12.97149658203125, -12.121217727661133, -11.2709379196167, -10.420659065246582, -9.570379257202148, -8.720100402832031, -7.869821548461914, -7.019542217254639, -6.1692633628845215, -5.318984508514404, -4.468705177307129, -3.6184263229370117, -2.7681474685668945, -1.9178684949874878, -1.067589521408081, -0.21731042861938477, 0.6329684257507324, 1.4832472801208496, 2.333526611328125, 3.183805465698242, 4.034084320068359, 4.884363174438477, 5.734642028808594, 6.584921360015869, 7.435200214385986, 8.285478591918945, 9.135758399963379, 9.986037254333496, 10.836316108703613, 11.68659496307373, 12.536873817443848, 13.387153625488281, 14.237432479858398, 15.087711334228516, 15.937990188598633, 16.78826904296875, 17.638547897338867, 18.488826751708984, 19.3391056060791, 20.18938446044922, 21.039663314819336, 21.889942169189453, 22.740222930908203, 23.590499877929688, 24.440780639648438, 25.291059494018555, 26.141338348388672, 26.99161720275879, 27.841896057128906, 28.692174911499023, 29.54245376586914, 30.39273452758789, 31.243011474609375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 11.0, 13.0, 13.0, 16.0, 15.0, 25.0, 18.0, 17.0, 27.0, 25.0, 40.0, 34.0, 31.0, 40.0, 38.0, 46.0, 46.0, 49.0, 48.0, 46.0, 45.0, 41.0, 39.0, 32.0, 39.0, 20.0, 25.0, 21.0, 21.0, 20.0, 21.0, 14.0, 11.0, 7.0, 6.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.95550537109375, -3.8250732421875, -3.69464111328125, -3.564208984375, -3.43377685546875, -3.3033447265625, -3.17291259765625, -3.04248046875, -2.91204833984375, -2.7816162109375, -2.65118408203125, -2.520751953125, -2.39031982421875, -2.2598876953125, -2.12945556640625, -1.9990234375, -1.86859130859375, -1.7381591796875, -1.60772705078125, -1.477294921875, -1.34686279296875, -1.2164306640625, -1.08599853515625, -0.95556640625, -0.82513427734375, -0.6947021484375, -0.56427001953125, -0.433837890625, -0.30340576171875, -0.1729736328125, -0.04254150390625, 0.087890625, 0.21832275390625, 0.3487548828125, 0.47918701171875, 0.609619140625, 0.74005126953125, 0.8704833984375, 1.00091552734375, 1.13134765625, 1.26177978515625, 1.3922119140625, 1.52264404296875, 1.653076171875, 1.78350830078125, 1.9139404296875, 2.04437255859375, 2.1748046875, 2.30523681640625, 2.4356689453125, 2.56610107421875, 2.696533203125, 2.82696533203125, 2.9573974609375, 3.08782958984375, 3.21826171875, 3.34869384765625, 3.4791259765625, 3.60955810546875, 3.739990234375, 3.87042236328125, 4.0008544921875, 4.13128662109375, 4.26171875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 19.0, 29.0, 33.0, 54.0, 78.0, 119.0, 172.0, 276.0, 390.0, 640.0, 1073.0, 1630.0, 2664.0, 4127.0, 6779.0, 11031.0, 18144.0, 30367.0, 51444.0, 88213.0, 155293.0, 247659.0, 178915.0, 102306.0, 59178.0, 34368.0, 20512.0, 12458.0, 7561.0, 4752.0, 3121.0, 1838.0, 1226.0, 753.0, 431.0, 311.0, 206.0, 125.0, 76.0, 59.0, 44.0, 22.0, 11.0, 9.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5163993835449219, -0.5005722045898438, -0.4847450256347656, -0.4689178466796875, -0.4530906677246094, -0.43726348876953125, -0.4214363098144531, -0.405609130859375, -0.3897819519042969, -0.37395477294921875, -0.3581275939941406, -0.3423004150390625, -0.3264732360839844, -0.31064605712890625, -0.2948188781738281, -0.27899169921875, -0.2631645202636719, -0.24733734130859375, -0.23151016235351562, -0.2156829833984375, -0.19985580444335938, -0.18402862548828125, -0.16820144653320312, -0.152374267578125, -0.13654708862304688, -0.12071990966796875, -0.10489273071289062, -0.0890655517578125, -0.07323837280273438, -0.05741119384765625, -0.041584014892578125, -0.0257568359375, -0.009929656982421875, 0.00589752197265625, 0.021724700927734375, 0.0375518798828125, 0.053379058837890625, 0.06920623779296875, 0.08503341674804688, 0.100860595703125, 0.11668777465820312, 0.13251495361328125, 0.14834213256835938, 0.1641693115234375, 0.17999649047851562, 0.19582366943359375, 0.21165084838867188, 0.22747802734375, 0.24330520629882812, 0.25913238525390625, 0.2749595642089844, 0.2907867431640625, 0.3066139221191406, 0.32244110107421875, 0.3382682800292969, 0.354095458984375, 0.3699226379394531, 0.38574981689453125, 0.4015769958496094, 0.4174041748046875, 0.4332313537597656, 0.44905853271484375, 0.4648857116699219, 0.480712890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 8.0, 5.0, 13.0, 13.0, 15.0, 13.0, 20.0, 29.0, 18.0, 17.0, 26.0, 18.0, 26.0, 38.0, 30.0, 35.0, 44.0, 32.0, 25.0, 50.0, 1062.0, 33.0, 41.0, 46.0, 42.0, 25.0, 32.0, 33.0, 34.0, 29.0, 25.0, 15.0, 17.0, 12.0, 16.0, 15.0, 15.0, 12.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.166015625, -2.090667724609375, -2.01531982421875, -1.939971923828125, -1.8646240234375, -1.789276123046875, -1.71392822265625, -1.638580322265625, -1.563232421875, -1.487884521484375, -1.41253662109375, -1.337188720703125, -1.2618408203125, -1.186492919921875, -1.11114501953125, -1.035797119140625, -0.96044921875, -0.885101318359375, -0.80975341796875, -0.734405517578125, -0.6590576171875, -0.583709716796875, -0.50836181640625, -0.433013916015625, -0.357666015625, -0.282318115234375, -0.20697021484375, -0.131622314453125, -0.0562744140625, 0.019073486328125, 0.09442138671875, 0.169769287109375, 0.2451171875, 0.320465087890625, 0.39581298828125, 0.471160888671875, 0.5465087890625, 0.621856689453125, 0.69720458984375, 0.772552490234375, 0.847900390625, 0.923248291015625, 0.99859619140625, 1.073944091796875, 1.1492919921875, 1.224639892578125, 1.29998779296875, 1.375335693359375, 1.45068359375, 1.526031494140625, 1.60137939453125, 1.676727294921875, 1.7520751953125, 1.827423095703125, 1.90277099609375, 1.978118896484375, 2.053466796875, 2.128814697265625, 2.20416259765625, 2.279510498046875, 2.3548583984375, 2.430206298828125, 2.50555419921875, 2.580902099609375, 2.65625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 7.0, 4.0, 11.0, 9.0, 22.0, 36.0, 36.0, 56.0, 86.0, 170.0, 178.0, 268.0, 378.0, 521.0, 773.0, 1194.0, 1649.0, 2367.0, 3563.0, 5151.0, 7479.0, 11208.0, 17104.0, 26088.0, 40564.0, 63798.0, 101855.0, 166358.0, 1252789.0, 143258.0, 88791.0, 55864.0, 35684.0, 23028.0, 15254.0, 10030.0, 6721.0, 4496.0, 3130.0, 2229.0, 1458.0, 1029.0, 770.0, 513.0, 350.0, 253.0, 183.0, 121.0, 83.0, 72.0, 42.0, 30.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.369384765625, -0.35760498046875, -0.3458251953125, -0.33404541015625, -0.322265625, -0.31048583984375, -0.2987060546875, -0.28692626953125, -0.275146484375, -0.26336669921875, -0.2515869140625, -0.23980712890625, -0.22802734375, -0.21624755859375, -0.2044677734375, -0.19268798828125, -0.180908203125, -0.16912841796875, -0.1573486328125, -0.14556884765625, -0.1337890625, -0.12200927734375, -0.1102294921875, -0.09844970703125, -0.086669921875, -0.07489013671875, -0.0631103515625, -0.05133056640625, -0.03955078125, -0.02777099609375, -0.0159912109375, -0.00421142578125, 0.007568359375, 0.01934814453125, 0.0311279296875, 0.04290771484375, 0.0546875, 0.06646728515625, 0.0782470703125, 0.09002685546875, 0.101806640625, 0.11358642578125, 0.1253662109375, 0.13714599609375, 0.14892578125, 0.16070556640625, 0.1724853515625, 0.18426513671875, 0.196044921875, 0.20782470703125, 0.2196044921875, 0.23138427734375, 0.2431640625, 0.25494384765625, 0.2667236328125, 0.27850341796875, 0.290283203125, 0.30206298828125, 0.3138427734375, 0.32562255859375, 0.33740234375, 0.34918212890625, 0.3609619140625, 0.37274169921875, 0.384521484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 2.0, 4.0, 6.0, 4.0, 7.0, 14.0, 9.0, 11.0, 25.0, 21.0, 35.0, 34.0, 59.0, 47.0, 92.0, 90.0, 95.0, 73.0, 71.0, 55.0, 39.0, 27.0, 31.0, 25.0, 26.0, 18.0, 11.0, 15.0, 15.0, 5.0, 5.0, 5.0, 2.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00405120849609375, -0.00392603874206543, -0.0038008689880371094, -0.003675699234008789, -0.0035505294799804688, -0.0034253597259521484, -0.003300189971923828, -0.003175020217895508, -0.0030498504638671875, -0.002924680709838867, -0.002799510955810547, -0.0026743412017822266, -0.0025491714477539062, -0.002424001693725586, -0.0022988319396972656, -0.0021736621856689453, -0.002048492431640625, -0.0019233226776123047, -0.0017981529235839844, -0.001672983169555664, -0.0015478134155273438, -0.0014226436614990234, -0.0012974739074707031, -0.0011723041534423828, -0.0010471343994140625, -0.0009219646453857422, -0.0007967948913574219, -0.0006716251373291016, -0.0005464553833007812, -0.00042128562927246094, -0.0002961158752441406, -0.0001709461212158203, -4.57763671875e-05, 7.939338684082031e-05, 0.00020456314086914062, 0.00032973289489746094, 0.00045490264892578125, 0.0005800724029541016, 0.0007052421569824219, 0.0008304119110107422, 0.0009555816650390625, 0.0010807514190673828, 0.0012059211730957031, 0.0013310909271240234, 0.0014562606811523438, 0.001581430435180664, 0.0017066001892089844, 0.0018317699432373047, 0.001956939697265625, 0.0020821094512939453, 0.0022072792053222656, 0.002332448959350586, 0.0024576187133789062, 0.0025827884674072266, 0.002707958221435547, 0.002833127975463867, 0.0029582977294921875, 0.003083467483520508, 0.003208637237548828, 0.0033338069915771484, 0.0034589767456054688, 0.003584146499633789, 0.0037093162536621094, 0.0038344860076904297, 0.00395965576171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 1.0, 12.0, 5.0, 19.0, 17.0, 24.0, 23.0, 38.0, 54.0, 72.0, 95.0, 142.0, 249.0, 548.0, 1712.0, 995386.0, 48134.0, 964.0, 401.0, 239.0, 116.0, 88.0, 48.0, 34.0, 21.0, 18.0, 17.0, 15.0, 13.0, 9.0, 5.0, 7.0, 4.0, 7.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07284927368164062, -0.07032012939453125, -0.06779098510742188, -0.0652618408203125, -0.06273269653320312, -0.06020355224609375, -0.057674407958984375, -0.055145263671875, -0.052616119384765625, -0.05008697509765625, -0.047557830810546875, -0.0450286865234375, -0.042499542236328125, -0.03997039794921875, -0.037441253662109375, -0.034912109375, -0.032382965087890625, -0.02985382080078125, -0.027324676513671875, -0.0247955322265625, -0.022266387939453125, -0.01973724365234375, -0.017208099365234375, -0.014678955078125, -0.012149810791015625, -0.00962066650390625, -0.007091522216796875, -0.0045623779296875, -0.002033233642578125, 0.00049591064453125, 0.003025054931640625, 0.00555419921875, 0.008083343505859375, 0.01061248779296875, 0.013141632080078125, 0.0156707763671875, 0.018199920654296875, 0.02072906494140625, 0.023258209228515625, 0.025787353515625, 0.028316497802734375, 0.03084564208984375, 0.033374786376953125, 0.0359039306640625, 0.038433074951171875, 0.04096221923828125, 0.043491363525390625, 0.0460205078125, 0.048549652099609375, 0.05107879638671875, 0.053607940673828125, 0.0561370849609375, 0.058666229248046875, 0.06119537353515625, 0.06372451782226562, 0.066253662109375, 0.06878280639648438, 0.07131195068359375, 0.07384109497070312, 0.0763702392578125, 0.07889938354492188, 0.08142852783203125, 0.08395767211914062, 0.08648681640625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [23.0, 944.0, 49.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001130416989326477, -0.0004181775148026645, 0.000294061959721148, 0.0010063014924526215, 0.001718540908768773, 0.0024307803250849247, 0.00314301997423172, 0.003855259157717228, 0.004567498806864023, 0.0052797384560108185, 0.0059919776394963264, 0.006704217288643122, 0.007416456937789917, 0.008128696121275425, 0.008840935304760933, 0.009553175419569016, 0.010265414603054523, 0.010977653786540031, 0.011689893901348114, 0.012402133084833622, 0.01311437226831913, 0.013826612383127213, 0.01453885156661272, 0.015251090750098228, 0.01596333086490631, 0.016675570979714394, 0.017387809231877327, 0.01810004934668541, 0.018812289461493492, 0.019524527713656425, 0.020236767828464508, 0.02094900608062744, 0.021661246195435524, 0.022373486310243607, 0.02308572456240654, 0.023797964677214622, 0.024510204792022705, 0.02522244304418564, 0.02593468315899372, 0.026646923273801804, 0.027359161525964737, 0.02807140164077282, 0.028783639892935753, 0.029495880007743835, 0.030208120122551918, 0.03092035837471485, 0.031632598489522934, 0.03234483674168587, 0.0330570787191391, 0.03376931697130203, 0.034481558948755264, 0.0351937972009182, 0.03590603545308113, 0.03661827743053436, 0.037330515682697296, 0.03804275393486023, 0.03875499218702316, 0.039467230439186096, 0.04017947241663933, 0.04089171066880226, 0.041603948920965195, 0.042316190898418427, 0.04302842915058136, 0.04374066740274429, 0.044452909380197525]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 4.0, 9.0, 11.0, 13.0, 17.0, 20.0, 16.0, 18.0, 21.0, 25.0, 33.0, 41.0, 59.0, 45.0, 35.0, 43.0, 46.0, 42.0, 46.0, 45.0, 44.0, 49.0, 41.0, 33.0, 21.0, 36.0, 20.0, 31.0, 25.0, 25.0, 13.0, 16.0, 9.0, 14.0, 3.0, 10.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.002246558666229248, -0.0021857330575585365, -0.002124907448887825, -0.0020640818402171135, -0.002003256231546402, -0.0019424306228756905, -0.001881605014204979, -0.0018207794055342674, -0.001759953796863556, -0.0016991281881928444, -0.0016383025795221329, -0.0015774769708514214, -0.0015166513621807098, -0.0014558257535099983, -0.0013950001448392868, -0.0013341745361685753, -0.0012733489274978638, -0.0012125233188271523, -0.0011516977101564407, -0.0010908721014857292, -0.0010300464928150177, -0.0009692208841443062, -0.0009083952754735947, -0.0008475696668028831, -0.0007867440581321716, -0.0007259184494614601, -0.0006650928407907486, -0.0006042672321200371, -0.0005434416234493256, -0.00048261601477861404, -0.0004217904061079025, -0.000360964797437191, -0.0003001391887664795, -0.00023931358009576797, -0.00017848797142505646, -0.00011766236275434494, -5.683675408363342e-05, 3.9888545870780945e-06, 6.481446325778961e-05, 0.00012564007192850113, 0.00018646568059921265, 0.00024729128926992416, 0.0003081168979406357, 0.0003689425066113472, 0.0004297681152820587, 0.0004905937239527702, 0.0005514193326234818, 0.0006122449412941933, 0.0006730705499649048, 0.0007338961586356163, 0.0007947217673063278, 0.0008555473759770393, 0.0009163729846477509, 0.0009771985933184624, 0.0010380242019891739, 0.0010988498106598854, 0.001159675419330597, 0.0012205010280013084, 0.00128132663667202, 0.0013421522453427315, 0.001402977854013443, 0.0014638034626841545, 0.001524629071354866, 0.0015854546800255775, 0.001646280288696289]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 11.0, 13.0, 13.0, 16.0, 15.0, 25.0, 18.0, 17.0, 27.0, 25.0, 40.0, 34.0, 31.0, 40.0, 38.0, 46.0, 46.0, 49.0, 48.0, 46.0, 45.0, 40.0, 40.0, 32.0, 39.0, 20.0, 25.0, 21.0, 20.0, 21.0, 21.0, 14.0, 11.0, 7.0, 6.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.95550537109375, -3.8250732421875, -3.69464111328125, -3.564208984375, -3.43377685546875, -3.3033447265625, -3.17291259765625, -3.04248046875, -2.91204833984375, -2.7816162109375, -2.65118408203125, -2.520751953125, -2.39031982421875, -2.2598876953125, -2.12945556640625, -1.9990234375, -1.86859130859375, -1.7381591796875, -1.60772705078125, -1.477294921875, -1.34686279296875, -1.2164306640625, -1.08599853515625, -0.95556640625, -0.82513427734375, -0.6947021484375, -0.56427001953125, -0.433837890625, -0.30340576171875, -0.1729736328125, -0.04254150390625, 0.087890625, 0.21832275390625, 0.3487548828125, 0.47918701171875, 0.609619140625, 0.74005126953125, 0.8704833984375, 1.00091552734375, 1.13134765625, 1.26177978515625, 1.3922119140625, 1.52264404296875, 1.653076171875, 1.78350830078125, 1.9139404296875, 2.04437255859375, 2.1748046875, 2.30523681640625, 2.4356689453125, 2.56610107421875, 2.696533203125, 2.82696533203125, 2.9573974609375, 3.08782958984375, 3.21826171875, 3.34869384765625, 3.4791259765625, 3.60955810546875, 3.739990234375, 3.87042236328125, 4.0008544921875, 4.13128662109375, 4.26171875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 15.0, 14.0, 27.0, 32.0, 47.0, 69.0, 97.0, 163.0, 233.0, 341.0, 660.0, 1113.0, 2155.0, 4643.0, 10345.0, 24378.0, 60974.0, 154366.0, 375363.0, 247007.0, 97746.0, 39170.0, 15819.0, 6913.0, 3088.0, 1555.0, 847.0, 467.0, 287.0, 186.0, 119.0, 91.0, 60.0, 49.0, 28.0, 21.0, 14.0, 15.0, 7.0, 11.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.57421875, -3.4454345703125, -3.316650390625, -3.1878662109375, -3.05908203125, -2.9302978515625, -2.801513671875, -2.6727294921875, -2.5439453125, -2.4151611328125, -2.286376953125, -2.1575927734375, -2.02880859375, -1.9000244140625, -1.771240234375, -1.6424560546875, -1.513671875, -1.3848876953125, -1.256103515625, -1.1273193359375, -0.99853515625, -0.8697509765625, -0.740966796875, -0.6121826171875, -0.4833984375, -0.3546142578125, -0.225830078125, -0.0970458984375, 0.03173828125, 0.1605224609375, 0.289306640625, 0.4180908203125, 0.546875, 0.6756591796875, 0.804443359375, 0.9332275390625, 1.06201171875, 1.1907958984375, 1.319580078125, 1.4483642578125, 1.5771484375, 1.7059326171875, 1.834716796875, 1.9635009765625, 2.09228515625, 2.2210693359375, 2.349853515625, 2.4786376953125, 2.607421875, 2.7362060546875, 2.864990234375, 2.9937744140625, 3.12255859375, 3.2513427734375, 3.380126953125, 3.5089111328125, 3.6376953125, 3.7664794921875, 3.895263671875, 4.0240478515625, 4.15283203125, 4.2816162109375, 4.410400390625, 4.5391845703125, 4.66796875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 9.0, 14.0, 13.0, 12.0, 15.0, 25.0, 24.0, 31.0, 34.0, 36.0, 37.0, 73.0, 74.0, 122.0, 194.0, 1502.0, 239.0, 130.0, 73.0, 55.0, 48.0, 48.0, 40.0, 44.0, 22.0, 24.0, 20.0, 21.0, 15.0, 10.0, 8.0, 4.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.9625244140625, -15.487548828125, -15.0125732421875, -14.53759765625, -14.0626220703125, -13.587646484375, -13.1126708984375, -12.6376953125, -12.1627197265625, -11.687744140625, -11.2127685546875, -10.73779296875, -10.2628173828125, -9.787841796875, -9.3128662109375, -8.837890625, -8.3629150390625, -7.887939453125, -7.4129638671875, -6.93798828125, -6.4630126953125, -5.988037109375, -5.5130615234375, -5.0380859375, -4.5631103515625, -4.088134765625, -3.6131591796875, -3.13818359375, -2.6632080078125, -2.188232421875, -1.7132568359375, -1.23828125, -0.7633056640625, -0.288330078125, 0.1866455078125, 0.66162109375, 1.1365966796875, 1.611572265625, 2.0865478515625, 2.5615234375, 3.0364990234375, 3.511474609375, 3.9864501953125, 4.46142578125, 4.9364013671875, 5.411376953125, 5.8863525390625, 6.361328125, 6.8363037109375, 7.311279296875, 7.7862548828125, 8.26123046875, 8.7362060546875, 9.211181640625, 9.6861572265625, 10.1611328125, 10.6361083984375, 11.111083984375, 11.5860595703125, 12.06103515625, 12.5360107421875, 13.010986328125, 13.4859619140625, 13.9609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 3.0, 7.0, 14.0, 17.0, 18.0, 31.0, 36.0, 61.0, 94.0, 145.0, 249.0, 468.0, 1380.0, 518491.0, 2621888.0, 1583.0, 479.0, 237.0, 152.0, 105.0, 69.0, 45.0, 29.0, 26.0, 16.0, 8.0, 7.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.5625, -73.40673828125, -71.2509765625, -69.09521484375, -66.939453125, -64.78369140625, -62.6279296875, -60.47216796875, -58.31640625, -56.16064453125, -54.0048828125, -51.84912109375, -49.693359375, -47.53759765625, -45.3818359375, -43.22607421875, -41.0703125, -38.91455078125, -36.7587890625, -34.60302734375, -32.447265625, -30.29150390625, -28.1357421875, -25.97998046875, -23.82421875, -21.66845703125, -19.5126953125, -17.35693359375, -15.201171875, -13.04541015625, -10.8896484375, -8.73388671875, -6.578125, -4.42236328125, -2.2666015625, -0.11083984375, 2.044921875, 4.20068359375, 6.3564453125, 8.51220703125, 10.66796875, 12.82373046875, 14.9794921875, 17.13525390625, 19.291015625, 21.44677734375, 23.6025390625, 25.75830078125, 27.9140625, 30.06982421875, 32.2255859375, 34.38134765625, 36.537109375, 38.69287109375, 40.8486328125, 43.00439453125, 45.16015625, 47.31591796875, 49.4716796875, 51.62744140625, 53.783203125, 55.93896484375, 58.0947265625, 60.25048828125, 62.40625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 768.0, 205.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-276.6659240722656, -271.6042785644531, -266.5426025390625, -261.48095703125, -256.4193115234375, -251.35763549804688, -246.29598999023438, -241.2343292236328, -236.17266845703125, -231.1110076904297, -226.04934692382812, -220.98770141601562, -215.92604064941406, -210.8643798828125, -205.802734375, -200.74107360839844, -195.67941284179688, -190.6177520751953, -185.55609130859375, -180.49444580078125, -175.4327850341797, -170.37112426757812, -165.30947875976562, -160.24781799316406, -155.1861572265625, -150.12449645996094, -145.06283569335938, -140.00119018554688, -134.9395294189453, -129.87786865234375, -124.81621551513672, -119.75456237792969, -114.6928939819336, -109.63124084472656, -104.569580078125, -99.50791931152344, -94.4462661743164, -89.38461303710938, -84.32295227050781, -79.26129150390625, -74.19963836669922, -69.13798522949219, -64.07632446289062, -59.01466751098633, -53.95301055908203, -48.891353607177734, -43.82969665527344, -38.76803970336914, -33.706382751464844, -28.644725799560547, -23.58306884765625, -18.521411895751953, -13.459754943847656, -8.39809799194336, -3.3364410400390625, 1.7252159118652344, 6.786872863769531, 11.848529815673828, 16.910186767578125, 21.971843719482422, 27.03350067138672, 32.095157623291016, 37.15681457519531, 42.21847152709961, 47.280128479003906]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 12.0, 11.0, 14.0, 13.0, 17.0, 16.0, 20.0, 23.0, 26.0, 19.0, 28.0, 29.0, 49.0, 33.0, 37.0, 33.0, 49.0, 37.0, 40.0, 56.0, 50.0, 43.0, 51.0, 34.0, 35.0, 33.0, 37.0, 21.0, 26.0, 15.0, 13.0, 19.0, 11.0, 7.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.9032096862793, -37.78009033203125, -36.6569709777832, -35.53384780883789, -34.410728454589844, -33.2876091003418, -32.16448974609375, -31.041370391845703, -29.918249130249023, -28.795129776000977, -27.672008514404297, -26.54888916015625, -25.425769805908203, -24.302648544311523, -23.179529190063477, -22.056407928466797, -20.93328857421875, -19.810169219970703, -18.687047958374023, -17.563928604125977, -16.440807342529297, -15.31768798828125, -14.194568634033203, -13.07144832611084, -11.948328018188477, -10.825207710266113, -9.70208740234375, -8.578968048095703, -7.45584774017334, -6.332727432250977, -5.2096076011657715, -4.086487770080566, -2.9633636474609375, -1.8402435779571533, -0.7171235084533691, 0.40599656105041504, 1.5291166305541992, 2.6522369384765625, 3.7753567695617676, 4.898476600646973, 6.021596908569336, 7.144717216491699, 8.267837524414062, 9.39095687866211, 10.514077186584473, 11.637197494506836, 12.760316848754883, 13.883437156677246, 15.00655746459961, 16.129676818847656, 17.252798080444336, 18.375917434692383, 19.499038696289062, 20.62215805053711, 21.745277404785156, 22.868396759033203, 23.991518020629883, 25.11463737487793, 26.23775863647461, 27.360877990722656, 28.483997344970703, 29.607118606567383, 30.73023796081543, 31.85335922241211, 32.976478576660156]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 13.0, 12.0, 14.0, 10.0, 17.0, 20.0, 31.0, 25.0, 28.0, 32.0, 26.0, 32.0, 36.0, 54.0, 35.0, 35.0, 44.0, 50.0, 51.0, 50.0, 39.0, 34.0, 37.0, 34.0, 35.0, 22.0, 21.0, 25.0, 24.0, 22.0, 7.0, 10.0, 13.0, 10.0, 8.0, 1.0, 8.0, 4.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62890625, -4.483642578125, -4.33837890625, -4.193115234375, -4.0478515625, -3.902587890625, -3.75732421875, -3.612060546875, -3.466796875, -3.321533203125, -3.17626953125, -3.031005859375, -2.8857421875, -2.740478515625, -2.59521484375, -2.449951171875, -2.3046875, -2.159423828125, -2.01416015625, -1.868896484375, -1.7236328125, -1.578369140625, -1.43310546875, -1.287841796875, -1.142578125, -0.997314453125, -0.85205078125, -0.706787109375, -0.5615234375, -0.416259765625, -0.27099609375, -0.125732421875, 0.01953125, 0.164794921875, 0.31005859375, 0.455322265625, 0.6005859375, 0.745849609375, 0.89111328125, 1.036376953125, 1.181640625, 1.326904296875, 1.47216796875, 1.617431640625, 1.7626953125, 1.907958984375, 2.05322265625, 2.198486328125, 2.34375, 2.489013671875, 2.63427734375, 2.779541015625, 2.9248046875, 3.070068359375, 3.21533203125, 3.360595703125, 3.505859375, 3.651123046875, 3.79638671875, 3.941650390625, 4.0869140625, 4.232177734375, 4.37744140625, 4.522705078125, 4.66796875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 8.0, 12.0, 12.0, 13.0, 11.0, 21.0, 20.0, 29.0, 42.0, 45.0, 72.0, 110.0, 223.0, 382.0, 1159.0, 5877.0, 99534.0, 1755433.0, 2165762.0, 155128.0, 7949.0, 1289.0, 457.0, 225.0, 133.0, 68.0, 56.0, 51.0, 25.0, 30.0, 16.0, 27.0, 10.0, 10.0, 8.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1937255859375, -11.824951171875, -11.4561767578125, -11.08740234375, -10.7186279296875, -10.349853515625, -9.9810791015625, -9.6123046875, -9.2435302734375, -8.874755859375, -8.5059814453125, -8.13720703125, -7.7684326171875, -7.399658203125, -7.0308837890625, -6.662109375, -6.2933349609375, -5.924560546875, -5.5557861328125, -5.18701171875, -4.8182373046875, -4.449462890625, -4.0806884765625, -3.7119140625, -3.3431396484375, -2.974365234375, -2.6055908203125, -2.23681640625, -1.8680419921875, -1.499267578125, -1.1304931640625, -0.76171875, -0.3929443359375, -0.024169921875, 0.3446044921875, 0.71337890625, 1.0821533203125, 1.450927734375, 1.8197021484375, 2.1884765625, 2.5572509765625, 2.926025390625, 3.2947998046875, 3.66357421875, 4.0323486328125, 4.401123046875, 4.7698974609375, 5.138671875, 5.5074462890625, 5.876220703125, 6.2449951171875, 6.61376953125, 6.9825439453125, 7.351318359375, 7.7200927734375, 8.0888671875, 8.4576416015625, 8.826416015625, 9.1951904296875, 9.56396484375, 9.9327392578125, 10.301513671875, 10.6702880859375, 11.0390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 9.0, 13.0, 21.0, 9.0, 17.0, 29.0, 25.0, 49.0, 54.0, 46.0, 103.0, 128.0, 164.0, 196.0, 238.0, 323.0, 385.0, 424.0, 352.0, 317.0, 296.0, 212.0, 153.0, 120.0, 87.0, 76.0, 64.0, 46.0, 28.0, 20.0, 19.0, 7.0, 7.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.203125, -7.95849609375, -7.7138671875, -7.46923828125, -7.224609375, -6.97998046875, -6.7353515625, -6.49072265625, -6.24609375, -6.00146484375, -5.7568359375, -5.51220703125, -5.267578125, -5.02294921875, -4.7783203125, -4.53369140625, -4.2890625, -4.04443359375, -3.7998046875, -3.55517578125, -3.310546875, -3.06591796875, -2.8212890625, -2.57666015625, -2.33203125, -2.08740234375, -1.8427734375, -1.59814453125, -1.353515625, -1.10888671875, -0.8642578125, -0.61962890625, -0.375, -0.13037109375, 0.1142578125, 0.35888671875, 0.603515625, 0.84814453125, 1.0927734375, 1.33740234375, 1.58203125, 1.82666015625, 2.0712890625, 2.31591796875, 2.560546875, 2.80517578125, 3.0498046875, 3.29443359375, 3.5390625, 3.78369140625, 4.0283203125, 4.27294921875, 4.517578125, 4.76220703125, 5.0068359375, 5.25146484375, 5.49609375, 5.74072265625, 5.9853515625, 6.22998046875, 6.474609375, 6.71923828125, 6.9638671875, 7.20849609375, 7.453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 20.0, 12.0, 11.0, 30.0, 39.0, 50.0, 79.0, 107.0, 122.0, 172.0, 218.0, 320.0, 505.0, 1687.0, 91034.0, 3857735.0, 237571.0, 2731.0, 516.0, 322.0, 259.0, 181.0, 131.0, 95.0, 87.0, 48.0, 48.0, 40.0, 19.0, 14.0, 20.0, 15.0, 5.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.78125, -26.90185546875, -26.0224609375, -25.14306640625, -24.263671875, -23.38427734375, -22.5048828125, -21.62548828125, -20.74609375, -19.86669921875, -18.9873046875, -18.10791015625, -17.228515625, -16.34912109375, -15.4697265625, -14.59033203125, -13.7109375, -12.83154296875, -11.9521484375, -11.07275390625, -10.193359375, -9.31396484375, -8.4345703125, -7.55517578125, -6.67578125, -5.79638671875, -4.9169921875, -4.03759765625, -3.158203125, -2.27880859375, -1.3994140625, -0.52001953125, 0.359375, 1.23876953125, 2.1181640625, 2.99755859375, 3.876953125, 4.75634765625, 5.6357421875, 6.51513671875, 7.39453125, 8.27392578125, 9.1533203125, 10.03271484375, 10.912109375, 11.79150390625, 12.6708984375, 13.55029296875, 14.4296875, 15.30908203125, 16.1884765625, 17.06787109375, 17.947265625, 18.82666015625, 19.7060546875, 20.58544921875, 21.46484375, 22.34423828125, 23.2236328125, 24.10302734375, 24.982421875, 25.86181640625, 26.7412109375, 27.62060546875, 28.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 29.0, 41.0, 77.0, 134.0, 173.0, 178.0, 151.0, 104.0, 66.0, 26.0, 15.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.451772689819336, -29.8267879486084, -28.20180320739746, -26.576820373535156, -24.95183563232422, -23.32685089111328, -21.701866149902344, -20.076881408691406, -18.45189666748047, -16.82691192626953, -15.20192813873291, -13.576943397521973, -11.951959609985352, -10.326974868774414, -8.701990127563477, -7.0770063400268555, -5.452022552490234, -3.827038288116455, -2.2020537853240967, -0.5770692825317383, 1.047914981842041, 2.6728992462158203, 4.297883987426758, 5.922867774963379, 7.547852516174316, 9.172837257385254, 10.797821044921875, 12.422805786132812, 14.04779052734375, 15.672774314880371, 17.297760009765625, 18.92274284362793, 20.547725677490234, 22.172710418701172, 23.79769515991211, 25.422679901123047, 27.04766273498535, 28.67264747619629, 30.297632217407227, 31.92261505126953, 33.54759979248047, 35.172584533691406, 36.797569274902344, 38.42255401611328, 40.04753875732422, 41.672523498535156, 43.297508239746094, 44.922489166259766, 46.54747772216797, 48.172462463378906, 49.797447204589844, 51.42243194580078, 53.04741668701172, 54.672401428222656, 56.297386169433594, 57.922367095947266, 59.5473518371582, 61.17233657836914, 62.79732131958008, 64.42230224609375, 66.04728698730469, 67.67227172851562, 69.29725646972656, 70.9222412109375, 72.54722595214844]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 10.0, 8.0, 10.0, 13.0, 13.0, 16.0, 16.0, 27.0, 18.0, 27.0, 37.0, 35.0, 27.0, 31.0, 29.0, 41.0, 37.0, 33.0, 39.0, 39.0, 37.0, 36.0, 38.0, 34.0, 30.0, 33.0, 24.0, 27.0, 36.0, 26.0, 26.0, 13.0, 26.0, 20.0, 15.0, 10.0, 15.0, 7.0, 9.0, 13.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.834339141845703, -22.01299285888672, -21.191648483276367, -20.370302200317383, -19.54895782470703, -18.727611541748047, -17.906265258789062, -17.08492088317871, -16.263574600219727, -15.442229270935059, -14.62088394165039, -13.799537658691406, -12.978192329406738, -12.15684700012207, -11.335501670837402, -10.514156341552734, -9.692811012268066, -8.871465682983398, -8.05012035369873, -7.228774547576904, -6.407428741455078, -5.58608341217041, -4.764738082885742, -3.943392276763916, -3.122046947479248, -2.300701379776001, -1.4793559312820435, -0.6580104827880859, 0.16333508491516113, 0.9846806526184082, 1.8060259819030762, 2.6273717880249023, 3.4487171173095703, 4.270062446594238, 5.0914082527160645, 5.912753582000732, 6.734099388122559, 7.555444717407227, 8.376790046691895, 9.198135375976562, 10.019481658935547, 10.840826988220215, 11.662172317504883, 12.483518600463867, 13.304863929748535, 14.126209259033203, 14.947554588317871, 15.768899917602539, 16.59024429321289, 17.411590576171875, 18.232934951782227, 19.05428123474121, 19.875625610351562, 20.696971893310547, 21.51831817626953, 22.339662551879883, 23.161008834838867, 23.98235511779785, 24.803699493408203, 25.625045776367188, 26.44639015197754, 27.267736434936523, 28.089080810546875, 28.91042709350586, 29.731773376464844]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 7.0, 6.0, 8.0, 10.0, 12.0, 16.0, 16.0, 20.0, 28.0, 36.0, 26.0, 36.0, 28.0, 35.0, 31.0, 38.0, 51.0, 46.0, 40.0, 42.0, 43.0, 38.0, 35.0, 45.0, 36.0, 33.0, 33.0, 26.0, 30.0, 19.0, 14.0, 17.0, 14.0, 9.0, 16.0, 6.0, 6.0, 12.0, 8.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.968017578125, -3.83447265625, -3.700927734375, -3.5673828125, -3.433837890625, -3.30029296875, -3.166748046875, -3.033203125, -2.899658203125, -2.76611328125, -2.632568359375, -2.4990234375, -2.365478515625, -2.23193359375, -2.098388671875, -1.96484375, -1.831298828125, -1.69775390625, -1.564208984375, -1.4306640625, -1.297119140625, -1.16357421875, -1.030029296875, -0.896484375, -0.762939453125, -0.62939453125, -0.495849609375, -0.3623046875, -0.228759765625, -0.09521484375, 0.038330078125, 0.171875, 0.305419921875, 0.43896484375, 0.572509765625, 0.7060546875, 0.839599609375, 0.97314453125, 1.106689453125, 1.240234375, 1.373779296875, 1.50732421875, 1.640869140625, 1.7744140625, 1.907958984375, 2.04150390625, 2.175048828125, 2.30859375, 2.442138671875, 2.57568359375, 2.709228515625, 2.8427734375, 2.976318359375, 3.10986328125, 3.243408203125, 3.376953125, 3.510498046875, 3.64404296875, 3.777587890625, 3.9111328125, 4.044677734375, 4.17822265625, 4.311767578125, 4.4453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 11.0, 21.0, 26.0, 47.0, 71.0, 119.0, 161.0, 263.0, 422.0, 678.0, 956.0, 1562.0, 2626.0, 4105.0, 6588.0, 10518.0, 16963.0, 28615.0, 48175.0, 83279.0, 141470.0, 233266.0, 192803.0, 112009.0, 65832.0, 38632.0, 22904.0, 13671.0, 8547.0, 5176.0, 3275.0, 2107.0, 1280.0, 829.0, 539.0, 361.0, 227.0, 157.0, 82.0, 56.0, 40.0, 28.0, 22.0, 16.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48328399658203125, -0.4670562744140625, -0.45082855224609375, -0.434600830078125, -0.41837310791015625, -0.4021453857421875, -0.38591766357421875, -0.36968994140625, -0.35346221923828125, -0.3372344970703125, -0.32100677490234375, -0.304779052734375, -0.28855133056640625, -0.2723236083984375, -0.25609588623046875, -0.2398681640625, -0.22364044189453125, -0.2074127197265625, -0.19118499755859375, -0.174957275390625, -0.15872955322265625, -0.1425018310546875, -0.12627410888671875, -0.11004638671875, -0.09381866455078125, -0.0775909423828125, -0.06136322021484375, -0.045135498046875, -0.02890777587890625, -0.0126800537109375, 0.00354766845703125, 0.019775390625, 0.03600311279296875, 0.0522308349609375, 0.06845855712890625, 0.084686279296875, 0.10091400146484375, 0.1171417236328125, 0.13336944580078125, 0.14959716796875, 0.16582489013671875, 0.1820526123046875, 0.19828033447265625, 0.214508056640625, 0.23073577880859375, 0.2469635009765625, 0.26319122314453125, 0.2794189453125, 0.29564666748046875, 0.3118743896484375, 0.32810211181640625, 0.344329833984375, 0.36055755615234375, 0.3767852783203125, 0.39301300048828125, 0.40924072265625, 0.42546844482421875, 0.4416961669921875, 0.45792388916015625, 0.474151611328125, 0.49037933349609375, 0.5066070556640625, 0.5228347778320312, 0.5390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 13.0, 16.0, 19.0, 17.0, 25.0, 26.0, 36.0, 31.0, 48.0, 38.0, 42.0, 37.0, 32.0, 37.0, 1066.0, 37.0, 43.0, 44.0, 47.0, 44.0, 32.0, 42.0, 26.0, 31.0, 20.0, 20.0, 18.0, 13.0, 13.0, 10.0, 9.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.857421875, -2.766265869140625, -2.67510986328125, -2.583953857421875, -2.4927978515625, -2.401641845703125, -2.31048583984375, -2.219329833984375, -2.128173828125, -2.037017822265625, -1.94586181640625, -1.854705810546875, -1.7635498046875, -1.672393798828125, -1.58123779296875, -1.490081787109375, -1.39892578125, -1.307769775390625, -1.21661376953125, -1.125457763671875, -1.0343017578125, -0.943145751953125, -0.85198974609375, -0.760833740234375, -0.669677734375, -0.578521728515625, -0.48736572265625, -0.396209716796875, -0.3050537109375, -0.213897705078125, -0.12274169921875, -0.031585693359375, 0.0595703125, 0.150726318359375, 0.24188232421875, 0.333038330078125, 0.4241943359375, 0.515350341796875, 0.60650634765625, 0.697662353515625, 0.788818359375, 0.879974365234375, 0.97113037109375, 1.062286376953125, 1.1534423828125, 1.244598388671875, 1.33575439453125, 1.426910400390625, 1.51806640625, 1.609222412109375, 1.70037841796875, 1.791534423828125, 1.8826904296875, 1.973846435546875, 2.06500244140625, 2.156158447265625, 2.247314453125, 2.338470458984375, 2.42962646484375, 2.520782470703125, 2.6119384765625, 2.703094482421875, 2.79425048828125, 2.885406494140625, 2.9765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 7.0, 6.0, 12.0, 15.0, 17.0, 36.0, 63.0, 70.0, 97.0, 158.0, 221.0, 309.0, 435.0, 643.0, 865.0, 1290.0, 1945.0, 2747.0, 3914.0, 5706.0, 8828.0, 12895.0, 20103.0, 31535.0, 50269.0, 81962.0, 136651.0, 1250054.0, 187841.0, 111939.0, 67307.0, 41472.0, 26305.0, 17016.0, 11015.0, 7371.0, 5069.0, 3326.0, 2283.0, 1654.0, 1105.0, 822.0, 553.0, 351.0, 261.0, 163.0, 122.0, 100.0, 61.0, 42.0, 39.0, 30.0, 12.0, 12.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.425537109375, -0.4121551513671875, -0.398773193359375, -0.3853912353515625, -0.37200927734375, -0.3586273193359375, -0.345245361328125, -0.3318634033203125, -0.3184814453125, -0.3050994873046875, -0.291717529296875, -0.2783355712890625, -0.26495361328125, -0.2515716552734375, -0.238189697265625, -0.2248077392578125, -0.21142578125, -0.1980438232421875, -0.184661865234375, -0.1712799072265625, -0.15789794921875, -0.1445159912109375, -0.131134033203125, -0.1177520751953125, -0.1043701171875, -0.0909881591796875, -0.077606201171875, -0.0642242431640625, -0.05084228515625, -0.0374603271484375, -0.024078369140625, -0.0106964111328125, 0.002685546875, 0.0160675048828125, 0.029449462890625, 0.0428314208984375, 0.05621337890625, 0.0695953369140625, 0.082977294921875, 0.0963592529296875, 0.1097412109375, 0.1231231689453125, 0.136505126953125, 0.1498870849609375, 0.16326904296875, 0.1766510009765625, 0.190032958984375, 0.2034149169921875, 0.216796875, 0.2301788330078125, 0.243560791015625, 0.2569427490234375, 0.27032470703125, 0.2837066650390625, 0.297088623046875, 0.3104705810546875, 0.3238525390625, 0.3372344970703125, 0.350616455078125, 0.3639984130859375, 0.37738037109375, 0.3907623291015625, 0.404144287109375, 0.4175262451171875, 0.430908203125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 1.0, 7.0, 5.0, 9.0, 16.0, 17.0, 23.0, 21.0, 15.0, 30.0, 31.0, 37.0, 47.0, 43.0, 59.0, 96.0, 99.0, 76.0, 45.0, 59.0, 39.0, 33.0, 26.0, 33.0, 22.0, 22.0, 10.0, 13.0, 12.0, 6.0, 8.0, 6.0, 5.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00328826904296875, -0.003183215856552124, -0.003078162670135498, -0.002973109483718872, -0.002868056297302246, -0.00276300311088562, -0.002657949924468994, -0.002552896738052368, -0.002447843551635742, -0.002342790365219116, -0.0022377371788024902, -0.0021326839923858643, -0.0020276308059692383, -0.0019225776195526123, -0.0018175244331359863, -0.0017124712467193604, -0.0016074180603027344, -0.0015023648738861084, -0.0013973116874694824, -0.0012922585010528564, -0.0011872053146362305, -0.0010821521282196045, -0.0009770989418029785, -0.0008720457553863525, -0.0007669925689697266, -0.0006619393825531006, -0.0005568861961364746, -0.00045183300971984863, -0.00034677982330322266, -0.00024172663688659668, -0.0001366734504699707, -3.1620264053344727e-05, 7.343292236328125e-05, 0.00017848610877990723, 0.0002835392951965332, 0.0003885924816131592, 0.0004936456680297852, 0.0005986988544464111, 0.0007037520408630371, 0.0008088052272796631, 0.0009138584136962891, 0.001018911600112915, 0.001123964786529541, 0.001229017972946167, 0.001334071159362793, 0.001439124345779419, 0.001544177532196045, 0.001649230718612671, 0.0017542839050292969, 0.0018593370914459229, 0.001964390277862549, 0.002069443464279175, 0.0021744966506958008, 0.0022795498371124268, 0.0023846030235290527, 0.0024896562099456787, 0.0025947093963623047, 0.0026997625827789307, 0.0028048157691955566, 0.0029098689556121826, 0.0030149221420288086, 0.0031199753284454346, 0.0032250285148620605, 0.0033300817012786865, 0.0034351348876953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 10.0, 7.0, 11.0, 8.0, 18.0, 10.0, 24.0, 31.0, 34.0, 44.0, 63.0, 107.0, 123.0, 214.0, 392.0, 912.0, 36158.0, 1006703.0, 2216.0, 582.0, 282.0, 155.0, 99.0, 79.0, 52.0, 40.0, 37.0, 29.0, 21.0, 18.0, 17.0, 7.0, 5.0, 9.0, 9.0, 5.0, 6.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06499767303466797, -0.06291770935058594, -0.060837745666503906, -0.058757781982421875, -0.056677818298339844, -0.05459785461425781, -0.05251789093017578, -0.05043792724609375, -0.04835796356201172, -0.04627799987792969, -0.044198036193847656, -0.042118072509765625, -0.040038108825683594, -0.03795814514160156, -0.03587818145751953, -0.0337982177734375, -0.03171825408935547, -0.029638290405273438, -0.027558326721191406, -0.025478363037109375, -0.023398399353027344, -0.021318435668945312, -0.01923847198486328, -0.01715850830078125, -0.015078544616699219, -0.012998580932617188, -0.010918617248535156, -0.008838653564453125, -0.006758689880371094, -0.0046787261962890625, -0.0025987625122070312, -0.000518798828125, 0.0015611648559570312, 0.0036411285400390625, 0.005721092224121094, 0.007801055908203125, 0.009881019592285156, 0.011960983276367188, 0.014040946960449219, 0.01612091064453125, 0.01820087432861328, 0.020280838012695312, 0.022360801696777344, 0.024440765380859375, 0.026520729064941406, 0.028600692749023438, 0.03068065643310547, 0.0327606201171875, 0.03484058380126953, 0.03692054748535156, 0.039000511169433594, 0.041080474853515625, 0.043160438537597656, 0.04524040222167969, 0.04732036590576172, 0.04940032958984375, 0.05148029327392578, 0.05356025695800781, 0.055640220642089844, 0.057720184326171875, 0.059800148010253906, 0.06188011169433594, 0.06396007537841797, 0.0660400390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 318.0, 682.0, 15.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020517955999821424, -0.001554188784211874, -0.0010565820848569274, -0.0005589753855019808, -6.136856973171234e-05, 0.0004362382460385561, 0.0009338448289781809, 0.0014314516447484493, 0.0019290584605187178, 0.002426665276288986, 0.002924271859228611, 0.0034218786749988794, 0.003919485490769148, 0.00441709253937006, 0.004914699122309685, 0.0054123057052493095, 0.005909912288188934, 0.006407518871128559, 0.006905125919729471, 0.007402732502669096, 0.007900339551270008, 0.008397946134209633, 0.008895552717149258, 0.009393159300088882, 0.009890766814351082, 0.010388373397290707, 0.010885979980230331, 0.01138358749449253, 0.011881194077432156, 0.01237880066037178, 0.012876407243311405, 0.01337401382625103, 0.01387162134051323, 0.014369227923452854, 0.014866834506392479, 0.015364442020654678, 0.01586204767227173, 0.016359655186533928, 0.016857262700796127, 0.017354868352413177, 0.017852475866675377, 0.018350083380937576, 0.018847689032554626, 0.019345296546816826, 0.019842902198433876, 0.020340509712696075, 0.020838115364313126, 0.021335722878575325, 0.021833330392837524, 0.022330937907099724, 0.022828543558716774, 0.023326151072978973, 0.023823756724596024, 0.024321364238858223, 0.024818971753120422, 0.025316577404737473, 0.025814183056354523, 0.026311790570616722, 0.026809396222233772, 0.02730700373649597, 0.027804609388113022, 0.02830221690237522, 0.02879982441663742, 0.02929743006825447, 0.02979503758251667]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 10.0, 10.0, 12.0, 21.0, 15.0, 15.0, 31.0, 30.0, 37.0, 31.0, 26.0, 30.0, 36.0, 44.0, 44.0, 49.0, 43.0, 45.0, 37.0, 44.0, 37.0, 38.0, 34.0, 38.0, 38.0, 33.0, 26.0, 30.0, 23.0, 17.0, 12.0, 9.0, 9.0, 10.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018265843391418457, -0.001769261434674263, -0.0017119385302066803, -0.0016546156257390976, -0.001597292721271515, -0.0015399698168039322, -0.0014826469123363495, -0.0014253240078687668, -0.001368001103401184, -0.0013106781989336014, -0.0012533552944660187, -0.001196032389998436, -0.0011387094855308533, -0.0010813865810632706, -0.0010240636765956879, -0.0009667407721281052, -0.0009094178676605225, -0.0008520949631929398, -0.0007947720587253571, -0.0007374491542577744, -0.0006801262497901917, -0.000622803345322609, -0.0005654804408550262, -0.0005081575363874435, -0.00045083463191986084, -0.00039351172745227814, -0.00033618882298469543, -0.00027886591851711273, -0.00022154301404953003, -0.00016422010958194733, -0.00010689720511436462, -4.957430064678192e-05, 7.748603820800781e-06, 6.507150828838348e-05, 0.0001223944127559662, 0.0001797173172235489, 0.0002370402216911316, 0.0002943631261587143, 0.000351686030626297, 0.0004090089350938797, 0.0004663318395614624, 0.0005236547440290451, 0.0005809776484966278, 0.0006383005529642105, 0.0006956234574317932, 0.0007529463618993759, 0.0008102692663669586, 0.0008675921708345413, 0.000924915075302124, 0.0009822379797697067, 0.0010395608842372894, 0.0010968837887048721, 0.0011542066931724548, 0.0012115295976400375, 0.0012688525021076202, 0.001326175406575203, 0.0013834983110427856, 0.0014408212155103683, 0.001498144119977951, 0.0015554670244455338, 0.0016127899289131165, 0.0016701128333806992, 0.0017274357378482819, 0.0017847586423158646, 0.0018420815467834473]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 7.0, 6.0, 8.0, 10.0, 12.0, 16.0, 16.0, 20.0, 28.0, 36.0, 26.0, 36.0, 28.0, 35.0, 31.0, 39.0, 50.0, 46.0, 40.0, 42.0, 43.0, 38.0, 35.0, 45.0, 36.0, 33.0, 33.0, 26.0, 30.0, 19.0, 14.0, 18.0, 13.0, 9.0, 16.0, 6.0, 6.0, 12.0, 8.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.968017578125, -3.83447265625, -3.700927734375, -3.5673828125, -3.433837890625, -3.30029296875, -3.166748046875, -3.033203125, -2.899658203125, -2.76611328125, -2.632568359375, -2.4990234375, -2.365478515625, -2.23193359375, -2.098388671875, -1.96484375, -1.831298828125, -1.69775390625, -1.564208984375, -1.4306640625, -1.297119140625, -1.16357421875, -1.030029296875, -0.896484375, -0.762939453125, -0.62939453125, -0.495849609375, -0.3623046875, -0.228759765625, -0.09521484375, 0.038330078125, 0.171875, 0.305419921875, 0.43896484375, 0.572509765625, 0.7060546875, 0.839599609375, 0.97314453125, 1.106689453125, 1.240234375, 1.373779296875, 1.50732421875, 1.640869140625, 1.7744140625, 1.907958984375, 2.04150390625, 2.175048828125, 2.30859375, 2.442138671875, 2.57568359375, 2.709228515625, 2.8427734375, 2.976318359375, 3.10986328125, 3.243408203125, 3.376953125, 3.510498046875, 3.64404296875, 3.777587890625, 3.9111328125, 4.044677734375, 4.17822265625, 4.311767578125, 4.4453125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 6.0, 21.0, 17.0, 25.0, 24.0, 48.0, 65.0, 69.0, 89.0, 166.0, 251.0, 358.0, 725.0, 1483.0, 3189.0, 7520.0, 18505.0, 48944.0, 128505.0, 361726.0, 298554.0, 108908.0, 41107.0, 15768.0, 6557.0, 2792.0, 1342.0, 640.0, 385.0, 214.0, 137.0, 105.0, 73.0, 54.0, 41.0, 36.0, 20.0, 17.0, 15.0, 15.0, 5.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.825836181640625, -3.68878173828125, -3.551727294921875, -3.4146728515625, -3.277618408203125, -3.14056396484375, -3.003509521484375, -2.866455078125, -2.729400634765625, -2.59234619140625, -2.455291748046875, -2.3182373046875, -2.181182861328125, -2.04412841796875, -1.907073974609375, -1.77001953125, -1.632965087890625, -1.49591064453125, -1.358856201171875, -1.2218017578125, -1.084747314453125, -0.94769287109375, -0.810638427734375, -0.673583984375, -0.536529541015625, -0.39947509765625, -0.262420654296875, -0.1253662109375, 0.011688232421875, 0.14874267578125, 0.285797119140625, 0.4228515625, 0.559906005859375, 0.69696044921875, 0.834014892578125, 0.9710693359375, 1.108123779296875, 1.24517822265625, 1.382232666015625, 1.519287109375, 1.656341552734375, 1.79339599609375, 1.930450439453125, 2.0675048828125, 2.204559326171875, 2.34161376953125, 2.478668212890625, 2.61572265625, 2.752777099609375, 2.88983154296875, 3.026885986328125, 3.1639404296875, 3.300994873046875, 3.43804931640625, 3.575103759765625, 3.712158203125, 3.849212646484375, 3.98626708984375, 4.123321533203125, 4.2603759765625, 4.397430419921875, 4.53448486328125, 4.671539306640625, 4.80859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 8.0, 2.0, 2.0, 17.0, 12.0, 16.0, 11.0, 19.0, 22.0, 22.0, 20.0, 25.0, 36.0, 45.0, 40.0, 39.0, 47.0, 68.0, 125.0, 266.0, 1465.0, 193.0, 102.0, 60.0, 49.0, 34.0, 35.0, 32.0, 34.0, 34.0, 19.0, 24.0, 13.0, 34.0, 17.0, 14.0, 13.0, 9.0, 4.0, 2.0, 3.0, 8.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0], "bins": [-14.9296875, -14.4676513671875, -14.005615234375, -13.5435791015625, -13.08154296875, -12.6195068359375, -12.157470703125, -11.6954345703125, -11.2333984375, -10.7713623046875, -10.309326171875, -9.8472900390625, -9.38525390625, -8.9232177734375, -8.461181640625, -7.9991455078125, -7.537109375, -7.0750732421875, -6.613037109375, -6.1510009765625, -5.68896484375, -5.2269287109375, -4.764892578125, -4.3028564453125, -3.8408203125, -3.3787841796875, -2.916748046875, -2.4547119140625, -1.99267578125, -1.5306396484375, -1.068603515625, -0.6065673828125, -0.14453125, 0.3175048828125, 0.779541015625, 1.2415771484375, 1.70361328125, 2.1656494140625, 2.627685546875, 3.0897216796875, 3.5517578125, 4.0137939453125, 4.475830078125, 4.9378662109375, 5.39990234375, 5.8619384765625, 6.323974609375, 6.7860107421875, 7.248046875, 7.7100830078125, 8.172119140625, 8.6341552734375, 9.09619140625, 9.5582275390625, 10.020263671875, 10.4822998046875, 10.9443359375, 11.4063720703125, 11.868408203125, 12.3304443359375, 12.79248046875, 13.2545166015625, 13.716552734375, 14.1785888671875, 14.640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 11.0, 14.0, 18.0, 26.0, 40.0, 54.0, 112.0, 143.0, 264.0, 567.0, 3476.0, 3126786.0, 12495.0, 903.0, 320.0, 180.0, 105.0, 61.0, 30.0, 27.0, 13.0, 16.0, 12.0, 7.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.125, -90.4384765625, -87.751953125, -85.0654296875, -82.37890625, -79.6923828125, -77.005859375, -74.3193359375, -71.6328125, -68.9462890625, -66.259765625, -63.5732421875, -60.88671875, -58.2001953125, -55.513671875, -52.8271484375, -50.140625, -47.4541015625, -44.767578125, -42.0810546875, -39.39453125, -36.7080078125, -34.021484375, -31.3349609375, -28.6484375, -25.9619140625, -23.275390625, -20.5888671875, -17.90234375, -15.2158203125, -12.529296875, -9.8427734375, -7.15625, -4.4697265625, -1.783203125, 0.9033203125, 3.58984375, 6.2763671875, 8.962890625, 11.6494140625, 14.3359375, 17.0224609375, 19.708984375, 22.3955078125, 25.08203125, 27.7685546875, 30.455078125, 33.1416015625, 35.828125, 38.5146484375, 41.201171875, 43.8876953125, 46.57421875, 49.2607421875, 51.947265625, 54.6337890625, 57.3203125, 60.0068359375, 62.693359375, 65.3798828125, 68.06640625, 70.7529296875, 73.439453125, 76.1259765625, 78.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 49.0, 448.0, 481.0, 34.0], "bins": [-200.37918090820312, -197.14105224609375, -193.90292358398438, -190.664794921875, -187.4266815185547, -184.1885528564453, -180.95042419433594, -177.71229553222656, -174.4741668701172, -171.2360382080078, -167.99790954589844, -164.75979614257812, -161.52166748046875, -158.28353881835938, -155.04541015625, -151.80728149414062, -148.5691680908203, -145.33103942871094, -142.09291076660156, -138.85479736328125, -135.61666870117188, -132.3785400390625, -129.14041137695312, -125.90228271484375, -122.66415405273438, -119.426025390625, -116.18790435791016, -112.94977569580078, -109.7116470336914, -106.47352600097656, -103.23539733886719, -99.99726867675781, -96.75914764404297, -93.5210189819336, -90.28289794921875, -87.04476928710938, -83.806640625, -80.56851959228516, -77.33039093017578, -74.09226989746094, -70.85414123535156, -67.61601257324219, -64.37789154052734, -61.13976287841797, -57.90163803100586, -54.66351318359375, -51.425384521484375, -48.187259674072266, -44.949134826660156, -41.71100997924805, -38.47288131713867, -35.23475646972656, -31.996631622314453, -28.75850486755371, -25.52037811279297, -22.28225326538086, -19.044124603271484, -15.805998802185059, -12.567873001098633, -9.32974624633789, -6.091620445251465, -2.853494644165039, 0.3846321105957031, 3.6227569580078125, 6.8608832359313965]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 12.0, 7.0, 11.0, 17.0, 15.0, 13.0, 19.0, 27.0, 19.0, 22.0, 30.0, 31.0, 31.0, 56.0, 32.0, 32.0, 30.0, 34.0, 34.0, 33.0, 45.0, 31.0, 37.0, 32.0, 31.0, 35.0, 33.0, 21.0, 27.0, 25.0, 24.0, 18.0, 18.0, 16.0, 15.0, 16.0, 15.0, 17.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.33367919921875, -33.2402229309082, -32.146766662597656, -31.053306579589844, -29.959850311279297, -28.86639404296875, -27.77293586730957, -26.67947769165039, -25.586021423339844, -24.492565155029297, -23.399106979370117, -22.305648803710938, -21.21219253540039, -20.118736267089844, -19.025278091430664, -17.931819915771484, -16.838363647460938, -15.744906425476074, -14.651449203491211, -13.557991981506348, -12.464534759521484, -11.371077537536621, -10.277620315551758, -9.184163093566895, -8.090705871582031, -6.997248649597168, -5.903791427612305, -4.810334205627441, -3.716876983642578, -2.623419761657715, -1.5299625396728516, -0.4365053176879883, 0.6569557189941406, 1.750412940979004, 2.843870162963867, 3.9373273849487305, 5.030784606933594, 6.124241828918457, 7.21769905090332, 8.311156272888184, 9.404613494873047, 10.49807071685791, 11.591527938842773, 12.684985160827637, 13.7784423828125, 14.871899604797363, 15.965356826782227, 17.058815002441406, 18.152271270751953, 19.2457275390625, 20.33918571472168, 21.43264389038086, 22.526100158691406, 23.619556427001953, 24.713014602661133, 25.806472778320312, 26.89992904663086, 27.993385314941406, 29.086843490600586, 30.180301666259766, 31.273757934570312, 32.36721420288086, 33.460670471191406, 34.55413055419922, 35.647586822509766]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 13.0, 2.0, 6.0, 9.0, 11.0, 9.0, 15.0, 14.0, 14.0, 18.0, 30.0, 24.0, 22.0, 22.0, 39.0, 41.0, 42.0, 48.0, 47.0, 45.0, 37.0, 39.0, 37.0, 40.0, 38.0, 45.0, 38.0, 43.0, 34.0, 20.0, 22.0, 16.0, 18.0, 18.0, 19.0, 17.0, 7.0, 9.0, 8.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.48663330078125, -4.3404541015625, -4.19427490234375, -4.048095703125, -3.90191650390625, -3.7557373046875, -3.60955810546875, -3.46337890625, -3.31719970703125, -3.1710205078125, -3.02484130859375, -2.878662109375, -2.73248291015625, -2.5863037109375, -2.44012451171875, -2.2939453125, -2.14776611328125, -2.0015869140625, -1.85540771484375, -1.709228515625, -1.56304931640625, -1.4168701171875, -1.27069091796875, -1.12451171875, -0.97833251953125, -0.8321533203125, -0.68597412109375, -0.539794921875, -0.39361572265625, -0.2474365234375, -0.10125732421875, 0.044921875, 0.19110107421875, 0.3372802734375, 0.48345947265625, 0.629638671875, 0.77581787109375, 0.9219970703125, 1.06817626953125, 1.21435546875, 1.36053466796875, 1.5067138671875, 1.65289306640625, 1.799072265625, 1.94525146484375, 2.0914306640625, 2.23760986328125, 2.3837890625, 2.52996826171875, 2.6761474609375, 2.82232666015625, 2.968505859375, 3.11468505859375, 3.2608642578125, 3.40704345703125, 3.55322265625, 3.69940185546875, 3.8455810546875, 3.99176025390625, 4.137939453125, 4.28411865234375, 4.4302978515625, 4.57647705078125, 4.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 15.0, 9.0, 9.0, 13.0, 15.0, 20.0, 26.0, 28.0, 36.0, 36.0, 59.0, 56.0, 82.0, 107.0, 166.0, 316.0, 851.0, 3376.0, 33276.0, 605975.0, 2704420.0, 793329.0, 45722.0, 4205.0, 966.0, 382.0, 214.0, 125.0, 91.0, 64.0, 55.0, 40.0, 38.0, 35.0, 26.0, 18.0, 13.0, 13.0, 11.0, 8.0, 12.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.599609375, -11.25390625, -10.908203125, -10.5625, -10.216796875, -9.87109375, -9.525390625, -9.1796875, -8.833984375, -8.48828125, -8.142578125, -7.796875, -7.451171875, -7.10546875, -6.759765625, -6.4140625, -6.068359375, -5.72265625, -5.376953125, -5.03125, -4.685546875, -4.33984375, -3.994140625, -3.6484375, -3.302734375, -2.95703125, -2.611328125, -2.265625, -1.919921875, -1.57421875, -1.228515625, -0.8828125, -0.537109375, -0.19140625, 0.154296875, 0.5, 0.845703125, 1.19140625, 1.537109375, 1.8828125, 2.228515625, 2.57421875, 2.919921875, 3.265625, 3.611328125, 3.95703125, 4.302734375, 4.6484375, 4.994140625, 5.33984375, 5.685546875, 6.03125, 6.376953125, 6.72265625, 7.068359375, 7.4140625, 7.759765625, 8.10546875, 8.451171875, 8.796875, 9.142578125, 9.48828125, 9.833984375, 10.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 10.0, 11.0, 11.0, 12.0, 22.0, 33.0, 40.0, 39.0, 62.0, 86.0, 103.0, 157.0, 199.0, 273.0, 340.0, 415.0, 422.0, 415.0, 342.0, 263.0, 226.0, 141.0, 97.0, 86.0, 61.0, 57.0, 35.0, 32.0, 20.0, 15.0, 9.0, 7.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9453125, -10.66839599609375, -10.3914794921875, -10.11456298828125, -9.837646484375, -9.56072998046875, -9.2838134765625, -9.00689697265625, -8.72998046875, -8.45306396484375, -8.1761474609375, -7.89923095703125, -7.622314453125, -7.34539794921875, -7.0684814453125, -6.79156494140625, -6.5146484375, -6.23773193359375, -5.9608154296875, -5.68389892578125, -5.406982421875, -5.13006591796875, -4.8531494140625, -4.57623291015625, -4.29931640625, -4.02239990234375, -3.7454833984375, -3.46856689453125, -3.191650390625, -2.91473388671875, -2.6378173828125, -2.36090087890625, -2.083984375, -1.80706787109375, -1.5301513671875, -1.25323486328125, -0.976318359375, -0.69940185546875, -0.4224853515625, -0.14556884765625, 0.13134765625, 0.40826416015625, 0.6851806640625, 0.96209716796875, 1.239013671875, 1.51593017578125, 1.7928466796875, 2.06976318359375, 2.3466796875, 2.62359619140625, 2.9005126953125, 3.17742919921875, 3.454345703125, 3.73126220703125, 4.0081787109375, 4.28509521484375, 4.56201171875, 4.83892822265625, 5.1158447265625, 5.39276123046875, 5.669677734375, 5.94659423828125, 6.2235107421875, 6.50042724609375, 6.77734375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 9.0, 11.0, 12.0, 23.0, 22.0, 40.0, 61.0, 76.0, 90.0, 117.0, 204.0, 281.0, 430.0, 1031.0, 63333.0, 4094126.0, 32165.0, 893.0, 388.0, 288.0, 194.0, 116.0, 108.0, 68.0, 42.0, 36.0, 36.0, 17.0, 14.0, 10.0, 11.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -32.96435546875, -31.6162109375, -30.26806640625, -28.919921875, -27.57177734375, -26.2236328125, -24.87548828125, -23.52734375, -22.17919921875, -20.8310546875, -19.48291015625, -18.134765625, -16.78662109375, -15.4384765625, -14.09033203125, -12.7421875, -11.39404296875, -10.0458984375, -8.69775390625, -7.349609375, -6.00146484375, -4.6533203125, -3.30517578125, -1.95703125, -0.60888671875, 0.7392578125, 2.08740234375, 3.435546875, 4.78369140625, 6.1318359375, 7.47998046875, 8.828125, 10.17626953125, 11.5244140625, 12.87255859375, 14.220703125, 15.56884765625, 16.9169921875, 18.26513671875, 19.61328125, 20.96142578125, 22.3095703125, 23.65771484375, 25.005859375, 26.35400390625, 27.7021484375, 29.05029296875, 30.3984375, 31.74658203125, 33.0947265625, 34.44287109375, 35.791015625, 37.13916015625, 38.4873046875, 39.83544921875, 41.18359375, 42.53173828125, 43.8798828125, 45.22802734375, 46.576171875, 47.92431640625, 49.2724609375, 50.62060546875, 51.96875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 54.0, 481.0, 436.0, 41.0, 4.0, 1.0, 1.0], "bins": [-393.7418518066406, -387.0700988769531, -380.3983154296875, -373.7265625, -367.0548095703125, -360.3830261230469, -353.7112731933594, -347.03948974609375, -340.36773681640625, -333.69598388671875, -327.0242004394531, -320.3524475097656, -313.6806640625, -307.0089111328125, -300.337158203125, -293.6653747558594, -286.9936218261719, -280.3218688964844, -273.65008544921875, -266.97833251953125, -260.30657958984375, -253.63479614257812, -246.96304321289062, -240.29127502441406, -233.6195068359375, -226.94773864746094, -220.27597045898438, -213.60421752929688, -206.9324493408203, -200.26068115234375, -193.58892822265625, -186.9171600341797, -180.24537658691406, -173.5736083984375, -166.90185546875, -160.23008728027344, -153.55831909179688, -146.8865509033203, -140.21478271484375, -133.54302978515625, -126.87126159667969, -120.19949340820312, -113.5277328491211, -106.85597229003906, -100.1842041015625, -93.51243591308594, -86.8406753540039, -80.16891479492188, -73.49714660644531, -66.82537841796875, -60.15361785888672, -53.48185348510742, -46.810089111328125, -40.13832473754883, -33.46656036376953, -26.794795989990234, -20.123035430908203, -13.451271057128906, -6.779506683349609, -0.1077423095703125, 6.564022064208984, 13.235786437988281, 19.907550811767578, 26.579315185546875, 33.25107955932617]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 12.0, 19.0, 14.0, 17.0, 25.0, 22.0, 31.0, 30.0, 31.0, 33.0, 38.0, 44.0, 50.0, 35.0, 39.0, 35.0, 33.0, 37.0, 40.0, 44.0, 41.0, 35.0, 32.0, 24.0, 27.0, 19.0, 19.0, 23.0, 31.0, 18.0, 13.0, 13.0, 14.0, 9.0, 7.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.215652465820312, -24.342227935791016, -23.46880531311035, -22.595380783081055, -21.721956253051758, -20.848533630371094, -19.975109100341797, -19.1016845703125, -18.228261947631836, -17.35483741760254, -16.481414794921875, -15.607990264892578, -14.734566688537598, -13.861143112182617, -12.98771858215332, -12.11429500579834, -11.240870475769043, -10.367446899414062, -9.494022369384766, -8.620598793029785, -7.747175216674805, -6.873751163482666, -6.000327110290527, -5.126903533935547, -4.253479480743408, -3.3800556659698486, -2.506631851196289, -1.6332077980041504, -0.7597839832305908, 0.11363983154296875, 0.9870638847351074, 1.860487461090088, 2.7339115142822266, 3.607335329055786, 4.480759143829346, 5.354183197021484, 6.227606773376465, 7.1010308265686035, 7.974454879760742, 8.847878456115723, 9.721302032470703, 10.594725608825684, 11.46815013885498, 12.341573715209961, 13.214997291564941, 14.088420867919922, 14.961845397949219, 15.8352689743042, 16.708694458007812, 17.58211898803711, 18.455541610717773, 19.32896614074707, 20.202390670776367, 21.07581329345703, 21.949237823486328, 22.822662353515625, 23.69608497619629, 24.569509506225586, 25.44293212890625, 26.316356658935547, 27.189781188964844, 28.063203811645508, 28.936628341674805, 29.81005096435547, 30.683475494384766]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 9.0, 10.0, 5.0, 8.0, 16.0, 8.0, 11.0, 21.0, 22.0, 21.0, 32.0, 11.0, 31.0, 34.0, 30.0, 41.0, 31.0, 46.0, 43.0, 39.0, 44.0, 37.0, 48.0, 35.0, 42.0, 35.0, 37.0, 27.0, 29.0, 23.0, 21.0, 22.0, 12.0, 22.0, 15.0, 11.0, 10.0, 18.0, 11.0, 8.0, 5.0, 1.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.4296875, -4.29736328125, -4.1650390625, -4.03271484375, -3.900390625, -3.76806640625, -3.6357421875, -3.50341796875, -3.37109375, -3.23876953125, -3.1064453125, -2.97412109375, -2.841796875, -2.70947265625, -2.5771484375, -2.44482421875, -2.3125, -2.18017578125, -2.0478515625, -1.91552734375, -1.783203125, -1.65087890625, -1.5185546875, -1.38623046875, -1.25390625, -1.12158203125, -0.9892578125, -0.85693359375, -0.724609375, -0.59228515625, -0.4599609375, -0.32763671875, -0.1953125, -0.06298828125, 0.0693359375, 0.20166015625, 0.333984375, 0.46630859375, 0.5986328125, 0.73095703125, 0.86328125, 0.99560546875, 1.1279296875, 1.26025390625, 1.392578125, 1.52490234375, 1.6572265625, 1.78955078125, 1.921875, 2.05419921875, 2.1865234375, 2.31884765625, 2.451171875, 2.58349609375, 2.7158203125, 2.84814453125, 2.98046875, 3.11279296875, 3.2451171875, 3.37744140625, 3.509765625, 3.64208984375, 3.7744140625, 3.90673828125, 4.0390625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 12.0, 9.0, 19.0, 18.0, 26.0, 55.0, 74.0, 109.0, 175.0, 223.0, 342.0, 543.0, 758.0, 1096.0, 1689.0, 2456.0, 3506.0, 5199.0, 7609.0, 11093.0, 16260.0, 23826.0, 35225.0, 51924.0, 77190.0, 116511.0, 183941.0, 172446.0, 109506.0, 72698.0, 49159.0, 33114.0, 22896.0, 15575.0, 10587.0, 7223.0, 5029.0, 3312.0, 2288.0, 1477.0, 1119.0, 778.0, 449.0, 338.0, 217.0, 152.0, 93.0, 65.0, 52.0, 32.0, 29.0, 20.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.39013671875, -0.3771018981933594, -0.36406707763671875, -0.3510322570800781, -0.3379974365234375, -0.3249626159667969, -0.31192779541015625, -0.2988929748535156, -0.285858154296875, -0.2728233337402344, -0.25978851318359375, -0.24675369262695312, -0.2337188720703125, -0.22068405151367188, -0.20764923095703125, -0.19461441040039062, -0.18157958984375, -0.16854476928710938, -0.15550994873046875, -0.14247512817382812, -0.1294403076171875, -0.11640548706054688, -0.10337066650390625, -0.09033584594726562, -0.077301025390625, -0.06426620483398438, -0.05123138427734375, -0.038196563720703125, -0.0251617431640625, -0.012126922607421875, 0.00090789794921875, 0.013942718505859375, 0.0269775390625, 0.040012359619140625, 0.05304718017578125, 0.06608200073242188, 0.0791168212890625, 0.09215164184570312, 0.10518646240234375, 0.11822128295898438, 0.131256103515625, 0.14429092407226562, 0.15732574462890625, 0.17036056518554688, 0.1833953857421875, 0.19643020629882812, 0.20946502685546875, 0.22249984741210938, 0.23553466796875, 0.24856948852539062, 0.26160430908203125, 0.2746391296386719, 0.2876739501953125, 0.3007087707519531, 0.31374359130859375, 0.3267784118652344, 0.339813232421875, 0.3528480529785156, 0.36588287353515625, 0.3789176940917969, 0.3919525146484375, 0.4049873352050781, 0.41802215576171875, 0.4310569763183594, 0.444091796875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 13.0, 8.0, 10.0, 14.0, 8.0, 21.0, 17.0, 16.0, 31.0, 21.0, 26.0, 31.0, 39.0, 28.0, 36.0, 52.0, 38.0, 42.0, 47.0, 1060.0, 42.0, 48.0, 36.0, 44.0, 33.0, 27.0, 31.0, 21.0, 31.0, 25.0, 16.0, 18.0, 22.0, 16.0, 8.0, 8.0, 5.0, 5.0, 8.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.5487060546875, -2.462646484375, -2.3765869140625, -2.29052734375, -2.2044677734375, -2.118408203125, -2.0323486328125, -1.9462890625, -1.8602294921875, -1.774169921875, -1.6881103515625, -1.60205078125, -1.5159912109375, -1.429931640625, -1.3438720703125, -1.2578125, -1.1717529296875, -1.085693359375, -0.9996337890625, -0.91357421875, -0.8275146484375, -0.741455078125, -0.6553955078125, -0.5693359375, -0.4832763671875, -0.397216796875, -0.3111572265625, -0.22509765625, -0.1390380859375, -0.052978515625, 0.0330810546875, 0.119140625, 0.2052001953125, 0.291259765625, 0.3773193359375, 0.46337890625, 0.5494384765625, 0.635498046875, 0.7215576171875, 0.8076171875, 0.8936767578125, 0.979736328125, 1.0657958984375, 1.15185546875, 1.2379150390625, 1.323974609375, 1.4100341796875, 1.49609375, 1.5821533203125, 1.668212890625, 1.7542724609375, 1.84033203125, 1.9263916015625, 2.012451171875, 2.0985107421875, 2.1845703125, 2.2706298828125, 2.356689453125, 2.4427490234375, 2.52880859375, 2.6148681640625, 2.700927734375, 2.7869873046875, 2.873046875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 11.0, 18.0, 22.0, 49.0, 61.0, 113.0, 143.0, 168.0, 297.0, 433.0, 674.0, 883.0, 1419.0, 2164.0, 3204.0, 5093.0, 7903.0, 12790.0, 20823.0, 34338.0, 58893.0, 104214.0, 194004.0, 1295692.0, 150046.0, 82742.0, 47206.0, 27712.0, 16824.0, 10364.0, 6509.0, 4203.0, 2730.0, 1780.0, 1203.0, 786.0, 513.0, 350.0, 246.0, 179.0, 103.0, 74.0, 59.0, 30.0, 21.0, 20.0, 7.0, 10.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.47789764404296875, -0.4626312255859375, -0.44736480712890625, -0.432098388671875, -0.41683197021484375, -0.4015655517578125, -0.38629913330078125, -0.37103271484375, -0.35576629638671875, -0.3404998779296875, -0.32523345947265625, -0.309967041015625, -0.29470062255859375, -0.2794342041015625, -0.26416778564453125, -0.2489013671875, -0.23363494873046875, -0.2183685302734375, -0.20310211181640625, -0.187835693359375, -0.17256927490234375, -0.1573028564453125, -0.14203643798828125, -0.12677001953125, -0.11150360107421875, -0.0962371826171875, -0.08097076416015625, -0.065704345703125, -0.05043792724609375, -0.0351715087890625, -0.01990509033203125, -0.004638671875, 0.01062774658203125, 0.0258941650390625, 0.04116058349609375, 0.056427001953125, 0.07169342041015625, 0.0869598388671875, 0.10222625732421875, 0.11749267578125, 0.13275909423828125, 0.1480255126953125, 0.16329193115234375, 0.178558349609375, 0.19382476806640625, 0.2090911865234375, 0.22435760498046875, 0.2396240234375, 0.25489044189453125, 0.2701568603515625, 0.28542327880859375, 0.300689697265625, 0.31595611572265625, 0.3312225341796875, 0.34648895263671875, 0.36175537109375, 0.37702178955078125, 0.3922882080078125, 0.40755462646484375, 0.422821044921875, 0.43808746337890625, 0.4533538818359375, 0.46862030029296875, 0.48388671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 10.0, 10.0, 6.0, 15.0, 13.0, 19.0, 19.0, 34.0, 40.0, 71.0, 99.0, 125.0, 149.0, 111.0, 76.0, 38.0, 26.0, 24.0, 23.0, 5.0, 11.0, 13.0, 12.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004238128662109375, -0.004087924957275391, -0.003937721252441406, -0.003787517547607422, -0.0036373138427734375, -0.003487110137939453, -0.0033369064331054688, -0.0031867027282714844, -0.0030364990234375, -0.0028862953186035156, -0.0027360916137695312, -0.002585887908935547, -0.0024356842041015625, -0.002285480499267578, -0.0021352767944335938, -0.0019850730895996094, -0.001834869384765625, -0.0016846656799316406, -0.0015344619750976562, -0.0013842582702636719, -0.0012340545654296875, -0.0010838508605957031, -0.0009336471557617188, -0.0007834434509277344, -0.00063323974609375, -0.0004830360412597656, -0.00033283233642578125, -0.00018262863159179688, -3.24249267578125e-05, 0.00011777877807617188, 0.00026798248291015625, 0.0004181861877441406, 0.000568389892578125, 0.0007185935974121094, 0.0008687973022460938, 0.0010190010070800781, 0.0011692047119140625, 0.0013194084167480469, 0.0014696121215820312, 0.0016198158264160156, 0.00177001953125, 0.0019202232360839844, 0.0020704269409179688, 0.002220630645751953, 0.0023708343505859375, 0.002521038055419922, 0.0026712417602539062, 0.0028214454650878906, 0.002971649169921875, 0.0031218528747558594, 0.0032720565795898438, 0.003422260284423828, 0.0035724639892578125, 0.003722667694091797, 0.0038728713989257812, 0.004023075103759766, 0.00417327880859375, 0.004323482513427734, 0.004473686218261719, 0.004623889923095703, 0.0047740936279296875, 0.004924297332763672, 0.005074501037597656, 0.005224704742431641, 0.005374908447265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 11.0, 18.0, 10.0, 12.0, 24.0, 30.0, 44.0, 53.0, 79.0, 140.0, 341.0, 1106.0, 1026544.0, 18858.0, 612.0, 239.0, 131.0, 75.0, 57.0, 26.0, 21.0, 23.0, 15.0, 10.0, 16.0, 10.0, 1.0, 7.0, 0.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.113525390625, -0.1103525161743164, -0.10717964172363281, -0.10400676727294922, -0.10083389282226562, -0.09766101837158203, -0.09448814392089844, -0.09131526947021484, -0.08814239501953125, -0.08496952056884766, -0.08179664611816406, -0.07862377166748047, -0.07545089721679688, -0.07227802276611328, -0.06910514831542969, -0.0659322738647461, -0.0627593994140625, -0.059586524963378906, -0.05641365051269531, -0.05324077606201172, -0.050067901611328125, -0.04689502716064453, -0.04372215270996094, -0.040549278259277344, -0.03737640380859375, -0.034203529357910156, -0.031030654907226562, -0.02785778045654297, -0.024684906005859375, -0.02151203155517578, -0.018339157104492188, -0.015166282653808594, -0.011993408203125, -0.008820533752441406, -0.0056476593017578125, -0.0024747848510742188, 0.000698089599609375, 0.0038709640502929688, 0.0070438385009765625, 0.010216712951660156, 0.01338958740234375, 0.016562461853027344, 0.019735336303710938, 0.02290821075439453, 0.026081085205078125, 0.02925395965576172, 0.03242683410644531, 0.035599708557128906, 0.0387725830078125, 0.041945457458496094, 0.04511833190917969, 0.04829120635986328, 0.051464080810546875, 0.05463695526123047, 0.05780982971191406, 0.060982704162597656, 0.06415557861328125, 0.06732845306396484, 0.07050132751464844, 0.07367420196533203, 0.07684707641601562, 0.08001995086669922, 0.08319282531738281, 0.0863656997680664, 0.08953857421875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 31.0, 618.0, 353.0, 13.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026506457943469286, -0.002262889640405774, -0.0018751334864646196, -0.001487377448938787, -0.0010996212949976325, -0.000711865141056478, -0.00032410910353064537, 6.364705041050911e-05, 0.0004514032043516636, 0.0008391593582928181, 0.0012269155122339725, 0.0016146715497598052, 0.0020024278201162815, 0.002390183974057436, 0.002777939895167947, 0.0031656960491091013, 0.0035534522030502558, 0.003941208124160767, 0.004328964278101921, 0.0047167204320430756, 0.00510447658598423, 0.0054922327399253845, 0.005879988893866539, 0.0062677450478076935, 0.006655501201748848, 0.0070432573556900024, 0.007431013509631157, 0.007818769663572311, 0.008206525817513466, 0.00859428197145462, 0.008982038125395775, 0.00936979427933693, 0.00975754950195551, 0.010145305655896664, 0.010533061809837818, 0.010920817963778973, 0.011308574117720127, 0.011696330271661282, 0.012084086425602436, 0.01247184257954359, 0.012859598733484745, 0.0132473548874259, 0.013635111041367054, 0.014022867195308208, 0.014410623349249363, 0.014798379503190517, 0.015186135657131672, 0.015573891811072826, 0.015961647033691406, 0.01634940318763256, 0.016737159341573715, 0.01712491549551487, 0.017512671649456024, 0.01790042780339718, 0.018288183957338333, 0.018675940111279488, 0.019063696265220642, 0.019451452419161797, 0.01983920857310295, 0.020226964727044106, 0.02061472088098526, 0.021002477034926414, 0.02139023318886757, 0.021777989342808723, 0.022165745496749878]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 2.0, 8.0, 10.0, 9.0, 10.0, 16.0, 22.0, 21.0, 16.0, 20.0, 26.0, 32.0, 26.0, 27.0, 15.0, 26.0, 40.0, 44.0, 39.0, 37.0, 33.0, 41.0, 29.0, 29.0, 31.0, 28.0, 34.0, 25.0, 27.0, 39.0, 24.0, 22.0, 19.0, 16.0, 21.0, 19.0, 21.0, 6.0, 23.0, 16.0, 7.0, 8.0, 6.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0017477869987487793, -0.0016932990401983261, -0.001638811081647873, -0.0015843231230974197, -0.0015298351645469666, -0.0014753472059965134, -0.0014208592474460602, -0.001366371288895607, -0.0013118833303451538, -0.0012573953717947006, -0.0012029074132442474, -0.0011484194546937943, -0.001093931496143341, -0.0010394435375928879, -0.0009849555790424347, -0.0009304676204919815, -0.0008759796619415283, -0.0008214917033910751, -0.000767003744840622, -0.0007125157862901688, -0.0006580278277397156, -0.0006035398691892624, -0.0005490519106388092, -0.000494563952088356, -0.00044007599353790283, -0.00038558803498744965, -0.00033110007643699646, -0.0002766121178865433, -0.0002221241593360901, -0.0001676362007856369, -0.00011314824223518372, -5.866028368473053e-05, -4.172325134277344e-06, 5.031563341617584e-05, 0.00010480359196662903, 0.00015929155051708221, 0.0002137795090675354, 0.0002682674676179886, 0.00032275542616844177, 0.00037724338471889496, 0.00043173134326934814, 0.00048621930181980133, 0.0005407072603702545, 0.0005951952189207077, 0.0006496831774711609, 0.0007041711360216141, 0.0007586590945720673, 0.0008131470531225204, 0.0008676350116729736, 0.0009221229702234268, 0.00097661092877388, 0.0010310988873243332, 0.0010855868458747864, 0.0011400748044252396, 0.0011945627629756927, 0.001249050721526146, 0.0013035386800765991, 0.0013580266386270523, 0.0014125145971775055, 0.0014670025557279587, 0.0015214905142784119, 0.001575978472828865, 0.0016304664313793182, 0.0016849543899297714, 0.0017394423484802246]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 9.0, 10.0, 5.0, 8.0, 16.0, 8.0, 11.0, 21.0, 22.0, 21.0, 32.0, 11.0, 31.0, 34.0, 30.0, 41.0, 31.0, 46.0, 43.0, 39.0, 44.0, 37.0, 48.0, 35.0, 42.0, 35.0, 37.0, 27.0, 29.0, 23.0, 21.0, 22.0, 12.0, 22.0, 15.0, 11.0, 10.0, 18.0, 11.0, 8.0, 5.0, 1.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.4296875, -4.29736328125, -4.1650390625, -4.03271484375, -3.900390625, -3.76806640625, -3.6357421875, -3.50341796875, -3.37109375, -3.23876953125, -3.1064453125, -2.97412109375, -2.841796875, -2.70947265625, -2.5771484375, -2.44482421875, -2.3125, -2.18017578125, -2.0478515625, -1.91552734375, -1.783203125, -1.65087890625, -1.5185546875, -1.38623046875, -1.25390625, -1.12158203125, -0.9892578125, -0.85693359375, -0.724609375, -0.59228515625, -0.4599609375, -0.32763671875, -0.1953125, -0.06298828125, 0.0693359375, 0.20166015625, 0.333984375, 0.46630859375, 0.5986328125, 0.73095703125, 0.86328125, 0.99560546875, 1.1279296875, 1.26025390625, 1.392578125, 1.52490234375, 1.6572265625, 1.78955078125, 1.921875, 2.05419921875, 2.1865234375, 2.31884765625, 2.451171875, 2.58349609375, 2.7158203125, 2.84814453125, 2.98046875, 3.11279296875, 3.2451171875, 3.37744140625, 3.509765625, 3.64208984375, 3.7744140625, 3.90673828125, 4.0390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 8.0, 12.0, 9.0, 12.0, 9.0, 14.0, 27.0, 36.0, 51.0, 72.0, 150.0, 263.0, 436.0, 824.0, 1630.0, 3091.0, 5772.0, 11259.0, 22889.0, 48588.0, 116573.0, 294190.0, 315329.0, 126054.0, 51898.0, 23974.0, 12175.0, 6239.0, 3224.0, 1671.0, 953.0, 431.0, 257.0, 152.0, 75.0, 53.0, 30.0, 23.0, 19.0, 11.0, 14.0, 12.0, 6.0, 9.0, 12.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-4.1171875, -3.992584228515625, -3.86798095703125, -3.743377685546875, -3.6187744140625, -3.494171142578125, -3.36956787109375, -3.244964599609375, -3.120361328125, -2.995758056640625, -2.87115478515625, -2.746551513671875, -2.6219482421875, -2.497344970703125, -2.37274169921875, -2.248138427734375, -2.12353515625, -1.998931884765625, -1.87432861328125, -1.749725341796875, -1.6251220703125, -1.500518798828125, -1.37591552734375, -1.251312255859375, -1.126708984375, -1.002105712890625, -0.87750244140625, -0.752899169921875, -0.6282958984375, -0.503692626953125, -0.37908935546875, -0.254486083984375, -0.1298828125, -0.005279541015625, 0.11932373046875, 0.243927001953125, 0.3685302734375, 0.493133544921875, 0.61773681640625, 0.742340087890625, 0.866943359375, 0.991546630859375, 1.11614990234375, 1.240753173828125, 1.3653564453125, 1.489959716796875, 1.61456298828125, 1.739166259765625, 1.86376953125, 1.988372802734375, 2.11297607421875, 2.237579345703125, 2.3621826171875, 2.486785888671875, 2.61138916015625, 2.735992431640625, 2.860595703125, 2.985198974609375, 3.10980224609375, 3.234405517578125, 3.3590087890625, 3.483612060546875, 3.60821533203125, 3.732818603515625, 3.857421875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 10.0, 5.0, 8.0, 15.0, 13.0, 13.0, 26.0, 44.0, 18.0, 34.0, 41.0, 38.0, 62.0, 62.0, 104.0, 279.0, 1606.0, 229.0, 86.0, 66.0, 51.0, 39.0, 45.0, 27.0, 25.0, 35.0, 17.0, 13.0, 11.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.54296875, -20.8984375, -20.25390625, -19.609375, -18.96484375, -18.3203125, -17.67578125, -17.03125, -16.38671875, -15.7421875, -15.09765625, -14.453125, -13.80859375, -13.1640625, -12.51953125, -11.875, -11.23046875, -10.5859375, -9.94140625, -9.296875, -8.65234375, -8.0078125, -7.36328125, -6.71875, -6.07421875, -5.4296875, -4.78515625, -4.140625, -3.49609375, -2.8515625, -2.20703125, -1.5625, -0.91796875, -0.2734375, 0.37109375, 1.015625, 1.66015625, 2.3046875, 2.94921875, 3.59375, 4.23828125, 4.8828125, 5.52734375, 6.171875, 6.81640625, 7.4609375, 8.10546875, 8.75, 9.39453125, 10.0390625, 10.68359375, 11.328125, 11.97265625, 12.6171875, 13.26171875, 13.90625, 14.55078125, 15.1953125, 15.83984375, 16.484375, 17.12890625, 17.7734375, 18.41796875, 19.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 13.0, 29.0, 31.0, 27.0, 56.0, 72.0, 97.0, 164.0, 299.0, 625.0, 5205.0, 3127733.0, 9728.0, 692.0, 342.0, 201.0, 111.0, 69.0, 63.0, 37.0, 23.0, 25.0, 18.0, 10.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.625, -60.505859375, -58.38671875, -56.267578125, -54.1484375, -52.029296875, -49.91015625, -47.791015625, -45.671875, -43.552734375, -41.43359375, -39.314453125, -37.1953125, -35.076171875, -32.95703125, -30.837890625, -28.71875, -26.599609375, -24.48046875, -22.361328125, -20.2421875, -18.123046875, -16.00390625, -13.884765625, -11.765625, -9.646484375, -7.52734375, -5.408203125, -3.2890625, -1.169921875, 0.94921875, 3.068359375, 5.1875, 7.306640625, 9.42578125, 11.544921875, 13.6640625, 15.783203125, 17.90234375, 20.021484375, 22.140625, 24.259765625, 26.37890625, 28.498046875, 30.6171875, 32.736328125, 34.85546875, 36.974609375, 39.09375, 41.212890625, 43.33203125, 45.451171875, 47.5703125, 49.689453125, 51.80859375, 53.927734375, 56.046875, 58.166015625, 60.28515625, 62.404296875, 64.5234375, 66.642578125, 68.76171875, 70.880859375, 73.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 16.0, 304.0, 590.0, 100.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-175.8588409423828, -172.73094177246094, -169.60302734375, -166.47512817382812, -163.34722900390625, -160.2193145751953, -157.09141540527344, -153.96351623535156, -150.83560180664062, -147.70770263671875, -144.5797882080078, -141.45188903808594, -138.32398986816406, -135.19607543945312, -132.06817626953125, -128.94027709960938, -125.81237030029297, -122.68446350097656, -119.55656433105469, -116.42865753173828, -113.30075073242188, -110.1728515625, -107.0449447631836, -103.91703796386719, -100.78913879394531, -97.6612319946289, -94.53333282470703, -91.40542602539062, -88.27751922607422, -85.14961242675781, -82.02171325683594, -78.89380645751953, -75.76590728759766, -72.63800048828125, -69.51010131835938, -66.38219451904297, -63.25428771972656, -60.12638473510742, -56.99848175048828, -53.870574951171875, -50.742671966552734, -47.614768981933594, -44.48686218261719, -41.35895919799805, -38.231056213378906, -35.1031494140625, -31.97524642944336, -28.847341537475586, -25.719436645507812, -22.59153175354004, -19.463626861572266, -16.335723876953125, -13.207818984985352, -10.079914093017578, -6.9520111083984375, -3.824106216430664, -0.6962013244628906, 2.4317030906677246, 5.55960750579834, 8.687511444091797, 11.81541633605957, 14.943321228027344, 18.071224212646484, 21.199129104614258, 24.32703399658203]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 4.0, 9.0, 8.0, 12.0, 14.0, 19.0, 14.0, 23.0, 23.0, 29.0, 32.0, 34.0, 34.0, 46.0, 45.0, 48.0, 37.0, 43.0, 61.0, 53.0, 42.0, 41.0, 43.0, 37.0, 27.0, 35.0, 19.0, 30.0, 24.0, 14.0, 12.0, 18.0, 9.0, 14.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.43581008911133, -37.1386604309082, -35.84151077270508, -34.54435729980469, -33.24720764160156, -31.950057983398438, -30.652908325195312, -29.355758666992188, -28.058609008789062, -26.761459350585938, -25.46430778503418, -24.167158126831055, -22.87000846862793, -21.572856903076172, -20.275707244873047, -18.978557586669922, -17.681406021118164, -16.38425636291504, -15.087105751037598, -13.789955139160156, -12.492805480957031, -11.19565486907959, -9.898504257202148, -8.601354598999023, -7.304203987121582, -6.007053852081299, -4.709903717041016, -3.412753105163574, -2.115602970123291, -0.8184528350830078, 0.4786977767944336, 1.7758474349975586, 3.072998046875, 4.370148181915283, 5.667298316955566, 6.964448928833008, 8.261598587036133, 9.558749198913574, 10.855899810791016, 12.15304946899414, 13.450200080871582, 14.747350692749023, 16.04450035095215, 17.341651916503906, 18.63880157470703, 19.935951232910156, 21.23310089111328, 22.530250549316406, 23.827402114868164, 25.12455177307129, 26.421703338623047, 27.718852996826172, 29.016002655029297, 30.313152313232422, 31.61030387878418, 32.90745544433594, 34.20460510253906, 35.50175476074219, 36.79890441894531, 38.09605407714844, 39.39320755004883, 40.69035720825195, 41.98750686645508, 43.2846565246582, 44.58180618286133]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 14.0, 13.0, 14.0, 20.0, 20.0, 16.0, 21.0, 20.0, 22.0, 33.0, 30.0, 38.0, 27.0, 54.0, 44.0, 39.0, 43.0, 40.0, 43.0, 33.0, 39.0, 40.0, 39.0, 25.0, 23.0, 28.0, 28.0, 22.0, 23.0, 15.0, 18.0, 15.0, 14.0, 8.0, 10.0, 9.0, 8.0, 3.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.8359375, -4.690673828125, -4.54541015625, -4.400146484375, -4.2548828125, -4.109619140625, -3.96435546875, -3.819091796875, -3.673828125, -3.528564453125, -3.38330078125, -3.238037109375, -3.0927734375, -2.947509765625, -2.80224609375, -2.656982421875, -2.51171875, -2.366455078125, -2.22119140625, -2.075927734375, -1.9306640625, -1.785400390625, -1.64013671875, -1.494873046875, -1.349609375, -1.204345703125, -1.05908203125, -0.913818359375, -0.7685546875, -0.623291015625, -0.47802734375, -0.332763671875, -0.1875, -0.042236328125, 0.10302734375, 0.248291015625, 0.3935546875, 0.538818359375, 0.68408203125, 0.829345703125, 0.974609375, 1.119873046875, 1.26513671875, 1.410400390625, 1.5556640625, 1.700927734375, 1.84619140625, 1.991455078125, 2.13671875, 2.281982421875, 2.42724609375, 2.572509765625, 2.7177734375, 2.863037109375, 3.00830078125, 3.153564453125, 3.298828125, 3.444091796875, 3.58935546875, 3.734619140625, 3.8798828125, 4.025146484375, 4.17041015625, 4.315673828125, 4.4609375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 5.0, 8.0, 10.0, 18.0, 15.0, 18.0, 21.0, 32.0, 46.0, 60.0, 73.0, 73.0, 147.0, 207.0, 478.0, 1565.0, 11571.0, 428582.0, 3210134.0, 523978.0, 14190.0, 1688.0, 531.0, 226.0, 140.0, 109.0, 66.0, 70.0, 56.0, 24.0, 19.0, 22.0, 22.0, 13.0, 15.0, 6.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.671875, -16.20263671875, -15.7333984375, -15.26416015625, -14.794921875, -14.32568359375, -13.8564453125, -13.38720703125, -12.91796875, -12.44873046875, -11.9794921875, -11.51025390625, -11.041015625, -10.57177734375, -10.1025390625, -9.63330078125, -9.1640625, -8.69482421875, -8.2255859375, -7.75634765625, -7.287109375, -6.81787109375, -6.3486328125, -5.87939453125, -5.41015625, -4.94091796875, -4.4716796875, -4.00244140625, -3.533203125, -3.06396484375, -2.5947265625, -2.12548828125, -1.65625, -1.18701171875, -0.7177734375, -0.24853515625, 0.220703125, 0.68994140625, 1.1591796875, 1.62841796875, 2.09765625, 2.56689453125, 3.0361328125, 3.50537109375, 3.974609375, 4.44384765625, 4.9130859375, 5.38232421875, 5.8515625, 6.32080078125, 6.7900390625, 7.25927734375, 7.728515625, 8.19775390625, 8.6669921875, 9.13623046875, 9.60546875, 10.07470703125, 10.5439453125, 11.01318359375, 11.482421875, 11.95166015625, 12.4208984375, 12.89013671875, 13.359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 12.0, 15.0, 35.0, 49.0, 61.0, 81.0, 115.0, 172.0, 214.0, 310.0, 459.0, 561.0, 562.0, 408.0, 283.0, 221.0, 167.0, 95.0, 69.0, 51.0, 32.0, 27.0, 20.0, 14.0, 9.0, 9.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.8204345703125, -11.461181640625, -11.1019287109375, -10.74267578125, -10.3834228515625, -10.024169921875, -9.6649169921875, -9.3056640625, -8.9464111328125, -8.587158203125, -8.2279052734375, -7.86865234375, -7.5093994140625, -7.150146484375, -6.7908935546875, -6.431640625, -6.0723876953125, -5.713134765625, -5.3538818359375, -4.99462890625, -4.6353759765625, -4.276123046875, -3.9168701171875, -3.5576171875, -3.1983642578125, -2.839111328125, -2.4798583984375, -2.12060546875, -1.7613525390625, -1.402099609375, -1.0428466796875, -0.68359375, -0.3243408203125, 0.034912109375, 0.3941650390625, 0.75341796875, 1.1126708984375, 1.471923828125, 1.8311767578125, 2.1904296875, 2.5496826171875, 2.908935546875, 3.2681884765625, 3.62744140625, 3.9866943359375, 4.345947265625, 4.7052001953125, 5.064453125, 5.4237060546875, 5.782958984375, 6.1422119140625, 6.50146484375, 6.8607177734375, 7.219970703125, 7.5792236328125, 7.9384765625, 8.2977294921875, 8.656982421875, 9.0162353515625, 9.37548828125, 9.7347412109375, 10.093994140625, 10.4532470703125, 10.8125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 6.0, 1.0, 8.0, 11.0, 11.0, 23.0, 31.0, 29.0, 54.0, 89.0, 110.0, 199.0, 305.0, 443.0, 1326.0, 490825.0, 3695596.0, 3650.0, 578.0, 305.0, 229.0, 145.0, 113.0, 58.0, 55.0, 32.0, 18.0, 12.0, 9.0, 7.0, 1.0, 8.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.34375, -47.70751953125, -46.0712890625, -44.43505859375, -42.798828125, -41.16259765625, -39.5263671875, -37.89013671875, -36.25390625, -34.61767578125, -32.9814453125, -31.34521484375, -29.708984375, -28.07275390625, -26.4365234375, -24.80029296875, -23.1640625, -21.52783203125, -19.8916015625, -18.25537109375, -16.619140625, -14.98291015625, -13.3466796875, -11.71044921875, -10.07421875, -8.43798828125, -6.8017578125, -5.16552734375, -3.529296875, -1.89306640625, -0.2568359375, 1.37939453125, 3.015625, 4.65185546875, 6.2880859375, 7.92431640625, 9.560546875, 11.19677734375, 12.8330078125, 14.46923828125, 16.10546875, 17.74169921875, 19.3779296875, 21.01416015625, 22.650390625, 24.28662109375, 25.9228515625, 27.55908203125, 29.1953125, 30.83154296875, 32.4677734375, 34.10400390625, 35.740234375, 37.37646484375, 39.0126953125, 40.64892578125, 42.28515625, 43.92138671875, 45.5576171875, 47.19384765625, 48.830078125, 50.46630859375, 52.1025390625, 53.73876953125, 55.375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 20.0, 70.0, 224.0, 308.0, 263.0, 97.0, 26.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-130.99229431152344, -127.77217102050781, -124.55205535888672, -121.33193969726562, -118.11181640625, -114.89169311523438, -111.67157745361328, -108.45146179199219, -105.23133850097656, -102.01121520996094, -98.79109954833984, -95.57098388671875, -92.35086059570312, -89.1307373046875, -85.9106216430664, -82.69050598144531, -79.47038269042969, -76.25025939941406, -73.03014373779297, -69.81002807617188, -66.58990478515625, -63.36978530883789, -60.14966583251953, -56.92954635620117, -53.70942687988281, -50.48930740356445, -47.269187927246094, -44.049068450927734, -40.828948974609375, -37.608829498291016, -34.388710021972656, -31.168590545654297, -27.948471069335938, -24.728351593017578, -21.50823211669922, -18.28811264038086, -15.0679931640625, -11.84787368774414, -8.627754211425781, -5.407634735107422, -2.1875152587890625, 1.0326042175292969, 4.252723693847656, 7.472843170166016, 10.692962646484375, 13.913082122802734, 17.133201599121094, 20.353321075439453, 23.573440551757812, 26.793560028076172, 30.01367950439453, 33.23379898071289, 36.45391845703125, 39.67403793334961, 42.89415740966797, 46.11427688598633, 49.33439636230469, 52.55451583862305, 55.774635314941406, 58.994754791259766, 62.214874267578125, 65.43499755859375, 68.65511322021484, 71.87522888183594, 75.09535217285156]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 7.0, 6.0, 12.0, 6.0, 9.0, 10.0, 17.0, 19.0, 16.0, 29.0, 35.0, 34.0, 38.0, 22.0, 50.0, 46.0, 43.0, 42.0, 51.0, 43.0, 35.0, 48.0, 37.0, 48.0, 44.0, 25.0, 28.0, 29.0, 18.0, 18.0, 14.0, 20.0, 29.0, 15.0, 13.0, 8.0, 5.0, 6.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.433204650878906, -27.459083557128906, -26.484962463378906, -25.51084327697754, -24.53672218322754, -23.56260108947754, -22.588481903076172, -21.614360809326172, -20.640239715576172, -19.666118621826172, -18.691997528076172, -17.717878341674805, -16.743757247924805, -15.769636154174805, -14.795516014099121, -13.821395874023438, -12.847274780273438, -11.873153686523438, -10.899033546447754, -9.92491340637207, -8.95079231262207, -7.9766716957092285, -7.002551078796387, -6.028430461883545, -5.054309844970703, -4.080189228057861, -3.1060686111450195, -2.1319479942321777, -1.157827377319336, -0.18370676040649414, 0.7904138565063477, 1.7645344734191895, 2.7386550903320312, 3.712775707244873, 4.686896324157715, 5.661016941070557, 6.635137557983398, 7.60925817489624, 8.583378791809082, 9.557498931884766, 10.531620025634766, 11.505741119384766, 12.47986125946045, 13.453981399536133, 14.428102493286133, 15.402223587036133, 16.3763427734375, 17.3504638671875, 18.3245849609375, 19.2987060546875, 20.2728271484375, 21.246946334838867, 22.221067428588867, 23.195188522338867, 24.169307708740234, 25.143428802490234, 26.117549896240234, 27.091670989990234, 28.065792083740234, 29.0399112701416, 30.0140323638916, 30.9881534576416, 31.96227264404297, 32.93639373779297, 33.91051483154297]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 9.0, 5.0, 7.0, 11.0, 12.0, 12.0, 12.0, 16.0, 24.0, 19.0, 25.0, 27.0, 35.0, 33.0, 36.0, 46.0, 46.0, 35.0, 44.0, 59.0, 40.0, 44.0, 40.0, 39.0, 37.0, 40.0, 32.0, 33.0, 29.0, 25.0, 22.0, 18.0, 14.0, 8.0, 11.0, 20.0, 7.0, 4.0, 6.0, 9.0, 7.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.77203369140625, -4.6182861328125, -4.46453857421875, -4.310791015625, -4.15704345703125, -4.0032958984375, -3.84954833984375, -3.69580078125, -3.54205322265625, -3.3883056640625, -3.23455810546875, -3.080810546875, -2.92706298828125, -2.7733154296875, -2.61956787109375, -2.4658203125, -2.31207275390625, -2.1583251953125, -2.00457763671875, -1.850830078125, -1.69708251953125, -1.5433349609375, -1.38958740234375, -1.23583984375, -1.08209228515625, -0.9283447265625, -0.77459716796875, -0.620849609375, -0.46710205078125, -0.3133544921875, -0.15960693359375, -0.005859375, 0.14788818359375, 0.3016357421875, 0.45538330078125, 0.609130859375, 0.76287841796875, 0.9166259765625, 1.07037353515625, 1.22412109375, 1.37786865234375, 1.5316162109375, 1.68536376953125, 1.839111328125, 1.99285888671875, 2.1466064453125, 2.30035400390625, 2.4541015625, 2.60784912109375, 2.7615966796875, 2.91534423828125, 3.069091796875, 3.22283935546875, 3.3765869140625, 3.53033447265625, 3.68408203125, 3.83782958984375, 3.9915771484375, 4.14532470703125, 4.299072265625, 4.45281982421875, 4.6065673828125, 4.76031494140625, 4.9140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 13.0, 9.0, 26.0, 17.0, 45.0, 74.0, 117.0, 195.0, 332.0, 459.0, 797.0, 1492.0, 2427.0, 3906.0, 6850.0, 11694.0, 19183.0, 31753.0, 53600.0, 93178.0, 168804.0, 266059.0, 165508.0, 91211.0, 52653.0, 31506.0, 18706.0, 11295.0, 6775.0, 3946.0, 2424.0, 1442.0, 815.0, 500.0, 275.0, 153.0, 93.0, 80.0, 40.0, 35.0, 26.0, 16.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.60693359375, -0.5882492065429688, -0.5695648193359375, -0.5508804321289062, -0.532196044921875, -0.5135116577148438, -0.4948272705078125, -0.47614288330078125, -0.45745849609375, -0.43877410888671875, -0.4200897216796875, -0.40140533447265625, -0.382720947265625, -0.36403656005859375, -0.3453521728515625, -0.32666778564453125, -0.3079833984375, -0.28929901123046875, -0.2706146240234375, -0.25193023681640625, -0.233245849609375, -0.21456146240234375, -0.1958770751953125, -0.17719268798828125, -0.15850830078125, -0.13982391357421875, -0.1211395263671875, -0.10245513916015625, -0.083770751953125, -0.06508636474609375, -0.0464019775390625, -0.02771759033203125, -0.009033203125, 0.00965118408203125, 0.0283355712890625, 0.04701995849609375, 0.065704345703125, 0.08438873291015625, 0.1030731201171875, 0.12175750732421875, 0.14044189453125, 0.15912628173828125, 0.1778106689453125, 0.19649505615234375, 0.215179443359375, 0.23386383056640625, 0.2525482177734375, 0.27123260498046875, 0.2899169921875, 0.30860137939453125, 0.3272857666015625, 0.34597015380859375, 0.364654541015625, 0.38333892822265625, 0.4020233154296875, 0.42070770263671875, 0.43939208984375, 0.45807647705078125, 0.4767608642578125, 0.49544525146484375, 0.514129638671875, 0.5328140258789062, 0.5514984130859375, 0.5701828002929688, 0.5888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 2.0, 10.0, 14.0, 17.0, 12.0, 21.0, 20.0, 17.0, 22.0, 24.0, 32.0, 31.0, 48.0, 41.0, 34.0, 39.0, 38.0, 47.0, 1068.0, 34.0, 40.0, 48.0, 38.0, 44.0, 29.0, 32.0, 20.0, 22.0, 26.0, 25.0, 24.0, 16.0, 16.0, 9.0, 9.0, 10.0, 6.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.333984375, -3.23809814453125, -3.1422119140625, -3.04632568359375, -2.950439453125, -2.85455322265625, -2.7586669921875, -2.66278076171875, -2.56689453125, -2.47100830078125, -2.3751220703125, -2.27923583984375, -2.183349609375, -2.08746337890625, -1.9915771484375, -1.89569091796875, -1.7998046875, -1.70391845703125, -1.6080322265625, -1.51214599609375, -1.416259765625, -1.32037353515625, -1.2244873046875, -1.12860107421875, -1.03271484375, -0.93682861328125, -0.8409423828125, -0.74505615234375, -0.649169921875, -0.55328369140625, -0.4573974609375, -0.36151123046875, -0.265625, -0.16973876953125, -0.0738525390625, 0.02203369140625, 0.117919921875, 0.21380615234375, 0.3096923828125, 0.40557861328125, 0.50146484375, 0.59735107421875, 0.6932373046875, 0.78912353515625, 0.885009765625, 0.98089599609375, 1.0767822265625, 1.17266845703125, 1.2685546875, 1.36444091796875, 1.4603271484375, 1.55621337890625, 1.652099609375, 1.74798583984375, 1.8438720703125, 1.93975830078125, 2.03564453125, 2.13153076171875, 2.2274169921875, 2.32330322265625, 2.419189453125, 2.51507568359375, 2.6109619140625, 2.70684814453125, 2.802734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 6.0, 18.0, 25.0, 24.0, 47.0, 58.0, 120.0, 136.0, 226.0, 341.0, 483.0, 630.0, 908.0, 1285.0, 1943.0, 2967.0, 4227.0, 6465.0, 9770.0, 15317.0, 24247.0, 38513.0, 63026.0, 105954.0, 179321.0, 1265251.0, 146022.0, 86623.0, 52410.0, 32246.0, 20163.0, 12905.0, 8360.0, 5442.0, 3665.0, 2474.0, 1708.0, 1165.0, 808.0, 564.0, 400.0, 229.0, 202.0, 130.0, 82.0, 74.0, 53.0, 35.0, 18.0, 17.0, 13.0, 8.0, 1.0, 4.0, 1.0], "bins": [-0.51220703125, -0.4972801208496094, -0.48235321044921875, -0.4674263000488281, -0.4524993896484375, -0.4375724792480469, -0.42264556884765625, -0.4077186584472656, -0.392791748046875, -0.3778648376464844, -0.36293792724609375, -0.3480110168457031, -0.3330841064453125, -0.3181571960449219, -0.30323028564453125, -0.2883033752441406, -0.27337646484375, -0.2584495544433594, -0.24352264404296875, -0.22859573364257812, -0.2136688232421875, -0.19874191284179688, -0.18381500244140625, -0.16888809204101562, -0.153961181640625, -0.13903427124023438, -0.12410736083984375, -0.10918045043945312, -0.0942535400390625, -0.07932662963867188, -0.06439971923828125, -0.049472808837890625, -0.0345458984375, -0.019618988037109375, -0.00469207763671875, 0.010234832763671875, 0.0251617431640625, 0.040088653564453125, 0.05501556396484375, 0.06994247436523438, 0.084869384765625, 0.09979629516601562, 0.11472320556640625, 0.12965011596679688, 0.1445770263671875, 0.15950393676757812, 0.17443084716796875, 0.18935775756835938, 0.20428466796875, 0.21921157836914062, 0.23413848876953125, 0.24906539916992188, 0.2639923095703125, 0.2789192199707031, 0.29384613037109375, 0.3087730407714844, 0.323699951171875, 0.3386268615722656, 0.35355377197265625, 0.3684806823730469, 0.3834075927734375, 0.3983345031738281, 0.41326141357421875, 0.4281883239746094, 0.443115234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 6.0, 7.0, 17.0, 19.0, 15.0, 23.0, 35.0, 54.0, 50.0, 115.0, 112.0, 136.0, 95.0, 71.0, 39.0, 35.0, 26.0, 15.0, 20.0, 12.0, 16.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005901336669921875, -0.005716979503631592, -0.005532622337341309, -0.005348265171051025, -0.005163908004760742, -0.004979550838470459, -0.004795193672180176, -0.004610836505889893, -0.004426479339599609, -0.004242122173309326, -0.004057765007019043, -0.0038734078407287598, -0.0036890506744384766, -0.0035046935081481934, -0.00332033634185791, -0.003135979175567627, -0.0029516220092773438, -0.0027672648429870605, -0.0025829076766967773, -0.002398550510406494, -0.002214193344116211, -0.0020298361778259277, -0.0018454790115356445, -0.0016611218452453613, -0.0014767646789550781, -0.001292407512664795, -0.0011080503463745117, -0.0009236931800842285, -0.0007393360137939453, -0.0005549788475036621, -0.0003706216812133789, -0.0001862645149230957, -1.9073486328125e-06, 0.0001824498176574707, 0.0003668069839477539, 0.0005511641502380371, 0.0007355213165283203, 0.0009198784828186035, 0.0011042356491088867, 0.00128859281539917, 0.0014729499816894531, 0.0016573071479797363, 0.0018416643142700195, 0.0020260214805603027, 0.002210378646850586, 0.002394735813140869, 0.0025790929794311523, 0.0027634501457214355, 0.0029478073120117188, 0.003132164478302002, 0.003316521644592285, 0.0035008788108825684, 0.0036852359771728516, 0.0038695931434631348, 0.004053950309753418, 0.004238307476043701, 0.004422664642333984, 0.004607021808624268, 0.004791378974914551, 0.004975736141204834, 0.005160093307495117, 0.0053444504737854, 0.005528807640075684, 0.005713164806365967, 0.00589752197265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 9.0, 5.0, 5.0, 9.0, 8.0, 7.0, 12.0, 15.0, 23.0, 32.0, 33.0, 51.0, 51.0, 90.0, 135.0, 317.0, 758.0, 267490.0, 777911.0, 824.0, 302.0, 164.0, 101.0, 46.0, 38.0, 26.0, 22.0, 19.0, 13.0, 11.0, 7.0, 3.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.126708984375, -0.12275314331054688, -0.11879730224609375, -0.11484146118164062, -0.1108856201171875, -0.10692977905273438, -0.10297393798828125, -0.09901809692382812, -0.095062255859375, -0.09110641479492188, -0.08715057373046875, -0.08319473266601562, -0.0792388916015625, -0.07528305053710938, -0.07132720947265625, -0.06737136840820312, -0.06341552734375, -0.059459686279296875, -0.05550384521484375, -0.051548004150390625, -0.0475921630859375, -0.043636322021484375, -0.03968048095703125, -0.035724639892578125, -0.031768798828125, -0.027812957763671875, -0.02385711669921875, -0.019901275634765625, -0.0159454345703125, -0.011989593505859375, -0.00803375244140625, -0.004077911376953125, -0.0001220703125, 0.003833770751953125, 0.00778961181640625, 0.011745452880859375, 0.0157012939453125, 0.019657135009765625, 0.02361297607421875, 0.027568817138671875, 0.031524658203125, 0.035480499267578125, 0.03943634033203125, 0.043392181396484375, 0.0473480224609375, 0.051303863525390625, 0.05525970458984375, 0.059215545654296875, 0.06317138671875, 0.06712722778320312, 0.07108306884765625, 0.07503890991210938, 0.0789947509765625, 0.08295059204101562, 0.08690643310546875, 0.09086227416992188, 0.094818115234375, 0.09877395629882812, 0.10272979736328125, 0.10668563842773438, 0.1106414794921875, 0.11459732055664062, 0.11855316162109375, 0.12250900268554688, 0.12646484375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 29.0, 468.0, 476.0, 34.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005579321179538965, -0.005208000540733337, -0.004836679436266422, -0.004465358331799507, -0.004094037692993879, -0.003722716821357608, -0.0033513959497213364, -0.002980075078085065, -0.0026087542064487934, -0.002237433334812522, -0.0018661124631762505, -0.001494791591539979, -0.0011234707199037075, -0.000752149848267436, -0.00038082897663116455, -9.508104994893074e-06, 0.0003618127666413784, 0.0007331336382776499, 0.0011044545099139214, 0.0014757753815501928, 0.0018470962531864643, 0.002218417124822736, 0.0025897379964590073, 0.0029610588680952787, 0.00333237973973155, 0.0037037006113678217, 0.004075021483004093, 0.004446342587471008, 0.004817663226276636, 0.005188983865082264, 0.005560304969549179, 0.005931626074016094, 0.006302947178483009, 0.0066742682829499245, 0.007045588921755552, 0.00741690956056118, 0.007788230665028095, 0.00815955176949501, 0.008530871942639351, 0.008902193047106266, 0.009273514151573181, 0.009644835256040096, 0.010016156360507011, 0.010387476533651352, 0.010758797638118267, 0.011130118742585182, 0.011501438915729523, 0.011872760020196438, 0.012244081124663353, 0.012615402229130268, 0.012986723333597183, 0.013358043506741524, 0.013729364611208439, 0.014100685715675354, 0.014472005888819695, 0.01484332699328661, 0.015214648097753525, 0.01558596920222044, 0.015957290306687355, 0.016328610479831696, 0.016699932515621185, 0.017071252688765526, 0.017442572861909866, 0.017813894897699356, 0.018185215070843697]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 6.0, 9.0, 9.0, 15.0, 10.0, 22.0, 24.0, 21.0, 42.0, 25.0, 37.0, 33.0, 30.0, 31.0, 44.0, 51.0, 46.0, 48.0, 56.0, 47.0, 34.0, 36.0, 44.0, 35.0, 35.0, 34.0, 24.0, 22.0, 23.0, 16.0, 20.0, 8.0, 8.0, 7.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002447962760925293, -0.002362370491027832, -0.002276778221130371, -0.00219118595123291, -0.0021055936813354492, -0.0020200014114379883, -0.0019344091415405273, -0.0018488168716430664, -0.0017632246017456055, -0.0016776323318481445, -0.0015920400619506836, -0.0015064477920532227, -0.0014208555221557617, -0.0013352632522583008, -0.0012496709823608398, -0.001164078712463379, -0.001078486442565918, -0.000992894172668457, -0.0009073019027709961, -0.0008217096328735352, -0.0007361173629760742, -0.0006505250930786133, -0.0005649328231811523, -0.0004793405532836914, -0.00039374828338623047, -0.00030815601348876953, -0.0002225637435913086, -0.00013697147369384766, -5.137920379638672e-05, 3.421306610107422e-05, 0.00011980533599853516, 0.0002053976058959961, 0.00029098987579345703, 0.00037658214569091797, 0.0004621744155883789, 0.0005477666854858398, 0.0006333589553833008, 0.0007189512252807617, 0.0008045434951782227, 0.0008901357650756836, 0.0009757280349731445, 0.0010613203048706055, 0.0011469125747680664, 0.0012325048446655273, 0.0013180971145629883, 0.0014036893844604492, 0.0014892816543579102, 0.001574873924255371, 0.001660466194152832, 0.001746058464050293, 0.001831650733947754, 0.0019172430038452148, 0.0020028352737426758, 0.0020884275436401367, 0.0021740198135375977, 0.0022596120834350586, 0.0023452043533325195, 0.0024307966232299805, 0.0025163888931274414, 0.0026019811630249023, 0.0026875734329223633, 0.0027731657028198242, 0.002858757972717285, 0.002944350242614746, 0.003029942512512207]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 9.0, 5.0, 7.0, 11.0, 12.0, 12.0, 12.0, 16.0, 24.0, 19.0, 25.0, 27.0, 35.0, 33.0, 36.0, 46.0, 46.0, 35.0, 44.0, 59.0, 40.0, 44.0, 40.0, 39.0, 37.0, 40.0, 32.0, 33.0, 29.0, 25.0, 22.0, 18.0, 14.0, 8.0, 11.0, 20.0, 7.0, 4.0, 6.0, 9.0, 7.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.77203369140625, -4.6182861328125, -4.46453857421875, -4.310791015625, -4.15704345703125, -4.0032958984375, -3.84954833984375, -3.69580078125, -3.54205322265625, -3.3883056640625, -3.23455810546875, -3.080810546875, -2.92706298828125, -2.7733154296875, -2.61956787109375, -2.4658203125, -2.31207275390625, -2.1583251953125, -2.00457763671875, -1.850830078125, -1.69708251953125, -1.5433349609375, -1.38958740234375, -1.23583984375, -1.08209228515625, -0.9283447265625, -0.77459716796875, -0.620849609375, -0.46710205078125, -0.3133544921875, -0.15960693359375, -0.005859375, 0.14788818359375, 0.3016357421875, 0.45538330078125, 0.609130859375, 0.76287841796875, 0.9166259765625, 1.07037353515625, 1.22412109375, 1.37786865234375, 1.5316162109375, 1.68536376953125, 1.839111328125, 1.99285888671875, 2.1466064453125, 2.30035400390625, 2.4541015625, 2.60784912109375, 2.7615966796875, 2.91534423828125, 3.069091796875, 3.22283935546875, 3.3765869140625, 3.53033447265625, 3.68408203125, 3.83782958984375, 3.9915771484375, 4.14532470703125, 4.299072265625, 4.45281982421875, 4.6065673828125, 4.76031494140625, 4.9140625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 7.0, 8.0, 14.0, 15.0, 21.0, 36.0, 37.0, 42.0, 51.0, 77.0, 105.0, 170.0, 259.0, 442.0, 1012.0, 2528.0, 6392.0, 17072.0, 46492.0, 126901.0, 347287.0, 315979.0, 115993.0, 41633.0, 15572.0, 5987.0, 2274.0, 930.0, 403.0, 258.0, 120.0, 118.0, 68.0, 45.0, 41.0, 42.0, 25.0, 24.0, 16.0, 12.0, 15.0, 6.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.85357666015625, -4.6915283203125, -4.52947998046875, -4.367431640625, -4.20538330078125, -4.0433349609375, -3.88128662109375, -3.71923828125, -3.55718994140625, -3.3951416015625, -3.23309326171875, -3.071044921875, -2.90899658203125, -2.7469482421875, -2.58489990234375, -2.4228515625, -2.26080322265625, -2.0987548828125, -1.93670654296875, -1.774658203125, -1.61260986328125, -1.4505615234375, -1.28851318359375, -1.12646484375, -0.96441650390625, -0.8023681640625, -0.64031982421875, -0.478271484375, -0.31622314453125, -0.1541748046875, 0.00787353515625, 0.169921875, 0.33197021484375, 0.4940185546875, 0.65606689453125, 0.818115234375, 0.98016357421875, 1.1422119140625, 1.30426025390625, 1.46630859375, 1.62835693359375, 1.7904052734375, 1.95245361328125, 2.114501953125, 2.27655029296875, 2.4385986328125, 2.60064697265625, 2.7626953125, 2.92474365234375, 3.0867919921875, 3.24884033203125, 3.410888671875, 3.57293701171875, 3.7349853515625, 3.89703369140625, 4.05908203125, 4.22113037109375, 4.3831787109375, 4.54522705078125, 4.707275390625, 4.86932373046875, 5.0313720703125, 5.19342041015625, 5.35546875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 7.0, 5.0, 11.0, 14.0, 6.0, 12.0, 24.0, 19.0, 23.0, 30.0, 34.0, 33.0, 39.0, 41.0, 48.0, 69.0, 106.0, 335.0, 1546.0, 168.0, 86.0, 58.0, 54.0, 43.0, 35.0, 38.0, 27.0, 29.0, 25.0, 20.0, 14.0, 18.0, 6.0, 5.0, 1.0, 8.0, 9.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -12.9256591796875, -12.390380859375, -11.8551025390625, -11.31982421875, -10.7845458984375, -10.249267578125, -9.7139892578125, -9.1787109375, -8.6434326171875, -8.108154296875, -7.5728759765625, -7.03759765625, -6.5023193359375, -5.967041015625, -5.4317626953125, -4.896484375, -4.3612060546875, -3.825927734375, -3.2906494140625, -2.75537109375, -2.2200927734375, -1.684814453125, -1.1495361328125, -0.6142578125, -0.0789794921875, 0.456298828125, 0.9915771484375, 1.52685546875, 2.0621337890625, 2.597412109375, 3.1326904296875, 3.66796875, 4.2032470703125, 4.738525390625, 5.2738037109375, 5.80908203125, 6.3443603515625, 6.879638671875, 7.4149169921875, 7.9501953125, 8.4854736328125, 9.020751953125, 9.5560302734375, 10.09130859375, 10.6265869140625, 11.161865234375, 11.6971435546875, 12.232421875, 12.7677001953125, 13.302978515625, 13.8382568359375, 14.37353515625, 14.9088134765625, 15.444091796875, 15.9793701171875, 16.5146484375, 17.0499267578125, 17.585205078125, 18.1204833984375, 18.65576171875, 19.1910400390625, 19.726318359375, 20.2615966796875, 20.796875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 11.0, 11.0, 12.0, 22.0, 36.0, 37.0, 62.0, 89.0, 144.0, 240.0, 547.0, 1698.0, 232410.0, 2906786.0, 2179.0, 632.0, 304.0, 165.0, 101.0, 59.0, 34.0, 40.0, 20.0, 13.0, 5.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.5, -75.2919921875, -73.083984375, -70.8759765625, -68.66796875, -66.4599609375, -64.251953125, -62.0439453125, -59.8359375, -57.6279296875, -55.419921875, -53.2119140625, -51.00390625, -48.7958984375, -46.587890625, -44.3798828125, -42.171875, -39.9638671875, -37.755859375, -35.5478515625, -33.33984375, -31.1318359375, -28.923828125, -26.7158203125, -24.5078125, -22.2998046875, -20.091796875, -17.8837890625, -15.67578125, -13.4677734375, -11.259765625, -9.0517578125, -6.84375, -4.6357421875, -2.427734375, -0.2197265625, 1.98828125, 4.1962890625, 6.404296875, 8.6123046875, 10.8203125, 13.0283203125, 15.236328125, 17.4443359375, 19.65234375, 21.8603515625, 24.068359375, 26.2763671875, 28.484375, 30.6923828125, 32.900390625, 35.1083984375, 37.31640625, 39.5244140625, 41.732421875, 43.9404296875, 46.1484375, 48.3564453125, 50.564453125, 52.7724609375, 54.98046875, 57.1884765625, 59.396484375, 61.6044921875, 63.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 37.0, 252.0, 400.0, 251.0, 53.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.685096740722656, -33.7551383972168, -31.82518196105957, -29.89522361755371, -27.965267181396484, -26.035308837890625, -24.105350494384766, -22.175392150878906, -20.24543571472168, -18.31547737121582, -16.385520935058594, -14.455562591552734, -12.525605201721191, -10.595647811889648, -8.665689468383789, -6.735732078552246, -4.805774688720703, -2.875817060470581, -0.945859432220459, 0.9840984344482422, 2.914055824279785, 4.844013214111328, 6.7739715576171875, 8.70392894744873, 10.633886337280273, 12.563843727111816, 14.49380111694336, 16.42375946044922, 18.353717803955078, 20.283674240112305, 22.213632583618164, 24.14358901977539, 26.07354736328125, 28.00350570678711, 29.933462142944336, 31.863420486450195, 33.79337692260742, 35.72333526611328, 37.65329360961914, 39.583251953125, 41.513206481933594, 43.44316482543945, 45.37312316894531, 47.303077697753906, 49.233036041259766, 51.162994384765625, 53.092952728271484, 55.022911071777344, 56.9528694152832, 58.88282775878906, 60.81278610229492, 62.74274444580078, 64.67269897460938, 66.6026611328125, 68.5326156616211, 70.46257019042969, 72.39253234863281, 74.3224868774414, 76.25244903564453, 78.18240356445312, 80.11236572265625, 82.04232025146484, 83.97227478027344, 85.90223693847656, 87.83219146728516]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 4.0, 12.0, 10.0, 12.0, 20.0, 15.0, 22.0, 17.0, 28.0, 20.0, 27.0, 18.0, 33.0, 29.0, 34.0, 35.0, 44.0, 39.0, 38.0, 39.0, 37.0, 44.0, 36.0, 30.0, 30.0, 34.0, 33.0, 35.0, 28.0, 20.0, 24.0, 23.0, 17.0, 15.0, 15.0, 18.0, 10.0, 10.0, 4.0, 5.0, 4.0, 8.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.919395446777344, -29.837020874023438, -28.7546443939209, -27.67226791381836, -26.589893341064453, -25.507518768310547, -24.425142288208008, -23.34276580810547, -22.260391235351562, -21.178016662597656, -20.095640182495117, -19.013263702392578, -17.930889129638672, -16.848514556884766, -15.766138076782227, -14.683762550354004, -13.601387023925781, -12.519011497497559, -11.436635971069336, -10.354260444641113, -9.27188491821289, -8.189509391784668, -7.107133865356445, -6.024758338928223, -4.9423828125, -3.8600072860717773, -2.7776317596435547, -1.695256233215332, -0.6128807067871094, 0.4694948196411133, 1.551870346069336, 2.6342458724975586, 3.716625213623047, 4.7990007400512695, 5.881376266479492, 6.963751792907715, 8.046127319335938, 9.12850284576416, 10.210878372192383, 11.293253898620605, 12.375629425048828, 13.45800495147705, 14.540380477905273, 15.622756004333496, 16.70513153076172, 17.787506103515625, 18.869882583618164, 19.952259063720703, 21.03463363647461, 22.117008209228516, 23.199384689331055, 24.281761169433594, 25.3641357421875, 26.446510314941406, 27.528886795043945, 28.611263275146484, 29.69363784790039, 30.776012420654297, 31.858388900756836, 32.940765380859375, 34.02313995361328, 35.10551452636719, 36.187889099121094, 37.270267486572266, 38.35264205932617]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 5.0, 4.0, 6.0, 10.0, 9.0, 15.0, 9.0, 17.0, 17.0, 21.0, 27.0, 22.0, 36.0, 31.0, 41.0, 39.0, 28.0, 36.0, 49.0, 41.0, 33.0, 38.0, 34.0, 37.0, 29.0, 33.0, 34.0, 34.0, 34.0, 32.0, 25.0, 29.0, 17.0, 14.0, 16.0, 11.0, 12.0, 9.0, 9.0, 6.0, 6.0, 8.0, 7.0, 7.0, 6.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.9140625, -4.761474609375, -4.60888671875, -4.456298828125, -4.3037109375, -4.151123046875, -3.99853515625, -3.845947265625, -3.693359375, -3.540771484375, -3.38818359375, -3.235595703125, -3.0830078125, -2.930419921875, -2.77783203125, -2.625244140625, -2.47265625, -2.320068359375, -2.16748046875, -2.014892578125, -1.8623046875, -1.709716796875, -1.55712890625, -1.404541015625, -1.251953125, -1.099365234375, -0.94677734375, -0.794189453125, -0.6416015625, -0.489013671875, -0.33642578125, -0.183837890625, -0.03125, 0.121337890625, 0.27392578125, 0.426513671875, 0.5791015625, 0.731689453125, 0.88427734375, 1.036865234375, 1.189453125, 1.342041015625, 1.49462890625, 1.647216796875, 1.7998046875, 1.952392578125, 2.10498046875, 2.257568359375, 2.41015625, 2.562744140625, 2.71533203125, 2.867919921875, 3.0205078125, 3.173095703125, 3.32568359375, 3.478271484375, 3.630859375, 3.783447265625, 3.93603515625, 4.088623046875, 4.2412109375, 4.393798828125, 4.54638671875, 4.698974609375, 4.8515625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 20.0, 15.0, 22.0, 33.0, 28.0, 54.0, 37.0, 63.0, 80.0, 94.0, 129.0, 166.0, 317.0, 1089.0, 8816.0, 270373.0, 3047721.0, 838818.0, 22925.0, 2169.0, 433.0, 184.0, 122.0, 90.0, 77.0, 66.0, 52.0, 42.0, 38.0, 26.0, 21.0, 28.0, 21.0, 18.0, 6.0, 7.0, 5.0, 9.0, 6.0, 12.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.875, -15.4034423828125, -14.931884765625, -14.4603271484375, -13.98876953125, -13.5172119140625, -13.045654296875, -12.5740966796875, -12.1025390625, -11.6309814453125, -11.159423828125, -10.6878662109375, -10.21630859375, -9.7447509765625, -9.273193359375, -8.8016357421875, -8.330078125, -7.8585205078125, -7.386962890625, -6.9154052734375, -6.44384765625, -5.9722900390625, -5.500732421875, -5.0291748046875, -4.5576171875, -4.0860595703125, -3.614501953125, -3.1429443359375, -2.67138671875, -2.1998291015625, -1.728271484375, -1.2567138671875, -0.78515625, -0.3135986328125, 0.157958984375, 0.6295166015625, 1.10107421875, 1.5726318359375, 2.044189453125, 2.5157470703125, 2.9873046875, 3.4588623046875, 3.930419921875, 4.4019775390625, 4.87353515625, 5.3450927734375, 5.816650390625, 6.2882080078125, 6.759765625, 7.2313232421875, 7.702880859375, 8.1744384765625, 8.64599609375, 9.1175537109375, 9.589111328125, 10.0606689453125, 10.5322265625, 11.0037841796875, 11.475341796875, 11.9468994140625, 12.41845703125, 12.8900146484375, 13.361572265625, 13.8331298828125, 14.3046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 13.0, 6.0, 23.0, 21.0, 34.0, 46.0, 59.0, 83.0, 133.0, 194.0, 256.0, 356.0, 524.0, 587.0, 477.0, 373.0, 265.0, 181.0, 128.0, 87.0, 63.0, 38.0, 29.0, 34.0, 14.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 0.0, 1.0, 4.0], "bins": [-15.1875, -14.8388671875, -14.490234375, -14.1416015625, -13.79296875, -13.4443359375, -13.095703125, -12.7470703125, -12.3984375, -12.0498046875, -11.701171875, -11.3525390625, -11.00390625, -10.6552734375, -10.306640625, -9.9580078125, -9.609375, -9.2607421875, -8.912109375, -8.5634765625, -8.21484375, -7.8662109375, -7.517578125, -7.1689453125, -6.8203125, -6.4716796875, -6.123046875, -5.7744140625, -5.42578125, -5.0771484375, -4.728515625, -4.3798828125, -4.03125, -3.6826171875, -3.333984375, -2.9853515625, -2.63671875, -2.2880859375, -1.939453125, -1.5908203125, -1.2421875, -0.8935546875, -0.544921875, -0.1962890625, 0.15234375, 0.5009765625, 0.849609375, 1.1982421875, 1.546875, 1.8955078125, 2.244140625, 2.5927734375, 2.94140625, 3.2900390625, 3.638671875, 3.9873046875, 4.3359375, 4.6845703125, 5.033203125, 5.3818359375, 5.73046875, 6.0791015625, 6.427734375, 6.7763671875, 7.125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 7.0, 8.0, 23.0, 29.0, 36.0, 39.0, 56.0, 114.0, 167.0, 258.0, 381.0, 787.0, 27170.0, 4148672.0, 14634.0, 721.0, 407.0, 255.0, 167.0, 111.0, 65.0, 43.0, 39.0, 16.0, 22.0, 16.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5625, -35.7265625, -33.890625, -32.0546875, -30.21875, -28.3828125, -26.546875, -24.7109375, -22.875, -21.0390625, -19.203125, -17.3671875, -15.53125, -13.6953125, -11.859375, -10.0234375, -8.1875, -6.3515625, -4.515625, -2.6796875, -0.84375, 0.9921875, 2.828125, 4.6640625, 6.5, 8.3359375, 10.171875, 12.0078125, 13.84375, 15.6796875, 17.515625, 19.3515625, 21.1875, 23.0234375, 24.859375, 26.6953125, 28.53125, 30.3671875, 32.203125, 34.0390625, 35.875, 37.7109375, 39.546875, 41.3828125, 43.21875, 45.0546875, 46.890625, 48.7265625, 50.5625, 52.3984375, 54.234375, 56.0703125, 57.90625, 59.7421875, 61.578125, 63.4140625, 65.25, 67.0859375, 68.921875, 70.7578125, 72.59375, 74.4296875, 76.265625, 78.1015625, 79.9375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 37.0, 61.0, 120.0, 148.0, 163.0, 128.0, 147.0, 71.0, 62.0, 41.0, 12.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.550968170166016, -56.03363800048828, -54.51630783081055, -52.99897766113281, -51.481651306152344, -49.96432113647461, -48.446990966796875, -46.92966079711914, -45.412330627441406, -43.89500045776367, -42.37767028808594, -40.8603401184082, -39.34300994873047, -37.82568359375, -36.308353424072266, -34.79102325439453, -33.2736930847168, -31.756362915039062, -30.239032745361328, -28.721704483032227, -27.204374313354492, -25.687044143676758, -24.169715881347656, -22.652385711669922, -21.135055541992188, -19.617725372314453, -18.10039520263672, -16.583066940307617, -15.065736770629883, -13.548406600952148, -12.03107738494873, -10.513748168945312, -8.996417999267578, -7.479088306427002, -5.961758613586426, -4.44442892074585, -2.9270992279052734, -1.4097695350646973, 0.1075601577758789, 1.6248893737792969, 3.1422195434570312, 4.659549236297607, 6.176878929138184, 7.69420862197876, 9.211538314819336, 10.72886848449707, 12.246197700500488, 13.763526916503906, 15.28085708618164, 16.798187255859375, 18.31551742553711, 19.83284568786621, 21.350175857543945, 22.86750602722168, 24.38483428955078, 25.902164459228516, 27.41949462890625, 28.936824798583984, 30.45415496826172, 31.97148323059082, 33.48881530761719, 35.006141662597656, 36.52347183227539, 38.040802001953125, 39.55813217163086]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 5.0, 8.0, 9.0, 6.0, 13.0, 18.0, 15.0, 14.0, 20.0, 19.0, 25.0, 19.0, 47.0, 42.0, 35.0, 35.0, 54.0, 39.0, 31.0, 36.0, 49.0, 47.0, 49.0, 30.0, 42.0, 36.0, 30.0, 24.0, 25.0, 20.0, 20.0, 17.0, 21.0, 17.0, 13.0, 14.0, 12.0, 15.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-30.931190490722656, -29.95403480529785, -28.976877212524414, -27.99972152709961, -27.022563934326172, -26.045408248901367, -25.068252563476562, -24.091094970703125, -23.11393928527832, -22.136783599853516, -21.159626007080078, -20.182470321655273, -19.20531463623047, -18.22815704345703, -17.251001358032227, -16.273845672607422, -15.296688079833984, -14.319531440734863, -13.342374801635742, -12.365219116210938, -11.388062477111816, -10.410905838012695, -9.43375015258789, -8.45659351348877, -7.479436874389648, -6.502280235290527, -5.5251240730285645, -4.547967910766602, -3.5708112716674805, -2.5936546325683594, -1.6164984703063965, -0.6393423080444336, 0.3378143310546875, 1.3149707317352295, 2.2921271324157715, 3.2692835330963135, 4.2464399337768555, 5.223596572875977, 6.2007527351379395, 7.177908897399902, 8.155065536499023, 9.132222175598145, 10.109378814697266, 11.08653450012207, 12.063691139221191, 13.040847778320312, 14.018003463745117, 14.995160102844238, 15.97231674194336, 16.949472427368164, 17.9266300201416, 18.903785705566406, 19.880943298339844, 20.85809898376465, 21.835254669189453, 22.81241226196289, 23.789567947387695, 24.7667236328125, 25.743881225585938, 26.721036911010742, 27.698192596435547, 28.675350189208984, 29.65250587463379, 30.629661560058594, 31.60681915283203]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 10.0, 7.0, 11.0, 9.0, 14.0, 17.0, 17.0, 21.0, 21.0, 24.0, 29.0, 28.0, 34.0, 34.0, 38.0, 45.0, 36.0, 36.0, 35.0, 49.0, 38.0, 47.0, 47.0, 35.0, 34.0, 39.0, 24.0, 22.0, 32.0, 24.0, 15.0, 20.0, 16.0, 20.0, 12.0, 13.0, 9.0, 7.0, 4.0, 8.0, 5.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.03057861328125, -4.8658447265625, -4.70111083984375, -4.536376953125, -4.37164306640625, -4.2069091796875, -4.04217529296875, -3.87744140625, -3.71270751953125, -3.5479736328125, -3.38323974609375, -3.218505859375, -3.05377197265625, -2.8890380859375, -2.72430419921875, -2.5595703125, -2.39483642578125, -2.2301025390625, -2.06536865234375, -1.900634765625, -1.73590087890625, -1.5711669921875, -1.40643310546875, -1.24169921875, -1.07696533203125, -0.9122314453125, -0.74749755859375, -0.582763671875, -0.41802978515625, -0.2532958984375, -0.08856201171875, 0.076171875, 0.24090576171875, 0.4056396484375, 0.57037353515625, 0.735107421875, 0.89984130859375, 1.0645751953125, 1.22930908203125, 1.39404296875, 1.55877685546875, 1.7235107421875, 1.88824462890625, 2.052978515625, 2.21771240234375, 2.3824462890625, 2.54718017578125, 2.7119140625, 2.87664794921875, 3.0413818359375, 3.20611572265625, 3.370849609375, 3.53558349609375, 3.7003173828125, 3.86505126953125, 4.02978515625, 4.19451904296875, 4.3592529296875, 4.52398681640625, 4.688720703125, 4.85345458984375, 5.0181884765625, 5.18292236328125, 5.34765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 11.0, 14.0, 29.0, 36.0, 76.0, 110.0, 197.0, 310.0, 517.0, 919.0, 1441.0, 2388.0, 3910.0, 6738.0, 11049.0, 18152.0, 30060.0, 51828.0, 89304.0, 160864.0, 258141.0, 176984.0, 97179.0, 55755.0, 33005.0, 19659.0, 11799.0, 7166.0, 4350.0, 2633.0, 1611.0, 875.0, 560.0, 354.0, 176.0, 128.0, 91.0, 50.0, 35.0, 24.0, 10.0, 12.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55859375, -0.5383377075195312, -0.5180816650390625, -0.49782562255859375, -0.477569580078125, -0.45731353759765625, -0.4370574951171875, -0.41680145263671875, -0.39654541015625, -0.37628936767578125, -0.3560333251953125, -0.33577728271484375, -0.315521240234375, -0.29526519775390625, -0.2750091552734375, -0.25475311279296875, -0.2344970703125, -0.21424102783203125, -0.1939849853515625, -0.17372894287109375, -0.153472900390625, -0.13321685791015625, -0.1129608154296875, -0.09270477294921875, -0.07244873046875, -0.05219268798828125, -0.0319366455078125, -0.01168060302734375, 0.008575439453125, 0.02883148193359375, 0.0490875244140625, 0.06934356689453125, 0.089599609375, 0.10985565185546875, 0.1301116943359375, 0.15036773681640625, 0.170623779296875, 0.19087982177734375, 0.2111358642578125, 0.23139190673828125, 0.25164794921875, 0.27190399169921875, 0.2921600341796875, 0.31241607666015625, 0.332672119140625, 0.35292816162109375, 0.3731842041015625, 0.39344024658203125, 0.4136962890625, 0.43395233154296875, 0.4542083740234375, 0.47446441650390625, 0.494720458984375, 0.5149765014648438, 0.5352325439453125, 0.5554885864257812, 0.57574462890625, 0.5960006713867188, 0.6162567138671875, 0.6365127563476562, 0.656768798828125, 0.6770248413085938, 0.6972808837890625, 0.7175369262695312, 0.73779296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 8.0, 7.0, 6.0, 11.0, 11.0, 7.0, 6.0, 16.0, 14.0, 14.0, 28.0, 27.0, 23.0, 30.0, 29.0, 39.0, 37.0, 41.0, 40.0, 37.0, 43.0, 1066.0, 46.0, 38.0, 35.0, 39.0, 33.0, 32.0, 40.0, 32.0, 26.0, 31.0, 17.0, 17.0, 19.0, 9.0, 11.0, 16.0, 10.0, 10.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.162109375, -3.058502197265625, -2.95489501953125, -2.851287841796875, -2.7476806640625, -2.644073486328125, -2.54046630859375, -2.436859130859375, -2.333251953125, -2.229644775390625, -2.12603759765625, -2.022430419921875, -1.9188232421875, -1.815216064453125, -1.71160888671875, -1.608001708984375, -1.50439453125, -1.400787353515625, -1.29718017578125, -1.193572998046875, -1.0899658203125, -0.986358642578125, -0.88275146484375, -0.779144287109375, -0.675537109375, -0.571929931640625, -0.46832275390625, -0.364715576171875, -0.2611083984375, -0.157501220703125, -0.05389404296875, 0.049713134765625, 0.1533203125, 0.256927490234375, 0.36053466796875, 0.464141845703125, 0.5677490234375, 0.671356201171875, 0.77496337890625, 0.878570556640625, 0.982177734375, 1.085784912109375, 1.18939208984375, 1.292999267578125, 1.3966064453125, 1.500213623046875, 1.60382080078125, 1.707427978515625, 1.81103515625, 1.914642333984375, 2.01824951171875, 2.121856689453125, 2.2254638671875, 2.329071044921875, 2.43267822265625, 2.536285400390625, 2.639892578125, 2.743499755859375, 2.84710693359375, 2.950714111328125, 3.0543212890625, 3.157928466796875, 3.26153564453125, 3.365142822265625, 3.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 15.0, 41.0, 50.0, 81.0, 97.0, 140.0, 179.0, 298.0, 388.0, 577.0, 813.0, 1135.0, 1521.0, 2261.0, 3212.0, 4675.0, 6703.0, 9769.0, 14681.0, 21910.0, 33770.0, 53585.0, 85590.0, 136580.0, 1244346.0, 174498.0, 107567.0, 66953.0, 42222.0, 27104.0, 17876.0, 12033.0, 8072.0, 5487.0, 3908.0, 2661.0, 1932.0, 1267.0, 955.0, 631.0, 445.0, 332.0, 226.0, 159.0, 118.0, 77.0, 47.0, 36.0, 19.0, 19.0, 11.0, 12.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0], "bins": [-0.447509765625, -0.432952880859375, -0.41839599609375, -0.403839111328125, -0.3892822265625, -0.374725341796875, -0.36016845703125, -0.345611572265625, -0.3310546875, -0.316497802734375, -0.30194091796875, -0.287384033203125, -0.2728271484375, -0.258270263671875, -0.24371337890625, -0.229156494140625, -0.214599609375, -0.200042724609375, -0.18548583984375, -0.170928955078125, -0.1563720703125, -0.141815185546875, -0.12725830078125, -0.112701416015625, -0.09814453125, -0.083587646484375, -0.06903076171875, -0.054473876953125, -0.0399169921875, -0.025360107421875, -0.01080322265625, 0.003753662109375, 0.018310546875, 0.032867431640625, 0.04742431640625, 0.061981201171875, 0.0765380859375, 0.091094970703125, 0.10565185546875, 0.120208740234375, 0.134765625, 0.149322509765625, 0.16387939453125, 0.178436279296875, 0.1929931640625, 0.207550048828125, 0.22210693359375, 0.236663818359375, 0.251220703125, 0.265777587890625, 0.28033447265625, 0.294891357421875, 0.3094482421875, 0.324005126953125, 0.33856201171875, 0.353118896484375, 0.36767578125, 0.382232666015625, 0.39678955078125, 0.411346435546875, 0.4259033203125, 0.440460205078125, 0.45501708984375, 0.469573974609375, 0.484130859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 12.0, 13.0, 21.0, 21.0, 21.0, 24.0, 38.0, 42.0, 49.0, 46.0, 68.0, 90.0, 95.0, 89.0, 77.0, 50.0, 37.0, 40.0, 24.0, 22.0, 31.0, 14.0, 13.0, 5.0, 13.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005054473876953125, -0.004911899566650391, -0.004769325256347656, -0.004626750946044922, -0.0044841766357421875, -0.004341602325439453, -0.004199028015136719, -0.004056453704833984, -0.00391387939453125, -0.0037713050842285156, -0.0036287307739257812, -0.003486156463623047, -0.0033435821533203125, -0.003201007843017578, -0.0030584335327148438, -0.0029158592224121094, -0.002773284912109375, -0.0026307106018066406, -0.0024881362915039062, -0.002345561981201172, -0.0022029876708984375, -0.002060413360595703, -0.0019178390502929688, -0.0017752647399902344, -0.0016326904296875, -0.0014901161193847656, -0.0013475418090820312, -0.0012049674987792969, -0.0010623931884765625, -0.0009198188781738281, -0.0007772445678710938, -0.0006346702575683594, -0.000492095947265625, -0.0003495216369628906, -0.00020694732666015625, -6.437301635742188e-05, 7.82012939453125e-05, 0.00022077560424804688, 0.00036334991455078125, 0.0005059242248535156, 0.00064849853515625, 0.0007910728454589844, 0.0009336471557617188, 0.0010762214660644531, 0.0012187957763671875, 0.0013613700866699219, 0.0015039443969726562, 0.0016465187072753906, 0.001789093017578125, 0.0019316673278808594, 0.0020742416381835938, 0.002216815948486328, 0.0023593902587890625, 0.002501964569091797, 0.0026445388793945312, 0.0027871131896972656, 0.0029296875, 0.0030722618103027344, 0.0032148361206054688, 0.003357410430908203, 0.0034999847412109375, 0.003642559051513672, 0.0037851333618164062, 0.003927707672119141, 0.004070281982421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 10.0, 11.0, 19.0, 12.0, 18.0, 24.0, 39.0, 53.0, 56.0, 76.0, 112.0, 208.0, 439.0, 1104.0, 376795.0, 667212.0, 1177.0, 457.0, 218.0, 132.0, 86.0, 70.0, 50.0, 47.0, 32.0, 25.0, 9.0, 17.0, 10.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0838623046875, -0.08097267150878906, -0.07808303833007812, -0.07519340515136719, -0.07230377197265625, -0.06941413879394531, -0.06652450561523438, -0.06363487243652344, -0.0607452392578125, -0.05785560607910156, -0.054965972900390625, -0.05207633972167969, -0.04918670654296875, -0.04629707336425781, -0.043407440185546875, -0.04051780700683594, -0.037628173828125, -0.03473854064941406, -0.031848907470703125, -0.028959274291992188, -0.02606964111328125, -0.023180007934570312, -0.020290374755859375, -0.017400741577148438, -0.0145111083984375, -0.011621475219726562, -0.008731842041015625, -0.0058422088623046875, -0.00295257568359375, -6.29425048828125e-05, 0.002826690673828125, 0.0057163238525390625, 0.00860595703125, 0.011495590209960938, 0.014385223388671875, 0.017274856567382812, 0.02016448974609375, 0.023054122924804688, 0.025943756103515625, 0.028833389282226562, 0.0317230224609375, 0.03461265563964844, 0.037502288818359375, 0.04039192199707031, 0.04328155517578125, 0.04617118835449219, 0.049060821533203125, 0.05195045471191406, 0.054840087890625, 0.05772972106933594, 0.060619354248046875, 0.06350898742675781, 0.06639862060546875, 0.06928825378417969, 0.07217788696289062, 0.07506752014160156, 0.0779571533203125, 0.08084678649902344, 0.08373641967773438, 0.08662605285644531, 0.08951568603515625, 0.09240531921386719, 0.09529495239257812, 0.09818458557128906, 0.10107421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 142.0, 655.0, 191.0, 16.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033897263929247856, -0.003035973059013486, -0.002682219725102186, -0.002328466158360243, -0.001974712824448943, -0.0016209594905376434, -0.0012672059237957, -0.0009134525898844004, -0.0005596992559731007, -0.00020594586385414004, 0.00014780752826482058, 0.0005015609785914421, 0.0008553143125027418, 0.0012090676464140415, 0.0015628212131559849, 0.0019165745470672846, 0.0022703278809785843, 0.002624081214889884, 0.0029778345488011837, 0.003331588115543127, 0.0036853414494544268, 0.0040390947833657265, 0.00439284835010767, 0.004746601916849613, 0.005100355017930269, 0.005454108584672213, 0.005807861685752869, 0.006161615252494812, 0.006515368819236755, 0.006869121920317411, 0.007222875487059355, 0.007576628588140011, 0.007930383086204529, 0.008284136652946472, 0.008637890219688416, 0.008991643786430359, 0.009345396421849728, 0.009699149988591671, 0.010052903555333614, 0.010406657122075558, 0.010760409757494926, 0.01111416332423687, 0.011467916890978813, 0.011821670457720757, 0.012175423093140125, 0.012529176659882069, 0.012882930226624012, 0.013236683793365955, 0.013590437360107899, 0.013944190926849842, 0.014297944493591785, 0.014651697129011154, 0.015005450695753098, 0.015359204262495041, 0.015712957829236984, 0.016066711395978928, 0.01642046496272087, 0.016774218529462814, 0.017127972096204758, 0.0174817256629467, 0.017835479229688644, 0.018189232796430588, 0.01854298636317253, 0.018896738067269325, 0.01925049163401127]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 11.0, 7.0, 9.0, 10.0, 11.0, 10.0, 10.0, 13.0, 19.0, 14.0, 23.0, 26.0, 28.0, 26.0, 41.0, 40.0, 37.0, 32.0, 40.0, 41.0, 37.0, 43.0, 51.0, 44.0, 40.0, 43.0, 33.0, 39.0, 31.0, 35.0, 25.0, 20.0, 19.0, 17.0, 19.0, 12.0, 9.0, 7.0, 10.0, 5.0, 4.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.002082526683807373, -0.002019566483795643, -0.0019566062837839127, -0.0018936460837721825, -0.0018306858837604523, -0.001767725683748722, -0.0017047654837369919, -0.0016418052837252617, -0.0015788450837135315, -0.0015158848837018013, -0.001452924683690071, -0.001389964483678341, -0.0013270042836666107, -0.0012640440836548805, -0.0012010838836431503, -0.0011381236836314201, -0.00107516348361969, -0.0010122032836079597, -0.0009492430835962296, -0.0008862828835844994, -0.0008233226835727692, -0.000760362483561039, -0.0006974022835493088, -0.0006344420835375786, -0.0005714818835258484, -0.0005085216835141182, -0.000445561483502388, -0.0003826012834906578, -0.0003196410834789276, -0.0002566808834671974, -0.00019372068345546722, -0.00013076048344373703, -6.780028343200684e-05, -4.840083420276642e-06, 5.812011659145355e-05, 0.00012108031660318375, 0.00018404051661491394, 0.00024700071662664413, 0.00030996091663837433, 0.0003729211166501045, 0.0004358813166618347, 0.0004988415166735649, 0.0005618017166852951, 0.0006247619166970253, 0.0006877221167087555, 0.0007506823167204857, 0.0008136425167322159, 0.0008766027167439461, 0.0009395629167556763, 0.0010025231167674065, 0.0010654833167791367, 0.0011284435167908669, 0.001191403716802597, 0.0012543639168143272, 0.0013173241168260574, 0.0013802843168377876, 0.0014432445168495178, 0.001506204716861248, 0.0015691649168729782, 0.0016321251168847084, 0.0016950853168964386, 0.0017580455169081688, 0.001821005716919899, 0.0018839659169316292, 0.0019469261169433594]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 10.0, 7.0, 11.0, 9.0, 14.0, 17.0, 17.0, 22.0, 20.0, 24.0, 29.0, 28.0, 34.0, 34.0, 38.0, 45.0, 36.0, 36.0, 35.0, 49.0, 38.0, 47.0, 47.0, 35.0, 34.0, 39.0, 24.0, 22.0, 32.0, 24.0, 15.0, 20.0, 16.0, 20.0, 12.0, 13.0, 9.0, 7.0, 4.0, 8.0, 5.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.03057861328125, -4.8658447265625, -4.70111083984375, -4.536376953125, -4.37164306640625, -4.2069091796875, -4.04217529296875, -3.87744140625, -3.71270751953125, -3.5479736328125, -3.38323974609375, -3.218505859375, -3.05377197265625, -2.8890380859375, -2.72430419921875, -2.5595703125, -2.39483642578125, -2.2301025390625, -2.06536865234375, -1.900634765625, -1.73590087890625, -1.5711669921875, -1.40643310546875, -1.24169921875, -1.07696533203125, -0.9122314453125, -0.74749755859375, -0.582763671875, -0.41802978515625, -0.2532958984375, -0.08856201171875, 0.076171875, 0.24090576171875, 0.4056396484375, 0.57037353515625, 0.735107421875, 0.89984130859375, 1.0645751953125, 1.22930908203125, 1.39404296875, 1.55877685546875, 1.7235107421875, 1.88824462890625, 2.052978515625, 2.21771240234375, 2.3824462890625, 2.54718017578125, 2.7119140625, 2.87664794921875, 3.0413818359375, 3.20611572265625, 3.370849609375, 3.53558349609375, 3.7003173828125, 3.86505126953125, 4.02978515625, 4.19451904296875, 4.3592529296875, 4.52398681640625, 4.688720703125, 4.85345458984375, 5.0181884765625, 5.18292236328125, 5.34765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 8.0, 16.0, 9.0, 15.0, 23.0, 27.0, 36.0, 47.0, 64.0, 65.0, 121.0, 171.0, 215.0, 384.0, 694.0, 1931.0, 9976.0, 67850.0, 627948.0, 294358.0, 36131.0, 5543.0, 1331.0, 522.0, 335.0, 191.0, 125.0, 84.0, 78.0, 51.0, 35.0, 31.0, 35.0, 16.0, 18.0, 11.0, 10.0, 6.0, 8.0, 7.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.34423828125, -10.0087890625, -9.67333984375, -9.337890625, -9.00244140625, -8.6669921875, -8.33154296875, -7.99609375, -7.66064453125, -7.3251953125, -6.98974609375, -6.654296875, -6.31884765625, -5.9833984375, -5.64794921875, -5.3125, -4.97705078125, -4.6416015625, -4.30615234375, -3.970703125, -3.63525390625, -3.2998046875, -2.96435546875, -2.62890625, -2.29345703125, -1.9580078125, -1.62255859375, -1.287109375, -0.95166015625, -0.6162109375, -0.28076171875, 0.0546875, 0.39013671875, 0.7255859375, 1.06103515625, 1.396484375, 1.73193359375, 2.0673828125, 2.40283203125, 2.73828125, 3.07373046875, 3.4091796875, 3.74462890625, 4.080078125, 4.41552734375, 4.7509765625, 5.08642578125, 5.421875, 5.75732421875, 6.0927734375, 6.42822265625, 6.763671875, 7.09912109375, 7.4345703125, 7.77001953125, 8.10546875, 8.44091796875, 8.7763671875, 9.11181640625, 9.447265625, 9.78271484375, 10.1181640625, 10.45361328125, 10.7890625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 5.0, 9.0, 6.0, 8.0, 14.0, 12.0, 11.0, 16.0, 27.0, 17.0, 23.0, 30.0, 19.0, 47.0, 46.0, 42.0, 52.0, 67.0, 135.0, 348.0, 1413.0, 173.0, 74.0, 57.0, 45.0, 42.0, 38.0, 38.0, 24.0, 22.0, 21.0, 10.0, 25.0, 12.0, 17.0, 17.0, 13.0, 10.0, 6.0, 6.0, 10.0, 3.0, 4.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0], "bins": [-15.546875, -15.046875, -14.546875, -14.046875, -13.546875, -13.046875, -12.546875, -12.046875, -11.546875, -11.046875, -10.546875, -10.046875, -9.546875, -9.046875, -8.546875, -8.046875, -7.546875, -7.046875, -6.546875, -6.046875, -5.546875, -5.046875, -4.546875, -4.046875, -3.546875, -3.046875, -2.546875, -2.046875, -1.546875, -1.046875, -0.546875, -0.046875, 0.453125, 0.953125, 1.453125, 1.953125, 2.453125, 2.953125, 3.453125, 3.953125, 4.453125, 4.953125, 5.453125, 5.953125, 6.453125, 6.953125, 7.453125, 7.953125, 8.453125, 8.953125, 9.453125, 9.953125, 10.453125, 10.953125, 11.453125, 11.953125, 12.453125, 12.953125, 13.453125, 13.953125, 14.453125, 14.953125, 15.453125, 15.953125, 16.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 8.0, 19.0, 8.0, 10.0, 18.0, 16.0, 26.0, 25.0, 27.0, 24.0, 41.0, 39.0, 52.0, 73.0, 83.0, 145.0, 267.0, 437.0, 1055.0, 9567.0, 3071365.0, 59120.0, 1700.0, 580.0, 263.0, 181.0, 109.0, 75.0, 62.0, 51.0, 35.0, 39.0, 34.0, 16.0, 19.0, 27.0, 11.0, 6.0, 14.0, 6.0, 14.0, 11.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-51.75, -50.212890625, -48.67578125, -47.138671875, -45.6015625, -44.064453125, -42.52734375, -40.990234375, -39.453125, -37.916015625, -36.37890625, -34.841796875, -33.3046875, -31.767578125, -30.23046875, -28.693359375, -27.15625, -25.619140625, -24.08203125, -22.544921875, -21.0078125, -19.470703125, -17.93359375, -16.396484375, -14.859375, -13.322265625, -11.78515625, -10.248046875, -8.7109375, -7.173828125, -5.63671875, -4.099609375, -2.5625, -1.025390625, 0.51171875, 2.048828125, 3.5859375, 5.123046875, 6.66015625, 8.197265625, 9.734375, 11.271484375, 12.80859375, 14.345703125, 15.8828125, 17.419921875, 18.95703125, 20.494140625, 22.03125, 23.568359375, 25.10546875, 26.642578125, 28.1796875, 29.716796875, 31.25390625, 32.791015625, 34.328125, 35.865234375, 37.40234375, 38.939453125, 40.4765625, 42.013671875, 43.55078125, 45.087890625, 46.625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 23.0, 185.0, 376.0, 337.0, 75.0, 14.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.329197883605957, -11.34319019317627, -9.357181549072266, -7.371173858642578, -5.385165691375732, -3.3991575241088867, -1.4131498336791992, 0.5728588104248047, 2.558866500854492, 4.544874668121338, 6.530882835388184, 8.516890525817871, 10.502899169921875, 12.488906860351562, 14.47491455078125, 16.460922241210938, 18.446929931640625, 20.432937622070312, 22.4189453125, 24.404953002929688, 26.390962600708008, 28.376970291137695, 30.362977981567383, 32.3489875793457, 34.33499526977539, 36.32100296020508, 38.307010650634766, 40.29301834106445, 42.27902603149414, 44.265037536621094, 46.25104522705078, 48.23705291748047, 50.22305679321289, 52.20906448364258, 54.195072174072266, 56.18107986450195, 58.16708755493164, 60.153099060058594, 62.13910675048828, 64.12511444091797, 66.11112213134766, 68.09712982177734, 70.08313751220703, 72.06914520263672, 74.0551528930664, 76.0411605834961, 78.02716827392578, 80.01317596435547, 81.99918365478516, 83.98519134521484, 85.97119903564453, 87.95720672607422, 89.9432144165039, 91.9292221069336, 93.91522979736328, 95.90123748779297, 97.88725280761719, 99.87326049804688, 101.85926818847656, 103.84527587890625, 105.83128356933594, 107.81729125976562, 109.80329895019531, 111.789306640625, 113.77531433105469]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 9.0, 8.0, 4.0, 7.0, 17.0, 18.0, 22.0, 20.0, 24.0, 25.0, 25.0, 30.0, 38.0, 41.0, 46.0, 43.0, 39.0, 45.0, 55.0, 45.0, 35.0, 37.0, 41.0, 40.0, 46.0, 32.0, 19.0, 36.0, 20.0, 21.0, 22.0, 17.0, 12.0, 8.0, 12.0, 12.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.566932678222656, -53.87208557128906, -52.177242279052734, -50.48239517211914, -48.78754806518555, -47.09270477294922, -45.397857666015625, -43.70301055908203, -42.00816345214844, -40.313316345214844, -38.618473052978516, -36.92362594604492, -35.22877883911133, -33.533935546875, -31.839088439941406, -30.144241333007812, -28.449398040771484, -26.754552841186523, -25.05970573425293, -23.36486053466797, -21.670013427734375, -19.975168228149414, -18.280323028564453, -16.58547592163086, -14.890630722045898, -13.195784568786621, -11.500938415527344, -9.806093215942383, -8.111247062683105, -6.416400909423828, -4.721555709838867, -3.02670955657959, -1.3318595886230469, 0.36298632621765137, 2.0578322410583496, 3.7526779174804688, 5.447524070739746, 7.142370223999023, 8.837215423583984, 10.532061576843262, 12.226907730102539, 13.921753883361816, 15.616600036621094, 17.311445236206055, 19.006290435791016, 20.70113754272461, 22.39598274230957, 24.09082794189453, 25.785675048828125, 27.480520248413086, 29.17536735534668, 30.87021255493164, 32.565059661865234, 34.25990295410156, 35.954750061035156, 37.64959716796875, 39.344444274902344, 41.03929138183594, 42.734134674072266, 44.42898178100586, 46.12382888793945, 47.81867218017578, 49.513519287109375, 51.20836639404297, 52.9032096862793]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 12.0, 2.0, 9.0, 7.0, 12.0, 11.0, 9.0, 15.0, 19.0, 14.0, 24.0, 27.0, 19.0, 30.0, 25.0, 25.0, 31.0, 40.0, 37.0, 34.0, 36.0, 47.0, 45.0, 43.0, 29.0, 45.0, 37.0, 28.0, 30.0, 26.0, 23.0, 20.0, 27.0, 24.0, 23.0, 14.0, 18.0, 16.0, 15.0, 13.0, 10.0, 8.0, 10.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.34765625, -5.17236328125, -4.9970703125, -4.82177734375, -4.646484375, -4.47119140625, -4.2958984375, -4.12060546875, -3.9453125, -3.77001953125, -3.5947265625, -3.41943359375, -3.244140625, -3.06884765625, -2.8935546875, -2.71826171875, -2.54296875, -2.36767578125, -2.1923828125, -2.01708984375, -1.841796875, -1.66650390625, -1.4912109375, -1.31591796875, -1.140625, -0.96533203125, -0.7900390625, -0.61474609375, -0.439453125, -0.26416015625, -0.0888671875, 0.08642578125, 0.26171875, 0.43701171875, 0.6123046875, 0.78759765625, 0.962890625, 1.13818359375, 1.3134765625, 1.48876953125, 1.6640625, 1.83935546875, 2.0146484375, 2.18994140625, 2.365234375, 2.54052734375, 2.7158203125, 2.89111328125, 3.06640625, 3.24169921875, 3.4169921875, 3.59228515625, 3.767578125, 3.94287109375, 4.1181640625, 4.29345703125, 4.46875, 4.64404296875, 4.8193359375, 4.99462890625, 5.169921875, 5.34521484375, 5.5205078125, 5.69580078125, 5.87109375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 2.0, 6.0, 7.0, 13.0, 13.0, 6.0, 14.0, 25.0, 30.0, 31.0, 32.0, 54.0, 75.0, 83.0, 165.0, 311.0, 547.0, 1122.0, 3054.0, 11925.0, 69934.0, 424523.0, 1431964.0, 1601368.0, 538629.0, 88903.0, 14672.0, 3799.0, 1402.0, 647.0, 302.0, 192.0, 124.0, 76.0, 57.0, 47.0, 27.0, 16.0, 23.0, 11.0, 11.0, 10.0, 5.0, 12.0, 3.0, 2.0, 7.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.55859375, -6.30706787109375, -6.0555419921875, -5.80401611328125, -5.552490234375, -5.30096435546875, -5.0494384765625, -4.79791259765625, -4.54638671875, -4.29486083984375, -4.0433349609375, -3.79180908203125, -3.540283203125, -3.28875732421875, -3.0372314453125, -2.78570556640625, -2.5341796875, -2.28265380859375, -2.0311279296875, -1.77960205078125, -1.528076171875, -1.27655029296875, -1.0250244140625, -0.77349853515625, -0.52197265625, -0.27044677734375, -0.0189208984375, 0.23260498046875, 0.484130859375, 0.73565673828125, 0.9871826171875, 1.23870849609375, 1.490234375, 1.74176025390625, 1.9932861328125, 2.24481201171875, 2.496337890625, 2.74786376953125, 2.9993896484375, 3.25091552734375, 3.50244140625, 3.75396728515625, 4.0054931640625, 4.25701904296875, 4.508544921875, 4.76007080078125, 5.0115966796875, 5.26312255859375, 5.5146484375, 5.76617431640625, 6.0177001953125, 6.26922607421875, 6.520751953125, 6.77227783203125, 7.0238037109375, 7.27532958984375, 7.52685546875, 7.77838134765625, 8.0299072265625, 8.28143310546875, 8.532958984375, 8.78448486328125, 9.0360107421875, 9.28753662109375, 9.5390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 8.0, 16.0, 20.0, 40.0, 36.0, 62.0, 111.0, 149.0, 233.0, 340.0, 528.0, 631.0, 559.0, 452.0, 297.0, 193.0, 124.0, 82.0, 58.0, 36.0, 25.0, 26.0, 17.0, 10.0, 11.0, 1.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.921875, -18.4805908203125, -18.039306640625, -17.5980224609375, -17.15673828125, -16.7154541015625, -16.274169921875, -15.8328857421875, -15.3916015625, -14.9503173828125, -14.509033203125, -14.0677490234375, -13.62646484375, -13.1851806640625, -12.743896484375, -12.3026123046875, -11.861328125, -11.4200439453125, -10.978759765625, -10.5374755859375, -10.09619140625, -9.6549072265625, -9.213623046875, -8.7723388671875, -8.3310546875, -7.8897705078125, -7.448486328125, -7.0072021484375, -6.56591796875, -6.1246337890625, -5.683349609375, -5.2420654296875, -4.80078125, -4.3594970703125, -3.918212890625, -3.4769287109375, -3.03564453125, -2.5943603515625, -2.153076171875, -1.7117919921875, -1.2705078125, -0.8292236328125, -0.387939453125, 0.0533447265625, 0.49462890625, 0.9359130859375, 1.377197265625, 1.8184814453125, 2.259765625, 2.7010498046875, 3.142333984375, 3.5836181640625, 4.02490234375, 4.4661865234375, 4.907470703125, 5.3487548828125, 5.7900390625, 6.2313232421875, 6.672607421875, 7.1138916015625, 7.55517578125, 7.9964599609375, 8.437744140625, 8.8790283203125, 9.3203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 12.0, 9.0, 19.0, 33.0, 45.0, 70.0, 97.0, 176.0, 352.0, 637.0, 1616.0, 13933.0, 4037312.0, 135528.0, 2535.0, 875.0, 439.0, 247.0, 133.0, 73.0, 50.0, 32.0, 18.0, 17.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -33.60595703125, -32.0556640625, -30.50537109375, -28.955078125, -27.40478515625, -25.8544921875, -24.30419921875, -22.75390625, -21.20361328125, -19.6533203125, -18.10302734375, -16.552734375, -15.00244140625, -13.4521484375, -11.90185546875, -10.3515625, -8.80126953125, -7.2509765625, -5.70068359375, -4.150390625, -2.60009765625, -1.0498046875, 0.50048828125, 2.05078125, 3.60107421875, 5.1513671875, 6.70166015625, 8.251953125, 9.80224609375, 11.3525390625, 12.90283203125, 14.453125, 16.00341796875, 17.5537109375, 19.10400390625, 20.654296875, 22.20458984375, 23.7548828125, 25.30517578125, 26.85546875, 28.40576171875, 29.9560546875, 31.50634765625, 33.056640625, 34.60693359375, 36.1572265625, 37.70751953125, 39.2578125, 40.80810546875, 42.3583984375, 43.90869140625, 45.458984375, 47.00927734375, 48.5595703125, 50.10986328125, 51.66015625, 53.21044921875, 54.7607421875, 56.31103515625, 57.861328125, 59.41162109375, 60.9619140625, 62.51220703125, 64.0625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 178.0, 545.0, 272.0, 14.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.85655212402344, -189.66622924804688, -183.4759063720703, -177.28558349609375, -171.0952606201172, -164.90493774414062, -158.714599609375, -152.5242919921875, -146.33395385742188, -140.1436309814453, -133.95330810546875, -127.76298522949219, -121.57266235351562, -115.38233947753906, -109.19200897216797, -103.0016860961914, -96.81137084960938, -90.62104797363281, -84.43072509765625, -78.24040222167969, -72.05007934570312, -65.85975646972656, -59.66942596435547, -53.479103088378906, -47.288780212402344, -41.09845733642578, -34.90813446044922, -28.71780776977539, -22.527484893798828, -16.337162017822266, -10.146835327148438, -3.956512451171875, 2.2338104248046875, 8.424134254455566, 14.614458084106445, 20.80478286743164, 26.995105743408203, 33.185428619384766, 39.375755310058594, 45.566078186035156, 51.75640106201172, 57.94672393798828, 64.13704681396484, 70.32737731933594, 76.5177001953125, 82.70802307128906, 88.89834594726562, 95.08866882324219, 101.27899169921875, 107.46931457519531, 113.65963745117188, 119.84996032714844, 126.040283203125, 132.23060607910156, 138.42092895507812, 144.61126708984375, 150.80157470703125, 156.9918975830078, 163.18222045898438, 169.37254333496094, 175.5628662109375, 181.75318908691406, 187.94351196289062, 194.13385009765625, 200.3241729736328]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 8.0, 14.0, 15.0, 20.0, 12.0, 20.0, 25.0, 32.0, 31.0, 35.0, 34.0, 35.0, 36.0, 36.0, 47.0, 40.0, 48.0, 35.0, 42.0, 36.0, 44.0, 38.0, 46.0, 38.0, 25.0, 28.0, 22.0, 18.0, 22.0, 13.0, 15.0, 17.0, 10.0, 7.0, 10.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.47553253173828, -36.366600036621094, -35.257667541503906, -34.14873504638672, -33.03980255126953, -31.930870056152344, -30.821937561035156, -29.71300506591797, -28.60407257080078, -27.495140075683594, -26.386207580566406, -25.27727508544922, -24.16834259033203, -23.059410095214844, -21.950477600097656, -20.84154510498047, -19.732614517211914, -18.623682022094727, -17.51474952697754, -16.40581703186035, -15.296884536743164, -14.187952041625977, -13.079020500183105, -11.970088005065918, -10.86115550994873, -9.752223014831543, -8.643290519714355, -7.534358501434326, -6.425426006317139, -5.316493511199951, -4.207561492919922, -3.0986289978027344, -1.9896965026855469, -0.8807641267776489, 0.22816824913024902, 1.3371005058288574, 2.446033000946045, 3.5549654960632324, 4.663897514343262, 5.772830009460449, 6.881762504577637, 7.990694999694824, 9.099627494812012, 10.208559036254883, 11.31749153137207, 12.426424026489258, 13.535356521606445, 14.644289016723633, 15.75322151184082, 16.862154006958008, 17.971086502075195, 19.080018997192383, 20.18895149230957, 21.297883987426758, 22.406814575195312, 23.5157470703125, 24.624679565429688, 25.733612060546875, 26.842544555664062, 27.95147705078125, 29.060409545898438, 30.169342041015625, 31.278274536132812, 32.38720703125, 33.49613952636719]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 10.0, 1.0, 10.0, 8.0, 11.0, 12.0, 9.0, 22.0, 23.0, 17.0, 21.0, 25.0, 27.0, 21.0, 37.0, 47.0, 34.0, 38.0, 39.0, 50.0, 60.0, 34.0, 52.0, 42.0, 32.0, 42.0, 29.0, 39.0, 28.0, 27.0, 27.0, 21.0, 13.0, 21.0, 15.0, 10.0, 12.0, 8.0, 13.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6348876953125, -5.445556640625, -5.2562255859375, -5.06689453125, -4.8775634765625, -4.688232421875, -4.4989013671875, -4.3095703125, -4.1202392578125, -3.930908203125, -3.7415771484375, -3.55224609375, -3.3629150390625, -3.173583984375, -2.9842529296875, -2.794921875, -2.6055908203125, -2.416259765625, -2.2269287109375, -2.03759765625, -1.8482666015625, -1.658935546875, -1.4696044921875, -1.2802734375, -1.0909423828125, -0.901611328125, -0.7122802734375, -0.52294921875, -0.3336181640625, -0.144287109375, 0.0450439453125, 0.234375, 0.4237060546875, 0.613037109375, 0.8023681640625, 0.99169921875, 1.1810302734375, 1.370361328125, 1.5596923828125, 1.7490234375, 1.9383544921875, 2.127685546875, 2.3170166015625, 2.50634765625, 2.6956787109375, 2.885009765625, 3.0743408203125, 3.263671875, 3.4530029296875, 3.642333984375, 3.8316650390625, 4.02099609375, 4.2103271484375, 4.399658203125, 4.5889892578125, 4.7783203125, 4.9676513671875, 5.156982421875, 5.3463134765625, 5.53564453125, 5.7249755859375, 5.914306640625, 6.1036376953125, 6.29296875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 6.0, 6.0, 19.0, 21.0, 37.0, 40.0, 61.0, 100.0, 140.0, 244.0, 277.0, 450.0, 702.0, 1024.0, 1465.0, 2214.0, 3389.0, 5064.0, 7578.0, 11409.0, 17232.0, 26574.0, 41751.0, 66569.0, 109573.0, 185498.0, 216616.0, 131542.0, 79298.0, 49045.0, 31226.0, 19823.0, 13180.0, 8891.0, 5773.0, 3909.0, 2498.0, 1719.0, 1239.0, 721.0, 545.0, 367.0, 230.0, 152.0, 109.0, 68.0, 53.0, 41.0, 18.0, 14.0, 20.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0], "bins": [-0.57177734375, -0.5545425415039062, -0.5373077392578125, -0.5200729370117188, -0.502838134765625, -0.48560333251953125, -0.4683685302734375, -0.45113372802734375, -0.43389892578125, -0.41666412353515625, -0.3994293212890625, -0.38219451904296875, -0.364959716796875, -0.34772491455078125, -0.3304901123046875, -0.31325531005859375, -0.2960205078125, -0.27878570556640625, -0.2615509033203125, -0.24431610107421875, -0.227081298828125, -0.20984649658203125, -0.1926116943359375, -0.17537689208984375, -0.15814208984375, -0.14090728759765625, -0.1236724853515625, -0.10643768310546875, -0.089202880859375, -0.07196807861328125, -0.0547332763671875, -0.03749847412109375, -0.020263671875, -0.00302886962890625, 0.0142059326171875, 0.03144073486328125, 0.048675537109375, 0.06591033935546875, 0.0831451416015625, 0.10037994384765625, 0.11761474609375, 0.13484954833984375, 0.1520843505859375, 0.16931915283203125, 0.186553955078125, 0.20378875732421875, 0.2210235595703125, 0.23825836181640625, 0.2554931640625, 0.27272796630859375, 0.2899627685546875, 0.30719757080078125, 0.324432373046875, 0.34166717529296875, 0.3589019775390625, 0.37613677978515625, 0.39337158203125, 0.41060638427734375, 0.4278411865234375, 0.44507598876953125, 0.462310791015625, 0.47954559326171875, 0.4967803955078125, 0.5140151977539062, 0.53125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 9.0, 10.0, 9.0, 7.0, 10.0, 11.0, 15.0, 19.0, 13.0, 24.0, 24.0, 21.0, 35.0, 29.0, 35.0, 34.0, 33.0, 37.0, 35.0, 41.0, 1070.0, 50.0, 35.0, 45.0, 37.0, 42.0, 33.0, 30.0, 32.0, 33.0, 16.0, 21.0, 21.0, 22.0, 13.0, 13.0, 15.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.42578125, -3.3116455078125, -3.197509765625, -3.0833740234375, -2.96923828125, -2.8551025390625, -2.740966796875, -2.6268310546875, -2.5126953125, -2.3985595703125, -2.284423828125, -2.1702880859375, -2.05615234375, -1.9420166015625, -1.827880859375, -1.7137451171875, -1.599609375, -1.4854736328125, -1.371337890625, -1.2572021484375, -1.14306640625, -1.0289306640625, -0.914794921875, -0.8006591796875, -0.6865234375, -0.5723876953125, -0.458251953125, -0.3441162109375, -0.22998046875, -0.1158447265625, -0.001708984375, 0.1124267578125, 0.2265625, 0.3406982421875, 0.454833984375, 0.5689697265625, 0.68310546875, 0.7972412109375, 0.911376953125, 1.0255126953125, 1.1396484375, 1.2537841796875, 1.367919921875, 1.4820556640625, 1.59619140625, 1.7103271484375, 1.824462890625, 1.9385986328125, 2.052734375, 2.1668701171875, 2.281005859375, 2.3951416015625, 2.50927734375, 2.6234130859375, 2.737548828125, 2.8516845703125, 2.9658203125, 3.0799560546875, 3.194091796875, 3.3082275390625, 3.42236328125, 3.5364990234375, 3.650634765625, 3.7647705078125, 3.87890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 7.0, 11.0, 24.0, 20.0, 31.0, 42.0, 59.0, 80.0, 105.0, 155.0, 208.0, 317.0, 489.0, 672.0, 1013.0, 1297.0, 1958.0, 2876.0, 4268.0, 6292.0, 9483.0, 14404.0, 22509.0, 35882.0, 57321.0, 93438.0, 154638.0, 1267248.0, 160855.0, 96547.0, 59632.0, 36542.0, 23361.0, 15040.0, 9804.0, 6367.0, 4361.0, 2978.0, 2082.0, 1458.0, 930.0, 705.0, 473.0, 367.0, 202.0, 192.0, 139.0, 79.0, 59.0, 35.0, 23.0, 15.0, 12.0, 17.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0], "bins": [-0.5234375, -0.5068359375, -0.490234375, -0.4736328125, -0.45703125, -0.4404296875, -0.423828125, -0.4072265625, -0.390625, -0.3740234375, -0.357421875, -0.3408203125, -0.32421875, -0.3076171875, -0.291015625, -0.2744140625, -0.2578125, -0.2412109375, -0.224609375, -0.2080078125, -0.19140625, -0.1748046875, -0.158203125, -0.1416015625, -0.125, -0.1083984375, -0.091796875, -0.0751953125, -0.05859375, -0.0419921875, -0.025390625, -0.0087890625, 0.0078125, 0.0244140625, 0.041015625, 0.0576171875, 0.07421875, 0.0908203125, 0.107421875, 0.1240234375, 0.140625, 0.1572265625, 0.173828125, 0.1904296875, 0.20703125, 0.2236328125, 0.240234375, 0.2568359375, 0.2734375, 0.2900390625, 0.306640625, 0.3232421875, 0.33984375, 0.3564453125, 0.373046875, 0.3896484375, 0.40625, 0.4228515625, 0.439453125, 0.4560546875, 0.47265625, 0.4892578125, 0.505859375, 0.5224609375, 0.5390625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 12.0, 16.0, 12.0, 25.0, 30.0, 34.0, 81.0, 142.0, 168.0, 148.0, 110.0, 66.0, 46.0, 32.0, 15.0, 9.0, 11.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0098876953125, -0.009577751159667969, -0.009267807006835938, -0.008957862854003906, -0.008647918701171875, -0.008337974548339844, -0.008028030395507812, -0.007718086242675781, -0.00740814208984375, -0.007098197937011719, -0.0067882537841796875, -0.006478309631347656, -0.006168365478515625, -0.005858421325683594, -0.0055484771728515625, -0.005238533020019531, -0.0049285888671875, -0.004618644714355469, -0.0043087005615234375, -0.003998756408691406, -0.003688812255859375, -0.0033788681030273438, -0.0030689239501953125, -0.0027589797973632812, -0.00244903564453125, -0.0021390914916992188, -0.0018291473388671875, -0.0015192031860351562, -0.001209259033203125, -0.0008993148803710938, -0.0005893707275390625, -0.00027942657470703125, 3.0517578125e-05, 0.00034046173095703125, 0.0006504058837890625, 0.0009603500366210938, 0.001270294189453125, 0.0015802383422851562, 0.0018901824951171875, 0.0022001266479492188, 0.00251007080078125, 0.0028200149536132812, 0.0031299591064453125, 0.0034399032592773438, 0.003749847412109375, 0.004059791564941406, 0.0043697357177734375, 0.004679679870605469, 0.0049896240234375, 0.005299568176269531, 0.0056095123291015625, 0.005919456481933594, 0.006229400634765625, 0.006539344787597656, 0.0068492889404296875, 0.007159233093261719, 0.00746917724609375, 0.007779121398925781, 0.008089065551757812, 0.008399009704589844, 0.008708953857421875, 0.009018898010253906, 0.009328842163085938, 0.009638786315917969, 0.00994873046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 13.0, 13.0, 18.0, 30.0, 30.0, 64.0, 129.0, 248.0, 673.0, 769377.0, 276693.0, 686.0, 221.0, 111.0, 69.0, 57.0, 25.0, 21.0, 18.0, 13.0, 8.0, 2.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.19854736328125, -0.192138671875, -0.18572998046875, -0.1793212890625, -0.17291259765625, -0.16650390625, -0.16009521484375, -0.1536865234375, -0.14727783203125, -0.140869140625, -0.13446044921875, -0.1280517578125, -0.12164306640625, -0.115234375, -0.10882568359375, -0.1024169921875, -0.09600830078125, -0.089599609375, -0.08319091796875, -0.0767822265625, -0.07037353515625, -0.06396484375, -0.05755615234375, -0.0511474609375, -0.04473876953125, -0.038330078125, -0.03192138671875, -0.0255126953125, -0.01910400390625, -0.0126953125, -0.00628662109375, 0.0001220703125, 0.00653076171875, 0.012939453125, 0.01934814453125, 0.0257568359375, 0.03216552734375, 0.03857421875, 0.04498291015625, 0.0513916015625, 0.05780029296875, 0.064208984375, 0.07061767578125, 0.0770263671875, 0.08343505859375, 0.08984375, 0.09625244140625, 0.1026611328125, 0.10906982421875, 0.115478515625, 0.12188720703125, 0.1282958984375, 0.13470458984375, 0.14111328125, 0.14752197265625, 0.1539306640625, 0.16033935546875, 0.166748046875, 0.17315673828125, 0.1795654296875, 0.18597412109375, 0.1923828125, 0.19879150390625, 0.2052001953125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 86.0, 623.0, 274.0, 20.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01970273070037365, -0.019314132630825043, -0.018925536423921585, -0.018536938354372978, -0.01814834028482437, -0.017759744077920914, -0.017371146008372307, -0.0169825479388237, -0.016593951731920242, -0.016205353662371635, -0.015816757455468178, -0.015428159385919571, -0.015039562247693539, -0.014650965109467506, -0.0142623670399189, -0.013873769901692867, -0.013485172763466835, -0.013096575625240803, -0.012707977555692196, -0.012319380417466164, -0.011930783279240131, -0.011542186141014099, -0.011153588071465492, -0.01076499093323946, -0.010376392863690853, -0.00998779572546482, -0.009599197655916214, -0.009210600517690182, -0.00882200337946415, -0.008433406241238117, -0.00804480817168951, -0.007656211033463478, -0.0072676134295761585, -0.006879015825688839, -0.006490418687462807, -0.006101821083575487, -0.005713223945349455, -0.005324626341462135, -0.004936029203236103, -0.0045474315993487835, -0.004158833995461464, -0.003770236624404788, -0.003381639253348112, -0.0029930416494607925, -0.0026044445112347603, -0.0022158469073474407, -0.0018272495362907648, -0.001438652165234089, -0.0010500550270080566, -0.0006614576559513807, -0.0002728602266870439, 0.00011573720257729292, 0.0005043345736339688, 0.0008929319446906447, 0.0012815294321626425, 0.0016701268032193184, 0.0020587241742759943, 0.00244732154533267, 0.002835918916389346, 0.003224516287446022, 0.0036131138913333416, 0.004001711029559374, 0.004390308633446693, 0.004778905771672726, 0.005167503375560045]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 10.0, 15.0, 13.0, 15.0, 18.0, 21.0, 24.0, 21.0, 24.0, 27.0, 34.0, 33.0, 31.0, 41.0, 36.0, 26.0, 45.0, 40.0, 39.0, 34.0, 48.0, 28.0, 34.0, 40.0, 31.0, 33.0, 30.0, 35.0, 20.0, 18.0, 12.0, 21.0, 12.0, 12.0, 13.0, 11.0, 5.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.002680182456970215, -0.002591380849480629, -0.002502579241991043, -0.002413777634501457, -0.0023249760270118713, -0.0022361744195222855, -0.0021473728120326996, -0.0020585712045431137, -0.001969769597053528, -0.001880967989563942, -0.001792166382074356, -0.0017033647745847702, -0.0016145631670951843, -0.0015257615596055984, -0.0014369599521160126, -0.0013481583446264267, -0.0012593567371368408, -0.001170555129647255, -0.001081753522157669, -0.0009929519146680832, -0.0009041503071784973, -0.0008153486996889114, -0.0007265470921993256, -0.0006377454847097397, -0.0005489438772201538, -0.00046014226973056793, -0.00037134066224098206, -0.0002825390547513962, -0.0001937374472618103, -0.00010493583977222443, -1.613423228263855e-05, 7.266737520694733e-05, 0.0001614689826965332, 0.0002502705901861191, 0.00033907219767570496, 0.00042787380516529083, 0.0005166754126548767, 0.0006054770201444626, 0.0006942786276340485, 0.0007830802351236343, 0.0008718818426132202, 0.0009606834501028061, 0.001049485057592392, 0.0011382866650819778, 0.0012270882725715637, 0.0013158898800611496, 0.0014046914875507355, 0.0014934930950403214, 0.0015822947025299072, 0.001671096310019493, 0.001759897917509079, 0.0018486995249986649, 0.0019375011324882507, 0.0020263027399778366, 0.0021151043474674225, 0.0022039059549570084, 0.0022927075624465942, 0.00238150916993618, 0.002470310777425766, 0.002559112384915352, 0.0026479139924049377, 0.0027367155998945236, 0.0028255172073841095, 0.0029143188148736954, 0.0030031204223632812]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 10.0, 1.0, 10.0, 8.0, 11.0, 12.0, 9.0, 22.0, 23.0, 17.0, 21.0, 25.0, 27.0, 21.0, 37.0, 47.0, 34.0, 39.0, 38.0, 50.0, 59.0, 35.0, 52.0, 42.0, 32.0, 42.0, 29.0, 39.0, 28.0, 27.0, 27.0, 21.0, 13.0, 21.0, 15.0, 10.0, 12.0, 8.0, 13.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6348876953125, -5.445556640625, -5.2562255859375, -5.06689453125, -4.8775634765625, -4.688232421875, -4.4989013671875, -4.3095703125, -4.1202392578125, -3.930908203125, -3.7415771484375, -3.55224609375, -3.3629150390625, -3.173583984375, -2.9842529296875, -2.794921875, -2.6055908203125, -2.416259765625, -2.2269287109375, -2.03759765625, -1.8482666015625, -1.658935546875, -1.4696044921875, -1.2802734375, -1.0909423828125, -0.901611328125, -0.7122802734375, -0.52294921875, -0.3336181640625, -0.144287109375, 0.0450439453125, 0.234375, 0.4237060546875, 0.613037109375, 0.8023681640625, 0.99169921875, 1.1810302734375, 1.370361328125, 1.5596923828125, 1.7490234375, 1.9383544921875, 2.127685546875, 2.3170166015625, 2.50634765625, 2.6956787109375, 2.885009765625, 3.0743408203125, 3.263671875, 3.4530029296875, 3.642333984375, 3.8316650390625, 4.02099609375, 4.2103271484375, 4.399658203125, 4.5889892578125, 4.7783203125, 4.9676513671875, 5.156982421875, 5.3463134765625, 5.53564453125, 5.7249755859375, 5.914306640625, 6.1036376953125, 6.29296875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 7.0, 14.0, 20.0, 24.0, 27.0, 40.0, 68.0, 126.0, 248.0, 469.0, 1134.0, 2847.0, 7298.0, 18842.0, 51546.0, 157893.0, 412039.0, 265229.0, 82479.0, 29402.0, 11355.0, 4289.0, 1645.0, 720.0, 333.0, 170.0, 82.0, 47.0, 24.0, 31.0, 18.0, 15.0, 11.0, 6.0, 15.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.12969970703125, -5.9234619140625, -5.71722412109375, -5.510986328125, -5.30474853515625, -5.0985107421875, -4.89227294921875, -4.68603515625, -4.47979736328125, -4.2735595703125, -4.06732177734375, -3.861083984375, -3.65484619140625, -3.4486083984375, -3.24237060546875, -3.0361328125, -2.82989501953125, -2.6236572265625, -2.41741943359375, -2.211181640625, -2.00494384765625, -1.7987060546875, -1.59246826171875, -1.38623046875, -1.17999267578125, -0.9737548828125, -0.76751708984375, -0.561279296875, -0.35504150390625, -0.1488037109375, 0.05743408203125, 0.263671875, 0.46990966796875, 0.6761474609375, 0.88238525390625, 1.088623046875, 1.29486083984375, 1.5010986328125, 1.70733642578125, 1.91357421875, 2.11981201171875, 2.3260498046875, 2.53228759765625, 2.738525390625, 2.94476318359375, 3.1510009765625, 3.35723876953125, 3.5634765625, 3.76971435546875, 3.9759521484375, 4.18218994140625, 4.388427734375, 4.59466552734375, 4.8009033203125, 5.00714111328125, 5.21337890625, 5.41961669921875, 5.6258544921875, 5.83209228515625, 6.038330078125, 6.24456787109375, 6.4508056640625, 6.65704345703125, 6.86328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 6.0, 13.0, 17.0, 18.0, 20.0, 20.0, 21.0, 22.0, 28.0, 28.0, 39.0, 42.0, 29.0, 47.0, 64.0, 111.0, 245.0, 1460.0, 241.0, 101.0, 69.0, 51.0, 35.0, 43.0, 39.0, 27.0, 27.0, 31.0, 26.0, 17.0, 26.0, 9.0, 5.0, 15.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-21.0625, -20.451416015625, -19.84033203125, -19.229248046875, -18.6181640625, -18.007080078125, -17.39599609375, -16.784912109375, -16.173828125, -15.562744140625, -14.95166015625, -14.340576171875, -13.7294921875, -13.118408203125, -12.50732421875, -11.896240234375, -11.28515625, -10.674072265625, -10.06298828125, -9.451904296875, -8.8408203125, -8.229736328125, -7.61865234375, -7.007568359375, -6.396484375, -5.785400390625, -5.17431640625, -4.563232421875, -3.9521484375, -3.341064453125, -2.72998046875, -2.118896484375, -1.5078125, -0.896728515625, -0.28564453125, 0.325439453125, 0.9365234375, 1.547607421875, 2.15869140625, 2.769775390625, 3.380859375, 3.991943359375, 4.60302734375, 5.214111328125, 5.8251953125, 6.436279296875, 7.04736328125, 7.658447265625, 8.26953125, 8.880615234375, 9.49169921875, 10.102783203125, 10.7138671875, 11.324951171875, 11.93603515625, 12.547119140625, 13.158203125, 13.769287109375, 14.38037109375, 14.991455078125, 15.6025390625, 16.213623046875, 16.82470703125, 17.435791015625, 18.046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 7.0, 6.0, 8.0, 12.0, 18.0, 14.0, 21.0, 30.0, 38.0, 68.0, 98.0, 148.0, 228.0, 442.0, 857.0, 4911.0, 2996913.0, 138541.0, 1850.0, 626.0, 321.0, 162.0, 114.0, 76.0, 49.0, 48.0, 24.0, 16.0, 16.0, 9.0, 5.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.25, -53.51220703125, -51.7744140625, -50.03662109375, -48.298828125, -46.56103515625, -44.8232421875, -43.08544921875, -41.34765625, -39.60986328125, -37.8720703125, -36.13427734375, -34.396484375, -32.65869140625, -30.9208984375, -29.18310546875, -27.4453125, -25.70751953125, -23.9697265625, -22.23193359375, -20.494140625, -18.75634765625, -17.0185546875, -15.28076171875, -13.54296875, -11.80517578125, -10.0673828125, -8.32958984375, -6.591796875, -4.85400390625, -3.1162109375, -1.37841796875, 0.359375, 2.09716796875, 3.8349609375, 5.57275390625, 7.310546875, 9.04833984375, 10.7861328125, 12.52392578125, 14.26171875, 15.99951171875, 17.7373046875, 19.47509765625, 21.212890625, 22.95068359375, 24.6884765625, 26.42626953125, 28.1640625, 29.90185546875, 31.6396484375, 33.37744140625, 35.115234375, 36.85302734375, 38.5908203125, 40.32861328125, 42.06640625, 43.80419921875, 45.5419921875, 47.27978515625, 49.017578125, 50.75537109375, 52.4931640625, 54.23095703125, 55.96875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 36.0, 161.0, 373.0, 311.0, 99.0, 24.0, 1.0, 0.0, 1.0], "bins": [-121.3439712524414, -119.24247741699219, -117.14098358154297, -115.03948974609375, -112.93800354003906, -110.83650970458984, -108.73501586914062, -106.6335220336914, -104.53202819824219, -102.43053436279297, -100.32904052734375, -98.22755432128906, -96.12606048583984, -94.02456665039062, -91.9230728149414, -89.82157897949219, -87.7200927734375, -85.61859893798828, -83.51710510253906, -81.41561889648438, -79.31412506103516, -77.21263122558594, -75.11113739013672, -73.0096435546875, -70.90814971923828, -68.80665588378906, -66.70516204833984, -64.60366821289062, -62.50217819213867, -60.40068817138672, -58.2991943359375, -56.19770050048828, -54.09620666503906, -51.994712829589844, -49.89322280883789, -47.79172897338867, -45.69023513793945, -43.5887451171875, -41.48725128173828, -39.38575744628906, -37.284263610839844, -35.182769775390625, -33.08127975463867, -30.979785919189453, -28.878292083740234, -26.77680015563965, -24.675308227539062, -22.573814392089844, -20.47232437133789, -18.370832443237305, -16.269338607788086, -14.1678466796875, -12.066353797912598, -9.964860916137695, -7.863368988037109, -5.761876106262207, -3.6603832244873047, -1.5588905811309814, 0.5426020622253418, 2.644094467163086, 4.745587348937988, 6.847080230712891, 8.948572158813477, 11.050065040588379, 13.151557922363281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 2.0, 5.0, 8.0, 9.0, 16.0, 17.0, 11.0, 24.0, 20.0, 25.0, 19.0, 20.0, 26.0, 33.0, 35.0, 27.0, 27.0, 53.0, 36.0, 42.0, 44.0, 38.0, 43.0, 48.0, 37.0, 34.0, 33.0, 35.0, 22.0, 21.0, 29.0, 21.0, 19.0, 21.0, 18.0, 18.0, 15.0, 11.0, 6.0, 3.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.848304748535156, -48.334922790527344, -46.82154083251953, -45.30815887451172, -43.794776916503906, -42.281394958496094, -40.76801300048828, -39.25463104248047, -37.741249084472656, -36.227867126464844, -34.71448516845703, -33.20110321044922, -31.687721252441406, -30.174339294433594, -28.66095733642578, -27.14757537841797, -25.634193420410156, -24.120811462402344, -22.60742950439453, -21.09404754638672, -19.580665588378906, -18.067283630371094, -16.55390167236328, -15.040519714355469, -13.527137756347656, -12.013755798339844, -10.500373840332031, -8.986991882324219, -7.473609924316406, -5.960227966308594, -4.446846008300781, -2.9334640502929688, -1.4200782775878906, 0.09330368041992188, 1.6066856384277344, 3.120067596435547, 4.633449554443359, 6.146831512451172, 7.660213470458984, 9.173595428466797, 10.68697738647461, 12.200359344482422, 13.713741302490234, 15.227123260498047, 16.74050521850586, 18.253887176513672, 19.767269134521484, 21.280651092529297, 22.79403305053711, 24.307415008544922, 25.820796966552734, 27.334178924560547, 28.84756088256836, 30.360942840576172, 31.874324798583984, 33.3877067565918, 34.90108871459961, 36.41447067260742, 37.927852630615234, 39.44123458862305, 40.95461654663086, 42.46799850463867, 43.981380462646484, 45.4947624206543, 47.00814437866211]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 9.0, 9.0, 8.0, 10.0, 14.0, 15.0, 22.0, 17.0, 24.0, 28.0, 32.0, 37.0, 29.0, 35.0, 29.0, 39.0, 42.0, 38.0, 37.0, 44.0, 46.0, 45.0, 32.0, 34.0, 37.0, 23.0, 30.0, 20.0, 25.0, 26.0, 16.0, 16.0, 18.0, 11.0, 13.0, 14.0, 14.0, 12.0, 7.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.34368896484375, -5.1600341796875, -4.97637939453125, -4.792724609375, -4.60906982421875, -4.4254150390625, -4.24176025390625, -4.05810546875, -3.87445068359375, -3.6907958984375, -3.50714111328125, -3.323486328125, -3.13983154296875, -2.9561767578125, -2.77252197265625, -2.5888671875, -2.40521240234375, -2.2215576171875, -2.03790283203125, -1.854248046875, -1.67059326171875, -1.4869384765625, -1.30328369140625, -1.11962890625, -0.93597412109375, -0.7523193359375, -0.56866455078125, -0.385009765625, -0.20135498046875, -0.0177001953125, 0.16595458984375, 0.349609375, 0.53326416015625, 0.7169189453125, 0.90057373046875, 1.084228515625, 1.26788330078125, 1.4515380859375, 1.63519287109375, 1.81884765625, 2.00250244140625, 2.1861572265625, 2.36981201171875, 2.553466796875, 2.73712158203125, 2.9207763671875, 3.10443115234375, 3.2880859375, 3.47174072265625, 3.6553955078125, 3.83905029296875, 4.022705078125, 4.20635986328125, 4.3900146484375, 4.57366943359375, 4.75732421875, 4.94097900390625, 5.1246337890625, 5.30828857421875, 5.491943359375, 5.67559814453125, 5.8592529296875, 6.04290771484375, 6.2265625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 7.0, 11.0, 9.0, 15.0, 18.0, 14.0, 26.0, 31.0, 34.0, 52.0, 53.0, 68.0, 97.0, 116.0, 218.0, 700.0, 6064.0, 452010.0, 3479377.0, 249689.0, 4267.0, 618.0, 214.0, 101.0, 85.0, 73.0, 61.0, 40.0, 29.0, 30.0, 22.0, 16.0, 18.0, 15.0, 14.0, 13.0, 7.0, 10.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.237548828125, -16.63134765625, -16.025146484375, -15.4189453125, -14.812744140625, -14.20654296875, -13.600341796875, -12.994140625, -12.387939453125, -11.78173828125, -11.175537109375, -10.5693359375, -9.963134765625, -9.35693359375, -8.750732421875, -8.14453125, -7.538330078125, -6.93212890625, -6.325927734375, -5.7197265625, -5.113525390625, -4.50732421875, -3.901123046875, -3.294921875, -2.688720703125, -2.08251953125, -1.476318359375, -0.8701171875, -0.263916015625, 0.34228515625, 0.948486328125, 1.5546875, 2.160888671875, 2.76708984375, 3.373291015625, 3.9794921875, 4.585693359375, 5.19189453125, 5.798095703125, 6.404296875, 7.010498046875, 7.61669921875, 8.222900390625, 8.8291015625, 9.435302734375, 10.04150390625, 10.647705078125, 11.25390625, 11.860107421875, 12.46630859375, 13.072509765625, 13.6787109375, 14.284912109375, 14.89111328125, 15.497314453125, 16.103515625, 16.709716796875, 17.31591796875, 17.922119140625, 18.5283203125, 19.134521484375, 19.74072265625, 20.346923828125, 20.953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 10.0, 19.0, 14.0, 19.0, 28.0, 34.0, 35.0, 59.0, 77.0, 90.0, 162.0, 206.0, 294.0, 347.0, 418.0, 429.0, 432.0, 333.0, 242.0, 217.0, 148.0, 96.0, 71.0, 73.0, 45.0, 29.0, 18.0, 18.0, 27.0, 12.0, 6.0, 6.0, 5.0, 10.0, 5.0, 5.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.1953125, -8.9205322265625, -8.645751953125, -8.3709716796875, -8.09619140625, -7.8214111328125, -7.546630859375, -7.2718505859375, -6.9970703125, -6.7222900390625, -6.447509765625, -6.1727294921875, -5.89794921875, -5.6231689453125, -5.348388671875, -5.0736083984375, -4.798828125, -4.5240478515625, -4.249267578125, -3.9744873046875, -3.69970703125, -3.4249267578125, -3.150146484375, -2.8753662109375, -2.6005859375, -2.3258056640625, -2.051025390625, -1.7762451171875, -1.50146484375, -1.2266845703125, -0.951904296875, -0.6771240234375, -0.40234375, -0.1275634765625, 0.147216796875, 0.4219970703125, 0.69677734375, 0.9715576171875, 1.246337890625, 1.5211181640625, 1.7958984375, 2.0706787109375, 2.345458984375, 2.6202392578125, 2.89501953125, 3.1697998046875, 3.444580078125, 3.7193603515625, 3.994140625, 4.2689208984375, 4.543701171875, 4.8184814453125, 5.09326171875, 5.3680419921875, 5.642822265625, 5.9176025390625, 6.1923828125, 6.4671630859375, 6.741943359375, 7.0167236328125, 7.29150390625, 7.5662841796875, 7.841064453125, 8.1158447265625, 8.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 7.0, 7.0, 14.0, 13.0, 17.0, 24.0, 30.0, 49.0, 44.0, 56.0, 87.0, 134.0, 145.0, 206.0, 320.0, 445.0, 1053.0, 7499.0, 386471.0, 3716539.0, 75858.0, 3082.0, 717.0, 428.0, 308.0, 188.0, 120.0, 99.0, 83.0, 46.0, 39.0, 32.0, 30.0, 21.0, 16.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.515625, -27.5751953125, -26.634765625, -25.6943359375, -24.75390625, -23.8134765625, -22.873046875, -21.9326171875, -20.9921875, -20.0517578125, -19.111328125, -18.1708984375, -17.23046875, -16.2900390625, -15.349609375, -14.4091796875, -13.46875, -12.5283203125, -11.587890625, -10.6474609375, -9.70703125, -8.7666015625, -7.826171875, -6.8857421875, -5.9453125, -5.0048828125, -4.064453125, -3.1240234375, -2.18359375, -1.2431640625, -0.302734375, 0.6376953125, 1.578125, 2.5185546875, 3.458984375, 4.3994140625, 5.33984375, 6.2802734375, 7.220703125, 8.1611328125, 9.1015625, 10.0419921875, 10.982421875, 11.9228515625, 12.86328125, 13.8037109375, 14.744140625, 15.6845703125, 16.625, 17.5654296875, 18.505859375, 19.4462890625, 20.38671875, 21.3271484375, 22.267578125, 23.2080078125, 24.1484375, 25.0888671875, 26.029296875, 26.9697265625, 27.91015625, 28.8505859375, 29.791015625, 30.7314453125, 31.671875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 37.0, 134.0, 294.0, 358.0, 142.0, 33.0, 8.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.67366027832031, -95.59175109863281, -92.50984191894531, -89.42793273925781, -86.34603118896484, -83.26412200927734, -80.18221282958984, -77.10030364990234, -74.01840209960938, -70.93649291992188, -67.85458374023438, -64.77267456054688, -61.690773010253906, -58.608863830566406, -55.526954650878906, -52.445045471191406, -49.363136291503906, -46.281227111816406, -43.19932174682617, -40.11741256713867, -37.03550720214844, -33.95359802246094, -30.871688842773438, -27.78978157043457, -24.707874298095703, -21.625967025756836, -18.54405975341797, -15.462150573730469, -12.380243301391602, -9.298336029052734, -6.216426849365234, -3.134519577026367, -0.05260467529296875, 3.0293030738830566, 6.111210823059082, 9.193119049072266, 12.275026321411133, 15.35693359375, 18.4388427734375, 21.520750045776367, 24.602657318115234, 27.6845645904541, 30.76647186279297, 33.84838104248047, 36.93029022216797, 40.0121955871582, 43.0941047668457, 46.17601013183594, 49.25791931152344, 52.33982849121094, 55.42173385620117, 58.50364303588867, 61.585548400878906, 64.6674575805664, 67.7493667602539, 70.8312759399414, 73.91317749023438, 76.99508666992188, 80.07699584960938, 83.15890502929688, 86.24080657958984, 89.32271575927734, 92.40462493896484, 95.48653411865234, 98.56844329833984]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 16.0, 19.0, 27.0, 19.0, 22.0, 26.0, 41.0, 32.0, 34.0, 44.0, 43.0, 37.0, 48.0, 30.0, 39.0, 44.0, 49.0, 36.0, 32.0, 43.0, 38.0, 30.0, 21.0, 28.0, 25.0, 24.0, 18.0, 17.0, 9.0, 15.0, 7.0, 10.0, 7.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-36.279273986816406, -35.24752426147461, -34.21577835083008, -33.18402862548828, -32.15228271484375, -31.120532989501953, -30.088783264160156, -29.057035446166992, -28.025287628173828, -26.993539810180664, -25.9617919921875, -24.930042266845703, -23.89829444885254, -22.866546630859375, -21.834796905517578, -20.803049087524414, -19.77130126953125, -18.739553451538086, -17.707805633544922, -16.676055908203125, -15.644308090209961, -14.612560272216797, -13.580811500549316, -12.549062728881836, -11.517314910888672, -10.485567092895508, -9.453818321228027, -8.422069549560547, -7.390321731567383, -6.3585734367370605, -5.326825141906738, -4.295076847076416, -3.2633323669433594, -2.231584072113037, -1.1998357772827148, -0.16808748245239258, 0.8636608123779297, 1.895409107208252, 2.927157402038574, 3.9589056968688965, 4.990653991699219, 6.022402286529541, 7.054150581359863, 8.085899353027344, 9.117647171020508, 10.149394989013672, 11.181143760681152, 12.212892532348633, 13.244640350341797, 14.276388168334961, 15.308136940002441, 16.339885711669922, 17.371633529663086, 18.40338134765625, 19.435131072998047, 20.46687889099121, 21.498626708984375, 22.53037452697754, 23.562122344970703, 24.5938720703125, 25.625619888305664, 26.657367706298828, 27.689117431640625, 28.72086524963379, 29.752613067626953]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 6.0, 3.0, 7.0, 13.0, 13.0, 17.0, 22.0, 32.0, 26.0, 28.0, 29.0, 41.0, 36.0, 31.0, 43.0, 42.0, 41.0, 53.0, 39.0, 31.0, 40.0, 42.0, 32.0, 31.0, 34.0, 37.0, 24.0, 31.0, 25.0, 22.0, 19.0, 17.0, 23.0, 11.0, 7.0, 7.0, 8.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.76171875, -5.57330322265625, -5.3848876953125, -5.19647216796875, -5.008056640625, -4.81964111328125, -4.6312255859375, -4.44281005859375, -4.25439453125, -4.06597900390625, -3.8775634765625, -3.68914794921875, -3.500732421875, -3.31231689453125, -3.1239013671875, -2.93548583984375, -2.7470703125, -2.55865478515625, -2.3702392578125, -2.18182373046875, -1.993408203125, -1.80499267578125, -1.6165771484375, -1.42816162109375, -1.23974609375, -1.05133056640625, -0.8629150390625, -0.67449951171875, -0.486083984375, -0.29766845703125, -0.1092529296875, 0.07916259765625, 0.267578125, 0.45599365234375, 0.6444091796875, 0.83282470703125, 1.021240234375, 1.20965576171875, 1.3980712890625, 1.58648681640625, 1.77490234375, 1.96331787109375, 2.1517333984375, 2.34014892578125, 2.528564453125, 2.71697998046875, 2.9053955078125, 3.09381103515625, 3.2822265625, 3.47064208984375, 3.6590576171875, 3.84747314453125, 4.035888671875, 4.22430419921875, 4.4127197265625, 4.60113525390625, 4.78955078125, 4.97796630859375, 5.1663818359375, 5.35479736328125, 5.543212890625, 5.73162841796875, 5.9200439453125, 6.10845947265625, 6.296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 7.0, 10.0, 14.0, 29.0, 28.0, 46.0, 69.0, 84.0, 114.0, 174.0, 278.0, 382.0, 481.0, 718.0, 1027.0, 1389.0, 1993.0, 2728.0, 3966.0, 5497.0, 7996.0, 11435.0, 16788.0, 24294.0, 35449.0, 51922.0, 77509.0, 117644.0, 177808.0, 168787.0, 110388.0, 72534.0, 48329.0, 33334.0, 23006.0, 15498.0, 10922.0, 7621.0, 5294.0, 3790.0, 2644.0, 1878.0, 1346.0, 958.0, 704.0, 487.0, 334.0, 247.0, 178.0, 136.0, 86.0, 55.0, 41.0, 33.0, 19.0, 14.0, 9.0, 9.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.46923828125, -0.45406341552734375, -0.4388885498046875, -0.42371368408203125, -0.408538818359375, -0.39336395263671875, -0.3781890869140625, -0.36301422119140625, -0.34783935546875, -0.33266448974609375, -0.3174896240234375, -0.30231475830078125, -0.287139892578125, -0.27196502685546875, -0.2567901611328125, -0.24161529541015625, -0.2264404296875, -0.21126556396484375, -0.1960906982421875, -0.18091583251953125, -0.165740966796875, -0.15056610107421875, -0.1353912353515625, -0.12021636962890625, -0.10504150390625, -0.08986663818359375, -0.0746917724609375, -0.05951690673828125, -0.044342041015625, -0.02916717529296875, -0.0139923095703125, 0.00118255615234375, 0.016357421875, 0.03153228759765625, 0.0467071533203125, 0.06188201904296875, 0.077056884765625, 0.09223175048828125, 0.1074066162109375, 0.12258148193359375, 0.13775634765625, 0.15293121337890625, 0.1681060791015625, 0.18328094482421875, 0.198455810546875, 0.21363067626953125, 0.2288055419921875, 0.24398040771484375, 0.2591552734375, 0.27433013916015625, 0.2895050048828125, 0.30467987060546875, 0.319854736328125, 0.33502960205078125, 0.3502044677734375, 0.36537933349609375, 0.38055419921875, 0.39572906494140625, 0.4109039306640625, 0.42607879638671875, 0.441253662109375, 0.45642852783203125, 0.4716033935546875, 0.48677825927734375, 0.501953125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 11.0, 7.0, 13.0, 19.0, 10.0, 17.0, 20.0, 24.0, 26.0, 27.0, 20.0, 30.0, 30.0, 48.0, 37.0, 35.0, 45.0, 28.0, 34.0, 1057.0, 48.0, 30.0, 35.0, 47.0, 37.0, 28.0, 24.0, 32.0, 26.0, 23.0, 25.0, 19.0, 17.0, 18.0, 14.0, 7.0, 15.0, 8.0, 8.0, 4.0, 5.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.190765380859375, -3.07489013671875, -2.959014892578125, -2.8431396484375, -2.727264404296875, -2.61138916015625, -2.495513916015625, -2.379638671875, -2.263763427734375, -2.14788818359375, -2.032012939453125, -1.9161376953125, -1.800262451171875, -1.68438720703125, -1.568511962890625, -1.45263671875, -1.336761474609375, -1.22088623046875, -1.105010986328125, -0.9891357421875, -0.873260498046875, -0.75738525390625, -0.641510009765625, -0.525634765625, -0.409759521484375, -0.29388427734375, -0.178009033203125, -0.0621337890625, 0.053741455078125, 0.16961669921875, 0.285491943359375, 0.4013671875, 0.517242431640625, 0.63311767578125, 0.748992919921875, 0.8648681640625, 0.980743408203125, 1.09661865234375, 1.212493896484375, 1.328369140625, 1.444244384765625, 1.56011962890625, 1.675994873046875, 1.7918701171875, 1.907745361328125, 2.02362060546875, 2.139495849609375, 2.25537109375, 2.371246337890625, 2.48712158203125, 2.602996826171875, 2.7188720703125, 2.834747314453125, 2.95062255859375, 3.066497802734375, 3.182373046875, 3.298248291015625, 3.41412353515625, 3.529998779296875, 3.6458740234375, 3.761749267578125, 3.87762451171875, 3.993499755859375, 4.109375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 4.0, 12.0, 14.0, 27.0, 22.0, 35.0, 65.0, 86.0, 132.0, 170.0, 263.0, 412.0, 603.0, 814.0, 1147.0, 1689.0, 2469.0, 3656.0, 5445.0, 7859.0, 11907.0, 18056.0, 28063.0, 44687.0, 72402.0, 118616.0, 296978.0, 1139290.0, 128325.0, 77436.0, 47837.0, 30112.0, 19449.0, 12595.0, 8428.0, 5654.0, 3819.0, 2605.0, 1878.0, 1236.0, 894.0, 621.0, 373.0, 317.0, 202.0, 138.0, 102.0, 72.0, 44.0, 33.0, 21.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50048828125, -0.48384857177734375, -0.4672088623046875, -0.45056915283203125, -0.433929443359375, -0.41728973388671875, -0.4006500244140625, -0.38401031494140625, -0.36737060546875, -0.35073089599609375, -0.3340911865234375, -0.31745147705078125, -0.300811767578125, -0.28417205810546875, -0.2675323486328125, -0.25089263916015625, -0.2342529296875, -0.21761322021484375, -0.2009735107421875, -0.18433380126953125, -0.167694091796875, -0.15105438232421875, -0.1344146728515625, -0.11777496337890625, -0.10113525390625, -0.08449554443359375, -0.0678558349609375, -0.05121612548828125, -0.034576416015625, -0.01793670654296875, -0.0012969970703125, 0.01534271240234375, 0.031982421875, 0.04862213134765625, 0.0652618408203125, 0.08190155029296875, 0.098541259765625, 0.11518096923828125, 0.1318206787109375, 0.14846038818359375, 0.16510009765625, 0.18173980712890625, 0.1983795166015625, 0.21501922607421875, 0.231658935546875, 0.24829864501953125, 0.2649383544921875, 0.28157806396484375, 0.2982177734375, 0.31485748291015625, 0.3314971923828125, 0.34813690185546875, 0.364776611328125, 0.38141632080078125, 0.3980560302734375, 0.41469573974609375, 0.43133544921875, 0.44797515869140625, 0.4646148681640625, 0.48125457763671875, 0.497894287109375, 0.5145339965820312, 0.5311737060546875, 0.5478134155273438, 0.564453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 9.0, 11.0, 6.0, 11.0, 19.0, 18.0, 20.0, 24.0, 34.0, 28.0, 48.0, 63.0, 85.0, 109.0, 96.0, 71.0, 72.0, 39.0, 31.0, 27.0, 19.0, 28.0, 18.0, 18.0, 9.0, 12.0, 17.0, 13.0, 6.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006649017333984375, -0.006403863430023193, -0.006158709526062012, -0.00591355562210083, -0.0056684017181396484, -0.005423247814178467, -0.005178093910217285, -0.0049329400062561035, -0.004687786102294922, -0.00444263219833374, -0.004197478294372559, -0.003952324390411377, -0.0037071704864501953, -0.0034620165824890137, -0.003216862678527832, -0.0029717087745666504, -0.0027265548706054688, -0.002481400966644287, -0.0022362470626831055, -0.001991093158721924, -0.0017459392547607422, -0.0015007853507995605, -0.001255631446838379, -0.0010104775428771973, -0.0007653236389160156, -0.000520169734954834, -0.00027501583099365234, -2.9861927032470703e-05, 0.00021529197692871094, 0.0004604458808898926, 0.0007055997848510742, 0.0009507536888122559, 0.0011959075927734375, 0.0014410614967346191, 0.0016862154006958008, 0.0019313693046569824, 0.002176523208618164, 0.0024216771125793457, 0.0026668310165405273, 0.002911984920501709, 0.0031571388244628906, 0.0034022927284240723, 0.003647446632385254, 0.0038926005363464355, 0.004137754440307617, 0.004382908344268799, 0.0046280622482299805, 0.004873216152191162, 0.005118370056152344, 0.005363523960113525, 0.005608677864074707, 0.005853831768035889, 0.00609898567199707, 0.006344139575958252, 0.006589293479919434, 0.006834447383880615, 0.007079601287841797, 0.0073247551918029785, 0.00756990909576416, 0.007815062999725342, 0.008060216903686523, 0.008305370807647705, 0.008550524711608887, 0.008795678615570068, 0.00904083251953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 5.0, 6.0, 8.0, 9.0, 25.0, 25.0, 19.0, 28.0, 33.0, 46.0, 53.0, 75.0, 102.0, 172.0, 351.0, 733.0, 10915.0, 1033233.0, 1439.0, 514.0, 237.0, 147.0, 85.0, 70.0, 40.0, 35.0, 33.0, 20.0, 19.0, 15.0, 10.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.192138671875, -0.186981201171875, -0.18182373046875, -0.176666259765625, -0.1715087890625, -0.166351318359375, -0.16119384765625, -0.156036376953125, -0.15087890625, -0.145721435546875, -0.14056396484375, -0.135406494140625, -0.1302490234375, -0.125091552734375, -0.11993408203125, -0.114776611328125, -0.109619140625, -0.104461669921875, -0.09930419921875, -0.094146728515625, -0.0889892578125, -0.083831787109375, -0.07867431640625, -0.073516845703125, -0.068359375, -0.063201904296875, -0.05804443359375, -0.052886962890625, -0.0477294921875, -0.042572021484375, -0.03741455078125, -0.032257080078125, -0.027099609375, -0.021942138671875, -0.01678466796875, -0.011627197265625, -0.0064697265625, -0.001312255859375, 0.00384521484375, 0.009002685546875, 0.01416015625, 0.019317626953125, 0.02447509765625, 0.029632568359375, 0.0347900390625, 0.039947509765625, 0.04510498046875, 0.050262451171875, 0.055419921875, 0.060577392578125, 0.06573486328125, 0.070892333984375, 0.0760498046875, 0.081207275390625, 0.08636474609375, 0.091522216796875, 0.0966796875, 0.101837158203125, 0.10699462890625, 0.112152099609375, 0.1173095703125, 0.122467041015625, 0.12762451171875, 0.132781982421875, 0.137939453125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 99.0, 882.0, 31.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040068477392196655, -0.03925670310854912, -0.03844492882490158, -0.037633154541254044, -0.036821380257606506, -0.03600960597395897, -0.03519783169031143, -0.034386057406663895, -0.03357428312301636, -0.03276250883936882, -0.03195073455572128, -0.031138960272073746, -0.03032718598842621, -0.02951541170477867, -0.028703637421131134, -0.027891863137483597, -0.02708008699119091, -0.026268312707543373, -0.025456538423895836, -0.0246447641402483, -0.02383298985660076, -0.023021215572953224, -0.022209439426660538, -0.021397665143013, -0.020585890859365463, -0.019774116575717926, -0.01896234229207039, -0.01815056800842285, -0.017338793724775314, -0.016527019441127777, -0.01571524515748024, -0.014903469942510128, -0.014091694727540016, -0.013279920443892479, -0.012468146160244942, -0.011656371876597404, -0.010844597592949867, -0.01003282330930233, -0.009221048094332218, -0.008409273810684681, -0.007597499527037144, -0.0067857252433896065, -0.005973950959742069, -0.005162176210433245, -0.0043504019267857075, -0.0035386276431381702, -0.0027268528938293457, -0.0019150786101818085, -0.0011033043265342712, -0.0002915299264714122, 0.0005202444735914469, 0.0013320189900696278, 0.002143793273717165, 0.0029555675573647022, 0.0037673423066735268, 0.004579116590321064, 0.005390890873968601, 0.0062026651576161385, 0.007014439441263676, 0.007826214656233788, 0.008637988939881325, 0.009449763223528862, 0.0102615375071764, 0.011073311790823936, 0.011885086074471474]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 7.0, 2.0, 15.0, 16.0, 10.0, 20.0, 14.0, 17.0, 28.0, 23.0, 22.0, 32.0, 26.0, 40.0, 31.0, 36.0, 44.0, 35.0, 44.0, 42.0, 52.0, 46.0, 56.0, 46.0, 37.0, 39.0, 19.0, 34.0, 27.0, 29.0, 24.0, 17.0, 17.0, 9.0, 8.0, 8.0, 14.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.004099180921912193, -0.003971677273511887, -0.00384417362511158, -0.003716669976711273, -0.0035891663283109665, -0.00346166267991066, -0.003334159031510353, -0.0032066553831100464, -0.0030791517347097397, -0.002951648086309433, -0.0028241444379091263, -0.0026966407895088196, -0.002569137141108513, -0.002441633492708206, -0.0023141298443078995, -0.0021866261959075928, -0.002059122547507286, -0.0019316188991069794, -0.0018041152507066727, -0.001676611602306366, -0.0015491079539060593, -0.0014216043055057526, -0.0012941006571054459, -0.0011665970087051392, -0.0010390933603048325, -0.0009115897119045258, -0.0007840860635042191, -0.0006565824151039124, -0.0005290787667036057, -0.00040157511830329895, -0.00027407146990299225, -0.00014656782150268555, -1.9064173102378845e-05, 0.00010843947529792786, 0.00023594312369823456, 0.00036344677209854126, 0.000490950420498848, 0.0006184540688991547, 0.0007459577172994614, 0.0008734613656997681, 0.0010009650141000748, 0.0011284686625003815, 0.0012559723109006882, 0.0013834759593009949, 0.0015109796077013016, 0.0016384832561016083, 0.001765986904501915, 0.0018934905529022217, 0.0020209942013025284, 0.002148497849702835, 0.002276001498103142, 0.0024035051465034485, 0.002531008794903755, 0.002658512443304062, 0.0027860160917043686, 0.0029135197401046753, 0.003041023388504982, 0.0031685270369052887, 0.0032960306853055954, 0.003423534333705902, 0.003551037982106209, 0.0036785416305065155, 0.003806045278906822, 0.003933548927307129]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 6.0, 3.0, 7.0, 13.0, 13.0, 17.0, 22.0, 32.0, 26.0, 28.0, 29.0, 41.0, 36.0, 31.0, 43.0, 42.0, 41.0, 53.0, 39.0, 31.0, 40.0, 42.0, 32.0, 31.0, 34.0, 37.0, 24.0, 31.0, 25.0, 22.0, 19.0, 17.0, 23.0, 11.0, 7.0, 7.0, 8.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.76171875, -5.57330322265625, -5.3848876953125, -5.19647216796875, -5.008056640625, -4.81964111328125, -4.6312255859375, -4.44281005859375, -4.25439453125, -4.06597900390625, -3.8775634765625, -3.68914794921875, -3.500732421875, -3.31231689453125, -3.1239013671875, -2.93548583984375, -2.7470703125, -2.55865478515625, -2.3702392578125, -2.18182373046875, -1.993408203125, -1.80499267578125, -1.6165771484375, -1.42816162109375, -1.23974609375, -1.05133056640625, -0.8629150390625, -0.67449951171875, -0.486083984375, -0.29766845703125, -0.1092529296875, 0.07916259765625, 0.267578125, 0.45599365234375, 0.6444091796875, 0.83282470703125, 1.021240234375, 1.20965576171875, 1.3980712890625, 1.58648681640625, 1.77490234375, 1.96331787109375, 2.1517333984375, 2.34014892578125, 2.528564453125, 2.71697998046875, 2.9053955078125, 3.09381103515625, 3.2822265625, 3.47064208984375, 3.6590576171875, 3.84747314453125, 4.035888671875, 4.22430419921875, 4.4127197265625, 4.60113525390625, 4.78955078125, 4.97796630859375, 5.1663818359375, 5.35479736328125, 5.543212890625, 5.73162841796875, 5.9200439453125, 6.10845947265625, 6.296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 6.0, 7.0, 7.0, 9.0, 14.0, 16.0, 29.0, 42.0, 28.0, 75.0, 72.0, 116.0, 124.0, 193.0, 295.0, 453.0, 955.0, 3584.0, 18884.0, 119465.0, 655834.0, 210432.0, 29501.0, 5514.0, 1243.0, 529.0, 283.0, 230.0, 152.0, 104.0, 91.0, 56.0, 51.0, 43.0, 28.0, 23.0, 16.0, 15.0, 5.0, 14.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.671875, -10.323486328125, -9.97509765625, -9.626708984375, -9.2783203125, -8.929931640625, -8.58154296875, -8.233154296875, -7.884765625, -7.536376953125, -7.18798828125, -6.839599609375, -6.4912109375, -6.142822265625, -5.79443359375, -5.446044921875, -5.09765625, -4.749267578125, -4.40087890625, -4.052490234375, -3.7041015625, -3.355712890625, -3.00732421875, -2.658935546875, -2.310546875, -1.962158203125, -1.61376953125, -1.265380859375, -0.9169921875, -0.568603515625, -0.22021484375, 0.128173828125, 0.4765625, 0.824951171875, 1.17333984375, 1.521728515625, 1.8701171875, 2.218505859375, 2.56689453125, 2.915283203125, 3.263671875, 3.612060546875, 3.96044921875, 4.308837890625, 4.6572265625, 5.005615234375, 5.35400390625, 5.702392578125, 6.05078125, 6.399169921875, 6.74755859375, 7.095947265625, 7.4443359375, 7.792724609375, 8.14111328125, 8.489501953125, 8.837890625, 9.186279296875, 9.53466796875, 9.883056640625, 10.2314453125, 10.579833984375, 10.92822265625, 11.276611328125, 11.625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 6.0, 7.0, 9.0, 16.0, 7.0, 19.0, 15.0, 20.0, 33.0, 31.0, 23.0, 23.0, 33.0, 43.0, 46.0, 46.0, 90.0, 146.0, 391.0, 1379.0, 154.0, 74.0, 68.0, 27.0, 41.0, 25.0, 39.0, 32.0, 27.0, 31.0, 16.0, 26.0, 23.0, 15.0, 12.0, 6.0, 5.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.609375, -18.028076171875, -17.44677734375, -16.865478515625, -16.2841796875, -15.702880859375, -15.12158203125, -14.540283203125, -13.958984375, -13.377685546875, -12.79638671875, -12.215087890625, -11.6337890625, -11.052490234375, -10.47119140625, -9.889892578125, -9.30859375, -8.727294921875, -8.14599609375, -7.564697265625, -6.9833984375, -6.402099609375, -5.82080078125, -5.239501953125, -4.658203125, -4.076904296875, -3.49560546875, -2.914306640625, -2.3330078125, -1.751708984375, -1.17041015625, -0.589111328125, -0.0078125, 0.573486328125, 1.15478515625, 1.736083984375, 2.3173828125, 2.898681640625, 3.47998046875, 4.061279296875, 4.642578125, 5.223876953125, 5.80517578125, 6.386474609375, 6.9677734375, 7.549072265625, 8.13037109375, 8.711669921875, 9.29296875, 9.874267578125, 10.45556640625, 11.036865234375, 11.6181640625, 12.199462890625, 12.78076171875, 13.362060546875, 13.943359375, 14.524658203125, 15.10595703125, 15.687255859375, 16.2685546875, 16.849853515625, 17.43115234375, 18.012451171875, 18.59375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 9.0, 3.0, 5.0, 3.0, 13.0, 8.0, 22.0, 29.0, 40.0, 43.0, 33.0, 77.0, 104.0, 100.0, 190.0, 373.0, 797.0, 3864.0, 2482733.0, 652752.0, 2771.0, 715.0, 328.0, 207.0, 101.0, 81.0, 66.0, 58.0, 35.0, 32.0, 21.0, 22.0, 14.0, 9.0, 11.0, 9.0, 5.0, 8.0, 2.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.71875, -44.138671875, -42.55859375, -40.978515625, -39.3984375, -37.818359375, -36.23828125, -34.658203125, -33.078125, -31.498046875, -29.91796875, -28.337890625, -26.7578125, -25.177734375, -23.59765625, -22.017578125, -20.4375, -18.857421875, -17.27734375, -15.697265625, -14.1171875, -12.537109375, -10.95703125, -9.376953125, -7.796875, -6.216796875, -4.63671875, -3.056640625, -1.4765625, 0.103515625, 1.68359375, 3.263671875, 4.84375, 6.423828125, 8.00390625, 9.583984375, 11.1640625, 12.744140625, 14.32421875, 15.904296875, 17.484375, 19.064453125, 20.64453125, 22.224609375, 23.8046875, 25.384765625, 26.96484375, 28.544921875, 30.125, 31.705078125, 33.28515625, 34.865234375, 36.4453125, 38.025390625, 39.60546875, 41.185546875, 42.765625, 44.345703125, 45.92578125, 47.505859375, 49.0859375, 50.666015625, 52.24609375, 53.826171875, 55.40625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 929.0, 73.0], "bins": [-524.0326538085938, -515.6627197265625, -507.292724609375, -498.92279052734375, -490.5528259277344, -482.182861328125, -473.8128967285156, -465.44293212890625, -457.072998046875, -448.7030334472656, -440.33306884765625, -431.963134765625, -423.5931701660156, -415.22320556640625, -406.8532409667969, -398.4832763671875, -390.11334228515625, -381.7433776855469, -373.3734130859375, -365.00347900390625, -356.6335144042969, -348.2635498046875, -339.8935852050781, -331.52362060546875, -323.1536560058594, -314.78369140625, -306.4137268066406, -298.0437927246094, -289.673828125, -281.3038635253906, -272.93389892578125, -264.56396484375, -256.19403076171875, -247.82406616210938, -239.45411682128906, -231.0841522216797, -222.71420288085938, -214.34423828125, -205.97427368164062, -197.6043243408203, -189.23435974121094, -180.86439514160156, -172.49444580078125, -164.12448120117188, -155.75453186035156, -147.3845672607422, -139.01461791992188, -130.6446533203125, -122.27470397949219, -113.90474700927734, -105.5347900390625, -97.16482543945312, -88.79487609863281, -80.42491149902344, -72.0549545288086, -63.68499755859375, -55.315040588378906, -46.94508361816406, -38.57512664794922, -30.20516586303711, -21.835208892822266, -13.465251922607422, -5.0952911376953125, 3.2746658325195312, 11.644623756408691]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 5.0, 14.0, 14.0, 24.0, 25.0, 16.0, 24.0, 32.0, 22.0, 38.0, 39.0, 26.0, 40.0, 31.0, 35.0, 34.0, 38.0, 28.0, 37.0, 37.0, 40.0, 45.0, 33.0, 28.0, 27.0, 21.0, 28.0, 24.0, 22.0, 27.0, 18.0, 24.0, 13.0, 12.0, 13.0, 10.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-46.82723617553711, -45.36745834350586, -43.907684326171875, -42.447906494140625, -40.98813247680664, -39.52835464477539, -38.068580627441406, -36.608802795410156, -35.149024963378906, -33.689247131347656, -32.22947311401367, -30.769695281982422, -29.309921264648438, -27.850143432617188, -26.39036750793457, -24.930591583251953, -23.47081756591797, -22.01104164123535, -20.551265716552734, -19.091487884521484, -17.6317138671875, -16.17193603515625, -14.712160110473633, -13.252384185791016, -11.792608261108398, -10.332832336425781, -8.873056411743164, -7.4132795333862305, -5.953503608703613, -4.493727684020996, -3.0339508056640625, -1.5741748809814453, -0.1143951416015625, 1.3453810214996338, 2.80515718460083, 4.2649335861206055, 5.724709510803223, 7.18448543548584, 8.644262313842773, 10.10403823852539, 11.563814163208008, 13.023590087890625, 14.483366012573242, 15.943142890930176, 17.40291976928711, 18.862693786621094, 20.322471618652344, 21.78224754333496, 23.242023468017578, 24.701799392700195, 26.161575317382812, 27.621353149414062, 29.081127166748047, 30.540904998779297, 32.00067901611328, 33.46045684814453, 34.92023468017578, 36.38001251220703, 37.839786529541016, 39.299564361572266, 40.75933837890625, 42.2191162109375, 43.67889404296875, 45.138668060302734, 46.59844207763672]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 8.0, 6.0, 5.0, 15.0, 17.0, 11.0, 19.0, 29.0, 25.0, 35.0, 36.0, 32.0, 37.0, 52.0, 39.0, 46.0, 43.0, 59.0, 35.0, 41.0, 52.0, 42.0, 35.0, 30.0, 30.0, 30.0, 27.0, 27.0, 28.0, 13.0, 19.0, 21.0, 12.0, 5.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.07550048828125, -5.8502197265625, -5.62493896484375, -5.399658203125, -5.17437744140625, -4.9490966796875, -4.72381591796875, -4.49853515625, -4.27325439453125, -4.0479736328125, -3.82269287109375, -3.597412109375, -3.37213134765625, -3.1468505859375, -2.92156982421875, -2.6962890625, -2.47100830078125, -2.2457275390625, -2.02044677734375, -1.795166015625, -1.56988525390625, -1.3446044921875, -1.11932373046875, -0.89404296875, -0.66876220703125, -0.4434814453125, -0.21820068359375, 0.007080078125, 0.23236083984375, 0.4576416015625, 0.68292236328125, 0.908203125, 1.13348388671875, 1.3587646484375, 1.58404541015625, 1.809326171875, 2.03460693359375, 2.2598876953125, 2.48516845703125, 2.71044921875, 2.93572998046875, 3.1610107421875, 3.38629150390625, 3.611572265625, 3.83685302734375, 4.0621337890625, 4.28741455078125, 4.5126953125, 4.73797607421875, 4.9632568359375, 5.18853759765625, 5.413818359375, 5.63909912109375, 5.8643798828125, 6.08966064453125, 6.31494140625, 6.54022216796875, 6.7655029296875, 6.99078369140625, 7.216064453125, 7.44134521484375, 7.6666259765625, 7.89190673828125, 8.1171875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 10.0, 15.0, 12.0, 24.0, 20.0, 23.0, 41.0, 54.0, 64.0, 85.0, 121.0, 249.0, 592.0, 3272.0, 78878.0, 2000663.0, 2032921.0, 72621.0, 3229.0, 620.0, 239.0, 117.0, 81.0, 54.0, 42.0, 45.0, 27.0, 37.0, 18.0, 14.0, 14.0, 12.0, 6.0, 9.0, 10.0, 5.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.0499267578125, -13.529541015625, -13.0091552734375, -12.48876953125, -11.9683837890625, -11.447998046875, -10.9276123046875, -10.4072265625, -9.8868408203125, -9.366455078125, -8.8460693359375, -8.32568359375, -7.8052978515625, -7.284912109375, -6.7645263671875, -6.244140625, -5.7237548828125, -5.203369140625, -4.6829833984375, -4.16259765625, -3.6422119140625, -3.121826171875, -2.6014404296875, -2.0810546875, -1.5606689453125, -1.040283203125, -0.5198974609375, 0.00048828125, 0.5208740234375, 1.041259765625, 1.5616455078125, 2.08203125, 2.6024169921875, 3.122802734375, 3.6431884765625, 4.16357421875, 4.6839599609375, 5.204345703125, 5.7247314453125, 6.2451171875, 6.7655029296875, 7.285888671875, 7.8062744140625, 8.32666015625, 8.8470458984375, 9.367431640625, 9.8878173828125, 10.408203125, 10.9285888671875, 11.448974609375, 11.9693603515625, 12.48974609375, 13.0101318359375, 13.530517578125, 14.0509033203125, 14.5712890625, 15.0916748046875, 15.612060546875, 16.1324462890625, 16.65283203125, 17.1732177734375, 17.693603515625, 18.2139892578125, 18.734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 8.0, 7.0, 7.0, 3.0, 19.0, 13.0, 33.0, 32.0, 40.0, 55.0, 68.0, 80.0, 109.0, 162.0, 192.0, 272.0, 364.0, 399.0, 421.0, 412.0, 331.0, 256.0, 193.0, 145.0, 107.0, 81.0, 68.0, 44.0, 30.0, 25.0, 13.0, 14.0, 12.0, 9.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0], "bins": [-9.8203125, -9.55902099609375, -9.2977294921875, -9.03643798828125, -8.775146484375, -8.51385498046875, -8.2525634765625, -7.99127197265625, -7.72998046875, -7.46868896484375, -7.2073974609375, -6.94610595703125, -6.684814453125, -6.42352294921875, -6.1622314453125, -5.90093994140625, -5.6396484375, -5.37835693359375, -5.1170654296875, -4.85577392578125, -4.594482421875, -4.33319091796875, -4.0718994140625, -3.81060791015625, -3.54931640625, -3.28802490234375, -3.0267333984375, -2.76544189453125, -2.504150390625, -2.24285888671875, -1.9815673828125, -1.72027587890625, -1.458984375, -1.19769287109375, -0.9364013671875, -0.67510986328125, -0.413818359375, -0.15252685546875, 0.1087646484375, 0.37005615234375, 0.63134765625, 0.89263916015625, 1.1539306640625, 1.41522216796875, 1.676513671875, 1.93780517578125, 2.1990966796875, 2.46038818359375, 2.7216796875, 2.98297119140625, 3.2442626953125, 3.50555419921875, 3.766845703125, 4.02813720703125, 4.2894287109375, 4.55072021484375, 4.81201171875, 5.07330322265625, 5.3345947265625, 5.59588623046875, 5.857177734375, 6.11846923828125, 6.3797607421875, 6.64105224609375, 6.90234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 10.0, 17.0, 28.0, 29.0, 39.0, 52.0, 57.0, 69.0, 106.0, 151.0, 222.0, 286.0, 479.0, 1042.0, 3425.0, 29524.0, 974786.0, 3080754.0, 93114.0, 6579.0, 1511.0, 662.0, 358.0, 247.0, 181.0, 123.0, 93.0, 92.0, 59.0, 40.0, 26.0, 17.0, 22.0, 10.0, 8.0, 10.0, 11.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.859375, -20.16845703125, -19.4775390625, -18.78662109375, -18.095703125, -17.40478515625, -16.7138671875, -16.02294921875, -15.33203125, -14.64111328125, -13.9501953125, -13.25927734375, -12.568359375, -11.87744140625, -11.1865234375, -10.49560546875, -9.8046875, -9.11376953125, -8.4228515625, -7.73193359375, -7.041015625, -6.35009765625, -5.6591796875, -4.96826171875, -4.27734375, -3.58642578125, -2.8955078125, -2.20458984375, -1.513671875, -0.82275390625, -0.1318359375, 0.55908203125, 1.25, 1.94091796875, 2.6318359375, 3.32275390625, 4.013671875, 4.70458984375, 5.3955078125, 6.08642578125, 6.77734375, 7.46826171875, 8.1591796875, 8.85009765625, 9.541015625, 10.23193359375, 10.9228515625, 11.61376953125, 12.3046875, 12.99560546875, 13.6865234375, 14.37744140625, 15.068359375, 15.75927734375, 16.4501953125, 17.14111328125, 17.83203125, 18.52294921875, 19.2138671875, 19.90478515625, 20.595703125, 21.28662109375, 21.9775390625, 22.66845703125, 23.359375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 30.0, 79.0, 147.0, 221.0, 223.0, 194.0, 68.0, 26.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.190202713012695, -24.065330505371094, -21.940460205078125, -19.815587997436523, -17.690715789794922, -15.565845489501953, -13.440973281860352, -11.316102027893066, -9.191230773925781, -7.066359519958496, -4.941487789154053, -2.8166160583496094, -0.6917448043823242, 1.433126449584961, 3.5579986572265625, 5.682869911193848, 7.807741165161133, 9.932612419128418, 12.057483673095703, 14.182355880737305, 16.307228088378906, 18.432098388671875, 20.556970596313477, 22.681842803955078, 24.806713104248047, 26.93158531188965, 29.056455612182617, 31.18132781982422, 33.30619812011719, 35.431068420410156, 37.55594253540039, 39.68081283569336, 41.805686950683594, 43.93055725097656, 46.0554313659668, 48.180301666259766, 50.305171966552734, 52.43004608154297, 54.55491638183594, 56.679786682128906, 58.804656982421875, 60.929527282714844, 63.05440139770508, 65.17927551269531, 67.30414581298828, 69.42901611328125, 71.55388641357422, 73.67875671386719, 75.80363464355469, 77.92850494384766, 80.05337524414062, 82.17825317382812, 84.3031234741211, 86.42799377441406, 88.55286407470703, 90.677734375, 92.80260467529297, 94.92747497558594, 97.0523452758789, 99.17721557617188, 101.30209350585938, 103.42696380615234, 105.55183410644531, 107.67670440673828, 109.80157470703125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 11.0, 5.0, 11.0, 7.0, 9.0, 14.0, 19.0, 19.0, 24.0, 14.0, 22.0, 27.0, 33.0, 23.0, 17.0, 41.0, 29.0, 39.0, 29.0, 35.0, 27.0, 46.0, 41.0, 28.0, 37.0, 37.0, 37.0, 48.0, 21.0, 22.0, 22.0, 31.0, 25.0, 28.0, 18.0, 14.0, 14.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 8.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.276453018188477, -27.345558166503906, -26.41466522216797, -25.4837703704834, -24.55287742614746, -23.62198257446289, -22.691089630126953, -21.760194778442383, -20.829299926757812, -19.898405075073242, -18.967512130737305, -18.036617279052734, -17.105724334716797, -16.174829483032227, -15.243935585021973, -14.313041687011719, -13.382148742675781, -12.451254844665527, -11.520360946655273, -10.589466094970703, -9.658573150634766, -8.727678298950195, -7.796784400939941, -6.8658905029296875, -5.934996604919434, -5.00410270690918, -4.073208808898926, -3.1423144340515137, -2.2114205360412598, -1.2805266380310059, -0.34963226318359375, 0.5812616348266602, 1.5121536254882812, 2.443047523498535, 3.373941659927368, 4.304835796356201, 5.235729694366455, 6.166623592376709, 7.097517967224121, 8.028411865234375, 8.959305763244629, 9.890199661254883, 10.821093559265137, 11.75198745727539, 12.682882308959961, 13.613775253295898, 14.544670104980469, 15.475564002990723, 16.406457901000977, 17.337352752685547, 18.268245697021484, 19.199140548706055, 20.130033493041992, 21.060928344726562, 21.9918212890625, 22.92271614074707, 23.85361099243164, 24.78450584411621, 25.71539878845215, 26.64629364013672, 27.577186584472656, 28.508081436157227, 29.438976287841797, 30.369869232177734, 31.300762176513672]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 8.0, 3.0, 4.0, 9.0, 9.0, 13.0, 6.0, 10.0, 27.0, 28.0, 30.0, 18.0, 26.0, 38.0, 46.0, 46.0, 41.0, 46.0, 30.0, 32.0, 47.0, 49.0, 42.0, 40.0, 41.0, 28.0, 43.0, 29.0, 29.0, 30.0, 21.0, 22.0, 17.0, 19.0, 15.0, 9.0, 10.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.4921875, -6.2860107421875, -6.079833984375, -5.8736572265625, -5.66748046875, -5.4613037109375, -5.255126953125, -5.0489501953125, -4.8427734375, -4.6365966796875, -4.430419921875, -4.2242431640625, -4.01806640625, -3.8118896484375, -3.605712890625, -3.3995361328125, -3.193359375, -2.9871826171875, -2.781005859375, -2.5748291015625, -2.36865234375, -2.1624755859375, -1.956298828125, -1.7501220703125, -1.5439453125, -1.3377685546875, -1.131591796875, -0.9254150390625, -0.71923828125, -0.5130615234375, -0.306884765625, -0.1007080078125, 0.10546875, 0.3116455078125, 0.517822265625, 0.7239990234375, 0.93017578125, 1.1363525390625, 1.342529296875, 1.5487060546875, 1.7548828125, 1.9610595703125, 2.167236328125, 2.3734130859375, 2.57958984375, 2.7857666015625, 2.991943359375, 3.1981201171875, 3.404296875, 3.6104736328125, 3.816650390625, 4.0228271484375, 4.22900390625, 4.4351806640625, 4.641357421875, 4.8475341796875, 5.0537109375, 5.2598876953125, 5.466064453125, 5.6722412109375, 5.87841796875, 6.0845947265625, 6.290771484375, 6.4969482421875, 6.703125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 16.0, 24.0, 28.0, 64.0, 45.0, 109.0, 136.0, 173.0, 291.0, 401.0, 636.0, 874.0, 1212.0, 1792.0, 2589.0, 3831.0, 5483.0, 8079.0, 11850.0, 17303.0, 25673.0, 38609.0, 59976.0, 93129.0, 147288.0, 202051.0, 149608.0, 95231.0, 60579.0, 39409.0, 26269.0, 17932.0, 11992.0, 8123.0, 5482.0, 3760.0, 2620.0, 1802.0, 1296.0, 868.0, 560.0, 406.0, 278.0, 201.0, 155.0, 116.0, 65.0, 41.0, 24.0, 23.0, 17.0, 14.0, 13.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.56005859375, -0.5422897338867188, -0.5245208740234375, -0.5067520141601562, -0.488983154296875, -0.47121429443359375, -0.4534454345703125, -0.43567657470703125, -0.41790771484375, -0.40013885498046875, -0.3823699951171875, -0.36460113525390625, -0.346832275390625, -0.32906341552734375, -0.3112945556640625, -0.29352569580078125, -0.2757568359375, -0.25798797607421875, -0.2402191162109375, -0.22245025634765625, -0.204681396484375, -0.18691253662109375, -0.1691436767578125, -0.15137481689453125, -0.13360595703125, -0.11583709716796875, -0.0980682373046875, -0.08029937744140625, -0.062530517578125, -0.04476165771484375, -0.0269927978515625, -0.00922393798828125, 0.008544921875, 0.02631378173828125, 0.0440826416015625, 0.06185150146484375, 0.079620361328125, 0.09738922119140625, 0.1151580810546875, 0.13292694091796875, 0.15069580078125, 0.16846466064453125, 0.1862335205078125, 0.20400238037109375, 0.221771240234375, 0.23954010009765625, 0.2573089599609375, 0.27507781982421875, 0.2928466796875, 0.31061553955078125, 0.3283843994140625, 0.34615325927734375, 0.363922119140625, 0.38169097900390625, 0.3994598388671875, 0.41722869873046875, 0.43499755859375, 0.45276641845703125, 0.4705352783203125, 0.48830413818359375, 0.506072998046875, 0.5238418579101562, 0.5416107177734375, 0.5593795776367188, 0.5771484375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 11.0, 10.0, 14.0, 12.0, 22.0, 26.0, 24.0, 31.0, 16.0, 16.0, 37.0, 30.0, 37.0, 34.0, 40.0, 32.0, 43.0, 29.0, 1064.0, 37.0, 48.0, 30.0, 30.0, 31.0, 28.0, 37.0, 25.0, 30.0, 24.0, 21.0, 21.0, 26.0, 17.0, 12.0, 18.0, 9.0, 6.0, 12.0, 2.0, 0.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.19921875, -4.076904296875, -3.95458984375, -3.832275390625, -3.7099609375, -3.587646484375, -3.46533203125, -3.343017578125, -3.220703125, -3.098388671875, -2.97607421875, -2.853759765625, -2.7314453125, -2.609130859375, -2.48681640625, -2.364501953125, -2.2421875, -2.119873046875, -1.99755859375, -1.875244140625, -1.7529296875, -1.630615234375, -1.50830078125, -1.385986328125, -1.263671875, -1.141357421875, -1.01904296875, -0.896728515625, -0.7744140625, -0.652099609375, -0.52978515625, -0.407470703125, -0.28515625, -0.162841796875, -0.04052734375, 0.081787109375, 0.2041015625, 0.326416015625, 0.44873046875, 0.571044921875, 0.693359375, 0.815673828125, 0.93798828125, 1.060302734375, 1.1826171875, 1.304931640625, 1.42724609375, 1.549560546875, 1.671875, 1.794189453125, 1.91650390625, 2.038818359375, 2.1611328125, 2.283447265625, 2.40576171875, 2.528076171875, 2.650390625, 2.772705078125, 2.89501953125, 3.017333984375, 3.1396484375, 3.261962890625, 3.38427734375, 3.506591796875, 3.62890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 11.0, 26.0, 30.0, 46.0, 50.0, 87.0, 111.0, 165.0, 221.0, 329.0, 515.0, 718.0, 1009.0, 1500.0, 2281.0, 3442.0, 5042.0, 7677.0, 12008.0, 18822.0, 29643.0, 48119.0, 80311.0, 133958.0, 1239538.0, 210530.0, 115876.0, 69319.0, 42015.0, 26100.0, 16472.0, 10427.0, 6896.0, 4524.0, 3051.0, 1962.0, 1403.0, 876.0, 634.0, 409.0, 292.0, 193.0, 143.0, 109.0, 68.0, 42.0, 32.0, 28.0, 18.0, 14.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.6044921875, -0.5855178833007812, -0.5665435791015625, -0.5475692749023438, -0.528594970703125, -0.5096206665039062, -0.4906463623046875, -0.47167205810546875, -0.45269775390625, -0.43372344970703125, -0.4147491455078125, -0.39577484130859375, -0.376800537109375, -0.35782623291015625, -0.3388519287109375, -0.31987762451171875, -0.3009033203125, -0.28192901611328125, -0.2629547119140625, -0.24398040771484375, -0.225006103515625, -0.20603179931640625, -0.1870574951171875, -0.16808319091796875, -0.14910888671875, -0.13013458251953125, -0.1111602783203125, -0.09218597412109375, -0.073211669921875, -0.05423736572265625, -0.0352630615234375, -0.01628875732421875, 0.002685546875, 0.02165985107421875, 0.0406341552734375, 0.05960845947265625, 0.078582763671875, 0.09755706787109375, 0.1165313720703125, 0.13550567626953125, 0.15447998046875, 0.17345428466796875, 0.1924285888671875, 0.21140289306640625, 0.230377197265625, 0.24935150146484375, 0.2683258056640625, 0.28730010986328125, 0.3062744140625, 0.32524871826171875, 0.3442230224609375, 0.36319732666015625, 0.382171630859375, 0.40114593505859375, 0.4201202392578125, 0.43909454345703125, 0.45806884765625, 0.47704315185546875, 0.4960174560546875, 0.5149917602539062, 0.533966064453125, 0.5529403686523438, 0.5719146728515625, 0.5908889770507812, 0.60986328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 9.0, 9.0, 12.0, 14.0, 9.0, 10.0, 18.0, 23.0, 34.0, 38.0, 40.0, 60.0, 100.0, 94.0, 114.0, 86.0, 69.0, 47.0, 43.0, 28.0, 21.0, 21.0, 12.0, 5.0, 10.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0064239501953125, -0.006235778331756592, -0.006047606468200684, -0.005859434604644775, -0.005671262741088867, -0.005483090877532959, -0.005294919013977051, -0.005106747150421143, -0.004918575286865234, -0.004730403423309326, -0.004542231559753418, -0.00435405969619751, -0.0041658878326416016, -0.003977715969085693, -0.003789544105529785, -0.003601372241973877, -0.0034132003784179688, -0.0032250285148620605, -0.0030368566513061523, -0.002848684787750244, -0.002660512924194336, -0.0024723410606384277, -0.0022841691970825195, -0.0020959973335266113, -0.0019078254699707031, -0.001719653606414795, -0.0015314817428588867, -0.0013433098793029785, -0.0011551380157470703, -0.0009669661521911621, -0.0007787942886352539, -0.0005906224250793457, -0.0004024505615234375, -0.0002142786979675293, -2.6106834411621094e-05, 0.0001620650291442871, 0.0003502368927001953, 0.0005384087562561035, 0.0007265806198120117, 0.0009147524833679199, 0.0011029243469238281, 0.0012910962104797363, 0.0014792680740356445, 0.0016674399375915527, 0.001855611801147461, 0.002043783664703369, 0.0022319555282592773, 0.0024201273918151855, 0.0026082992553710938, 0.002796471118927002, 0.00298464298248291, 0.0031728148460388184, 0.0033609867095947266, 0.0035491585731506348, 0.003737330436706543, 0.003925502300262451, 0.004113674163818359, 0.004301846027374268, 0.004490017890930176, 0.004678189754486084, 0.004866361618041992, 0.0050545334815979, 0.005242705345153809, 0.005430877208709717, 0.005619049072265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 6.0, 11.0, 6.0, 13.0, 17.0, 11.0, 22.0, 32.0, 40.0, 50.0, 95.0, 122.0, 236.0, 406.0, 1177.0, 991801.0, 52685.0, 797.0, 338.0, 197.0, 133.0, 73.0, 55.0, 32.0, 41.0, 22.0, 20.0, 23.0, 16.0, 11.0, 12.0, 14.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10864830017089844, -0.10474777221679688, -0.10084724426269531, -0.09694671630859375, -0.09304618835449219, -0.08914566040039062, -0.08524513244628906, -0.0813446044921875, -0.07744407653808594, -0.07354354858398438, -0.06964302062988281, -0.06574249267578125, -0.06184196472167969, -0.057941436767578125, -0.05404090881347656, -0.050140380859375, -0.04623985290527344, -0.042339324951171875, -0.03843879699707031, -0.03453826904296875, -0.030637741088867188, -0.026737213134765625, -0.022836685180664062, -0.0189361572265625, -0.015035629272460938, -0.011135101318359375, -0.0072345733642578125, -0.00333404541015625, 0.0005664825439453125, 0.004467010498046875, 0.008367538452148438, 0.01226806640625, 0.016168594360351562, 0.020069122314453125, 0.023969650268554688, 0.02787017822265625, 0.03177070617675781, 0.035671234130859375, 0.03957176208496094, 0.0434722900390625, 0.04737281799316406, 0.051273345947265625, 0.05517387390136719, 0.05907440185546875, 0.06297492980957031, 0.06687545776367188, 0.07077598571777344, 0.074676513671875, 0.07857704162597656, 0.08247756958007812, 0.08637809753417969, 0.09027862548828125, 0.09417915344238281, 0.09807968139648438, 0.10198020935058594, 0.1058807373046875, 0.10978126525878906, 0.11368179321289062, 0.11758232116699219, 0.12148284912109375, 0.1253833770751953, 0.12928390502929688, 0.13318443298339844, 0.1370849609375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 19.0, 391.0, 574.0, 29.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006860879249870777, -0.0064063784666359425, -0.005951878149062395, -0.00549737736582756, -0.005042877048254013, -0.004588376265019178, -0.004133875481784344, -0.0036793749313801527, -0.0032248743809759617, -0.0027703738305717707, -0.0023158732801675797, -0.001861372496932745, -0.001406871946528554, -0.0009523713961243629, -0.0004978706128895283, -4.337006248533726e-05, 0.00041113048791885376, 0.0008656310965307057, 0.0013201317051425576, 0.0017746323719620705, 0.0022291329223662615, 0.0026836334727704525, 0.003138134256005287, 0.003592634806409478, 0.004047135356813669, 0.004501636140048504, 0.004956136457622051, 0.005410637240856886, 0.005865138024091721, 0.006319638341665268, 0.006774139124900103, 0.007228639908134937, 0.00768313929438591, 0.008137639611959457, 0.00859214086085558, 0.009046641178429127, 0.009501141496002674, 0.009955642744898796, 0.010410143062472343, 0.01086464338004589, 0.011319143697619438, 0.011773644015192986, 0.012228145264089108, 0.012682645581662655, 0.013137145899236202, 0.013591647148132324, 0.014046147465705872, 0.014500647783279419, 0.014955149032175541, 0.015409649349749088, 0.01586415059864521, 0.016318650916218758, 0.016773151233792305, 0.017227651551365852, 0.01768215373158455, 0.018136654049158096, 0.018591154366731644, 0.01904565468430519, 0.01950015500187874, 0.019954655319452286, 0.020409157499670982, 0.02086365781724453, 0.021318158134818077, 0.021772658452391624, 0.022227158769965172]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 5.0, 14.0, 20.0, 13.0, 11.0, 20.0, 25.0, 25.0, 29.0, 30.0, 26.0, 39.0, 31.0, 49.0, 46.0, 44.0, 44.0, 32.0, 49.0, 42.0, 46.0, 38.0, 36.0, 33.0, 32.0, 30.0, 31.0, 28.0, 21.0, 16.0, 15.0, 11.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.003086388111114502, -0.0029953066259622574, -0.002904225140810013, -0.0028131436556577682, -0.0027220621705055237, -0.002630980685353279, -0.0025398992002010345, -0.00244881771504879, -0.0023577362298965454, -0.002266654744744301, -0.0021755732595920563, -0.0020844917744398117, -0.001993410289287567, -0.0019023288041353226, -0.001811247318983078, -0.0017201658338308334, -0.0016290843486785889, -0.0015380028635263443, -0.0014469213783740997, -0.0013558398932218552, -0.0012647584080696106, -0.001173676922917366, -0.0010825954377651215, -0.000991513952612877, -0.0009004324674606323, -0.0008093509823083878, -0.0007182694971561432, -0.0006271880120038986, -0.000536106526851654, -0.0004450250416994095, -0.0003539435565471649, -0.00026286207139492035, -0.00017178058624267578, -8.069910109043121e-05, 1.0382384061813354e-05, 0.00010146386921405792, 0.0001925453543663025, 0.00028362683951854706, 0.0003747083246707916, 0.0004657898098230362, 0.0005568712949752808, 0.0006479527801275253, 0.0007390342652797699, 0.0008301157504320145, 0.000921197235584259, 0.0010122787207365036, 0.0011033602058887482, 0.0011944416910409927, 0.0012855231761932373, 0.0013766046613454819, 0.0014676861464977264, 0.001558767631649971, 0.0016498491168022156, 0.0017409306019544601, 0.0018320120871067047, 0.0019230935722589493, 0.002014175057411194, 0.0021052565425634384, 0.002196338027715683, 0.0022874195128679276, 0.002378500998020172, 0.0024695824831724167, 0.0025606639683246613, 0.002651745453476906, 0.0027428269386291504]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 8.0, 3.0, 4.0, 9.0, 9.0, 13.0, 6.0, 10.0, 27.0, 28.0, 30.0, 18.0, 26.0, 38.0, 46.0, 46.0, 41.0, 46.0, 30.0, 32.0, 47.0, 48.0, 43.0, 40.0, 41.0, 28.0, 43.0, 29.0, 29.0, 30.0, 21.0, 22.0, 17.0, 19.0, 15.0, 9.0, 10.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.4921875, -6.2860107421875, -6.079833984375, -5.8736572265625, -5.66748046875, -5.4613037109375, -5.255126953125, -5.0489501953125, -4.8427734375, -4.6365966796875, -4.430419921875, -4.2242431640625, -4.01806640625, -3.8118896484375, -3.605712890625, -3.3995361328125, -3.193359375, -2.9871826171875, -2.781005859375, -2.5748291015625, -2.36865234375, -2.1624755859375, -1.956298828125, -1.7501220703125, -1.5439453125, -1.3377685546875, -1.131591796875, -0.9254150390625, -0.71923828125, -0.5130615234375, -0.306884765625, -0.1007080078125, 0.10546875, 0.3116455078125, 0.517822265625, 0.7239990234375, 0.93017578125, 1.1363525390625, 1.342529296875, 1.5487060546875, 1.7548828125, 1.9610595703125, 2.167236328125, 2.3734130859375, 2.57958984375, 2.7857666015625, 2.991943359375, 3.1981201171875, 3.404296875, 3.6104736328125, 3.816650390625, 4.0228271484375, 4.22900390625, 4.4351806640625, 4.641357421875, 4.8475341796875, 5.0537109375, 5.2598876953125, 5.466064453125, 5.6722412109375, 5.87841796875, 6.0845947265625, 6.290771484375, 6.4969482421875, 6.703125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 12.0, 7.0, 11.0, 27.0, 21.0, 32.0, 40.0, 55.0, 95.0, 96.0, 146.0, 218.0, 268.0, 377.0, 513.0, 721.0, 1556.0, 5894.0, 37880.0, 640530.0, 327528.0, 24608.0, 4192.0, 1294.0, 636.0, 468.0, 319.0, 242.0, 192.0, 154.0, 107.0, 75.0, 57.0, 43.0, 31.0, 24.0, 19.0, 14.0, 9.0, 11.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-16.421875, -15.906982421875, -15.39208984375, -14.877197265625, -14.3623046875, -13.847412109375, -13.33251953125, -12.817626953125, -12.302734375, -11.787841796875, -11.27294921875, -10.758056640625, -10.2431640625, -9.728271484375, -9.21337890625, -8.698486328125, -8.18359375, -7.668701171875, -7.15380859375, -6.638916015625, -6.1240234375, -5.609130859375, -5.09423828125, -4.579345703125, -4.064453125, -3.549560546875, -3.03466796875, -2.519775390625, -2.0048828125, -1.489990234375, -0.97509765625, -0.460205078125, 0.0546875, 0.569580078125, 1.08447265625, 1.599365234375, 2.1142578125, 2.629150390625, 3.14404296875, 3.658935546875, 4.173828125, 4.688720703125, 5.20361328125, 5.718505859375, 6.2333984375, 6.748291015625, 7.26318359375, 7.778076171875, 8.29296875, 8.807861328125, 9.32275390625, 9.837646484375, 10.3525390625, 10.867431640625, 11.38232421875, 11.897216796875, 12.412109375, 12.927001953125, 13.44189453125, 13.956787109375, 14.4716796875, 14.986572265625, 15.50146484375, 16.016357421875, 16.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 6.0, 5.0, 5.0, 8.0, 7.0, 11.0, 14.0, 15.0, 20.0, 22.0, 25.0, 40.0, 38.0, 32.0, 42.0, 39.0, 46.0, 112.0, 218.0, 1640.0, 197.0, 88.0, 55.0, 45.0, 37.0, 34.0, 31.0, 29.0, 30.0, 27.0, 18.0, 19.0, 16.0, 11.0, 14.0, 12.0, 8.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.26318359375, -21.6357421875, -21.00830078125, -20.380859375, -19.75341796875, -19.1259765625, -18.49853515625, -17.87109375, -17.24365234375, -16.6162109375, -15.98876953125, -15.361328125, -14.73388671875, -14.1064453125, -13.47900390625, -12.8515625, -12.22412109375, -11.5966796875, -10.96923828125, -10.341796875, -9.71435546875, -9.0869140625, -8.45947265625, -7.83203125, -7.20458984375, -6.5771484375, -5.94970703125, -5.322265625, -4.69482421875, -4.0673828125, -3.43994140625, -2.8125, -2.18505859375, -1.5576171875, -0.93017578125, -0.302734375, 0.32470703125, 0.9521484375, 1.57958984375, 2.20703125, 2.83447265625, 3.4619140625, 4.08935546875, 4.716796875, 5.34423828125, 5.9716796875, 6.59912109375, 7.2265625, 7.85400390625, 8.4814453125, 9.10888671875, 9.736328125, 10.36376953125, 10.9912109375, 11.61865234375, 12.24609375, 12.87353515625, 13.5009765625, 14.12841796875, 14.755859375, 15.38330078125, 16.0107421875, 16.63818359375, 17.265625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 7.0, 17.0, 12.0, 10.0, 21.0, 12.0, 16.0, 30.0, 40.0, 41.0, 56.0, 45.0, 77.0, 131.0, 231.0, 546.0, 2041.0, 51362.0, 3078193.0, 10541.0, 1231.0, 351.0, 206.0, 106.0, 78.0, 59.0, 45.0, 35.0, 32.0, 20.0, 23.0, 20.0, 5.0, 8.0, 7.0, 8.0, 5.0, 4.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.1875, -44.49755859375, -42.8076171875, -41.11767578125, -39.427734375, -37.73779296875, -36.0478515625, -34.35791015625, -32.66796875, -30.97802734375, -29.2880859375, -27.59814453125, -25.908203125, -24.21826171875, -22.5283203125, -20.83837890625, -19.1484375, -17.45849609375, -15.7685546875, -14.07861328125, -12.388671875, -10.69873046875, -9.0087890625, -7.31884765625, -5.62890625, -3.93896484375, -2.2490234375, -0.55908203125, 1.130859375, 2.82080078125, 4.5107421875, 6.20068359375, 7.890625, 9.58056640625, 11.2705078125, 12.96044921875, 14.650390625, 16.34033203125, 18.0302734375, 19.72021484375, 21.41015625, 23.10009765625, 24.7900390625, 26.47998046875, 28.169921875, 29.85986328125, 31.5498046875, 33.23974609375, 34.9296875, 36.61962890625, 38.3095703125, 39.99951171875, 41.689453125, 43.37939453125, 45.0693359375, 46.75927734375, 48.44921875, 50.13916015625, 51.8291015625, 53.51904296875, 55.208984375, 56.89892578125, 58.5888671875, 60.27880859375, 61.96875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 32.0, 86.0, 131.0, 190.0, 213.0, 169.0, 103.0, 51.0, 17.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.60552215576172, -31.626922607421875, -30.648324966430664, -29.66972541809082, -28.69112777709961, -27.712528228759766, -26.733928680419922, -25.75533103942871, -24.776731491088867, -23.798131942749023, -22.819534301757812, -21.84093475341797, -20.862337112426758, -19.883737564086914, -18.905139923095703, -17.92654037475586, -16.947940826416016, -15.969342231750488, -14.990743637084961, -14.012144088745117, -13.03354549407959, -12.054946899414062, -11.076348304748535, -10.097749710083008, -9.119152069091797, -8.14055347442627, -7.161954402923584, -6.183355808258057, -5.204756736755371, -4.226158142089844, -3.2475595474243164, -2.268960475921631, -1.2903614044189453, -0.31176263093948364, 0.666836142539978, 1.645434856414795, 2.6240336894989014, 3.602632522583008, 4.581231117248535, 5.559830188751221, 6.538428783416748, 7.517027378082275, 8.495626449584961, 9.474225044250488, 10.452823638916016, 11.43142318725586, 12.41002082824707, 13.388620376586914, 14.367218971252441, 15.345817565917969, 16.324417114257812, 17.303014755249023, 18.281614303588867, 19.260211944580078, 20.238811492919922, 21.217411041259766, 22.196008682250977, 23.17460823059082, 24.15320587158203, 25.131805419921875, 26.110403060913086, 27.08900260925293, 28.06760025024414, 29.046199798583984, 30.024799346923828]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 4.0, 6.0, 2.0, 3.0, 7.0, 15.0, 7.0, 22.0, 20.0, 19.0, 25.0, 18.0, 20.0, 27.0, 30.0, 29.0, 31.0, 29.0, 32.0, 30.0, 35.0, 29.0, 46.0, 52.0, 34.0, 34.0, 38.0, 29.0, 32.0, 29.0, 27.0, 29.0, 35.0, 24.0, 20.0, 14.0, 15.0, 19.0, 18.0, 12.0, 10.0, 6.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-44.967777252197266, -43.60894012451172, -42.25010299682617, -40.891265869140625, -39.53242874145508, -38.17359161376953, -36.81475067138672, -35.45591735839844, -34.097076416015625, -32.73823928833008, -31.37940216064453, -30.020565032958984, -28.661727905273438, -27.30289077758789, -25.94405174255371, -24.585214614868164, -23.22637939453125, -21.867542266845703, -20.508705139160156, -19.14986801147461, -17.791030883789062, -16.432193756103516, -15.073354721069336, -13.714517593383789, -12.355680465698242, -10.996843338012695, -9.638006210327148, -8.279168128967285, -6.920331001281738, -5.561493873596191, -4.202655792236328, -2.8438186645507812, -1.4849815368652344, -0.1261441707611084, 1.2326931953430176, 2.5915307998657227, 3.9503679275512695, 5.309205055236816, 6.66804313659668, 8.026880264282227, 9.385717391967773, 10.74455451965332, 12.103391647338867, 13.46222972869873, 14.821066856384277, 16.17990493774414, 17.538742065429688, 18.897579193115234, 20.25641632080078, 21.615253448486328, 22.974090576171875, 24.332927703857422, 25.69176483154297, 27.050601959228516, 28.409440994262695, 29.768278121948242, 31.12711524963379, 32.48595428466797, 33.844791412353516, 35.20362854003906, 36.56246566772461, 37.921302795410156, 39.2801399230957, 40.63897705078125, 41.9978141784668]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 12.0, 12.0, 11.0, 16.0, 12.0, 30.0, 35.0, 32.0, 35.0, 26.0, 41.0, 40.0, 49.0, 47.0, 35.0, 44.0, 35.0, 42.0, 40.0, 36.0, 34.0, 30.0, 33.0, 42.0, 29.0, 30.0, 22.0, 17.0, 18.0, 16.0, 18.0, 14.0, 12.0, 4.0, 10.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.52734375, -6.31298828125, -6.0986328125, -5.88427734375, -5.669921875, -5.45556640625, -5.2412109375, -5.02685546875, -4.8125, -4.59814453125, -4.3837890625, -4.16943359375, -3.955078125, -3.74072265625, -3.5263671875, -3.31201171875, -3.09765625, -2.88330078125, -2.6689453125, -2.45458984375, -2.240234375, -2.02587890625, -1.8115234375, -1.59716796875, -1.3828125, -1.16845703125, -0.9541015625, -0.73974609375, -0.525390625, -0.31103515625, -0.0966796875, 0.11767578125, 0.33203125, 0.54638671875, 0.7607421875, 0.97509765625, 1.189453125, 1.40380859375, 1.6181640625, 1.83251953125, 2.046875, 2.26123046875, 2.4755859375, 2.68994140625, 2.904296875, 3.11865234375, 3.3330078125, 3.54736328125, 3.76171875, 3.97607421875, 4.1904296875, 4.40478515625, 4.619140625, 4.83349609375, 5.0478515625, 5.26220703125, 5.4765625, 5.69091796875, 5.9052734375, 6.11962890625, 6.333984375, 6.54833984375, 6.7626953125, 6.97705078125, 7.19140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 12.0, 9.0, 18.0, 22.0, 23.0, 41.0, 39.0, 41.0, 85.0, 97.0, 151.0, 164.0, 243.0, 388.0, 707.0, 2156.0, 13688.0, 176860.0, 1612331.0, 2083802.0, 278430.0, 19776.0, 2872.0, 827.0, 427.0, 284.0, 161.0, 141.0, 107.0, 73.0, 73.0, 46.0, 42.0, 25.0, 25.0, 18.0, 13.0, 12.0, 12.0, 5.0, 6.0, 5.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.140625, -10.7576904296875, -10.374755859375, -9.9918212890625, -9.60888671875, -9.2259521484375, -8.843017578125, -8.4600830078125, -8.0771484375, -7.6942138671875, -7.311279296875, -6.9283447265625, -6.54541015625, -6.1624755859375, -5.779541015625, -5.3966064453125, -5.013671875, -4.6307373046875, -4.247802734375, -3.8648681640625, -3.48193359375, -3.0989990234375, -2.716064453125, -2.3331298828125, -1.9501953125, -1.5672607421875, -1.184326171875, -0.8013916015625, -0.41845703125, -0.0355224609375, 0.347412109375, 0.7303466796875, 1.11328125, 1.4962158203125, 1.879150390625, 2.2620849609375, 2.64501953125, 3.0279541015625, 3.410888671875, 3.7938232421875, 4.1767578125, 4.5596923828125, 4.942626953125, 5.3255615234375, 5.70849609375, 6.0914306640625, 6.474365234375, 6.8572998046875, 7.240234375, 7.6231689453125, 8.006103515625, 8.3890380859375, 8.77197265625, 9.1549072265625, 9.537841796875, 9.9207763671875, 10.3037109375, 10.6866455078125, 11.069580078125, 11.4525146484375, 11.83544921875, 12.2183837890625, 12.601318359375, 12.9842529296875, 13.3671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 13.0, 14.0, 20.0, 28.0, 49.0, 72.0, 112.0, 207.0, 357.0, 512.0, 662.0, 555.0, 532.0, 366.0, 187.0, 147.0, 73.0, 53.0, 41.0, 18.0, 14.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.372314453125, -8.94775390625, -8.523193359375, -8.0986328125, -7.674072265625, -7.24951171875, -6.824951171875, -6.400390625, -5.975830078125, -5.55126953125, -5.126708984375, -4.7021484375, -4.277587890625, -3.85302734375, -3.428466796875, -3.00390625, -2.579345703125, -2.15478515625, -1.730224609375, -1.3056640625, -0.881103515625, -0.45654296875, -0.031982421875, 0.392578125, 0.817138671875, 1.24169921875, 1.666259765625, 2.0908203125, 2.515380859375, 2.93994140625, 3.364501953125, 3.7890625, 4.213623046875, 4.63818359375, 5.062744140625, 5.4873046875, 5.911865234375, 6.33642578125, 6.760986328125, 7.185546875, 7.610107421875, 8.03466796875, 8.459228515625, 8.8837890625, 9.308349609375, 9.73291015625, 10.157470703125, 10.58203125, 11.006591796875, 11.43115234375, 11.855712890625, 12.2802734375, 12.704833984375, 13.12939453125, 13.553955078125, 13.978515625, 14.403076171875, 14.82763671875, 15.252197265625, 15.6767578125, 16.101318359375, 16.52587890625, 16.950439453125, 17.375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 1.0, 7.0, 9.0, 13.0, 26.0, 45.0, 64.0, 102.0, 210.0, 344.0, 741.0, 2264.0, 44078.0, 3892775.0, 246858.0, 4690.0, 1081.0, 450.0, 214.0, 127.0, 69.0, 46.0, 26.0, 13.0, 12.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.318603515625, -42.13720703125, -40.955810546875, -39.7744140625, -38.593017578125, -37.41162109375, -36.230224609375, -35.048828125, -33.867431640625, -32.68603515625, -31.504638671875, -30.3232421875, -29.141845703125, -27.96044921875, -26.779052734375, -25.59765625, -24.416259765625, -23.23486328125, -22.053466796875, -20.8720703125, -19.690673828125, -18.50927734375, -17.327880859375, -16.146484375, -14.965087890625, -13.78369140625, -12.602294921875, -11.4208984375, -10.239501953125, -9.05810546875, -7.876708984375, -6.6953125, -5.513916015625, -4.33251953125, -3.151123046875, -1.9697265625, -0.788330078125, 0.39306640625, 1.574462890625, 2.755859375, 3.937255859375, 5.11865234375, 6.300048828125, 7.4814453125, 8.662841796875, 9.84423828125, 11.025634765625, 12.20703125, 13.388427734375, 14.56982421875, 15.751220703125, 16.9326171875, 18.114013671875, 19.29541015625, 20.476806640625, 21.658203125, 22.839599609375, 24.02099609375, 25.202392578125, 26.3837890625, 27.565185546875, 28.74658203125, 29.927978515625, 31.109375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 93.0, 327.0, 414.0, 150.0, 16.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.908550262451172, -17.654666900634766, -13.400782585144043, -9.14689826965332, -4.893014907836914, -0.6391315460205078, 3.6147537231445312, 7.8686370849609375, 12.122520446777344, 16.37640380859375, 20.630287170410156, 24.884172439575195, 29.1380558013916, 33.391937255859375, 37.64582443237305, 41.89970779418945, 46.15359115600586, 50.407474517822266, 54.66135787963867, 58.915245056152344, 63.16912841796875, 67.42301177978516, 71.67689514160156, 75.93077850341797, 80.18466186523438, 84.43854522705078, 88.69242858886719, 92.9463119506836, 97.2001953125, 101.4540786743164, 105.70796203613281, 109.96185302734375, 114.21574401855469, 118.4696273803711, 122.7235107421875, 126.9773941040039, 131.2312774658203, 135.48516845703125, 139.73904418945312, 143.99293518066406, 148.24681091308594, 152.50070190429688, 156.75457763671875, 161.0084686279297, 165.26234436035156, 169.5162353515625, 173.77011108398438, 178.0240020751953, 182.27789306640625, 186.5317840576172, 190.78565979003906, 195.03955078125, 199.29342651367188, 203.5473175048828, 207.8011932373047, 212.05508422851562, 216.3089599609375, 220.56285095214844, 224.8167266845703, 229.07061767578125, 233.32449340820312, 237.57838439941406, 241.83226013183594, 246.08615112304688, 250.34002685546875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 9.0, 17.0, 16.0, 15.0, 13.0, 22.0, 26.0, 25.0, 27.0, 38.0, 46.0, 31.0, 35.0, 44.0, 41.0, 48.0, 42.0, 43.0, 37.0, 41.0, 34.0, 30.0, 35.0, 31.0, 25.0, 27.0, 29.0, 22.0, 20.0, 19.0, 12.0, 13.0, 7.0, 8.0, 8.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.4581298828125, -32.43269729614258, -31.40726661682129, -30.3818359375, -29.356403350830078, -28.330970764160156, -27.305540084838867, -26.280109405517578, -25.254676818847656, -24.229244232177734, -23.203813552856445, -22.178382873535156, -21.152950286865234, -20.127517700195312, -19.102087020874023, -18.076656341552734, -17.051223754882812, -16.02579116821289, -15.000360488891602, -13.974928855895996, -12.94949722290039, -11.924065589904785, -10.89863395690918, -9.873202323913574, -8.847770690917969, -7.822339057922363, -6.796907424926758, -5.771475791931152, -4.746044158935547, -3.7206125259399414, -2.695180892944336, -1.6697492599487305, -0.644317626953125, 0.38111400604248047, 1.406545639038086, 2.4319772720336914, 3.457408905029297, 4.482840538024902, 5.508272171020508, 6.533703804016113, 7.559135437011719, 8.584567070007324, 9.60999870300293, 10.635430335998535, 11.66086196899414, 12.686293601989746, 13.711725234985352, 14.737156867980957, 15.762588500976562, 16.788021087646484, 17.813451766967773, 18.838882446289062, 19.864315032958984, 20.889747619628906, 21.915178298950195, 22.940608978271484, 23.966041564941406, 24.991474151611328, 26.016904830932617, 27.042335510253906, 28.067768096923828, 29.09320068359375, 30.11863136291504, 31.144062042236328, 32.16949462890625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 19.0, 18.0, 20.0, 33.0, 24.0, 35.0, 48.0, 34.0, 44.0, 46.0, 41.0, 45.0, 40.0, 46.0, 48.0, 42.0, 36.0, 35.0, 47.0, 46.0, 32.0, 29.0, 33.0, 26.0, 19.0, 18.0, 11.0, 10.0, 13.0, 12.0, 6.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.53656005859375, -5.3035888671875, -5.07061767578125, -4.837646484375, -4.60467529296875, -4.3717041015625, -4.13873291015625, -3.90576171875, -3.67279052734375, -3.4398193359375, -3.20684814453125, -2.973876953125, -2.74090576171875, -2.5079345703125, -2.27496337890625, -2.0419921875, -1.80902099609375, -1.5760498046875, -1.34307861328125, -1.110107421875, -0.87713623046875, -0.6441650390625, -0.41119384765625, -0.17822265625, 0.05474853515625, 0.2877197265625, 0.52069091796875, 0.753662109375, 0.98663330078125, 1.2196044921875, 1.45257568359375, 1.685546875, 1.91851806640625, 2.1514892578125, 2.38446044921875, 2.617431640625, 2.85040283203125, 3.0833740234375, 3.31634521484375, 3.54931640625, 3.78228759765625, 4.0152587890625, 4.24822998046875, 4.481201171875, 4.71417236328125, 4.9471435546875, 5.18011474609375, 5.4130859375, 5.64605712890625, 5.8790283203125, 6.11199951171875, 6.344970703125, 6.57794189453125, 6.8109130859375, 7.04388427734375, 7.27685546875, 7.50982666015625, 7.7427978515625, 7.97576904296875, 8.208740234375, 8.44171142578125, 8.6746826171875, 8.90765380859375, 9.140625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 3.0, 10.0, 16.0, 14.0, 19.0, 38.0, 51.0, 103.0, 118.0, 202.0, 265.0, 426.0, 654.0, 890.0, 1392.0, 2063.0, 2972.0, 4524.0, 6635.0, 10218.0, 15621.0, 24667.0, 38625.0, 61422.0, 98303.0, 155123.0, 208537.0, 152537.0, 95821.0, 60010.0, 37811.0, 23886.0, 15250.0, 10053.0, 6565.0, 4482.0, 3026.0, 2044.0, 1392.0, 948.0, 592.0, 398.0, 258.0, 185.0, 129.0, 89.0, 49.0, 32.0, 20.0, 15.0, 11.0, 17.0, 9.0, 9.0, 3.0, 2.0, 1.0], "bins": [-0.67529296875, -0.655120849609375, -0.63494873046875, -0.614776611328125, -0.5946044921875, -0.574432373046875, -0.55426025390625, -0.534088134765625, -0.513916015625, -0.493743896484375, -0.47357177734375, -0.453399658203125, -0.4332275390625, -0.413055419921875, -0.39288330078125, -0.372711181640625, -0.3525390625, -0.332366943359375, -0.31219482421875, -0.292022705078125, -0.2718505859375, -0.251678466796875, -0.23150634765625, -0.211334228515625, -0.191162109375, -0.170989990234375, -0.15081787109375, -0.130645751953125, -0.1104736328125, -0.090301513671875, -0.07012939453125, -0.049957275390625, -0.02978515625, -0.009613037109375, 0.01055908203125, 0.030731201171875, 0.0509033203125, 0.071075439453125, 0.09124755859375, 0.111419677734375, 0.131591796875, 0.151763916015625, 0.17193603515625, 0.192108154296875, 0.2122802734375, 0.232452392578125, 0.25262451171875, 0.272796630859375, 0.29296875, 0.313140869140625, 0.33331298828125, 0.353485107421875, 0.3736572265625, 0.393829345703125, 0.41400146484375, 0.434173583984375, 0.454345703125, 0.474517822265625, 0.49468994140625, 0.514862060546875, 0.5350341796875, 0.555206298828125, 0.57537841796875, 0.595550537109375, 0.61572265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 7.0, 10.0, 13.0, 18.0, 22.0, 23.0, 16.0, 23.0, 23.0, 25.0, 42.0, 33.0, 50.0, 43.0, 42.0, 48.0, 35.0, 1071.0, 44.0, 39.0, 34.0, 35.0, 30.0, 31.0, 30.0, 39.0, 20.0, 21.0, 20.0, 21.0, 22.0, 17.0, 17.0, 12.0, 6.0, 9.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.21405029296875, -4.0804443359375, -3.94683837890625, -3.813232421875, -3.67962646484375, -3.5460205078125, -3.41241455078125, -3.27880859375, -3.14520263671875, -3.0115966796875, -2.87799072265625, -2.744384765625, -2.61077880859375, -2.4771728515625, -2.34356689453125, -2.2099609375, -2.07635498046875, -1.9427490234375, -1.80914306640625, -1.675537109375, -1.54193115234375, -1.4083251953125, -1.27471923828125, -1.14111328125, -1.00750732421875, -0.8739013671875, -0.74029541015625, -0.606689453125, -0.47308349609375, -0.3394775390625, -0.20587158203125, -0.072265625, 0.06134033203125, 0.1949462890625, 0.32855224609375, 0.462158203125, 0.59576416015625, 0.7293701171875, 0.86297607421875, 0.99658203125, 1.13018798828125, 1.2637939453125, 1.39739990234375, 1.531005859375, 1.66461181640625, 1.7982177734375, 1.93182373046875, 2.0654296875, 2.19903564453125, 2.3326416015625, 2.46624755859375, 2.599853515625, 2.73345947265625, 2.8670654296875, 3.00067138671875, 3.13427734375, 3.26788330078125, 3.4014892578125, 3.53509521484375, 3.668701171875, 3.80230712890625, 3.9359130859375, 4.06951904296875, 4.203125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 11.0, 6.0, 15.0, 19.0, 37.0, 54.0, 60.0, 95.0, 147.0, 212.0, 287.0, 416.0, 625.0, 922.0, 1337.0, 2205.0, 3212.0, 4784.0, 7433.0, 11378.0, 18299.0, 29842.0, 49965.0, 84980.0, 148140.0, 1272925.0, 190206.0, 107963.0, 62273.0, 36865.0, 22548.0, 14104.0, 8803.0, 5792.0, 3772.0, 2327.0, 1653.0, 1110.0, 727.0, 512.0, 338.0, 229.0, 157.0, 98.0, 62.0, 48.0, 37.0, 30.0, 20.0, 15.0, 6.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0], "bins": [-0.66259765625, -0.6423416137695312, -0.6220855712890625, -0.6018295288085938, -0.581573486328125, -0.5613174438476562, -0.5410614013671875, -0.5208053588867188, -0.50054931640625, -0.48029327392578125, -0.4600372314453125, -0.43978118896484375, -0.419525146484375, -0.39926910400390625, -0.3790130615234375, -0.35875701904296875, -0.3385009765625, -0.31824493408203125, -0.2979888916015625, -0.27773284912109375, -0.257476806640625, -0.23722076416015625, -0.2169647216796875, -0.19670867919921875, -0.17645263671875, -0.15619659423828125, -0.1359405517578125, -0.11568450927734375, -0.095428466796875, -0.07517242431640625, -0.0549163818359375, -0.03466033935546875, -0.014404296875, 0.00585174560546875, 0.0261077880859375, 0.04636383056640625, 0.066619873046875, 0.08687591552734375, 0.1071319580078125, 0.12738800048828125, 0.14764404296875, 0.16790008544921875, 0.1881561279296875, 0.20841217041015625, 0.228668212890625, 0.24892425537109375, 0.2691802978515625, 0.28943634033203125, 0.3096923828125, 0.32994842529296875, 0.3502044677734375, 0.37046051025390625, 0.390716552734375, 0.41097259521484375, 0.4312286376953125, 0.45148468017578125, 0.47174072265625, 0.49199676513671875, 0.5122528076171875, 0.5325088500976562, 0.552764892578125, 0.5730209350585938, 0.5932769775390625, 0.6135330200195312, 0.6337890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 4.0, 5.0, 8.0, 12.0, 7.0, 11.0, 9.0, 13.0, 17.0, 23.0, 19.0, 28.0, 23.0, 40.0, 44.0, 56.0, 73.0, 91.0, 88.0, 77.0, 44.0, 41.0, 43.0, 26.0, 28.0, 23.0, 18.0, 20.0, 16.0, 12.0, 14.0, 13.0, 10.0, 4.0, 8.0, 4.0, 4.0, 1.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.006275177001953125, -0.006074666976928711, -0.005874156951904297, -0.005673646926879883, -0.005473136901855469, -0.005272626876831055, -0.005072116851806641, -0.0048716068267822266, -0.0046710968017578125, -0.0044705867767333984, -0.004270076751708984, -0.00406956672668457, -0.0038690567016601562, -0.003668546676635742, -0.003468036651611328, -0.003267526626586914, -0.0030670166015625, -0.002866506576538086, -0.002665996551513672, -0.002465486526489258, -0.0022649765014648438, -0.0020644664764404297, -0.0018639564514160156, -0.0016634464263916016, -0.0014629364013671875, -0.0012624263763427734, -0.0010619163513183594, -0.0008614063262939453, -0.0006608963012695312, -0.0004603862762451172, -0.0002598762512207031, -5.936622619628906e-05, 0.000141143798828125, 0.00034165382385253906, 0.0005421638488769531, 0.0007426738739013672, 0.0009431838989257812, 0.0011436939239501953, 0.0013442039489746094, 0.0015447139739990234, 0.0017452239990234375, 0.0019457340240478516, 0.0021462440490722656, 0.0023467540740966797, 0.0025472640991210938, 0.002747774124145508, 0.002948284149169922, 0.003148794174194336, 0.00334930419921875, 0.003549814224243164, 0.003750324249267578, 0.003950834274291992, 0.004151344299316406, 0.00435185432434082, 0.004552364349365234, 0.0047528743743896484, 0.0049533843994140625, 0.0051538944244384766, 0.005354404449462891, 0.005554914474487305, 0.005755424499511719, 0.005955934524536133, 0.006156444549560547, 0.006356954574584961, 0.006557464599609375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 9.0, 4.0, 7.0, 11.0, 16.0, 6.0, 13.0, 16.0, 13.0, 25.0, 32.0, 42.0, 55.0, 69.0, 72.0, 121.0, 193.0, 299.0, 545.0, 2123.0, 1034703.0, 8306.0, 741.0, 355.0, 236.0, 133.0, 83.0, 72.0, 47.0, 46.0, 32.0, 21.0, 19.0, 22.0, 15.0, 9.0, 13.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1380615234375, -0.13383102416992188, -0.12960052490234375, -0.12537002563476562, -0.1211395263671875, -0.11690902709960938, -0.11267852783203125, -0.10844802856445312, -0.104217529296875, -0.09998703002929688, -0.09575653076171875, -0.09152603149414062, -0.0872955322265625, -0.08306503295898438, -0.07883453369140625, -0.07460403442382812, -0.07037353515625, -0.06614303588867188, -0.06191253662109375, -0.057682037353515625, -0.0534515380859375, -0.049221038818359375, -0.04499053955078125, -0.040760040283203125, -0.036529541015625, -0.032299041748046875, -0.02806854248046875, -0.023838043212890625, -0.0196075439453125, -0.015377044677734375, -0.01114654541015625, -0.006916046142578125, -0.002685546875, 0.001544952392578125, 0.00577545166015625, 0.010005950927734375, 0.0142364501953125, 0.018466949462890625, 0.02269744873046875, 0.026927947998046875, 0.031158447265625, 0.035388946533203125, 0.03961944580078125, 0.043849945068359375, 0.0480804443359375, 0.052310943603515625, 0.05654144287109375, 0.060771942138671875, 0.06500244140625, 0.06923294067382812, 0.07346343994140625, 0.07769393920898438, 0.0819244384765625, 0.08615493774414062, 0.09038543701171875, 0.09461593627929688, 0.098846435546875, 0.10307693481445312, 0.10730743408203125, 0.11153793334960938, 0.1157684326171875, 0.11999893188476562, 0.12422943115234375, 0.12845993041992188, 0.1326904296875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 111.0, 582.0, 282.0, 26.0, 9.0], "bins": [-0.025942981243133545, -0.025515755638480186, -0.02508852817118168, -0.02466130256652832, -0.024234075099229813, -0.023806849494576454, -0.023379622027277946, -0.022952396422624588, -0.02252516895532608, -0.022097943350672722, -0.021670715883374214, -0.021243490278720856, -0.020816262811422348, -0.02038903720676899, -0.019961809739470482, -0.019534584134817123, -0.019107356667518616, -0.018680131062865257, -0.01825290359556675, -0.01782567799091339, -0.017398450523614883, -0.016971224918961525, -0.016543997451663017, -0.01611677184700966, -0.01568954437971115, -0.015262317843735218, -0.014835091307759285, -0.014407864771783352, -0.013980638235807419, -0.013553411699831486, -0.013126185163855553, -0.01269895862787962, -0.012271732091903687, -0.011844505555927753, -0.01141727901995182, -0.010990052483975887, -0.010562825947999954, -0.010135599412024021, -0.009708372876048088, -0.009281146340072155, -0.008853919804096222, -0.008426693268120289, -0.007999466732144356, -0.007572240196168423, -0.00714501366019249, -0.0067177871242165565, -0.0062905605882406235, -0.00586333405226469, -0.005436108447611332, -0.005008881911635399, -0.004581655375659466, -0.004154428839683533, -0.0037272023037075996, -0.0032999760005623102, -0.002872749464586377, -0.002445522928610444, -0.0020182961598038673, -0.0015910696238279343, -0.0011638430878520012, -0.0007366166682913899, -0.00030939013231545687, 0.00011783628724515438, 0.0005450628232210875, 0.0009722893591970205, 0.0013995158951729536]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 0.0, 4.0, 9.0, 4.0, 6.0, 7.0, 8.0, 7.0, 10.0, 11.0, 15.0, 18.0, 19.0, 24.0, 12.0, 25.0, 36.0, 31.0, 28.0, 29.0, 33.0, 32.0, 29.0, 29.0, 32.0, 23.0, 32.0, 33.0, 33.0, 32.0, 33.0, 36.0, 28.0, 27.0, 22.0, 25.0, 29.0, 26.0, 25.0, 20.0, 19.0, 23.0, 8.0, 14.0, 7.0, 7.0, 9.0, 7.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0], "bins": [-0.002785205841064453, -0.0026930272579193115, -0.00260084867477417, -0.0025086700916290283, -0.0024164915084838867, -0.002324312925338745, -0.0022321343421936035, -0.002139955759048462, -0.0020477771759033203, -0.0019555985927581787, -0.0018634200096130371, -0.0017712414264678955, -0.001679062843322754, -0.0015868842601776123, -0.0014947056770324707, -0.001402527093887329, -0.0013103485107421875, -0.001218169927597046, -0.0011259913444519043, -0.0010338127613067627, -0.0009416341781616211, -0.0008494555950164795, -0.0007572770118713379, -0.0006650984287261963, -0.0005729198455810547, -0.0004807412624359131, -0.0003885626792907715, -0.0002963840961456299, -0.00020420551300048828, -0.00011202692985534668, -1.9848346710205078e-05, 7.233023643493652e-05, 0.00016450881958007812, 0.0002566874027252197, 0.00034886598587036133, 0.00044104456901550293, 0.0005332231521606445, 0.0006254017353057861, 0.0007175803184509277, 0.0008097589015960693, 0.0009019374847412109, 0.0009941160678863525, 0.0010862946510314941, 0.0011784732341766357, 0.0012706518173217773, 0.001362830400466919, 0.0014550089836120605, 0.0015471875667572021, 0.0016393661499023438, 0.0017315447330474854, 0.001823723316192627, 0.0019159018993377686, 0.00200808048248291, 0.0021002590656280518, 0.0021924376487731934, 0.002284616231918335, 0.0023767948150634766, 0.002468973398208618, 0.0025611519813537598, 0.0026533305644989014, 0.002745509147644043, 0.0028376877307891846, 0.002929866313934326, 0.0030220448970794678, 0.0031142234802246094]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 19.0, 18.0, 20.0, 33.0, 24.0, 34.0, 49.0, 34.0, 44.0, 46.0, 41.0, 45.0, 40.0, 46.0, 48.0, 42.0, 36.0, 35.0, 47.0, 46.0, 32.0, 29.0, 33.0, 26.0, 19.0, 18.0, 11.0, 10.0, 13.0, 12.0, 6.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.53656005859375, -5.3035888671875, -5.07061767578125, -4.837646484375, -4.60467529296875, -4.3717041015625, -4.13873291015625, -3.90576171875, -3.67279052734375, -3.4398193359375, -3.20684814453125, -2.973876953125, -2.74090576171875, -2.5079345703125, -2.27496337890625, -2.0419921875, -1.80902099609375, -1.5760498046875, -1.34307861328125, -1.110107421875, -0.87713623046875, -0.6441650390625, -0.41119384765625, -0.17822265625, 0.05474853515625, 0.2877197265625, 0.52069091796875, 0.753662109375, 0.98663330078125, 1.2196044921875, 1.45257568359375, 1.685546875, 1.91851806640625, 2.1514892578125, 2.38446044921875, 2.617431640625, 2.85040283203125, 3.0833740234375, 3.31634521484375, 3.54931640625, 3.78228759765625, 4.0152587890625, 4.24822998046875, 4.481201171875, 4.71417236328125, 4.9471435546875, 5.18011474609375, 5.4130859375, 5.64605712890625, 5.8790283203125, 6.11199951171875, 6.344970703125, 6.57794189453125, 6.8109130859375, 7.04388427734375, 7.27685546875, 7.50982666015625, 7.7427978515625, 7.97576904296875, 8.208740234375, 8.44171142578125, 8.6746826171875, 8.90765380859375, 9.140625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 16.0, 18.0, 24.0, 50.0, 59.0, 104.0, 116.0, 196.0, 254.0, 425.0, 842.0, 1698.0, 3977.0, 10705.0, 32398.0, 104769.0, 353094.0, 373539.0, 112091.0, 34410.0, 11528.0, 4264.0, 1806.0, 808.0, 457.0, 276.0, 170.0, 116.0, 86.0, 55.0, 48.0, 26.0, 34.0, 22.0, 14.0, 13.0, 8.0, 3.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.6378173828125, -6.361572265625, -6.0853271484375, -5.80908203125, -5.5328369140625, -5.256591796875, -4.9803466796875, -4.7041015625, -4.4278564453125, -4.151611328125, -3.8753662109375, -3.59912109375, -3.3228759765625, -3.046630859375, -2.7703857421875, -2.494140625, -2.2178955078125, -1.941650390625, -1.6654052734375, -1.38916015625, -1.1129150390625, -0.836669921875, -0.5604248046875, -0.2841796875, -0.0079345703125, 0.268310546875, 0.5445556640625, 0.82080078125, 1.0970458984375, 1.373291015625, 1.6495361328125, 1.92578125, 2.2020263671875, 2.478271484375, 2.7545166015625, 3.03076171875, 3.3070068359375, 3.583251953125, 3.8594970703125, 4.1357421875, 4.4119873046875, 4.688232421875, 4.9644775390625, 5.24072265625, 5.5169677734375, 5.793212890625, 6.0694580078125, 6.345703125, 6.6219482421875, 6.898193359375, 7.1744384765625, 7.45068359375, 7.7269287109375, 8.003173828125, 8.2794189453125, 8.5556640625, 8.8319091796875, 9.108154296875, 9.3843994140625, 9.66064453125, 9.9368896484375, 10.213134765625, 10.4893798828125, 10.765625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 6.0, 14.0, 17.0, 14.0, 25.0, 28.0, 24.0, 25.0, 37.0, 40.0, 38.0, 58.0, 81.0, 136.0, 341.0, 1488.0, 172.0, 76.0, 54.0, 53.0, 49.0, 38.0, 32.0, 28.0, 15.0, 28.0, 18.0, 17.0, 13.0, 11.0, 10.0, 9.0, 9.0, 9.0, 2.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.855224609375, -17.24169921875, -16.628173828125, -16.0146484375, -15.401123046875, -14.78759765625, -14.174072265625, -13.560546875, -12.947021484375, -12.33349609375, -11.719970703125, -11.1064453125, -10.492919921875, -9.87939453125, -9.265869140625, -8.65234375, -8.038818359375, -7.42529296875, -6.811767578125, -6.1982421875, -5.584716796875, -4.97119140625, -4.357666015625, -3.744140625, -3.130615234375, -2.51708984375, -1.903564453125, -1.2900390625, -0.676513671875, -0.06298828125, 0.550537109375, 1.1640625, 1.777587890625, 2.39111328125, 3.004638671875, 3.6181640625, 4.231689453125, 4.84521484375, 5.458740234375, 6.072265625, 6.685791015625, 7.29931640625, 7.912841796875, 8.5263671875, 9.139892578125, 9.75341796875, 10.366943359375, 10.98046875, 11.593994140625, 12.20751953125, 12.821044921875, 13.4345703125, 14.048095703125, 14.66162109375, 15.275146484375, 15.888671875, 16.502197265625, 17.11572265625, 17.729248046875, 18.3427734375, 18.956298828125, 19.56982421875, 20.183349609375, 20.796875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 3.0, 7.0, 15.0, 10.0, 18.0, 27.0, 33.0, 50.0, 71.0, 105.0, 144.0, 253.0, 378.0, 677.0, 2120.0, 62749.0, 2985416.0, 89167.0, 2581.0, 731.0, 396.0, 240.0, 165.0, 97.0, 69.0, 42.0, 28.0, 30.0, 18.0, 11.0, 12.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.40625, -36.3232421875, -35.240234375, -34.1572265625, -33.07421875, -31.9912109375, -30.908203125, -29.8251953125, -28.7421875, -27.6591796875, -26.576171875, -25.4931640625, -24.41015625, -23.3271484375, -22.244140625, -21.1611328125, -20.078125, -18.9951171875, -17.912109375, -16.8291015625, -15.74609375, -14.6630859375, -13.580078125, -12.4970703125, -11.4140625, -10.3310546875, -9.248046875, -8.1650390625, -7.08203125, -5.9990234375, -4.916015625, -3.8330078125, -2.75, -1.6669921875, -0.583984375, 0.4990234375, 1.58203125, 2.6650390625, 3.748046875, 4.8310546875, 5.9140625, 6.9970703125, 8.080078125, 9.1630859375, 10.24609375, 11.3291015625, 12.412109375, 13.4951171875, 14.578125, 15.6611328125, 16.744140625, 17.8271484375, 18.91015625, 19.9931640625, 21.076171875, 22.1591796875, 23.2421875, 24.3251953125, 25.408203125, 26.4912109375, 27.57421875, 28.6572265625, 29.740234375, 30.8232421875, 31.90625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 52.0, 137.0, 283.0, 280.0, 179.0, 59.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.78744506835938, -76.96009826660156, -75.13275146484375, -73.30540466308594, -71.47805786132812, -69.65071105957031, -67.8233642578125, -65.99602508544922, -64.1686782836914, -62.341331481933594, -60.51398468017578, -58.68663787841797, -56.85929489135742, -55.03194808959961, -53.2046012878418, -51.377254486083984, -49.54990768432617, -47.72256088256836, -45.89521408081055, -44.06787109375, -42.24052429199219, -40.413177490234375, -38.58583068847656, -36.75848388671875, -34.93113708496094, -33.103790283203125, -31.276445388793945, -29.449098587036133, -27.621753692626953, -25.79440689086914, -23.967060089111328, -22.139713287353516, -20.31237030029297, -18.485023498535156, -16.657678604125977, -14.830331802368164, -13.002985954284668, -11.175640106201172, -9.34829330444336, -7.520947456359863, -5.693601608276367, -3.866255521774292, -2.038909435272217, -0.2115631103515625, 1.6157827377319336, 3.4431285858154297, 5.270475387573242, 7.097821235656738, 8.925167083740234, 10.75251293182373, 12.579858779907227, 14.407205581665039, 16.23455047607422, 18.06189727783203, 19.889244079589844, 21.716590881347656, 23.543935775756836, 25.37128257751465, 27.198627471923828, 29.02597427368164, 30.853321075439453, 32.6806640625, 34.50801086425781, 36.335357666015625, 38.16270446777344]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 8.0, 11.0, 13.0, 16.0, 16.0, 19.0, 22.0, 24.0, 38.0, 17.0, 15.0, 48.0, 29.0, 30.0, 34.0, 42.0, 41.0, 41.0, 35.0, 50.0, 50.0, 44.0, 36.0, 35.0, 38.0, 27.0, 29.0, 33.0, 27.0, 18.0, 16.0, 17.0, 13.0, 14.0, 8.0, 9.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-46.361366271972656, -45.11009216308594, -43.858821868896484, -42.607547760009766, -41.35627746582031, -40.105003356933594, -38.853729248046875, -37.60245895385742, -36.3511848449707, -35.099910736083984, -33.84864044189453, -32.59736633300781, -31.346094131469727, -30.09482192993164, -28.843549728393555, -27.59227752685547, -26.341005325317383, -25.089733123779297, -23.83846092224121, -22.587188720703125, -21.335914611816406, -20.08464241027832, -18.833370208740234, -17.582096099853516, -16.330825805664062, -15.079553604125977, -13.828280448913574, -12.577008247375488, -11.325735092163086, -10.074462890625, -8.823190689086914, -7.571917533874512, -6.320644378662109, -5.069371700286865, -3.8180992603302, -2.566826820373535, -1.315554141998291, -0.06428146362304688, 1.186990737915039, 2.4382638931274414, 3.6895360946655273, 4.9408087730407715, 6.192081451416016, 7.443353652954102, 8.694625854492188, 9.94589900970459, 11.197171211242676, 12.448444366455078, 13.699716567993164, 14.95098876953125, 16.202260971069336, 17.453533172607422, 18.70480728149414, 19.956079483032227, 21.207351684570312, 22.45862579345703, 23.709896087646484, 24.96116828918457, 26.212440490722656, 27.463714599609375, 28.71498680114746, 29.966259002685547, 31.217531204223633, 32.46880340576172, 33.72007751464844]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 14.0, 10.0, 20.0, 23.0, 33.0, 24.0, 45.0, 41.0, 41.0, 48.0, 48.0, 53.0, 62.0, 37.0, 39.0, 51.0, 53.0, 46.0, 44.0, 32.0, 36.0, 28.0, 27.0, 20.0, 15.0, 23.0, 17.0, 2.0, 14.0, 14.0, 6.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.54046630859375, -6.2879638671875, -6.03546142578125, -5.782958984375, -5.53045654296875, -5.2779541015625, -5.02545166015625, -4.77294921875, -4.52044677734375, -4.2679443359375, -4.01544189453125, -3.762939453125, -3.51043701171875, -3.2579345703125, -3.00543212890625, -2.7529296875, -2.50042724609375, -2.2479248046875, -1.99542236328125, -1.742919921875, -1.49041748046875, -1.2379150390625, -0.98541259765625, -0.73291015625, -0.48040771484375, -0.2279052734375, 0.02459716796875, 0.277099609375, 0.52960205078125, 0.7821044921875, 1.03460693359375, 1.287109375, 1.53961181640625, 1.7921142578125, 2.04461669921875, 2.297119140625, 2.54962158203125, 2.8021240234375, 3.05462646484375, 3.30712890625, 3.55963134765625, 3.8121337890625, 4.06463623046875, 4.317138671875, 4.56964111328125, 4.8221435546875, 5.07464599609375, 5.3271484375, 5.57965087890625, 5.8321533203125, 6.08465576171875, 6.337158203125, 6.58966064453125, 6.8421630859375, 7.09466552734375, 7.34716796875, 7.59967041015625, 7.8521728515625, 8.10467529296875, 8.357177734375, 8.60968017578125, 8.8621826171875, 9.11468505859375, 9.3671875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 4.0, 11.0, 7.0, 12.0, 12.0, 18.0, 36.0, 39.0, 45.0, 55.0, 77.0, 139.0, 223.0, 427.0, 854.0, 2087.0, 7184.0, 31502.0, 175121.0, 813463.0, 1828719.0, 1056750.0, 226276.0, 38267.0, 8159.0, 2433.0, 1017.0, 491.0, 277.0, 163.0, 102.0, 67.0, 58.0, 37.0, 37.0, 16.0, 18.0, 13.0, 11.0, 12.0, 7.0, 5.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.125, -7.8677978515625, -7.610595703125, -7.3533935546875, -7.09619140625, -6.8389892578125, -6.581787109375, -6.3245849609375, -6.0673828125, -5.8101806640625, -5.552978515625, -5.2957763671875, -5.03857421875, -4.7813720703125, -4.524169921875, -4.2669677734375, -4.009765625, -3.7525634765625, -3.495361328125, -3.2381591796875, -2.98095703125, -2.7237548828125, -2.466552734375, -2.2093505859375, -1.9521484375, -1.6949462890625, -1.437744140625, -1.1805419921875, -0.92333984375, -0.6661376953125, -0.408935546875, -0.1517333984375, 0.10546875, 0.3626708984375, 0.619873046875, 0.8770751953125, 1.13427734375, 1.3914794921875, 1.648681640625, 1.9058837890625, 2.1630859375, 2.4202880859375, 2.677490234375, 2.9346923828125, 3.19189453125, 3.4490966796875, 3.706298828125, 3.9635009765625, 4.220703125, 4.4779052734375, 4.735107421875, 4.9923095703125, 5.24951171875, 5.5067138671875, 5.763916015625, 6.0211181640625, 6.2783203125, 6.5355224609375, 6.792724609375, 7.0499267578125, 7.30712890625, 7.5643310546875, 7.821533203125, 8.0787353515625, 8.3359375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 14.0, 9.0, 17.0, 14.0, 22.0, 31.0, 42.0, 46.0, 74.0, 93.0, 180.0, 206.0, 290.0, 386.0, 424.0, 476.0, 399.0, 349.0, 259.0, 176.0, 137.0, 107.0, 75.0, 57.0, 33.0, 25.0, 27.0, 15.0, 12.0, 12.0, 10.0, 8.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.6953125, -7.4332275390625, -7.171142578125, -6.9090576171875, -6.64697265625, -6.3848876953125, -6.122802734375, -5.8607177734375, -5.5986328125, -5.3365478515625, -5.074462890625, -4.8123779296875, -4.55029296875, -4.2882080078125, -4.026123046875, -3.7640380859375, -3.501953125, -3.2398681640625, -2.977783203125, -2.7156982421875, -2.45361328125, -2.1915283203125, -1.929443359375, -1.6673583984375, -1.4052734375, -1.1431884765625, -0.881103515625, -0.6190185546875, -0.35693359375, -0.0948486328125, 0.167236328125, 0.4293212890625, 0.69140625, 0.9534912109375, 1.215576171875, 1.4776611328125, 1.73974609375, 2.0018310546875, 2.263916015625, 2.5260009765625, 2.7880859375, 3.0501708984375, 3.312255859375, 3.5743408203125, 3.83642578125, 4.0985107421875, 4.360595703125, 4.6226806640625, 4.884765625, 5.1468505859375, 5.408935546875, 5.6710205078125, 5.93310546875, 6.1951904296875, 6.457275390625, 6.7193603515625, 6.9814453125, 7.2435302734375, 7.505615234375, 7.7677001953125, 8.02978515625, 8.2918701171875, 8.553955078125, 8.8160400390625, 9.078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 6.0, 3.0, 8.0, 14.0, 15.0, 14.0, 18.0, 33.0, 35.0, 49.0, 72.0, 114.0, 150.0, 234.0, 450.0, 1082.0, 3138.0, 11119.0, 55486.0, 470435.0, 2933348.0, 628935.0, 69460.0, 13665.0, 3745.0, 1277.0, 560.0, 282.0, 155.0, 111.0, 66.0, 47.0, 30.0, 33.0, 25.0, 14.0, 19.0, 6.0, 9.0, 9.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.4866943359375, -13.059326171875, -12.6319580078125, -12.20458984375, -11.7772216796875, -11.349853515625, -10.9224853515625, -10.4951171875, -10.0677490234375, -9.640380859375, -9.2130126953125, -8.78564453125, -8.3582763671875, -7.930908203125, -7.5035400390625, -7.076171875, -6.6488037109375, -6.221435546875, -5.7940673828125, -5.36669921875, -4.9393310546875, -4.511962890625, -4.0845947265625, -3.6572265625, -3.2298583984375, -2.802490234375, -2.3751220703125, -1.94775390625, -1.5203857421875, -1.093017578125, -0.6656494140625, -0.23828125, 0.1890869140625, 0.616455078125, 1.0438232421875, 1.47119140625, 1.8985595703125, 2.325927734375, 2.7532958984375, 3.1806640625, 3.6080322265625, 4.035400390625, 4.4627685546875, 4.89013671875, 5.3175048828125, 5.744873046875, 6.1722412109375, 6.599609375, 7.0269775390625, 7.454345703125, 7.8817138671875, 8.30908203125, 8.7364501953125, 9.163818359375, 9.5911865234375, 10.0185546875, 10.4459228515625, 10.873291015625, 11.3006591796875, 11.72802734375, 12.1553955078125, 12.582763671875, 13.0101318359375, 13.4375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 21.0, 119.0, 414.0, 359.0, 87.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.27662467956543, -26.41468048095703, -22.552738189697266, -18.6907958984375, -14.828851699829102, -10.966909408569336, -7.1049652099609375, -3.243021011352539, 0.6189212799072266, 4.480864524841309, 8.34280776977539, 12.204751014709473, 16.066694259643555, 19.92863655090332, 23.79058074951172, 27.652524948120117, 31.514467239379883, 35.37641143798828, 39.23835372924805, 43.10029602050781, 46.962242126464844, 50.824180603027344, 54.686126708984375, 58.548072814941406, 62.410011291503906, 66.27195739746094, 70.13389587402344, 73.99584197998047, 77.8577880859375, 81.7197265625, 85.58167266845703, 89.44361877441406, 93.30555725097656, 97.1675033569336, 101.0294418334961, 104.89138793945312, 108.75332641601562, 112.61527252197266, 116.47721862792969, 120.33915710449219, 124.20110321044922, 128.06304931640625, 131.92498779296875, 135.78692626953125, 139.6488800048828, 143.5108184814453, 147.3727569580078, 151.23471069335938, 155.09664916992188, 158.95858764648438, 162.82054138183594, 166.68247985839844, 170.54441833496094, 174.4063720703125, 178.268310546875, 182.1302490234375, 185.9921875, 189.8541259765625, 193.71607971191406, 197.57801818847656, 201.43995666503906, 205.30191040039062, 209.16384887695312, 213.02578735351562, 216.8877410888672]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 18.0, 20.0, 13.0, 19.0, 27.0, 25.0, 30.0, 34.0, 41.0, 43.0, 38.0, 47.0, 52.0, 46.0, 66.0, 45.0, 43.0, 39.0, 35.0, 42.0, 33.0, 34.0, 31.0, 32.0, 20.0, 20.0, 12.0, 12.0, 12.0, 10.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.29904556274414, -39.17722702026367, -38.05541229248047, -36.93359375, -35.81177520751953, -34.68995666503906, -33.568138122558594, -32.44632339477539, -31.324504852294922, -30.202686309814453, -29.080869674682617, -27.95905303955078, -26.837234497070312, -25.715415954589844, -24.593599319458008, -23.471782684326172, -22.349964141845703, -21.228145599365234, -20.1063289642334, -18.984512329101562, -17.862693786621094, -16.740875244140625, -15.619058609008789, -14.497241020202637, -13.375423431396484, -12.253605842590332, -11.13178825378418, -10.009970664978027, -8.888153076171875, -7.766335487365723, -6.64451789855957, -5.522700309753418, -4.400886535644531, -3.279068946838379, -2.1572513580322266, -1.0354337692260742, 0.08638381958007812, 1.2082014083862305, 2.330018997192383, 3.451836585998535, 4.5736541748046875, 5.69547176361084, 6.817289352416992, 7.9391069412231445, 9.060924530029297, 10.18274211883545, 11.304559707641602, 12.426377296447754, 13.548194885253906, 14.670012474060059, 15.791830062866211, 16.913646697998047, 18.035465240478516, 19.157283782958984, 20.27910041809082, 21.400917053222656, 22.522735595703125, 23.644554138183594, 24.76637077331543, 25.888187408447266, 27.010005950927734, 28.131824493408203, 29.25364112854004, 30.375457763671875, 31.497276306152344]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 9.0, 15.0, 12.0, 15.0, 11.0, 19.0, 17.0, 26.0, 28.0, 40.0, 38.0, 39.0, 50.0, 40.0, 43.0, 33.0, 49.0, 49.0, 46.0, 47.0, 41.0, 28.0, 28.0, 30.0, 23.0, 35.0, 22.0, 20.0, 20.0, 21.0, 19.0, 10.0, 4.0, 7.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.20001220703125, -5.9859619140625, -5.77191162109375, -5.557861328125, -5.34381103515625, -5.1297607421875, -4.91571044921875, -4.70166015625, -4.48760986328125, -4.2735595703125, -4.05950927734375, -3.845458984375, -3.63140869140625, -3.4173583984375, -3.20330810546875, -2.9892578125, -2.77520751953125, -2.5611572265625, -2.34710693359375, -2.133056640625, -1.91900634765625, -1.7049560546875, -1.49090576171875, -1.27685546875, -1.06280517578125, -0.8487548828125, -0.63470458984375, -0.420654296875, -0.20660400390625, 0.0074462890625, 0.22149658203125, 0.435546875, 0.64959716796875, 0.8636474609375, 1.07769775390625, 1.291748046875, 1.50579833984375, 1.7198486328125, 1.93389892578125, 2.14794921875, 2.36199951171875, 2.5760498046875, 2.79010009765625, 3.004150390625, 3.21820068359375, 3.4322509765625, 3.64630126953125, 3.8603515625, 4.07440185546875, 4.2884521484375, 4.50250244140625, 4.716552734375, 4.93060302734375, 5.1446533203125, 5.35870361328125, 5.57275390625, 5.78680419921875, 6.0008544921875, 6.21490478515625, 6.428955078125, 6.64300537109375, 6.8570556640625, 7.07110595703125, 7.28515625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 6.0, 10.0, 29.0, 44.0, 87.0, 150.0, 221.0, 361.0, 532.0, 790.0, 1338.0, 2112.0, 3489.0, 5370.0, 8675.0, 14211.0, 23304.0, 38932.0, 65513.0, 117317.0, 213992.0, 235862.0, 132460.0, 74111.0, 43157.0, 25658.0, 15416.0, 9592.0, 5862.0, 3743.0, 2266.0, 1454.0, 811.0, 614.0, 422.0, 237.0, 158.0, 95.0, 58.0, 33.0, 14.0, 6.0, 9.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.734375, -0.7099761962890625, -0.685577392578125, -0.6611785888671875, -0.63677978515625, -0.6123809814453125, -0.587982177734375, -0.5635833740234375, -0.5391845703125, -0.5147857666015625, -0.490386962890625, -0.4659881591796875, -0.44158935546875, -0.4171905517578125, -0.392791748046875, -0.3683929443359375, -0.343994140625, -0.3195953369140625, -0.295196533203125, -0.2707977294921875, -0.24639892578125, -0.2220001220703125, -0.197601318359375, -0.1732025146484375, -0.1488037109375, -0.1244049072265625, -0.100006103515625, -0.0756072998046875, -0.05120849609375, -0.0268096923828125, -0.002410888671875, 0.0219879150390625, 0.04638671875, 0.0707855224609375, 0.095184326171875, 0.1195831298828125, 0.14398193359375, 0.1683807373046875, 0.192779541015625, 0.2171783447265625, 0.2415771484375, 0.2659759521484375, 0.290374755859375, 0.3147735595703125, 0.33917236328125, 0.3635711669921875, 0.387969970703125, 0.4123687744140625, 0.436767578125, 0.4611663818359375, 0.485565185546875, 0.5099639892578125, 0.53436279296875, 0.5587615966796875, 0.583160400390625, 0.6075592041015625, 0.6319580078125, 0.6563568115234375, 0.680755615234375, 0.7051544189453125, 0.72955322265625, 0.7539520263671875, 0.778350830078125, 0.8027496337890625, 0.8271484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 11.0, 7.0, 17.0, 12.0, 12.0, 6.0, 16.0, 23.0, 30.0, 19.0, 27.0, 31.0, 27.0, 37.0, 36.0, 31.0, 34.0, 38.0, 31.0, 1057.0, 41.0, 34.0, 46.0, 40.0, 40.0, 22.0, 39.0, 26.0, 26.0, 29.0, 21.0, 25.0, 16.0, 23.0, 19.0, 12.0, 9.0, 9.0, 7.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.24609375, -4.11737060546875, -3.9886474609375, -3.85992431640625, -3.731201171875, -3.60247802734375, -3.4737548828125, -3.34503173828125, -3.21630859375, -3.08758544921875, -2.9588623046875, -2.83013916015625, -2.701416015625, -2.57269287109375, -2.4439697265625, -2.31524658203125, -2.1865234375, -2.05780029296875, -1.9290771484375, -1.80035400390625, -1.671630859375, -1.54290771484375, -1.4141845703125, -1.28546142578125, -1.15673828125, -1.02801513671875, -0.8992919921875, -0.77056884765625, -0.641845703125, -0.51312255859375, -0.3843994140625, -0.25567626953125, -0.126953125, 0.00177001953125, 0.1304931640625, 0.25921630859375, 0.387939453125, 0.51666259765625, 0.6453857421875, 0.77410888671875, 0.90283203125, 1.03155517578125, 1.1602783203125, 1.28900146484375, 1.417724609375, 1.54644775390625, 1.6751708984375, 1.80389404296875, 1.9326171875, 2.06134033203125, 2.1900634765625, 2.31878662109375, 2.447509765625, 2.57623291015625, 2.7049560546875, 2.83367919921875, 2.96240234375, 3.09112548828125, 3.2198486328125, 3.34857177734375, 3.477294921875, 3.60601806640625, 3.7347412109375, 3.86346435546875, 3.9921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 8.0, 8.0, 7.0, 23.0, 17.0, 31.0, 54.0, 71.0, 88.0, 135.0, 200.0, 261.0, 390.0, 545.0, 785.0, 1152.0, 1574.0, 2218.0, 3175.0, 4598.0, 6515.0, 9717.0, 14310.0, 20961.0, 31793.0, 49014.0, 75595.0, 118144.0, 707244.0, 706619.0, 118759.0, 75671.0, 48681.0, 32077.0, 21055.0, 14286.0, 9611.0, 6609.0, 4594.0, 3187.0, 2115.0, 1520.0, 1113.0, 810.0, 540.0, 381.0, 268.0, 149.0, 144.0, 98.0, 72.0, 41.0, 37.0, 21.0, 16.0, 12.0, 8.0, 10.0, 4.0, 3.0, 1.0], "bins": [-0.5849609375, -0.566680908203125, -0.54840087890625, -0.530120849609375, -0.5118408203125, -0.493560791015625, -0.47528076171875, -0.457000732421875, -0.438720703125, -0.420440673828125, -0.40216064453125, -0.383880615234375, -0.3656005859375, -0.347320556640625, -0.32904052734375, -0.310760498046875, -0.29248046875, -0.274200439453125, -0.25592041015625, -0.237640380859375, -0.2193603515625, -0.201080322265625, -0.18280029296875, -0.164520263671875, -0.146240234375, -0.127960205078125, -0.10968017578125, -0.091400146484375, -0.0731201171875, -0.054840087890625, -0.03656005859375, -0.018280029296875, 0.0, 0.018280029296875, 0.03656005859375, 0.054840087890625, 0.0731201171875, 0.091400146484375, 0.10968017578125, 0.127960205078125, 0.146240234375, 0.164520263671875, 0.18280029296875, 0.201080322265625, 0.2193603515625, 0.237640380859375, 0.25592041015625, 0.274200439453125, 0.29248046875, 0.310760498046875, 0.32904052734375, 0.347320556640625, 0.3656005859375, 0.383880615234375, 0.40216064453125, 0.420440673828125, 0.438720703125, 0.457000732421875, 0.47528076171875, 0.493560791015625, 0.5118408203125, 0.530120849609375, 0.54840087890625, 0.566680908203125, 0.5849609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 10.0, 8.0, 6.0, 11.0, 12.0, 13.0, 15.0, 26.0, 25.0, 26.0, 37.0, 53.0, 66.0, 54.0, 92.0, 117.0, 79.0, 71.0, 60.0, 43.0, 23.0, 21.0, 28.0, 27.0, 20.0, 7.0, 6.0, 12.0, 1.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005321502685546875, -0.005140066146850586, -0.004958629608154297, -0.004777193069458008, -0.004595756530761719, -0.00441431999206543, -0.004232883453369141, -0.0040514469146728516, -0.0038700103759765625, -0.0036885738372802734, -0.0035071372985839844, -0.0033257007598876953, -0.0031442642211914062, -0.002962827682495117, -0.002781391143798828, -0.002599954605102539, -0.00241851806640625, -0.002237081527709961, -0.002055644989013672, -0.0018742084503173828, -0.0016927719116210938, -0.0015113353729248047, -0.0013298988342285156, -0.0011484622955322266, -0.0009670257568359375, -0.0007855892181396484, -0.0006041526794433594, -0.0004227161407470703, -0.00024127960205078125, -5.984306335449219e-05, 0.00012159347534179688, 0.00030303001403808594, 0.000484466552734375, 0.0006659030914306641, 0.0008473396301269531, 0.0010287761688232422, 0.0012102127075195312, 0.0013916492462158203, 0.0015730857849121094, 0.0017545223236083984, 0.0019359588623046875, 0.0021173954010009766, 0.0022988319396972656, 0.0024802684783935547, 0.0026617050170898438, 0.002843141555786133, 0.003024578094482422, 0.003206014633178711, 0.003387451171875, 0.003568887710571289, 0.003750324249267578, 0.003931760787963867, 0.004113197326660156, 0.004294633865356445, 0.004476070404052734, 0.0046575069427490234, 0.0048389434814453125, 0.0050203800201416016, 0.005201816558837891, 0.00538325309753418, 0.005564689636230469, 0.005746126174926758, 0.005927562713623047, 0.006108999252319336, 0.006290435791015625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 13.0, 12.0, 16.0, 21.0, 21.0, 55.0, 70.0, 72.0, 98.0, 132.0, 249.0, 454.0, 1114.0, 788252.0, 255682.0, 955.0, 446.0, 292.0, 134.0, 99.0, 83.0, 43.0, 45.0, 38.0, 26.0, 19.0, 21.0, 19.0, 9.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.12371826171875, -0.1201791763305664, -0.11664009094238281, -0.11310100555419922, -0.10956192016601562, -0.10602283477783203, -0.10248374938964844, -0.09894466400146484, -0.09540557861328125, -0.09186649322509766, -0.08832740783691406, -0.08478832244873047, -0.08124923706054688, -0.07771015167236328, -0.07417106628417969, -0.0706319808959961, -0.0670928955078125, -0.0635538101196289, -0.06001472473144531, -0.05647563934326172, -0.052936553955078125, -0.04939746856689453, -0.04585838317871094, -0.042319297790527344, -0.03878021240234375, -0.035241127014160156, -0.03170204162597656, -0.02816295623779297, -0.024623870849609375, -0.02108478546142578, -0.017545700073242188, -0.014006614685058594, -0.010467529296875, -0.006928443908691406, -0.0033893585205078125, 0.00014972686767578125, 0.003688812255859375, 0.007227897644042969, 0.010766983032226562, 0.014306068420410156, 0.01784515380859375, 0.021384239196777344, 0.024923324584960938, 0.02846240997314453, 0.032001495361328125, 0.03554058074951172, 0.03907966613769531, 0.042618751525878906, 0.0461578369140625, 0.049696922302246094, 0.05323600769042969, 0.05677509307861328, 0.060314178466796875, 0.06385326385498047, 0.06739234924316406, 0.07093143463134766, 0.07447052001953125, 0.07800960540771484, 0.08154869079589844, 0.08508777618408203, 0.08862686157226562, 0.09216594696044922, 0.09570503234863281, 0.0992441177368164, 0.102783203125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 15.0, 87.0, 330.0, 385.0, 153.0, 36.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006570666562765837, -0.006337686907500029, -0.006104706786572933, -0.005871727131307125, -0.005638747476041317, -0.005405767820775509, -0.005172788165509701, -0.004939808044582605, -0.004706828389316797, -0.004473848734050989, -0.004240868613123894, -0.004007888957858086, -0.0037749093025922775, -0.0035419296473264694, -0.0033089497592300177, -0.003075969871133566, -0.002842990215867758, -0.0026100105606019497, -0.002377030672505498, -0.002144050784409046, -0.001911071129143238, -0.0016780913574621081, -0.0014451115857809782, -0.0012121318140998483, -0.0009791520424187183, -0.0007461722707375884, -0.0005131924990564585, -0.00028021272737532854, -4.723295569419861e-05, 0.00018574681598693132, 0.00041872658766806126, 0.0006517063593491912, 0.0008846856653690338, 0.0011176654370501637, 0.0013506452087312937, 0.0015836249804124236, 0.0018166047520935535, 0.0020495844073593616, 0.0022825642954558134, 0.002515544183552265, 0.0027485238388180733, 0.0029815034940838814, 0.003214483382180333, 0.003447463270276785, 0.003680442925542593, 0.003913422580808401, 0.0041464027017354965, 0.004379382357001305, 0.004612362012267113, 0.004845341667532921, 0.005078321322798729, 0.005311301443725824, 0.0055442810989916325, 0.005777260754257441, 0.006010240875184536, 0.006243220530450344, 0.006476200185716152, 0.00670917984098196, 0.006942159496247768, 0.007175139617174864, 0.007408119272440672, 0.00764109892770648, 0.007874079048633575, 0.008107058703899384, 0.008340038359165192]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 12.0, 7.0, 10.0, 12.0, 15.0, 10.0, 17.0, 21.0, 17.0, 16.0, 28.0, 25.0, 37.0, 36.0, 55.0, 37.0, 49.0, 40.0, 32.0, 45.0, 44.0, 48.0, 49.0, 36.0, 45.0, 45.0, 27.0, 25.0, 24.0, 26.0, 17.0, 18.0, 17.0, 9.0, 15.0, 7.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0028798580169677734, -0.002792659215629101, -0.002705460414290428, -0.0026182616129517555, -0.002531062811613083, -0.0024438640102744102, -0.0023566652089357376, -0.002269466407597065, -0.0021822676062583923, -0.0020950688049197197, -0.002007870003581047, -0.0019206712022423744, -0.0018334724009037018, -0.0017462735995650291, -0.0016590747982263565, -0.0015718759968876839, -0.0014846771955490112, -0.0013974783942103386, -0.001310279592871666, -0.0012230807915329933, -0.0011358819901943207, -0.001048683188855648, -0.0009614843875169754, -0.0008742855861783028, -0.0007870867848396301, -0.0006998879835009575, -0.0006126891821622849, -0.0005254903808236122, -0.0004382915794849396, -0.00035109277814626694, -0.0002638939768075943, -0.00017669517546892166, -8.949637413024902e-05, -2.2975727915763855e-06, 8.490122854709625e-05, 0.0001721000298857689, 0.00025929883122444153, 0.00034649763256311417, 0.0004336964339017868, 0.0005208952352404594, 0.0006080940365791321, 0.0006952928379178047, 0.0007824916392564774, 0.00086969044059515, 0.0009568892419338226, 0.0010440880432724953, 0.001131286844611168, 0.0012184856459498405, 0.0013056844472885132, 0.0013928832486271858, 0.0014800820499658585, 0.001567280851304531, 0.0016544796526432037, 0.0017416784539818764, 0.001828877255320549, 0.0019160760566592216, 0.0020032748579978943, 0.002090473659336567, 0.0021776724606752396, 0.002264871262013912, 0.002352070063352585, 0.0024392688646912575, 0.00252646766602993, 0.0026136664673686028, 0.0027008652687072754]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 9.0, 15.0, 12.0, 15.0, 11.0, 19.0, 17.0, 26.0, 28.0, 40.0, 38.0, 39.0, 50.0, 42.0, 41.0, 33.0, 49.0, 49.0, 46.0, 47.0, 41.0, 28.0, 28.0, 30.0, 23.0, 35.0, 22.0, 20.0, 19.0, 22.0, 19.0, 10.0, 4.0, 7.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.20001220703125, -5.9859619140625, -5.77191162109375, -5.557861328125, -5.34381103515625, -5.1297607421875, -4.91571044921875, -4.70166015625, -4.48760986328125, -4.2735595703125, -4.05950927734375, -3.845458984375, -3.63140869140625, -3.4173583984375, -3.20330810546875, -2.9892578125, -2.77520751953125, -2.5611572265625, -2.34710693359375, -2.133056640625, -1.91900634765625, -1.7049560546875, -1.49090576171875, -1.27685546875, -1.06280517578125, -0.8487548828125, -0.63470458984375, -0.420654296875, -0.20660400390625, 0.0074462890625, 0.22149658203125, 0.435546875, 0.64959716796875, 0.8636474609375, 1.07769775390625, 1.291748046875, 1.50579833984375, 1.7198486328125, 1.93389892578125, 2.14794921875, 2.36199951171875, 2.5760498046875, 2.79010009765625, 3.004150390625, 3.21820068359375, 3.4322509765625, 3.64630126953125, 3.8603515625, 4.07440185546875, 4.2884521484375, 4.50250244140625, 4.716552734375, 4.93060302734375, 5.1446533203125, 5.35870361328125, 5.57275390625, 5.78680419921875, 6.0008544921875, 6.21490478515625, 6.428955078125, 6.64300537109375, 6.8570556640625, 7.07110595703125, 7.28515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 12.0, 16.0, 15.0, 22.0, 21.0, 36.0, 39.0, 68.0, 100.0, 113.0, 135.0, 174.0, 215.0, 342.0, 487.0, 769.0, 1429.0, 2919.0, 8011.0, 25625.0, 87169.0, 265628.0, 401220.0, 173810.0, 53651.0, 15856.0, 5139.0, 2212.0, 1103.0, 595.0, 402.0, 317.0, 199.0, 156.0, 120.0, 94.0, 68.0, 67.0, 42.0, 45.0, 21.0, 24.0, 17.0, 19.0, 4.0, 5.0, 4.0, 6.0, 1.0, 5.0, 1.0, 1.0], "bins": [-9.234375, -8.96514892578125, -8.6959228515625, -8.42669677734375, -8.157470703125, -7.88824462890625, -7.6190185546875, -7.34979248046875, -7.08056640625, -6.81134033203125, -6.5421142578125, -6.27288818359375, -6.003662109375, -5.73443603515625, -5.4652099609375, -5.19598388671875, -4.9267578125, -4.65753173828125, -4.3883056640625, -4.11907958984375, -3.849853515625, -3.58062744140625, -3.3114013671875, -3.04217529296875, -2.77294921875, -2.50372314453125, -2.2344970703125, -1.96527099609375, -1.696044921875, -1.42681884765625, -1.1575927734375, -0.88836669921875, -0.619140625, -0.34991455078125, -0.0806884765625, 0.18853759765625, 0.457763671875, 0.72698974609375, 0.9962158203125, 1.26544189453125, 1.53466796875, 1.80389404296875, 2.0731201171875, 2.34234619140625, 2.611572265625, 2.88079833984375, 3.1500244140625, 3.41925048828125, 3.6884765625, 3.95770263671875, 4.2269287109375, 4.49615478515625, 4.765380859375, 5.03460693359375, 5.3038330078125, 5.57305908203125, 5.84228515625, 6.11151123046875, 6.3807373046875, 6.64996337890625, 6.919189453125, 7.18841552734375, 7.4576416015625, 7.72686767578125, 7.99609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 10.0, 7.0, 15.0, 18.0, 20.0, 19.0, 23.0, 25.0, 32.0, 36.0, 39.0, 50.0, 54.0, 71.0, 90.0, 152.0, 1361.0, 329.0, 166.0, 91.0, 65.0, 41.0, 50.0, 37.0, 39.0, 27.0, 22.0, 18.0, 27.0, 17.0, 16.0, 13.0, 5.0, 7.0, 9.0, 3.0, 9.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-19.734375, -19.2005615234375, -18.666748046875, -18.1329345703125, -17.59912109375, -17.0653076171875, -16.531494140625, -15.9976806640625, -15.4638671875, -14.9300537109375, -14.396240234375, -13.8624267578125, -13.32861328125, -12.7947998046875, -12.260986328125, -11.7271728515625, -11.193359375, -10.6595458984375, -10.125732421875, -9.5919189453125, -9.05810546875, -8.5242919921875, -7.990478515625, -7.4566650390625, -6.9228515625, -6.3890380859375, -5.855224609375, -5.3214111328125, -4.78759765625, -4.2537841796875, -3.719970703125, -3.1861572265625, -2.65234375, -2.1185302734375, -1.584716796875, -1.0509033203125, -0.51708984375, 0.0167236328125, 0.550537109375, 1.0843505859375, 1.6181640625, 2.1519775390625, 2.685791015625, 3.2196044921875, 3.75341796875, 4.2872314453125, 4.821044921875, 5.3548583984375, 5.888671875, 6.4224853515625, 6.956298828125, 7.4901123046875, 8.02392578125, 8.5577392578125, 9.091552734375, 9.6253662109375, 10.1591796875, 10.6929931640625, 11.226806640625, 11.7606201171875, 12.29443359375, 12.8282470703125, 13.362060546875, 13.8958740234375, 14.4296875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 10.0, 7.0, 8.0, 15.0, 13.0, 16.0, 32.0, 32.0, 37.0, 63.0, 85.0, 151.0, 181.0, 280.0, 416.0, 712.0, 1614.0, 21414.0, 2758155.0, 354686.0, 4923.0, 1033.0, 589.0, 356.0, 221.0, 158.0, 130.0, 90.0, 72.0, 43.0, 37.0, 32.0, 17.0, 19.0, 13.0, 11.0, 10.0, 6.0, 10.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.40625, -35.35986328125, -34.3134765625, -33.26708984375, -32.220703125, -31.17431640625, -30.1279296875, -29.08154296875, -28.03515625, -26.98876953125, -25.9423828125, -24.89599609375, -23.849609375, -22.80322265625, -21.7568359375, -20.71044921875, -19.6640625, -18.61767578125, -17.5712890625, -16.52490234375, -15.478515625, -14.43212890625, -13.3857421875, -12.33935546875, -11.29296875, -10.24658203125, -9.2001953125, -8.15380859375, -7.107421875, -6.06103515625, -5.0146484375, -3.96826171875, -2.921875, -1.87548828125, -0.8291015625, 0.21728515625, 1.263671875, 2.31005859375, 3.3564453125, 4.40283203125, 5.44921875, 6.49560546875, 7.5419921875, 8.58837890625, 9.634765625, 10.68115234375, 11.7275390625, 12.77392578125, 13.8203125, 14.86669921875, 15.9130859375, 16.95947265625, 18.005859375, 19.05224609375, 20.0986328125, 21.14501953125, 22.19140625, 23.23779296875, 24.2841796875, 25.33056640625, 26.376953125, 27.42333984375, 28.4697265625, 29.51611328125, 30.5625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 21.0, 168.0, 520.0, 267.0, 39.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.81574630737305, -38.499183654785156, -35.182621002197266, -31.866056442260742, -28.54949188232422, -25.232929229736328, -21.916366577148438, -18.599802017211914, -15.283239364624023, -11.966675758361816, -8.65011215209961, -5.333549499511719, -2.0169858932495117, 1.2995777130126953, 4.616140365600586, 7.932704925537109, 11.249267578125, 14.565831184387207, 17.882394790649414, 21.198957443237305, 24.515522003173828, 27.83208465576172, 31.14864730834961, 34.4652099609375, 37.781776428222656, 41.09833908081055, 44.41490173339844, 47.731468200683594, 51.048030853271484, 54.364593505859375, 57.681156158447266, 60.997718811035156, 64.31427764892578, 67.63084411621094, 70.94740295410156, 74.26396942138672, 77.58052825927734, 80.8970947265625, 84.21365356445312, 87.53022003173828, 90.84678649902344, 94.1633529663086, 97.47991180419922, 100.79647827148438, 104.113037109375, 107.42960357666016, 110.74617004394531, 114.06272888183594, 117.37928771972656, 120.69585418701172, 124.01241302490234, 127.3289794921875, 130.64553833007812, 133.96209716796875, 137.27867126464844, 140.59523010253906, 143.91180419921875, 147.22836303710938, 150.54493713378906, 153.8614959716797, 157.1780548095703, 160.49462890625, 163.81118774414062, 167.12774658203125, 170.44430541992188]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 13.0, 11.0, 14.0, 15.0, 21.0, 28.0, 33.0, 28.0, 38.0, 29.0, 39.0, 49.0, 31.0, 48.0, 43.0, 54.0, 36.0, 40.0, 50.0, 42.0, 45.0, 32.0, 40.0, 24.0, 22.0, 26.0, 23.0, 18.0, 19.0, 12.0, 15.0, 13.0, 7.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.16120147705078, -37.803550720214844, -36.445899963378906, -35.08824920654297, -33.73059844970703, -32.372947692871094, -31.01529884338379, -29.65764808654785, -28.299997329711914, -26.942346572875977, -25.58469581604004, -24.227046966552734, -22.869396209716797, -21.51174545288086, -20.154094696044922, -18.796443939208984, -17.438793182373047, -16.08114242553711, -14.723491668701172, -13.36584186553955, -12.008191108703613, -10.650540351867676, -9.292890548706055, -7.935239791870117, -6.57758903503418, -5.219938278198242, -3.862287998199463, -2.5046377182006836, -1.146986961364746, 0.2106637954711914, 1.5683135986328125, 2.92596435546875, 4.283618927001953, 5.641269683837891, 6.99891996383667, 8.35657024383545, 9.714221000671387, 11.071871757507324, 12.429521560668945, 13.787172317504883, 15.14482307434082, 16.502473831176758, 17.860124588012695, 19.2177734375, 20.575424194335938, 21.933074951171875, 23.290725708007812, 24.64837646484375, 26.006027221679688, 27.363677978515625, 28.721328735351562, 30.0789794921875, 31.436630249023438, 32.794281005859375, 34.15193176269531, 35.50958251953125, 36.86723327636719, 38.224884033203125, 39.58253479003906, 40.940185546875, 42.29783630371094, 43.655487060546875, 45.01313781738281, 46.37078857421875, 47.72843551635742]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 11.0, 16.0, 15.0, 11.0, 22.0, 17.0, 19.0, 31.0, 35.0, 35.0, 35.0, 53.0, 49.0, 48.0, 44.0, 42.0, 52.0, 51.0, 53.0, 33.0, 33.0, 35.0, 32.0, 22.0, 17.0, 20.0, 29.0, 16.0, 16.0, 15.0, 11.0, 17.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.90625, -5.6796875, -5.453125, -5.2265625, -5.0, -4.7734375, -4.546875, -4.3203125, -4.09375, -3.8671875, -3.640625, -3.4140625, -3.1875, -2.9609375, -2.734375, -2.5078125, -2.28125, -2.0546875, -1.828125, -1.6015625, -1.375, -1.1484375, -0.921875, -0.6953125, -0.46875, -0.2421875, -0.015625, 0.2109375, 0.4375, 0.6640625, 0.890625, 1.1171875, 1.34375, 1.5703125, 1.796875, 2.0234375, 2.25, 2.4765625, 2.703125, 2.9296875, 3.15625, 3.3828125, 3.609375, 3.8359375, 4.0625, 4.2890625, 4.515625, 4.7421875, 4.96875, 5.1953125, 5.421875, 5.6484375, 5.875, 6.1015625, 6.328125, 6.5546875, 6.78125, 7.0078125, 7.234375, 7.4609375, 7.6875, 7.9140625, 8.140625, 8.3671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 10.0, 8.0, 8.0, 13.0, 16.0, 13.0, 20.0, 28.0, 28.0, 41.0, 52.0, 57.0, 91.0, 112.0, 141.0, 207.0, 251.0, 334.0, 484.0, 2739.0, 4104991.0, 82246.0, 762.0, 375.0, 276.0, 210.0, 190.0, 122.0, 101.0, 65.0, 59.0, 53.0, 23.0, 30.0, 27.0, 14.0, 13.0, 16.0, 15.0, 7.0, 4.0, 7.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.0625, -65.9169921875, -63.771484375, -61.6259765625, -59.48046875, -57.3349609375, -55.189453125, -53.0439453125, -50.8984375, -48.7529296875, -46.607421875, -44.4619140625, -42.31640625, -40.1708984375, -38.025390625, -35.8798828125, -33.734375, -31.5888671875, -29.443359375, -27.2978515625, -25.15234375, -23.0068359375, -20.861328125, -18.7158203125, -16.5703125, -14.4248046875, -12.279296875, -10.1337890625, -7.98828125, -5.8427734375, -3.697265625, -1.5517578125, 0.59375, 2.7392578125, 4.884765625, 7.0302734375, 9.17578125, 11.3212890625, 13.466796875, 15.6123046875, 17.7578125, 19.9033203125, 22.048828125, 24.1943359375, 26.33984375, 28.4853515625, 30.630859375, 32.7763671875, 34.921875, 37.0673828125, 39.212890625, 41.3583984375, 43.50390625, 45.6494140625, 47.794921875, 49.9404296875, 52.0859375, 54.2314453125, 56.376953125, 58.5224609375, 60.66796875, 62.8134765625, 64.958984375, 67.1044921875, 69.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 8.0, 4.0, 12.0, 14.0, 9.0, 21.0, 21.0, 31.0, 39.0, 48.0, 70.0, 122.0, 156.0, 254.0, 411.0, 538.0, 567.0, 541.0, 391.0, 251.0, 168.0, 93.0, 79.0, 54.0, 29.0, 38.0, 23.0, 15.0, 15.0, 15.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.546875, -10.201416015625, -9.85595703125, -9.510498046875, -9.1650390625, -8.819580078125, -8.47412109375, -8.128662109375, -7.783203125, -7.437744140625, -7.09228515625, -6.746826171875, -6.4013671875, -6.055908203125, -5.71044921875, -5.364990234375, -5.01953125, -4.674072265625, -4.32861328125, -3.983154296875, -3.6376953125, -3.292236328125, -2.94677734375, -2.601318359375, -2.255859375, -1.910400390625, -1.56494140625, -1.219482421875, -0.8740234375, -0.528564453125, -0.18310546875, 0.162353515625, 0.5078125, 0.853271484375, 1.19873046875, 1.544189453125, 1.8896484375, 2.235107421875, 2.58056640625, 2.926025390625, 3.271484375, 3.616943359375, 3.96240234375, 4.307861328125, 4.6533203125, 4.998779296875, 5.34423828125, 5.689697265625, 6.03515625, 6.380615234375, 6.72607421875, 7.071533203125, 7.4169921875, 7.762451171875, 8.10791015625, 8.453369140625, 8.798828125, 9.144287109375, 9.48974609375, 9.835205078125, 10.1806640625, 10.526123046875, 10.87158203125, 11.217041015625, 11.5625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 7.0, 8.0, 16.0, 14.0, 19.0, 30.0, 26.0, 43.0, 68.0, 71.0, 166.0, 458.0, 3071.0, 775722.0, 3407622.0, 5796.0, 607.0, 214.0, 93.0, 54.0, 46.0, 35.0, 18.0, 23.0, 17.0, 11.0, 6.0, 4.0, 3.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.6875, -45.990234375, -44.29296875, -42.595703125, -40.8984375, -39.201171875, -37.50390625, -35.806640625, -34.109375, -32.412109375, -30.71484375, -29.017578125, -27.3203125, -25.623046875, -23.92578125, -22.228515625, -20.53125, -18.833984375, -17.13671875, -15.439453125, -13.7421875, -12.044921875, -10.34765625, -8.650390625, -6.953125, -5.255859375, -3.55859375, -1.861328125, -0.1640625, 1.533203125, 3.23046875, 4.927734375, 6.625, 8.322265625, 10.01953125, 11.716796875, 13.4140625, 15.111328125, 16.80859375, 18.505859375, 20.203125, 21.900390625, 23.59765625, 25.294921875, 26.9921875, 28.689453125, 30.38671875, 32.083984375, 33.78125, 35.478515625, 37.17578125, 38.873046875, 40.5703125, 42.267578125, 43.96484375, 45.662109375, 47.359375, 49.056640625, 50.75390625, 52.451171875, 54.1484375, 55.845703125, 57.54296875, 59.240234375, 60.9375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 15.0, 33.0, 58.0, 112.0, 147.0, 167.0, 154.0, 132.0, 92.0, 43.0, 33.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.77703285217285, -18.356338500976562, -16.935644149780273, -15.514948844909668, -14.094253540039062, -12.673559188842773, -11.252864837646484, -9.832169532775879, -8.41147518157959, -6.990780353546143, -5.570085525512695, -4.149391174316406, -2.728696346282959, -1.3080015182495117, 0.11269283294677734, 1.5333881378173828, 2.954082489013672, 4.374777317047119, 5.795472145080566, 7.2161664962768555, 8.636861801147461, 10.05755615234375, 11.478250503540039, 12.898945808410645, 14.319640159606934, 15.740334510803223, 17.161029815673828, 18.581724166870117, 20.002418518066406, 21.423114776611328, 22.843807220458984, 24.264503479003906, 25.685199737548828, 27.105894088745117, 28.526588439941406, 29.947284698486328, 31.367979049682617, 32.788673400878906, 34.20936584472656, 35.630062103271484, 37.050758361816406, 38.47145462036133, 39.892147064208984, 41.312843322753906, 42.73353576660156, 44.154232025146484, 45.574928283691406, 46.99562072753906, 48.41631317138672, 49.83700942993164, 51.2577018737793, 52.67839813232422, 54.099090576171875, 55.5197868347168, 56.94048309326172, 58.361175537109375, 59.7818717956543, 61.20256805419922, 62.623260498046875, 64.04395294189453, 65.46465301513672, 66.88534545898438, 68.30603790283203, 69.72673797607422, 71.14743041992188]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 7.0, 8.0, 15.0, 20.0, 13.0, 17.0, 28.0, 26.0, 34.0, 30.0, 27.0, 29.0, 41.0, 38.0, 30.0, 32.0, 45.0, 43.0, 30.0, 42.0, 44.0, 36.0, 41.0, 45.0, 38.0, 25.0, 29.0, 19.0, 17.0, 21.0, 27.0, 16.0, 15.0, 16.0, 7.0, 9.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.2213134765625, -35.143367767333984, -34.06542205810547, -32.98747634887695, -31.909528732299805, -30.83158302307129, -29.753637313842773, -28.675691604614258, -27.59774398803711, -26.519798278808594, -25.441852569580078, -24.363906860351562, -23.285959243774414, -22.2080135345459, -21.130067825317383, -20.052122116088867, -18.97417640686035, -17.896230697631836, -16.81828498840332, -15.740338325500488, -14.662391662597656, -13.58444595336914, -12.506500244140625, -11.42855453491211, -10.350607872009277, -9.272662162780762, -8.19471549987793, -7.116769790649414, -6.03882360458374, -4.960877418518066, -3.882931709289551, -2.804985523223877, -1.7270393371582031, -0.6490932703018188, 0.42885279655456543, 1.5067987442016602, 2.584744930267334, 3.662691116333008, 4.740636825561523, 5.818583011627197, 6.896529197692871, 7.974475383758545, 9.052421569824219, 10.130367279052734, 11.20831298828125, 12.286259651184082, 13.364205360412598, 14.44215202331543, 15.520097732543945, 16.59804344177246, 17.675989151000977, 18.753936767578125, 19.83188247680664, 20.909828186035156, 21.987773895263672, 23.065719604492188, 24.143665313720703, 25.22161102294922, 26.299556732177734, 27.37750244140625, 28.4554500579834, 29.533395767211914, 30.61134147644043, 31.689287185668945, 32.767234802246094]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 8.0, 8.0, 6.0, 11.0, 8.0, 19.0, 15.0, 20.0, 21.0, 25.0, 24.0, 37.0, 39.0, 42.0, 49.0, 40.0, 40.0, 40.0, 46.0, 34.0, 37.0, 45.0, 48.0, 25.0, 35.0, 38.0, 28.0, 32.0, 26.0, 27.0, 19.0, 13.0, 11.0, 13.0, 10.0, 11.0, 8.0, 5.0, 3.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.83203125, -6.62457275390625, -6.4171142578125, -6.20965576171875, -6.002197265625, -5.79473876953125, -5.5872802734375, -5.37982177734375, -5.17236328125, -4.96490478515625, -4.7574462890625, -4.54998779296875, -4.342529296875, -4.13507080078125, -3.9276123046875, -3.72015380859375, -3.5126953125, -3.30523681640625, -3.0977783203125, -2.89031982421875, -2.682861328125, -2.47540283203125, -2.2679443359375, -2.06048583984375, -1.85302734375, -1.64556884765625, -1.4381103515625, -1.23065185546875, -1.023193359375, -0.81573486328125, -0.6082763671875, -0.40081787109375, -0.193359375, 0.01409912109375, 0.2215576171875, 0.42901611328125, 0.636474609375, 0.84393310546875, 1.0513916015625, 1.25885009765625, 1.46630859375, 1.67376708984375, 1.8812255859375, 2.08868408203125, 2.296142578125, 2.50360107421875, 2.7110595703125, 2.91851806640625, 3.1259765625, 3.33343505859375, 3.5408935546875, 3.74835205078125, 3.955810546875, 4.16326904296875, 4.3707275390625, 4.57818603515625, 4.78564453125, 4.99310302734375, 5.2005615234375, 5.40802001953125, 5.615478515625, 5.82293701171875, 6.0303955078125, 6.23785400390625, 6.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 13.0, 25.0, 30.0, 54.0, 74.0, 125.0, 175.0, 246.0, 331.0, 525.0, 766.0, 1117.0, 1799.0, 2628.0, 3990.0, 6190.0, 9167.0, 14206.0, 21389.0, 32922.0, 51205.0, 81935.0, 131757.0, 203628.0, 178325.0, 110973.0, 69137.0, 43752.0, 28069.0, 18168.0, 12063.0, 7973.0, 5346.0, 3442.0, 2401.0, 1557.0, 1026.0, 659.0, 438.0, 314.0, 208.0, 138.0, 81.0, 65.0, 44.0, 28.0, 18.0, 10.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6123046875, -0.592437744140625, -0.57257080078125, -0.552703857421875, -0.5328369140625, -0.512969970703125, -0.49310302734375, -0.473236083984375, -0.453369140625, -0.433502197265625, -0.41363525390625, -0.393768310546875, -0.3739013671875, -0.354034423828125, -0.33416748046875, -0.314300537109375, -0.29443359375, -0.274566650390625, -0.25469970703125, -0.234832763671875, -0.2149658203125, -0.195098876953125, -0.17523193359375, -0.155364990234375, -0.135498046875, -0.115631103515625, -0.09576416015625, -0.075897216796875, -0.0560302734375, -0.036163330078125, -0.01629638671875, 0.003570556640625, 0.0234375, 0.043304443359375, 0.06317138671875, 0.083038330078125, 0.1029052734375, 0.122772216796875, 0.14263916015625, 0.162506103515625, 0.182373046875, 0.202239990234375, 0.22210693359375, 0.241973876953125, 0.2618408203125, 0.281707763671875, 0.30157470703125, 0.321441650390625, 0.34130859375, 0.361175537109375, 0.38104248046875, 0.400909423828125, 0.4207763671875, 0.440643310546875, 0.46051025390625, 0.480377197265625, 0.500244140625, 0.520111083984375, 0.53997802734375, 0.559844970703125, 0.5797119140625, 0.599578857421875, 0.61944580078125, 0.639312744140625, 0.6591796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 5.0, 6.0, 10.0, 3.0, 7.0, 15.0, 14.0, 14.0, 24.0, 11.0, 23.0, 23.0, 31.0, 26.0, 38.0, 41.0, 40.0, 46.0, 32.0, 40.0, 37.0, 1057.0, 39.0, 48.0, 43.0, 37.0, 30.0, 32.0, 27.0, 23.0, 20.0, 28.0, 20.0, 19.0, 22.0, 15.0, 15.0, 8.0, 5.0, 11.0, 11.0, 3.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.41796875, -4.29205322265625, -4.1661376953125, -4.04022216796875, -3.914306640625, -3.78839111328125, -3.6624755859375, -3.53656005859375, -3.41064453125, -3.28472900390625, -3.1588134765625, -3.03289794921875, -2.906982421875, -2.78106689453125, -2.6551513671875, -2.52923583984375, -2.4033203125, -2.27740478515625, -2.1514892578125, -2.02557373046875, -1.899658203125, -1.77374267578125, -1.6478271484375, -1.52191162109375, -1.39599609375, -1.27008056640625, -1.1441650390625, -1.01824951171875, -0.892333984375, -0.76641845703125, -0.6405029296875, -0.51458740234375, -0.388671875, -0.26275634765625, -0.1368408203125, -0.01092529296875, 0.114990234375, 0.24090576171875, 0.3668212890625, 0.49273681640625, 0.61865234375, 0.74456787109375, 0.8704833984375, 0.99639892578125, 1.122314453125, 1.24822998046875, 1.3741455078125, 1.50006103515625, 1.6259765625, 1.75189208984375, 1.8778076171875, 2.00372314453125, 2.129638671875, 2.25555419921875, 2.3814697265625, 2.50738525390625, 2.63330078125, 2.75921630859375, 2.8851318359375, 3.01104736328125, 3.136962890625, 3.26287841796875, 3.3887939453125, 3.51470947265625, 3.640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 4.0, 5.0, 16.0, 17.0, 28.0, 38.0, 61.0, 73.0, 91.0, 184.0, 232.0, 321.0, 397.0, 650.0, 846.0, 1161.0, 1658.0, 2347.0, 3535.0, 5059.0, 7593.0, 11536.0, 17783.0, 28011.0, 45112.0, 75729.0, 129457.0, 1236831.0, 227856.0, 116245.0, 68122.0, 40987.0, 25636.0, 16322.0, 10554.0, 6974.0, 4712.0, 3257.0, 2278.0, 1599.0, 1131.0, 763.0, 540.0, 401.0, 286.0, 213.0, 157.0, 86.0, 82.0, 62.0, 32.0, 21.0, 16.0, 18.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.638671875, -0.6180038452148438, -0.5973358154296875, -0.5766677856445312, -0.555999755859375, -0.5353317260742188, -0.5146636962890625, -0.49399566650390625, -0.47332763671875, -0.45265960693359375, -0.4319915771484375, -0.41132354736328125, -0.390655517578125, -0.36998748779296875, -0.3493194580078125, -0.32865142822265625, -0.3079833984375, -0.28731536865234375, -0.2666473388671875, -0.24597930908203125, -0.225311279296875, -0.20464324951171875, -0.1839752197265625, -0.16330718994140625, -0.14263916015625, -0.12197113037109375, -0.1013031005859375, -0.08063507080078125, -0.059967041015625, -0.03929901123046875, -0.0186309814453125, 0.00203704833984375, 0.022705078125, 0.04337310791015625, 0.0640411376953125, 0.08470916748046875, 0.105377197265625, 0.12604522705078125, 0.1467132568359375, 0.16738128662109375, 0.18804931640625, 0.20871734619140625, 0.2293853759765625, 0.25005340576171875, 0.270721435546875, 0.29138946533203125, 0.3120574951171875, 0.33272552490234375, 0.3533935546875, 0.37406158447265625, 0.3947296142578125, 0.41539764404296875, 0.436065673828125, 0.45673370361328125, 0.4774017333984375, 0.49806976318359375, 0.51873779296875, 0.5394058227539062, 0.5600738525390625, 0.5807418823242188, 0.601409912109375, 0.6220779418945312, 0.6427459716796875, 0.6634140014648438, 0.68408203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 3.0, 9.0, 8.0, 5.0, 8.0, 17.0, 24.0, 28.0, 45.0, 57.0, 68.0, 105.0, 93.0, 108.0, 106.0, 66.0, 52.0, 33.0, 30.0, 33.0, 17.0, 14.0, 18.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004974365234375, -0.004795849323272705, -0.00461733341217041, -0.004438817501068115, -0.00426030158996582, -0.004081785678863525, -0.0039032697677612305, -0.0037247538566589355, -0.0035462379455566406, -0.0033677220344543457, -0.0031892061233520508, -0.003010690212249756, -0.002832174301147461, -0.002653658390045166, -0.002475142478942871, -0.002296626567840576, -0.0021181106567382812, -0.0019395947456359863, -0.0017610788345336914, -0.0015825629234313965, -0.0014040470123291016, -0.0012255311012268066, -0.0010470151901245117, -0.0008684992790222168, -0.0006899833679199219, -0.000511467456817627, -0.00033295154571533203, -0.0001544356346130371, 2.4080276489257812e-05, 0.00020259618759155273, 0.00038111209869384766, 0.0005596280097961426, 0.0007381439208984375, 0.0009166598320007324, 0.0010951757431030273, 0.0012736916542053223, 0.0014522075653076172, 0.0016307234764099121, 0.001809239387512207, 0.001987755298614502, 0.002166271209716797, 0.002344787120819092, 0.0025233030319213867, 0.0027018189430236816, 0.0028803348541259766, 0.0030588507652282715, 0.0032373666763305664, 0.0034158825874328613, 0.0035943984985351562, 0.003772914409637451, 0.003951430320739746, 0.004129946231842041, 0.004308462142944336, 0.004486978054046631, 0.004665493965148926, 0.004844009876251221, 0.005022525787353516, 0.0052010416984558105, 0.0053795576095581055, 0.0055580735206604, 0.005736589431762695, 0.00591510534286499, 0.006093621253967285, 0.00627213716506958, 0.006450653076171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 13.0, 12.0, 19.0, 40.0, 40.0, 49.0, 71.0, 84.0, 121.0, 218.0, 385.0, 937.0, 29182.0, 1014017.0, 1972.0, 537.0, 280.0, 196.0, 91.0, 78.0, 40.0, 22.0, 20.0, 21.0, 18.0, 16.0, 6.0, 11.0, 10.0, 11.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.12030029296875, -0.11698150634765625, -0.1136627197265625, -0.11034393310546875, -0.107025146484375, -0.10370635986328125, -0.1003875732421875, -0.09706878662109375, -0.09375, -0.09043121337890625, -0.0871124267578125, -0.08379364013671875, -0.080474853515625, -0.07715606689453125, -0.0738372802734375, -0.07051849365234375, -0.06719970703125, -0.06388092041015625, -0.0605621337890625, -0.05724334716796875, -0.053924560546875, -0.05060577392578125, -0.0472869873046875, -0.04396820068359375, -0.0406494140625, -0.03733062744140625, -0.0340118408203125, -0.03069305419921875, -0.027374267578125, -0.02405548095703125, -0.0207366943359375, -0.01741790771484375, -0.01409912109375, -0.01078033447265625, -0.0074615478515625, -0.00414276123046875, -0.000823974609375, 0.00249481201171875, 0.0058135986328125, 0.00913238525390625, 0.012451171875, 0.01576995849609375, 0.0190887451171875, 0.02240753173828125, 0.025726318359375, 0.02904510498046875, 0.0323638916015625, 0.03568267822265625, 0.03900146484375, 0.04232025146484375, 0.0456390380859375, 0.04895782470703125, 0.052276611328125, 0.05559539794921875, 0.0589141845703125, 0.06223297119140625, 0.0655517578125, 0.06887054443359375, 0.0721893310546875, 0.07550811767578125, 0.078826904296875, 0.08214569091796875, 0.0854644775390625, 0.08878326416015625, 0.09210205078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 29.0, 251.0, 511.0, 189.0, 27.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013438710942864418, -0.013136073015630245, -0.012833436019718647, -0.012530798092484474, -0.012228160165250301, -0.011925523169338703, -0.01162288524210453, -0.011320248246192932, -0.01101761031895876, -0.010714972391724586, -0.010412335395812988, -0.010109697468578815, -0.009807059541344643, -0.009504422545433044, -0.009201784618198872, -0.008899146690964699, -0.0085965096950531, -0.008293871767818928, -0.00799123477190733, -0.007688596844673157, -0.007385959383100271, -0.007083321921527386, -0.006780683994293213, -0.006478046532720327, -0.006175408139824867, -0.005872770678251982, -0.005570132751017809, -0.005267495289444923, -0.004964857827872038, -0.004662220366299152, -0.0043595824390649796, -0.004056944977492094, -0.0037543075159192085, -0.0034516698215156794, -0.003149032359942794, -0.0028463946655392647, -0.002543757203966379, -0.00224111950956285, -0.0019384818151593208, -0.0016358443535864353, -0.0013332066591829062, -0.0010305690811946988, -0.0007279314449988306, -0.0004252938088029623, -0.00012265623081475496, 0.00017998134717345238, 0.00048261904157698154, 0.0007852565031498671, 0.0010878941975533962, 0.0013905317755416036, 0.001693169353529811, 0.00199580704793334, 0.0022984445095062256, 0.0026010822039097548, 0.002903719898313284, 0.0032063573598861694, 0.0035089950542896986, 0.0038116327486932278, 0.004114270210266113, 0.004416908137500286, 0.004719545599073172, 0.005022183060646057, 0.00532482098788023, 0.005627457983791828, 0.005930095911026001]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 7.0, 14.0, 18.0, 12.0, 19.0, 22.0, 35.0, 24.0, 22.0, 33.0, 37.0, 46.0, 35.0, 44.0, 39.0, 36.0, 37.0, 39.0, 37.0, 46.0, 40.0, 41.0, 44.0, 39.0, 30.0, 30.0, 31.0, 28.0, 11.0, 12.0, 14.0, 11.0, 7.0, 12.0, 6.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.002507627010345459, -0.002432519569993019, -0.0023574121296405792, -0.0022823046892881393, -0.0022071972489356995, -0.0021320898085832596, -0.0020569823682308197, -0.00198187492787838, -0.00190676748752594, -0.0018316600471735, -0.0017565526068210602, -0.0016814451664686203, -0.0016063377261161804, -0.0015312302857637405, -0.0014561228454113007, -0.0013810154050588608, -0.001305907964706421, -0.001230800524353981, -0.0011556930840015411, -0.0010805856436491013, -0.0010054782032966614, -0.0009303707629442215, -0.0008552633225917816, -0.0007801558822393417, -0.0007050484418869019, -0.000629941001534462, -0.0005548335611820221, -0.0004797261208295822, -0.00040461868047714233, -0.00032951124012470245, -0.0002544037997722626, -0.0001792963594198227, -0.00010418891906738281, -2.9081478714942932e-05, 4.602596163749695e-05, 0.00012113340198993683, 0.0001962408423423767, 0.0002713482826948166, 0.00034645572304725647, 0.00042156316339969635, 0.0004966706037521362, 0.0005717780441045761, 0.000646885484457016, 0.0007219929248094559, 0.0007971003651618958, 0.0008722078055143356, 0.0009473152458667755, 0.0010224226862192154, 0.0010975301265716553, 0.0011726375669240952, 0.001247745007276535, 0.001322852447628975, 0.0013979598879814148, 0.0014730673283338547, 0.0015481747686862946, 0.0016232822090387344, 0.0016983896493911743, 0.0017734970897436142, 0.001848604530096054, 0.001923711970448494, 0.001998819410800934, 0.0020739268511533737, 0.0021490342915058136, 0.0022241417318582535, 0.0022992491722106934]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 8.0, 8.0, 6.0, 11.0, 8.0, 19.0, 15.0, 20.0, 21.0, 25.0, 24.0, 37.0, 39.0, 43.0, 47.0, 41.0, 40.0, 41.0, 45.0, 34.0, 37.0, 45.0, 48.0, 25.0, 35.0, 38.0, 28.0, 32.0, 26.0, 27.0, 19.0, 12.0, 12.0, 13.0, 10.0, 11.0, 8.0, 5.0, 3.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.83203125, -6.62457275390625, -6.4171142578125, -6.20965576171875, -6.002197265625, -5.79473876953125, -5.5872802734375, -5.37982177734375, -5.17236328125, -4.96490478515625, -4.7574462890625, -4.54998779296875, -4.342529296875, -4.13507080078125, -3.9276123046875, -3.72015380859375, -3.5126953125, -3.30523681640625, -3.0977783203125, -2.89031982421875, -2.682861328125, -2.47540283203125, -2.2679443359375, -2.06048583984375, -1.85302734375, -1.64556884765625, -1.4381103515625, -1.23065185546875, -1.023193359375, -0.81573486328125, -0.6082763671875, -0.40081787109375, -0.193359375, 0.01409912109375, 0.2215576171875, 0.42901611328125, 0.636474609375, 0.84393310546875, 1.0513916015625, 1.25885009765625, 1.46630859375, 1.67376708984375, 1.8812255859375, 2.08868408203125, 2.296142578125, 2.50360107421875, 2.7110595703125, 2.91851806640625, 3.1259765625, 3.33343505859375, 3.5408935546875, 3.74835205078125, 3.955810546875, 4.16326904296875, 4.3707275390625, 4.57818603515625, 4.78564453125, 4.99310302734375, 5.2005615234375, 5.40802001953125, 5.615478515625, 5.82293701171875, 6.0303955078125, 6.23785400390625, 6.4453125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 14.0, 20.0, 25.0, 25.0, 45.0, 54.0, 60.0, 93.0, 119.0, 132.0, 192.0, 261.0, 311.0, 406.0, 607.0, 789.0, 1089.0, 1651.0, 3359.0, 13976.0, 92601.0, 468195.0, 379369.0, 66500.0, 10249.0, 2745.0, 1570.0, 1058.0, 749.0, 567.0, 424.0, 290.0, 228.0, 170.0, 158.0, 111.0, 80.0, 57.0, 52.0, 34.0, 20.0, 23.0, 16.0, 15.0, 12.0, 5.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.9609375, -12.567138671875, -12.17333984375, -11.779541015625, -11.3857421875, -10.991943359375, -10.59814453125, -10.204345703125, -9.810546875, -9.416748046875, -9.02294921875, -8.629150390625, -8.2353515625, -7.841552734375, -7.44775390625, -7.053955078125, -6.66015625, -6.266357421875, -5.87255859375, -5.478759765625, -5.0849609375, -4.691162109375, -4.29736328125, -3.903564453125, -3.509765625, -3.115966796875, -2.72216796875, -2.328369140625, -1.9345703125, -1.540771484375, -1.14697265625, -0.753173828125, -0.359375, 0.034423828125, 0.42822265625, 0.822021484375, 1.2158203125, 1.609619140625, 2.00341796875, 2.397216796875, 2.791015625, 3.184814453125, 3.57861328125, 3.972412109375, 4.3662109375, 4.760009765625, 5.15380859375, 5.547607421875, 5.94140625, 6.335205078125, 6.72900390625, 7.122802734375, 7.5166015625, 7.910400390625, 8.30419921875, 8.697998046875, 9.091796875, 9.485595703125, 9.87939453125, 10.273193359375, 10.6669921875, 11.060791015625, 11.45458984375, 11.848388671875, 12.2421875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 10.0, 10.0, 18.0, 16.0, 29.0, 27.0, 42.0, 57.0, 55.0, 61.0, 94.0, 215.0, 1581.0, 297.0, 139.0, 73.0, 47.0, 57.0, 42.0, 54.0, 27.0, 23.0, 11.0, 9.0, 10.0, 11.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.35888671875, -20.6396484375, -19.92041015625, -19.201171875, -18.48193359375, -17.7626953125, -17.04345703125, -16.32421875, -15.60498046875, -14.8857421875, -14.16650390625, -13.447265625, -12.72802734375, -12.0087890625, -11.28955078125, -10.5703125, -9.85107421875, -9.1318359375, -8.41259765625, -7.693359375, -6.97412109375, -6.2548828125, -5.53564453125, -4.81640625, -4.09716796875, -3.3779296875, -2.65869140625, -1.939453125, -1.22021484375, -0.5009765625, 0.21826171875, 0.9375, 1.65673828125, 2.3759765625, 3.09521484375, 3.814453125, 4.53369140625, 5.2529296875, 5.97216796875, 6.69140625, 7.41064453125, 8.1298828125, 8.84912109375, 9.568359375, 10.28759765625, 11.0068359375, 11.72607421875, 12.4453125, 13.16455078125, 13.8837890625, 14.60302734375, 15.322265625, 16.04150390625, 16.7607421875, 17.47998046875, 18.19921875, 18.91845703125, 19.6376953125, 20.35693359375, 21.076171875, 21.79541015625, 22.5146484375, 23.23388671875, 23.953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 1.0, 4.0, 8.0, 4.0, 4.0, 7.0, 11.0, 18.0, 15.0, 25.0, 33.0, 52.0, 64.0, 78.0, 122.0, 177.0, 308.0, 515.0, 864.0, 2166.0, 2138195.0, 998685.0, 2058.0, 893.0, 507.0, 298.0, 171.0, 108.0, 70.0, 59.0, 41.0, 34.0, 26.0, 21.0, 18.0, 11.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-71.8125, -69.69921875, -67.5859375, -65.47265625, -63.359375, -61.24609375, -59.1328125, -57.01953125, -54.90625, -52.79296875, -50.6796875, -48.56640625, -46.453125, -44.33984375, -42.2265625, -40.11328125, -38.0, -35.88671875, -33.7734375, -31.66015625, -29.546875, -27.43359375, -25.3203125, -23.20703125, -21.09375, -18.98046875, -16.8671875, -14.75390625, -12.640625, -10.52734375, -8.4140625, -6.30078125, -4.1875, -2.07421875, 0.0390625, 2.15234375, 4.265625, 6.37890625, 8.4921875, 10.60546875, 12.71875, 14.83203125, 16.9453125, 19.05859375, 21.171875, 23.28515625, 25.3984375, 27.51171875, 29.625, 31.73828125, 33.8515625, 35.96484375, 38.078125, 40.19140625, 42.3046875, 44.41796875, 46.53125, 48.64453125, 50.7578125, 52.87109375, 54.984375, 57.09765625, 59.2109375, 61.32421875, 63.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 35.0, 279.0, 520.0, 148.0, 22.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.13524627685547, -74.47967529296875, -70.82410430908203, -67.16853332519531, -63.51295852661133, -59.85738754272461, -56.201812744140625, -52.546241760253906, -48.89067077636719, -45.23509979248047, -41.57952880859375, -37.923954010009766, -34.26838302612305, -30.612812042236328, -26.957239151000977, -23.301666259765625, -19.646095275878906, -15.990523338317871, -12.334951400756836, -8.6793794631958, -5.023807525634766, -1.3682365417480469, 2.2873363494873047, 5.942909240722656, 9.598480224609375, 13.25405216217041, 16.909624099731445, 20.565196990966797, 24.220767974853516, 27.876338958740234, 31.531911849975586, 35.18748474121094, 38.843048095703125, 42.498619079589844, 46.15419006347656, 49.80976486206055, 53.465335845947266, 57.120906829833984, 60.77648162841797, 64.43205261230469, 68.0876235961914, 71.74319458007812, 75.39876556396484, 79.05433654785156, 82.70991516113281, 86.365478515625, 90.02105712890625, 93.67662811279297, 97.33219909667969, 100.9877700805664, 104.64334106445312, 108.29891204833984, 111.95448303222656, 115.61006164550781, 119.26563262939453, 122.92120361328125, 126.57677459716797, 130.2323455810547, 133.88792419433594, 137.54348754882812, 141.19906616210938, 144.85462951660156, 148.5102081298828, 152.165771484375, 155.82135009765625]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 3.0, 1.0, 6.0, 5.0, 3.0, 13.0, 12.0, 20.0, 16.0, 19.0, 27.0, 28.0, 32.0, 26.0, 34.0, 37.0, 35.0, 49.0, 33.0, 42.0, 49.0, 35.0, 46.0, 43.0, 33.0, 35.0, 36.0, 46.0, 37.0, 35.0, 27.0, 18.0, 18.0, 26.0, 14.0, 17.0, 9.0, 10.0, 5.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.30299377441406, -50.79027557373047, -49.27756118774414, -47.76484298706055, -46.25212860107422, -44.739410400390625, -43.22669219970703, -41.7139778137207, -40.201263427734375, -38.68854522705078, -37.17583084106445, -35.66311264038086, -34.15039825439453, -32.63768005371094, -31.124963760375977, -29.612247467041016, -28.099529266357422, -26.58681297302246, -25.0740966796875, -23.561378479003906, -22.048664093017578, -20.535945892333984, -19.023229598999023, -17.510513305664062, -15.997797012329102, -14.48508071899414, -12.97236442565918, -11.459647178649902, -9.946930885314941, -8.43421459197998, -6.921497344970703, -5.408781051635742, -3.8960647583007812, -2.383348226547241, -0.8706316947937012, 0.642085075378418, 2.154801368713379, 3.66751766204834, 5.180234909057617, 6.692951202392578, 8.205667495727539, 9.7183837890625, 11.231100082397461, 12.743817329406738, 14.2565336227417, 15.76924991607666, 17.281967163085938, 18.7946834564209, 20.30739974975586, 21.82011604309082, 23.33283233642578, 24.845550537109375, 26.358264923095703, 27.870983123779297, 29.383699417114258, 30.89641571044922, 32.40913391113281, 33.921852111816406, 35.434566497802734, 36.94728469848633, 38.459999084472656, 39.97271728515625, 41.485435485839844, 42.99814987182617, 44.5108642578125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 5.0, 2.0, 5.0, 10.0, 7.0, 14.0, 10.0, 7.0, 11.0, 18.0, 15.0, 9.0, 27.0, 28.0, 27.0, 34.0, 25.0, 34.0, 36.0, 38.0, 45.0, 47.0, 45.0, 33.0, 37.0, 38.0, 35.0, 28.0, 37.0, 34.0, 22.0, 19.0, 22.0, 24.0, 20.0, 21.0, 28.0, 17.0, 14.0, 8.0, 12.0, 10.0, 12.0, 5.0, 9.0, 5.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.015625, -5.82525634765625, -5.6348876953125, -5.44451904296875, -5.254150390625, -5.06378173828125, -4.8734130859375, -4.68304443359375, -4.49267578125, -4.30230712890625, -4.1119384765625, -3.92156982421875, -3.731201171875, -3.54083251953125, -3.3504638671875, -3.16009521484375, -2.9697265625, -2.77935791015625, -2.5889892578125, -2.39862060546875, -2.208251953125, -2.01788330078125, -1.8275146484375, -1.63714599609375, -1.44677734375, -1.25640869140625, -1.0660400390625, -0.87567138671875, -0.685302734375, -0.49493408203125, -0.3045654296875, -0.11419677734375, 0.076171875, 0.26654052734375, 0.4569091796875, 0.64727783203125, 0.837646484375, 1.02801513671875, 1.2183837890625, 1.40875244140625, 1.59912109375, 1.78948974609375, 1.9798583984375, 2.17022705078125, 2.360595703125, 2.55096435546875, 2.7413330078125, 2.93170166015625, 3.1220703125, 3.31243896484375, 3.5028076171875, 3.69317626953125, 3.883544921875, 4.07391357421875, 4.2642822265625, 4.45465087890625, 4.64501953125, 4.83538818359375, 5.0257568359375, 5.21612548828125, 5.406494140625, 5.59686279296875, 5.7872314453125, 5.97760009765625, 6.16796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 3.0, 10.0, 16.0, 9.0, 19.0, 15.0, 23.0, 42.0, 38.0, 63.0, 67.0, 126.0, 201.0, 310.0, 473.0, 871.0, 1667.0, 3498.0, 8760.0, 28327.0, 131150.0, 619114.0, 1746295.0, 1244087.0, 317753.0, 63926.0, 16100.0, 5725.0, 2444.0, 1263.0, 667.0, 396.0, 231.0, 160.0, 96.0, 84.0, 58.0, 42.0, 33.0, 32.0, 17.0, 18.0, 8.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-9.8359375, -9.56103515625, -9.2861328125, -9.01123046875, -8.736328125, -8.46142578125, -8.1865234375, -7.91162109375, -7.63671875, -7.36181640625, -7.0869140625, -6.81201171875, -6.537109375, -6.26220703125, -5.9873046875, -5.71240234375, -5.4375, -5.16259765625, -4.8876953125, -4.61279296875, -4.337890625, -4.06298828125, -3.7880859375, -3.51318359375, -3.23828125, -2.96337890625, -2.6884765625, -2.41357421875, -2.138671875, -1.86376953125, -1.5888671875, -1.31396484375, -1.0390625, -0.76416015625, -0.4892578125, -0.21435546875, 0.060546875, 0.33544921875, 0.6103515625, 0.88525390625, 1.16015625, 1.43505859375, 1.7099609375, 1.98486328125, 2.259765625, 2.53466796875, 2.8095703125, 3.08447265625, 3.359375, 3.63427734375, 3.9091796875, 4.18408203125, 4.458984375, 4.73388671875, 5.0087890625, 5.28369140625, 5.55859375, 5.83349609375, 6.1083984375, 6.38330078125, 6.658203125, 6.93310546875, 7.2080078125, 7.48291015625, 7.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 8.0, 11.0, 14.0, 19.0, 25.0, 35.0, 51.0, 47.0, 65.0, 87.0, 135.0, 140.0, 205.0, 323.0, 401.0, 553.0, 451.0, 401.0, 270.0, 187.0, 145.0, 130.0, 80.0, 70.0, 40.0, 42.0, 32.0, 23.0, 17.0, 13.0, 12.0, 12.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.296875, -11.9334716796875, -11.570068359375, -11.2066650390625, -10.84326171875, -10.4798583984375, -10.116455078125, -9.7530517578125, -9.3896484375, -9.0262451171875, -8.662841796875, -8.2994384765625, -7.93603515625, -7.5726318359375, -7.209228515625, -6.8458251953125, -6.482421875, -6.1190185546875, -5.755615234375, -5.3922119140625, -5.02880859375, -4.6654052734375, -4.302001953125, -3.9385986328125, -3.5751953125, -3.2117919921875, -2.848388671875, -2.4849853515625, -2.12158203125, -1.7581787109375, -1.394775390625, -1.0313720703125, -0.66796875, -0.3045654296875, 0.058837890625, 0.4222412109375, 0.78564453125, 1.1490478515625, 1.512451171875, 1.8758544921875, 2.2392578125, 2.6026611328125, 2.966064453125, 3.3294677734375, 3.69287109375, 4.0562744140625, 4.419677734375, 4.7830810546875, 5.146484375, 5.5098876953125, 5.873291015625, 6.2366943359375, 6.60009765625, 6.9635009765625, 7.326904296875, 7.6903076171875, 8.0537109375, 8.4171142578125, 8.780517578125, 9.1439208984375, 9.50732421875, 9.8707275390625, 10.234130859375, 10.5975341796875, 10.9609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 7.0, 7.0, 10.0, 8.0, 14.0, 20.0, 31.0, 52.0, 49.0, 75.0, 95.0, 154.0, 215.0, 353.0, 567.0, 889.0, 1797.0, 4948.0, 30530.0, 439649.0, 3305741.0, 373370.0, 26901.0, 4567.0, 1794.0, 882.0, 543.0, 323.0, 196.0, 144.0, 96.0, 84.0, 46.0, 39.0, 27.0, 10.0, 14.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.15234375, -16.5703125, -15.98828125, -15.40625, -14.82421875, -14.2421875, -13.66015625, -13.078125, -12.49609375, -11.9140625, -11.33203125, -10.75, -10.16796875, -9.5859375, -9.00390625, -8.421875, -7.83984375, -7.2578125, -6.67578125, -6.09375, -5.51171875, -4.9296875, -4.34765625, -3.765625, -3.18359375, -2.6015625, -2.01953125, -1.4375, -0.85546875, -0.2734375, 0.30859375, 0.890625, 1.47265625, 2.0546875, 2.63671875, 3.21875, 3.80078125, 4.3828125, 4.96484375, 5.546875, 6.12890625, 6.7109375, 7.29296875, 7.875, 8.45703125, 9.0390625, 9.62109375, 10.203125, 10.78515625, 11.3671875, 11.94921875, 12.53125, 13.11328125, 13.6953125, 14.27734375, 14.859375, 15.44140625, 16.0234375, 16.60546875, 17.1875, 17.76953125, 18.3515625, 18.93359375, 19.515625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 300.0, 714.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-504.1849670410156, -487.4500732421875, -470.7152099609375, -453.9803466796875, -437.2454528808594, -420.51055908203125, -403.77569580078125, -387.04083251953125, -370.3059387207031, -353.571044921875, -336.836181640625, -320.101318359375, -303.3664245605469, -286.63153076171875, -269.89666748046875, -253.1617889404297, -236.42691040039062, -219.69203186035156, -202.9571533203125, -186.22227478027344, -169.48739624023438, -152.7525177001953, -136.01763916015625, -119.28276062011719, -102.54788208007812, -85.81300354003906, -69.078125, -52.34324645996094, -35.608367919921875, -18.873489379882812, -2.13861083984375, 14.596267700195312, 31.3311767578125, 48.06605529785156, 64.80093383789062, 81.53581237792969, 98.27069091796875, 115.00556945800781, 131.74044799804688, 148.47532653808594, 165.210205078125, 181.94508361816406, 198.67996215820312, 215.4148406982422, 232.14971923828125, 248.8845977783203, 265.6194763183594, 282.3543701171875, 299.0892333984375, 315.8240966796875, 332.5589904785156, 349.29388427734375, 366.02874755859375, 382.76361083984375, 399.4985046386719, 416.2333984375, 432.96826171875, 449.703125, 466.4380187988281, 483.17291259765625, 499.90777587890625, 516.6426391601562, 533.3775634765625, 550.1124267578125, 566.8472900390625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 9.0, 4.0, 7.0, 14.0, 12.0, 11.0, 9.0, 17.0, 28.0, 23.0, 25.0, 26.0, 34.0, 32.0, 29.0, 36.0, 33.0, 39.0, 44.0, 45.0, 40.0, 37.0, 41.0, 38.0, 42.0, 32.0, 30.0, 30.0, 36.0, 32.0, 27.0, 23.0, 22.0, 22.0, 6.0, 19.0, 9.0, 12.0, 3.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.014892578125, -39.63541030883789, -38.255924224853516, -36.876441955566406, -35.4969596862793, -34.11747741699219, -32.73799133300781, -31.358509063720703, -29.979026794433594, -28.59954261779785, -27.220060348510742, -25.840576171875, -24.46109390258789, -23.08160972595215, -21.702125549316406, -20.322643280029297, -18.943159103393555, -17.563674926757812, -16.184192657470703, -14.804708480834961, -13.425226211547852, -12.04574203491211, -10.666258811950684, -9.286775588989258, -7.907292366027832, -6.527809143066406, -5.1483259201049805, -3.7688422203063965, -2.3893589973449707, -1.009875774383545, 0.36960792541503906, 1.7490911483764648, 3.1285743713378906, 4.508057594299316, 5.887540817260742, 7.267024517059326, 8.646507263183594, 10.025991439819336, 11.405474662780762, 12.784957885742188, 14.164441108703613, 15.543924331665039, 16.92340850830078, 18.30289077758789, 19.682374954223633, 21.061857223510742, 22.441341400146484, 23.820823669433594, 25.200307846069336, 26.579792022705078, 27.959274291992188, 29.33875846862793, 30.71824073791504, 32.09772491455078, 33.47720718383789, 34.856689453125, 36.236175537109375, 37.615657806396484, 38.99514389038086, 40.37462615966797, 41.75410842895508, 43.13359069824219, 44.51307678222656, 45.89255905151367, 47.27204132080078]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 17.0, 15.0, 21.0, 19.0, 26.0, 26.0, 25.0, 32.0, 41.0, 62.0, 49.0, 52.0, 68.0, 70.0, 49.0, 51.0, 41.0, 59.0, 51.0, 35.0, 25.0, 29.0, 17.0, 21.0, 18.0, 10.0, 21.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9765625, -5.7806396484375, -5.584716796875, -5.3887939453125, -5.19287109375, -4.9969482421875, -4.801025390625, -4.6051025390625, -4.4091796875, -4.2132568359375, -4.017333984375, -3.8214111328125, -3.62548828125, -3.4295654296875, -3.233642578125, -3.0377197265625, -2.841796875, -2.6458740234375, -2.449951171875, -2.2540283203125, -2.05810546875, -1.8621826171875, -1.666259765625, -1.4703369140625, -1.2744140625, -1.0784912109375, -0.882568359375, -0.6866455078125, -0.49072265625, -0.2947998046875, -0.098876953125, 0.0970458984375, 0.29296875, 0.4888916015625, 0.684814453125, 0.8807373046875, 1.07666015625, 1.2725830078125, 1.468505859375, 1.6644287109375, 1.8603515625, 2.0562744140625, 2.252197265625, 2.4481201171875, 2.64404296875, 2.8399658203125, 3.035888671875, 3.2318115234375, 3.427734375, 3.6236572265625, 3.819580078125, 4.0155029296875, 4.21142578125, 4.4073486328125, 4.603271484375, 4.7991943359375, 4.9951171875, 5.1910400390625, 5.386962890625, 5.5828857421875, 5.77880859375, 5.9747314453125, 6.170654296875, 6.3665771484375, 6.5625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 13.0, 16.0, 21.0, 39.0, 57.0, 90.0, 152.0, 209.0, 327.0, 475.0, 817.0, 1337.0, 2252.0, 3777.0, 6316.0, 10175.0, 17882.0, 30354.0, 52950.0, 95434.0, 180233.0, 274068.0, 165216.0, 87785.0, 49001.0, 28323.0, 16442.0, 9798.0, 5906.0, 3585.0, 2043.0, 1242.0, 809.0, 517.0, 324.0, 169.0, 126.0, 78.0, 49.0, 41.0, 30.0, 21.0, 18.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5358428955078125, -0.516998291015625, -0.4981536865234375, -0.47930908203125, -0.4604644775390625, -0.441619873046875, -0.4227752685546875, -0.4039306640625, -0.3850860595703125, -0.366241455078125, -0.3473968505859375, -0.32855224609375, -0.3097076416015625, -0.290863037109375, -0.2720184326171875, -0.253173828125, -0.2343292236328125, -0.215484619140625, -0.1966400146484375, -0.17779541015625, -0.1589508056640625, -0.140106201171875, -0.1212615966796875, -0.1024169921875, -0.0835723876953125, -0.064727783203125, -0.0458831787109375, -0.02703857421875, -0.0081939697265625, 0.010650634765625, 0.0294952392578125, 0.04833984375, 0.0671844482421875, 0.086029052734375, 0.1048736572265625, 0.12371826171875, 0.1425628662109375, 0.161407470703125, 0.1802520751953125, 0.1990966796875, 0.2179412841796875, 0.236785888671875, 0.2556304931640625, 0.27447509765625, 0.2933197021484375, 0.312164306640625, 0.3310089111328125, 0.349853515625, 0.3686981201171875, 0.387542724609375, 0.4063873291015625, 0.42523193359375, 0.4440765380859375, 0.462921142578125, 0.4817657470703125, 0.5006103515625, 0.5194549560546875, 0.538299560546875, 0.5571441650390625, 0.57598876953125, 0.5948333740234375, 0.613677978515625, 0.6325225830078125, 0.6513671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 11.0, 6.0, 11.0, 15.0, 15.0, 27.0, 32.0, 27.0, 40.0, 29.0, 30.0, 33.0, 36.0, 44.0, 52.0, 32.0, 44.0, 1066.0, 44.0, 39.0, 49.0, 44.0, 37.0, 27.0, 25.0, 27.0, 24.0, 21.0, 16.0, 13.0, 12.0, 10.0, 15.0, 13.0, 8.0, 11.0, 6.0, 2.0, 3.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.07061767578125, -2.9752197265625, -2.87982177734375, -2.784423828125, -2.68902587890625, -2.5936279296875, -2.49822998046875, -2.40283203125, -2.30743408203125, -2.2120361328125, -2.11663818359375, -2.021240234375, -1.92584228515625, -1.8304443359375, -1.73504638671875, -1.6396484375, -1.54425048828125, -1.4488525390625, -1.35345458984375, -1.258056640625, -1.16265869140625, -1.0672607421875, -0.97186279296875, -0.87646484375, -0.78106689453125, -0.6856689453125, -0.59027099609375, -0.494873046875, -0.39947509765625, -0.3040771484375, -0.20867919921875, -0.11328125, -0.01788330078125, 0.0775146484375, 0.17291259765625, 0.268310546875, 0.36370849609375, 0.4591064453125, 0.55450439453125, 0.64990234375, 0.74530029296875, 0.8406982421875, 0.93609619140625, 1.031494140625, 1.12689208984375, 1.2222900390625, 1.31768798828125, 1.4130859375, 1.50848388671875, 1.6038818359375, 1.69927978515625, 1.794677734375, 1.89007568359375, 1.9854736328125, 2.08087158203125, 2.17626953125, 2.27166748046875, 2.3670654296875, 2.46246337890625, 2.557861328125, 2.65325927734375, 2.7486572265625, 2.84405517578125, 2.939453125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 10.0, 3.0, 6.0, 10.0, 18.0, 30.0, 35.0, 53.0, 89.0, 116.0, 165.0, 227.0, 284.0, 366.0, 569.0, 789.0, 1128.0, 1549.0, 2139.0, 3112.0, 4209.0, 6124.0, 9077.0, 13316.0, 19851.0, 30683.0, 47395.0, 74632.0, 121883.0, 1015505.0, 413232.0, 119269.0, 73029.0, 46458.0, 29526.0, 19662.0, 12988.0, 8841.0, 6159.0, 4202.0, 2903.0, 2108.0, 1473.0, 1108.0, 755.0, 616.0, 392.0, 298.0, 207.0, 158.0, 113.0, 85.0, 70.0, 41.0, 25.0, 21.0, 7.0, 10.0, 9.0, 3.0, 4.0], "bins": [-0.448486328125, -0.4348869323730469, -0.42128753662109375, -0.4076881408691406, -0.3940887451171875, -0.3804893493652344, -0.36688995361328125, -0.3532905578613281, -0.339691162109375, -0.3260917663574219, -0.31249237060546875, -0.2988929748535156, -0.2852935791015625, -0.2716941833496094, -0.25809478759765625, -0.24449539184570312, -0.23089599609375, -0.21729660034179688, -0.20369720458984375, -0.19009780883789062, -0.1764984130859375, -0.16289901733398438, -0.14929962158203125, -0.13570022583007812, -0.122100830078125, -0.10850143432617188, -0.09490203857421875, -0.08130264282226562, -0.0677032470703125, -0.054103851318359375, -0.04050445556640625, -0.026905059814453125, -0.0133056640625, 0.000293731689453125, 0.01389312744140625, 0.027492523193359375, 0.0410919189453125, 0.054691314697265625, 0.06829071044921875, 0.08189010620117188, 0.095489501953125, 0.10908889770507812, 0.12268829345703125, 0.13628768920898438, 0.1498870849609375, 0.16348648071289062, 0.17708587646484375, 0.19068527221679688, 0.20428466796875, 0.21788406372070312, 0.23148345947265625, 0.24508285522460938, 0.2586822509765625, 0.2722816467285156, 0.28588104248046875, 0.2994804382324219, 0.313079833984375, 0.3266792297363281, 0.34027862548828125, 0.3538780212402344, 0.3674774169921875, 0.3810768127441406, 0.39467620849609375, 0.4082756042480469, 0.421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 16.0, 26.0, 15.0, 29.0, 55.0, 67.0, 113.0, 155.0, 152.0, 109.0, 86.0, 33.0, 26.0, 24.0, 17.0, 9.0, 13.0, 5.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004093170166015625, -0.003922700881958008, -0.0037522315979003906, -0.0035817623138427734, -0.0034112930297851562, -0.003240823745727539, -0.003070354461669922, -0.0028998851776123047, -0.0027294158935546875, -0.0025589466094970703, -0.002388477325439453, -0.002218008041381836, -0.0020475387573242188, -0.0018770694732666016, -0.0017066001892089844, -0.0015361309051513672, -0.00136566162109375, -0.0011951923370361328, -0.0010247230529785156, -0.0008542537689208984, -0.0006837844848632812, -0.0005133152008056641, -0.0003428459167480469, -0.0001723766326904297, -1.9073486328125e-06, 0.0001685619354248047, 0.0003390312194824219, 0.0005095005035400391, 0.0006799697875976562, 0.0008504390716552734, 0.0010209083557128906, 0.0011913776397705078, 0.001361846923828125, 0.0015323162078857422, 0.0017027854919433594, 0.0018732547760009766, 0.0020437240600585938, 0.002214193344116211, 0.002384662628173828, 0.0025551319122314453, 0.0027256011962890625, 0.0028960704803466797, 0.003066539764404297, 0.003237009048461914, 0.0034074783325195312, 0.0035779476165771484, 0.0037484169006347656, 0.003918886184692383, 0.00408935546875, 0.004259824752807617, 0.004430294036865234, 0.0046007633209228516, 0.004771232604980469, 0.004941701889038086, 0.005112171173095703, 0.00528264045715332, 0.0054531097412109375, 0.005623579025268555, 0.005794048309326172, 0.005964517593383789, 0.006134986877441406, 0.0063054561614990234, 0.006475925445556641, 0.006646394729614258, 0.006816864013671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 4.0, 13.0, 9.0, 6.0, 10.0, 20.0, 26.0, 23.0, 48.0, 85.0, 106.0, 175.0, 422.0, 1097.0, 922826.0, 121850.0, 906.0, 365.0, 191.0, 99.0, 69.0, 55.0, 35.0, 26.0, 22.0, 17.0, 14.0, 12.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.11895751953125, -0.11597728729248047, -0.11299705505371094, -0.1100168228149414, -0.10703659057617188, -0.10405635833740234, -0.10107612609863281, -0.09809589385986328, -0.09511566162109375, -0.09213542938232422, -0.08915519714355469, -0.08617496490478516, -0.08319473266601562, -0.0802145004272461, -0.07723426818847656, -0.07425403594970703, -0.0712738037109375, -0.06829357147216797, -0.06531333923339844, -0.062333106994628906, -0.059352874755859375, -0.056372642517089844, -0.05339241027832031, -0.05041217803955078, -0.04743194580078125, -0.04445171356201172, -0.04147148132324219, -0.038491249084472656, -0.035511016845703125, -0.032530784606933594, -0.029550552368164062, -0.02657032012939453, -0.023590087890625, -0.02060985565185547, -0.017629623413085938, -0.014649391174316406, -0.011669158935546875, -0.008688926696777344, -0.0057086944580078125, -0.0027284622192382812, 0.00025177001953125, 0.0032320022583007812, 0.0062122344970703125, 0.009192466735839844, 0.012172698974609375, 0.015152931213378906, 0.018133163452148438, 0.02111339569091797, 0.0240936279296875, 0.02707386016845703, 0.030054092407226562, 0.033034324645996094, 0.036014556884765625, 0.038994789123535156, 0.04197502136230469, 0.04495525360107422, 0.04793548583984375, 0.05091571807861328, 0.05389595031738281, 0.056876182556152344, 0.059856414794921875, 0.0628366470336914, 0.06581687927246094, 0.06879711151123047, 0.07177734375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 23.0, 42.0, 106.0, 156.0, 221.0, 205.0, 133.0, 62.0, 33.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015864229062572122, -0.001497020130045712, -0.0014076174702495337, -0.0013182146940380335, -0.0012288119178265333, -0.0011394091416150331, -0.0010500064818188548, -0.0009606037056073546, -0.0008712009876035154, -0.0007817982695996761, -0.000692395493388176, -0.0006029927753843367, -0.0005135900573804975, -0.0004241872811689973, -0.00033478456316515803, -0.00024538178695365787, -0.0001559790689498186, -6.657632911810651e-05, 2.2826410713605583e-05, 0.00011222914326936007, 0.00020163189037702978, 0.0002910346374846995, 0.00038043735548853874, 0.0004698401317000389, 0.0005592428497038782, 0.0006486455677077174, 0.0007380483439192176, 0.0008274510619230568, 0.0009168537799268961, 0.0010062565561383963, 0.0010956593323498964, 0.0011850621085613966, 0.0012744648847728968, 0.001363867660984397, 0.0014532703207805753, 0.0015426730969920754, 0.0016320758732035756, 0.001721478532999754, 0.0018108813092112541, 0.0019002840854227543, 0.0019896868616342545, 0.0020790896378457546, 0.002168492414057255, 0.002257895190268755, 0.0023472977336496115, 0.0024367005098611116, 0.002526103286072612, 0.002615506062284112, 0.0027049086056649685, 0.0027943113818764687, 0.002883714158087969, 0.002973116934299469, 0.0030625194776803255, 0.0031519222538918257, 0.003241325030103326, 0.003330727806314826, 0.003420130582526326, 0.0035095333587378263, 0.0035989361349493265, 0.003688338678330183, 0.003777741454541683, 0.0038671442307531834, 0.0039565470069646835, 0.004045949783176184, 0.004135352559387684]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 11.0, 9.0, 8.0, 16.0, 17.0, 11.0, 16.0, 13.0, 17.0, 22.0, 15.0, 25.0, 27.0, 28.0, 21.0, 38.0, 37.0, 28.0, 39.0, 33.0, 31.0, 37.0, 30.0, 28.0, 40.0, 43.0, 31.0, 27.0, 24.0, 25.0, 28.0, 23.0, 26.0, 18.0, 13.0, 14.0, 15.0, 18.0, 14.0, 13.0, 10.0, 12.0, 9.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0013930201530456543, -0.0013467026874423027, -0.0013003852218389511, -0.0012540677562355995, -0.001207750290632248, -0.0011614328250288963, -0.0011151153594255447, -0.0010687978938221931, -0.0010224804282188416, -0.00097616296261549, -0.0009298454970121384, -0.0008835280314087868, -0.0008372105658054352, -0.0007908931002020836, -0.000744575634598732, -0.0006982581689953804, -0.0006519407033920288, -0.0006056232377886772, -0.0005593057721853256, -0.000512988306581974, -0.00046667084097862244, -0.00042035337537527084, -0.00037403590977191925, -0.00032771844416856766, -0.00028140097856521606, -0.00023508351296186447, -0.00018876604735851288, -0.00014244858175516129, -9.613111615180969e-05, -4.98136505484581e-05, -3.4961849451065063e-06, 4.282128065824509e-05, 8.913874626159668e-05, 0.00013545621186494827, 0.00018177367746829987, 0.00022809114307165146, 0.00027440860867500305, 0.00032072607427835464, 0.00036704353988170624, 0.00041336100548505783, 0.0004596784710884094, 0.000505995936691761, 0.0005523134022951126, 0.0005986308678984642, 0.0006449483335018158, 0.0006912657991051674, 0.000737583264708519, 0.0007839007303118706, 0.0008302181959152222, 0.0008765356615185738, 0.0009228531271219254, 0.000969170592725277, 0.0010154880583286285, 0.0010618055239319801, 0.0011081229895353317, 0.0011544404551386833, 0.001200757920742035, 0.0012470753863453865, 0.001293392851948738, 0.0013397103175520897, 0.0013860277831554413, 0.0014323452487587929, 0.0014786627143621445, 0.001524980179965496, 0.0015712976455688477]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 17.0, 15.0, 21.0, 19.0, 26.0, 26.0, 25.0, 32.0, 41.0, 62.0, 49.0, 52.0, 68.0, 70.0, 49.0, 51.0, 41.0, 59.0, 51.0, 35.0, 25.0, 29.0, 17.0, 22.0, 17.0, 10.0, 21.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9765625, -5.7806396484375, -5.584716796875, -5.3887939453125, -5.19287109375, -4.9969482421875, -4.801025390625, -4.6051025390625, -4.4091796875, -4.2132568359375, -4.017333984375, -3.8214111328125, -3.62548828125, -3.4295654296875, -3.233642578125, -3.0377197265625, -2.841796875, -2.6458740234375, -2.449951171875, -2.2540283203125, -2.05810546875, -1.8621826171875, -1.666259765625, -1.4703369140625, -1.2744140625, -1.0784912109375, -0.882568359375, -0.6866455078125, -0.49072265625, -0.2947998046875, -0.098876953125, 0.0970458984375, 0.29296875, 0.4888916015625, 0.684814453125, 0.8807373046875, 1.07666015625, 1.2725830078125, 1.468505859375, 1.6644287109375, 1.8603515625, 2.0562744140625, 2.252197265625, 2.4481201171875, 2.64404296875, 2.8399658203125, 3.035888671875, 3.2318115234375, 3.427734375, 3.6236572265625, 3.819580078125, 4.0155029296875, 4.21142578125, 4.4073486328125, 4.603271484375, 4.7991943359375, 4.9951171875, 5.1910400390625, 5.386962890625, 5.5828857421875, 5.77880859375, 5.9747314453125, 6.170654296875, 6.3665771484375, 6.5625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 13.0, 25.0, 37.0, 63.0, 91.0, 126.0, 193.0, 248.0, 373.0, 515.0, 764.0, 1062.0, 1661.0, 2670.0, 5202.0, 24419.0, 424688.0, 541451.0, 31091.0, 5700.0, 2798.0, 1724.0, 1096.0, 752.0, 536.0, 386.0, 290.0, 176.0, 120.0, 90.0, 66.0, 37.0, 26.0, 19.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.40625, -15.9097900390625, -15.413330078125, -14.9168701171875, -14.42041015625, -13.9239501953125, -13.427490234375, -12.9310302734375, -12.4345703125, -11.9381103515625, -11.441650390625, -10.9451904296875, -10.44873046875, -9.9522705078125, -9.455810546875, -8.9593505859375, -8.462890625, -7.9664306640625, -7.469970703125, -6.9735107421875, -6.47705078125, -5.9805908203125, -5.484130859375, -4.9876708984375, -4.4912109375, -3.9947509765625, -3.498291015625, -3.0018310546875, -2.50537109375, -2.0089111328125, -1.512451171875, -1.0159912109375, -0.51953125, -0.0230712890625, 0.473388671875, 0.9698486328125, 1.46630859375, 1.9627685546875, 2.459228515625, 2.9556884765625, 3.4521484375, 3.9486083984375, 4.445068359375, 4.9415283203125, 5.43798828125, 5.9344482421875, 6.430908203125, 6.9273681640625, 7.423828125, 7.9202880859375, 8.416748046875, 8.9132080078125, 9.40966796875, 9.9061279296875, 10.402587890625, 10.8990478515625, 11.3955078125, 11.8919677734375, 12.388427734375, 12.8848876953125, 13.38134765625, 13.8778076171875, 14.374267578125, 14.8707275390625, 15.3671875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 3.0, 5.0, 4.0, 5.0, 7.0, 15.0, 9.0, 14.0, 11.0, 17.0, 18.0, 23.0, 34.0, 27.0, 44.0, 35.0, 59.0, 69.0, 101.0, 197.0, 1487.0, 293.0, 121.0, 80.0, 50.0, 46.0, 37.0, 33.0, 31.0, 35.0, 19.0, 10.0, 16.0, 12.0, 12.0, 10.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-13.4140625, -13.0277099609375, -12.641357421875, -12.2550048828125, -11.86865234375, -11.4822998046875, -11.095947265625, -10.7095947265625, -10.3232421875, -9.9368896484375, -9.550537109375, -9.1641845703125, -8.77783203125, -8.3914794921875, -8.005126953125, -7.6187744140625, -7.232421875, -6.8460693359375, -6.459716796875, -6.0733642578125, -5.68701171875, -5.3006591796875, -4.914306640625, -4.5279541015625, -4.1416015625, -3.7552490234375, -3.368896484375, -2.9825439453125, -2.59619140625, -2.2098388671875, -1.823486328125, -1.4371337890625, -1.05078125, -0.6644287109375, -0.278076171875, 0.1082763671875, 0.49462890625, 0.8809814453125, 1.267333984375, 1.6536865234375, 2.0400390625, 2.4263916015625, 2.812744140625, 3.1990966796875, 3.58544921875, 3.9718017578125, 4.358154296875, 4.7445068359375, 5.130859375, 5.5172119140625, 5.903564453125, 6.2899169921875, 6.67626953125, 7.0626220703125, 7.448974609375, 7.8353271484375, 8.2216796875, 8.6080322265625, 8.994384765625, 9.3807373046875, 9.76708984375, 10.1534423828125, 10.539794921875, 10.9261474609375, 11.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 9.0, 9.0, 9.0, 14.0, 13.0, 20.0, 40.0, 41.0, 60.0, 89.0, 130.0, 183.0, 320.0, 546.0, 1260.0, 5273.0, 3124077.0, 10481.0, 1416.0, 675.0, 357.0, 217.0, 135.0, 85.0, 68.0, 47.0, 25.0, 20.0, 17.0, 16.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.84375, -47.19287109375, -45.5419921875, -43.89111328125, -42.240234375, -40.58935546875, -38.9384765625, -37.28759765625, -35.63671875, -33.98583984375, -32.3349609375, -30.68408203125, -29.033203125, -27.38232421875, -25.7314453125, -24.08056640625, -22.4296875, -20.77880859375, -19.1279296875, -17.47705078125, -15.826171875, -14.17529296875, -12.5244140625, -10.87353515625, -9.22265625, -7.57177734375, -5.9208984375, -4.27001953125, -2.619140625, -0.96826171875, 0.6826171875, 2.33349609375, 3.984375, 5.63525390625, 7.2861328125, 8.93701171875, 10.587890625, 12.23876953125, 13.8896484375, 15.54052734375, 17.19140625, 18.84228515625, 20.4931640625, 22.14404296875, 23.794921875, 25.44580078125, 27.0966796875, 28.74755859375, 30.3984375, 32.04931640625, 33.7001953125, 35.35107421875, 37.001953125, 38.65283203125, 40.3037109375, 41.95458984375, 43.60546875, 45.25634765625, 46.9072265625, 48.55810546875, 50.208984375, 51.85986328125, 53.5107421875, 55.16162109375, 56.8125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 8.0, 18.0, 39.0, 64.0, 93.0, 153.0, 187.0, 180.0, 132.0, 50.0, 33.0, 27.0, 11.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-59.476871490478516, -58.30275344848633, -57.128631591796875, -55.95451354980469, -54.7803955078125, -53.60627746582031, -52.432159423828125, -51.25803756713867, -50.083919525146484, -48.9098014831543, -47.735679626464844, -46.561561584472656, -45.38744354248047, -44.21332550048828, -43.039207458496094, -41.86508560180664, -40.69096755981445, -39.516849517822266, -38.34272766113281, -37.168609619140625, -35.99449157714844, -34.82037353515625, -33.64625549316406, -32.47213363647461, -31.298015594482422, -30.123897552490234, -28.949777603149414, -27.775657653808594, -26.601539611816406, -25.42742156982422, -24.2533016204834, -23.079181671142578, -21.905059814453125, -20.730941772460938, -19.556821823120117, -18.382701873779297, -17.20858383178711, -16.034465789794922, -14.860345840454102, -13.686226844787598, -12.512107849121094, -11.33798885345459, -10.163869857788086, -8.989750862121582, -7.815631866455078, -6.641512870788574, -5.46739387512207, -4.293274879455566, -3.1191558837890625, -1.9450368881225586, -0.7709178924560547, 0.4032011032104492, 1.5773200988769531, 2.751439094543457, 3.925558090209961, 5.099677085876465, 6.273796081542969, 7.447915077209473, 8.622034072875977, 9.79615306854248, 10.970272064208984, 12.144391059875488, 13.318510055541992, 14.492629051208496, 15.666748046875]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 14.0, 9.0, 10.0, 12.0, 14.0, 26.0, 25.0, 23.0, 21.0, 24.0, 28.0, 40.0, 43.0, 41.0, 43.0, 45.0, 49.0, 51.0, 39.0, 37.0, 36.0, 35.0, 35.0, 34.0, 35.0, 33.0, 28.0, 20.0, 24.0, 23.0, 14.0, 17.0, 14.0, 13.0, 4.0, 8.0, 3.0, 6.0, 8.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.430519104003906, -38.2956428527832, -37.1607666015625, -36.0258903503418, -34.891014099121094, -33.756134033203125, -32.62126159667969, -31.48638343811035, -30.351505279541016, -29.216629028320312, -28.08175277709961, -26.946876525878906, -25.81199836730957, -24.677122116088867, -23.542245864868164, -22.40736961364746, -21.272493362426758, -20.137617111206055, -19.00274085998535, -17.867862701416016, -16.732986450195312, -15.59811019897461, -14.463233947753906, -13.328357696533203, -12.193480491638184, -11.05860424041748, -9.923727035522461, -8.788850784301758, -7.6539740562438965, -6.519097328186035, -5.384221076965332, -4.249344348907471, -3.1144676208496094, -1.9795910120010376, -0.8447144031524658, 0.2901620864868164, 1.4250388145446777, 2.559915542602539, 3.694791793823242, 4.8296685218811035, 5.964545249938965, 7.099421977996826, 8.234298706054688, 9.36917495727539, 10.504051208496094, 11.638928413391113, 12.773804664611816, 13.908681869506836, 15.043558120727539, 16.178434371948242, 17.313310623168945, 18.44818878173828, 19.583065032958984, 20.717941284179688, 21.85281753540039, 22.987693786621094, 24.122570037841797, 25.2574462890625, 26.392322540283203, 27.527198791503906, 28.662076950073242, 29.796953201293945, 30.93182945251465, 32.066707611083984, 33.20158386230469]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 12.0, 11.0, 6.0, 10.0, 13.0, 10.0, 26.0, 18.0, 19.0, 30.0, 30.0, 25.0, 32.0, 44.0, 38.0, 40.0, 39.0, 45.0, 51.0, 45.0, 39.0, 48.0, 35.0, 38.0, 30.0, 37.0, 27.0, 34.0, 20.0, 19.0, 20.0, 16.0, 14.0, 8.0, 10.0, 10.0, 7.0, 7.0, 7.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.6610107421875, -4.497802734375, -4.3345947265625, -4.17138671875, -4.0081787109375, -3.844970703125, -3.6817626953125, -3.5185546875, -3.3553466796875, -3.192138671875, -3.0289306640625, -2.86572265625, -2.7025146484375, -2.539306640625, -2.3760986328125, -2.212890625, -2.0496826171875, -1.886474609375, -1.7232666015625, -1.56005859375, -1.3968505859375, -1.233642578125, -1.0704345703125, -0.9072265625, -0.7440185546875, -0.580810546875, -0.4176025390625, -0.25439453125, -0.0911865234375, 0.072021484375, 0.2352294921875, 0.3984375, 0.5616455078125, 0.724853515625, 0.8880615234375, 1.05126953125, 1.2144775390625, 1.377685546875, 1.5408935546875, 1.7041015625, 1.8673095703125, 2.030517578125, 2.1937255859375, 2.35693359375, 2.5201416015625, 2.683349609375, 2.8465576171875, 3.009765625, 3.1729736328125, 3.336181640625, 3.4993896484375, 3.66259765625, 3.8258056640625, 3.989013671875, 4.1522216796875, 4.3154296875, 4.4786376953125, 4.641845703125, 4.8050537109375, 4.96826171875, 5.1314697265625, 5.294677734375, 5.4578857421875, 5.62109375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 2.0, 4.0, 6.0, 8.0, 12.0, 13.0, 21.0, 20.0, 32.0, 37.0, 58.0, 72.0, 133.0, 206.0, 386.0, 674.0, 1494.0, 3515.0, 10894.0, 60323.0, 699824.0, 2645354.0, 694556.0, 59473.0, 10725.0, 3336.0, 1457.0, 682.0, 351.0, 199.0, 110.0, 72.0, 56.0, 45.0, 21.0, 26.0, 18.0, 12.0, 9.0, 4.0, 10.0, 10.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1893310546875, -9.855224609375, -9.5211181640625, -9.18701171875, -8.8529052734375, -8.518798828125, -8.1846923828125, -7.8505859375, -7.5164794921875, -7.182373046875, -6.8482666015625, -6.51416015625, -6.1800537109375, -5.845947265625, -5.5118408203125, -5.177734375, -4.8436279296875, -4.509521484375, -4.1754150390625, -3.84130859375, -3.5072021484375, -3.173095703125, -2.8389892578125, -2.5048828125, -2.1707763671875, -1.836669921875, -1.5025634765625, -1.16845703125, -0.8343505859375, -0.500244140625, -0.1661376953125, 0.16796875, 0.5020751953125, 0.836181640625, 1.1702880859375, 1.50439453125, 1.8385009765625, 2.172607421875, 2.5067138671875, 2.8408203125, 3.1749267578125, 3.509033203125, 3.8431396484375, 4.17724609375, 4.5113525390625, 4.845458984375, 5.1795654296875, 5.513671875, 5.8477783203125, 6.181884765625, 6.5159912109375, 6.85009765625, 7.1842041015625, 7.518310546875, 7.8524169921875, 8.1865234375, 8.5206298828125, 8.854736328125, 9.1888427734375, 9.52294921875, 9.8570556640625, 10.191162109375, 10.5252685546875, 10.859375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 10.0, 7.0, 9.0, 18.0, 30.0, 41.0, 64.0, 106.0, 156.0, 215.0, 296.0, 417.0, 549.0, 575.0, 489.0, 345.0, 220.0, 184.0, 124.0, 68.0, 37.0, 49.0, 28.0, 10.0, 12.0, 6.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5703125, -11.2115478515625, -10.852783203125, -10.4940185546875, -10.13525390625, -9.7764892578125, -9.417724609375, -9.0589599609375, -8.7001953125, -8.3414306640625, -7.982666015625, -7.6239013671875, -7.26513671875, -6.9063720703125, -6.547607421875, -6.1888427734375, -5.830078125, -5.4713134765625, -5.112548828125, -4.7537841796875, -4.39501953125, -4.0362548828125, -3.677490234375, -3.3187255859375, -2.9599609375, -2.6011962890625, -2.242431640625, -1.8836669921875, -1.52490234375, -1.1661376953125, -0.807373046875, -0.4486083984375, -0.08984375, 0.2689208984375, 0.627685546875, 0.9864501953125, 1.34521484375, 1.7039794921875, 2.062744140625, 2.4215087890625, 2.7802734375, 3.1390380859375, 3.497802734375, 3.8565673828125, 4.21533203125, 4.5740966796875, 4.932861328125, 5.2916259765625, 5.650390625, 6.0091552734375, 6.367919921875, 6.7266845703125, 7.08544921875, 7.4442138671875, 7.802978515625, 8.1617431640625, 8.5205078125, 8.8792724609375, 9.238037109375, 9.5968017578125, 9.95556640625, 10.3143310546875, 10.673095703125, 11.0318603515625, 11.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 10.0, 27.0, 34.0, 46.0, 73.0, 165.0, 241.0, 495.0, 1045.0, 2451.0, 13703.0, 2609771.0, 1551014.0, 10865.0, 2342.0, 931.0, 466.0, 247.0, 134.0, 78.0, 58.0, 23.0, 13.0, 12.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.6142578125, -25.806640625, -24.9990234375, -24.19140625, -23.3837890625, -22.576171875, -21.7685546875, -20.9609375, -20.1533203125, -19.345703125, -18.5380859375, -17.73046875, -16.9228515625, -16.115234375, -15.3076171875, -14.5, -13.6923828125, -12.884765625, -12.0771484375, -11.26953125, -10.4619140625, -9.654296875, -8.8466796875, -8.0390625, -7.2314453125, -6.423828125, -5.6162109375, -4.80859375, -4.0009765625, -3.193359375, -2.3857421875, -1.578125, -0.7705078125, 0.037109375, 0.8447265625, 1.65234375, 2.4599609375, 3.267578125, 4.0751953125, 4.8828125, 5.6904296875, 6.498046875, 7.3056640625, 8.11328125, 8.9208984375, 9.728515625, 10.5361328125, 11.34375, 12.1513671875, 12.958984375, 13.7666015625, 14.57421875, 15.3818359375, 16.189453125, 16.9970703125, 17.8046875, 18.6123046875, 19.419921875, 20.2275390625, 21.03515625, 21.8427734375, 22.650390625, 23.4580078125, 24.265625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 79.0, 372.0, 431.0, 112.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.60830688476562, -207.1083221435547, -202.6083221435547, -198.10833740234375, -193.60833740234375, -189.1083526611328, -184.60836791992188, -180.10836791992188, -175.60838317871094, -171.1083984375, -166.6083984375, -162.10841369628906, -157.60842895507812, -153.10842895507812, -148.6084442138672, -144.1084442138672, -139.60845947265625, -135.1084747314453, -130.6084747314453, -126.10848999023438, -121.6084976196289, -117.10850524902344, -112.6085205078125, -108.10852813720703, -103.60853576660156, -99.1085433959961, -94.60855102539062, -90.10856628417969, -85.60857391357422, -81.10858154296875, -76.60859680175781, -72.10860443115234, -67.60861206054688, -63.108619689941406, -58.6086311340332, -54.108642578125, -49.60865020751953, -45.10865783691406, -40.60866928100586, -36.108680725097656, -31.608688354492188, -27.10869789123535, -22.608707427978516, -18.10871696472168, -13.608726501464844, -9.108736038208008, -4.608745574951172, -0.10875511169433594, 4.3912353515625, 8.891225814819336, 13.391216278076172, 17.891206741333008, 22.391197204589844, 26.89118766784668, 31.391178131103516, 35.89116668701172, 40.39115905761719, 44.891151428222656, 49.39113998413086, 53.89112854003906, 58.39112091064453, 62.89111328125, 67.39109802246094, 71.8910903930664, 76.39108276367188]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 7.0, 10.0, 8.0, 9.0, 9.0, 16.0, 15.0, 15.0, 20.0, 27.0, 21.0, 15.0, 24.0, 24.0, 29.0, 32.0, 34.0, 46.0, 31.0, 33.0, 36.0, 50.0, 27.0, 34.0, 31.0, 44.0, 36.0, 37.0, 31.0, 26.0, 30.0, 20.0, 22.0, 15.0, 20.0, 14.0, 11.0, 11.0, 13.0, 11.0, 12.0, 8.0, 9.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-31.290489196777344, -30.29682731628418, -29.303163528442383, -28.30950164794922, -27.315839767456055, -26.32217788696289, -25.328514099121094, -24.33485221862793, -23.341190338134766, -22.3475284576416, -21.353864669799805, -20.36020278930664, -19.366540908813477, -18.372879028320312, -17.379215240478516, -16.38555335998535, -15.391889572143555, -14.398226737976074, -13.40456485748291, -12.41090202331543, -11.417240142822266, -10.423577308654785, -9.429914474487305, -8.43625259399414, -7.44258975982666, -6.448927402496338, -5.455265045166016, -4.461602210998535, -3.467939853668213, -2.4742774963378906, -1.4806146621704102, -0.4869523048400879, 0.5067100524902344, 1.5003725290298462, 2.494035005569458, 3.4876976013183594, 4.481359958648682, 5.475022315979004, 6.468685150146484, 7.462347507476807, 8.456009864807129, 9.44967269897461, 10.443334579467773, 11.436997413635254, 12.430660247802734, 13.424322128295898, 14.417984962463379, 15.41164779663086, 16.405309677124023, 17.398971557617188, 18.392635345458984, 19.38629722595215, 20.379959106445312, 21.37362289428711, 22.367284774780273, 23.360946655273438, 24.354610443115234, 25.3482723236084, 26.341936111450195, 27.33559799194336, 28.329259872436523, 29.322921752929688, 30.316585540771484, 31.31024742126465, 32.30390930175781]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 11.0, 14.0, 20.0, 25.0, 30.0, 23.0, 34.0, 37.0, 42.0, 33.0, 54.0, 66.0, 46.0, 50.0, 52.0, 40.0, 45.0, 39.0, 43.0, 45.0, 37.0, 34.0, 23.0, 28.0, 20.0, 12.0, 20.0, 13.0, 9.0, 14.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.91796875, -4.7784423828125, -4.638916015625, -4.4993896484375, -4.35986328125, -4.2203369140625, -4.080810546875, -3.9412841796875, -3.8017578125, -3.6622314453125, -3.522705078125, -3.3831787109375, -3.24365234375, -3.1041259765625, -2.964599609375, -2.8250732421875, -2.685546875, -2.5460205078125, -2.406494140625, -2.2669677734375, -2.12744140625, -1.9879150390625, -1.848388671875, -1.7088623046875, -1.5693359375, -1.4298095703125, -1.290283203125, -1.1507568359375, -1.01123046875, -0.8717041015625, -0.732177734375, -0.5926513671875, -0.453125, -0.3135986328125, -0.174072265625, -0.0345458984375, 0.10498046875, 0.2445068359375, 0.384033203125, 0.5235595703125, 0.6630859375, 0.8026123046875, 0.942138671875, 1.0816650390625, 1.22119140625, 1.3607177734375, 1.500244140625, 1.6397705078125, 1.779296875, 1.9188232421875, 2.058349609375, 2.1978759765625, 2.33740234375, 2.4769287109375, 2.616455078125, 2.7559814453125, 2.8955078125, 3.0350341796875, 3.174560546875, 3.3140869140625, 3.45361328125, 3.5931396484375, 3.732666015625, 3.8721923828125, 4.01171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 16.0, 27.0, 36.0, 54.0, 83.0, 121.0, 177.0, 237.0, 371.0, 546.0, 834.0, 1219.0, 1769.0, 2603.0, 3989.0, 5825.0, 9163.0, 13776.0, 20704.0, 32057.0, 49084.0, 76733.0, 120676.0, 184725.0, 183577.0, 120522.0, 76636.0, 49576.0, 31959.0, 20885.0, 13652.0, 8859.0, 6072.0, 3897.0, 2733.0, 1744.0, 1179.0, 755.0, 530.0, 375.0, 253.0, 158.0, 118.0, 80.0, 42.0, 47.0, 22.0, 14.0, 14.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.3473091125488281, -0.33573150634765625, -0.3241539001464844, -0.3125762939453125, -0.3009986877441406, -0.28942108154296875, -0.2778434753417969, -0.266265869140625, -0.2546882629394531, -0.24311065673828125, -0.23153305053710938, -0.2199554443359375, -0.20837783813476562, -0.19680023193359375, -0.18522262573242188, -0.17364501953125, -0.16206741333007812, -0.15048980712890625, -0.13891220092773438, -0.1273345947265625, -0.11575698852539062, -0.10417938232421875, -0.09260177612304688, -0.081024169921875, -0.06944656372070312, -0.05786895751953125, -0.046291351318359375, -0.0347137451171875, -0.023136138916015625, -0.01155853271484375, 1.9073486328125e-05, 0.0115966796875, 0.023174285888671875, 0.03475189208984375, 0.046329498291015625, 0.0579071044921875, 0.06948471069335938, 0.08106231689453125, 0.09263992309570312, 0.104217529296875, 0.11579513549804688, 0.12737274169921875, 0.13895034790039062, 0.1505279541015625, 0.16210556030273438, 0.17368316650390625, 0.18526077270507812, 0.19683837890625, 0.20841598510742188, 0.21999359130859375, 0.23157119750976562, 0.2431488037109375, 0.2547264099121094, 0.26630401611328125, 0.2778816223144531, 0.289459228515625, 0.3010368347167969, 0.31261444091796875, 0.3241920471191406, 0.3357696533203125, 0.3473472595214844, 0.35892486572265625, 0.3705024719238281, 0.382080078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 13.0, 11.0, 19.0, 8.0, 16.0, 20.0, 25.0, 32.0, 32.0, 27.0, 30.0, 23.0, 28.0, 42.0, 39.0, 48.0, 41.0, 1066.0, 49.0, 47.0, 44.0, 40.0, 40.0, 35.0, 33.0, 20.0, 21.0, 23.0, 19.0, 20.0, 20.0, 18.0, 13.0, 6.0, 5.0, 7.0, 11.0, 10.0, 1.0, 3.0, 4.0, 8.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.375, -2.299652099609375, -2.22430419921875, -2.148956298828125, -2.0736083984375, -1.998260498046875, -1.92291259765625, -1.847564697265625, -1.772216796875, -1.696868896484375, -1.62152099609375, -1.546173095703125, -1.4708251953125, -1.395477294921875, -1.32012939453125, -1.244781494140625, -1.16943359375, -1.094085693359375, -1.01873779296875, -0.943389892578125, -0.8680419921875, -0.792694091796875, -0.71734619140625, -0.641998291015625, -0.566650390625, -0.491302490234375, -0.41595458984375, -0.340606689453125, -0.2652587890625, -0.189910888671875, -0.11456298828125, -0.039215087890625, 0.0361328125, 0.111480712890625, 0.18682861328125, 0.262176513671875, 0.3375244140625, 0.412872314453125, 0.48822021484375, 0.563568115234375, 0.638916015625, 0.714263916015625, 0.78961181640625, 0.864959716796875, 0.9403076171875, 1.015655517578125, 1.09100341796875, 1.166351318359375, 1.24169921875, 1.317047119140625, 1.39239501953125, 1.467742919921875, 1.5430908203125, 1.618438720703125, 1.69378662109375, 1.769134521484375, 1.844482421875, 1.919830322265625, 1.99517822265625, 2.070526123046875, 2.1458740234375, 2.221221923828125, 2.29656982421875, 2.371917724609375, 2.447265625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 6.0, 11.0, 14.0, 14.0, 34.0, 43.0, 55.0, 80.0, 107.0, 193.0, 242.0, 347.0, 495.0, 779.0, 1015.0, 1427.0, 2056.0, 2932.0, 4180.0, 6323.0, 9141.0, 13535.0, 20564.0, 31834.0, 49714.0, 80055.0, 131346.0, 1246661.0, 189773.0, 109989.0, 68242.0, 42809.0, 27157.0, 17991.0, 11739.0, 7991.0, 5491.0, 3770.0, 2654.0, 1885.0, 1288.0, 924.0, 691.0, 474.0, 350.0, 207.0, 161.0, 119.0, 74.0, 53.0, 36.0, 15.0, 29.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.343017578125, -0.3322410583496094, -0.32146453857421875, -0.3106880187988281, -0.2999114990234375, -0.2891349792480469, -0.27835845947265625, -0.2675819396972656, -0.256805419921875, -0.24602890014648438, -0.23525238037109375, -0.22447586059570312, -0.2136993408203125, -0.20292282104492188, -0.19214630126953125, -0.18136978149414062, -0.17059326171875, -0.15981674194335938, -0.14904022216796875, -0.13826370239257812, -0.1274871826171875, -0.11671066284179688, -0.10593414306640625, -0.09515762329101562, -0.084381103515625, -0.07360458374023438, -0.06282806396484375, -0.052051544189453125, -0.0412750244140625, -0.030498504638671875, -0.01972198486328125, -0.008945465087890625, 0.0018310546875, 0.012607574462890625, 0.02338409423828125, 0.034160614013671875, 0.0449371337890625, 0.055713653564453125, 0.06649017333984375, 0.07726669311523438, 0.088043212890625, 0.09881973266601562, 0.10959625244140625, 0.12037277221679688, 0.1311492919921875, 0.14192581176757812, 0.15270233154296875, 0.16347885131835938, 0.17425537109375, 0.18503189086914062, 0.19580841064453125, 0.20658493041992188, 0.2173614501953125, 0.22813796997070312, 0.23891448974609375, 0.24969100952148438, 0.260467529296875, 0.2712440490722656, 0.28202056884765625, 0.2927970886230469, 0.3035736083984375, 0.3143501281738281, 0.32512664794921875, 0.3359031677246094, 0.3466796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 6.0, 7.0, 14.0, 8.0, 15.0, 25.0, 26.0, 32.0, 48.0, 55.0, 74.0, 82.0, 89.0, 93.0, 99.0, 63.0, 79.0, 33.0, 37.0, 30.0, 24.0, 17.0, 15.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0034503936767578125, -0.0033492743968963623, -0.003248155117034912, -0.003147035837173462, -0.0030459165573120117, -0.0029447972774505615, -0.0028436779975891113, -0.002742558717727661, -0.002641439437866211, -0.0025403201580047607, -0.0024392008781433105, -0.0023380815982818604, -0.00223696231842041, -0.00213584303855896, -0.0020347237586975098, -0.0019336044788360596, -0.0018324851989746094, -0.0017313659191131592, -0.001630246639251709, -0.0015291273593902588, -0.0014280080795288086, -0.0013268887996673584, -0.0012257695198059082, -0.001124650239944458, -0.0010235309600830078, -0.0009224116802215576, -0.0008212924003601074, -0.0007201731204986572, -0.000619053840637207, -0.0005179345607757568, -0.00041681528091430664, -0.00031569600105285645, -0.00021457672119140625, -0.00011345744132995605, -1.233816146850586e-05, 8.878111839294434e-05, 0.00018990039825439453, 0.0002910196781158447, 0.0003921389579772949, 0.0004932582378387451, 0.0005943775177001953, 0.0006954967975616455, 0.0007966160774230957, 0.0008977353572845459, 0.000998854637145996, 0.0010999739170074463, 0.0012010931968688965, 0.0013022124767303467, 0.0014033317565917969, 0.001504451036453247, 0.0016055703163146973, 0.0017066895961761475, 0.0018078088760375977, 0.0019089281558990479, 0.002010047435760498, 0.0021111667156219482, 0.0022122859954833984, 0.0023134052753448486, 0.002414524555206299, 0.002515643835067749, 0.0026167631149291992, 0.0027178823947906494, 0.0028190016746520996, 0.00292012095451355, 0.003021240234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 18.0, 8.0, 23.0, 37.0, 43.0, 68.0, 95.0, 122.0, 183.0, 323.0, 533.0, 1287.0, 326692.0, 716094.0, 1407.0, 583.0, 319.0, 202.0, 131.0, 88.0, 77.0, 50.0, 39.0, 29.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04974365234375, -0.048087120056152344, -0.04643058776855469, -0.04477405548095703, -0.043117523193359375, -0.04146099090576172, -0.03980445861816406, -0.038147926330566406, -0.03649139404296875, -0.034834861755371094, -0.03317832946777344, -0.03152179718017578, -0.029865264892578125, -0.02820873260498047, -0.026552200317382812, -0.024895668029785156, -0.0232391357421875, -0.021582603454589844, -0.019926071166992188, -0.01826953887939453, -0.016613006591796875, -0.014956474304199219, -0.013299942016601562, -0.011643409729003906, -0.00998687744140625, -0.008330345153808594, -0.0066738128662109375, -0.005017280578613281, -0.003360748291015625, -0.0017042160034179688, -4.76837158203125e-05, 0.0016088485717773438, 0.003265380859375, 0.004921913146972656, 0.0065784454345703125, 0.008234977722167969, 0.009891510009765625, 0.011548042297363281, 0.013204574584960938, 0.014861106872558594, 0.01651763916015625, 0.018174171447753906, 0.019830703735351562, 0.02148723602294922, 0.023143768310546875, 0.02480030059814453, 0.026456832885742188, 0.028113365173339844, 0.0297698974609375, 0.031426429748535156, 0.03308296203613281, 0.03473949432373047, 0.036396026611328125, 0.03805255889892578, 0.03970909118652344, 0.041365623474121094, 0.04302215576171875, 0.044678688049316406, 0.04633522033691406, 0.04799175262451172, 0.049648284912109375, 0.05130481719970703, 0.05296134948730469, 0.054617881774902344, 0.0562744140625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 83.0, 860.0, 71.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006993314251303673, -0.0066674454137682915, -0.00634157657623291, -0.006015708204358816, -0.005689839366823435, -0.0053639705292880535, -0.0050381021574139595, -0.004712233319878578, -0.004386364482343197, -0.0040604956448078156, -0.003734627040103078, -0.0034087584353983402, -0.003082889597862959, -0.0027570207603275776, -0.00243115215562284, -0.0021052835509181023, -0.001779414713382721, -0.0014535459922626615, -0.001127677271142602, -0.0008018085500225425, -0.000475939828902483, -0.0001500711077824235, 0.000175797613337636, 0.0005016662180423737, 0.000827535055577755, 0.0011534037766978145, 0.001479272497817874, 0.0018051412189379334, 0.002131009940057993, 0.0024568787775933743, 0.002782747382298112, 0.0031086159870028496, 0.003434484824538231, 0.003760353662073612, 0.0040862224996089935, 0.0044120908714830875, 0.004737959709018469, 0.00506382854655385, 0.005389696918427944, 0.0057155657559633255, 0.006041434593498707, 0.006367303431034088, 0.0066931722685694695, 0.0070190406404435635, 0.007344909477978945, 0.007670778315514326, 0.00799664668738842, 0.008322515524923801, 0.008648384362459183, 0.008974253199994564, 0.009300122037529945, 0.009625990875065327, 0.009951859712600708, 0.010277727618813515, 0.010603596456348896, 0.010929465293884277, 0.011255334131419659, 0.01158120296895504, 0.011907071806490421, 0.012232940644025803, 0.01255880855023861, 0.01288467738777399, 0.013210546225309372, 0.013536415062844753, 0.013862283900380135]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 4.0, 7.0, 9.0, 17.0, 6.0, 18.0, 21.0, 23.0, 24.0, 25.0, 31.0, 43.0, 41.0, 51.0, 42.0, 62.0, 43.0, 51.0, 46.0, 36.0, 45.0, 41.0, 40.0, 35.0, 23.0, 41.0, 22.0, 26.0, 24.0, 13.0, 21.0, 15.0, 15.0, 8.0, 12.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014762282371520996, -0.001432240940630436, -0.0013882536441087723, -0.0013442663475871086, -0.001300279051065445, -0.0012562917545437813, -0.0012123044580221176, -0.001168317161500454, -0.0011243298649787903, -0.0010803425684571266, -0.001036355271935463, -0.0009923679754137993, -0.0009483806788921356, -0.000904393382370472, -0.0008604060858488083, -0.0008164187893271446, -0.000772431492805481, -0.0007284441962838173, -0.0006844568997621536, -0.00064046960324049, -0.0005964823067188263, -0.0005524950101971626, -0.000508507713675499, -0.0004645204171538353, -0.00042053312063217163, -0.00037654582411050797, -0.0003325585275888443, -0.00028857123106718063, -0.00024458393454551697, -0.0002005966380238533, -0.00015660934150218964, -0.00011262204498052597, -6.86347484588623e-05, -2.464745193719864e-05, 1.9339844584465027e-05, 6.332714110612869e-05, 0.00010731443762779236, 0.00015130173414945602, 0.0001952890306711197, 0.00023927632719278336, 0.000283263623714447, 0.0003272509202361107, 0.00037123821675777435, 0.000415225513279438, 0.0004592128098011017, 0.0005032001063227654, 0.000547187402844429, 0.0005911746993660927, 0.0006351619958877563, 0.00067914929240942, 0.0007231365889310837, 0.0007671238854527473, 0.000811111181974411, 0.0008550984784960747, 0.0008990857750177383, 0.000943073071539402, 0.0009870603680610657, 0.0010310476645827293, 0.001075034961104393, 0.0011190222576260567, 0.0011630095541477203, 0.001206996850669384, 0.0012509841471910477, 0.0012949714437127113, 0.001338958740234375]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 11.0, 14.0, 20.0, 25.0, 30.0, 23.0, 34.0, 37.0, 42.0, 33.0, 54.0, 66.0, 46.0, 50.0, 52.0, 40.0, 45.0, 39.0, 43.0, 45.0, 37.0, 34.0, 23.0, 28.0, 20.0, 12.0, 20.0, 13.0, 9.0, 14.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.91796875, -4.7784423828125, -4.638916015625, -4.4993896484375, -4.35986328125, -4.2203369140625, -4.080810546875, -3.9412841796875, -3.8017578125, -3.6622314453125, -3.522705078125, -3.3831787109375, -3.24365234375, -3.1041259765625, -2.964599609375, -2.8250732421875, -2.685546875, -2.5460205078125, -2.406494140625, -2.2669677734375, -2.12744140625, -1.9879150390625, -1.848388671875, -1.7088623046875, -1.5693359375, -1.4298095703125, -1.290283203125, -1.1507568359375, -1.01123046875, -0.8717041015625, -0.732177734375, -0.5926513671875, -0.453125, -0.3135986328125, -0.174072265625, -0.0345458984375, 0.10498046875, 0.2445068359375, 0.384033203125, 0.5235595703125, 0.6630859375, 0.8026123046875, 0.942138671875, 1.0816650390625, 1.22119140625, 1.3607177734375, 1.500244140625, 1.6397705078125, 1.779296875, 1.9188232421875, 2.058349609375, 2.1978759765625, 2.33740234375, 2.4769287109375, 2.616455078125, 2.7559814453125, 2.8955078125, 3.0350341796875, 3.174560546875, 3.3140869140625, 3.45361328125, 3.5931396484375, 3.732666015625, 3.8721923828125, 4.01171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 11.0, 37.0, 25.0, 43.0, 42.0, 62.0, 107.0, 130.0, 178.0, 220.0, 336.0, 542.0, 785.0, 1316.0, 2555.0, 5990.0, 18175.0, 89577.0, 564835.0, 299738.0, 43475.0, 11083.0, 4007.0, 2009.0, 1081.0, 667.0, 417.0, 308.0, 220.0, 154.0, 93.0, 99.0, 56.0, 40.0, 30.0, 31.0, 19.0, 11.0, 10.0, 8.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.62890625, -7.39630126953125, -7.1636962890625, -6.93109130859375, -6.698486328125, -6.46588134765625, -6.2332763671875, -6.00067138671875, -5.76806640625, -5.53546142578125, -5.3028564453125, -5.07025146484375, -4.837646484375, -4.60504150390625, -4.3724365234375, -4.13983154296875, -3.9072265625, -3.67462158203125, -3.4420166015625, -3.20941162109375, -2.976806640625, -2.74420166015625, -2.5115966796875, -2.27899169921875, -2.04638671875, -1.81378173828125, -1.5811767578125, -1.34857177734375, -1.115966796875, -0.88336181640625, -0.6507568359375, -0.41815185546875, -0.185546875, 0.04705810546875, 0.2796630859375, 0.51226806640625, 0.744873046875, 0.97747802734375, 1.2100830078125, 1.44268798828125, 1.67529296875, 1.90789794921875, 2.1405029296875, 2.37310791015625, 2.605712890625, 2.83831787109375, 3.0709228515625, 3.30352783203125, 3.5361328125, 3.76873779296875, 4.0013427734375, 4.23394775390625, 4.466552734375, 4.69915771484375, 4.9317626953125, 5.16436767578125, 5.39697265625, 5.62957763671875, 5.8621826171875, 6.09478759765625, 6.327392578125, 6.55999755859375, 6.7926025390625, 7.02520751953125, 7.2578125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 0.0, 8.0, 13.0, 10.0, 12.0, 15.0, 23.0, 24.0, 31.0, 43.0, 37.0, 53.0, 46.0, 98.0, 180.0, 1570.0, 338.0, 133.0, 78.0, 74.0, 48.0, 34.0, 34.0, 33.0, 23.0, 13.0, 9.0, 16.0, 12.0, 6.0, 4.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.609375, -13.2183837890625, -12.827392578125, -12.4364013671875, -12.04541015625, -11.6544189453125, -11.263427734375, -10.8724365234375, -10.4814453125, -10.0904541015625, -9.699462890625, -9.3084716796875, -8.91748046875, -8.5264892578125, -8.135498046875, -7.7445068359375, -7.353515625, -6.9625244140625, -6.571533203125, -6.1805419921875, -5.78955078125, -5.3985595703125, -5.007568359375, -4.6165771484375, -4.2255859375, -3.8345947265625, -3.443603515625, -3.0526123046875, -2.66162109375, -2.2706298828125, -1.879638671875, -1.4886474609375, -1.09765625, -0.7066650390625, -0.315673828125, 0.0753173828125, 0.46630859375, 0.8572998046875, 1.248291015625, 1.6392822265625, 2.0302734375, 2.4212646484375, 2.812255859375, 3.2032470703125, 3.59423828125, 3.9852294921875, 4.376220703125, 4.7672119140625, 5.158203125, 5.5491943359375, 5.940185546875, 6.3311767578125, 6.72216796875, 7.1131591796875, 7.504150390625, 7.8951416015625, 8.2861328125, 8.6771240234375, 9.068115234375, 9.4591064453125, 9.85009765625, 10.2410888671875, 10.632080078125, 11.0230712890625, 11.4140625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 10.0, 10.0, 15.0, 16.0, 44.0, 54.0, 67.0, 90.0, 126.0, 241.0, 402.0, 992.0, 8424.0, 3124440.0, 8577.0, 990.0, 435.0, 238.0, 167.0, 110.0, 71.0, 50.0, 32.0, 14.0, 21.0, 14.0, 3.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.578125, -22.653564453125, -21.72900390625, -20.804443359375, -19.8798828125, -18.955322265625, -18.03076171875, -17.106201171875, -16.181640625, -15.257080078125, -14.33251953125, -13.407958984375, -12.4833984375, -11.558837890625, -10.63427734375, -9.709716796875, -8.78515625, -7.860595703125, -6.93603515625, -6.011474609375, -5.0869140625, -4.162353515625, -3.23779296875, -2.313232421875, -1.388671875, -0.464111328125, 0.46044921875, 1.385009765625, 2.3095703125, 3.234130859375, 4.15869140625, 5.083251953125, 6.0078125, 6.932373046875, 7.85693359375, 8.781494140625, 9.7060546875, 10.630615234375, 11.55517578125, 12.479736328125, 13.404296875, 14.328857421875, 15.25341796875, 16.177978515625, 17.1025390625, 18.027099609375, 18.95166015625, 19.876220703125, 20.80078125, 21.725341796875, 22.64990234375, 23.574462890625, 24.4990234375, 25.423583984375, 26.34814453125, 27.272705078125, 28.197265625, 29.121826171875, 30.04638671875, 30.970947265625, 31.8955078125, 32.820068359375, 33.74462890625, 34.669189453125, 35.59375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 53.0, 615.0, 336.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.44959259033203, -66.53363037109375, -63.61766815185547, -60.70170593261719, -57.785743713378906, -54.869781494140625, -51.953819274902344, -49.03785705566406, -46.12189483642578, -43.2059326171875, -40.28997039794922, -37.37400817871094, -34.458045959472656, -31.542083740234375, -28.62611961364746, -25.71015739440918, -22.794193267822266, -19.878231048583984, -16.962268829345703, -14.046305656433105, -11.130343437194824, -8.214381217956543, -5.298418045043945, -2.382455825805664, 0.5335063934326172, 3.4494688510894775, 6.365431308746338, 9.281394004821777, 12.197356224060059, 15.11331844329834, 18.029281616210938, 20.94524383544922, 23.8612060546875, 26.77716827392578, 29.693130493164062, 32.609092712402344, 35.525054931640625, 38.441017150878906, 41.35697937011719, 44.27294158935547, 47.18890380859375, 50.10486602783203, 53.02082824707031, 55.936790466308594, 58.852752685546875, 61.768714904785156, 64.68467712402344, 67.60063934326172, 70.5166015625, 73.43256378173828, 76.34852600097656, 79.26448822021484, 82.18045043945312, 85.0964126586914, 88.01237487792969, 90.92833709716797, 93.84430694580078, 96.76026916503906, 99.67623138427734, 102.59219360351562, 105.5081558227539, 108.42411804199219, 111.34008026123047, 114.25604248046875, 117.17200469970703]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 9.0, 8.0, 16.0, 16.0, 23.0, 22.0, 30.0, 31.0, 30.0, 37.0, 32.0, 35.0, 48.0, 47.0, 44.0, 45.0, 54.0, 41.0, 46.0, 38.0, 41.0, 33.0, 44.0, 33.0, 33.0, 29.0, 26.0, 22.0, 22.0, 14.0, 9.0, 9.0, 5.0, 6.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.248985290527344, -33.392330169677734, -32.53567886352539, -31.679025650024414, -30.822372436523438, -29.965717315673828, -29.109066009521484, -28.252410888671875, -27.3957576751709, -26.539104461669922, -25.682451248168945, -24.82579803466797, -23.969144821166992, -23.112491607666016, -22.255836486816406, -21.39918327331543, -20.542530059814453, -19.685876846313477, -18.8292236328125, -17.972570419311523, -17.115917205810547, -16.259262084960938, -15.402609825134277, -14.545955657958984, -13.68930435180664, -12.832651138305664, -11.975997924804688, -11.119344711303711, -10.262690544128418, -9.406037330627441, -8.549384117126465, -7.69273042678833, -6.836076736450195, -5.979423522949219, -5.122769832611084, -4.266116619110107, -3.4094631671905518, -2.552809715270996, -1.6961565017700195, -0.8395028114318848, 0.017150402069091797, 0.8738037943840027, 1.7304571866989136, 2.5871105194091797, 3.4437639713287354, 4.300417423248291, 5.157070636749268, 6.013724327087402, 6.870377540588379, 7.7270307540893555, 8.583683967590332, 9.440338134765625, 10.296991348266602, 11.153644561767578, 12.010297775268555, 12.866950988769531, 13.723604202270508, 14.580257415771484, 15.436910629272461, 16.293563842773438, 17.150217056274414, 18.00687026977539, 18.863525390625, 19.720178604125977, 20.576831817626953]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 9.0, 1.0, 8.0, 4.0, 8.0, 11.0, 19.0, 16.0, 13.0, 23.0, 23.0, 33.0, 26.0, 22.0, 42.0, 28.0, 33.0, 40.0, 44.0, 37.0, 35.0, 41.0, 50.0, 44.0, 46.0, 30.0, 36.0, 41.0, 28.0, 27.0, 24.0, 20.0, 19.0, 16.0, 25.0, 14.0, 13.0, 9.0, 11.0, 10.0, 10.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.06640625, -3.92877197265625, -3.7911376953125, -3.65350341796875, -3.515869140625, -3.37823486328125, -3.2406005859375, -3.10296630859375, -2.96533203125, -2.82769775390625, -2.6900634765625, -2.55242919921875, -2.414794921875, -2.27716064453125, -2.1395263671875, -2.00189208984375, -1.8642578125, -1.72662353515625, -1.5889892578125, -1.45135498046875, -1.313720703125, -1.17608642578125, -1.0384521484375, -0.90081787109375, -0.76318359375, -0.62554931640625, -0.4879150390625, -0.35028076171875, -0.212646484375, -0.07501220703125, 0.0626220703125, 0.20025634765625, 0.337890625, 0.47552490234375, 0.6131591796875, 0.75079345703125, 0.888427734375, 1.02606201171875, 1.1636962890625, 1.30133056640625, 1.43896484375, 1.57659912109375, 1.7142333984375, 1.85186767578125, 1.989501953125, 2.12713623046875, 2.2647705078125, 2.40240478515625, 2.5400390625, 2.67767333984375, 2.8153076171875, 2.95294189453125, 3.090576171875, 3.22821044921875, 3.3658447265625, 3.50347900390625, 3.64111328125, 3.77874755859375, 3.9163818359375, 4.05401611328125, 4.191650390625, 4.32928466796875, 4.4669189453125, 4.60455322265625, 4.7421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 13.0, 17.0, 25.0, 20.0, 37.0, 49.0, 75.0, 102.0, 124.0, 155.0, 227.0, 354.0, 509.0, 840.0, 1456.0, 6730.0, 693906.0, 3455081.0, 29020.0, 2512.0, 1009.0, 611.0, 399.0, 256.0, 206.0, 141.0, 91.0, 72.0, 77.0, 51.0, 34.0, 21.0, 21.0, 12.0, 7.0, 4.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.203125, -27.354248046875, -26.50537109375, -25.656494140625, -24.8076171875, -23.958740234375, -23.10986328125, -22.260986328125, -21.412109375, -20.563232421875, -19.71435546875, -18.865478515625, -18.0166015625, -17.167724609375, -16.31884765625, -15.469970703125, -14.62109375, -13.772216796875, -12.92333984375, -12.074462890625, -11.2255859375, -10.376708984375, -9.52783203125, -8.678955078125, -7.830078125, -6.981201171875, -6.13232421875, -5.283447265625, -4.4345703125, -3.585693359375, -2.73681640625, -1.887939453125, -1.0390625, -0.190185546875, 0.65869140625, 1.507568359375, 2.3564453125, 3.205322265625, 4.05419921875, 4.903076171875, 5.751953125, 6.600830078125, 7.44970703125, 8.298583984375, 9.1474609375, 9.996337890625, 10.84521484375, 11.694091796875, 12.54296875, 13.391845703125, 14.24072265625, 15.089599609375, 15.9384765625, 16.787353515625, 17.63623046875, 18.485107421875, 19.333984375, 20.182861328125, 21.03173828125, 21.880615234375, 22.7294921875, 23.578369140625, 24.42724609375, 25.276123046875, 26.125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 22.0, 20.0, 48.0, 82.0, 150.0, 233.0, 418.0, 665.0, 788.0, 671.0, 438.0, 205.0, 140.0, 79.0, 41.0, 23.0, 15.0, 10.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.0078125, -13.653564453125, -13.29931640625, -12.945068359375, -12.5908203125, -12.236572265625, -11.88232421875, -11.528076171875, -11.173828125, -10.819580078125, -10.46533203125, -10.111083984375, -9.7568359375, -9.402587890625, -9.04833984375, -8.694091796875, -8.33984375, -7.985595703125, -7.63134765625, -7.277099609375, -6.9228515625, -6.568603515625, -6.21435546875, -5.860107421875, -5.505859375, -5.151611328125, -4.79736328125, -4.443115234375, -4.0888671875, -3.734619140625, -3.38037109375, -3.026123046875, -2.671875, -2.317626953125, -1.96337890625, -1.609130859375, -1.2548828125, -0.900634765625, -0.54638671875, -0.192138671875, 0.162109375, 0.516357421875, 0.87060546875, 1.224853515625, 1.5791015625, 1.933349609375, 2.28759765625, 2.641845703125, 2.99609375, 3.350341796875, 3.70458984375, 4.058837890625, 4.4130859375, 4.767333984375, 5.12158203125, 5.475830078125, 5.830078125, 6.184326171875, 6.53857421875, 6.892822265625, 7.2470703125, 7.601318359375, 7.95556640625, 8.309814453125, 8.6640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 4.0, 9.0, 11.0, 17.0, 28.0, 61.0, 114.0, 243.0, 522.0, 1129.0, 2822.0, 10499.0, 87034.0, 1803020.0, 2163740.0, 107647.0, 12033.0, 3160.0, 1169.0, 528.0, 215.0, 107.0, 61.0, 34.0, 20.0, 11.0, 10.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.4254150390625, -9.100830078125, -8.7762451171875, -8.45166015625, -8.1270751953125, -7.802490234375, -7.4779052734375, -7.1533203125, -6.8287353515625, -6.504150390625, -6.1795654296875, -5.85498046875, -5.5303955078125, -5.205810546875, -4.8812255859375, -4.556640625, -4.2320556640625, -3.907470703125, -3.5828857421875, -3.25830078125, -2.9337158203125, -2.609130859375, -2.2845458984375, -1.9599609375, -1.6353759765625, -1.310791015625, -0.9862060546875, -0.66162109375, -0.3370361328125, -0.012451171875, 0.3121337890625, 0.63671875, 0.9613037109375, 1.285888671875, 1.6104736328125, 1.93505859375, 2.2596435546875, 2.584228515625, 2.9088134765625, 3.2333984375, 3.5579833984375, 3.882568359375, 4.2071533203125, 4.53173828125, 4.8563232421875, 5.180908203125, 5.5054931640625, 5.830078125, 6.1546630859375, 6.479248046875, 6.8038330078125, 7.12841796875, 7.4530029296875, 7.777587890625, 8.1021728515625, 8.4267578125, 8.7513427734375, 9.075927734375, 9.4005126953125, 9.72509765625, 10.0496826171875, 10.374267578125, 10.6988525390625, 11.0234375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 12.0, 22.0, 41.0, 34.0, 90.0, 120.0, 135.0, 142.0, 133.0, 100.0, 66.0, 53.0, 25.0, 17.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.958391189575195, -25.867084503173828, -23.77577781677246, -21.684471130371094, -19.59316635131836, -17.50185775756836, -15.410552978515625, -13.319246292114258, -11.22793960571289, -9.136632919311523, -7.0453267097473145, -4.9540205001831055, -2.8627138137817383, -0.7714071273803711, 1.3198986053466797, 3.411205291748047, 5.502511978149414, 7.593818664550781, 9.685125350952148, 11.7764310836792, 13.867737770080566, 15.959044456481934, 18.050350189208984, 20.14165687561035, 22.23296356201172, 24.324270248413086, 26.415576934814453, 28.506881713867188, 30.598190307617188, 32.68949508666992, 34.780799865722656, 36.872108459472656, 38.963409423828125, 41.05471420288086, 43.14602279663086, 45.237327575683594, 47.328636169433594, 49.41994094848633, 51.51124572753906, 53.60255432128906, 55.69386291503906, 57.7851676940918, 59.8764762878418, 61.96778106689453, 64.05908966064453, 66.15039825439453, 68.24169921875, 70.3330078125, 72.42431640625, 74.515625, 76.60692596435547, 78.69823455810547, 80.78954315185547, 82.88085174560547, 84.97215270996094, 87.06346130371094, 89.1547622680664, 91.2460708618164, 93.33737182617188, 95.42868041992188, 97.51998901367188, 99.61129760742188, 101.70259857177734, 103.79390716552734, 105.88521575927734]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 3.0, 7.0, 3.0, 1.0, 7.0, 5.0, 9.0, 6.0, 13.0, 18.0, 18.0, 21.0, 18.0, 28.0, 28.0, 32.0, 34.0, 27.0, 23.0, 36.0, 37.0, 43.0, 41.0, 44.0, 29.0, 42.0, 33.0, 33.0, 30.0, 31.0, 22.0, 37.0, 41.0, 20.0, 26.0, 19.0, 14.0, 14.0, 15.0, 19.0, 13.0, 9.0, 11.0, 8.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.928709030151367, -21.200014114379883, -20.4713191986084, -19.742624282836914, -19.01392936706543, -18.285234451293945, -17.556537628173828, -16.827842712402344, -16.09914779663086, -15.370452880859375, -14.64175796508789, -13.913063049316406, -13.184368133544922, -12.455673217773438, -11.726977348327637, -10.998282432556152, -10.269588470458984, -9.5408935546875, -8.812198638916016, -8.083503723144531, -7.354808330535889, -6.626113414764404, -5.897418022155762, -5.168723106384277, -4.440028190612793, -3.7113332748413086, -2.982638120651245, -2.2539429664611816, -1.5252480506896973, -0.7965531349182129, -0.06785774230957031, 0.6608371734619141, 1.3895339965820312, 2.1182289123535156, 2.846924066543579, 3.5756192207336426, 4.304314136505127, 5.033009052276611, 5.761704444885254, 6.490399360656738, 7.219094276428223, 7.947789192199707, 8.676484107971191, 9.405179977416992, 10.133874893188477, 10.862569808959961, 11.591264724731445, 12.31995964050293, 13.048654556274414, 13.777349472045898, 14.506044387817383, 15.234739303588867, 15.963434219360352, 16.692129135131836, 17.420825958251953, 18.149520874023438, 18.878215789794922, 19.606910705566406, 20.33560562133789, 21.064300537109375, 21.79299545288086, 22.521690368652344, 23.250385284423828, 23.979080200195312, 24.707775115966797]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 4.0, 6.0, 3.0, 4.0, 2.0, 12.0, 12.0, 5.0, 13.0, 12.0, 23.0, 19.0, 16.0, 20.0, 26.0, 31.0, 39.0, 30.0, 29.0, 45.0, 36.0, 34.0, 38.0, 41.0, 40.0, 30.0, 36.0, 34.0, 32.0, 28.0, 35.0, 34.0, 32.0, 30.0, 23.0, 20.0, 21.0, 11.0, 16.0, 10.0, 11.0, 11.0, 10.0, 6.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.5, -38.18310546875, -36.8662109375, -35.54931640625, -34.232421875, -32.91552734375, -31.5986328125, -30.28173828125, -28.96484375, -27.64794921875, -26.3310546875, -25.01416015625, -23.697265625, -22.38037109375, -21.0634765625, -19.74658203125, -18.4296875, -17.11279296875, -15.7958984375, -14.47900390625, -13.162109375, -11.84521484375, -10.5283203125, -9.21142578125, -7.89453125, -6.57763671875, -5.2607421875, -3.94384765625, -2.626953125, -1.31005859375, 0.0068359375, 1.32373046875, 2.640625, 3.95751953125, 5.2744140625, 6.59130859375, 7.908203125, 9.22509765625, 10.5419921875, 11.85888671875, 13.17578125, 14.49267578125, 15.8095703125, 17.12646484375, 18.443359375, 19.76025390625, 21.0771484375, 22.39404296875, 23.7109375, 25.02783203125, 26.3447265625, 27.66162109375, 28.978515625, 30.29541015625, 31.6123046875, 32.92919921875, 34.24609375, 35.56298828125, 36.8798828125, 38.19677734375, 39.513671875, 40.83056640625, 42.1474609375, 43.46435546875, 44.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 13.0, 15.0, 29.0, 20.0, 31.0, 42.0, 90.0, 124.0, 190.0, 324.0, 528.0, 953.0, 1588.0, 2672.0, 4678.0, 8341.0, 14157.0, 25141.0, 46007.0, 85644.0, 159931.0, 257204.0, 200036.0, 108773.0, 58503.0, 31504.0, 17821.0, 10231.0, 5782.0, 3352.0, 1968.0, 1155.0, 641.0, 408.0, 225.0, 156.0, 105.0, 58.0, 40.0, 21.0, 14.0, 14.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.837158203125, -5.64697265625, -5.456787109375, -5.2666015625, -5.076416015625, -4.88623046875, -4.696044921875, -4.505859375, -4.315673828125, -4.12548828125, -3.935302734375, -3.7451171875, -3.554931640625, -3.36474609375, -3.174560546875, -2.984375, -2.794189453125, -2.60400390625, -2.413818359375, -2.2236328125, -2.033447265625, -1.84326171875, -1.653076171875, -1.462890625, -1.272705078125, -1.08251953125, -0.892333984375, -0.7021484375, -0.511962890625, -0.32177734375, -0.131591796875, 0.05859375, 0.248779296875, 0.43896484375, 0.629150390625, 0.8193359375, 1.009521484375, 1.19970703125, 1.389892578125, 1.580078125, 1.770263671875, 1.96044921875, 2.150634765625, 2.3408203125, 2.531005859375, 2.72119140625, 2.911376953125, 3.1015625, 3.291748046875, 3.48193359375, 3.672119140625, 3.8623046875, 4.052490234375, 4.24267578125, 4.432861328125, 4.623046875, 4.813232421875, 5.00341796875, 5.193603515625, 5.3837890625, 5.573974609375, 5.76416015625, 5.954345703125, 6.14453125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 1.0, 8.0, 0.0, 2.0, 6.0, 6.0, 11.0, 9.0, 14.0, 15.0, 17.0, 21.0, 16.0, 30.0, 23.0, 21.0, 25.0, 21.0, 29.0, 35.0, 31.0, 43.0, 39.0, 22.0, 46.0, 1055.0, 39.0, 31.0, 25.0, 34.0, 31.0, 42.0, 29.0, 21.0, 23.0, 19.0, 28.0, 20.0, 19.0, 15.0, 13.0, 19.0, 13.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 1.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0], "bins": [-24.046875, -23.29638671875, -22.5458984375, -21.79541015625, -21.044921875, -20.29443359375, -19.5439453125, -18.79345703125, -18.04296875, -17.29248046875, -16.5419921875, -15.79150390625, -15.041015625, -14.29052734375, -13.5400390625, -12.78955078125, -12.0390625, -11.28857421875, -10.5380859375, -9.78759765625, -9.037109375, -8.28662109375, -7.5361328125, -6.78564453125, -6.03515625, -5.28466796875, -4.5341796875, -3.78369140625, -3.033203125, -2.28271484375, -1.5322265625, -0.78173828125, -0.03125, 0.71923828125, 1.4697265625, 2.22021484375, 2.970703125, 3.72119140625, 4.4716796875, 5.22216796875, 5.97265625, 6.72314453125, 7.4736328125, 8.22412109375, 8.974609375, 9.72509765625, 10.4755859375, 11.22607421875, 11.9765625, 12.72705078125, 13.4775390625, 14.22802734375, 14.978515625, 15.72900390625, 16.4794921875, 17.22998046875, 17.98046875, 18.73095703125, 19.4814453125, 20.23193359375, 20.982421875, 21.73291015625, 22.4833984375, 23.23388671875, 23.984375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 22.0, 25.0, 31.0, 42.0, 78.0, 129.0, 192.0, 245.0, 353.0, 509.0, 802.0, 1045.0, 1579.0, 2486.0, 3755.0, 5529.0, 8362.0, 12954.0, 19888.0, 31231.0, 48995.0, 77726.0, 125267.0, 1117557.0, 310175.0, 120195.0, 74909.0, 47102.0, 30156.0, 18884.0, 12482.0, 8164.0, 5334.0, 3460.0, 2367.0, 1649.0, 1093.0, 740.0, 518.0, 344.0, 223.0, 179.0, 105.0, 77.0, 53.0, 54.0, 20.0, 18.0, 10.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.4453125, -4.3104248046875, -4.175537109375, -4.0406494140625, -3.90576171875, -3.7708740234375, -3.635986328125, -3.5010986328125, -3.3662109375, -3.2313232421875, -3.096435546875, -2.9615478515625, -2.82666015625, -2.6917724609375, -2.556884765625, -2.4219970703125, -2.287109375, -2.1522216796875, -2.017333984375, -1.8824462890625, -1.74755859375, -1.6126708984375, -1.477783203125, -1.3428955078125, -1.2080078125, -1.0731201171875, -0.938232421875, -0.8033447265625, -0.66845703125, -0.5335693359375, -0.398681640625, -0.2637939453125, -0.12890625, 0.0059814453125, 0.140869140625, 0.2757568359375, 0.41064453125, 0.5455322265625, 0.680419921875, 0.8153076171875, 0.9501953125, 1.0850830078125, 1.219970703125, 1.3548583984375, 1.48974609375, 1.6246337890625, 1.759521484375, 1.8944091796875, 2.029296875, 2.1641845703125, 2.299072265625, 2.4339599609375, 2.56884765625, 2.7037353515625, 2.838623046875, 2.9735107421875, 3.1083984375, 3.2432861328125, 3.378173828125, 3.5130615234375, 3.64794921875, 3.7828369140625, 3.917724609375, 4.0526123046875, 4.1875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 12.0, 15.0, 4.0, 20.0, 15.0, 26.0, 26.0, 39.0, 45.0, 61.0, 77.0, 97.0, 102.0, 105.0, 49.0, 48.0, 54.0, 37.0, 37.0, 28.0, 17.0, 16.0, 13.0, 16.0, 11.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047393798828125, -0.045804500579833984, -0.04421520233154297, -0.04262590408325195, -0.04103660583496094, -0.03944730758666992, -0.037858009338378906, -0.03626871109008789, -0.034679412841796875, -0.03309011459350586, -0.031500816345214844, -0.029911518096923828, -0.028322219848632812, -0.026732921600341797, -0.02514362335205078, -0.023554325103759766, -0.02196502685546875, -0.020375728607177734, -0.01878643035888672, -0.017197132110595703, -0.015607833862304688, -0.014018535614013672, -0.012429237365722656, -0.01083993911743164, -0.009250640869140625, -0.007661342620849609, -0.006072044372558594, -0.004482746124267578, -0.0028934478759765625, -0.0013041496276855469, 0.00028514862060546875, 0.0018744468688964844, 0.0034637451171875, 0.005053043365478516, 0.006642341613769531, 0.008231639862060547, 0.009820938110351562, 0.011410236358642578, 0.012999534606933594, 0.01458883285522461, 0.016178131103515625, 0.01776742935180664, 0.019356727600097656, 0.020946025848388672, 0.022535324096679688, 0.024124622344970703, 0.02571392059326172, 0.027303218841552734, 0.02889251708984375, 0.030481815338134766, 0.03207111358642578, 0.0336604118347168, 0.03524971008300781, 0.03683900833129883, 0.038428306579589844, 0.04001760482788086, 0.041606903076171875, 0.04319620132446289, 0.044785499572753906, 0.04637479782104492, 0.04796409606933594, 0.04955339431762695, 0.05114269256591797, 0.052731990814208984, 0.0543212890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 13.0, 24.0, 29.0, 45.0, 42.0, 76.0, 118.0, 167.0, 265.0, 427.0, 710.0, 1351.0, 2857.0, 6552.0, 16466.0, 48685.0, 181483.0, 569302.0, 151105.0, 42479.0, 14683.0, 5957.0, 2534.0, 1307.0, 702.0, 386.0, 222.0, 157.0, 113.0, 77.0, 50.0, 38.0, 28.0, 16.0, 15.0, 15.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.2890625, -0.28041839599609375, -0.2717742919921875, -0.26313018798828125, -0.254486083984375, -0.24584197998046875, -0.2371978759765625, -0.22855377197265625, -0.21990966796875, -0.21126556396484375, -0.2026214599609375, -0.19397735595703125, -0.185333251953125, -0.17668914794921875, -0.1680450439453125, -0.15940093994140625, -0.1507568359375, -0.14211273193359375, -0.1334686279296875, -0.12482452392578125, -0.116180419921875, -0.10753631591796875, -0.0988922119140625, -0.09024810791015625, -0.08160400390625, -0.07295989990234375, -0.0643157958984375, -0.05567169189453125, -0.047027587890625, -0.03838348388671875, -0.0297393798828125, -0.02109527587890625, -0.012451171875, -0.00380706787109375, 0.0048370361328125, 0.01348114013671875, 0.022125244140625, 0.03076934814453125, 0.0394134521484375, 0.04805755615234375, 0.05670166015625, 0.06534576416015625, 0.0739898681640625, 0.08263397216796875, 0.091278076171875, 0.09992218017578125, 0.1085662841796875, 0.11721038818359375, 0.1258544921875, 0.13449859619140625, 0.1431427001953125, 0.15178680419921875, 0.160430908203125, 0.16907501220703125, 0.1777191162109375, 0.18636322021484375, 0.19500732421875, 0.20365142822265625, 0.2122955322265625, 0.22093963623046875, 0.229583740234375, 0.23822784423828125, 0.2468719482421875, 0.25551605224609375, 0.26416015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 15.0, 18.0, 39.0, 75.0, 101.0, 166.0, 198.0, 161.0, 108.0, 63.0, 28.0, 13.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09357429295778275, -0.09071171283721924, -0.08784912526607513, -0.08498654514551163, -0.08212395757436752, -0.07926137745380402, -0.07639878988265991, -0.0735362097620964, -0.0706736296415329, -0.06781104952096939, -0.06494846194982529, -0.06208588182926178, -0.059223294258117676, -0.05636071413755417, -0.05349813029170036, -0.05063554644584656, -0.047772958874702454, -0.04491037502884865, -0.04204779118299484, -0.039185211062431335, -0.03632262349128723, -0.033460043370723724, -0.03059745952486992, -0.027734875679016113, -0.024872291833162308, -0.022009707987308502, -0.019147124141454697, -0.01628454215824604, -0.013421958312392235, -0.01055937446653843, -0.007696792483329773, -0.004834208637475967, -0.001971632242202759, 0.0008909511379897594, 0.0037535345181822777, 0.006616117432713509, 0.009478701278567314, 0.01234128512442112, 0.015203867107629776, 0.01806645095348358, 0.020929034799337387, 0.023791618645191193, 0.026654202491044998, 0.029516784474253654, 0.03237936645746231, 0.035241954028606415, 0.03810453414916992, 0.04096711799502373, 0.04382970184087753, 0.04669228568673134, 0.049554869532585144, 0.05241744965314865, 0.055280037224292755, 0.05814261734485626, 0.06100520119071007, 0.06386778503656387, 0.06673036515712738, 0.06959294527769089, 0.07245553284883499, 0.0753181129693985, 0.0781807005405426, 0.08104328066110611, 0.08390586078166962, 0.08676844835281372, 0.08963103592395782]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 10.0, 10.0, 14.0, 10.0, 18.0, 13.0, 13.0, 19.0, 22.0, 26.0, 30.0, 32.0, 41.0, 32.0, 45.0, 41.0, 31.0, 34.0, 39.0, 60.0, 39.0, 46.0, 42.0, 35.0, 31.0, 36.0, 27.0, 24.0, 32.0, 19.0, 17.0, 20.0, 21.0, 12.0, 13.0, 11.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.022138595581054688, -0.02141142636537552, -0.0206842552870512, -0.019957084208726883, -0.019229914993047714, -0.018502745777368546, -0.017775574699044228, -0.01704840362071991, -0.01632123440504074, -0.015594064258038998, -0.014866894111037254, -0.014139723964035511, -0.013412553817033768, -0.012685383670032024, -0.011958213523030281, -0.011231043376028538, -0.010503873229026794, -0.009776703082025051, -0.009049532935023308, -0.008322362788021564, -0.007595192641019821, -0.006868022494018078, -0.0061408523470163345, -0.005413682200014591, -0.004686512053012848, -0.003959341906011105, -0.0032321717590093613, -0.002505001612007618, -0.0017778314650058746, -0.0010506613180041313, -0.000323491171002388, 0.0004036789759993553, 0.0011308491230010986, 0.001858019270002842, 0.0025851894170045853, 0.0033123595640063286, 0.004039529711008072, 0.004766699858009815, 0.0054938700050115585, 0.006221040152013302, 0.006948210299015045, 0.0076753804460167885, 0.008402550593018532, 0.009129720740020275, 0.009856890887022018, 0.010584061034023762, 0.011311231181025505, 0.012038401328027248, 0.012765571475028992, 0.013492741622030735, 0.014219911769032478, 0.014947081916034222, 0.015674252063035965, 0.016401421278715134, 0.01712859235703945, 0.01785576343536377, 0.018582932651042938, 0.019310101866722107, 0.020037272945046425, 0.020764444023370743, 0.02149161323904991, 0.02221878245472908, 0.022945953533053398, 0.023673124611377716, 0.024400293827056885]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 1.0, 5.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 11.0, 13.0, 6.0, 14.0, 10.0, 23.0, 19.0, 17.0, 20.0, 27.0, 30.0, 40.0, 28.0, 31.0, 42.0, 37.0, 35.0, 39.0, 42.0, 38.0, 31.0, 33.0, 35.0, 34.0, 24.0, 39.0, 32.0, 32.0, 30.0, 23.0, 23.0, 18.0, 10.0, 17.0, 10.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.4375, -38.12158203125, -36.8056640625, -35.48974609375, -34.173828125, -32.85791015625, -31.5419921875, -30.22607421875, -28.91015625, -27.59423828125, -26.2783203125, -24.96240234375, -23.646484375, -22.33056640625, -21.0146484375, -19.69873046875, -18.3828125, -17.06689453125, -15.7509765625, -14.43505859375, -13.119140625, -11.80322265625, -10.4873046875, -9.17138671875, -7.85546875, -6.53955078125, -5.2236328125, -3.90771484375, -2.591796875, -1.27587890625, 0.0400390625, 1.35595703125, 2.671875, 3.98779296875, 5.3037109375, 6.61962890625, 7.935546875, 9.25146484375, 10.5673828125, 11.88330078125, 13.19921875, 14.51513671875, 15.8310546875, 17.14697265625, 18.462890625, 19.77880859375, 21.0947265625, 22.41064453125, 23.7265625, 25.04248046875, 26.3583984375, 27.67431640625, 28.990234375, 30.30615234375, 31.6220703125, 32.93798828125, 34.25390625, 35.56982421875, 36.8857421875, 38.20166015625, 39.517578125, 40.83349609375, 42.1494140625, 43.46533203125, 44.78125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 15.0, 9.0, 17.0, 20.0, 29.0, 32.0, 64.0, 80.0, 111.0, 164.0, 212.0, 342.0, 570.0, 940.0, 1706.0, 3389.0, 7741.0, 20508.0, 70405.0, 276679.0, 456813.0, 146425.0, 38768.0, 12468.0, 5061.0, 2507.0, 1298.0, 733.0, 437.0, 297.0, 206.0, 122.0, 95.0, 79.0, 57.0, 34.0, 19.0, 12.0, 16.0, 12.0, 12.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0], "bins": [-9.0625, -8.79803466796875, -8.5335693359375, -8.26910400390625, -8.004638671875, -7.74017333984375, -7.4757080078125, -7.21124267578125, -6.94677734375, -6.68231201171875, -6.4178466796875, -6.15338134765625, -5.888916015625, -5.62445068359375, -5.3599853515625, -5.09552001953125, -4.8310546875, -4.56658935546875, -4.3021240234375, -4.03765869140625, -3.773193359375, -3.50872802734375, -3.2442626953125, -2.97979736328125, -2.71533203125, -2.45086669921875, -2.1864013671875, -1.92193603515625, -1.657470703125, -1.39300537109375, -1.1285400390625, -0.86407470703125, -0.599609375, -0.33514404296875, -0.0706787109375, 0.19378662109375, 0.458251953125, 0.72271728515625, 0.9871826171875, 1.25164794921875, 1.51611328125, 1.78057861328125, 2.0450439453125, 2.30950927734375, 2.573974609375, 2.83843994140625, 3.1029052734375, 3.36737060546875, 3.6318359375, 3.89630126953125, 4.1607666015625, 4.42523193359375, 4.689697265625, 4.95416259765625, 5.2186279296875, 5.48309326171875, 5.74755859375, 6.01202392578125, 6.2764892578125, 6.54095458984375, 6.805419921875, 7.06988525390625, 7.3343505859375, 7.59881591796875, 7.86328125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 13.0, 16.0, 25.0, 36.0, 44.0, 51.0, 63.0, 79.0, 101.0, 2127.0, 116.0, 94.0, 70.0, 58.0, 47.0, 26.0, 27.0, 23.0, 10.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.625, -149.1796875, -144.734375, -140.2890625, -135.84375, -131.3984375, -126.953125, -122.5078125, -118.0625, -113.6171875, -109.171875, -104.7265625, -100.28125, -95.8359375, -91.390625, -86.9453125, -82.5, -78.0546875, -73.609375, -69.1640625, -64.71875, -60.2734375, -55.828125, -51.3828125, -46.9375, -42.4921875, -38.046875, -33.6015625, -29.15625, -24.7109375, -20.265625, -15.8203125, -11.375, -6.9296875, -2.484375, 1.9609375, 6.40625, 10.8515625, 15.296875, 19.7421875, 24.1875, 28.6328125, 33.078125, 37.5234375, 41.96875, 46.4140625, 50.859375, 55.3046875, 59.75, 64.1953125, 68.640625, 73.0859375, 77.53125, 81.9765625, 86.421875, 90.8671875, 95.3125, 99.7578125, 104.203125, 108.6484375, 113.09375, 117.5390625, 121.984375, 126.4296875, 130.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 11.0, 4.0, 5.0, 6.0, 10.0, 10.0, 21.0, 19.0, 37.0, 66.0, 114.0, 174.0, 285.0, 482.0, 831.0, 2026.0, 9682.0, 195206.0, 2883997.0, 45393.0, 4307.0, 1298.0, 698.0, 388.0, 226.0, 154.0, 103.0, 51.0, 39.0, 17.0, 10.0, 15.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.40625, -19.732421875, -19.05859375, -18.384765625, -17.7109375, -17.037109375, -16.36328125, -15.689453125, -15.015625, -14.341796875, -13.66796875, -12.994140625, -12.3203125, -11.646484375, -10.97265625, -10.298828125, -9.625, -8.951171875, -8.27734375, -7.603515625, -6.9296875, -6.255859375, -5.58203125, -4.908203125, -4.234375, -3.560546875, -2.88671875, -2.212890625, -1.5390625, -0.865234375, -0.19140625, 0.482421875, 1.15625, 1.830078125, 2.50390625, 3.177734375, 3.8515625, 4.525390625, 5.19921875, 5.873046875, 6.546875, 7.220703125, 7.89453125, 8.568359375, 9.2421875, 9.916015625, 10.58984375, 11.263671875, 11.9375, 12.611328125, 13.28515625, 13.958984375, 14.6328125, 15.306640625, 15.98046875, 16.654296875, 17.328125, 18.001953125, 18.67578125, 19.349609375, 20.0234375, 20.697265625, 21.37109375, 22.044921875, 22.71875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 45.0, 103.0, 263.0, 295.0, 170.0, 68.0, 25.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5347900390625, -257.50286865234375, -249.47091674804688, -241.43898010253906, -233.40704345703125, -225.3751220703125, -217.3431854248047, -209.31124877929688, -201.27931213378906, -193.24737548828125, -185.21543884277344, -177.18350219726562, -169.15158081054688, -161.11962890625, -153.08770751953125, -145.05577087402344, -137.02383422851562, -128.9918975830078, -120.9599609375, -112.92803192138672, -104.8960952758789, -96.8641586303711, -88.83222961425781, -80.80029296875, -72.76835632324219, -64.73641967773438, -56.70448684692383, -48.67255401611328, -40.64061737060547, -32.608680725097656, -24.57674789428711, -16.544815063476562, -8.512863159179688, -0.4809284210205078, 7.551006317138672, 15.582941055297852, 23.61487579345703, 31.646812438964844, 39.67874526977539, 47.71067810058594, 55.74261474609375, 63.77455139160156, 71.80648803710938, 79.83841705322266, 87.87035369873047, 95.90229034423828, 103.93421936035156, 111.96615600585938, 119.99809265136719, 128.030029296875, 136.0619659423828, 144.09390258789062, 152.12582397460938, 160.15777587890625, 168.189697265625, 176.2216339111328, 184.25357055664062, 192.28550720214844, 200.31744384765625, 208.34938049316406, 216.38131713867188, 224.41323852539062, 232.44517517089844, 240.47711181640625, 248.50904846191406]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 5.0, 8.0, 12.0, 3.0, 14.0, 12.0, 28.0, 24.0, 24.0, 38.0, 31.0, 46.0, 50.0, 41.0, 43.0, 59.0, 64.0, 60.0, 47.0, 53.0, 42.0, 39.0, 31.0, 27.0, 38.0, 37.0, 22.0, 24.0, 17.0, 13.0, 15.0, 7.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.22595977783203, -100.63916778564453, -97.0523681640625, -93.465576171875, -89.87877655029297, -86.29198455810547, -82.70518493652344, -79.11839294433594, -75.5315933227539, -71.9448013305664, -68.35800170898438, -64.77120971679688, -61.184410095214844, -57.597618103027344, -54.01081848144531, -50.42402648925781, -46.83723068237305, -43.25043487548828, -39.663639068603516, -36.07684326171875, -32.490047454833984, -28.90325355529785, -25.316457748413086, -21.72966194152832, -18.142866134643555, -14.556070327758789, -10.969274520874023, -7.382479667663574, -3.7956838607788086, -0.20888900756835938, 3.3779067993164062, 6.964702606201172, 10.551498413085938, 14.138294219970703, 17.72509002685547, 21.311885833740234, 24.898681640625, 28.485475540161133, 32.07227325439453, 35.65906524658203, 39.24586486816406, 42.83266067504883, 46.419456481933594, 50.00625228881836, 53.593048095703125, 57.179840087890625, 60.766639709472656, 64.35343170166016, 67.94023132324219, 71.52702331542969, 75.11382293701172, 78.70061492919922, 82.28741455078125, 85.87420654296875, 89.46100616455078, 93.04779815673828, 96.63459014892578, 100.22138214111328, 103.80818176269531, 107.39497375488281, 110.98177337646484, 114.56856536865234, 118.15536499023438, 121.74215698242188, 125.3289566040039]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 15.0, 16.0, 23.0, 28.0, 38.0, 83.0, 111.0, 164.0, 227.0, 369.0, 486.0, 667.0, 910.0, 1311.0, 1806.0, 2518.0, 3787.0, 1018730.0, 4957.0, 3724.0, 2466.0, 1759.0, 1225.0, 887.0, 699.0, 463.0, 309.0, 243.0, 149.0, 108.0, 66.0, 56.0, 32.0, 27.0, 25.0, 13.0, 10.0, 15.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.109224319458008, -17.52462387084961, -16.940025329589844, -16.355424880981445, -15.770824432373047, -15.186223983764648, -14.601624488830566, -14.017024993896484, -13.432424545288086, -12.847824096679688, -12.263224601745605, -11.678625106811523, -11.094024658203125, -10.509424209594727, -9.924824714660645, -9.340225219726562, -8.755624771118164, -8.171024322509766, -7.586424827575684, -7.001824855804443, -6.417224884033203, -5.832624912261963, -5.248024940490723, -4.663424968719482, -4.078824996948242, -3.494225025177002, -2.9096250534057617, -2.3250250816345215, -1.7404251098632812, -1.155825138092041, -0.5712251663208008, 0.013374805450439453, 0.5979766845703125, 1.1825766563415527, 1.767176628112793, 2.351776599884033, 2.9363765716552734, 3.5209765434265137, 4.105576515197754, 4.690176486968994, 5.274776458740234, 5.859376430511475, 6.443976402282715, 7.028576374053955, 7.613176345825195, 8.197776794433594, 8.782376289367676, 9.366975784301758, 9.951576232910156, 10.536176681518555, 11.120776176452637, 11.705375671386719, 12.289976119995117, 12.874576568603516, 13.459176063537598, 14.04377555847168, 14.628376007080078, 15.212976455688477, 15.797575950622559, 16.38217544555664, 16.96677589416504, 17.551376342773438, 18.135974884033203, 18.7205753326416, 19.30517578125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 4.0, 10.0, 27.0, 43.0, 46.0, 73.0, 631.0, 51461960.0, 183.0, 54.0, 22.0, 23.0, 19.0, 17.0, 17.0, 17.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6716.453125, -6526.1005859375, -6335.748046875, -6145.3955078125, -5955.04296875, -5764.6904296875, -5574.337890625, -5383.9853515625, -5193.6328125, -5003.2802734375, -4812.927734375, -4622.5751953125, -4432.22265625, -4241.8701171875, -4051.517578125, -3861.1650390625, -3670.812255859375, -3480.459716796875, -3290.107177734375, -3099.754638671875, -2909.402099609375, -2719.049560546875, -2528.69677734375, -2338.34423828125, -2147.99169921875, -1957.63916015625, -1767.28662109375, -1576.93408203125, -1386.58154296875, -1196.22900390625, -1005.8763427734375, -815.5238037109375, -625.17138671875, -434.81884765625, -244.46627807617188, -54.11370849609375, 136.23883056640625, 326.59136962890625, 516.9439697265625, 707.2965087890625, 897.6490478515625, 1088.0015869140625, 1278.3541259765625, 1468.706787109375, 1659.059326171875, 1849.411865234375, 2039.764404296875, 2230.116943359375, 2420.469482421875, 2610.822021484375, 2801.174560546875, 2991.527099609375, 3181.879638671875, 3372.232177734375, 3562.5849609375, 3752.9375, 3943.2900390625, 4133.642578125, 4323.9951171875, 4514.34765625, 4704.7001953125, 4895.052734375, 5085.4052734375, 5275.7578125, 5466.1103515625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 28.0, 20.0, 38.0, 56.0, 81.0, 90.0, 187.0, 331.0, 613.0, 928.0, 1440.0, 2514.0, 3977.0, 6693.0, 11024.0, 18790.0, 32449.0, 56305.0, 100362.0, 183069.0, 338130.0, 896661.0, 3691701.0, 429856.0, 226794.0, 123969.0, 69519.0, 38999.0, 22831.0, 13392.0, 8195.0, 4946.0, 2906.0, 1768.0, 1066.0, 683.0, 366.0, 240.0, 133.0, 74.0, 68.0, 36.0, 25.0, 19.0, 24.0, 11.0, 13.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.896484375, -2.811737060546875, -2.72698974609375, -2.642242431640625, -2.5574951171875, -2.472747802734375, -2.38800048828125, -2.303253173828125, -2.218505859375, -2.133758544921875, -2.04901123046875, -1.964263916015625, -1.8795166015625, -1.794769287109375, -1.71002197265625, -1.625274658203125, -1.54052734375, -1.455780029296875, -1.37103271484375, -1.286285400390625, -1.2015380859375, -1.116790771484375, -1.03204345703125, -0.947296142578125, -0.862548828125, -0.777801513671875, -0.69305419921875, -0.608306884765625, -0.5235595703125, -0.438812255859375, -0.35406494140625, -0.269317626953125, -0.1845703125, -0.099822998046875, -0.01507568359375, 0.069671630859375, 0.1544189453125, 0.239166259765625, 0.32391357421875, 0.408660888671875, 0.493408203125, 0.578155517578125, 0.66290283203125, 0.747650146484375, 0.8323974609375, 0.917144775390625, 1.00189208984375, 1.086639404296875, 1.17138671875, 1.256134033203125, 1.34088134765625, 1.425628662109375, 1.5103759765625, 1.595123291015625, 1.67987060546875, 1.764617919921875, 1.849365234375, 1.934112548828125, 2.01885986328125, 2.103607177734375, 2.1883544921875, 2.273101806640625, 2.35784912109375, 2.442596435546875, 2.52734375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [5.0, 1.0, 9.0, 2.0, 2.0, 6.0, 9.0, 5.0, 11.0, 15.0, 10.0, 22.0, 19.0, 14.0, 32.0, 28.0, 20.0, 24.0, 31.0, 49.0, 36.0, 39.0, 33.0, 50.0, 160.0, 833.0, 129.0, 57.0, 30.0, 37.0, 29.0, 40.0, 33.0, 24.0, 23.0, 25.0, 17.0, 19.0, 15.0, 25.0, 11.0, 15.0, 11.0, 8.0, 10.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5859375, -7.2877197265625, -6.989501953125, -6.6912841796875, -6.39306640625, -6.0948486328125, -5.796630859375, -5.4984130859375, -5.2001953125, -4.9019775390625, -4.603759765625, -4.3055419921875, -4.00732421875, -3.7091064453125, -3.410888671875, -3.1126708984375, -2.814453125, -2.5162353515625, -2.218017578125, -1.9197998046875, -1.62158203125, -1.3233642578125, -1.025146484375, -0.7269287109375, -0.4287109375, -0.1304931640625, 0.167724609375, 0.4659423828125, 0.76416015625, 1.0623779296875, 1.360595703125, 1.6588134765625, 1.95703125, 2.2552490234375, 2.553466796875, 2.8516845703125, 3.14990234375, 3.4481201171875, 3.746337890625, 4.0445556640625, 4.3427734375, 4.6409912109375, 4.939208984375, 5.2374267578125, 5.53564453125, 5.8338623046875, 6.132080078125, 6.4302978515625, 6.728515625, 7.0267333984375, 7.324951171875, 7.6231689453125, 7.92138671875, 8.2196044921875, 8.517822265625, 8.8160400390625, 9.1142578125, 9.4124755859375, 9.710693359375, 10.0089111328125, 10.30712890625, 10.6053466796875, 10.903564453125, 11.2017822265625, 11.5]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 4.0, 10.0, 4.0, 11.0, 20.0, 20.0, 29.0, 59.0, 101.0, 108.0, 159.0, 237.0, 470.0, 727.0, 1107.0, 1729.0, 3002.0, 4910.0, 7945.0, 13542.0, 23741.0, 42113.0, 75161.0, 142563.0, 298651.0, 892467.0, 3905377.0, 450584.0, 195664.0, 100620.0, 55667.0, 30989.0, 17601.0, 10392.0, 6053.0, 3547.0, 2257.0, 1359.0, 875.0, 514.0, 396.0, 243.0, 131.0, 100.0, 64.0, 36.0, 29.0, 16.0, 11.0, 17.0, 2.0, 5.0, 2.0, 3.0], "bins": [-4.22265625, -4.106109619140625, -3.98956298828125, -3.873016357421875, -3.7564697265625, -3.639923095703125, -3.52337646484375, -3.406829833984375, -3.290283203125, -3.173736572265625, -3.05718994140625, -2.940643310546875, -2.8240966796875, -2.707550048828125, -2.59100341796875, -2.474456787109375, -2.35791015625, -2.241363525390625, -2.12481689453125, -2.008270263671875, -1.8917236328125, -1.775177001953125, -1.65863037109375, -1.542083740234375, -1.425537109375, -1.308990478515625, -1.19244384765625, -1.075897216796875, -0.9593505859375, -0.842803955078125, -0.72625732421875, -0.609710693359375, -0.4931640625, -0.376617431640625, -0.26007080078125, -0.143524169921875, -0.0269775390625, 0.089569091796875, 0.20611572265625, 0.322662353515625, 0.439208984375, 0.555755615234375, 0.67230224609375, 0.788848876953125, 0.9053955078125, 1.021942138671875, 1.13848876953125, 1.255035400390625, 1.37158203125, 1.488128662109375, 1.60467529296875, 1.721221923828125, 1.8377685546875, 1.954315185546875, 2.07086181640625, 2.187408447265625, 2.303955078125, 2.420501708984375, 2.53704833984375, 2.653594970703125, 2.7701416015625, 2.886688232421875, 3.00323486328125, 3.119781494140625, 3.236328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 13.0, 18.0, 18.0, 22.0, 18.0, 23.0, 35.0, 25.0, 26.0, 34.0, 36.0, 29.0, 36.0, 55.0, 61.0, 235.0, 720.0, 149.0, 67.0, 45.0, 53.0, 42.0, 19.0, 31.0, 23.0, 31.0, 15.0, 28.0, 21.0, 15.0, 15.0, 7.0, 7.0, 10.0, 3.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.10546875, -6.87890625, -6.65234375, -6.42578125, -6.19921875, -5.97265625, -5.74609375, -5.51953125, -5.29296875, -5.06640625, -4.83984375, -4.61328125, -4.38671875, -4.16015625, -3.93359375, -3.70703125, -3.48046875, -3.25390625, -3.02734375, -2.80078125, -2.57421875, -2.34765625, -2.12109375, -1.89453125, -1.66796875, -1.44140625, -1.21484375, -0.98828125, -0.76171875, -0.53515625, -0.30859375, -0.08203125, 0.14453125, 0.37109375, 0.59765625, 0.82421875, 1.05078125, 1.27734375, 1.50390625, 1.73046875, 1.95703125, 2.18359375, 2.41015625, 2.63671875, 2.86328125, 3.08984375, 3.31640625, 3.54296875, 3.76953125, 3.99609375, 4.22265625, 4.44921875, 4.67578125, 4.90234375, 5.12890625, 5.35546875, 5.58203125, 5.80859375, 6.03515625, 6.26171875, 6.48828125, 6.71484375, 6.94140625, 7.16796875, 7.39453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 12.0, 7.0, 6.0, 5.0, 3.0, 7.0, 13.0, 15.0, 46.0, 56.0, 72.0, 70.0, 96.0, 128.0, 170.0, 213.0, 278.0, 409.0, 561.0, 856.0, 1135.0, 1729.0, 2755.0, 4700.0, 8750.0, 19867.0, 59208.0, 657799.0, 5430880.0, 59506.0, 20109.0, 8772.0, 4668.0, 2744.0, 1737.0, 1093.0, 805.0, 535.0, 418.0, 299.0, 219.0, 168.0, 125.0, 81.0, 89.0, 80.0, 37.0, 21.0, 19.0, 13.0, 13.0, 6.0, 10.0, 12.0, 1.0, 5.0, 5.0, 6.0, 4.0], "bins": [-11.921875, -11.5606689453125, -11.199462890625, -10.8382568359375, -10.47705078125, -10.1158447265625, -9.754638671875, -9.3934326171875, -9.0322265625, -8.6710205078125, -8.309814453125, -7.9486083984375, -7.58740234375, -7.2261962890625, -6.864990234375, -6.5037841796875, -6.142578125, -5.7813720703125, -5.420166015625, -5.0589599609375, -4.69775390625, -4.3365478515625, -3.975341796875, -3.6141357421875, -3.2529296875, -2.8917236328125, -2.530517578125, -2.1693115234375, -1.80810546875, -1.4468994140625, -1.085693359375, -0.7244873046875, -0.36328125, -0.0020751953125, 0.359130859375, 0.7203369140625, 1.08154296875, 1.4427490234375, 1.803955078125, 2.1651611328125, 2.5263671875, 2.8875732421875, 3.248779296875, 3.6099853515625, 3.97119140625, 4.3323974609375, 4.693603515625, 5.0548095703125, 5.416015625, 5.7772216796875, 6.138427734375, 6.4996337890625, 6.86083984375, 7.2220458984375, 7.583251953125, 7.9444580078125, 8.3056640625, 8.6668701171875, 9.028076171875, 9.3892822265625, 9.75048828125, 10.1116943359375, 10.472900390625, 10.8341064453125, 11.1953125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 8.0, 11.0, 13.0, 14.0, 21.0, 22.0, 17.0, 11.0, 18.0, 36.0, 45.0, 38.0, 36.0, 41.0, 47.0, 64.0, 161.0, 529.0, 342.0, 108.0, 67.0, 37.0, 37.0, 37.0, 44.0, 24.0, 22.0, 24.0, 25.0, 26.0, 16.0, 17.0, 13.0, 5.0, 8.0, 10.0, 4.0, 1.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.2667236328125, -5.095947265625, -4.9251708984375, -4.75439453125, -4.5836181640625, -4.412841796875, -4.2420654296875, -4.0712890625, -3.9005126953125, -3.729736328125, -3.5589599609375, -3.38818359375, -3.2174072265625, -3.046630859375, -2.8758544921875, -2.705078125, -2.5343017578125, -2.363525390625, -2.1927490234375, -2.02197265625, -1.8511962890625, -1.680419921875, -1.5096435546875, -1.3388671875, -1.1680908203125, -0.997314453125, -0.8265380859375, -0.65576171875, -0.4849853515625, -0.314208984375, -0.1434326171875, 0.02734375, 0.1981201171875, 0.368896484375, 0.5396728515625, 0.71044921875, 0.8812255859375, 1.052001953125, 1.2227783203125, 1.3935546875, 1.5643310546875, 1.735107421875, 1.9058837890625, 2.07666015625, 2.2474365234375, 2.418212890625, 2.5889892578125, 2.759765625, 2.9305419921875, 3.101318359375, 3.2720947265625, 3.44287109375, 3.6136474609375, 3.784423828125, 3.9552001953125, 4.1259765625, 4.2967529296875, 4.467529296875, 4.6383056640625, 4.80908203125, 4.9798583984375, 5.150634765625, 5.3214111328125, 5.4921875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 38.0, 188.0, 625.0, 119.0, 15.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.082847595214844, -42.47198486328125, -40.86111831665039, -39.2502555847168, -37.63938903808594, -36.028526306152344, -34.41766357421875, -32.80679702758789, -31.195932388305664, -29.585067749023438, -27.97420310974121, -26.363338470458984, -24.75247573852539, -23.14160919189453, -21.530746459960938, -19.91988182067871, -18.309017181396484, -16.698152542114258, -15.087287902832031, -13.476424217224121, -11.865559577941895, -10.254694938659668, -8.643831253051758, -7.032966613769531, -5.422101974487305, -3.8112375736236572, -2.2003731727600098, -0.5895090103149414, 1.0213556289672852, 2.6322202682495117, 4.243083953857422, 5.853948593139648, 7.464813232421875, 9.075677871704102, 10.686542510986328, 12.297406196594238, 13.908270835876465, 15.519135475158691, 17.1299991607666, 18.740863800048828, 20.351728439331055, 21.96259307861328, 23.573457717895508, 25.184322357177734, 26.795185089111328, 28.406051635742188, 30.01691436767578, 31.627779006958008, 33.238643646240234, 34.84950637817383, 36.46037292480469, 38.07123565673828, 39.68210220336914, 41.292964935302734, 42.903831481933594, 44.51469421386719, 46.12555694580078, 47.736419677734375, 49.347286224365234, 50.95814895629883, 52.56901550292969, 54.17987823486328, 55.790740966796875, 57.401607513427734, 59.012474060058594]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 18.0, 6.0, 25.0, 23.0, 27.0, 49.0, 54.0, 62.0, 67.0, 75.0, 85.0, 76.0, 71.0, 78.0, 59.0, 52.0, 43.0, 34.0, 19.0, 18.0, 24.0, 15.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.274150848388672, -7.842296123504639, -7.410440921783447, -6.978586196899414, -6.546731472015381, -6.114876747131348, -5.683021545410156, -5.251166820526123, -4.81931209564209, -4.387457370758057, -3.9556024074554443, -3.523747444152832, -3.091892719268799, -2.6600377559661865, -2.228182792663574, -1.796328067779541, -1.3644728660583496, -0.9326180219650269, -0.5007631182670593, -0.0689082145690918, 0.36294662952423096, 0.7948014736175537, 1.226656436920166, 1.6585111618041992, 2.0903661251068115, 2.522221088409424, 2.954075813293457, 3.3859307765960693, 3.8177857398986816, 4.249640464782715, 4.681495666503906, 5.113349914550781, 5.545205116271973, 5.977059841156006, 6.408915042877197, 6.8407697677612305, 7.272624492645264, 7.704479217529297, 8.136334419250488, 8.56818962097168, 9.000043869018555, 9.431899070739746, 9.863753318786621, 10.295608520507812, 10.727463722229004, 11.159317970275879, 11.59117317199707, 12.023027420043945, 12.454883575439453, 12.886738777160645, 13.31859302520752, 13.750448226928711, 14.182303428649902, 14.614157676696777, 15.046012878417969, 15.477867126464844, 15.909722328186035, 16.341577529907227, 16.7734317779541, 17.20528793334961, 17.637142181396484, 18.06899642944336, 18.500850677490234, 18.932706832885742, 19.364561080932617]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 21.0, 21.0, 37.0, 36.0, 67.0, 118.0, 137.0, 204.0, 314.0, 549.0, 834.0, 1404.0, 2362.0, 4401.0, 9061.0, 22035.0, 82373.0, 3941520.0, 86993.0, 21950.0, 8950.0, 4410.0, 2434.0, 1411.0, 829.0, 554.0, 368.0, 253.0, 137.0, 106.0, 89.0, 53.0, 44.0, 44.0, 24.0, 24.0, 12.0, 12.0, 17.0, 14.0, 8.0, 8.0, 7.0, 7.0, 4.0, 4.0, 4.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1368408203125, -0.13048362731933594, -0.12412643432617188, -0.11776924133300781, -0.11141204833984375, -0.10505485534667969, -0.09869766235351562, -0.09234046936035156, -0.0859832763671875, -0.07962608337402344, -0.07326889038085938, -0.06691169738769531, -0.06055450439453125, -0.05419731140136719, -0.047840118408203125, -0.04148292541503906, -0.035125732421875, -0.028768539428710938, -0.022411346435546875, -0.016054153442382812, -0.00969696044921875, -0.0033397674560546875, 0.003017425537109375, 0.009374618530273438, 0.0157318115234375, 0.022089004516601562, 0.028446197509765625, 0.03480339050292969, 0.04116058349609375, 0.04751777648925781, 0.053874969482421875, 0.06023216247558594, 0.06658935546875, 0.07294654846191406, 0.07930374145507812, 0.08566093444824219, 0.09201812744140625, 0.09837532043457031, 0.10473251342773438, 0.11108970642089844, 0.1174468994140625, 0.12380409240722656, 0.13016128540039062, 0.1365184783935547, 0.14287567138671875, 0.1492328643798828, 0.15559005737304688, 0.16194725036621094, 0.168304443359375, 0.17466163635253906, 0.18101882934570312, 0.1873760223388672, 0.19373321533203125, 0.2000904083251953, 0.20644760131835938, 0.21280479431152344, 0.2191619873046875, 0.22551918029785156, 0.23187637329101562, 0.2382335662841797, 0.24459075927734375, 0.2509479522705078, 0.2573051452636719, 0.26366233825683594, 0.27001953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 18.0, 29.0, 673.0, 151.0, 22.0, 13.0, 11.0, 5.0, 4.0, 6.0, 2.0, 7.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0242156982421875, -0.02298760414123535, -0.021759510040283203, -0.020531415939331055, -0.019303321838378906, -0.018075227737426758, -0.01684713363647461, -0.015619039535522461, -0.014390945434570312, -0.013162851333618164, -0.011934757232666016, -0.010706663131713867, -0.009478569030761719, -0.00825047492980957, -0.007022380828857422, -0.0057942867279052734, -0.004566192626953125, -0.0033380985260009766, -0.002110004425048828, -0.0008819103240966797, 0.00034618377685546875, 0.0015742778778076172, 0.0028023719787597656, 0.004030466079711914, 0.0052585601806640625, 0.006486654281616211, 0.007714748382568359, 0.008942842483520508, 0.010170936584472656, 0.011399030685424805, 0.012627124786376953, 0.013855218887329102, 0.01508331298828125, 0.0163114070892334, 0.017539501190185547, 0.018767595291137695, 0.019995689392089844, 0.021223783493041992, 0.02245187759399414, 0.02367997169494629, 0.024908065795898438, 0.026136159896850586, 0.027364253997802734, 0.028592348098754883, 0.02982044219970703, 0.03104853630065918, 0.03227663040161133, 0.03350472450256348, 0.034732818603515625, 0.03596091270446777, 0.03718900680541992, 0.03841710090637207, 0.03964519500732422, 0.04087328910827637, 0.042101383209228516, 0.043329477310180664, 0.04455757141113281, 0.04578566551208496, 0.04701375961303711, 0.04824185371398926, 0.049469947814941406, 0.050698041915893555, 0.0519261360168457, 0.05315423011779785, 0.05438232421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 11.0, 13.0, 18.0, 27.0, 30.0, 53.0, 72.0, 99.0, 135.0, 217.0, 292.0, 445.0, 692.0, 1203.0, 2025.0, 3897.0, 7939.0, 18331.0, 47394.0, 160354.0, 1017056.0, 2589287.0, 244719.0, 61848.0, 21045.0, 8417.0, 3890.0, 1927.0, 1103.0, 587.0, 398.0, 225.0, 162.0, 94.0, 70.0, 52.0, 37.0, 34.0, 17.0, 17.0, 4.0, 7.0, 8.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.144775390625, -0.14077091217041016, -0.1367664337158203, -0.13276195526123047, -0.12875747680664062, -0.12475299835205078, -0.12074851989746094, -0.1167440414428711, -0.11273956298828125, -0.1087350845336914, -0.10473060607910156, -0.10072612762451172, -0.09672164916992188, -0.09271717071533203, -0.08871269226074219, -0.08470821380615234, -0.0807037353515625, -0.07669925689697266, -0.07269477844238281, -0.06869029998779297, -0.06468582153320312, -0.06068134307861328, -0.05667686462402344, -0.052672386169433594, -0.04866790771484375, -0.044663429260253906, -0.04065895080566406, -0.03665447235107422, -0.032649993896484375, -0.02864551544189453, -0.024641036987304688, -0.020636558532714844, -0.016632080078125, -0.012627601623535156, -0.008623123168945312, -0.004618644714355469, -0.000614166259765625, 0.0033903121948242188, 0.0073947906494140625, 0.011399269104003906, 0.01540374755859375, 0.019408226013183594, 0.023412704467773438, 0.02741718292236328, 0.031421661376953125, 0.03542613983154297, 0.03943061828613281, 0.043435096740722656, 0.0474395751953125, 0.051444053649902344, 0.05544853210449219, 0.05945301055908203, 0.06345748901367188, 0.06746196746826172, 0.07146644592285156, 0.0754709243774414, 0.07947540283203125, 0.0834798812866211, 0.08748435974121094, 0.09148883819580078, 0.09549331665039062, 0.09949779510498047, 0.10350227355957031, 0.10750675201416016, 0.11151123046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 15.0, 13.0, 19.0, 28.0, 30.0, 44.0, 46.0, 73.0, 81.0, 118.0, 143.0, 234.0, 383.0, 941.0, 853.0, 345.0, 229.0, 139.0, 86.0, 60.0, 53.0, 28.0, 29.0, 21.0, 13.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.05672502517700195, -0.055100440979003906, -0.05347585678100586, -0.05185127258300781, -0.050226688385009766, -0.04860210418701172, -0.04697751998901367, -0.045352935791015625, -0.04372835159301758, -0.04210376739501953, -0.040479183197021484, -0.03885459899902344, -0.03723001480102539, -0.035605430603027344, -0.0339808464050293, -0.03235626220703125, -0.030731678009033203, -0.029107093811035156, -0.02748250961303711, -0.025857925415039062, -0.024233341217041016, -0.02260875701904297, -0.020984172821044922, -0.019359588623046875, -0.017735004425048828, -0.01611042022705078, -0.014485836029052734, -0.012861251831054688, -0.01123666763305664, -0.009612083435058594, -0.007987499237060547, -0.0063629150390625, -0.004738330841064453, -0.0031137466430664062, -0.0014891624450683594, 0.0001354217529296875, 0.0017600059509277344, 0.0033845901489257812, 0.005009174346923828, 0.006633758544921875, 0.008258342742919922, 0.009882926940917969, 0.011507511138916016, 0.013132095336914062, 0.01475667953491211, 0.016381263732910156, 0.018005847930908203, 0.01963043212890625, 0.021255016326904297, 0.022879600524902344, 0.02450418472290039, 0.026128768920898438, 0.027753353118896484, 0.02937793731689453, 0.031002521514892578, 0.032627105712890625, 0.03425168991088867, 0.03587627410888672, 0.037500858306884766, 0.03912544250488281, 0.04075002670288086, 0.042374610900878906, 0.04399919509887695, 0.045623779296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 29.0, 53.0, 117.0, 352.0, 321.0, 92.0, 17.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9253787994384766, -1.8869627714157104, -1.8485468626022339, -1.8101308345794678, -1.7717148065567017, -1.7332987785339355, -1.694882869720459, -1.6564668416976929, -1.6180508136749268, -1.5796347856521606, -1.541218876838684, -1.502802848815918, -1.4643868207931519, -1.4259707927703857, -1.3875548839569092, -1.349138855934143, -1.3107229471206665, -1.2723069190979004, -1.2338910102844238, -1.1954749822616577, -1.1570589542388916, -1.118643045425415, -1.080227017402649, -1.0418109893798828, -1.0033950805664062, -0.9649791121482849, -0.9265630841255188, -0.8881471157073975, -0.8497310876846313, -0.81131511926651, -0.7728991508483887, -0.7344831228256226, -0.696067214012146, -0.6576512455940247, -0.6192352175712585, -0.5808192491531372, -0.5424032211303711, -0.5039872527122498, -0.4655712842941284, -0.4271552860736847, -0.38873928785324097, -0.35032328963279724, -0.3119072914123535, -0.2734913229942322, -0.23507532477378845, -0.19665932655334473, -0.1582433432340622, -0.11982735991477966, -0.08141136169433594, -0.04299537092447281, -0.00457938015460968, 0.03383661061525345, 0.07225260138511658, 0.1106685996055603, 0.14908458292484283, 0.18750056624412537, 0.2259165644645691, 0.2643325626850128, 0.30274856090545654, 0.3411645293235779, 0.3795805275440216, 0.41799652576446533, 0.45641249418258667, 0.4948284924030304, 0.5332444906234741]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 11.0, 15.0, 20.0, 36.0, 58.0, 40.0, 67.0, 73.0, 96.0, 90.0, 83.0, 88.0, 82.0, 61.0, 60.0, 47.0, 17.0, 19.0, 10.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6453368663787842, -0.6270866394042969, -0.6088364720344543, -0.590586245059967, -0.5723360776901245, -0.5540858507156372, -0.5358356237411499, -0.5175853967666626, -0.49933522939682007, -0.48108503222465515, -0.46283483505249023, -0.44458460807800293, -0.426334410905838, -0.4080842137336731, -0.3898339867591858, -0.3715837895870209, -0.35333359241485596, -0.33508339524269104, -0.3168331980705261, -0.2985829710960388, -0.2803327739238739, -0.262082576751709, -0.24383236467838287, -0.22558215260505676, -0.20733195543289185, -0.18908175826072693, -0.17083154618740082, -0.1525813341140747, -0.1343311369419098, -0.11608093231916428, -0.09783072769641876, -0.07958051562309265, -0.06133037805557251, -0.043080173432826996, -0.024829968810081482, -0.006579764187335968, 0.011670440435409546, 0.02992064505815506, 0.048170849680900574, 0.06642106175422668, 0.0846712589263916, 0.10292146354913712, 0.12117166817188263, 0.13942188024520874, 0.15767207741737366, 0.17592227458953857, 0.19417248666286469, 0.2124226987361908, 0.2306728959083557, 0.24892309308052063, 0.26717329025268555, 0.28542351722717285, 0.30367371439933777, 0.3219239115715027, 0.34017413854599, 0.3584243357181549, 0.3766745328903198, 0.39492473006248474, 0.41317492723464966, 0.43142515420913696, 0.4496753513813019, 0.4679255485534668, 0.4861757755279541, 0.5044260025024414, 0.5226761698722839]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 19.0, 22.0, 37.0, 48.0, 59.0, 103.0, 153.0, 228.0, 343.0, 455.0, 699.0, 1045.0, 1689.0, 2922.0, 5120.0, 9839.0, 25150.0, 145913.0, 738713.0, 78233.0, 18414.0, 8077.0, 4290.0, 2467.0, 1568.0, 986.0, 628.0, 418.0, 269.0, 214.0, 110.0, 88.0, 61.0, 47.0, 38.0, 24.0, 16.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.160400390625, -0.15586471557617188, -0.15132904052734375, -0.14679336547851562, -0.1422576904296875, -0.13772201538085938, -0.13318634033203125, -0.12865066528320312, -0.124114990234375, -0.11957931518554688, -0.11504364013671875, -0.11050796508789062, -0.1059722900390625, -0.10143661499023438, -0.09690093994140625, -0.09236526489257812, -0.08782958984375, -0.08329391479492188, -0.07875823974609375, -0.07422256469726562, -0.0696868896484375, -0.06515121459960938, -0.06061553955078125, -0.056079864501953125, -0.051544189453125, -0.047008514404296875, -0.04247283935546875, -0.037937164306640625, -0.0334014892578125, -0.028865814208984375, -0.02433013916015625, -0.019794464111328125, -0.0152587890625, -0.010723114013671875, -0.00618743896484375, -0.001651763916015625, 0.0028839111328125, 0.007419586181640625, 0.01195526123046875, 0.016490936279296875, 0.021026611328125, 0.025562286376953125, 0.03009796142578125, 0.034633636474609375, 0.0391693115234375, 0.043704986572265625, 0.04824066162109375, 0.052776336669921875, 0.05731201171875, 0.061847686767578125, 0.06638336181640625, 0.07091903686523438, 0.0754547119140625, 0.07999038696289062, 0.08452606201171875, 0.08906173706054688, 0.093597412109375, 0.09813308715820312, 0.10266876220703125, 0.10720443725585938, 0.1117401123046875, 0.11627578735351562, 0.12081146240234375, 0.12534713745117188, 0.1298828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 9.0, 19.0, 33.0, 56.0, 94.0, 183.0, 200.0, 151.0, 94.0, 53.0, 24.0, 9.0, 5.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.02879643440246582, -0.02792978286743164, -0.02706313133239746, -0.02619647979736328, -0.0253298282623291, -0.024463176727294922, -0.023596525192260742, -0.022729873657226562, -0.021863222122192383, -0.020996570587158203, -0.020129919052124023, -0.019263267517089844, -0.018396615982055664, -0.017529964447021484, -0.016663312911987305, -0.015796661376953125, -0.014930009841918945, -0.014063358306884766, -0.013196706771850586, -0.012330055236816406, -0.011463403701782227, -0.010596752166748047, -0.009730100631713867, -0.008863449096679688, -0.007996797561645508, -0.007130146026611328, -0.0062634944915771484, -0.005396842956542969, -0.004530191421508789, -0.0036635398864746094, -0.0027968883514404297, -0.00193023681640625, -0.0010635852813720703, -0.00019693374633789062, 0.0006697177886962891, 0.0015363693237304688, 0.0024030208587646484, 0.003269672393798828, 0.004136323928833008, 0.0050029754638671875, 0.005869626998901367, 0.006736278533935547, 0.0076029300689697266, 0.008469581604003906, 0.009336233139038086, 0.010202884674072266, 0.011069536209106445, 0.011936187744140625, 0.012802839279174805, 0.013669490814208984, 0.014536142349243164, 0.015402793884277344, 0.016269445419311523, 0.017136096954345703, 0.018002748489379883, 0.018869400024414062, 0.019736051559448242, 0.020602703094482422, 0.0214693546295166, 0.02233600616455078, 0.02320265769958496, 0.02406930923461914, 0.02493596076965332, 0.0258026123046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 8.0, 13.0, 25.0, 26.0, 40.0, 48.0, 63.0, 127.0, 218.0, 395.0, 752.0, 1629.0, 4396.0, 15903.0, 104931.0, 754862.0, 137159.0, 19237.0, 5024.0, 1843.0, 758.0, 420.0, 209.0, 129.0, 86.0, 67.0, 43.0, 32.0, 25.0, 14.0, 7.0, 10.0, 10.0, 9.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2218017578125, -0.21344947814941406, -0.20509719848632812, -0.1967449188232422, -0.18839263916015625, -0.1800403594970703, -0.17168807983398438, -0.16333580017089844, -0.1549835205078125, -0.14663124084472656, -0.13827896118164062, -0.1299266815185547, -0.12157440185546875, -0.11322212219238281, -0.10486984252929688, -0.09651756286621094, -0.088165283203125, -0.07981300354003906, -0.07146072387695312, -0.06310844421386719, -0.05475616455078125, -0.04640388488769531, -0.038051605224609375, -0.029699325561523438, -0.0213470458984375, -0.012994766235351562, -0.004642486572265625, 0.0037097930908203125, 0.01206207275390625, 0.020414352416992188, 0.028766632080078125, 0.03711891174316406, 0.04547119140625, 0.05382347106933594, 0.062175750732421875, 0.07052803039550781, 0.07888031005859375, 0.08723258972167969, 0.09558486938476562, 0.10393714904785156, 0.1122894287109375, 0.12064170837402344, 0.12899398803710938, 0.1373462677001953, 0.14569854736328125, 0.1540508270263672, 0.16240310668945312, 0.17075538635253906, 0.179107666015625, 0.18745994567871094, 0.19581222534179688, 0.2041645050048828, 0.21251678466796875, 0.2208690643310547, 0.22922134399414062, 0.23757362365722656, 0.2459259033203125, 0.25427818298339844, 0.2626304626464844, 0.2709827423095703, 0.27933502197265625, 0.2876873016357422, 0.2960395812988281, 0.30439186096191406, 0.312744140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 11.0, 6.0, 7.0, 13.0, 18.0, 27.0, 19.0, 24.0, 26.0, 33.0, 31.0, 29.0, 50.0, 39.0, 40.0, 47.0, 48.0, 37.0, 44.0, 35.0, 44.0, 56.0, 43.0, 31.0, 39.0, 35.0, 34.0, 22.0, 13.0, 20.0, 14.0, 13.0, 3.0, 10.0, 7.0, 4.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11865234375, -0.11455917358398438, -0.11046600341796875, -0.10637283325195312, -0.1022796630859375, -0.09818649291992188, -0.09409332275390625, -0.09000015258789062, -0.085906982421875, -0.08181381225585938, -0.07772064208984375, -0.07362747192382812, -0.0695343017578125, -0.06544113159179688, -0.06134796142578125, -0.057254791259765625, -0.05316162109375, -0.049068450927734375, -0.04497528076171875, -0.040882110595703125, -0.0367889404296875, -0.032695770263671875, -0.02860260009765625, -0.024509429931640625, -0.020416259765625, -0.016323089599609375, -0.01222991943359375, -0.008136749267578125, -0.0040435791015625, 4.9591064453125e-05, 0.00414276123046875, 0.008235931396484375, 0.0123291015625, 0.016422271728515625, 0.02051544189453125, 0.024608612060546875, 0.0287017822265625, 0.032794952392578125, 0.03688812255859375, 0.040981292724609375, 0.045074462890625, 0.049167633056640625, 0.05326080322265625, 0.057353973388671875, 0.0614471435546875, 0.06554031372070312, 0.06963348388671875, 0.07372665405273438, 0.07781982421875, 0.08191299438476562, 0.08600616455078125, 0.09009933471679688, 0.0941925048828125, 0.09828567504882812, 0.10237884521484375, 0.10647201538085938, 0.110565185546875, 0.11465835571289062, 0.11875152587890625, 0.12284469604492188, 0.1269378662109375, 0.13103103637695312, 0.13512420654296875, 0.13921737670898438, 0.143310546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 3.0, 8.0, 14.0, 13.0, 34.0, 40.0, 110.0, 257.0, 865.0, 7493.0, 1026828.0, 11301.0, 1056.0, 276.0, 101.0, 53.0, 32.0, 16.0, 18.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9426116943359375, -0.914520263671875, -0.8864288330078125, -0.85833740234375, -0.8302459716796875, -0.802154541015625, -0.7740631103515625, -0.7459716796875, -0.7178802490234375, -0.689788818359375, -0.6616973876953125, -0.63360595703125, -0.6055145263671875, -0.577423095703125, -0.5493316650390625, -0.521240234375, -0.4931488037109375, -0.465057373046875, -0.4369659423828125, -0.40887451171875, -0.3807830810546875, -0.352691650390625, -0.3246002197265625, -0.2965087890625, -0.2684173583984375, -0.240325927734375, -0.2122344970703125, -0.18414306640625, -0.1560516357421875, -0.127960205078125, -0.0998687744140625, -0.07177734375, -0.0436859130859375, -0.015594482421875, 0.0124969482421875, 0.04058837890625, 0.0686798095703125, 0.096771240234375, 0.1248626708984375, 0.1529541015625, 0.1810455322265625, 0.209136962890625, 0.2372283935546875, 0.26531982421875, 0.2934112548828125, 0.321502685546875, 0.3495941162109375, 0.377685546875, 0.4057769775390625, 0.433868408203125, 0.4619598388671875, 0.49005126953125, 0.5181427001953125, 0.546234130859375, 0.5743255615234375, 0.6024169921875, 0.6305084228515625, 0.658599853515625, 0.6866912841796875, 0.71478271484375, 0.7428741455078125, 0.770965576171875, 0.7990570068359375, 0.8271484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 4.0, 7.0, 9.0, 15.0, 8.0, 6.0, 17.0, 15.0, 19.0, 42.0, 40.0, 51.0, 96.0, 120.0, 151.0, 107.0, 70.0, 45.0, 48.0, 27.0, 16.0, 16.0, 12.0, 8.0, 9.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005564689636230469, -0.0005392804741859436, -0.0005220919847488403, -0.0005049034953117371, -0.0004877150058746338, -0.0004705265164375305, -0.00045333802700042725, -0.000436149537563324, -0.0004189610481262207, -0.00040177255868911743, -0.00038458406925201416, -0.0003673955798149109, -0.0003502070903778076, -0.00033301860094070435, -0.0003158301115036011, -0.0002986416220664978, -0.00028145313262939453, -0.00026426464319229126, -0.000247076153755188, -0.00022988766431808472, -0.00021269917488098145, -0.00019551068544387817, -0.0001783221960067749, -0.00016113370656967163, -0.00014394521713256836, -0.0001267567276954651, -0.00010956823825836182, -9.237974882125854e-05, -7.519125938415527e-05, -5.8002769947052e-05, -4.081428050994873e-05, -2.362579107284546e-05, -6.4373016357421875e-06, 1.0751187801361084e-05, 2.7939677238464355e-05, 4.512816667556763e-05, 6.23166561126709e-05, 7.950514554977417e-05, 9.669363498687744e-05, 0.00011388212442398071, 0.00013107061386108398, 0.00014825910329818726, 0.00016544759273529053, 0.0001826360821723938, 0.00019982457160949707, 0.00021701306104660034, 0.0002342015504837036, 0.0002513900399208069, 0.00026857852935791016, 0.00028576701879501343, 0.0003029555082321167, 0.00032014399766921997, 0.00033733248710632324, 0.0003545209765434265, 0.0003717094659805298, 0.00038889795541763306, 0.00040608644485473633, 0.0004232749342918396, 0.00044046342372894287, 0.00045765191316604614, 0.0004748404026031494, 0.0004920288920402527, 0.000509217381477356, 0.0005264058709144592, 0.0005435943603515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 10.0, 8.0, 12.0, 14.0, 36.0, 52.0, 95.0, 159.0, 295.0, 596.0, 1236.0, 2857.0, 7654.0, 25860.0, 153841.0, 735716.0, 90884.0, 18611.0, 6092.0, 2346.0, 1023.0, 512.0, 283.0, 117.0, 86.0, 66.0, 26.0, 19.0, 19.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2069091796875, -0.20106124877929688, -0.19521331787109375, -0.18936538696289062, -0.1835174560546875, -0.17766952514648438, -0.17182159423828125, -0.16597366333007812, -0.160125732421875, -0.15427780151367188, -0.14842987060546875, -0.14258193969726562, -0.1367340087890625, -0.13088607788085938, -0.12503814697265625, -0.11919021606445312, -0.11334228515625, -0.10749435424804688, -0.10164642333984375, -0.09579849243164062, -0.0899505615234375, -0.08410263061523438, -0.07825469970703125, -0.07240676879882812, -0.066558837890625, -0.060710906982421875, -0.05486297607421875, -0.049015045166015625, -0.0431671142578125, -0.037319183349609375, -0.03147125244140625, -0.025623321533203125, -0.019775390625, -0.013927459716796875, -0.00807952880859375, -0.002231597900390625, 0.0036163330078125, 0.009464263916015625, 0.01531219482421875, 0.021160125732421875, 0.027008056640625, 0.032855987548828125, 0.03870391845703125, 0.044551849365234375, 0.0503997802734375, 0.056247711181640625, 0.06209564208984375, 0.06794357299804688, 0.07379150390625, 0.07963943481445312, 0.08548736572265625, 0.09133529663085938, 0.0971832275390625, 0.10303115844726562, 0.10887908935546875, 0.11472702026367188, 0.120574951171875, 0.12642288208007812, 0.13227081298828125, 0.13811874389648438, 0.1439666748046875, 0.14981460571289062, 0.15566253662109375, 0.16151046752929688, 0.1673583984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 1.0, 7.0, 7.0, 6.0, 6.0, 16.0, 9.0, 19.0, 24.0, 21.0, 39.0, 55.0, 70.0, 74.0, 95.0, 104.0, 106.0, 77.0, 68.0, 40.0, 25.0, 30.0, 26.0, 15.0, 8.0, 7.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.13829994201660156, -0.13402175903320312, -0.1297435760498047, -0.12546539306640625, -0.12118721008300781, -0.11690902709960938, -0.11263084411621094, -0.1083526611328125, -0.10407447814941406, -0.09979629516601562, -0.09551811218261719, -0.09123992919921875, -0.08696174621582031, -0.08268356323242188, -0.07840538024902344, -0.074127197265625, -0.06984901428222656, -0.06557083129882812, -0.06129264831542969, -0.05701446533203125, -0.05273628234863281, -0.048458099365234375, -0.04417991638183594, -0.0399017333984375, -0.03562355041503906, -0.031345367431640625, -0.027067184448242188, -0.02278900146484375, -0.018510818481445312, -0.014232635498046875, -0.009954452514648438, -0.00567626953125, -0.0013980865478515625, 0.002880096435546875, 0.0071582794189453125, 0.01143646240234375, 0.015714645385742188, 0.019992828369140625, 0.024271011352539062, 0.0285491943359375, 0.03282737731933594, 0.037105560302734375, 0.04138374328613281, 0.04566192626953125, 0.04994010925292969, 0.054218292236328125, 0.05849647521972656, 0.062774658203125, 0.06705284118652344, 0.07133102416992188, 0.07560920715332031, 0.07988739013671875, 0.08416557312011719, 0.08844375610351562, 0.09272193908691406, 0.0970001220703125, 0.10127830505371094, 0.10555648803710938, 0.10983467102050781, 0.11411285400390625, 0.11839103698730469, 0.12266921997070312, 0.12694740295410156, 0.1312255859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 12.0, 12.0, 21.0, 40.0, 127.0, 380.0, 273.0, 80.0, 18.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3472275733947754, -3.2589545249938965, -3.1706812381744385, -3.0824081897735596, -2.9941349029541016, -2.9058618545532227, -2.8175888061523438, -2.7293155193328857, -2.6410422325134277, -2.552769184112549, -2.464495897293091, -2.376222848892212, -2.287949562072754, -2.199676513671875, -2.111403465270996, -2.023130178451538, -1.9348571300506592, -1.8465839624404907, -1.7583107948303223, -1.6700377464294434, -1.5817644596099854, -1.4934914112091064, -1.405218243598938, -1.3169450759887695, -1.228671908378601, -1.1403987407684326, -1.0521255731582642, -0.9638524651527405, -0.875579297542572, -0.7873061299324036, -0.6990330219268799, -0.6107598543167114, -0.522486686706543, -0.4342135190963745, -0.34594038128852844, -0.2576672434806824, -0.16939407587051392, -0.08112090826034546, 0.007152199745178223, 0.09542536735534668, 0.18369853496551514, 0.2719717025756836, 0.36024484038352966, 0.44851797819137573, 0.5367911458015442, 0.6250643134117126, 0.7133374214172363, 0.8016105890274048, 0.8898837566375732, 0.9781569242477417, 1.0664300918579102, 1.154703140258789, 1.242976427078247, 1.331249475479126, 1.4195226430892944, 1.507795810699463, 1.5960689783096313, 1.6843421459197998, 1.7726153135299683, 1.8608884811401367, 1.9491615295410156, 2.0374348163604736, 2.1257078647613525, 2.2139811515808105, 2.3022541999816895]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 3.0, 12.0, 17.0, 15.0, 36.0, 39.0, 64.0, 87.0, 144.0, 144.0, 130.0, 94.0, 61.0, 45.0, 26.0, 22.0, 13.0, 6.0, 3.0, 3.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3614094257354736, -2.283756971359253, -2.206104278564453, -2.1284518241882324, -2.0507993698120117, -1.9731467962265015, -1.8954942226409912, -1.8178417682647705, -1.7401891946792603, -1.66253662109375, -1.5848841667175293, -1.507231593132019, -1.4295790195465088, -1.351926565170288, -1.2742739915847778, -1.1966214179992676, -1.1189689636230469, -1.0413163900375366, -0.9636639356613159, -0.8860113620758057, -0.8083588480949402, -0.7307063341140747, -0.6530537605285645, -0.575401246547699, -0.4977487325668335, -0.420096218585968, -0.34244367480278015, -0.2647911310195923, -0.1871386170387268, -0.10948610305786133, -0.03183355927467346, 0.045818984508514404, 0.12347173690795898, 0.20112426578998566, 0.27877679467201233, 0.3564293384552002, 0.4340818524360657, 0.5117343664169312, 0.5893869400024414, 0.6670394539833069, 0.7446919679641724, 0.8223444819450378, 0.8999969959259033, 0.9776495695114136, 1.0553021430969238, 1.1329545974731445, 1.2106071710586548, 1.288259744644165, 1.3659121990203857, 1.443564772605896, 1.5212172269821167, 1.598869800567627, 1.6765222549438477, 1.754174828529358, 1.8318274021148682, 1.9094798564910889, 1.9871324300765991, 2.0647850036621094, 2.14243745803833, 2.220089912414551, 2.2977426052093506, 2.3753950595855713, 2.453047513961792, 2.530700206756592, 2.6083526611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 11.0, 7.0, 6.0, 27.0, 29.0, 47.0, 122.0, 2998.0, 4185167.0, 5289.0, 379.0, 105.0, 43.0, 22.0, 10.0, 11.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.405548095703125, -1.29351806640625, -1.181488037109375, -1.0694580078125, -0.957427978515625, -0.84539794921875, -0.733367919921875, -0.621337890625, -0.509307861328125, -0.39727783203125, -0.285247802734375, -0.1732177734375, -0.061187744140625, 0.05084228515625, 0.162872314453125, 0.27490234375, 0.386932373046875, 0.49896240234375, 0.610992431640625, 0.7230224609375, 0.835052490234375, 0.94708251953125, 1.059112548828125, 1.171142578125, 1.283172607421875, 1.39520263671875, 1.507232666015625, 1.6192626953125, 1.731292724609375, 1.84332275390625, 1.955352783203125, 2.0673828125, 2.179412841796875, 2.29144287109375, 2.403472900390625, 2.5155029296875, 2.627532958984375, 2.73956298828125, 2.851593017578125, 2.963623046875, 3.075653076171875, 3.18768310546875, 3.299713134765625, 3.4117431640625, 3.523773193359375, 3.63580322265625, 3.747833251953125, 3.85986328125, 3.971893310546875, 4.08392333984375, 4.195953369140625, 4.3079833984375, 4.420013427734375, 4.53204345703125, 4.644073486328125, 4.756103515625, 4.868133544921875, 4.98016357421875, 5.092193603515625, 5.2042236328125, 5.316253662109375, 5.42828369140625, 5.540313720703125, 5.65234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 24.0, 22.0, 47.0, 49.0, 67.0, 106.0, 127.0, 127.0, 101.0, 98.0, 66.0, 35.0, 18.0, 22.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021209716796875, -0.020504474639892578, -0.019799232482910156, -0.019093990325927734, -0.018388748168945312, -0.01768350601196289, -0.01697826385498047, -0.016273021697998047, -0.015567779541015625, -0.014862537384033203, -0.014157295227050781, -0.01345205307006836, -0.012746810913085938, -0.012041568756103516, -0.011336326599121094, -0.010631084442138672, -0.00992584228515625, -0.009220600128173828, -0.008515357971191406, -0.007810115814208984, -0.0071048736572265625, -0.006399631500244141, -0.005694389343261719, -0.004989147186279297, -0.004283905029296875, -0.003578662872314453, -0.0028734207153320312, -0.0021681785583496094, -0.0014629364013671875, -0.0007576942443847656, -5.245208740234375e-05, 0.0006527900695800781, 0.0013580322265625, 0.002063274383544922, 0.0027685165405273438, 0.0034737586975097656, 0.0041790008544921875, 0.004884243011474609, 0.005589485168457031, 0.006294727325439453, 0.006999969482421875, 0.007705211639404297, 0.008410453796386719, 0.00911569595336914, 0.009820938110351562, 0.010526180267333984, 0.011231422424316406, 0.011936664581298828, 0.01264190673828125, 0.013347148895263672, 0.014052391052246094, 0.014757633209228516, 0.015462875366210938, 0.01616811752319336, 0.01687335968017578, 0.017578601837158203, 0.018283843994140625, 0.018989086151123047, 0.01969432830810547, 0.02039957046508789, 0.021104812622070312, 0.021810054779052734, 0.022515296936035156, 0.023220539093017578, 0.02392578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 10.0, 12.0, 16.0, 25.0, 29.0, 52.0, 69.0, 89.0, 152.0, 224.0, 380.0, 760.0, 1982.0, 6542.0, 36068.0, 3441911.0, 674399.0, 23968.0, 4925.0, 1510.0, 610.0, 258.0, 128.0, 63.0, 33.0, 20.0, 8.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0], "bins": [-0.7333984375, -0.7177619934082031, -0.7021255493164062, -0.6864891052246094, -0.6708526611328125, -0.6552162170410156, -0.6395797729492188, -0.6239433288574219, -0.608306884765625, -0.5926704406738281, -0.5770339965820312, -0.5613975524902344, -0.5457611083984375, -0.5301246643066406, -0.5144882202148438, -0.4988517761230469, -0.48321533203125, -0.4675788879394531, -0.45194244384765625, -0.4363059997558594, -0.4206695556640625, -0.4050331115722656, -0.38939666748046875, -0.3737602233886719, -0.358123779296875, -0.3424873352050781, -0.32685089111328125, -0.3112144470214844, -0.2955780029296875, -0.2799415588378906, -0.26430511474609375, -0.24866867065429688, -0.2330322265625, -0.21739578247070312, -0.20175933837890625, -0.18612289428710938, -0.1704864501953125, -0.15485000610351562, -0.13921356201171875, -0.12357711791992188, -0.107940673828125, -0.09230422973632812, -0.07666778564453125, -0.061031341552734375, -0.0453948974609375, -0.029758453369140625, -0.01412200927734375, 0.001514434814453125, 0.01715087890625, 0.032787322998046875, 0.04842376708984375, 0.06406021118164062, 0.0796966552734375, 0.09533309936523438, 0.11096954345703125, 0.12660598754882812, 0.142242431640625, 0.15787887573242188, 0.17351531982421875, 0.18915176391601562, 0.2047882080078125, 0.22042465209960938, 0.23606109619140625, 0.2516975402832031, 0.267333984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 7.0, 9.0, 6.0, 6.0, 8.0, 14.0, 16.0, 29.0, 48.0, 72.0, 160.0, 499.0, 2061.0, 616.0, 204.0, 103.0, 72.0, 50.0, 23.0, 19.0, 15.0, 2.0, 8.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06159639358520508, -0.059960365295410156, -0.058324337005615234, -0.05668830871582031, -0.05505228042602539, -0.05341625213623047, -0.05178022384643555, -0.050144195556640625, -0.0485081672668457, -0.04687213897705078, -0.04523611068725586, -0.04360008239746094, -0.041964054107666016, -0.040328025817871094, -0.03869199752807617, -0.03705596923828125, -0.03541994094848633, -0.033783912658691406, -0.032147884368896484, -0.030511856079101562, -0.02887582778930664, -0.02723979949951172, -0.025603771209716797, -0.023967742919921875, -0.022331714630126953, -0.02069568634033203, -0.01905965805053711, -0.017423629760742188, -0.015787601470947266, -0.014151573181152344, -0.012515544891357422, -0.0108795166015625, -0.009243488311767578, -0.007607460021972656, -0.005971431732177734, -0.0043354034423828125, -0.0026993751525878906, -0.0010633468627929688, 0.0005726814270019531, 0.002208709716796875, 0.003844738006591797, 0.005480766296386719, 0.007116794586181641, 0.008752822875976562, 0.010388851165771484, 0.012024879455566406, 0.013660907745361328, 0.01529693603515625, 0.016932964324951172, 0.018568992614746094, 0.020205020904541016, 0.021841049194335938, 0.02347707748413086, 0.02511310577392578, 0.026749134063720703, 0.028385162353515625, 0.030021190643310547, 0.03165721893310547, 0.03329324722290039, 0.03492927551269531, 0.036565303802490234, 0.038201332092285156, 0.03983736038208008, 0.041473388671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 42.0, 745.0, 204.0, 16.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.72111701965332, -4.6379780769348145, -4.554839611053467, -4.471700668334961, -4.388562202453613, -4.305423259735107, -4.222284317016602, -4.139145851135254, -4.056006908416748, -3.9728682041168213, -3.8897294998168945, -3.8065905570983887, -3.723451852798462, -3.640313148498535, -3.5571744441986084, -3.4740357398986816, -3.390897035598755, -3.307758331298828, -3.2246196269989014, -3.1414806842803955, -3.0583419799804688, -2.975203275680542, -2.8920645713806152, -2.8089258670806885, -2.7257871627807617, -2.642648458480835, -2.559509754180908, -2.4763708114624023, -2.3932321071624756, -2.310093402862549, -2.226954698562622, -2.1438159942626953, -2.0606768131256104, -1.9775381088256836, -1.8943992853164673, -1.8112605810165405, -1.7281217575073242, -1.6449830532073975, -1.5618443489074707, -1.478705644607544, -1.3955669403076172, -1.3124282360076904, -1.2292894124984741, -1.1461507081985474, -1.063011884689331, -0.9798731803894043, -0.8967344760894775, -0.813595712184906, -0.7304568886756897, -0.6473181247711182, -0.5641794204711914, -0.4810406565666199, -0.39790189266204834, -0.3147631287574768, -0.23162439465522766, -0.14848566055297852, -0.06534689664840698, 0.017791852355003357, 0.1009306013584137, 0.18406935036182404, 0.2672080993652344, 0.3503468632698059, 0.43348559737205505, 0.5166243314743042, 0.5997630953788757]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 15.0, 16.0, 23.0, 38.0, 43.0, 67.0, 74.0, 73.0, 75.0, 59.0, 79.0, 80.0, 63.0, 59.0, 47.0, 52.0, 32.0, 31.0, 19.0, 5.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26728546619415283, -0.2590864300727844, -0.250887393951416, -0.2426883578300476, -0.2344893217086792, -0.2262902855873108, -0.21809124946594238, -0.20989221334457397, -0.20169317722320557, -0.19349414110183716, -0.18529510498046875, -0.17709606885910034, -0.16889703273773193, -0.16069799661636353, -0.15249896049499512, -0.1442999243736267, -0.1361008733510971, -0.1279018372297287, -0.11970280110836029, -0.11150376498699188, -0.10330472886562347, -0.09510569274425507, -0.08690664917230606, -0.07870761305093765, -0.07050857692956924, -0.062309540808200836, -0.05411050468683243, -0.04591146484017372, -0.03771242871880531, -0.029513392597436905, -0.021314352750778198, -0.01311531662940979, -0.004916280508041382, 0.003282756544649601, 0.011481793597340584, 0.01968083158135414, 0.02787986770272255, 0.03607890382409096, 0.044277943670749664, 0.05247697979211807, 0.06067601591348648, 0.06887505203485489, 0.0770740881562233, 0.0852731317281723, 0.09347216784954071, 0.10167120397090912, 0.10987024009227753, 0.11806927621364594, 0.12626831233501434, 0.13446734845638275, 0.14266638457775116, 0.15086542069911957, 0.15906445682048798, 0.16726349294185638, 0.175462543964386, 0.1836615800857544, 0.1918606162071228, 0.2000596523284912, 0.20825868844985962, 0.21645772457122803, 0.22465676069259644, 0.23285579681396484, 0.24105483293533325, 0.24925386905670166, 0.25745290517807007]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 6.0, 12.0, 17.0, 22.0, 31.0, 44.0, 68.0, 91.0, 166.0, 274.0, 431.0, 693.0, 1284.0, 2393.0, 5092.0, 11514.0, 31402.0, 118720.0, 601902.0, 202058.0, 44150.0, 15129.0, 6402.0, 2956.0, 1552.0, 841.0, 475.0, 294.0, 203.0, 102.0, 71.0, 53.0, 35.0, 26.0, 12.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1466064453125, -0.14182281494140625, -0.1370391845703125, -0.13225555419921875, -0.127471923828125, -0.12268829345703125, -0.1179046630859375, -0.11312103271484375, -0.10833740234375, -0.10355377197265625, -0.0987701416015625, -0.09398651123046875, -0.089202880859375, -0.08441925048828125, -0.0796356201171875, -0.07485198974609375, -0.070068359375, -0.06528472900390625, -0.0605010986328125, -0.05571746826171875, -0.050933837890625, -0.04615020751953125, -0.0413665771484375, -0.03658294677734375, -0.03179931640625, -0.02701568603515625, -0.0222320556640625, -0.01744842529296875, -0.012664794921875, -0.00788116455078125, -0.0030975341796875, 0.00168609619140625, 0.0064697265625, 0.01125335693359375, 0.0160369873046875, 0.02082061767578125, 0.025604248046875, 0.03038787841796875, 0.0351715087890625, 0.03995513916015625, 0.04473876953125, 0.04952239990234375, 0.0543060302734375, 0.05908966064453125, 0.063873291015625, 0.06865692138671875, 0.0734405517578125, 0.07822418212890625, 0.0830078125, 0.08779144287109375, 0.0925750732421875, 0.09735870361328125, 0.102142333984375, 0.10692596435546875, 0.1117095947265625, 0.11649322509765625, 0.12127685546875, 0.12606048583984375, 0.1308441162109375, 0.13562774658203125, 0.140411376953125, 0.14519500732421875, 0.1499786376953125, 0.15476226806640625, 0.1595458984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 9.0, 4.0, 5.0, 1.0, 8.0, 5.0, 14.0, 22.0, 20.0, 29.0, 28.0, 54.0, 72.0, 71.0, 84.0, 89.0, 84.0, 107.0, 72.0, 47.0, 47.0, 36.0, 13.0, 17.0, 20.0, 12.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152130126953125, -0.01468515396118164, -0.014157295227050781, -0.013629436492919922, -0.013101577758789062, -0.012573719024658203, -0.012045860290527344, -0.011518001556396484, -0.010990142822265625, -0.010462284088134766, -0.009934425354003906, -0.009406566619873047, -0.008878707885742188, -0.008350849151611328, -0.007822990417480469, -0.007295131683349609, -0.00676727294921875, -0.006239414215087891, -0.005711555480957031, -0.005183696746826172, -0.0046558380126953125, -0.004127979278564453, -0.0036001205444335938, -0.0030722618103027344, -0.002544403076171875, -0.0020165443420410156, -0.0014886856079101562, -0.0009608268737792969, -0.0004329681396484375, 9.489059448242188e-05, 0.0006227493286132812, 0.0011506080627441406, 0.001678466796875, 0.0022063255310058594, 0.0027341842651367188, 0.003262042999267578, 0.0037899017333984375, 0.004317760467529297, 0.004845619201660156, 0.005373477935791016, 0.005901336669921875, 0.006429195404052734, 0.006957054138183594, 0.007484912872314453, 0.008012771606445312, 0.008540630340576172, 0.009068489074707031, 0.00959634780883789, 0.01012420654296875, 0.01065206527709961, 0.011179924011230469, 0.011707782745361328, 0.012235641479492188, 0.012763500213623047, 0.013291358947753906, 0.013819217681884766, 0.014347076416015625, 0.014874935150146484, 0.015402793884277344, 0.015930652618408203, 0.016458511352539062, 0.016986370086669922, 0.01751422882080078, 0.01804208755493164, 0.0185699462890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 15.0, 31.0, 52.0, 216.0, 1474.0, 29885.0, 898169.0, 114378.0, 3715.0, 383.0, 90.0, 31.0, 19.0, 9.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.50439453125, -0.4902534484863281, -0.47611236572265625, -0.4619712829589844, -0.4478302001953125, -0.4336891174316406, -0.41954803466796875, -0.4054069519042969, -0.391265869140625, -0.3771247863769531, -0.36298370361328125, -0.3488426208496094, -0.3347015380859375, -0.3205604553222656, -0.30641937255859375, -0.2922782897949219, -0.27813720703125, -0.2639961242675781, -0.24985504150390625, -0.23571395874023438, -0.2215728759765625, -0.20743179321289062, -0.19329071044921875, -0.17914962768554688, -0.165008544921875, -0.15086746215820312, -0.13672637939453125, -0.12258529663085938, -0.1084442138671875, -0.09430313110351562, -0.08016204833984375, -0.06602096557617188, -0.0518798828125, -0.037738800048828125, -0.02359771728515625, -0.009456634521484375, 0.0046844482421875, 0.018825531005859375, 0.03296661376953125, 0.047107696533203125, 0.061248779296875, 0.07538986206054688, 0.08953094482421875, 0.10367202758789062, 0.1178131103515625, 0.13195419311523438, 0.14609527587890625, 0.16023635864257812, 0.17437744140625, 0.18851852416992188, 0.20265960693359375, 0.21680068969726562, 0.2309417724609375, 0.24508285522460938, 0.25922393798828125, 0.2733650207519531, 0.287506103515625, 0.3016471862792969, 0.31578826904296875, 0.3299293518066406, 0.3440704345703125, 0.3582115173339844, 0.37235260009765625, 0.3864936828613281, 0.400634765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 7.0, 12.0, 11.0, 12.0, 17.0, 16.0, 18.0, 20.0, 26.0, 30.0, 24.0, 36.0, 25.0, 38.0, 38.0, 46.0, 34.0, 38.0, 41.0, 44.0, 54.0, 43.0, 36.0, 32.0, 35.0, 33.0, 34.0, 22.0, 26.0, 22.0, 23.0, 19.0, 15.0, 12.0, 12.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06431770324707031, -0.062168121337890625, -0.06001853942871094, -0.05786895751953125, -0.05571937561035156, -0.053569793701171875, -0.05142021179199219, -0.0492706298828125, -0.04712104797363281, -0.044971466064453125, -0.04282188415527344, -0.04067230224609375, -0.03852272033691406, -0.036373138427734375, -0.03422355651855469, -0.032073974609375, -0.029924392700195312, -0.027774810791015625, -0.025625228881835938, -0.02347564697265625, -0.021326065063476562, -0.019176483154296875, -0.017026901245117188, -0.0148773193359375, -0.012727737426757812, -0.010578155517578125, -0.008428573608398438, -0.00627899169921875, -0.0041294097900390625, -0.001979827880859375, 0.0001697540283203125, 0.0023193359375, 0.0044689178466796875, 0.006618499755859375, 0.008768081665039062, 0.01091766357421875, 0.013067245483398438, 0.015216827392578125, 0.017366409301757812, 0.0195159912109375, 0.021665573120117188, 0.023815155029296875, 0.025964736938476562, 0.02811431884765625, 0.030263900756835938, 0.032413482666015625, 0.03456306457519531, 0.036712646484375, 0.03886222839355469, 0.041011810302734375, 0.04316139221191406, 0.04531097412109375, 0.04746055603027344, 0.049610137939453125, 0.05175971984863281, 0.0539093017578125, 0.05605888366699219, 0.058208465576171875, 0.06035804748535156, 0.06250762939453125, 0.06465721130371094, 0.06680679321289062, 0.06895637512207031, 0.07110595703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 9.0, 8.0, 22.0, 32.0, 155.0, 2559.0, 1043447.0, 2087.0, 131.0, 38.0, 19.0, 11.0, 8.0, 1.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 3.0], "bins": [-5.9921875, -5.871063232421875, -5.74993896484375, -5.628814697265625, -5.5076904296875, -5.386566162109375, -5.26544189453125, -5.144317626953125, -5.023193359375, -4.902069091796875, -4.78094482421875, -4.659820556640625, -4.5386962890625, -4.417572021484375, -4.29644775390625, -4.175323486328125, -4.05419921875, -3.933074951171875, -3.81195068359375, -3.690826416015625, -3.5697021484375, -3.448577880859375, -3.32745361328125, -3.206329345703125, -3.085205078125, -2.964080810546875, -2.84295654296875, -2.721832275390625, -2.6007080078125, -2.479583740234375, -2.35845947265625, -2.237335205078125, -2.1162109375, -1.995086669921875, -1.87396240234375, -1.752838134765625, -1.6317138671875, -1.510589599609375, -1.38946533203125, -1.268341064453125, -1.147216796875, -1.026092529296875, -0.90496826171875, -0.783843994140625, -0.6627197265625, -0.541595458984375, -0.42047119140625, -0.299346923828125, -0.17822265625, -0.057098388671875, 0.06402587890625, 0.185150146484375, 0.3062744140625, 0.427398681640625, 0.54852294921875, 0.669647216796875, 0.790771484375, 0.911895751953125, 1.03302001953125, 1.154144287109375, 1.2752685546875, 1.396392822265625, 1.51751708984375, 1.638641357421875, 1.759765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 14.0, 14.0, 26.0, 47.0, 84.0, 477.0, 167.0, 60.0, 28.0, 25.0, 11.0, 10.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012149810791015625, -0.0011532306671142578, -0.0010914802551269531, -0.0010297298431396484, -0.0009679794311523438, -0.0009062290191650391, -0.0008444786071777344, -0.0007827281951904297, -0.000720977783203125, -0.0006592273712158203, -0.0005974769592285156, -0.0005357265472412109, -0.00047397613525390625, -0.00041222572326660156, -0.0003504753112792969, -0.0002887248992919922, -0.0002269744873046875, -0.0001652240753173828, -0.00010347366333007812, -4.172325134277344e-05, 2.002716064453125e-05, 8.177757263183594e-05, 0.00014352798461914062, 0.0002052783966064453, 0.00026702880859375, 0.0003287792205810547, 0.0003905296325683594, 0.00045228004455566406, 0.0005140304565429688, 0.0005757808685302734, 0.0006375312805175781, 0.0006992816925048828, 0.0007610321044921875, 0.0008227825164794922, 0.0008845329284667969, 0.0009462833404541016, 0.0010080337524414062, 0.001069784164428711, 0.0011315345764160156, 0.0011932849884033203, 0.001255035400390625, 0.0013167858123779297, 0.0013785362243652344, 0.001440286636352539, 0.0015020370483398438, 0.0015637874603271484, 0.0016255378723144531, 0.0016872882843017578, 0.0017490386962890625, 0.0018107891082763672, 0.0018725395202636719, 0.0019342899322509766, 0.0019960403442382812, 0.002057790756225586, 0.0021195411682128906, 0.0021812915802001953, 0.0022430419921875, 0.0023047924041748047, 0.0023665428161621094, 0.002428293228149414, 0.0024900436401367188, 0.0025517940521240234, 0.002613544464111328, 0.002675294876098633, 0.0027370452880859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 10.0, 9.0, 9.0, 18.0, 25.0, 34.0, 64.0, 98.0, 142.0, 294.0, 785.0, 2734.0, 17716.0, 972074.0, 48562.0, 3995.0, 967.0, 404.0, 195.0, 135.0, 97.0, 60.0, 40.0, 29.0, 25.0, 9.0, 9.0, 11.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.407958984375, -0.3872108459472656, -0.36646270751953125, -0.3457145690917969, -0.3249664306640625, -0.3042182922363281, -0.28347015380859375, -0.2627220153808594, -0.241973876953125, -0.22122573852539062, -0.20047760009765625, -0.17972946166992188, -0.1589813232421875, -0.13823318481445312, -0.11748504638671875, -0.09673690795898438, -0.07598876953125, -0.055240631103515625, -0.03449249267578125, -0.013744354248046875, 0.0070037841796875, 0.027751922607421875, 0.04850006103515625, 0.06924819946289062, 0.089996337890625, 0.11074447631835938, 0.13149261474609375, 0.15224075317382812, 0.1729888916015625, 0.19373703002929688, 0.21448516845703125, 0.23523330688476562, 0.2559814453125, 0.2767295837402344, 0.29747772216796875, 0.3182258605957031, 0.3389739990234375, 0.3597221374511719, 0.38047027587890625, 0.4012184143066406, 0.421966552734375, 0.4427146911621094, 0.46346282958984375, 0.4842109680175781, 0.5049591064453125, 0.5257072448730469, 0.5464553833007812, 0.5672035217285156, 0.58795166015625, 0.6086997985839844, 0.6294479370117188, 0.6501960754394531, 0.6709442138671875, 0.6916923522949219, 0.7124404907226562, 0.7331886291503906, 0.753936767578125, 0.7746849060058594, 0.7954330444335938, 0.8161811828613281, 0.8369293212890625, 0.8576774597167969, 0.8784255981445312, 0.8991737365722656, 0.919921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 9.0, 14.0, 33.0, 61.0, 214.0, 347.0, 181.0, 69.0, 26.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.14904022216796875, -0.1393890380859375, -0.12973785400390625, -0.120086669921875, -0.11043548583984375, -0.1007843017578125, -0.09113311767578125, -0.08148193359375, -0.07183074951171875, -0.0621795654296875, -0.05252838134765625, -0.042877197265625, -0.03322601318359375, -0.0235748291015625, -0.01392364501953125, -0.0042724609375, 0.00537872314453125, 0.0150299072265625, 0.02468109130859375, 0.034332275390625, 0.04398345947265625, 0.0536346435546875, 0.06328582763671875, 0.07293701171875, 0.08258819580078125, 0.0922393798828125, 0.10189056396484375, 0.111541748046875, 0.12119293212890625, 0.1308441162109375, 0.14049530029296875, 0.150146484375, 0.15979766845703125, 0.1694488525390625, 0.17910003662109375, 0.188751220703125, 0.19840240478515625, 0.2080535888671875, 0.21770477294921875, 0.22735595703125, 0.23700714111328125, 0.2466583251953125, 0.25630950927734375, 0.265960693359375, 0.27561187744140625, 0.2852630615234375, 0.29491424560546875, 0.3045654296875, 0.31421661376953125, 0.3238677978515625, 0.33351898193359375, 0.343170166015625, 0.35282135009765625, 0.3624725341796875, 0.37212371826171875, 0.38177490234375, 0.39142608642578125, 0.4010772705078125, 0.41072845458984375, 0.420379638671875, 0.43003082275390625, 0.4396820068359375, 0.44933319091796875, 0.458984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 10.0, 17.0, 27.0, 62.0, 183.0, 282.0, 201.0, 106.0, 45.0, 25.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2714014053344727, -2.219346523284912, -2.1672916412353516, -2.115236520767212, -2.0631816387176514, -2.011126756668091, -1.9590717554092407, -1.9070167541503906, -1.85496187210083, -1.8029069900512695, -1.7508519887924194, -1.6987969875335693, -1.6467421054840088, -1.5946872234344482, -1.5426322221755981, -1.490577220916748, -1.4385223388671875, -1.386467456817627, -1.3344124555587769, -1.2823574542999268, -1.2303025722503662, -1.1782476902008057, -1.1261926889419556, -1.0741376876831055, -1.022082805633545, -0.9700278639793396, -0.9179729223251343, -0.865917980670929, -0.8138630390167236, -0.7618080973625183, -0.709753155708313, -0.6576982140541077, -0.6056432723999023, -0.553588330745697, -0.5015333890914917, -0.4494784474372864, -0.39742350578308105, -0.34536856412887573, -0.2933136224746704, -0.2412586808204651, -0.18920373916625977, -0.13714879751205444, -0.08509385585784912, -0.0330389142036438, 0.019016027450561523, 0.07107096910476685, 0.12312591075897217, 0.1751808524131775, 0.2272357940673828, 0.27929073572158813, 0.33134567737579346, 0.3834006190299988, 0.4354555606842041, 0.4875105023384094, 0.5395654439926147, 0.5916203856468201, 0.6436753273010254, 0.6957302689552307, 0.747785210609436, 0.7998401522636414, 0.8518950939178467, 0.903950035572052, 0.9560049772262573, 1.0080599784851074, 1.060114860534668]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 5.0, 5.0, 4.0, 10.0, 5.0, 17.0, 17.0, 19.0, 29.0, 39.0, 41.0, 42.0, 50.0, 56.0, 58.0, 57.0, 56.0, 72.0, 61.0, 51.0, 44.0, 56.0, 47.0, 28.0, 20.0, 17.0, 16.0, 14.0, 14.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6870524287223816, -0.6626450419425964, -0.6382376551628113, -0.6138302683830261, -0.589422881603241, -0.5650154948234558, -0.5406081080436707, -0.5162007212638855, -0.49179333448410034, -0.4673859477043152, -0.44297856092453003, -0.4185711741447449, -0.3941637873649597, -0.36975640058517456, -0.3453490138053894, -0.32094162702560425, -0.2965342700481415, -0.2721268832683563, -0.24771949648857117, -0.223312109708786, -0.19890472292900085, -0.1744973361492157, -0.15008996427059174, -0.12568257749080658, -0.10127519071102142, -0.07686780393123627, -0.05246042087674141, -0.02805303782224655, -0.0036456510424613953, 0.02076173573732376, 0.04516911506652832, 0.06957650184631348, 0.09398388862609863, 0.11839127540588379, 0.14279866218566895, 0.1672060489654541, 0.19161343574523926, 0.21602082252502441, 0.24042819440364838, 0.2648355960845947, 0.2892429828643799, 0.31365036964416504, 0.3380577564239502, 0.36246514320373535, 0.3868725299835205, 0.41127991676330566, 0.4356873035430908, 0.460094690322876, 0.48450204730033875, 0.5089094042778015, 0.5333167910575867, 0.5577241778373718, 0.582131564617157, 0.6065389513969421, 0.6309463381767273, 0.6553537249565125, 0.6797611117362976, 0.7041684985160828, 0.7285758852958679, 0.7529832720756531, 0.7773906588554382, 0.8017980456352234, 0.8262054324150085, 0.8506128191947937, 0.8750202059745789]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 6.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 6.0, 8.0, 0.0, 4.0, 6.0, 14.0, 4.0, 14.0, 10.0, 11.0, 6.0, 21.0, 13.0, 50.0, 99.0, 254.0, 861.0, 3971.0, 36181.0, 4100343.0, 46797.0, 4341.0, 788.0, 224.0, 75.0, 45.0, 31.0, 4.0, 7.0, 18.0, 8.0, 14.0, 2.0, 6.0, 2.0, 6.0, 2.0, 12.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.88720703125, -0.8571701049804688, -0.8271331787109375, -0.7970962524414062, -0.767059326171875, -0.7370223999023438, -0.7069854736328125, -0.6769485473632812, -0.64691162109375, -0.6168746948242188, -0.5868377685546875, -0.5568008422851562, -0.526763916015625, -0.49672698974609375, -0.4666900634765625, -0.43665313720703125, -0.4066162109375, -0.37657928466796875, -0.3465423583984375, -0.31650543212890625, -0.286468505859375, -0.25643157958984375, -0.2263946533203125, -0.19635772705078125, -0.16632080078125, -0.13628387451171875, -0.1062469482421875, -0.07621002197265625, -0.046173095703125, -0.01613616943359375, 0.0139007568359375, 0.04393768310546875, 0.073974609375, 0.10401153564453125, 0.1340484619140625, 0.16408538818359375, 0.194122314453125, 0.22415924072265625, 0.2541961669921875, 0.28423309326171875, 0.31427001953125, 0.34430694580078125, 0.3743438720703125, 0.40438079833984375, 0.434417724609375, 0.46445465087890625, 0.4944915771484375, 0.5245285034179688, 0.5545654296875, 0.5846023559570312, 0.6146392822265625, 0.6446762084960938, 0.674713134765625, 0.7047500610351562, 0.7347869873046875, 0.7648239135742188, 0.79486083984375, 0.8248977661132812, 0.8549346923828125, 0.8849716186523438, 0.915008544921875, 0.9450454711914062, 0.9750823974609375, 1.0051193237304688, 1.03515625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 7.0, 6.0, 6.0, 10.0, 10.0, 17.0, 12.0, 26.0, 36.0, 40.0, 53.0, 54.0, 62.0, 60.0, 61.0, 72.0, 64.0, 61.0, 62.0, 58.0, 46.0, 31.0, 23.0, 23.0, 16.0, 13.0, 17.0, 8.0, 12.0, 6.0, 5.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01506805419921875, -0.014627218246459961, -0.014186382293701172, -0.013745546340942383, -0.013304710388183594, -0.012863874435424805, -0.012423038482666016, -0.011982202529907227, -0.011541366577148438, -0.011100530624389648, -0.01065969467163086, -0.01021885871887207, -0.009778022766113281, -0.009337186813354492, -0.008896350860595703, -0.008455514907836914, -0.008014678955078125, -0.007573843002319336, -0.007133007049560547, -0.006692171096801758, -0.006251335144042969, -0.00581049919128418, -0.005369663238525391, -0.0049288272857666016, -0.0044879913330078125, -0.0040471553802490234, -0.0036063194274902344, -0.0031654834747314453, -0.0027246475219726562, -0.002283811569213867, -0.0018429756164550781, -0.001402139663696289, -0.0009613037109375, -0.0005204677581787109, -7.963180541992188e-05, 0.0003612041473388672, 0.0008020401000976562, 0.0012428760528564453, 0.0016837120056152344, 0.0021245479583740234, 0.0025653839111328125, 0.0030062198638916016, 0.0034470558166503906, 0.0038878917694091797, 0.004328727722167969, 0.004769563674926758, 0.005210399627685547, 0.005651235580444336, 0.006092071533203125, 0.006532907485961914, 0.006973743438720703, 0.007414579391479492, 0.007855415344238281, 0.00829625129699707, 0.00873708724975586, 0.009177923202514648, 0.009618759155273438, 0.010059595108032227, 0.010500431060791016, 0.010941267013549805, 0.011382102966308594, 0.011822938919067383, 0.012263774871826172, 0.012704610824584961, 0.01314544677734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 13.0, 29.0, 112.0, 2121.0, 4125744.0, 65689.0, 479.0, 71.0, 18.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.615234375, -0.558258056640625, -0.50128173828125, -0.444305419921875, -0.3873291015625, -0.330352783203125, -0.27337646484375, -0.216400146484375, -0.159423828125, -0.102447509765625, -0.04547119140625, 0.011505126953125, 0.0684814453125, 0.125457763671875, 0.18243408203125, 0.239410400390625, 0.29638671875, 0.353363037109375, 0.41033935546875, 0.467315673828125, 0.5242919921875, 0.581268310546875, 0.63824462890625, 0.695220947265625, 0.752197265625, 0.809173583984375, 0.86614990234375, 0.923126220703125, 0.9801025390625, 1.037078857421875, 1.09405517578125, 1.151031494140625, 1.2080078125, 1.264984130859375, 1.32196044921875, 1.378936767578125, 1.4359130859375, 1.492889404296875, 1.54986572265625, 1.606842041015625, 1.663818359375, 1.720794677734375, 1.77777099609375, 1.834747314453125, 1.8917236328125, 1.948699951171875, 2.00567626953125, 2.062652587890625, 2.11962890625, 2.176605224609375, 2.23358154296875, 2.290557861328125, 2.3475341796875, 2.404510498046875, 2.46148681640625, 2.518463134765625, 2.575439453125, 2.632415771484375, 2.68939208984375, 2.746368408203125, 2.8033447265625, 2.860321044921875, 2.91729736328125, 2.974273681640625, 3.03125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 4.0, 11.0, 4.0, 16.0, 15.0, 27.0, 25.0, 45.0, 61.0, 90.0, 154.0, 358.0, 1666.0, 826.0, 297.0, 141.0, 82.0, 57.0, 46.0, 34.0, 21.0, 18.0, 12.0, 9.0, 4.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03369140625, -0.03252220153808594, -0.031352996826171875, -0.030183792114257812, -0.02901458740234375, -0.027845382690429688, -0.026676177978515625, -0.025506973266601562, -0.0243377685546875, -0.023168563842773438, -0.021999359130859375, -0.020830154418945312, -0.01966094970703125, -0.018491744995117188, -0.017322540283203125, -0.016153335571289062, -0.014984130859375, -0.013814926147460938, -0.012645721435546875, -0.011476516723632812, -0.01030731201171875, -0.009138107299804688, -0.007968902587890625, -0.0067996978759765625, -0.0056304931640625, -0.0044612884521484375, -0.003292083740234375, -0.0021228790283203125, -0.00095367431640625, 0.0002155303955078125, 0.001384735107421875, 0.0025539398193359375, 0.00372314453125, 0.0048923492431640625, 0.006061553955078125, 0.0072307586669921875, 0.00839996337890625, 0.009569168090820312, 0.010738372802734375, 0.011907577514648438, 0.0130767822265625, 0.014245986938476562, 0.015415191650390625, 0.016584396362304688, 0.01775360107421875, 0.018922805786132812, 0.020092010498046875, 0.021261215209960938, 0.022430419921875, 0.023599624633789062, 0.024768829345703125, 0.025938034057617188, 0.02710723876953125, 0.028276443481445312, 0.029445648193359375, 0.030614852905273438, 0.0317840576171875, 0.03295326232910156, 0.034122467041015625, 0.03529167175292969, 0.03646087646484375, 0.03763008117675781, 0.038799285888671875, 0.03996849060058594, 0.0411376953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [40.0, 931.0, 43.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17340520024299622, -0.05609995126724243, 0.06120529770851135, 0.17851054668426514, 0.2958157956600189, 0.4131210744380951, 0.5304262638092041, 0.6477315425872803, 0.7650368213653564, 0.8823421001434326, 0.999647319316864, 1.1169525384902954, 1.2342578172683716, 1.3515630960464478, 1.4688682556152344, 1.5861735343933105, 1.7034788131713867, 1.820784091949463, 1.938089370727539, 2.0553946495056152, 2.1726999282836914, 2.2900052070617676, 2.4073102474212646, 2.524615526199341, 2.641920804977417, 2.759226083755493, 2.8765313625335693, 2.9938366413116455, 3.1111416816711426, 3.2284469604492188, 3.345752239227295, 3.463057518005371, 3.5803627967834473, 3.6976680755615234, 3.8149733543395996, 3.932278633117676, 4.049583911895752, 4.166889190673828, 4.284194469451904, 4.4014997482299805, 4.518804550170898, 4.636109828948975, 4.753415107727051, 4.870720386505127, 4.988025665283203, 5.105330944061279, 5.2226362228393555, 5.339941024780273, 5.457246780395508, 5.574552059173584, 5.69185733795166, 5.809162616729736, 5.9264678955078125, 6.043773174285889, 6.161078453063965, 6.278383255004883, 6.395689010620117, 6.512994289398193, 6.6302995681762695, 6.747604846954346, 6.864910125732422, 6.982215404510498, 7.099520683288574, 7.216825485229492, 7.334130764007568]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 16.0, 24.0, 33.0, 46.0, 92.0, 92.0, 132.0, 131.0, 110.0, 125.0, 63.0, 42.0, 40.0, 16.0, 11.0, 13.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3009740114212036, -0.28428196907043457, -0.2675899267196655, -0.2508978843688965, -0.23420585691928864, -0.2175138145685196, -0.20082178711891174, -0.1841297447681427, -0.16743770241737366, -0.15074566006660461, -0.13405361771583557, -0.11736159026622772, -0.10066954791545868, -0.08397750556468964, -0.06728547066450119, -0.050593435764312744, -0.0339013934135437, -0.017209354788064957, -0.0005173161625862122, 0.016174722462892532, 0.03286676108837128, 0.04955880343914032, 0.06625083833932877, 0.08294287323951721, 0.09963491559028625, 0.1163269579410553, 0.13301900029182434, 0.1497110277414322, 0.16640307009220123, 0.18309511244297028, 0.19978713989257812, 0.21647918224334717, 0.2331712245941162, 0.24986326694488525, 0.2665553092956543, 0.28324735164642334, 0.2999393939971924, 0.3166314363479614, 0.3333234488964081, 0.3500154912471771, 0.36670753359794617, 0.3833995759487152, 0.40009161829948425, 0.4167836606502533, 0.43347567319869995, 0.450167715549469, 0.46685975790023804, 0.4835518002510071, 0.5002438426017761, 0.5169358849525452, 0.5336279273033142, 0.5503199696540833, 0.5670120120048523, 0.5837040543556213, 0.6003960967063904, 0.6170880794525146, 0.6337801218032837, 0.6504721641540527, 0.6671642065048218, 0.6838562488555908, 0.7005482912063599, 0.7172403335571289, 0.733932375907898, 0.750624418258667, 0.767316460609436]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 9.0, 13.0, 14.0, 5.0, 13.0, 16.0, 29.0, 23.0, 24.0, 39.0, 38.0, 38.0, 40.0, 142.0, 2753.0, 697362.0, 345815.0, 1688.0, 114.0, 42.0, 49.0, 38.0, 33.0, 36.0, 29.0, 24.0, 18.0, 16.0, 21.0, 12.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.84228515625, -0.81817626953125, -0.7940673828125, -0.76995849609375, -0.745849609375, -0.72174072265625, -0.6976318359375, -0.67352294921875, -0.6494140625, -0.62530517578125, -0.6011962890625, -0.57708740234375, -0.552978515625, -0.52886962890625, -0.5047607421875, -0.48065185546875, -0.45654296875, -0.43243408203125, -0.4083251953125, -0.38421630859375, -0.360107421875, -0.33599853515625, -0.3118896484375, -0.28778076171875, -0.263671875, -0.23956298828125, -0.2154541015625, -0.19134521484375, -0.167236328125, -0.14312744140625, -0.1190185546875, -0.09490966796875, -0.07080078125, -0.04669189453125, -0.0225830078125, 0.00152587890625, 0.025634765625, 0.04974365234375, 0.0738525390625, 0.09796142578125, 0.1220703125, 0.14617919921875, 0.1702880859375, 0.19439697265625, 0.218505859375, 0.24261474609375, 0.2667236328125, 0.29083251953125, 0.31494140625, 0.33905029296875, 0.3631591796875, 0.38726806640625, 0.411376953125, 0.43548583984375, 0.4595947265625, 0.48370361328125, 0.5078125, 0.53192138671875, 0.5560302734375, 0.58013916015625, 0.604248046875, 0.62835693359375, 0.6524658203125, 0.67657470703125, 0.70068359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 15.0, 57.0, 219.0, 380.0, 248.0, 77.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0159912109375, -0.012537002563476562, -0.009082794189453125, -0.0056285858154296875, -0.00217437744140625, 0.0012798309326171875, 0.004734039306640625, 0.008188247680664062, 0.0116424560546875, 0.015096664428710938, 0.018550872802734375, 0.022005081176757812, 0.02545928955078125, 0.028913497924804688, 0.032367706298828125, 0.03582191467285156, 0.039276123046875, 0.04273033142089844, 0.046184539794921875, 0.04963874816894531, 0.05309295654296875, 0.05654716491699219, 0.060001373291015625, 0.06345558166503906, 0.0669097900390625, 0.07036399841308594, 0.07381820678710938, 0.07727241516113281, 0.08072662353515625, 0.08418083190917969, 0.08763504028320312, 0.09108924865722656, 0.09454345703125, 0.09799766540527344, 0.10145187377929688, 0.10490608215332031, 0.10836029052734375, 0.11181449890136719, 0.11526870727539062, 0.11872291564941406, 0.1221771240234375, 0.12563133239746094, 0.12908554077148438, 0.1325397491455078, 0.13599395751953125, 0.1394481658935547, 0.14290237426757812, 0.14635658264160156, 0.149810791015625, 0.15326499938964844, 0.15671920776367188, 0.1601734161376953, 0.16362762451171875, 0.1670818328857422, 0.17053604125976562, 0.17399024963378906, 0.1774444580078125, 0.18089866638183594, 0.18435287475585938, 0.1878070831298828, 0.19126129150390625, 0.1947154998779297, 0.19816970825195312, 0.20162391662597656, 0.205078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 15.0, 13.0, 23.0, 17.0, 29.0, 53.0, 54.0, 68.0, 111.0, 200.0, 316.0, 693.0, 1745.0, 6142.0, 28728.0, 187383.0, 640750.0, 150295.0, 23572.0, 5317.0, 1498.0, 622.0, 303.0, 171.0, 126.0, 93.0, 52.0, 41.0, 30.0, 18.0, 15.0, 13.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.305908203125, -0.297027587890625, -0.28814697265625, -0.279266357421875, -0.2703857421875, -0.261505126953125, -0.25262451171875, -0.243743896484375, -0.23486328125, -0.225982666015625, -0.21710205078125, -0.208221435546875, -0.1993408203125, -0.190460205078125, -0.18157958984375, -0.172698974609375, -0.163818359375, -0.154937744140625, -0.14605712890625, -0.137176513671875, -0.1282958984375, -0.119415283203125, -0.11053466796875, -0.101654052734375, -0.0927734375, -0.083892822265625, -0.07501220703125, -0.066131591796875, -0.0572509765625, -0.048370361328125, -0.03948974609375, -0.030609130859375, -0.021728515625, -0.012847900390625, -0.00396728515625, 0.004913330078125, 0.0137939453125, 0.022674560546875, 0.03155517578125, 0.040435791015625, 0.04931640625, 0.058197021484375, 0.06707763671875, 0.075958251953125, 0.0848388671875, 0.093719482421875, 0.10260009765625, 0.111480712890625, 0.120361328125, 0.129241943359375, 0.13812255859375, 0.147003173828125, 0.1558837890625, 0.164764404296875, 0.17364501953125, 0.182525634765625, 0.19140625, 0.200286865234375, 0.20916748046875, 0.218048095703125, 0.2269287109375, 0.235809326171875, 0.24468994140625, 0.253570556640625, 0.262451171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 11.0, 17.0, 15.0, 21.0, 25.0, 31.0, 28.0, 34.0, 29.0, 39.0, 36.0, 50.0, 43.0, 36.0, 56.0, 57.0, 54.0, 58.0, 48.0, 40.0, 50.0, 31.0, 28.0, 25.0, 30.0, 23.0, 15.0, 9.0, 8.0, 6.0, 9.0, 6.0, 4.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1744384765625, -0.16913414001464844, -0.16382980346679688, -0.1585254669189453, -0.15322113037109375, -0.1479167938232422, -0.14261245727539062, -0.13730812072753906, -0.1320037841796875, -0.12669944763183594, -0.12139511108398438, -0.11609077453613281, -0.11078643798828125, -0.10548210144042969, -0.10017776489257812, -0.09487342834472656, -0.089569091796875, -0.08426475524902344, -0.07896041870117188, -0.07365608215332031, -0.06835174560546875, -0.06304740905761719, -0.057743072509765625, -0.05243873596191406, -0.0471343994140625, -0.04183006286621094, -0.036525726318359375, -0.031221389770507812, -0.02591705322265625, -0.020612716674804688, -0.015308380126953125, -0.010004043579101562, -0.00469970703125, 0.0006046295166015625, 0.005908966064453125, 0.011213302612304688, 0.01651763916015625, 0.021821975708007812, 0.027126312255859375, 0.03243064880371094, 0.0377349853515625, 0.04303932189941406, 0.048343658447265625, 0.05364799499511719, 0.05895233154296875, 0.06425666809082031, 0.06956100463867188, 0.07486534118652344, 0.080169677734375, 0.08547401428222656, 0.09077835083007812, 0.09608268737792969, 0.10138702392578125, 0.10669136047363281, 0.11199569702148438, 0.11730003356933594, 0.1226043701171875, 0.12790870666503906, 0.13321304321289062, 0.1385173797607422, 0.14382171630859375, 0.1491260528564453, 0.15443038940429688, 0.15973472595214844, 0.1650390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 6.0, 8.0, 5.0, 9.0, 11.0, 15.0, 14.0, 27.0, 44.0, 85.0, 164.0, 473.0, 1755.0, 13671.0, 992746.0, 35962.0, 2439.0, 610.0, 212.0, 99.0, 52.0, 36.0, 24.0, 15.0, 9.0, 15.0, 11.0, 7.0, 1.0, 3.0, 7.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.8642578125, -0.83929443359375, -0.8143310546875, -0.78936767578125, -0.764404296875, -0.73944091796875, -0.7144775390625, -0.68951416015625, -0.66455078125, -0.63958740234375, -0.6146240234375, -0.58966064453125, -0.564697265625, -0.53973388671875, -0.5147705078125, -0.48980712890625, -0.46484375, -0.43988037109375, -0.4149169921875, -0.38995361328125, -0.364990234375, -0.34002685546875, -0.3150634765625, -0.29010009765625, -0.26513671875, -0.24017333984375, -0.2152099609375, -0.19024658203125, -0.165283203125, -0.14031982421875, -0.1153564453125, -0.09039306640625, -0.0654296875, -0.04046630859375, -0.0155029296875, 0.00946044921875, 0.034423828125, 0.05938720703125, 0.0843505859375, 0.10931396484375, 0.13427734375, 0.15924072265625, 0.1842041015625, 0.20916748046875, 0.234130859375, 0.25909423828125, 0.2840576171875, 0.30902099609375, 0.333984375, 0.35894775390625, 0.3839111328125, 0.40887451171875, 0.433837890625, 0.45880126953125, 0.4837646484375, 0.50872802734375, 0.53369140625, 0.55865478515625, 0.5836181640625, 0.60858154296875, 0.633544921875, 0.65850830078125, 0.6834716796875, 0.70843505859375, 0.7333984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 15.0, 13.0, 15.0, 19.0, 29.0, 32.0, 39.0, 51.0, 65.0, 93.0, 115.0, 98.0, 85.0, 60.0, 55.0, 51.0, 17.0, 26.0, 19.0, 17.0, 9.0, 13.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00014519691467285156, -0.00014092959463596344, -0.00013666227459907532, -0.0001323949545621872, -0.00012812763452529907, -0.00012386031448841095, -0.00011959299445152283, -0.0001153256744146347, -0.00011105835437774658, -0.00010679103434085846, -0.00010252371430397034, -9.825639426708221e-05, -9.398907423019409e-05, -8.972175419330597e-05, -8.545443415641785e-05, -8.118711411952972e-05, -7.69197940826416e-05, -7.265247404575348e-05, -6.838515400886536e-05, -6.411783397197723e-05, -5.985051393508911e-05, -5.558319389820099e-05, -5.1315873861312866e-05, -4.7048553824424744e-05, -4.278123378753662e-05, -3.85139137506485e-05, -3.4246593713760376e-05, -2.9979273676872253e-05, -2.571195363998413e-05, -2.1444633603096008e-05, -1.7177313566207886e-05, -1.2909993529319763e-05, -8.64267349243164e-06, -4.375353455543518e-06, -1.0803341865539551e-07, 4.159286618232727e-06, 8.42660665512085e-06, 1.2693926692008972e-05, 1.6961246728897095e-05, 2.1228566765785217e-05, 2.549588680267334e-05, 2.9763206839561462e-05, 3.4030526876449585e-05, 3.829784691333771e-05, 4.256516695022583e-05, 4.683248698711395e-05, 5.1099807024002075e-05, 5.53671270608902e-05, 5.963444709777832e-05, 6.390176713466644e-05, 6.816908717155457e-05, 7.243640720844269e-05, 7.670372724533081e-05, 8.097104728221893e-05, 8.523836731910706e-05, 8.950568735599518e-05, 9.37730073928833e-05, 9.804032742977142e-05, 0.00010230764746665955, 0.00010657496750354767, 0.00011084228754043579, 0.00011510960757732391, 0.00011937692761421204, 0.00012364424765110016, 0.00012791156768798828]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 6.0, 10.0, 21.0, 26.0, 47.0, 69.0, 156.0, 343.0, 1154.0, 5613.0, 64076.0, 953054.0, 19925.0, 2941.0, 674.0, 181.0, 96.0, 45.0, 33.0, 10.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.19921875, -1.1694717407226562, -1.1397247314453125, -1.1099777221679688, -1.080230712890625, -1.0504837036132812, -1.0207366943359375, -0.9909896850585938, -0.96124267578125, -0.9314956665039062, -0.9017486572265625, -0.8720016479492188, -0.842254638671875, -0.8125076293945312, -0.7827606201171875, -0.7530136108398438, -0.7232666015625, -0.6935195922851562, -0.6637725830078125, -0.6340255737304688, -0.604278564453125, -0.5745315551757812, -0.5447845458984375, -0.5150375366210938, -0.48529052734375, -0.45554351806640625, -0.4257965087890625, -0.39604949951171875, -0.366302490234375, -0.33655548095703125, -0.3068084716796875, -0.27706146240234375, -0.247314453125, -0.21756744384765625, -0.1878204345703125, -0.15807342529296875, -0.128326416015625, -0.09857940673828125, -0.0688323974609375, -0.03908538818359375, -0.00933837890625, 0.02040863037109375, 0.0501556396484375, 0.07990264892578125, 0.109649658203125, 0.13939666748046875, 0.1691436767578125, 0.19889068603515625, 0.2286376953125, 0.25838470458984375, 0.2881317138671875, 0.31787872314453125, 0.347625732421875, 0.37737274169921875, 0.4071197509765625, 0.43686676025390625, 0.46661376953125, 0.49636077880859375, 0.5261077880859375, 0.5558547973632812, 0.585601806640625, 0.6153488159179688, 0.6450958251953125, 0.6748428344726562, 0.70458984375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 5.0, 6.0, 5.0, 9.0, 14.0, 34.0, 44.0, 94.0, 294.0, 275.0, 94.0, 39.0, 22.0, 7.0, 5.0, 8.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.72314453125, -0.7066879272460938, -0.6902313232421875, -0.6737747192382812, -0.657318115234375, -0.6408615112304688, -0.6244049072265625, -0.6079483032226562, -0.59149169921875, -0.5750350952148438, -0.5585784912109375, -0.5421218872070312, -0.525665283203125, -0.5092086791992188, -0.4927520751953125, -0.47629547119140625, -0.4598388671875, -0.44338226318359375, -0.4269256591796875, -0.41046905517578125, -0.394012451171875, -0.37755584716796875, -0.3610992431640625, -0.34464263916015625, -0.32818603515625, -0.31172943115234375, -0.2952728271484375, -0.27881622314453125, -0.262359619140625, -0.24590301513671875, -0.2294464111328125, -0.21298980712890625, -0.196533203125, -0.18007659912109375, -0.1636199951171875, -0.14716339111328125, -0.130706787109375, -0.11425018310546875, -0.0977935791015625, -0.08133697509765625, -0.06488037109375, -0.04842376708984375, -0.0319671630859375, -0.01551055908203125, 0.000946044921875, 0.01740264892578125, 0.0338592529296875, 0.05031585693359375, 0.0667724609375, 0.08322906494140625, 0.0996856689453125, 0.11614227294921875, 0.132598876953125, 0.14905548095703125, 0.1655120849609375, 0.18196868896484375, 0.19842529296875, 0.21488189697265625, 0.2313385009765625, 0.24779510498046875, 0.264251708984375, 0.28070831298828125, 0.2971649169921875, 0.31362152099609375, 0.330078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [4.0, 20.0, 963.0, 31.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.191648006439209, -2.0491628646850586, -0.9066774845123291, 0.2358078956604004, 1.3782930374145508, 2.520778179168701, 3.6632637977600098, 4.80574893951416, 5.9482340812683105, 7.090719223022461, 8.23320484161377, 9.375690460205078, 10.51817512512207, 11.660659790039062, 12.803146362304688, 13.94563102722168, 15.088115692138672, 16.230600357055664, 17.37308692932129, 18.51557159423828, 19.658056259155273, 20.800540924072266, 21.94302749633789, 23.085512161254883, 24.227998733520508, 25.3704833984375, 26.512969970703125, 27.655454635620117, 28.79793930053711, 29.940425872802734, 31.082910537719727, 32.22539520263672, 33.36787796020508, 34.5103645324707, 35.65284729003906, 36.79533386230469, 37.93782043457031, 39.08030319213867, 40.2227897644043, 41.36527633666992, 42.50775909423828, 43.650245666503906, 44.792728424072266, 45.93521499633789, 47.077701568603516, 48.220184326171875, 49.3626708984375, 50.505157470703125, 51.64764404296875, 52.790130615234375, 53.932613372802734, 55.07509994506836, 56.217586517333984, 57.360069274902344, 58.50255584716797, 59.645042419433594, 60.78752517700195, 61.93001174926758, 63.07249450683594, 64.21498107910156, 65.35746765136719, 66.49995422363281, 67.64244079589844, 68.78491973876953, 69.92740631103516]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 18.0, 31.0, 48.0, 103.0, 119.0, 174.0, 145.0, 137.0, 119.0, 59.0, 32.0, 14.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1238951683044434, -0.9953086972236633, -0.8667222261428833, -0.7381357550621033, -0.6095492839813232, -0.4809628129005432, -0.3523763418197632, -0.22378987073898315, -0.09520339965820312, 0.033383071422576904, 0.16196954250335693, 0.29055601358413696, 0.419142484664917, 0.547728955745697, 0.676315426826477, 0.8049018979072571, 0.9334883689880371, 1.062074899673462, 1.1906613111495972, 1.3192477226257324, 1.4478342533111572, 1.576420783996582, 1.7050071954727173, 1.8335936069488525, 1.9621801376342773, 2.090766668319702, 2.219353199005127, 2.3479394912719727, 2.4765260219573975, 2.6051125526428223, 2.733698844909668, 2.8622853755950928, 2.9908719062805176, 3.1194584369659424, 3.248044967651367, 3.376631259918213, 3.5052177906036377, 3.6338043212890625, 3.762390613555908, 3.890977144241333, 4.019563674926758, 4.1481499671936035, 4.276736736297607, 4.405323028564453, 4.533909797668457, 4.662496089935303, 4.791082382202148, 4.919669151306152, 5.048255443572998, 5.176841735839844, 5.305428504943848, 5.434014797210693, 5.562601089477539, 5.691187858581543, 5.819774150848389, 5.948360919952393, 6.076947212219238, 6.205533504486084, 6.334120273590088, 6.462706565856934, 6.5912933349609375, 6.719879627227783, 6.848465919494629, 6.977052688598633, 7.1056389808654785]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 14.0, 68.0, 216.0, 4150196.0, 42956.0, 475.0, 193.0, 96.0, 37.0, 22.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5087890625, -1.3176116943359375, -1.126434326171875, -0.9352569580078125, -0.74407958984375, -0.5529022216796875, -0.361724853515625, -0.1705474853515625, 0.0206298828125, 0.2118072509765625, 0.402984619140625, 0.5941619873046875, 0.78533935546875, 0.9765167236328125, 1.167694091796875, 1.3588714599609375, 1.550048828125, 1.7412261962890625, 1.932403564453125, 2.1235809326171875, 2.31475830078125, 2.5059356689453125, 2.697113037109375, 2.8882904052734375, 3.0794677734375, 3.2706451416015625, 3.461822509765625, 3.6529998779296875, 3.84417724609375, 4.0353546142578125, 4.226531982421875, 4.4177093505859375, 4.60888671875, 4.8000640869140625, 4.991241455078125, 5.1824188232421875, 5.37359619140625, 5.5647735595703125, 5.755950927734375, 5.9471282958984375, 6.1383056640625, 6.3294830322265625, 6.520660400390625, 6.7118377685546875, 6.90301513671875, 7.0941925048828125, 7.285369873046875, 7.4765472412109375, 7.667724609375, 7.8589019775390625, 8.050079345703125, 8.241256713867188, 8.43243408203125, 8.623611450195312, 8.814788818359375, 9.005966186523438, 9.1971435546875, 9.388320922851562, 9.579498291015625, 9.770675659179688, 9.96185302734375, 10.153030395507812, 10.344207763671875, 10.535385131835938, 10.7265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 11.0, 61.0, 157.0, 302.0, 284.0, 140.0, 46.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038482666015625, -0.03363943099975586, -0.02879619598388672, -0.023952960968017578, -0.019109725952148438, -0.014266490936279297, -0.009423255920410156, -0.004580020904541016, 0.000263214111328125, 0.005106449127197266, 0.009949684143066406, 0.014792919158935547, 0.019636154174804688, 0.024479389190673828, 0.02932262420654297, 0.03416585922241211, 0.03900909423828125, 0.04385232925415039, 0.04869556427001953, 0.05353879928588867, 0.05838203430175781, 0.06322526931762695, 0.0680685043334961, 0.07291173934936523, 0.07775497436523438, 0.08259820938110352, 0.08744144439697266, 0.0922846794128418, 0.09712791442871094, 0.10197114944458008, 0.10681438446044922, 0.11165761947631836, 0.1165008544921875, 0.12134408950805664, 0.12618732452392578, 0.13103055953979492, 0.13587379455566406, 0.1407170295715332, 0.14556026458740234, 0.15040349960327148, 0.15524673461914062, 0.16008996963500977, 0.1649332046508789, 0.16977643966674805, 0.1746196746826172, 0.17946290969848633, 0.18430614471435547, 0.1891493797302246, 0.19399261474609375, 0.1988358497619629, 0.20367908477783203, 0.20852231979370117, 0.2133655548095703, 0.21820878982543945, 0.2230520248413086, 0.22789525985717773, 0.23273849487304688, 0.23758172988891602, 0.24242496490478516, 0.2472681999206543, 0.25211143493652344, 0.2569546699523926, 0.2617979049682617, 0.26664113998413086, 0.271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 16.0, 48.0, 108.0, 188.0, 375.0, 4185312.0, 7390.0, 305.0, 252.0, 131.0, 93.0, 33.0, 17.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01171875, -4.74542236328125, -4.4791259765625, -4.21282958984375, -3.946533203125, -3.68023681640625, -3.4139404296875, -3.14764404296875, -2.88134765625, -2.61505126953125, -2.3487548828125, -2.08245849609375, -1.816162109375, -1.54986572265625, -1.2835693359375, -1.01727294921875, -0.7509765625, -0.48468017578125, -0.2183837890625, 0.04791259765625, 0.314208984375, 0.58050537109375, 0.8468017578125, 1.11309814453125, 1.37939453125, 1.64569091796875, 1.9119873046875, 2.17828369140625, 2.444580078125, 2.71087646484375, 2.9771728515625, 3.24346923828125, 3.509765625, 3.77606201171875, 4.0423583984375, 4.30865478515625, 4.574951171875, 4.84124755859375, 5.1075439453125, 5.37384033203125, 5.64013671875, 5.90643310546875, 6.1727294921875, 6.43902587890625, 6.705322265625, 6.97161865234375, 7.2379150390625, 7.50421142578125, 7.7705078125, 8.03680419921875, 8.3031005859375, 8.56939697265625, 8.835693359375, 9.10198974609375, 9.3682861328125, 9.63458251953125, 9.90087890625, 10.16717529296875, 10.4334716796875, 10.69976806640625, 10.966064453125, 11.23236083984375, 11.4986572265625, 11.76495361328125, 12.03125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 11.0, 25.0, 65.0, 2989.0, 973.0, 19.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.2100353240966797, -0.18362045288085938, -0.15720558166503906, -0.13079071044921875, -0.10437583923339844, -0.07796096801757812, -0.05154609680175781, -0.0251312255859375, 0.0012836456298828125, 0.027698516845703125, 0.05411338806152344, 0.08052825927734375, 0.10694313049316406, 0.13335800170898438, 0.1597728729248047, 0.186187744140625, 0.2126026153564453, 0.23901748657226562, 0.26543235778808594, 0.29184722900390625, 0.31826210021972656, 0.3446769714355469, 0.3710918426513672, 0.3975067138671875, 0.4239215850830078, 0.4503364562988281, 0.47675132751464844, 0.5031661987304688, 0.5295810699462891, 0.5559959411621094, 0.5824108123779297, 0.60882568359375, 0.6352405548095703, 0.6616554260253906, 0.6880702972412109, 0.7144851684570312, 0.7409000396728516, 0.7673149108886719, 0.7937297821044922, 0.8201446533203125, 0.8465595245361328, 0.8729743957519531, 0.8993892669677734, 0.9258041381835938, 0.9522190093994141, 0.9786338806152344, 1.0050487518310547, 1.031463623046875, 1.0578784942626953, 1.0842933654785156, 1.110708236694336, 1.1371231079101562, 1.1635379791259766, 1.1899528503417969, 1.2163677215576172, 1.2427825927734375, 1.2691974639892578, 1.2956123352050781, 1.3220272064208984, 1.3484420776367188, 1.374856948852539, 1.4012718200683594, 1.4276866912841797, 1.4541015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 47.0, 744.0, 191.0, 16.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0630295276641846, -2.7787883281707764, -2.494547128677368, -2.21030592918396, -1.9260647296905518, -1.6418235301971436, -1.3575823307037354, -1.0733411312103271, -0.789099931716919, -0.5048587322235107, -0.22061753273010254, 0.06362366676330566, 0.34786486625671387, 0.6321060657501221, 0.9163472652435303, 1.2005884647369385, 1.4848296642303467, 1.7690708637237549, 2.053312063217163, 2.3375532627105713, 2.6217944622039795, 2.9060356616973877, 3.190276861190796, 3.474518060684204, 3.7587592601776123, 4.043000221252441, 4.327241897583008, 4.611482620239258, 4.895724296569824, 5.179965019226074, 5.464206695556641, 5.748447418212891, 6.032689094543457, 6.316930294036865, 6.601171493530273, 6.885412693023682, 7.16965389251709, 7.453895092010498, 7.738136291503906, 8.022377014160156, 8.306618690490723, 8.590860366821289, 8.875101089477539, 9.159341812133789, 9.443583488464355, 9.727825164794922, 10.012065887451172, 10.296306610107422, 10.580548286437988, 10.864789962768555, 11.149030685424805, 11.433271408081055, 11.717513084411621, 12.001754760742188, 12.285995483398438, 12.570236206054688, 12.854477882385254, 13.13871955871582, 13.42296028137207, 13.70720100402832, 13.991442680358887, 14.275684356689453, 14.559925079345703, 14.844165802001953, 15.12840747833252]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 19.0, 32.0, 81.0, 83.0, 130.0, 158.0, 157.0, 136.0, 93.0, 50.0, 27.0, 16.0, 8.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.854895114898682, -4.703230857849121, -4.551567077636719, -4.399902820587158, -4.248238563537598, -4.096574783325195, -3.9449105262756348, -3.7932465076446533, -3.641582489013672, -3.4899184703826904, -3.33825421333313, -3.1865901947021484, -3.034926176071167, -2.8832621574401855, -2.731597900390625, -2.5799338817596436, -2.428269624710083, -2.2766056060791016, -2.124941349029541, -1.9732773303985596, -1.8216133117675781, -1.6699491739273071, -1.5182850360870361, -1.3666210174560547, -1.2149568796157837, -1.0632927417755127, -0.9116287231445312, -0.7599645853042603, -0.608300507068634, -0.4566364288330078, -0.3049722909927368, -0.15330827236175537, -0.001644134521484375, 0.15001995861530304, 0.30168405175209045, 0.45334815979003906, 0.6050122380256653, 0.7566763162612915, 0.9083404541015625, 1.060004472732544, 1.211668610572815, 1.363332748413086, 1.5149967670440674, 1.6666609048843384, 1.8183250427246094, 1.9699890613555908, 2.1216530799865723, 2.273317337036133, 2.4249813556671143, 2.5766453742980957, 2.7283096313476562, 2.8799736499786377, 3.031637668609619, 3.1833019256591797, 3.334965944290161, 3.4866299629211426, 3.638294219970703, 3.7899582386016846, 3.941622495651245, 4.093286514282227, 4.244950771331787, 4.3966145515441895, 4.54827880859375, 4.699942588806152, 4.851606845855713]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 15.0, 19.0, 34.0, 39.0, 49.0, 96.0, 166.0, 385.0, 919.0, 3214.0, 25121.0, 861281.0, 146256.0, 8090.0, 1691.0, 581.0, 230.0, 111.0, 70.0, 54.0, 32.0, 21.0, 15.0, 9.0, 14.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5146484375, -1.4654083251953125, -1.416168212890625, -1.3669281005859375, -1.31768798828125, -1.2684478759765625, -1.219207763671875, -1.1699676513671875, -1.1207275390625, -1.0714874267578125, -1.022247314453125, -0.9730072021484375, -0.92376708984375, -0.8745269775390625, -0.825286865234375, -0.7760467529296875, -0.726806640625, -0.6775665283203125, -0.628326416015625, -0.5790863037109375, -0.52984619140625, -0.4806060791015625, -0.431365966796875, -0.3821258544921875, -0.3328857421875, -0.2836456298828125, -0.234405517578125, -0.1851654052734375, -0.13592529296875, -0.0866851806640625, -0.037445068359375, 0.0117950439453125, 0.06103515625, 0.1102752685546875, 0.159515380859375, 0.2087554931640625, 0.25799560546875, 0.3072357177734375, 0.356475830078125, 0.4057159423828125, 0.4549560546875, 0.5041961669921875, 0.553436279296875, 0.6026763916015625, 0.65191650390625, 0.7011566162109375, 0.750396728515625, 0.7996368408203125, 0.848876953125, 0.8981170654296875, 0.947357177734375, 0.9965972900390625, 1.04583740234375, 1.0950775146484375, 1.144317626953125, 1.1935577392578125, 1.2427978515625, 1.2920379638671875, 1.341278076171875, 1.3905181884765625, 1.43975830078125, 1.4889984130859375, 1.538238525390625, 1.5874786376953125, 1.63671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 20.0, 38.0, 47.0, 106.0, 141.0, 173.0, 160.0, 137.0, 77.0, 53.0, 26.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14501953125, -0.1369171142578125, -0.128814697265625, -0.1207122802734375, -0.11260986328125, -0.1045074462890625, -0.096405029296875, -0.0883026123046875, -0.0802001953125, -0.0720977783203125, -0.063995361328125, -0.0558929443359375, -0.04779052734375, -0.0396881103515625, -0.031585693359375, -0.0234832763671875, -0.015380859375, -0.0072784423828125, 0.000823974609375, 0.0089263916015625, 0.01702880859375, 0.0251312255859375, 0.033233642578125, 0.0413360595703125, 0.0494384765625, 0.0575408935546875, 0.065643310546875, 0.0737457275390625, 0.08184814453125, 0.0899505615234375, 0.098052978515625, 0.1061553955078125, 0.1142578125, 0.1223602294921875, 0.130462646484375, 0.1385650634765625, 0.14666748046875, 0.1547698974609375, 0.162872314453125, 0.1709747314453125, 0.1790771484375, 0.1871795654296875, 0.195281982421875, 0.2033843994140625, 0.21148681640625, 0.2195892333984375, 0.227691650390625, 0.2357940673828125, 0.243896484375, 0.2519989013671875, 0.260101318359375, 0.2682037353515625, 0.27630615234375, 0.2844085693359375, 0.292510986328125, 0.3006134033203125, 0.3087158203125, 0.3168182373046875, 0.324920654296875, 0.3330230712890625, 0.34112548828125, 0.3492279052734375, 0.357330322265625, 0.3654327392578125, 0.37353515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 2.0, 9.0, 10.0, 14.0, 20.0, 14.0, 26.0, 44.0, 36.0, 80.0, 181.0, 458.0, 2095.0, 24507.0, 869860.0, 143072.0, 6547.0, 918.0, 295.0, 117.0, 75.0, 36.0, 34.0, 19.0, 17.0, 10.0, 12.0, 11.0, 7.0, 7.0, 0.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01953125, -0.9863739013671875, -0.953216552734375, -0.9200592041015625, -0.88690185546875, -0.8537445068359375, -0.820587158203125, -0.7874298095703125, -0.7542724609375, -0.7211151123046875, -0.687957763671875, -0.6548004150390625, -0.62164306640625, -0.5884857177734375, -0.555328369140625, -0.5221710205078125, -0.489013671875, -0.4558563232421875, -0.422698974609375, -0.3895416259765625, -0.35638427734375, -0.3232269287109375, -0.290069580078125, -0.2569122314453125, -0.2237548828125, -0.1905975341796875, -0.157440185546875, -0.1242828369140625, -0.09112548828125, -0.0579681396484375, -0.024810791015625, 0.0083465576171875, 0.04150390625, 0.0746612548828125, 0.107818603515625, 0.1409759521484375, 0.17413330078125, 0.2072906494140625, 0.240447998046875, 0.2736053466796875, 0.3067626953125, 0.3399200439453125, 0.373077392578125, 0.4062347412109375, 0.43939208984375, 0.4725494384765625, 0.505706787109375, 0.5388641357421875, 0.572021484375, 0.6051788330078125, 0.638336181640625, 0.6714935302734375, 0.70465087890625, 0.7378082275390625, 0.770965576171875, 0.8041229248046875, 0.8372802734375, 0.8704376220703125, 0.903594970703125, 0.9367523193359375, 0.96990966796875, 1.0030670166015625, 1.036224365234375, 1.0693817138671875, 1.1025390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 6.0, 10.0, 7.0, 11.0, 5.0, 15.0, 30.0, 25.0, 27.0, 30.0, 32.0, 33.0, 54.0, 53.0, 62.0, 65.0, 79.0, 58.0, 57.0, 62.0, 42.0, 42.0, 39.0, 32.0, 20.0, 14.0, 21.0, 19.0, 13.0, 13.0, 5.0, 4.0, 3.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.411376953125, -0.3973579406738281, -0.38333892822265625, -0.3693199157714844, -0.3553009033203125, -0.3412818908691406, -0.32726287841796875, -0.3132438659667969, -0.299224853515625, -0.2852058410644531, -0.27118682861328125, -0.2571678161621094, -0.2431488037109375, -0.22912979125976562, -0.21511077880859375, -0.20109176635742188, -0.18707275390625, -0.17305374145507812, -0.15903472900390625, -0.14501571655273438, -0.1309967041015625, -0.11697769165039062, -0.10295867919921875, -0.08893966674804688, -0.074920654296875, -0.060901641845703125, -0.04688262939453125, -0.032863616943359375, -0.0188446044921875, -0.004825592041015625, 0.00919342041015625, 0.023212432861328125, 0.0372314453125, 0.051250457763671875, 0.06526947021484375, 0.07928848266601562, 0.0933074951171875, 0.10732650756835938, 0.12134552001953125, 0.13536453247070312, 0.149383544921875, 0.16340255737304688, 0.17742156982421875, 0.19144058227539062, 0.2054595947265625, 0.21947860717773438, 0.23349761962890625, 0.24751663208007812, 0.26153564453125, 0.2755546569824219, 0.28957366943359375, 0.3035926818847656, 0.3176116943359375, 0.3316307067871094, 0.34564971923828125, 0.3596687316894531, 0.373687744140625, 0.3877067565917969, 0.40172576904296875, 0.4157447814941406, 0.4297637939453125, 0.4437828063964844, 0.45780181884765625, 0.4718208312988281, 0.48583984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 27.0, 43.0, 139.0, 324.0, 1955.0, 990145.0, 54505.0, 984.0, 253.0, 87.0, 49.0, 18.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4262847900390625, -1.371124267578125, -1.3159637451171875, -1.26080322265625, -1.2056427001953125, -1.150482177734375, -1.0953216552734375, -1.0401611328125, -0.9850006103515625, -0.929840087890625, -0.8746795654296875, -0.81951904296875, -0.7643585205078125, -0.709197998046875, -0.6540374755859375, -0.598876953125, -0.5437164306640625, -0.488555908203125, -0.4333953857421875, -0.37823486328125, -0.3230743408203125, -0.267913818359375, -0.2127532958984375, -0.1575927734375, -0.1024322509765625, -0.047271728515625, 0.0078887939453125, 0.06304931640625, 0.1182098388671875, 0.173370361328125, 0.2285308837890625, 0.28369140625, 0.3388519287109375, 0.394012451171875, 0.4491729736328125, 0.50433349609375, 0.5594940185546875, 0.614654541015625, 0.6698150634765625, 0.7249755859375, 0.7801361083984375, 0.835296630859375, 0.8904571533203125, 0.94561767578125, 1.0007781982421875, 1.055938720703125, 1.1110992431640625, 1.166259765625, 1.2214202880859375, 1.276580810546875, 1.3317413330078125, 1.38690185546875, 1.4420623779296875, 1.497222900390625, 1.5523834228515625, 1.6075439453125, 1.6627044677734375, 1.717864990234375, 1.7730255126953125, 1.82818603515625, 1.8833465576171875, 1.938507080078125, 1.9936676025390625, 2.048828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 8.0, 15.0, 14.0, 12.0, 17.0, 31.0, 29.0, 41.0, 47.0, 68.0, 86.0, 130.0, 132.0, 85.0, 70.0, 40.0, 38.0, 27.0, 21.0, 18.0, 17.0, 12.0, 10.0, 8.0, 10.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010734796524047852, -0.00010288413614034653, -9.842030704021454e-05, -9.395647794008255e-05, -8.949264883995056e-05, -8.502881973981857e-05, -8.056499063968658e-05, -7.61011615395546e-05, -7.163733243942261e-05, -6.717350333929062e-05, -6.270967423915863e-05, -5.824584513902664e-05, -5.378201603889465e-05, -4.9318186938762665e-05, -4.4854357838630676e-05, -4.039052873849869e-05, -3.59266996383667e-05, -3.146287053823471e-05, -2.6999041438102722e-05, -2.2535212337970734e-05, -1.8071383237838745e-05, -1.3607554137706757e-05, -9.143725037574768e-06, -4.6798959374427795e-06, -2.1606683731079102e-07, 4.2477622628211975e-06, 8.711591362953186e-06, 1.3175420463085175e-05, 1.7639249563217163e-05, 2.210307866334915e-05, 2.656690776348114e-05, 3.103073686361313e-05, 3.549456596374512e-05, 3.9958395063877106e-05, 4.4422224164009094e-05, 4.888605326414108e-05, 5.334988236427307e-05, 5.781371146440506e-05, 6.227754056453705e-05, 6.674136966466904e-05, 7.120519876480103e-05, 7.566902786493301e-05, 8.0132856965065e-05, 8.459668606519699e-05, 8.906051516532898e-05, 9.352434426546097e-05, 9.798817336559296e-05, 0.00010245200246572495, 0.00010691583156585693, 0.00011137966066598892, 0.00011584348976612091, 0.0001203073188662529, 0.0001247711479663849, 0.00012923497706651688, 0.00013369880616664886, 0.00013816263526678085, 0.00014262646436691284, 0.00014709029346704483, 0.00015155412256717682, 0.0001560179516673088, 0.0001604817807674408, 0.00016494560986757278, 0.00016940943896770477, 0.00017387326806783676, 0.00017833709716796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 11.0, 21.0, 37.0, 71.0, 167.0, 708.0, 3922.0, 80640.0, 951032.0, 10256.0, 1191.0, 283.0, 98.0, 49.0, 20.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92578125, -0.8951416015625, -0.864501953125, -0.8338623046875, -0.80322265625, -0.7725830078125, -0.741943359375, -0.7113037109375, -0.6806640625, -0.6500244140625, -0.619384765625, -0.5887451171875, -0.55810546875, -0.5274658203125, -0.496826171875, -0.4661865234375, -0.435546875, -0.4049072265625, -0.374267578125, -0.3436279296875, -0.31298828125, -0.2823486328125, -0.251708984375, -0.2210693359375, -0.1904296875, -0.1597900390625, -0.129150390625, -0.0985107421875, -0.06787109375, -0.0372314453125, -0.006591796875, 0.0240478515625, 0.0546875, 0.0853271484375, 0.115966796875, 0.1466064453125, 0.17724609375, 0.2078857421875, 0.238525390625, 0.2691650390625, 0.2998046875, 0.3304443359375, 0.361083984375, 0.3917236328125, 0.42236328125, 0.4530029296875, 0.483642578125, 0.5142822265625, 0.544921875, 0.5755615234375, 0.606201171875, 0.6368408203125, 0.66748046875, 0.6981201171875, 0.728759765625, 0.7593994140625, 0.7900390625, 0.8206787109375, 0.851318359375, 0.8819580078125, 0.91259765625, 0.9432373046875, 0.973876953125, 1.0045166015625, 1.03515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 6.0, 9.0, 19.0, 19.0, 33.0, 56.0, 95.0, 189.0, 243.0, 123.0, 72.0, 45.0, 26.0, 16.0, 7.0, 8.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39794921875, -0.3848075866699219, -0.37166595458984375, -0.3585243225097656, -0.3453826904296875, -0.3322410583496094, -0.31909942626953125, -0.3059577941894531, -0.292816162109375, -0.2796745300292969, -0.26653289794921875, -0.2533912658691406, -0.2402496337890625, -0.22710800170898438, -0.21396636962890625, -0.20082473754882812, -0.18768310546875, -0.17454147338867188, -0.16139984130859375, -0.14825820922851562, -0.1351165771484375, -0.12197494506835938, -0.10883331298828125, -0.09569168090820312, -0.082550048828125, -0.06940841674804688, -0.05626678466796875, -0.043125152587890625, -0.0299835205078125, -0.016841888427734375, -0.00370025634765625, 0.009441375732421875, 0.0225830078125, 0.035724639892578125, 0.04886627197265625, 0.062007904052734375, 0.0751495361328125, 0.08829116821289062, 0.10143280029296875, 0.11457443237304688, 0.127716064453125, 0.14085769653320312, 0.15399932861328125, 0.16714096069335938, 0.1802825927734375, 0.19342422485351562, 0.20656585693359375, 0.21970748901367188, 0.23284912109375, 0.24599075317382812, 0.25913238525390625, 0.2722740173339844, 0.2854156494140625, 0.2985572814941406, 0.31169891357421875, 0.3248405456542969, 0.337982177734375, 0.3511238098144531, 0.36426544189453125, 0.3774070739746094, 0.3905487060546875, 0.4036903381347656, 0.41683197021484375, 0.4299736022949219, 0.443115234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 13.0, 70.0, 694.0, 213.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.427361488342285, -5.034890174865723, -4.64241886138916, -4.2499470710754395, -3.857475757598877, -3.4650044441223145, -3.072532892227173, -2.6800613403320312, -2.2875900268554688, -1.8951185941696167, -1.5026471614837646, -1.1101757287979126, -0.7177042961120605, -0.3252328634262085, 0.06723856925964355, 0.45971012115478516, 0.8521814346313477, 1.2446528673171997, 1.6371243000030518, 2.0295958518981934, 2.422067165374756, 2.8145384788513184, 3.20701003074646, 3.5994815826416016, 3.991952896118164, 4.384424209594727, 4.776895523071289, 5.16936731338501, 5.561838626861572, 5.954309940338135, 6.3467817306518555, 6.739253044128418, 7.131723403930664, 7.524194717407227, 7.916666030883789, 8.309137344360352, 8.701608657836914, 9.094080924987793, 9.486552238464355, 9.879023551940918, 10.27149486541748, 10.663966178894043, 11.056437492370605, 11.448908805847168, 11.841381072998047, 12.23385238647461, 12.626323699951172, 13.018795013427734, 13.411266326904297, 13.80373764038086, 14.196208953857422, 14.588680267333984, 14.981151580810547, 15.373623847961426, 15.766095161437988, 16.158565521240234, 16.551036834716797, 16.94350814819336, 17.335979461669922, 17.728450775146484, 18.120922088623047, 18.51339340209961, 18.905864715576172, 19.298336029052734, 19.69080924987793]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 5.0, 15.0, 22.0, 24.0, 21.0, 23.0, 48.0, 46.0, 44.0, 61.0, 71.0, 63.0, 63.0, 57.0, 63.0, 80.0, 45.0, 48.0, 34.0, 43.0, 27.0, 28.0, 13.0, 9.0, 10.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.592923164367676, -3.4902641773223877, -3.3876051902770996, -3.2849459648132324, -3.1822869777679443, -3.0796279907226562, -2.976969003677368, -2.87431001663208, -2.771651029586792, -2.668992042541504, -2.566333055496216, -2.4636740684509277, -2.3610148429870605, -2.2583558559417725, -2.1556968688964844, -2.0530378818511963, -1.9503787755966187, -1.8477197885513306, -1.745060682296753, -1.6424016952514648, -1.5397427082061768, -1.4370837211608887, -1.334424614906311, -1.231765627861023, -1.1291065216064453, -1.0264475345611572, -0.9237884879112244, -0.8211294412612915, -0.7184704542160034, -0.6158114075660706, -0.5131523609161377, -0.4104933738708496, -0.3078343868255615, -0.20517536997795105, -0.10251633822917938, 0.00014269351959228516, 0.10280171036720276, 0.20546072721481323, 0.3081197738647461, 0.4107787609100342, 0.513437807559967, 0.6160968542098999, 0.718755841255188, 0.8214148879051208, 0.9240739345550537, 1.0267329216003418, 1.1293919086456299, 1.232050895690918, 1.3347100019454956, 1.4373689889907837, 1.5400280952453613, 1.6426870822906494, 1.7453460693359375, 1.8480050563812256, 1.9506641626358032, 2.053323268890381, 2.155982255935669, 2.258641242980957, 2.361300230026245, 2.463959217071533, 2.5666184425354004, 2.6692774295806885, 2.7719364166259766, 2.8745954036712646, 2.9772543907165527]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 7.0, 20.0, 32.0, 85.0, 245.0, 677.0, 2380.0, 12098.0, 127840.0, 3976614.0, 62554.0, 7967.0, 1967.0, 746.0, 363.0, 190.0, 113.0, 78.0, 56.0, 45.0, 40.0, 34.0, 19.0, 22.0, 14.0, 18.0, 16.0, 9.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.7260513305664062, -0.6674346923828125, -0.6088180541992188, -0.550201416015625, -0.49158477783203125, -0.4329681396484375, -0.37435150146484375, -0.31573486328125, -0.25711822509765625, -0.1985015869140625, -0.13988494873046875, -0.081268310546875, -0.02265167236328125, 0.0359649658203125, 0.09458160400390625, 0.1531982421875, 0.21181488037109375, 0.2704315185546875, 0.32904815673828125, 0.387664794921875, 0.44628143310546875, 0.5048980712890625, 0.5635147094726562, 0.62213134765625, 0.6807479858398438, 0.7393646240234375, 0.7979812622070312, 0.856597900390625, 0.9152145385742188, 0.9738311767578125, 1.0324478149414062, 1.091064453125, 1.1496810913085938, 1.2082977294921875, 1.2669143676757812, 1.325531005859375, 1.3841476440429688, 1.4427642822265625, 1.5013809204101562, 1.55999755859375, 1.6186141967773438, 1.6772308349609375, 1.7358474731445312, 1.794464111328125, 1.8530807495117188, 1.9116973876953125, 1.9703140258789062, 2.0289306640625, 2.0875473022460938, 2.1461639404296875, 2.2047805786132812, 2.263397216796875, 2.3220138549804688, 2.3806304931640625, 2.4392471313476562, 2.49786376953125, 2.5564804077148438, 2.6150970458984375, 2.6737136840820312, 2.732330322265625, 2.7909469604492188, 2.8495635986328125, 2.9081802368164062, 2.966796875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 20.0, 31.0, 56.0, 75.0, 114.0, 152.0, 167.0, 128.0, 98.0, 64.0, 49.0, 21.0, 15.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.106201171875, -0.098236083984375, -0.09027099609375, -0.082305908203125, -0.0743408203125, -0.066375732421875, -0.05841064453125, -0.050445556640625, -0.04248046875, -0.034515380859375, -0.02655029296875, -0.018585205078125, -0.0106201171875, -0.002655029296875, 0.00531005859375, 0.013275146484375, 0.021240234375, 0.029205322265625, 0.03717041015625, 0.045135498046875, 0.0531005859375, 0.061065673828125, 0.06903076171875, 0.076995849609375, 0.0849609375, 0.092926025390625, 0.10089111328125, 0.108856201171875, 0.1168212890625, 0.124786376953125, 0.13275146484375, 0.140716552734375, 0.148681640625, 0.156646728515625, 0.16461181640625, 0.172576904296875, 0.1805419921875, 0.188507080078125, 0.19647216796875, 0.204437255859375, 0.21240234375, 0.220367431640625, 0.22833251953125, 0.236297607421875, 0.2442626953125, 0.252227783203125, 0.26019287109375, 0.268157958984375, 0.276123046875, 0.284088134765625, 0.29205322265625, 0.300018310546875, 0.3079833984375, 0.315948486328125, 0.32391357421875, 0.331878662109375, 0.33984375, 0.347808837890625, 0.35577392578125, 0.363739013671875, 0.3717041015625, 0.379669189453125, 0.38763427734375, 0.395599365234375, 0.403564453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 13.0, 30.0, 87.0, 388.0, 26762.0, 4165342.0, 1220.0, 266.0, 102.0, 43.0, 18.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.345458984375, -4.05810546875, -3.770751953125, -3.4833984375, -3.196044921875, -2.90869140625, -2.621337890625, -2.333984375, -2.046630859375, -1.75927734375, -1.471923828125, -1.1845703125, -0.897216796875, -0.60986328125, -0.322509765625, -0.03515625, 0.252197265625, 0.53955078125, 0.826904296875, 1.1142578125, 1.401611328125, 1.68896484375, 1.976318359375, 2.263671875, 2.551025390625, 2.83837890625, 3.125732421875, 3.4130859375, 3.700439453125, 3.98779296875, 4.275146484375, 4.5625, 4.849853515625, 5.13720703125, 5.424560546875, 5.7119140625, 5.999267578125, 6.28662109375, 6.573974609375, 6.861328125, 7.148681640625, 7.43603515625, 7.723388671875, 8.0107421875, 8.298095703125, 8.58544921875, 8.872802734375, 9.16015625, 9.447509765625, 9.73486328125, 10.022216796875, 10.3095703125, 10.596923828125, 10.88427734375, 11.171630859375, 11.458984375, 11.746337890625, 12.03369140625, 12.321044921875, 12.6083984375, 12.895751953125, 13.18310546875, 13.470458984375, 13.7578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 6.0, 14.0, 29.0, 85.0, 1813.0, 1966.0, 108.0, 31.0, 11.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2286376953125, -0.2032299041748047, -0.17782211303710938, -0.15241432189941406, -0.12700653076171875, -0.10159873962402344, -0.07619094848632812, -0.05078315734863281, -0.0253753662109375, 3.24249267578125e-05, 0.025440216064453125, 0.05084800720214844, 0.07625579833984375, 0.10166358947753906, 0.12707138061523438, 0.1524791717529297, 0.177886962890625, 0.2032947540283203, 0.22870254516601562, 0.25411033630371094, 0.27951812744140625, 0.30492591857910156, 0.3303337097167969, 0.3557415008544922, 0.3811492919921875, 0.4065570831298828, 0.4319648742675781, 0.45737266540527344, 0.48278045654296875, 0.5081882476806641, 0.5335960388183594, 0.5590038299560547, 0.58441162109375, 0.6098194122314453, 0.6352272033691406, 0.6606349945068359, 0.6860427856445312, 0.7114505767822266, 0.7368583679199219, 0.7622661590576172, 0.7876739501953125, 0.8130817413330078, 0.8384895324707031, 0.8638973236083984, 0.8893051147460938, 0.9147129058837891, 0.9401206970214844, 0.9655284881591797, 0.990936279296875, 1.0163440704345703, 1.0417518615722656, 1.067159652709961, 1.0925674438476562, 1.1179752349853516, 1.1433830261230469, 1.1687908172607422, 1.1941986083984375, 1.2196063995361328, 1.2450141906738281, 1.2704219818115234, 1.2958297729492188, 1.321237564086914, 1.3466453552246094, 1.3720531463623047, 1.3974609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 33.0, 213.0, 606.0, 97.0, 24.0, 13.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.902418375015259, -2.721881151199341, -2.541344165802002, -2.360806941986084, -2.180269956588745, -1.9997327327728271, -1.8191956281661987, -1.6386585235595703, -1.458121418952942, -1.2775843143463135, -1.097047209739685, -0.9165100455284119, -0.7359729409217834, -0.555435836315155, -0.37489867210388184, -0.19436156749725342, -0.013824462890625, 0.1667126566171646, 0.3472497761249542, 0.527786910533905, 0.7083240151405334, 0.8888611197471619, 1.069398283958435, 1.2499353885650635, 1.430472493171692, 1.6110095977783203, 1.7915467023849487, 1.9720838069915771, 2.152621030807495, 2.333158016204834, 2.513695240020752, 2.69423246383667, 2.874769687652588, 3.055306911468506, 3.2358438968658447, 3.4163811206817627, 3.5969181060791016, 3.7774553298950195, 3.9579925537109375, 4.1385297775268555, 4.319066524505615, 4.499603748321533, 4.680140972137451, 4.860677719116211, 5.041214942932129, 5.221752166748047, 5.402289390563965, 5.582826614379883, 5.763363838195801, 5.943901062011719, 6.124438285827637, 6.3049750328063965, 6.4855122566223145, 6.666049480438232, 6.84658670425415, 7.02712345123291, 7.207660675048828, 7.388197898864746, 7.568735122680664, 7.749271869659424, 7.929809093475342, 8.110345840454102, 8.29088306427002, 8.471420288085938, 8.651957511901855]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 15.0, 13.0, 29.0, 53.0, 86.0, 78.0, 91.0, 123.0, 120.0, 96.0, 77.0, 74.0, 58.0, 30.0, 22.0, 17.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1716794967651367, -3.0620315074920654, -2.952383518218994, -2.842735528945923, -2.7330875396728516, -2.6234395503997803, -2.513791561126709, -2.4041435718536377, -2.2944955825805664, -2.184847593307495, -2.075199604034424, -1.9655516147613525, -1.8559036254882812, -1.74625563621521, -1.6366076469421387, -1.5269596576690674, -1.417311668395996, -1.3076636791229248, -1.1980156898498535, -1.0883677005767822, -0.9787197113037109, -0.8690717220306396, -0.7594237327575684, -0.6497757434844971, -0.5401277542114258, -0.4304797649383545, -0.3208317756652832, -0.21118378639221191, -0.10153579711914062, 0.008112192153930664, 0.11776018142700195, 0.22740817070007324, 0.33705615997314453, 0.4467041492462158, 0.5563521385192871, 0.6660001277923584, 0.7756481170654297, 0.885296106338501, 0.9949440956115723, 1.1045920848846436, 1.2142400741577148, 1.3238880634307861, 1.4335360527038574, 1.5431840419769287, 1.65283203125, 1.7624800205230713, 1.8721280097961426, 1.9817759990692139, 2.091423988342285, 2.2010719776153564, 2.3107199668884277, 2.420367956161499, 2.5300159454345703, 2.6396639347076416, 2.749311923980713, 2.858959913253784, 2.9686079025268555, 3.0782558917999268, 3.187903881072998, 3.2975518703460693, 3.4071998596191406, 3.516847848892212, 3.626495838165283, 3.7361438274383545, 3.845791816711426]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 6.0, 7.0, 9.0, 15.0, 12.0, 38.0, 34.0, 51.0, 62.0, 88.0, 130.0, 184.0, 277.0, 434.0, 891.0, 2009.0, 5910.0, 22237.0, 116313.0, 689084.0, 168719.0, 29621.0, 7484.0, 2393.0, 1062.0, 488.0, 305.0, 199.0, 121.0, 103.0, 66.0, 47.0, 43.0, 28.0, 21.0, 15.0, 12.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.7496871948242188, -0.7225189208984375, -0.6953506469726562, -0.668182373046875, -0.6410140991210938, -0.6138458251953125, -0.5866775512695312, -0.55950927734375, -0.5323410034179688, -0.5051727294921875, -0.47800445556640625, -0.450836181640625, -0.42366790771484375, -0.3964996337890625, -0.36933135986328125, -0.3421630859375, -0.31499481201171875, -0.2878265380859375, -0.26065826416015625, -0.233489990234375, -0.20632171630859375, -0.1791534423828125, -0.15198516845703125, -0.12481689453125, -0.09764862060546875, -0.0704803466796875, -0.04331207275390625, -0.016143798828125, 0.01102447509765625, 0.0381927490234375, 0.06536102294921875, 0.092529296875, 0.11969757080078125, 0.1468658447265625, 0.17403411865234375, 0.201202392578125, 0.22837066650390625, 0.2555389404296875, 0.28270721435546875, 0.30987548828125, 0.33704376220703125, 0.3642120361328125, 0.39138031005859375, 0.418548583984375, 0.44571685791015625, 0.4728851318359375, 0.5000534057617188, 0.5272216796875, 0.5543899536132812, 0.5815582275390625, 0.6087265014648438, 0.635894775390625, 0.6630630493164062, 0.6902313232421875, 0.7173995971679688, 0.74456787109375, 0.7717361450195312, 0.7989044189453125, 0.8260726928710938, 0.853240966796875, 0.8804092407226562, 0.9075775146484375, 0.9347457885742188, 0.9619140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 7.0, 10.0, 18.0, 31.0, 46.0, 66.0, 98.0, 101.0, 95.0, 131.0, 106.0, 74.0, 65.0, 60.0, 32.0, 24.0, 19.0, 9.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2032470703125, -0.1940937042236328, -0.18494033813476562, -0.17578697204589844, -0.16663360595703125, -0.15748023986816406, -0.14832687377929688, -0.1391735076904297, -0.1300201416015625, -0.12086677551269531, -0.11171340942382812, -0.10256004333496094, -0.09340667724609375, -0.08425331115722656, -0.07509994506835938, -0.06594657897949219, -0.056793212890625, -0.04763984680175781, -0.038486480712890625, -0.029333114624023438, -0.02017974853515625, -0.011026382446289062, -0.001873016357421875, 0.0072803497314453125, 0.0164337158203125, 0.025587081909179688, 0.034740447998046875, 0.04389381408691406, 0.05304718017578125, 0.06220054626464844, 0.07135391235351562, 0.08050727844238281, 0.08966064453125, 0.09881401062011719, 0.10796737670898438, 0.11712074279785156, 0.12627410888671875, 0.13542747497558594, 0.14458084106445312, 0.1537342071533203, 0.1628875732421875, 0.1720409393310547, 0.18119430541992188, 0.19034767150878906, 0.19950103759765625, 0.20865440368652344, 0.21780776977539062, 0.2269611358642578, 0.236114501953125, 0.2452678680419922, 0.2544212341308594, 0.26357460021972656, 0.27272796630859375, 0.28188133239746094, 0.2910346984863281, 0.3001880645751953, 0.3093414306640625, 0.3184947967529297, 0.3276481628417969, 0.33680152893066406, 0.34595489501953125, 0.35510826110839844, 0.3642616271972656, 0.3734149932861328, 0.382568359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 5.0, 18.0, 14.0, 15.0, 41.0, 36.0, 63.0, 99.0, 202.0, 458.0, 1292.0, 4378.0, 22436.0, 227034.0, 722859.0, 57277.0, 8815.0, 2136.0, 687.0, 302.0, 141.0, 61.0, 40.0, 31.0, 32.0, 18.0, 16.0, 14.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9912109375, -0.9638519287109375, -0.936492919921875, -0.9091339111328125, -0.88177490234375, -0.8544158935546875, -0.827056884765625, -0.7996978759765625, -0.7723388671875, -0.7449798583984375, -0.717620849609375, -0.6902618408203125, -0.66290283203125, -0.6355438232421875, -0.608184814453125, -0.5808258056640625, -0.553466796875, -0.5261077880859375, -0.498748779296875, -0.4713897705078125, -0.44403076171875, -0.4166717529296875, -0.389312744140625, -0.3619537353515625, -0.3345947265625, -0.3072357177734375, -0.279876708984375, -0.2525177001953125, -0.22515869140625, -0.1977996826171875, -0.170440673828125, -0.1430816650390625, -0.11572265625, -0.0883636474609375, -0.061004638671875, -0.0336456298828125, -0.00628662109375, 0.0210723876953125, 0.048431396484375, 0.0757904052734375, 0.1031494140625, 0.1305084228515625, 0.157867431640625, 0.1852264404296875, 0.21258544921875, 0.2399444580078125, 0.267303466796875, 0.2946624755859375, 0.322021484375, 0.3493804931640625, 0.376739501953125, 0.4040985107421875, 0.43145751953125, 0.4588165283203125, 0.486175537109375, 0.5135345458984375, 0.5408935546875, 0.5682525634765625, 0.595611572265625, 0.6229705810546875, 0.65032958984375, 0.6776885986328125, 0.705047607421875, 0.7324066162109375, 0.759765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 4.0, 5.0, 6.0, 9.0, 14.0, 11.0, 16.0, 23.0, 18.0, 29.0, 30.0, 32.0, 57.0, 58.0, 54.0, 59.0, 50.0, 66.0, 49.0, 63.0, 49.0, 49.0, 34.0, 45.0, 30.0, 24.0, 17.0, 25.0, 18.0, 12.0, 16.0, 5.0, 8.0, 2.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.73486328125, -0.7141799926757812, -0.6934967041015625, -0.6728134155273438, -0.652130126953125, -0.6314468383789062, -0.6107635498046875, -0.5900802612304688, -0.56939697265625, -0.5487136840820312, -0.5280303955078125, -0.5073471069335938, -0.486663818359375, -0.46598052978515625, -0.4452972412109375, -0.42461395263671875, -0.4039306640625, -0.38324737548828125, -0.3625640869140625, -0.34188079833984375, -0.321197509765625, -0.30051422119140625, -0.2798309326171875, -0.25914764404296875, -0.23846435546875, -0.21778106689453125, -0.1970977783203125, -0.17641448974609375, -0.155731201171875, -0.13504791259765625, -0.1143646240234375, -0.09368133544921875, -0.072998046875, -0.05231475830078125, -0.0316314697265625, -0.01094818115234375, 0.009735107421875, 0.03041839599609375, 0.0511016845703125, 0.07178497314453125, 0.09246826171875, 0.11315155029296875, 0.1338348388671875, 0.15451812744140625, 0.175201416015625, 0.19588470458984375, 0.2165679931640625, 0.23725128173828125, 0.2579345703125, 0.27861785888671875, 0.2993011474609375, 0.31998443603515625, 0.340667724609375, 0.36135101318359375, 0.3820343017578125, 0.40271759033203125, 0.42340087890625, 0.44408416748046875, 0.4647674560546875, 0.48545074462890625, 0.506134033203125, 0.5268173217773438, 0.5475006103515625, 0.5681838989257812, 0.5888671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 9.0, 5.0, 7.0, 13.0, 15.0, 22.0, 29.0, 46.0, 50.0, 107.0, 229.0, 518.0, 1654.0, 7084.0, 222754.0, 799662.0, 12656.0, 2361.0, 718.0, 277.0, 124.0, 73.0, 37.0, 31.0, 11.0, 16.0, 12.0, 4.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.419921875, -0.40550994873046875, -0.3910980224609375, -0.37668609619140625, -0.362274169921875, -0.34786224365234375, -0.3334503173828125, -0.31903839111328125, -0.30462646484375, -0.29021453857421875, -0.2758026123046875, -0.26139068603515625, -0.246978759765625, -0.23256683349609375, -0.2181549072265625, -0.20374298095703125, -0.1893310546875, -0.17491912841796875, -0.1605072021484375, -0.14609527587890625, -0.131683349609375, -0.11727142333984375, -0.1028594970703125, -0.08844757080078125, -0.07403564453125, -0.05962371826171875, -0.0452117919921875, -0.03079986572265625, -0.016387939453125, -0.00197601318359375, 0.0124359130859375, 0.02684783935546875, 0.041259765625, 0.05567169189453125, 0.0700836181640625, 0.08449554443359375, 0.098907470703125, 0.11331939697265625, 0.1277313232421875, 0.14214324951171875, 0.15655517578125, 0.17096710205078125, 0.1853790283203125, 0.19979095458984375, 0.214202880859375, 0.22861480712890625, 0.2430267333984375, 0.25743865966796875, 0.2718505859375, 0.28626251220703125, 0.3006744384765625, 0.31508636474609375, 0.329498291015625, 0.34391021728515625, 0.3583221435546875, 0.37273406982421875, 0.38714599609375, 0.40155792236328125, 0.4159698486328125, 0.43038177490234375, 0.444793701171875, 0.45920562744140625, 0.4736175537109375, 0.48802947998046875, 0.50244140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 10.0, 12.0, 16.0, 27.0, 34.0, 36.0, 52.0, 51.0, 94.0, 100.0, 125.0, 79.0, 82.0, 71.0, 32.0, 38.0, 27.0, 20.0, 18.0, 19.0, 11.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.422136306762695e-05, -8.14441591501236e-05, -7.866695523262024e-05, -7.588975131511688e-05, -7.311254739761353e-05, -7.033534348011017e-05, -6.755813956260681e-05, -6.478093564510345e-05, -6.20037317276001e-05, -5.922652781009674e-05, -5.6449323892593384e-05, -5.367211997509003e-05, -5.089491605758667e-05, -4.811771214008331e-05, -4.5340508222579956e-05, -4.25633043050766e-05, -3.978610038757324e-05, -3.7008896470069885e-05, -3.423169255256653e-05, -3.145448863506317e-05, -2.8677284717559814e-05, -2.5900080800056458e-05, -2.31228768825531e-05, -2.0345672965049744e-05, -1.7568469047546387e-05, -1.479126513004303e-05, -1.2014061212539673e-05, -9.236857295036316e-06, -6.459653377532959e-06, -3.682449460029602e-06, -9.052455425262451e-07, 1.8719583749771118e-06, 4.649162292480469e-06, 7.426366209983826e-06, 1.0203570127487183e-05, 1.298077404499054e-05, 1.5757977962493896e-05, 1.8535181879997253e-05, 2.131238579750061e-05, 2.4089589715003967e-05, 2.6866793632507324e-05, 2.964399755001068e-05, 3.242120146751404e-05, 3.5198405385017395e-05, 3.797560930252075e-05, 4.075281322002411e-05, 4.3530017137527466e-05, 4.630722105503082e-05, 4.908442497253418e-05, 5.186162889003754e-05, 5.4638832807540894e-05, 5.741603672504425e-05, 6.019324064254761e-05, 6.297044456005096e-05, 6.574764847755432e-05, 6.852485239505768e-05, 7.130205631256104e-05, 7.407926023006439e-05, 7.685646414756775e-05, 7.96336680650711e-05, 8.241087198257446e-05, 8.518807590007782e-05, 8.796527981758118e-05, 9.074248373508453e-05, 9.351968765258789e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 11.0, 10.0, 13.0, 10.0, 12.0, 33.0, 55.0, 70.0, 168.0, 299.0, 757.0, 2087.0, 7689.0, 94163.0, 901679.0, 33868.0, 5038.0, 1449.0, 572.0, 220.0, 115.0, 76.0, 49.0, 32.0, 16.0, 16.0, 11.0, 7.0, 8.0, 1.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2509269714355469, -0.24062347412109375, -0.23031997680664062, -0.2200164794921875, -0.20971298217773438, -0.19940948486328125, -0.18910598754882812, -0.178802490234375, -0.16849899291992188, -0.15819549560546875, -0.14789199829101562, -0.1375885009765625, -0.12728500366210938, -0.11698150634765625, -0.10667800903320312, -0.09637451171875, -0.08607101440429688, -0.07576751708984375, -0.06546401977539062, -0.0551605224609375, -0.044857025146484375, -0.03455352783203125, -0.024250030517578125, -0.013946533203125, -0.003643035888671875, 0.00666046142578125, 0.016963958740234375, 0.0272674560546875, 0.037570953369140625, 0.04787445068359375, 0.058177947998046875, 0.0684814453125, 0.07878494262695312, 0.08908843994140625, 0.09939193725585938, 0.1096954345703125, 0.11999893188476562, 0.13030242919921875, 0.14060592651367188, 0.150909423828125, 0.16121292114257812, 0.17151641845703125, 0.18181991577148438, 0.1921234130859375, 0.20242691040039062, 0.21273040771484375, 0.22303390502929688, 0.23333740234375, 0.24364089965820312, 0.25394439697265625, 0.2642478942871094, 0.2745513916015625, 0.2848548889160156, 0.29515838623046875, 0.3054618835449219, 0.315765380859375, 0.3260688781738281, 0.33637237548828125, 0.3466758728027344, 0.3569793701171875, 0.3672828674316406, 0.37758636474609375, 0.3878898620605469, 0.398193359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 9.0, 5.0, 17.0, 47.0, 58.0, 136.0, 163.0, 189.0, 138.0, 87.0, 49.0, 29.0, 17.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.197998046875, -0.19017410278320312, -0.18235015869140625, -0.17452621459960938, -0.1667022705078125, -0.15887832641601562, -0.15105438232421875, -0.14323043823242188, -0.135406494140625, -0.12758255004882812, -0.11975860595703125, -0.11193466186523438, -0.1041107177734375, -0.09628677368164062, -0.08846282958984375, -0.08063888549804688, -0.07281494140625, -0.06499099731445312, -0.05716705322265625, -0.049343109130859375, -0.0415191650390625, -0.033695220947265625, -0.02587127685546875, -0.018047332763671875, -0.010223388671875, -0.002399444580078125, 0.00542449951171875, 0.013248443603515625, 0.0210723876953125, 0.028896331787109375, 0.03672027587890625, 0.044544219970703125, 0.0523681640625, 0.060192108154296875, 0.06801605224609375, 0.07583999633789062, 0.0836639404296875, 0.09148788452148438, 0.09931182861328125, 0.10713577270507812, 0.114959716796875, 0.12278366088867188, 0.13060760498046875, 0.13843154907226562, 0.1462554931640625, 0.15407943725585938, 0.16190338134765625, 0.16972732543945312, 0.17755126953125, 0.18537521362304688, 0.19319915771484375, 0.20102310180664062, 0.2088470458984375, 0.21667098999023438, 0.22449493408203125, 0.23231887817382812, 0.240142822265625, 0.24796676635742188, 0.25579071044921875, 0.2636146545410156, 0.2714385986328125, 0.2792625427246094, 0.28708648681640625, 0.2949104309082031, 0.302734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 19.0, 44.0, 101.0, 389.0, 314.0, 87.0, 27.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.50838565826416, -3.287754535675049, -3.0671234130859375, -2.846492290496826, -2.6258609294891357, -2.4052298069000244, -2.184598684310913, -1.9639674425125122, -1.7433363199234009, -1.5227051973342896, -1.3020739555358887, -1.0814428329467773, -0.8608116507530212, -0.6401804685592651, -0.4195493459701538, -0.19891810417175293, 0.0217130184173584, 0.2423441857099533, 0.4629753530025482, 0.6836065053939819, 0.904237687587738, 1.1248688697814941, 1.3454999923706055, 1.5661312341690063, 1.7867623567581177, 2.0073935985565186, 2.22802472114563, 2.448655843734741, 2.6692869663238525, 2.889918327331543, 3.1105494499206543, 3.3311805725097656, 3.551811695098877, 3.7724428176879883, 3.9930739402770996, 4.213705062866211, 4.434336185455322, 4.654967308044434, 4.875598907470703, 5.0962300300598145, 5.316861152648926, 5.537492275238037, 5.758123397827148, 5.97875452041626, 6.199385643005371, 6.420017242431641, 6.640647888183594, 6.861279487609863, 7.081910133361816, 7.302541255950928, 7.523172378540039, 7.74380350112915, 7.964434623718262, 8.185066223144531, 8.405696868896484, 8.626328468322754, 8.846960067749023, 9.067591667175293, 9.288222312927246, 9.508853912353516, 9.729484558105469, 9.950116157531738, 10.170746803283691, 10.391378402709961, 10.612009048461914]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 6.0, 5.0, 8.0, 12.0, 17.0, 27.0, 17.0, 22.0, 31.0, 44.0, 48.0, 41.0, 39.0, 63.0, 52.0, 77.0, 60.0, 53.0, 40.0, 54.0, 39.0, 35.0, 36.0, 33.0, 30.0, 17.0, 23.0, 17.0, 12.0, 5.0, 7.0, 2.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154299259185791, -3.0381417274475098, -2.9219841957092285, -2.8058266639709473, -2.689669370651245, -2.573511838912964, -2.4573543071746826, -2.3411967754364014, -2.225039482116699, -2.108881950378418, -1.9927245378494263, -1.876567006111145, -1.7604095935821533, -1.644252061843872, -1.5280945301055908, -1.4119369983673096, -1.2957794666290283, -1.179621934890747, -1.0634645223617554, -0.9473069906234741, -0.8311495184898376, -0.7149920463562012, -0.5988345146179199, -0.48267704248428345, -0.366519570350647, -0.2503620982170105, -0.13420459628105164, -0.018047094345092773, 0.0981103777885437, 0.21426784992218018, 0.3304253816604614, 0.4465828537940979, 0.5627403259277344, 0.6788977980613708, 0.7950552701950073, 0.9112128019332886, 1.0273702144622803, 1.1435277462005615, 1.2596852779388428, 1.375842809677124, 1.4920002222061157, 1.608157753944397, 1.7243151664733887, 1.84047269821167, 1.9566302299499512, 2.0727877616882324, 2.1889452934265137, 2.305102586746216, 2.421260118484497, 2.5374176502227783, 2.6535751819610596, 2.7697324752807617, 2.885890007019043, 3.002047538757324, 3.1182050704956055, 3.2343626022338867, 3.350520133972168, 3.466677665710449, 3.5828351974487305, 3.6989927291870117, 3.815150022506714, 3.931307554244995, 4.0474653244018555, 4.1636223793029785, 4.27977991104126]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 16.0, 20.0, 27.0, 76.0, 99.0, 233.0, 451.0, 1037.0, 2763.0, 9036.0, 46922.0, 3171092.0, 913869.0, 35494.0, 7764.0, 2547.0, 1130.0, 584.0, 330.0, 230.0, 137.0, 110.0, 70.0, 62.0, 50.0, 29.0, 15.0, 24.0, 8.0, 9.0, 11.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6298370361328125, -0.596588134765625, -0.5633392333984375, -0.53009033203125, -0.4968414306640625, -0.463592529296875, -0.4303436279296875, -0.3970947265625, -0.3638458251953125, -0.330596923828125, -0.2973480224609375, -0.26409912109375, -0.2308502197265625, -0.197601318359375, -0.1643524169921875, -0.131103515625, -0.0978546142578125, -0.064605712890625, -0.0313568115234375, 0.00189208984375, 0.0351409912109375, 0.068389892578125, 0.1016387939453125, 0.1348876953125, 0.1681365966796875, 0.201385498046875, 0.2346343994140625, 0.26788330078125, 0.3011322021484375, 0.334381103515625, 0.3676300048828125, 0.40087890625, 0.4341278076171875, 0.467376708984375, 0.5006256103515625, 0.53387451171875, 0.5671234130859375, 0.600372314453125, 0.6336212158203125, 0.6668701171875, 0.7001190185546875, 0.733367919921875, 0.7666168212890625, 0.79986572265625, 0.8331146240234375, 0.866363525390625, 0.8996124267578125, 0.932861328125, 0.9661102294921875, 0.999359130859375, 1.0326080322265625, 1.06585693359375, 1.0991058349609375, 1.132354736328125, 1.1656036376953125, 1.1988525390625, 1.2321014404296875, 1.265350341796875, 1.2985992431640625, 1.33184814453125, 1.3650970458984375, 1.398345947265625, 1.4315948486328125, 1.46484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 13.0, 16.0, 24.0, 48.0, 57.0, 73.0, 83.0, 87.0, 100.0, 110.0, 91.0, 74.0, 68.0, 52.0, 42.0, 21.0, 11.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.15662193298339844, -0.14783859252929688, -0.1390552520751953, -0.13027191162109375, -0.12148857116699219, -0.11270523071289062, -0.10392189025878906, -0.0951385498046875, -0.08635520935058594, -0.07757186889648438, -0.06878852844238281, -0.06000518798828125, -0.05122184753417969, -0.042438507080078125, -0.03365516662597656, -0.024871826171875, -0.016088485717773438, -0.007305145263671875, 0.0014781951904296875, 0.01026153564453125, 0.019044876098632812, 0.027828216552734375, 0.03661155700683594, 0.0453948974609375, 0.05417823791503906, 0.06296157836914062, 0.07174491882324219, 0.08052825927734375, 0.08931159973144531, 0.09809494018554688, 0.10687828063964844, 0.11566162109375, 0.12444496154785156, 0.13322830200195312, 0.1420116424560547, 0.15079498291015625, 0.1595783233642578, 0.16836166381835938, 0.17714500427246094, 0.1859283447265625, 0.19471168518066406, 0.20349502563476562, 0.2122783660888672, 0.22106170654296875, 0.2298450469970703, 0.23862838745117188, 0.24741172790527344, 0.256195068359375, 0.26497840881347656, 0.2737617492675781, 0.2825450897216797, 0.29132843017578125, 0.3001117706298828, 0.3088951110839844, 0.31767845153808594, 0.3264617919921875, 0.33524513244628906, 0.3440284729003906, 0.3528118133544922, 0.36159515380859375, 0.3703784942626953, 0.3791618347167969, 0.38794517517089844, 0.396728515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 11.0, 27.0, 45.0, 98.0, 170.0, 403.0, 1056.0, 24473.0, 4162642.0, 4204.0, 627.0, 272.0, 111.0, 64.0, 35.0, 24.0, 9.0, 10.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.2967529296875, -2.212646484375, -2.1285400390625, -2.04443359375, -1.9603271484375, -1.876220703125, -1.7921142578125, -1.7080078125, -1.6239013671875, -1.539794921875, -1.4556884765625, -1.37158203125, -1.2874755859375, -1.203369140625, -1.1192626953125, -1.03515625, -0.9510498046875, -0.866943359375, -0.7828369140625, -0.69873046875, -0.6146240234375, -0.530517578125, -0.4464111328125, -0.3623046875, -0.2781982421875, -0.194091796875, -0.1099853515625, -0.02587890625, 0.0582275390625, 0.142333984375, 0.2264404296875, 0.310546875, 0.3946533203125, 0.478759765625, 0.5628662109375, 0.64697265625, 0.7310791015625, 0.815185546875, 0.8992919921875, 0.9833984375, 1.0675048828125, 1.151611328125, 1.2357177734375, 1.31982421875, 1.4039306640625, 1.488037109375, 1.5721435546875, 1.65625, 1.7403564453125, 1.824462890625, 1.9085693359375, 1.99267578125, 2.0767822265625, 2.160888671875, 2.2449951171875, 2.3291015625, 2.4132080078125, 2.497314453125, 2.5814208984375, 2.66552734375, 2.7496337890625, 2.833740234375, 2.9178466796875, 3.001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 14.0, 48.0, 134.0, 2575.0, 1114.0, 130.0, 40.0, 12.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4813652038574219, -0.46346282958984375, -0.4455604553222656, -0.4276580810546875, -0.4097557067871094, -0.39185333251953125, -0.3739509582519531, -0.356048583984375, -0.3381462097167969, -0.32024383544921875, -0.3023414611816406, -0.2844390869140625, -0.2665367126464844, -0.24863433837890625, -0.23073196411132812, -0.21282958984375, -0.19492721557617188, -0.17702484130859375, -0.15912246704101562, -0.1412200927734375, -0.12331771850585938, -0.10541534423828125, -0.08751296997070312, -0.069610595703125, -0.051708221435546875, -0.03380584716796875, -0.015903472900390625, 0.0019989013671875, 0.019901275634765625, 0.03780364990234375, 0.055706024169921875, 0.0736083984375, 0.09151077270507812, 0.10941314697265625, 0.12731552124023438, 0.1452178955078125, 0.16312026977539062, 0.18102264404296875, 0.19892501831054688, 0.216827392578125, 0.23472976684570312, 0.25263214111328125, 0.2705345153808594, 0.2884368896484375, 0.3063392639160156, 0.32424163818359375, 0.3421440124511719, 0.36004638671875, 0.3779487609863281, 0.39585113525390625, 0.4137535095214844, 0.4316558837890625, 0.4495582580566406, 0.46746063232421875, 0.4853630065917969, 0.503265380859375, 0.5211677551269531, 0.5390701293945312, 0.5569725036621094, 0.5748748779296875, 0.5927772521972656, 0.6106796264648438, 0.6285820007324219, 0.646484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 47.0, 275.0, 550.0, 89.0, 16.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2722790241241455, -2.181706428527832, -2.0911340713500977, -2.0005617141723633, -1.9099891185760498, -1.8194166421890259, -1.728844165802002, -1.638271689414978, -1.547699213027954, -1.4571267366409302, -1.3665542602539062, -1.2759817838668823, -1.1854093074798584, -1.0948368310928345, -1.0042643547058105, -0.9136918783187866, -0.8231194019317627, -0.7325469255447388, -0.6419744491577148, -0.5514019727706909, -0.460829496383667, -0.37025701999664307, -0.27968454360961914, -0.18911206722259521, -0.09853959083557129, -0.007967114448547363, 0.08260536193847656, 0.1731778383255005, 0.2637503147125244, 0.35432279109954834, 0.44489526748657227, 0.5354677438735962, 0.6260404586791992, 0.7166129350662231, 0.8071854114532471, 0.897757887840271, 0.9883303642272949, 1.0789028406143188, 1.1694753170013428, 1.2600477933883667, 1.3506202697753906, 1.4411927461624146, 1.5317652225494385, 1.6223376989364624, 1.7129101753234863, 1.8034826517105103, 1.8940551280975342, 1.984627604484558, 2.075200080871582, 2.1657724380493164, 2.25634503364563, 2.3469176292419434, 2.4374899864196777, 2.528062343597412, 2.6186349391937256, 2.709207534790039, 2.7997798919677734, 2.890352249145508, 2.9809248447418213, 3.0714974403381348, 3.162069797515869, 3.2526421546936035, 3.343214750289917, 3.4337873458862305, 3.524359703063965]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 10.0, 12.0, 17.0, 23.0, 23.0, 24.0, 27.0, 27.0, 22.0, 56.0, 36.0, 52.0, 46.0, 55.0, 35.0, 66.0, 59.0, 48.0, 36.0, 45.0, 41.0, 36.0, 32.0, 24.0, 28.0, 24.0, 12.0, 20.0, 12.0, 8.0, 6.0, 3.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.660089373588562, -0.6382043957710266, -0.616319477558136, -0.5944344997406006, -0.57254958152771, -0.5506646037101746, -0.5287796258926392, -0.5068947076797485, -0.48500972986221313, -0.4631247818470001, -0.4412398338317871, -0.4193548560142517, -0.3974699079990387, -0.3755849599838257, -0.3536999821662903, -0.33181503415107727, -0.30993008613586426, -0.28804513812065125, -0.26616019010543823, -0.24427521228790283, -0.22239026427268982, -0.2005053162574768, -0.1786203533411026, -0.1567353904247284, -0.13485044240951538, -0.11296548694372177, -0.09108053147792816, -0.06919557601213455, -0.04731062054634094, -0.025425665080547333, -0.003540709614753723, 0.018344253301620483, 0.04022914171218872, 0.06211409717798233, 0.08399905264377594, 0.10588400810956955, 0.12776896357536316, 0.14965391159057617, 0.17153887450695038, 0.19342383742332458, 0.2153087854385376, 0.2371937334537506, 0.2590786814689636, 0.280963659286499, 0.30284860730171204, 0.32473355531692505, 0.34661853313446045, 0.36850348114967346, 0.3903884291648865, 0.4122733771800995, 0.4341583251953125, 0.4560433030128479, 0.4779282510280609, 0.4998131990432739, 0.5216981768608093, 0.5435831546783447, 0.5654680728912354, 0.5873530507087708, 0.6092379689216614, 0.6311229467391968, 0.6530078649520874, 0.6748928427696228, 0.6967778205871582, 0.7186627388000488, 0.7405477166175842]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 15.0, 16.0, 24.0, 27.0, 61.0, 107.0, 162.0, 264.0, 559.0, 1236.0, 3882.0, 19336.0, 189365.0, 750348.0, 69361.0, 9631.0, 2370.0, 843.0, 380.0, 230.0, 102.0, 70.0, 54.0, 30.0, 31.0, 14.0, 9.0, 9.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2564010620117188, -1.2208099365234375, -1.1852188110351562, -1.149627685546875, -1.1140365600585938, -1.0784454345703125, -1.0428543090820312, -1.00726318359375, -0.9716720581054688, -0.9360809326171875, -0.9004898071289062, -0.864898681640625, -0.8293075561523438, -0.7937164306640625, -0.7581253051757812, -0.7225341796875, -0.6869430541992188, -0.6513519287109375, -0.6157608032226562, -0.580169677734375, -0.5445785522460938, -0.5089874267578125, -0.47339630126953125, -0.43780517578125, -0.40221405029296875, -0.3666229248046875, -0.33103179931640625, -0.295440673828125, -0.25984954833984375, -0.2242584228515625, -0.18866729736328125, -0.153076171875, -0.11748504638671875, -0.0818939208984375, -0.04630279541015625, -0.010711669921875, 0.02487945556640625, 0.0604705810546875, 0.09606170654296875, 0.13165283203125, 0.16724395751953125, 0.2028350830078125, 0.23842620849609375, 0.274017333984375, 0.30960845947265625, 0.3451995849609375, 0.38079071044921875, 0.4163818359375, 0.45197296142578125, 0.4875640869140625, 0.5231552124023438, 0.558746337890625, 0.5943374633789062, 0.6299285888671875, 0.6655197143554688, 0.70111083984375, 0.7367019653320312, 0.7722930908203125, 0.8078842163085938, 0.843475341796875, 0.8790664672851562, 0.9146575927734375, 0.9502487182617188, 0.98583984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 13.0, 18.0, 38.0, 37.0, 63.0, 65.0, 65.0, 100.0, 76.0, 94.0, 98.0, 64.0, 66.0, 52.0, 53.0, 36.0, 15.0, 12.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1666259765625, -0.15830039978027344, -0.14997482299804688, -0.1416492462158203, -0.13332366943359375, -0.12499809265136719, -0.11667251586914062, -0.10834693908691406, -0.1000213623046875, -0.09169578552246094, -0.08337020874023438, -0.07504463195800781, -0.06671905517578125, -0.05839347839355469, -0.050067901611328125, -0.04174232482910156, -0.033416748046875, -0.025091171264648438, -0.016765594482421875, -0.008440017700195312, -0.00011444091796875, 0.008211135864257812, 0.016536712646484375, 0.024862289428710938, 0.0331878662109375, 0.04151344299316406, 0.049839019775390625, 0.05816459655761719, 0.06649017333984375, 0.07481575012207031, 0.08314132690429688, 0.09146690368652344, 0.09979248046875, 0.10811805725097656, 0.11644363403320312, 0.12476921081542969, 0.13309478759765625, 0.1414203643798828, 0.14974594116210938, 0.15807151794433594, 0.1663970947265625, 0.17472267150878906, 0.18304824829101562, 0.1913738250732422, 0.19969940185546875, 0.2080249786376953, 0.21635055541992188, 0.22467613220214844, 0.233001708984375, 0.24132728576660156, 0.24965286254882812, 0.2579784393310547, 0.26630401611328125, 0.2746295928955078, 0.2829551696777344, 0.29128074645996094, 0.2996063232421875, 0.30793190002441406, 0.3162574768066406, 0.3245830535888672, 0.33290863037109375, 0.3412342071533203, 0.3495597839355469, 0.35788536071777344, 0.3662109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 6.0, 5.0, 11.0, 15.0, 18.0, 29.0, 47.0, 65.0, 125.0, 286.0, 533.0, 1388.0, 4755.0, 25302.0, 318882.0, 646803.0, 40524.0, 6608.0, 1767.0, 635.0, 286.0, 164.0, 97.0, 72.0, 42.0, 20.0, 16.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81005859375, -0.7764663696289062, -0.7428741455078125, -0.7092819213867188, -0.675689697265625, -0.6420974731445312, -0.6085052490234375, -0.5749130249023438, -0.54132080078125, -0.5077285766601562, -0.4741363525390625, -0.44054412841796875, -0.406951904296875, -0.37335968017578125, -0.3397674560546875, -0.30617523193359375, -0.2725830078125, -0.23899078369140625, -0.2053985595703125, -0.17180633544921875, -0.138214111328125, -0.10462188720703125, -0.0710296630859375, -0.03743743896484375, -0.00384521484375, 0.02974700927734375, 0.0633392333984375, 0.09693145751953125, 0.130523681640625, 0.16411590576171875, 0.1977081298828125, 0.23130035400390625, 0.264892578125, 0.29848480224609375, 0.3320770263671875, 0.36566925048828125, 0.399261474609375, 0.43285369873046875, 0.4664459228515625, 0.5000381469726562, 0.53363037109375, 0.5672225952148438, 0.6008148193359375, 0.6344070434570312, 0.667999267578125, 0.7015914916992188, 0.7351837158203125, 0.7687759399414062, 0.8023681640625, 0.8359603881835938, 0.8695526123046875, 0.9031448364257812, 0.936737060546875, 0.9703292846679688, 1.0039215087890625, 1.0375137329101562, 1.07110595703125, 1.1046981811523438, 1.1382904052734375, 1.1718826293945312, 1.205474853515625, 1.2390670776367188, 1.2726593017578125, 1.3062515258789062, 1.33984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 19.0, 21.0, 24.0, 32.0, 43.0, 47.0, 55.0, 63.0, 78.0, 88.0, 76.0, 60.0, 66.0, 66.0, 51.0, 41.0, 50.0, 24.0, 11.0, 10.0, 12.0, 14.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7705078125, -0.738433837890625, -0.70635986328125, -0.674285888671875, -0.6422119140625, -0.610137939453125, -0.57806396484375, -0.545989990234375, -0.513916015625, -0.481842041015625, -0.44976806640625, -0.417694091796875, -0.3856201171875, -0.353546142578125, -0.32147216796875, -0.289398193359375, -0.25732421875, -0.225250244140625, -0.19317626953125, -0.161102294921875, -0.1290283203125, -0.096954345703125, -0.06488037109375, -0.032806396484375, -0.000732421875, 0.031341552734375, 0.06341552734375, 0.095489501953125, 0.1275634765625, 0.159637451171875, 0.19171142578125, 0.223785400390625, 0.255859375, 0.287933349609375, 0.32000732421875, 0.352081298828125, 0.3841552734375, 0.416229248046875, 0.44830322265625, 0.480377197265625, 0.512451171875, 0.544525146484375, 0.57659912109375, 0.608673095703125, 0.6407470703125, 0.672821044921875, 0.70489501953125, 0.736968994140625, 0.76904296875, 0.801116943359375, 0.83319091796875, 0.865264892578125, 0.8973388671875, 0.929412841796875, 0.96148681640625, 0.993560791015625, 1.025634765625, 1.057708740234375, 1.08978271484375, 1.121856689453125, 1.1539306640625, 1.186004638671875, 1.21807861328125, 1.250152587890625, 1.2822265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 18.0, 12.0, 22.0, 40.0, 60.0, 101.0, 163.0, 312.0, 689.0, 1460.0, 4185.0, 20725.0, 399226.0, 584883.0, 28341.0, 5004.0, 1698.0, 719.0, 332.0, 194.0, 108.0, 74.0, 41.0, 31.0, 25.0, 17.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.26209449768066406, -0.2541694641113281, -0.2462444305419922, -0.23831939697265625, -0.2303943634033203, -0.22246932983398438, -0.21454429626464844, -0.2066192626953125, -0.19869422912597656, -0.19076919555664062, -0.1828441619873047, -0.17491912841796875, -0.1669940948486328, -0.15906906127929688, -0.15114402770996094, -0.143218994140625, -0.13529396057128906, -0.12736892700195312, -0.11944389343261719, -0.11151885986328125, -0.10359382629394531, -0.09566879272460938, -0.08774375915527344, -0.0798187255859375, -0.07189369201660156, -0.06396865844726562, -0.05604362487792969, -0.04811859130859375, -0.04019355773925781, -0.032268524169921875, -0.024343490600585938, -0.01641845703125, -0.008493423461914062, -0.000568389892578125, 0.0073566436767578125, 0.01528167724609375, 0.023206710815429688, 0.031131744384765625, 0.03905677795410156, 0.0469818115234375, 0.05490684509277344, 0.06283187866210938, 0.07075691223144531, 0.07868194580078125, 0.08660697937011719, 0.09453201293945312, 0.10245704650878906, 0.110382080078125, 0.11830711364746094, 0.12623214721679688, 0.1341571807861328, 0.14208221435546875, 0.1500072479248047, 0.15793228149414062, 0.16585731506347656, 0.1737823486328125, 0.18170738220214844, 0.18963241577148438, 0.1975574493408203, 0.20548248291015625, 0.2134075164794922, 0.22133255004882812, 0.22925758361816406, 0.2371826171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 16.0, 25.0, 27.0, 35.0, 48.0, 78.0, 92.0, 112.0, 113.0, 110.0, 74.0, 63.0, 57.0, 33.0, 20.0, 18.0, 12.0, 6.0, 8.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.827447891235352e-05, -8.563883602619171e-05, -8.300319314002991e-05, -8.03675502538681e-05, -7.77319073677063e-05, -7.50962644815445e-05, -7.246062159538269e-05, -6.982497870922089e-05, -6.718933582305908e-05, -6.455369293689728e-05, -6.191805005073547e-05, -5.928240716457367e-05, -5.6646764278411865e-05, -5.401112139225006e-05, -5.137547850608826e-05, -4.873983561992645e-05, -4.610419273376465e-05, -4.3468549847602844e-05, -4.083290696144104e-05, -3.8197264075279236e-05, -3.556162118911743e-05, -3.292597830295563e-05, -3.0290335416793823e-05, -2.765469253063202e-05, -2.5019049644470215e-05, -2.238340675830841e-05, -1.9747763872146606e-05, -1.7112120985984802e-05, -1.4476478099822998e-05, -1.1840835213661194e-05, -9.20519232749939e-06, -6.5695494413375854e-06, -3.933906555175781e-06, -1.298263669013977e-06, 1.3373792171478271e-06, 3.973022103309631e-06, 6.6086649894714355e-06, 9.24430787563324e-06, 1.1879950761795044e-05, 1.4515593647956848e-05, 1.7151236534118652e-05, 1.9786879420280457e-05, 2.242252230644226e-05, 2.5058165192604065e-05, 2.769380807876587e-05, 3.0329450964927673e-05, 3.296509385108948e-05, 3.560073673725128e-05, 3.8236379623413086e-05, 4.087202250957489e-05, 4.3507665395736694e-05, 4.61433082818985e-05, 4.87789511680603e-05, 5.141459405422211e-05, 5.405023694038391e-05, 5.6685879826545715e-05, 5.932152271270752e-05, 6.195716559886932e-05, 6.459280848503113e-05, 6.722845137119293e-05, 6.986409425735474e-05, 7.249973714351654e-05, 7.513538002967834e-05, 7.777102291584015e-05, 8.040666580200195e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 0.0, 3.0, 8.0, 12.0, 28.0, 49.0, 96.0, 202.0, 457.0, 1296.0, 6269.0, 148458.0, 868358.0, 19556.0, 2520.0, 659.0, 304.0, 119.0, 65.0, 44.0, 21.0, 10.0, 10.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326904296875, -0.31490325927734375, -0.3029022216796875, -0.29090118408203125, -0.278900146484375, -0.26689910888671875, -0.2548980712890625, -0.24289703369140625, -0.23089599609375, -0.21889495849609375, -0.2068939208984375, -0.19489288330078125, -0.182891845703125, -0.17089080810546875, -0.1588897705078125, -0.14688873291015625, -0.1348876953125, -0.12288665771484375, -0.1108856201171875, -0.09888458251953125, -0.086883544921875, -0.07488250732421875, -0.0628814697265625, -0.05088043212890625, -0.03887939453125, -0.02687835693359375, -0.0148773193359375, -0.00287628173828125, 0.009124755859375, 0.02112579345703125, 0.0331268310546875, 0.04512786865234375, 0.05712890625, 0.06912994384765625, 0.0811309814453125, 0.09313201904296875, 0.105133056640625, 0.11713409423828125, 0.1291351318359375, 0.14113616943359375, 0.15313720703125, 0.16513824462890625, 0.1771392822265625, 0.18914031982421875, 0.201141357421875, 0.21314239501953125, 0.2251434326171875, 0.23714447021484375, 0.2491455078125, 0.26114654541015625, 0.2731475830078125, 0.28514862060546875, 0.297149658203125, 0.30915069580078125, 0.3211517333984375, 0.33315277099609375, 0.34515380859375, 0.35715484619140625, 0.3691558837890625, 0.38115692138671875, 0.393157958984375, 0.40515899658203125, 0.4171600341796875, 0.42916107177734375, 0.441162109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 24.0, 28.0, 60.0, 137.0, 257.0, 257.0, 111.0, 46.0, 24.0, 16.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.31102752685546875, -0.2990570068359375, -0.28708648681640625, -0.275115966796875, -0.26314544677734375, -0.2511749267578125, -0.23920440673828125, -0.22723388671875, -0.21526336669921875, -0.2032928466796875, -0.19132232666015625, -0.179351806640625, -0.16738128662109375, -0.1554107666015625, -0.14344024658203125, -0.1314697265625, -0.11949920654296875, -0.1075286865234375, -0.09555816650390625, -0.083587646484375, -0.07161712646484375, -0.0596466064453125, -0.04767608642578125, -0.03570556640625, -0.02373504638671875, -0.0117645263671875, 0.00020599365234375, 0.012176513671875, 0.02414703369140625, 0.0361175537109375, 0.04808807373046875, 0.06005859375, 0.07202911376953125, 0.0839996337890625, 0.09597015380859375, 0.107940673828125, 0.11991119384765625, 0.1318817138671875, 0.14385223388671875, 0.15582275390625, 0.16779327392578125, 0.1797637939453125, 0.19173431396484375, 0.203704833984375, 0.21567535400390625, 0.2276458740234375, 0.23961639404296875, 0.2515869140625, 0.26355743408203125, 0.2755279541015625, 0.28749847412109375, 0.299468994140625, 0.31143951416015625, 0.3234100341796875, 0.33538055419921875, 0.34735107421875, 0.35932159423828125, 0.3712921142578125, 0.38326263427734375, 0.395233154296875, 0.40720367431640625, 0.4191741943359375, 0.43114471435546875, 0.443115234375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 15.0, 16.0, 27.0, 45.0, 89.0, 212.0, 270.0, 152.0, 71.0, 43.0, 22.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.955911159515381, -2.803083658218384, -2.6502559185028076, -2.4974284172058105, -2.3446006774902344, -2.1917731761932373, -2.0389456748962402, -1.8861180543899536, -1.733290433883667, -1.5804628133773804, -1.4276351928710938, -1.2748076915740967, -1.12198007106781, -0.9691524505615234, -0.8163248896598816, -0.6634973287582397, -0.5106697082519531, -0.3578421175479889, -0.20501452684402466, -0.052186936140060425, 0.10064065456390381, 0.25346827507019043, 0.4062958359718323, 0.5591233968734741, 0.7119510173797607, 0.8647786378860474, 1.017606258392334, 1.170433759689331, 1.3232613801956177, 1.4760890007019043, 1.6289165019989014, 1.781744122505188, 1.9345712661743164, 2.0873987674713135, 2.2402265071868896, 2.3930540084838867, 2.545881748199463, 2.69870924949646, 2.851536750793457, 3.004364490509033, 3.1571919918060303, 3.3100194931030273, 3.4628472328186035, 3.6156747341156006, 3.7685022354125977, 3.921329975128174, 4.07415771484375, 4.226984977722168, 4.379812717437744, 4.53264045715332, 4.685467720031738, 4.8382954597473145, 4.991123199462891, 5.143950462341309, 5.296778202056885, 5.449605941772461, 5.602433204650879, 5.755260944366455, 5.908088207244873, 6.060915946960449, 6.213743686676025, 6.366571426391602, 6.5193986892700195, 6.672226428985596, 6.825054168701172]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 8.0, 13.0, 10.0, 9.0, 14.0, 16.0, 22.0, 28.0, 21.0, 28.0, 34.0, 22.0, 25.0, 44.0, 48.0, 48.0, 41.0, 70.0, 56.0, 51.0, 39.0, 50.0, 37.0, 31.0, 35.0, 26.0, 26.0, 26.0, 21.0, 16.0, 11.0, 11.0, 13.0, 11.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6705427169799805, -3.55070161819458, -3.4308605194091797, -3.3110194206237793, -3.191178321838379, -3.0713372230529785, -2.951496124267578, -2.8316550254821777, -2.7118139266967773, -2.591972827911377, -2.4721317291259766, -2.352290630340576, -2.232449531555176, -2.1126084327697754, -1.992767333984375, -1.8729262351989746, -1.7530850172042847, -1.6332439184188843, -1.5134028196334839, -1.3935617208480835, -1.273720622062683, -1.1538794040679932, -1.0340383052825928, -0.9141972661018372, -0.7943561673164368, -0.6745150685310364, -0.554673969745636, -0.4348328411579132, -0.3149917423725128, -0.19515061378479004, -0.07530951499938965, 0.04453158378601074, 0.16437268257141113, 0.2842137813568115, 0.4040548801422119, 0.5238959789276123, 0.6437370777130127, 0.7635782361030579, 0.8834193348884583, 1.0032603740692139, 1.1231014728546143, 1.2429425716400146, 1.362783670425415, 1.4826247692108154, 1.6024658679962158, 1.7223069667816162, 1.8421480655670166, 1.961989164352417, 2.0818305015563965, 2.201671600341797, 2.3215126991271973, 2.4413537979125977, 2.561194896697998, 2.6810359954833984, 2.800877094268799, 2.920718193054199, 3.0405592918395996, 3.160400390625, 3.2802414894104004, 3.400082588195801, 3.519923686981201, 3.6397647857666016, 3.759605884552002, 3.8794469833374023, 3.9992880821228027]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 0.0, 12.0, 15.0, 21.0, 33.0, 40.0, 91.0, 160.0, 274.0, 618.0, 1243.0, 2811.0, 7946.0, 36232.0, 1115336.0, 2972532.0, 41287.0, 8908.0, 3322.0, 1492.0, 730.0, 415.0, 242.0, 142.0, 106.0, 72.0, 39.0, 32.0, 25.0, 22.0, 8.0, 13.0, 12.0, 16.0, 4.0, 1.0, 4.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88427734375, -0.8401565551757812, -0.7960357666015625, -0.7519149780273438, -0.707794189453125, -0.6636734008789062, -0.6195526123046875, -0.5754318237304688, -0.53131103515625, -0.48719024658203125, -0.4430694580078125, -0.39894866943359375, -0.354827880859375, -0.31070709228515625, -0.2665863037109375, -0.22246551513671875, -0.1783447265625, -0.13422393798828125, -0.0901031494140625, -0.04598236083984375, -0.001861572265625, 0.04225921630859375, 0.0863800048828125, 0.13050079345703125, 0.17462158203125, 0.21874237060546875, 0.2628631591796875, 0.30698394775390625, 0.351104736328125, 0.39522552490234375, 0.4393463134765625, 0.48346710205078125, 0.527587890625, 0.5717086791992188, 0.6158294677734375, 0.6599502563476562, 0.704071044921875, 0.7481918334960938, 0.7923126220703125, 0.8364334106445312, 0.88055419921875, 0.9246749877929688, 0.9687957763671875, 1.0129165649414062, 1.057037353515625, 1.1011581420898438, 1.1452789306640625, 1.1893997192382812, 1.2335205078125, 1.2776412963867188, 1.3217620849609375, 1.3658828735351562, 1.410003662109375, 1.4541244506835938, 1.4982452392578125, 1.5423660278320312, 1.58648681640625, 1.6306076049804688, 1.6747283935546875, 1.7188491821289062, 1.762969970703125, 1.8070907592773438, 1.8512115478515625, 1.8953323364257812, 1.939453125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 9.0, 23.0, 36.0, 31.0, 52.0, 52.0, 71.0, 79.0, 85.0, 103.0, 77.0, 83.0, 78.0, 59.0, 50.0, 33.0, 30.0, 14.0, 15.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1669921875, -0.15843582153320312, -0.14987945556640625, -0.14132308959960938, -0.1327667236328125, -0.12421035766601562, -0.11565399169921875, -0.10709762573242188, -0.098541259765625, -0.08998489379882812, -0.08142852783203125, -0.07287216186523438, -0.0643157958984375, -0.055759429931640625, -0.04720306396484375, -0.038646697998046875, -0.03009033203125, -0.021533966064453125, -0.01297760009765625, -0.004421234130859375, 0.0041351318359375, 0.012691497802734375, 0.02124786376953125, 0.029804229736328125, 0.038360595703125, 0.046916961669921875, 0.05547332763671875, 0.06402969360351562, 0.0725860595703125, 0.08114242553710938, 0.08969879150390625, 0.09825515747070312, 0.1068115234375, 0.11536788940429688, 0.12392425537109375, 0.13248062133789062, 0.1410369873046875, 0.14959335327148438, 0.15814971923828125, 0.16670608520507812, 0.175262451171875, 0.18381881713867188, 0.19237518310546875, 0.20093154907226562, 0.2094879150390625, 0.21804428100585938, 0.22660064697265625, 0.23515701293945312, 0.24371337890625, 0.2522697448730469, 0.26082611083984375, 0.2693824768066406, 0.2779388427734375, 0.2864952087402344, 0.29505157470703125, 0.3036079406738281, 0.312164306640625, 0.3207206726074219, 0.32927703857421875, 0.3378334045410156, 0.3463897705078125, 0.3549461364746094, 0.36350250244140625, 0.3720588684082031, 0.380615234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 19.0, 16.0, 18.0, 28.0, 53.0, 97.0, 221.0, 581.0, 1711.0, 6749.0, 110758.0, 4053225.0, 15579.0, 3304.0, 1060.0, 412.0, 177.0, 95.0, 60.0, 41.0, 34.0, 17.0, 6.0, 12.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.158203125, -2.084320068359375, -2.01043701171875, -1.936553955078125, -1.8626708984375, -1.788787841796875, -1.71490478515625, -1.641021728515625, -1.567138671875, -1.493255615234375, -1.41937255859375, -1.345489501953125, -1.2716064453125, -1.197723388671875, -1.12384033203125, -1.049957275390625, -0.97607421875, -0.902191162109375, -0.82830810546875, -0.754425048828125, -0.6805419921875, -0.606658935546875, -0.53277587890625, -0.458892822265625, -0.385009765625, -0.311126708984375, -0.23724365234375, -0.163360595703125, -0.0894775390625, -0.015594482421875, 0.05828857421875, 0.132171630859375, 0.2060546875, 0.279937744140625, 0.35382080078125, 0.427703857421875, 0.5015869140625, 0.575469970703125, 0.64935302734375, 0.723236083984375, 0.797119140625, 0.871002197265625, 0.94488525390625, 1.018768310546875, 1.0926513671875, 1.166534423828125, 1.24041748046875, 1.314300537109375, 1.38818359375, 1.462066650390625, 1.53594970703125, 1.609832763671875, 1.6837158203125, 1.757598876953125, 1.83148193359375, 1.905364990234375, 1.979248046875, 2.053131103515625, 2.12701416015625, 2.200897216796875, 2.2747802734375, 2.348663330078125, 2.42254638671875, 2.496429443359375, 2.5703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 0.0, 4.0, 3.0, 5.0, 3.0, 11.0, 17.0, 43.0, 118.0, 830.0, 2691.0, 216.0, 57.0, 25.0, 18.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5555038452148438, -0.5265350341796875, -0.49756622314453125, -0.468597412109375, -0.43962860107421875, -0.4106597900390625, -0.38169097900390625, -0.35272216796875, -0.32375335693359375, -0.2947845458984375, -0.26581573486328125, -0.236846923828125, -0.20787811279296875, -0.1789093017578125, -0.14994049072265625, -0.1209716796875, -0.09200286865234375, -0.0630340576171875, -0.03406524658203125, -0.005096435546875, 0.02387237548828125, 0.0528411865234375, 0.08180999755859375, 0.11077880859375, 0.13974761962890625, 0.1687164306640625, 0.19768524169921875, 0.226654052734375, 0.25562286376953125, 0.2845916748046875, 0.31356048583984375, 0.342529296875, 0.37149810791015625, 0.4004669189453125, 0.42943572998046875, 0.458404541015625, 0.48737335205078125, 0.5163421630859375, 0.5453109741210938, 0.57427978515625, 0.6032485961914062, 0.6322174072265625, 0.6611862182617188, 0.690155029296875, 0.7191238403320312, 0.7480926513671875, 0.7770614624023438, 0.8060302734375, 0.8349990844726562, 0.8639678955078125, 0.8929367065429688, 0.921905517578125, 0.9508743286132812, 0.9798431396484375, 1.0088119506835938, 1.03778076171875, 1.0667495727539062, 1.0957183837890625, 1.1246871948242188, 1.153656005859375, 1.1826248168945312, 1.2115936279296875, 1.2405624389648438, 1.26953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 26.0, 89.0, 511.0, 293.0, 53.0, 17.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8825347423553467, -1.689887523651123, -1.4972403049468994, -1.3045932054519653, -1.1119459867477417, -0.9192987680435181, -0.726651668548584, -0.5340044498443604, -0.3413572311401367, -0.14871004223823547, 0.04393714666366577, 0.23658430576324463, 0.42923152446746826, 0.6218787431716919, 0.814525842666626, 1.0071730613708496, 1.1998202800750732, 1.3924674987792969, 1.5851147174835205, 1.7777618169784546, 1.9704090356826782, 2.1630563735961914, 2.355703353881836, 2.5483505725860596, 2.740997791290283, 2.933645009994507, 3.1262922286987305, 3.318939208984375, 3.5115866661071777, 3.7042336463928223, 3.896880865097046, 4.0895280838012695, 4.282175064086914, 4.474822044372559, 4.667469501495361, 4.860116481781006, 5.052763938903809, 5.245410919189453, 5.438057899475098, 5.6307053565979, 5.823352813720703, 6.015999794006348, 6.20864725112915, 6.401294231414795, 6.593941688537598, 6.786588668823242, 6.979235649108887, 7.1718831062316895, 7.364530086517334, 7.5571770668029785, 7.749824523925781, 7.942471504211426, 8.13511848449707, 8.327766418457031, 8.520413398742676, 8.71306037902832, 8.905707359313965, 9.09835433959961, 9.291001319885254, 9.483649253845215, 9.67629623413086, 9.868943214416504, 10.061590194702148, 10.25423812866211, 10.446885108947754]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 13.0, 14.0, 30.0, 54.0, 79.0, 116.0, 125.0, 124.0, 132.0, 108.0, 76.0, 57.0, 43.0, 14.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8807637691497803, -3.7486610412597656, -3.61655855178833, -3.4844558238983154, -3.352353096008301, -3.2202506065368652, -3.0881478786468506, -2.956045150756836, -2.8239426612854004, -2.6918399333953857, -2.55973744392395, -2.4276347160339355, -2.2955322265625, -2.1634294986724854, -2.0313267707824707, -1.8992241621017456, -1.7671215534210205, -1.6350189447402954, -1.5029163360595703, -1.3708136081695557, -1.2387109994888306, -1.1066083908081055, -0.9745057225227356, -0.8424030542373657, -0.7103004455566406, -0.5781978368759155, -0.44609516859054565, -0.31399253010749817, -0.18188989162445068, -0.049787282943725586, 0.08231538534164429, 0.21441805362701416, 0.34652042388916016, 0.47862306237220764, 0.6107257008552551, 0.742828369140625, 0.8749309778213501, 1.0070335865020752, 1.1391363143920898, 1.271238923072815, 1.40334153175354, 1.5354441404342651, 1.6675467491149902, 1.7996494770050049, 1.93175208568573, 2.063854694366455, 2.1959574222564697, 2.3280601501464844, 2.46016263961792, 2.5922653675079346, 2.72436785697937, 2.8564705848693848, 2.9885730743408203, 3.120675802230835, 3.2527785301208496, 3.384881019592285, 3.5169837474823, 3.6490864753723145, 3.78118896484375, 3.9132916927337646, 4.045394420623779, 4.177496910095215, 4.30959939956665, 4.441702365875244, 4.57380485534668]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 10.0, 12.0, 13.0, 20.0, 41.0, 77.0, 100.0, 187.0, 376.0, 926.0, 3080.0, 16035.0, 207437.0, 764989.0, 46482.0, 5868.0, 1618.0, 549.0, 259.0, 155.0, 103.0, 55.0, 34.0, 34.0, 19.0, 15.0, 13.0, 6.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4697265625, -1.425506591796875, -1.38128662109375, -1.337066650390625, -1.2928466796875, -1.248626708984375, -1.20440673828125, -1.160186767578125, -1.115966796875, -1.071746826171875, -1.02752685546875, -0.983306884765625, -0.9390869140625, -0.894866943359375, -0.85064697265625, -0.806427001953125, -0.76220703125, -0.717987060546875, -0.67376708984375, -0.629547119140625, -0.5853271484375, -0.541107177734375, -0.49688720703125, -0.452667236328125, -0.408447265625, -0.364227294921875, -0.32000732421875, -0.275787353515625, -0.2315673828125, -0.187347412109375, -0.14312744140625, -0.098907470703125, -0.0546875, -0.010467529296875, 0.03375244140625, 0.077972412109375, 0.1221923828125, 0.166412353515625, 0.21063232421875, 0.254852294921875, 0.299072265625, 0.343292236328125, 0.38751220703125, 0.431732177734375, 0.4759521484375, 0.520172119140625, 0.56439208984375, 0.608612060546875, 0.65283203125, 0.697052001953125, 0.74127197265625, 0.785491943359375, 0.8297119140625, 0.873931884765625, 0.91815185546875, 0.962371826171875, 1.006591796875, 1.050811767578125, 1.09503173828125, 1.139251708984375, 1.1834716796875, 1.227691650390625, 1.27191162109375, 1.316131591796875, 1.3603515625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 11.0, 9.0, 24.0, 45.0, 62.0, 85.0, 121.0, 127.0, 129.0, 119.0, 83.0, 78.0, 50.0, 38.0, 13.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.2344799041748047, -0.22225570678710938, -0.21003150939941406, -0.19780731201171875, -0.18558311462402344, -0.17335891723632812, -0.1611347198486328, -0.1489105224609375, -0.1366863250732422, -0.12446212768554688, -0.11223793029785156, -0.10001373291015625, -0.08778953552246094, -0.07556533813476562, -0.06334114074707031, -0.051116943359375, -0.03889274597167969, -0.026668548583984375, -0.014444351196289062, -0.00222015380859375, 0.010004043579101562, 0.022228240966796875, 0.03445243835449219, 0.0466766357421875, 0.05890083312988281, 0.07112503051757812, 0.08334922790527344, 0.09557342529296875, 0.10779762268066406, 0.12002182006835938, 0.1322460174560547, 0.14447021484375, 0.1566944122314453, 0.16891860961914062, 0.18114280700683594, 0.19336700439453125, 0.20559120178222656, 0.21781539916992188, 0.2300395965576172, 0.2422637939453125, 0.2544879913330078, 0.2667121887207031, 0.27893638610839844, 0.29116058349609375, 0.30338478088378906, 0.3156089782714844, 0.3278331756591797, 0.340057373046875, 0.3522815704345703, 0.3645057678222656, 0.37672996520996094, 0.38895416259765625, 0.40117835998535156, 0.4134025573730469, 0.4256267547607422, 0.4378509521484375, 0.4500751495361328, 0.4622993469238281, 0.47452354431152344, 0.48674774169921875, 0.49897193908691406, 0.5111961364746094, 0.5234203338623047, 0.53564453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 14.0, 23.0, 24.0, 48.0, 67.0, 89.0, 169.0, 347.0, 811.0, 2248.0, 7691.0, 31647.0, 173426.0, 675352.0, 122822.0, 24514.0, 6012.0, 1815.0, 703.0, 318.0, 137.0, 101.0, 56.0, 30.0, 28.0, 17.0, 9.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7216796875, -0.7007064819335938, -0.6797332763671875, -0.6587600708007812, -0.637786865234375, -0.6168136596679688, -0.5958404541015625, -0.5748672485351562, -0.55389404296875, -0.5329208374023438, -0.5119476318359375, -0.49097442626953125, -0.470001220703125, -0.44902801513671875, -0.4280548095703125, -0.40708160400390625, -0.3861083984375, -0.36513519287109375, -0.3441619873046875, -0.32318878173828125, -0.302215576171875, -0.28124237060546875, -0.2602691650390625, -0.23929595947265625, -0.21832275390625, -0.19734954833984375, -0.1763763427734375, -0.15540313720703125, -0.134429931640625, -0.11345672607421875, -0.0924835205078125, -0.07151031494140625, -0.050537109375, -0.02956390380859375, -0.0085906982421875, 0.01238250732421875, 0.033355712890625, 0.05432891845703125, 0.0753021240234375, 0.09627532958984375, 0.11724853515625, 0.13822174072265625, 0.1591949462890625, 0.18016815185546875, 0.201141357421875, 0.22211456298828125, 0.2430877685546875, 0.26406097412109375, 0.2850341796875, 0.30600738525390625, 0.3269805908203125, 0.34795379638671875, 0.368927001953125, 0.38990020751953125, 0.4108734130859375, 0.43184661865234375, 0.45281982421875, 0.47379302978515625, 0.4947662353515625, 0.5157394409179688, 0.536712646484375, 0.5576858520507812, 0.5786590576171875, 0.5996322631835938, 0.62060546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 14.0, 10.0, 8.0, 16.0, 24.0, 22.0, 28.0, 38.0, 34.0, 34.0, 46.0, 51.0, 56.0, 60.0, 42.0, 57.0, 62.0, 48.0, 44.0, 32.0, 41.0, 38.0, 44.0, 26.0, 25.0, 28.0, 13.0, 8.0, 15.0, 10.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7421875, -0.7213516235351562, -0.7005157470703125, -0.6796798706054688, -0.658843994140625, -0.6380081176757812, -0.6171722412109375, -0.5963363647460938, -0.57550048828125, -0.5546646118164062, -0.5338287353515625, -0.5129928588867188, -0.492156982421875, -0.47132110595703125, -0.4504852294921875, -0.42964935302734375, -0.4088134765625, -0.38797760009765625, -0.3671417236328125, -0.34630584716796875, -0.325469970703125, -0.30463409423828125, -0.2837982177734375, -0.26296234130859375, -0.24212646484375, -0.22129058837890625, -0.2004547119140625, -0.17961883544921875, -0.158782958984375, -0.13794708251953125, -0.1171112060546875, -0.09627532958984375, -0.075439453125, -0.05460357666015625, -0.0337677001953125, -0.01293182373046875, 0.007904052734375, 0.02873992919921875, 0.0495758056640625, 0.07041168212890625, 0.09124755859375, 0.11208343505859375, 0.1329193115234375, 0.15375518798828125, 0.174591064453125, 0.19542694091796875, 0.2162628173828125, 0.23709869384765625, 0.2579345703125, 0.27877044677734375, 0.2996063232421875, 0.32044219970703125, 0.341278076171875, 0.36211395263671875, 0.3829498291015625, 0.40378570556640625, 0.42462158203125, 0.44545745849609375, 0.4662933349609375, 0.48712921142578125, 0.507965087890625, 0.5288009643554688, 0.5496368408203125, 0.5704727172851562, 0.59130859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 10.0, 22.0, 28.0, 33.0, 45.0, 78.0, 128.0, 188.0, 376.0, 781.0, 2474.0, 11221.0, 147146.0, 818716.0, 57389.0, 6694.0, 1761.0, 661.0, 318.0, 173.0, 100.0, 76.0, 41.0, 24.0, 13.0, 12.0, 15.0, 11.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.2960700988769531, -0.28745269775390625, -0.2788352966308594, -0.2702178955078125, -0.2616004943847656, -0.25298309326171875, -0.24436569213867188, -0.235748291015625, -0.22713088989257812, -0.21851348876953125, -0.20989608764648438, -0.2012786865234375, -0.19266128540039062, -0.18404388427734375, -0.17542648315429688, -0.16680908203125, -0.15819168090820312, -0.14957427978515625, -0.14095687866210938, -0.1323394775390625, -0.12372207641601562, -0.11510467529296875, -0.10648727416992188, -0.097869873046875, -0.08925247192382812, -0.08063507080078125, -0.07201766967773438, -0.0634002685546875, -0.054782867431640625, -0.04616546630859375, -0.037548065185546875, -0.0289306640625, -0.020313262939453125, -0.01169586181640625, -0.003078460693359375, 0.0055389404296875, 0.014156341552734375, 0.02277374267578125, 0.031391143798828125, 0.040008544921875, 0.048625946044921875, 0.05724334716796875, 0.06586074829101562, 0.0744781494140625, 0.08309555053710938, 0.09171295166015625, 0.10033035278320312, 0.10894775390625, 0.11756515502929688, 0.12618255615234375, 0.13479995727539062, 0.1434173583984375, 0.15203475952148438, 0.16065216064453125, 0.16926956176757812, 0.177886962890625, 0.18650436401367188, 0.19512176513671875, 0.20373916625976562, 0.2123565673828125, 0.22097396850585938, 0.22959136962890625, 0.23820877075195312, 0.246826171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 26.0, 49.0, 113.0, 203.0, 240.0, 150.0, 89.0, 38.0, 20.0, 16.0, 11.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017309188842773438, -0.00016788765788078308, -0.0001626834273338318, -0.0001574791967868805, -0.0001522749662399292, -0.0001470707356929779, -0.0001418665051460266, -0.00013666227459907532, -0.00013145804405212402, -0.00012625381350517273, -0.00012104958295822144, -0.00011584535241127014, -0.00011064112186431885, -0.00010543689131736755, -0.00010023266077041626, -9.502843022346497e-05, -8.982419967651367e-05, -8.461996912956238e-05, -7.941573858261108e-05, -7.421150803565979e-05, -6.90072774887085e-05, -6.38030469417572e-05, -5.859881639480591e-05, -5.3394585847854614e-05, -4.819035530090332e-05, -4.2986124753952026e-05, -3.778189420700073e-05, -3.257766366004944e-05, -2.7373433113098145e-05, -2.216920256614685e-05, -1.6964972019195557e-05, -1.1760741472244263e-05, -6.556510925292969e-06, -1.3522803783416748e-06, 3.851950168609619e-06, 9.056180715560913e-06, 1.4260411262512207e-05, 1.94646418094635e-05, 2.4668872356414795e-05, 2.987310290336609e-05, 3.507733345031738e-05, 4.028156399726868e-05, 4.548579454421997e-05, 5.0690025091171265e-05, 5.589425563812256e-05, 6.109848618507385e-05, 6.630271673202515e-05, 7.150694727897644e-05, 7.671117782592773e-05, 8.191540837287903e-05, 8.711963891983032e-05, 9.232386946678162e-05, 9.752810001373291e-05, 0.0001027323305606842, 0.0001079365611076355, 0.00011314079165458679, 0.00011834502220153809, 0.00012354925274848938, 0.00012875348329544067, 0.00013395771384239197, 0.00013916194438934326, 0.00014436617493629456, 0.00014957040548324585, 0.00015477463603019714, 0.00015997886657714844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 5.0, 5.0, 12.0, 21.0, 46.0, 59.0, 103.0, 209.0, 434.0, 921.0, 2689.0, 9572.0, 53365.0, 519916.0, 408053.0, 41324.0, 7808.0, 2306.0, 891.0, 368.0, 177.0, 101.0, 53.0, 40.0, 22.0, 14.0, 8.0, 5.0, 11.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.15960121154785156, -0.15367507934570312, -0.1477489471435547, -0.14182281494140625, -0.1358966827392578, -0.12997055053710938, -0.12404441833496094, -0.1181182861328125, -0.11219215393066406, -0.10626602172851562, -0.10033988952636719, -0.09441375732421875, -0.08848762512207031, -0.08256149291992188, -0.07663536071777344, -0.070709228515625, -0.06478309631347656, -0.058856964111328125, -0.05293083190917969, -0.04700469970703125, -0.04107856750488281, -0.035152435302734375, -0.029226303100585938, -0.0233001708984375, -0.017374038696289062, -0.011447906494140625, -0.0055217742919921875, 0.00040435791015625, 0.0063304901123046875, 0.012256622314453125, 0.018182754516601562, 0.02410888671875, 0.030035018920898438, 0.035961151123046875, 0.04188728332519531, 0.04781341552734375, 0.05373954772949219, 0.059665679931640625, 0.06559181213378906, 0.0715179443359375, 0.07744407653808594, 0.08337020874023438, 0.08929634094238281, 0.09522247314453125, 0.10114860534667969, 0.10707473754882812, 0.11300086975097656, 0.118927001953125, 0.12485313415527344, 0.13077926635742188, 0.1367053985595703, 0.14263153076171875, 0.1485576629638672, 0.15448379516601562, 0.16040992736816406, 0.1663360595703125, 0.17226219177246094, 0.17818832397460938, 0.1841144561767578, 0.19004058837890625, 0.1959667205810547, 0.20189285278320312, 0.20781898498535156, 0.2137451171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 13.0, 17.0, 25.0, 25.0, 32.0, 41.0, 49.0, 83.0, 108.0, 103.0, 112.0, 76.0, 60.0, 58.0, 46.0, 33.0, 29.0, 16.0, 14.0, 9.0, 6.0, 4.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17296981811523438, -0.16698455810546875, -0.16099929809570312, -0.1550140380859375, -0.14902877807617188, -0.14304351806640625, -0.13705825805664062, -0.131072998046875, -0.12508773803710938, -0.11910247802734375, -0.11311721801757812, -0.1071319580078125, -0.10114669799804688, -0.09516143798828125, -0.08917617797851562, -0.08319091796875, -0.07720565795898438, -0.07122039794921875, -0.06523513793945312, -0.0592498779296875, -0.053264617919921875, -0.04727935791015625, -0.041294097900390625, -0.035308837890625, -0.029323577880859375, -0.02333831787109375, -0.017353057861328125, -0.0113677978515625, -0.005382537841796875, 0.00060272216796875, 0.006587982177734375, 0.0125732421875, 0.018558502197265625, 0.02454376220703125, 0.030529022216796875, 0.0365142822265625, 0.042499542236328125, 0.04848480224609375, 0.054470062255859375, 0.060455322265625, 0.06644058227539062, 0.07242584228515625, 0.07841110229492188, 0.0843963623046875, 0.09038162231445312, 0.09636688232421875, 0.10235214233398438, 0.10833740234375, 0.11432266235351562, 0.12030792236328125, 0.12629318237304688, 0.1322784423828125, 0.13826370239257812, 0.14424896240234375, 0.15023422241210938, 0.156219482421875, 0.16220474243164062, 0.16819000244140625, 0.17417526245117188, 0.1801605224609375, 0.18614578247070312, 0.19213104248046875, 0.19811630249023438, 0.2041015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 10.0, 21.0, 28.0, 45.0, 74.0, 213.0, 263.0, 176.0, 79.0, 47.0, 20.0, 9.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.911275386810303, -4.768937110900879, -4.626598358154297, -4.484260082244873, -4.341921806335449, -4.199583530426025, -4.057245254516602, -3.9149065017700195, -3.7725682258605957, -3.630229949951172, -3.487891435623169, -3.345552921295166, -3.203214645385742, -3.0608763694763184, -2.9185378551483154, -2.7761993408203125, -2.6338610649108887, -2.491522789001465, -2.349184274673462, -2.206845760345459, -2.064507484436035, -1.9221690893173218, -1.7798306941986084, -1.637492299079895, -1.4951539039611816, -1.3528155088424683, -1.2104771137237549, -1.0681387186050415, -0.9258003234863281, -0.7834619283676147, -0.6411235332489014, -0.498785138130188, -0.3564472198486328, -0.21410882472991943, -0.07177042961120605, 0.07056796550750732, 0.2129063606262207, 0.3552447557449341, 0.49758315086364746, 0.6399215459823608, 0.7822599411010742, 0.9245983362197876, 1.066936731338501, 1.2092751264572144, 1.3516135215759277, 1.4939519166946411, 1.6362903118133545, 1.7786287069320679, 1.9209671020507812, 2.063305377960205, 2.205643892288208, 2.347982406616211, 2.4903206825256348, 2.6326589584350586, 2.7749974727630615, 2.9173359870910645, 3.0596742630004883, 3.202012538909912, 3.344351053237915, 3.486689567565918, 3.629027843475342, 3.7713661193847656, 3.9137046337127686, 4.0560431480407715, 4.198381423950195]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 1.0, 8.0, 14.0, 8.0, 8.0, 13.0, 17.0, 15.0, 22.0, 19.0, 29.0, 26.0, 44.0, 37.0, 44.0, 32.0, 41.0, 46.0, 48.0, 43.0, 48.0, 50.0, 39.0, 39.0, 41.0, 40.0, 36.0, 32.0, 35.0, 27.0, 17.0, 23.0, 8.0, 11.0, 8.0, 7.0, 7.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.335688591003418, -3.2290048599243164, -3.1223208904266357, -3.015637159347534, -2.9089534282684326, -2.802269458770752, -2.6955857276916504, -2.588901996612549, -2.4822182655334473, -2.3755345344543457, -2.268850564956665, -2.1621668338775635, -2.055483102798462, -1.9487992525100708, -1.8421154022216797, -1.7354316711425781, -1.6287477016448975, -1.5220638513565063, -1.4153801202774048, -1.3086962699890137, -1.202012538909912, -1.095328688621521, -0.9886448383331299, -0.8819610476493835, -0.7752772569656372, -0.6685934662818909, -0.5619096755981445, -0.4552258253097534, -0.3485420346260071, -0.24185824394226074, -0.13517439365386963, -0.02849060297012329, 0.07819318771362305, 0.18487699329853058, 0.2915607988834381, 0.39824461936950684, 0.5049284100532532, 0.6116122007369995, 0.7182960510253906, 0.824979841709137, 0.9316636323928833, 1.0383474826812744, 1.145031213760376, 1.251715064048767, 1.3583989143371582, 1.4650826454162598, 1.5717664957046509, 1.678450345993042, 1.7851340770721436, 1.8918179273605347, 1.9985016584396362, 2.1051855087280273, 2.211869239807129, 2.3185529708862305, 2.425236940383911, 2.5319206714630127, 2.6386046409606934, 2.745288372039795, 2.8519723415374756, 2.958656072616577, 3.0653398036956787, 3.1720237731933594, 3.278707504272461, 3.3853912353515625, 3.492074966430664]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 38.0, 62.0, 172.0, 458.0, 2089.0, 25347.0, 4105499.0, 55919.0, 3291.0, 771.0, 291.0, 143.0, 71.0, 49.0, 27.0, 15.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -0.9990234375, -0.9453125, -0.8916015625, -0.837890625, -0.7841796875, -0.73046875, -0.6767578125, -0.623046875, -0.5693359375, -0.515625, -0.4619140625, -0.408203125, -0.3544921875, -0.30078125, -0.2470703125, -0.193359375, -0.1396484375, -0.0859375, -0.0322265625, 0.021484375, 0.0751953125, 0.12890625, 0.1826171875, 0.236328125, 0.2900390625, 0.34375, 0.3974609375, 0.451171875, 0.5048828125, 0.55859375, 0.6123046875, 0.666015625, 0.7197265625, 0.7734375, 0.8271484375, 0.880859375, 0.9345703125, 0.98828125, 1.0419921875, 1.095703125, 1.1494140625, 1.203125, 1.2568359375, 1.310546875, 1.3642578125, 1.41796875, 1.4716796875, 1.525390625, 1.5791015625, 1.6328125, 1.6865234375, 1.740234375, 1.7939453125, 1.84765625, 1.9013671875, 1.955078125, 2.0087890625, 2.0625, 2.1162109375, 2.169921875, 2.2236328125, 2.27734375, 2.3310546875, 2.384765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 8.0, 16.0, 38.0, 62.0, 81.0, 106.0, 100.0, 125.0, 108.0, 96.0, 91.0, 63.0, 43.0, 29.0, 7.0, 15.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2384033203125, -0.2263164520263672, -0.21422958374023438, -0.20214271545410156, -0.19005584716796875, -0.17796897888183594, -0.16588211059570312, -0.1537952423095703, -0.1417083740234375, -0.1296215057373047, -0.11753463745117188, -0.10544776916503906, -0.09336090087890625, -0.08127403259277344, -0.06918716430664062, -0.05710029602050781, -0.045013427734375, -0.03292655944824219, -0.020839691162109375, -0.008752822875976562, 0.00333404541015625, 0.015420913696289062, 0.027507781982421875, 0.03959465026855469, 0.0516815185546875, 0.06376838684082031, 0.07585525512695312, 0.08794212341308594, 0.10002899169921875, 0.11211585998535156, 0.12420272827148438, 0.1362895965576172, 0.14837646484375, 0.1604633331298828, 0.17255020141601562, 0.18463706970214844, 0.19672393798828125, 0.20881080627441406, 0.22089767456054688, 0.2329845428466797, 0.2450714111328125, 0.2571582794189453, 0.2692451477050781, 0.28133201599121094, 0.29341888427734375, 0.30550575256347656, 0.3175926208496094, 0.3296794891357422, 0.341766357421875, 0.3538532257080078, 0.3659400939941406, 0.37802696228027344, 0.39011383056640625, 0.40220069885253906, 0.4142875671386719, 0.4263744354248047, 0.4384613037109375, 0.4505481719970703, 0.4626350402832031, 0.47472190856933594, 0.48680877685546875, 0.49889564514160156, 0.5109825134277344, 0.5230693817138672, 0.53515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 13.0, 32.0, 32.0, 47.0, 92.0, 159.0, 326.0, 621.0, 1650.0, 4584.0, 19362.0, 334769.0, 3779487.0, 42412.0, 6926.0, 2167.0, 822.0, 362.0, 189.0, 84.0, 57.0, 31.0, 25.0, 10.0, 5.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4777030944824219, -0.45711517333984375, -0.4365272521972656, -0.4159393310546875, -0.3953514099121094, -0.37476348876953125, -0.3541755676269531, -0.333587646484375, -0.3129997253417969, -0.29241180419921875, -0.2718238830566406, -0.2512359619140625, -0.23064804077148438, -0.21006011962890625, -0.18947219848632812, -0.16888427734375, -0.14829635620117188, -0.12770843505859375, -0.10712051391601562, -0.0865325927734375, -0.06594467163085938, -0.04535675048828125, -0.024768829345703125, -0.004180908203125, 0.016407012939453125, 0.03699493408203125, 0.057582855224609375, 0.0781707763671875, 0.09875869750976562, 0.11934661865234375, 0.13993453979492188, 0.1605224609375, 0.18111038208007812, 0.20169830322265625, 0.22228622436523438, 0.2428741455078125, 0.2634620666503906, 0.28404998779296875, 0.3046379089355469, 0.325225830078125, 0.3458137512207031, 0.36640167236328125, 0.3869895935058594, 0.4075775146484375, 0.4281654357910156, 0.44875335693359375, 0.4693412780761719, 0.48992919921875, 0.5105171203613281, 0.5311050415039062, 0.5516929626464844, 0.5722808837890625, 0.5928688049316406, 0.6134567260742188, 0.6340446472167969, 0.654632568359375, 0.6752204895019531, 0.6958084106445312, 0.7163963317871094, 0.7369842529296875, 0.7575721740722656, 0.7781600952148438, 0.7987480163574219, 0.8193359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 6.0, 11.0, 21.0, 22.0, 34.0, 91.0, 147.0, 468.0, 2558.0, 442.0, 135.0, 48.0, 31.0, 13.0, 16.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.35027503967285156, -0.3411750793457031, -0.3320751190185547, -0.32297515869140625, -0.3138751983642578, -0.3047752380371094, -0.29567527770996094, -0.2865753173828125, -0.27747535705566406, -0.2683753967285156, -0.2592754364013672, -0.25017547607421875, -0.2410755157470703, -0.23197555541992188, -0.22287559509277344, -0.213775634765625, -0.20467567443847656, -0.19557571411132812, -0.1864757537841797, -0.17737579345703125, -0.1682758331298828, -0.15917587280273438, -0.15007591247558594, -0.1409759521484375, -0.13187599182128906, -0.12277603149414062, -0.11367607116699219, -0.10457611083984375, -0.09547615051269531, -0.08637619018554688, -0.07727622985839844, -0.06817626953125, -0.05907630920410156, -0.049976348876953125, -0.04087638854980469, -0.03177642822265625, -0.022676467895507812, -0.013576507568359375, -0.0044765472412109375, 0.0046234130859375, 0.013723373413085938, 0.022823333740234375, 0.03192329406738281, 0.04102325439453125, 0.05012321472167969, 0.059223175048828125, 0.06832313537597656, 0.077423095703125, 0.08652305603027344, 0.09562301635742188, 0.10472297668457031, 0.11382293701171875, 0.12292289733886719, 0.13202285766601562, 0.14112281799316406, 0.1502227783203125, 0.15932273864746094, 0.16842269897460938, 0.1775226593017578, 0.18662261962890625, 0.1957225799560547, 0.20482254028320312, 0.21392250061035156, 0.2230224609375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 70.0, 443.0, 432.0, 43.0, 10.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.605253219604492, -5.493514537811279, -5.381776332855225, -5.270037651062012, -5.158299446105957, -5.046560764312744, -4.934822082519531, -4.823083877563477, -4.711345195770264, -4.599606513977051, -4.487868309020996, -4.376129627227783, -4.2643914222717285, -4.152652740478516, -4.040914535522461, -3.929175853729248, -3.8174376487731934, -3.7056992053985596, -3.593960762023926, -3.482222080230713, -3.370483636856079, -3.2587451934814453, -3.1470067501068115, -3.0352683067321777, -2.923529624938965, -2.811791181564331, -2.7000527381896973, -2.5883140563964844, -2.4765756130218506, -2.364837169647217, -2.253098726272583, -2.141360282897949, -2.0296218395233154, -1.9178833961486816, -1.8061448335647583, -1.6944063901901245, -1.5826679468154907, -1.4709293842315674, -1.3591909408569336, -1.2474524974822998, -1.135714054107666, -1.0239756107330322, -0.9122371077537537, -0.8004986047744751, -0.6887601613998413, -0.5770216584205627, -0.4652831554412842, -0.3535447120666504, -0.24180614948272705, -0.13006767630577087, -0.018329188227653503, 0.09340929985046387, 0.20514777302742004, 0.3168862462043762, 0.4286247491836548, 0.5403631925582886, 0.6521016955375671, 0.7638401985168457, 0.8755786418914795, 0.9873171448707581, 1.0990556478500366, 1.2107940912246704, 1.3225326538085938, 1.4342710971832275, 1.5460095405578613]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 10.0, 11.0, 24.0, 37.0, 57.0, 62.0, 70.0, 91.0, 117.0, 116.0, 91.0, 86.0, 67.0, 55.0, 40.0, 35.0, 18.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951565265655518, -1.451539158821106, -1.4079217910766602, -1.364304542541504, -1.320687174797058, -1.2770698070526123, -1.2334524393081665, -1.1898350715637207, -1.1462178230285645, -1.1026004552841187, -1.0589830875396729, -1.0153658390045166, -0.9717484712600708, -0.928131103515625, -0.8845137357711792, -0.8408963680267334, -0.7972790002822876, -0.7536616325378418, -0.7100443243980408, -0.666426956653595, -0.622809648513794, -0.5791922807693481, -0.5355749130249023, -0.49195757508277893, -0.4483402371406555, -0.4047228991985321, -0.3611055612564087, -0.3174881935119629, -0.2738708555698395, -0.23025351762771606, -0.18663614988327026, -0.14301881194114685, -0.09940135478973389, -0.05578400939702988, -0.012166664004325867, 0.03145068883895874, 0.07506802678108215, 0.11868536472320557, 0.16230273246765137, 0.20592007040977478, 0.2495374083518982, 0.2931547462940216, 0.336772084236145, 0.3803894519805908, 0.42400678992271423, 0.46762412786483765, 0.5112414956092834, 0.5548588037490845, 0.5984761714935303, 0.6420935392379761, 0.6857108473777771, 0.7293282151222229, 0.7729455232620239, 0.8165628910064697, 0.8601802587509155, 0.9037976264953613, 0.9474149346351624, 0.9910323023796082, 1.0346496105194092, 1.078266978263855, 1.1218843460083008, 1.165501594543457, 1.2091190814971924, 1.2527363300323486, 1.2963536977767944]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 1.0, 5.0, 6.0, 12.0, 8.0, 10.0, 21.0, 24.0, 36.0, 39.0, 71.0, 99.0, 133.0, 263.0, 477.0, 1021.0, 2673.0, 8411.0, 36275.0, 245820.0, 638527.0, 89748.0, 16991.0, 4528.0, 1615.0, 726.0, 376.0, 193.0, 155.0, 71.0, 58.0, 34.0, 38.0, 23.0, 16.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9052734375, -0.8780517578125, -0.850830078125, -0.8236083984375, -0.79638671875, -0.7691650390625, -0.741943359375, -0.7147216796875, -0.6875, -0.6602783203125, -0.633056640625, -0.6058349609375, -0.57861328125, -0.5513916015625, -0.524169921875, -0.4969482421875, -0.4697265625, -0.4425048828125, -0.415283203125, -0.3880615234375, -0.36083984375, -0.3336181640625, -0.306396484375, -0.2791748046875, -0.251953125, -0.2247314453125, -0.197509765625, -0.1702880859375, -0.14306640625, -0.1158447265625, -0.088623046875, -0.0614013671875, -0.0341796875, -0.0069580078125, 0.020263671875, 0.0474853515625, 0.07470703125, 0.1019287109375, 0.129150390625, 0.1563720703125, 0.18359375, 0.2108154296875, 0.238037109375, 0.2652587890625, 0.29248046875, 0.3197021484375, 0.346923828125, 0.3741455078125, 0.4013671875, 0.4285888671875, 0.455810546875, 0.4830322265625, 0.51025390625, 0.5374755859375, 0.564697265625, 0.5919189453125, 0.619140625, 0.6463623046875, 0.673583984375, 0.7008056640625, 0.72802734375, 0.7552490234375, 0.782470703125, 0.8096923828125, 0.8369140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 17.0, 39.0, 49.0, 73.0, 87.0, 103.0, 105.0, 106.0, 84.0, 89.0, 87.0, 50.0, 41.0, 29.0, 10.0, 10.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.2076873779296875, -0.196868896484375, -0.1860504150390625, -0.17523193359375, -0.1644134521484375, -0.153594970703125, -0.1427764892578125, -0.1319580078125, -0.1211395263671875, -0.110321044921875, -0.0995025634765625, -0.08868408203125, -0.0778656005859375, -0.067047119140625, -0.0562286376953125, -0.04541015625, -0.0345916748046875, -0.023773193359375, -0.0129547119140625, -0.00213623046875, 0.0086822509765625, 0.019500732421875, 0.0303192138671875, 0.0411376953125, 0.0519561767578125, 0.062774658203125, 0.0735931396484375, 0.08441162109375, 0.0952301025390625, 0.106048583984375, 0.1168670654296875, 0.127685546875, 0.1385040283203125, 0.149322509765625, 0.1601409912109375, 0.17095947265625, 0.1817779541015625, 0.192596435546875, 0.2034149169921875, 0.2142333984375, 0.2250518798828125, 0.235870361328125, 0.2466888427734375, 0.25750732421875, 0.2683258056640625, 0.279144287109375, 0.2899627685546875, 0.30078125, 0.3115997314453125, 0.322418212890625, 0.3332366943359375, 0.34405517578125, 0.3548736572265625, 0.365692138671875, 0.3765106201171875, 0.3873291015625, 0.3981475830078125, 0.408966064453125, 0.4197845458984375, 0.43060302734375, 0.4414215087890625, 0.452239990234375, 0.4630584716796875, 0.473876953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 8.0, 3.0, 11.0, 12.0, 18.0, 13.0, 20.0, 29.0, 46.0, 64.0, 90.0, 126.0, 245.0, 407.0, 712.0, 1424.0, 2882.0, 6443.0, 15797.0, 44378.0, 171535.0, 562275.0, 169708.0, 44304.0, 15644.0, 6337.0, 2860.0, 1409.0, 702.0, 397.0, 223.0, 135.0, 91.0, 56.0, 35.0, 31.0, 19.0, 16.0, 12.0, 14.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.50048828125, -0.4855461120605469, -0.47060394287109375, -0.4556617736816406, -0.4407196044921875, -0.4257774353027344, -0.41083526611328125, -0.3958930969238281, -0.380950927734375, -0.3660087585449219, -0.35106658935546875, -0.3361244201660156, -0.3211822509765625, -0.3062400817871094, -0.29129791259765625, -0.2763557434082031, -0.26141357421875, -0.24647140502929688, -0.23152923583984375, -0.21658706665039062, -0.2016448974609375, -0.18670272827148438, -0.17176055908203125, -0.15681838989257812, -0.141876220703125, -0.12693405151367188, -0.11199188232421875, -0.09704971313476562, -0.0821075439453125, -0.06716537475585938, -0.05222320556640625, -0.037281036376953125, -0.0223388671875, -0.007396697998046875, 0.00754547119140625, 0.022487640380859375, 0.0374298095703125, 0.052371978759765625, 0.06731414794921875, 0.08225631713867188, 0.097198486328125, 0.11214065551757812, 0.12708282470703125, 0.14202499389648438, 0.1569671630859375, 0.17190933227539062, 0.18685150146484375, 0.20179367065429688, 0.21673583984375, 0.23167800903320312, 0.24662017822265625, 0.2615623474121094, 0.2765045166015625, 0.2914466857910156, 0.30638885498046875, 0.3213310241699219, 0.336273193359375, 0.3512153625488281, 0.36615753173828125, 0.3810997009277344, 0.3960418701171875, 0.4109840393066406, 0.42592620849609375, 0.4408683776855469, 0.455810546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 9.0, 15.0, 21.0, 19.0, 23.0, 26.0, 28.0, 48.0, 41.0, 51.0, 45.0, 57.0, 50.0, 55.0, 47.0, 59.0, 47.0, 40.0, 43.0, 46.0, 32.0, 33.0, 27.0, 21.0, 21.0, 17.0, 13.0, 7.0, 4.0, 5.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6499481201171875, -0.627044677734375, -0.6041412353515625, -0.58123779296875, -0.5583343505859375, -0.535430908203125, -0.5125274658203125, -0.4896240234375, -0.4667205810546875, -0.443817138671875, -0.4209136962890625, -0.39801025390625, -0.3751068115234375, -0.352203369140625, -0.3292999267578125, -0.306396484375, -0.2834930419921875, -0.260589599609375, -0.2376861572265625, -0.21478271484375, -0.1918792724609375, -0.168975830078125, -0.1460723876953125, -0.1231689453125, -0.1002655029296875, -0.077362060546875, -0.0544586181640625, -0.03155517578125, -0.0086517333984375, 0.014251708984375, 0.0371551513671875, 0.06005859375, 0.0829620361328125, 0.105865478515625, 0.1287689208984375, 0.15167236328125, 0.1745758056640625, 0.197479248046875, 0.2203826904296875, 0.2432861328125, 0.2661895751953125, 0.289093017578125, 0.3119964599609375, 0.33489990234375, 0.3578033447265625, 0.380706787109375, 0.4036102294921875, 0.426513671875, 0.4494171142578125, 0.472320556640625, 0.4952239990234375, 0.51812744140625, 0.5410308837890625, 0.563934326171875, 0.5868377685546875, 0.6097412109375, 0.6326446533203125, 0.655548095703125, 0.6784515380859375, 0.70135498046875, 0.7242584228515625, 0.747161865234375, 0.7700653076171875, 0.79296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 18.0, 28.0, 54.0, 80.0, 147.0, 290.0, 793.0, 2815.0, 23577.0, 755489.0, 253252.0, 9333.0, 1639.0, 549.0, 209.0, 105.0, 61.0, 34.0, 15.0, 20.0, 10.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28275299072265625, -0.2732696533203125, -0.26378631591796875, -0.254302978515625, -0.24481964111328125, -0.2353363037109375, -0.22585296630859375, -0.21636962890625, -0.20688629150390625, -0.1974029541015625, -0.18791961669921875, -0.178436279296875, -0.16895294189453125, -0.1594696044921875, -0.14998626708984375, -0.1405029296875, -0.13101959228515625, -0.1215362548828125, -0.11205291748046875, -0.102569580078125, -0.09308624267578125, -0.0836029052734375, -0.07411956787109375, -0.06463623046875, -0.05515289306640625, -0.0456695556640625, -0.03618621826171875, -0.026702880859375, -0.01721954345703125, -0.0077362060546875, 0.00174713134765625, 0.01123046875, 0.02071380615234375, 0.0301971435546875, 0.03968048095703125, 0.049163818359375, 0.05864715576171875, 0.0681304931640625, 0.07761383056640625, 0.08709716796875, 0.09658050537109375, 0.1060638427734375, 0.11554718017578125, 0.125030517578125, 0.13451385498046875, 0.1439971923828125, 0.15348052978515625, 0.1629638671875, 0.17244720458984375, 0.1819305419921875, 0.19141387939453125, 0.200897216796875, 0.21038055419921875, 0.2198638916015625, 0.22934722900390625, 0.23883056640625, 0.24831390380859375, 0.2577972412109375, 0.26728057861328125, 0.276763916015625, 0.28624725341796875, 0.2957305908203125, 0.30521392822265625, 0.314697265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 3.0, 7.0, 9.0, 5.0, 16.0, 13.0, 24.0, 35.0, 51.0, 65.0, 74.0, 83.0, 102.0, 92.0, 85.0, 70.0, 61.0, 49.0, 36.0, 25.0, 28.0, 18.0, 11.0, 8.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.836652755737305e-05, -6.646942347288132e-05, -6.457231938838959e-05, -6.267521530389786e-05, -6.077811121940613e-05, -5.88810071349144e-05, -5.698390305042267e-05, -5.508679896593094e-05, -5.318969488143921e-05, -5.129259079694748e-05, -4.939548671245575e-05, -4.749838262796402e-05, -4.560127854347229e-05, -4.370417445898056e-05, -4.180707037448883e-05, -3.99099662899971e-05, -3.801286220550537e-05, -3.611575812101364e-05, -3.421865403652191e-05, -3.232154995203018e-05, -3.0424445867538452e-05, -2.8527341783046722e-05, -2.6630237698554993e-05, -2.4733133614063263e-05, -2.2836029529571533e-05, -2.0938925445079803e-05, -1.9041821360588074e-05, -1.7144717276096344e-05, -1.5247613191604614e-05, -1.3350509107112885e-05, -1.1453405022621155e-05, -9.556300938129425e-06, -7.659196853637695e-06, -5.7620927691459656e-06, -3.864988684654236e-06, -1.967884600162506e-06, -7.078051567077637e-08, 1.8263235688209534e-06, 3.723427653312683e-06, 5.620531737804413e-06, 7.517635822296143e-06, 9.414739906787872e-06, 1.1311843991279602e-05, 1.3208948075771332e-05, 1.5106052160263062e-05, 1.700315624475479e-05, 1.890026032924652e-05, 2.079736441373825e-05, 2.269446849822998e-05, 2.459157258272171e-05, 2.648867666721344e-05, 2.838578075170517e-05, 3.02828848361969e-05, 3.217998892068863e-05, 3.407709300518036e-05, 3.597419708967209e-05, 3.787130117416382e-05, 3.976840525865555e-05, 4.166550934314728e-05, 4.356261342763901e-05, 4.545971751213074e-05, 4.735682159662247e-05, 4.92539256811142e-05, 5.1151029765605927e-05, 5.3048133850097656e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 13.0, 32.0, 54.0, 103.0, 166.0, 312.0, 654.0, 1626.0, 5462.0, 31794.0, 487183.0, 481690.0, 31081.0, 5425.0, 1625.0, 623.0, 276.0, 179.0, 96.0, 61.0, 25.0, 13.0, 13.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.25830078125, -0.25150299072265625, -0.2447052001953125, -0.23790740966796875, -0.231109619140625, -0.22431182861328125, -0.2175140380859375, -0.21071624755859375, -0.20391845703125, -0.19712066650390625, -0.1903228759765625, -0.18352508544921875, -0.176727294921875, -0.16992950439453125, -0.1631317138671875, -0.15633392333984375, -0.1495361328125, -0.14273834228515625, -0.1359405517578125, -0.12914276123046875, -0.122344970703125, -0.11554718017578125, -0.1087493896484375, -0.10195159912109375, -0.09515380859375, -0.08835601806640625, -0.0815582275390625, -0.07476043701171875, -0.067962646484375, -0.06116485595703125, -0.0543670654296875, -0.04756927490234375, -0.040771484375, -0.03397369384765625, -0.0271759033203125, -0.02037811279296875, -0.013580322265625, -0.00678253173828125, 1.52587890625e-05, 0.00681304931640625, 0.01361083984375, 0.02040863037109375, 0.0272064208984375, 0.03400421142578125, 0.040802001953125, 0.04759979248046875, 0.0543975830078125, 0.06119537353515625, 0.0679931640625, 0.07479095458984375, 0.0815887451171875, 0.08838653564453125, 0.095184326171875, 0.10198211669921875, 0.1087799072265625, 0.11557769775390625, 0.12237548828125, 0.12917327880859375, 0.1359710693359375, 0.14276885986328125, 0.149566650390625, 0.15636444091796875, 0.1631622314453125, 0.16996002197265625, 0.1767578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 18.0, 32.0, 32.0, 67.0, 113.0, 151.0, 168.0, 142.0, 108.0, 62.0, 38.0, 20.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.26410675048828125, -0.2562408447265625, -0.24837493896484375, -0.240509033203125, -0.23264312744140625, -0.2247772216796875, -0.21691131591796875, -0.20904541015625, -0.20117950439453125, -0.1933135986328125, -0.18544769287109375, -0.177581787109375, -0.16971588134765625, -0.1618499755859375, -0.15398406982421875, -0.1461181640625, -0.13825225830078125, -0.1303863525390625, -0.12252044677734375, -0.114654541015625, -0.10678863525390625, -0.0989227294921875, -0.09105682373046875, -0.08319091796875, -0.07532501220703125, -0.0674591064453125, -0.05959320068359375, -0.051727294921875, -0.04386138916015625, -0.0359954833984375, -0.02812957763671875, -0.020263671875, -0.01239776611328125, -0.0045318603515625, 0.00333404541015625, 0.011199951171875, 0.01906585693359375, 0.0269317626953125, 0.03479766845703125, 0.04266357421875, 0.05052947998046875, 0.0583953857421875, 0.06626129150390625, 0.074127197265625, 0.08199310302734375, 0.0898590087890625, 0.09772491455078125, 0.1055908203125, 0.11345672607421875, 0.1213226318359375, 0.12918853759765625, 0.137054443359375, 0.14492034912109375, 0.1527862548828125, 0.16065216064453125, 0.16851806640625, 0.17638397216796875, 0.1842498779296875, 0.19211578369140625, 0.199981689453125, 0.20784759521484375, 0.2157135009765625, 0.22357940673828125, 0.2314453125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 12.0, 19.0, 52.0, 129.0, 414.0, 266.0, 70.0, 17.0, 17.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.617115020751953, -3.355769157409668, -3.094423294067383, -2.8330774307250977, -2.5717315673828125, -2.3103857040405273, -2.049039602279663, -1.787693738937378, -1.5263478755950928, -1.2650020122528076, -1.0036561489105225, -0.7423101663589478, -0.4809643030166626, -0.21961843967437744, 0.041727542877197266, 0.3030734062194824, 0.5644192695617676, 0.8257651329040527, 1.087110996246338, 1.3484569787979126, 1.6098028421401978, 1.871148705482483, 2.1324946880340576, 2.3938405513763428, 2.655186414718628, 2.916532278060913, 3.1778781414031982, 3.4392242431640625, 3.7005701065063477, 3.961915969848633, 4.223261833190918, 4.484607696533203, 4.745953559875488, 5.007299423217773, 5.268645286560059, 5.529991149902344, 5.791337013244629, 6.052682876586914, 6.314028739929199, 6.575374603271484, 6.8367204666137695, 7.098066329956055, 7.35941219329834, 7.620758056640625, 7.88210391998291, 8.143449783325195, 8.40479564666748, 8.666141510009766, 8.927488327026367, 9.188834190368652, 9.450180053710938, 9.711525917053223, 9.972871780395508, 10.234217643737793, 10.495563507080078, 10.756909370422363, 11.018255233764648, 11.279601097106934, 11.540946960449219, 11.802292823791504, 12.063638687133789, 12.324984550476074, 12.58633041381836, 12.847676277160645, 13.10902214050293]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 10.0, 11.0, 8.0, 14.0, 15.0, 14.0, 13.0, 23.0, 19.0, 35.0, 24.0, 29.0, 26.0, 34.0, 44.0, 48.0, 41.0, 51.0, 57.0, 54.0, 39.0, 40.0, 42.0, 43.0, 29.0, 33.0, 29.0, 32.0, 27.0, 25.0, 12.0, 20.0, 13.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.3461103439331055, -4.223694324493408, -4.101278781890869, -3.978863000869751, -3.856447219848633, -3.7340314388275146, -3.6116156578063965, -3.489199638366699, -3.36678409576416, -3.244368314743042, -3.121952533721924, -2.9995367527008057, -2.8771209716796875, -2.7547051906585693, -2.632289409637451, -2.509873390197754, -2.3874576091766357, -2.2650418281555176, -2.1426260471343994, -2.0202102661132812, -1.897794485092163, -1.775378704071045, -1.6529628038406372, -1.530547022819519, -1.4081312417984009, -1.2857154607772827, -1.1632996797561646, -1.0408837795257568, -0.9184680581092834, -0.7960522770881653, -0.6736364364624023, -0.5512206554412842, -0.4288046360015869, -0.30638885498046875, -0.1839730441570282, -0.061557233333587646, 0.06085854768753052, 0.18327432870864868, 0.3056901693344116, 0.4281059503555298, 0.550521731376648, 0.6729375123977661, 0.7953532934188843, 0.9177691340446472, 1.0401849746704102, 1.1626007556915283, 1.2850165367126465, 1.4074323177337646, 1.5298480987548828, 1.652263879776001, 1.7746796607971191, 1.8970954418182373, 2.0195112228393555, 2.1419270038604736, 2.264342784881592, 2.386758804321289, 2.509174346923828, 2.6315901279449463, 2.7540059089660645, 2.8764216899871826, 2.998837471008301, 3.121253252029419, 3.243669033050537, 3.3660850524902344, 3.4885008335113525]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 8.0, 9.0, 12.0, 20.0, 30.0, 56.0, 94.0, 150.0, 376.0, 873.0, 3152.0, 27327.0, 4089111.0, 65809.0, 4859.0, 1333.0, 481.0, 244.0, 125.0, 77.0, 42.0, 37.0, 14.0, 12.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1382904052734375, -1.080291748046875, -1.0222930908203125, -0.96429443359375, -0.9062957763671875, -0.848297119140625, -0.7902984619140625, -0.7322998046875, -0.6743011474609375, -0.616302490234375, -0.5583038330078125, -0.50030517578125, -0.4423065185546875, -0.384307861328125, -0.3263092041015625, -0.268310546875, -0.2103118896484375, -0.152313232421875, -0.0943145751953125, -0.03631591796875, 0.0216827392578125, 0.079681396484375, 0.1376800537109375, 0.1956787109375, 0.2536773681640625, 0.311676025390625, 0.3696746826171875, 0.42767333984375, 0.4856719970703125, 0.543670654296875, 0.6016693115234375, 0.65966796875, 0.7176666259765625, 0.775665283203125, 0.8336639404296875, 0.89166259765625, 0.9496612548828125, 1.007659912109375, 1.0656585693359375, 1.1236572265625, 1.1816558837890625, 1.239654541015625, 1.2976531982421875, 1.35565185546875, 1.4136505126953125, 1.471649169921875, 1.5296478271484375, 1.587646484375, 1.6456451416015625, 1.703643798828125, 1.7616424560546875, 1.81964111328125, 1.8776397705078125, 1.935638427734375, 1.9936370849609375, 2.0516357421875, 2.1096343994140625, 2.167633056640625, 2.2256317138671875, 2.28363037109375, 2.3416290283203125, 2.399627685546875, 2.4576263427734375, 2.515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 14.0, 21.0, 30.0, 43.0, 47.0, 75.0, 77.0, 89.0, 71.0, 84.0, 86.0, 94.0, 56.0, 43.0, 48.0, 43.0, 19.0, 23.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.19637107849121094, -0.18607711791992188, -0.1757831573486328, -0.16548919677734375, -0.1551952362060547, -0.14490127563476562, -0.13460731506347656, -0.1243133544921875, -0.11401939392089844, -0.10372543334960938, -0.09343147277832031, -0.08313751220703125, -0.07284355163574219, -0.06254959106445312, -0.05225563049316406, -0.041961669921875, -0.03166770935058594, -0.021373748779296875, -0.011079788208007812, -0.00078582763671875, 0.009508132934570312, 0.019802093505859375, 0.030096054077148438, 0.0403900146484375, 0.05068397521972656, 0.060977935791015625, 0.07127189636230469, 0.08156585693359375, 0.09185981750488281, 0.10215377807617188, 0.11244773864746094, 0.12274169921875, 0.13303565979003906, 0.14332962036132812, 0.1536235809326172, 0.16391754150390625, 0.1742115020751953, 0.18450546264648438, 0.19479942321777344, 0.2050933837890625, 0.21538734436035156, 0.22568130493164062, 0.2359752655029297, 0.24626922607421875, 0.2565631866455078, 0.2668571472167969, 0.27715110778808594, 0.287445068359375, 0.29773902893066406, 0.3080329895019531, 0.3183269500732422, 0.32862091064453125, 0.3389148712158203, 0.3492088317871094, 0.35950279235839844, 0.3697967529296875, 0.38009071350097656, 0.3903846740722656, 0.4006786346435547, 0.41097259521484375, 0.4212665557861328, 0.4315605163574219, 0.44185447692871094, 0.4521484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 14.0, 12.0, 18.0, 17.0, 34.0, 52.0, 63.0, 109.0, 159.0, 275.0, 518.0, 1214.0, 3445.0, 14698.0, 889869.0, 3259387.0, 17867.0, 3910.0, 1269.0, 590.0, 310.0, 148.0, 88.0, 77.0, 45.0, 25.0, 25.0, 16.0, 12.0, 8.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9384765625, -0.9072418212890625, -0.876007080078125, -0.8447723388671875, -0.81353759765625, -0.7823028564453125, -0.751068115234375, -0.7198333740234375, -0.6885986328125, -0.6573638916015625, -0.626129150390625, -0.5948944091796875, -0.56365966796875, -0.5324249267578125, -0.501190185546875, -0.4699554443359375, -0.438720703125, -0.4074859619140625, -0.376251220703125, -0.3450164794921875, -0.31378173828125, -0.2825469970703125, -0.251312255859375, -0.2200775146484375, -0.1888427734375, -0.1576080322265625, -0.126373291015625, -0.0951385498046875, -0.06390380859375, -0.0326690673828125, -0.001434326171875, 0.0298004150390625, 0.06103515625, 0.0922698974609375, 0.123504638671875, 0.1547393798828125, 0.18597412109375, 0.2172088623046875, 0.248443603515625, 0.2796783447265625, 0.3109130859375, 0.3421478271484375, 0.373382568359375, 0.4046173095703125, 0.43585205078125, 0.4670867919921875, 0.498321533203125, 0.5295562744140625, 0.560791015625, 0.5920257568359375, 0.623260498046875, 0.6544952392578125, 0.68572998046875, 0.7169647216796875, 0.748199462890625, 0.7794342041015625, 0.8106689453125, 0.8419036865234375, 0.873138427734375, 0.9043731689453125, 0.93560791015625, 0.9668426513671875, 0.998077392578125, 1.0293121337890625, 1.060546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 9.0, 27.0, 61.0, 201.0, 2802.0, 770.0, 114.0, 36.0, 15.0, 6.0, 12.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7998046875, -0.7786636352539062, -0.7575225830078125, -0.7363815307617188, -0.715240478515625, -0.6940994262695312, -0.6729583740234375, -0.6518173217773438, -0.63067626953125, -0.6095352172851562, -0.5883941650390625, -0.5672531127929688, -0.546112060546875, -0.5249710083007812, -0.5038299560546875, -0.48268890380859375, -0.4615478515625, -0.44040679931640625, -0.4192657470703125, -0.39812469482421875, -0.376983642578125, -0.35584259033203125, -0.3347015380859375, -0.31356048583984375, -0.29241943359375, -0.27127838134765625, -0.2501373291015625, -0.22899627685546875, -0.207855224609375, -0.18671417236328125, -0.1655731201171875, -0.14443206787109375, -0.123291015625, -0.10214996337890625, -0.0810089111328125, -0.05986785888671875, -0.038726806640625, -0.01758575439453125, 0.0035552978515625, 0.02469635009765625, 0.04583740234375, 0.06697845458984375, 0.0881195068359375, 0.10926055908203125, 0.130401611328125, 0.15154266357421875, 0.1726837158203125, 0.19382476806640625, 0.2149658203125, 0.23610687255859375, 0.2572479248046875, 0.27838897705078125, 0.299530029296875, 0.32067108154296875, 0.3418121337890625, 0.36295318603515625, 0.38409423828125, 0.40523529052734375, 0.4263763427734375, 0.44751739501953125, 0.468658447265625, 0.48979949951171875, 0.5109405517578125, 0.5320816040039062, 0.55322265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 16.0, 76.0, 524.0, 356.0, 28.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.893589496612549, -6.729454517364502, -6.565319538116455, -6.401184558868408, -6.2370500564575195, -6.072915077209473, -5.908780097961426, -5.744645118713379, -5.580510139465332, -5.416375160217285, -5.252240180969238, -5.088105201721191, -4.9239702224731445, -4.759835720062256, -4.595700740814209, -4.431565761566162, -4.267430782318115, -4.103295803070068, -3.9391608238220215, -3.7750260829925537, -3.610891103744507, -3.44675612449646, -3.282621383666992, -3.1184864044189453, -2.9543514251708984, -2.7902164459228516, -2.6260814666748047, -2.461946725845337, -2.29781174659729, -2.133676767349243, -1.9695419073104858, -1.8054070472717285, -1.6412720680236816, -1.4771370887756348, -1.3130022287368774, -1.1488673686981201, -0.9847323894500732, -0.8205974698066711, -0.656462550163269, -0.4923276901245117, -0.32819271087646484, -0.16405779123306274, 7.712841033935547e-05, 0.16421204805374146, 0.32834696769714355, 0.49248188734054565, 0.6566168069839478, 0.8207516670227051, 0.984886646270752, 1.1490216255187988, 1.3131564855575562, 1.4772913455963135, 1.6414263248443604, 1.8055613040924072, 1.9696961641311646, 2.133831024169922, 2.2979660034179688, 2.4621009826660156, 2.6262359619140625, 2.7903707027435303, 2.954505681991577, 3.118640661239624, 3.282775402069092, 3.4469103813171387, 3.6110453605651855]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 14.0, 18.0, 19.0, 16.0, 32.0, 41.0, 36.0, 47.0, 46.0, 58.0, 54.0, 56.0, 63.0, 65.0, 62.0, 55.0, 59.0, 41.0, 32.0, 41.0, 24.0, 30.0, 22.0, 12.0, 10.0, 7.0, 14.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9871852397918701, -0.9456499814987183, -0.9041147828102112, -0.8625795245170593, -0.8210443258285522, -0.7795090675354004, -0.7379738092422485, -0.6964385509490967, -0.6549033522605896, -0.6133680939674377, -0.5718328952789307, -0.5302976369857788, -0.48876240849494934, -0.4472271800041199, -0.405691921710968, -0.36415669322013855, -0.3226214647293091, -0.2810862362384796, -0.23955099284648895, -0.1980157494544983, -0.15648052096366882, -0.11494529247283936, -0.0734100490808487, -0.03187480568885803, 0.009660422801971436, 0.0511956587433815, 0.09273089468479156, 0.13426613807678223, 0.1758013665676117, 0.21733659505844116, 0.258871853351593, 0.3004070818424225, 0.3419424295425415, 0.38347765803337097, 0.42501288652420044, 0.4665481448173523, 0.5080833435058594, 0.5496186017990112, 0.5911538600921631, 0.6326891183853149, 0.674224317073822, 0.7157595753669739, 0.757294774055481, 0.7988300323486328, 0.8403652906417847, 0.8819004893302917, 0.9234357476234436, 0.9649709463119507, 1.0065062046051025, 1.0480414628982544, 1.0895767211914062, 1.1311118602752686, 1.1726471185684204, 1.2141823768615723, 1.2557176351547241, 1.297252893447876, 1.3387880325317383, 1.3803232908248901, 1.421858549118042, 1.4633936882019043, 1.5049289464950562, 1.546464204788208, 1.5879994630813599, 1.6295347213745117, 1.6710699796676636]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 13.0, 17.0, 45.0, 49.0, 93.0, 201.0, 398.0, 1051.0, 3155.0, 15260.0, 151394.0, 805721.0, 59465.0, 8150.0, 2106.0, 781.0, 301.0, 150.0, 75.0, 49.0, 17.0, 21.0, 11.0, 2.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5679168701171875, -1.523529052734375, -1.4791412353515625, -1.43475341796875, -1.3903656005859375, -1.345977783203125, -1.3015899658203125, -1.2572021484375, -1.2128143310546875, -1.168426513671875, -1.1240386962890625, -1.07965087890625, -1.0352630615234375, -0.990875244140625, -0.9464874267578125, -0.902099609375, -0.8577117919921875, -0.813323974609375, -0.7689361572265625, -0.72454833984375, -0.6801605224609375, -0.635772705078125, -0.5913848876953125, -0.5469970703125, -0.5026092529296875, -0.458221435546875, -0.4138336181640625, -0.36944580078125, -0.3250579833984375, -0.280670166015625, -0.2362823486328125, -0.19189453125, -0.1475067138671875, -0.103118896484375, -0.0587310791015625, -0.01434326171875, 0.0300445556640625, 0.074432373046875, 0.1188201904296875, 0.1632080078125, 0.2075958251953125, 0.251983642578125, 0.2963714599609375, 0.34075927734375, 0.3851470947265625, 0.429534912109375, 0.4739227294921875, 0.518310546875, 0.5626983642578125, 0.607086181640625, 0.6514739990234375, 0.69586181640625, 0.7402496337890625, 0.784637451171875, 0.8290252685546875, 0.8734130859375, 0.9178009033203125, 0.962188720703125, 1.0065765380859375, 1.05096435546875, 1.0953521728515625, 1.139739990234375, 1.1841278076171875, 1.228515625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 18.0, 23.0, 27.0, 38.0, 50.0, 65.0, 79.0, 84.0, 71.0, 79.0, 97.0, 99.0, 58.0, 45.0, 40.0, 34.0, 25.0, 23.0, 14.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.20787620544433594, -0.19761276245117188, -0.1873493194580078, -0.17708587646484375, -0.1668224334716797, -0.15655899047851562, -0.14629554748535156, -0.1360321044921875, -0.12576866149902344, -0.11550521850585938, -0.10524177551269531, -0.09497833251953125, -0.08471488952636719, -0.07445144653320312, -0.06418800354003906, -0.053924560546875, -0.04366111755371094, -0.033397674560546875, -0.023134231567382812, -0.01287078857421875, -0.0026073455810546875, 0.007656097412109375, 0.017919540405273438, 0.0281829833984375, 0.03844642639160156, 0.048709869384765625, 0.05897331237792969, 0.06923675537109375, 0.07950019836425781, 0.08976364135742188, 0.10002708435058594, 0.11029052734375, 0.12055397033691406, 0.13081741333007812, 0.1410808563232422, 0.15134429931640625, 0.1616077423095703, 0.17187118530273438, 0.18213462829589844, 0.1923980712890625, 0.20266151428222656, 0.21292495727539062, 0.2231884002685547, 0.23345184326171875, 0.2437152862548828, 0.2539787292480469, 0.26424217224121094, 0.274505615234375, 0.28476905822753906, 0.2950325012207031, 0.3052959442138672, 0.31555938720703125, 0.3258228302001953, 0.3360862731933594, 0.34634971618652344, 0.3566131591796875, 0.36687660217285156, 0.3771400451660156, 0.3874034881591797, 0.39766693115234375, 0.4079303741455078, 0.4181938171386719, 0.42845726013183594, 0.438720703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 14.0, 19.0, 21.0, 23.0, 34.0, 70.0, 86.0, 130.0, 251.0, 582.0, 1170.0, 2606.0, 7158.0, 25499.0, 128440.0, 696569.0, 145571.0, 27589.0, 7570.0, 2725.0, 1153.0, 518.0, 267.0, 170.0, 83.0, 71.0, 35.0, 22.0, 12.0, 10.0, 13.0, 11.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.630859375, -0.6094970703125, -0.588134765625, -0.5667724609375, -0.54541015625, -0.5240478515625, -0.502685546875, -0.4813232421875, -0.4599609375, -0.4385986328125, -0.417236328125, -0.3958740234375, -0.37451171875, -0.3531494140625, -0.331787109375, -0.3104248046875, -0.2890625, -0.2677001953125, -0.246337890625, -0.2249755859375, -0.20361328125, -0.1822509765625, -0.160888671875, -0.1395263671875, -0.1181640625, -0.0968017578125, -0.075439453125, -0.0540771484375, -0.03271484375, -0.0113525390625, 0.010009765625, 0.0313720703125, 0.052734375, 0.0740966796875, 0.095458984375, 0.1168212890625, 0.13818359375, 0.1595458984375, 0.180908203125, 0.2022705078125, 0.2236328125, 0.2449951171875, 0.266357421875, 0.2877197265625, 0.30908203125, 0.3304443359375, 0.351806640625, 0.3731689453125, 0.39453125, 0.4158935546875, 0.437255859375, 0.4586181640625, 0.47998046875, 0.5013427734375, 0.522705078125, 0.5440673828125, 0.5654296875, 0.5867919921875, 0.608154296875, 0.6295166015625, 0.65087890625, 0.6722412109375, 0.693603515625, 0.7149658203125, 0.736328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 3.0, 9.0, 22.0, 23.0, 22.0, 22.0, 40.0, 42.0, 39.0, 39.0, 58.0, 64.0, 73.0, 57.0, 71.0, 53.0, 57.0, 59.0, 40.0, 46.0, 32.0, 38.0, 19.0, 18.0, 12.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8495101928710938, -0.8186492919921875, -0.7877883911132812, -0.756927490234375, -0.7260665893554688, -0.6952056884765625, -0.6643447875976562, -0.63348388671875, -0.6026229858398438, -0.5717620849609375, -0.5409011840820312, -0.510040283203125, -0.47917938232421875, -0.4483184814453125, -0.41745758056640625, -0.3865966796875, -0.35573577880859375, -0.3248748779296875, -0.29401397705078125, -0.263153076171875, -0.23229217529296875, -0.2014312744140625, -0.17057037353515625, -0.13970947265625, -0.10884857177734375, -0.0779876708984375, -0.04712677001953125, -0.016265869140625, 0.01459503173828125, 0.0454559326171875, 0.07631683349609375, 0.107177734375, 0.13803863525390625, 0.1688995361328125, 0.19976043701171875, 0.230621337890625, 0.26148223876953125, 0.2923431396484375, 0.32320404052734375, 0.35406494140625, 0.38492584228515625, 0.4157867431640625, 0.44664764404296875, 0.477508544921875, 0.5083694458007812, 0.5392303466796875, 0.5700912475585938, 0.6009521484375, 0.6318130493164062, 0.6626739501953125, 0.6935348510742188, 0.724395751953125, 0.7552566528320312, 0.7861175537109375, 0.8169784545898438, 0.84783935546875, 0.8787002563476562, 0.9095611572265625, 0.9404220581054688, 0.971282958984375, 1.0021438598632812, 1.0330047607421875, 1.0638656616210938, 1.0947265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 7.0, 8.0, 14.0, 37.0, 76.0, 180.0, 521.0, 7828.0, 1036360.0, 2881.0, 370.0, 141.0, 67.0, 34.0, 16.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.49609375, -2.418975830078125, -2.34185791015625, -2.264739990234375, -2.1876220703125, -2.110504150390625, -2.03338623046875, -1.956268310546875, -1.879150390625, -1.802032470703125, -1.72491455078125, -1.647796630859375, -1.5706787109375, -1.493560791015625, -1.41644287109375, -1.339324951171875, -1.26220703125, -1.185089111328125, -1.10797119140625, -1.030853271484375, -0.9537353515625, -0.876617431640625, -0.79949951171875, -0.722381591796875, -0.645263671875, -0.568145751953125, -0.49102783203125, -0.413909912109375, -0.3367919921875, -0.259674072265625, -0.18255615234375, -0.105438232421875, -0.0283203125, 0.048797607421875, 0.12591552734375, 0.203033447265625, 0.2801513671875, 0.357269287109375, 0.43438720703125, 0.511505126953125, 0.588623046875, 0.665740966796875, 0.74285888671875, 0.819976806640625, 0.8970947265625, 0.974212646484375, 1.05133056640625, 1.128448486328125, 1.20556640625, 1.282684326171875, 1.35980224609375, 1.436920166015625, 1.5140380859375, 1.591156005859375, 1.66827392578125, 1.745391845703125, 1.822509765625, 1.899627685546875, 1.97674560546875, 2.053863525390625, 2.1309814453125, 2.208099365234375, 2.28521728515625, 2.362335205078125, 2.439453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 28.0, 30.0, 50.0, 124.0, 164.0, 175.0, 184.0, 92.0, 64.0, 39.0, 13.0, 12.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016117095947265625, -0.00015746243298053741, -0.00015375390648841858, -0.00015004537999629974, -0.0001463368535041809, -0.00014262832701206207, -0.00013891980051994324, -0.0001352112740278244, -0.00013150274753570557, -0.00012779422104358673, -0.0001240856945514679, -0.00012037716805934906, -0.00011666864156723022, -0.00011296011507511139, -0.00010925158858299255, -0.00010554306209087372, -0.00010183453559875488, -9.812600910663605e-05, -9.441748261451721e-05, -9.070895612239838e-05, -8.700042963027954e-05, -8.32919031381607e-05, -7.958337664604187e-05, -7.587485015392303e-05, -7.21663236618042e-05, -6.845779716968536e-05, -6.474927067756653e-05, -6.104074418544769e-05, -5.733221769332886e-05, -5.362369120121002e-05, -4.9915164709091187e-05, -4.620663821697235e-05, -4.2498111724853516e-05, -3.878958523273468e-05, -3.5081058740615845e-05, -3.137253224849701e-05, -2.7664005756378174e-05, -2.395547926425934e-05, -2.0246952772140503e-05, -1.6538426280021667e-05, -1.2829899787902832e-05, -9.121373295783997e-06, -5.412846803665161e-06, -1.7043203115463257e-06, 2.0042061805725098e-06, 5.712732672691345e-06, 9.42125916481018e-06, 1.3129785656929016e-05, 1.683831214904785e-05, 2.0546838641166687e-05, 2.4255365133285522e-05, 2.7963891625404358e-05, 3.167241811752319e-05, 3.538094460964203e-05, 3.9089471101760864e-05, 4.27979975938797e-05, 4.6506524085998535e-05, 5.021505057811737e-05, 5.3923577070236206e-05, 5.763210356235504e-05, 6.134063005447388e-05, 6.504915654659271e-05, 6.875768303871155e-05, 7.246620953083038e-05, 7.617473602294922e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 15.0, 14.0, 51.0, 74.0, 135.0, 283.0, 1814.0, 1039705.0, 5665.0, 433.0, 152.0, 89.0, 53.0, 29.0, 19.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25, -2.158721923828125, -2.06744384765625, -1.976165771484375, -1.8848876953125, -1.793609619140625, -1.70233154296875, -1.611053466796875, -1.519775390625, -1.428497314453125, -1.33721923828125, -1.245941162109375, -1.1546630859375, -1.063385009765625, -0.97210693359375, -0.880828857421875, -0.78955078125, -0.698272705078125, -0.60699462890625, -0.515716552734375, -0.4244384765625, -0.333160400390625, -0.24188232421875, -0.150604248046875, -0.059326171875, 0.031951904296875, 0.12322998046875, 0.214508056640625, 0.3057861328125, 0.397064208984375, 0.48834228515625, 0.579620361328125, 0.6708984375, 0.762176513671875, 0.85345458984375, 0.944732666015625, 1.0360107421875, 1.127288818359375, 1.21856689453125, 1.309844970703125, 1.401123046875, 1.492401123046875, 1.58367919921875, 1.674957275390625, 1.7662353515625, 1.857513427734375, 1.94879150390625, 2.040069580078125, 2.13134765625, 2.222625732421875, 2.31390380859375, 2.405181884765625, 2.4964599609375, 2.587738037109375, 2.67901611328125, 2.770294189453125, 2.861572265625, 2.952850341796875, 3.04412841796875, 3.135406494140625, 3.2266845703125, 3.317962646484375, 3.40924072265625, 3.500518798828125, 3.591796875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 93.0, 807.0, 75.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8428192138671875, -1.760833740234375, -1.6788482666015625, -1.59686279296875, -1.5148773193359375, -1.432891845703125, -1.3509063720703125, -1.2689208984375, -1.1869354248046875, -1.104949951171875, -1.0229644775390625, -0.94097900390625, -0.8589935302734375, -0.777008056640625, -0.6950225830078125, -0.613037109375, -0.5310516357421875, -0.449066162109375, -0.3670806884765625, -0.28509521484375, -0.2031097412109375, -0.121124267578125, -0.0391387939453125, 0.0428466796875, 0.1248321533203125, 0.206817626953125, 0.2888031005859375, 0.37078857421875, 0.4527740478515625, 0.534759521484375, 0.6167449951171875, 0.69873046875, 0.7807159423828125, 0.862701416015625, 0.9446868896484375, 1.02667236328125, 1.1086578369140625, 1.190643310546875, 1.2726287841796875, 1.3546142578125, 1.4365997314453125, 1.518585205078125, 1.6005706787109375, 1.68255615234375, 1.7645416259765625, 1.846527099609375, 1.9285125732421875, 2.010498046875, 2.0924835205078125, 2.174468994140625, 2.2564544677734375, 2.33843994140625, 2.4204254150390625, 2.502410888671875, 2.5843963623046875, 2.6663818359375, 2.7483673095703125, 2.830352783203125, 2.9123382568359375, 2.99432373046875, 3.0763092041015625, 3.158294677734375, 3.2402801513671875, 3.322265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 22.0, 124.0, 768.0, 86.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.723486423492432, -5.8407769203186035, -4.958067417144775, -4.075357913970947, -3.192648410797119, -2.309938907623291, -1.427229404449463, -0.5445199012756348, 0.33818960189819336, 1.2208991050720215, 2.1036086082458496, 2.9863181114196777, 3.869027614593506, 4.751737117767334, 5.634446620941162, 6.51715612411499, 7.399865627288818, 8.282575607299805, 9.165285110473633, 10.047994613647461, 10.930704116821289, 11.813413619995117, 12.696123123168945, 13.578832626342773, 14.461542129516602, 15.34425163269043, 16.226961135864258, 17.109670639038086, 17.992380142211914, 18.875089645385742, 19.75779914855957, 20.6405086517334, 21.523216247558594, 22.405925750732422, 23.28863525390625, 24.171344757080078, 25.054054260253906, 25.936763763427734, 26.819473266601562, 27.70218276977539, 28.58489227294922, 29.467601776123047, 30.350311279296875, 31.233020782470703, 32.11573028564453, 32.99843978881836, 33.88114929199219, 34.763858795166016, 35.646568298339844, 36.52927780151367, 37.4119873046875, 38.29469680786133, 39.177406311035156, 40.060115814208984, 40.94282531738281, 41.82553482055664, 42.70824432373047, 43.5909538269043, 44.473663330078125, 45.35637283325195, 46.23908233642578, 47.12179183959961, 48.00450134277344, 48.887210845947266, 49.769920349121094]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 12.0, 7.0, 9.0, 20.0, 23.0, 23.0, 24.0, 24.0, 28.0, 22.0, 38.0, 38.0, 35.0, 37.0, 39.0, 40.0, 58.0, 42.0, 47.0, 55.0, 42.0, 41.0, 33.0, 32.0, 34.0, 28.0, 21.0, 20.0, 21.0, 18.0, 10.0, 14.0, 10.0, 5.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.195096969604492, -4.0719895362854, -3.9488821029663086, -3.825774669647217, -3.702667474746704, -3.5795600414276123, -3.4564526081085205, -3.3333451747894287, -3.210237979888916, -3.087130546569824, -2.9640231132507324, -2.8409156799316406, -2.717808485031128, -2.594701051712036, -2.4715936183929443, -2.3484861850738525, -2.2253787517547607, -2.102271318435669, -1.9791640043258667, -1.856056571006775, -1.7329492568969727, -1.6098418235778809, -1.486734390258789, -1.3636269569396973, -1.240519642829895, -1.1174122095108032, -0.994304895401001, -0.8711974620819092, -0.7480900883674622, -0.6249827146530151, -0.5018752813339233, -0.3787679076194763, -0.2556605339050293, -0.13255314528942108, -0.009445756673812866, 0.11366164684295654, 0.23676902055740356, 0.3598763942718506, 0.4829838275909424, 0.6060912013053894, 0.7291985750198364, 0.8523059487342834, 0.9754133224487305, 1.0985207557678223, 1.221628189086914, 1.3447355031967163, 1.467842936515808, 1.5909502506256104, 1.7140576839447021, 1.837165117263794, 1.9602724313735962, 2.0833797454833984, 2.2064871788024902, 2.329594612121582, 2.452702045440674, 2.5758094787597656, 2.6989169120788574, 2.822024345397949, 2.945131778717041, 3.068239212036133, 3.1913464069366455, 3.3144538402557373, 3.437561273574829, 3.560668706893921, 3.6837759017944336]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 16.0, 28.0, 56.0, 90.0, 195.0, 440.0, 1174.0, 4529.0, 32489.0, 4036158.0, 107605.0, 8437.0, 1827.0, 622.0, 258.0, 126.0, 78.0, 49.0, 32.0, 13.0, 18.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8597564697265625, -0.820098876953125, -0.7804412841796875, -0.74078369140625, -0.7011260986328125, -0.661468505859375, -0.6218109130859375, -0.5821533203125, -0.5424957275390625, -0.502838134765625, -0.4631805419921875, -0.42352294921875, -0.3838653564453125, -0.344207763671875, -0.3045501708984375, -0.264892578125, -0.2252349853515625, -0.185577392578125, -0.1459197998046875, -0.10626220703125, -0.0666046142578125, -0.026947021484375, 0.0127105712890625, 0.0523681640625, 0.0920257568359375, 0.131683349609375, 0.1713409423828125, 0.21099853515625, 0.2506561279296875, 0.290313720703125, 0.3299713134765625, 0.36962890625, 0.4092864990234375, 0.448944091796875, 0.4886016845703125, 0.52825927734375, 0.5679168701171875, 0.607574462890625, 0.6472320556640625, 0.6868896484375, 0.7265472412109375, 0.766204833984375, 0.8058624267578125, 0.84552001953125, 0.8851776123046875, 0.924835205078125, 0.9644927978515625, 1.004150390625, 1.0438079833984375, 1.083465576171875, 1.1231231689453125, 1.16278076171875, 1.2024383544921875, 1.242095947265625, 1.2817535400390625, 1.3214111328125, 1.3610687255859375, 1.400726318359375, 1.4403839111328125, 1.48004150390625, 1.5196990966796875, 1.559356689453125, 1.5990142822265625, 1.638671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 8.0, 5.0, 16.0, 16.0, 17.0, 36.0, 42.0, 46.0, 69.0, 85.0, 75.0, 68.0, 70.0, 88.0, 85.0, 59.0, 53.0, 29.0, 34.0, 21.0, 22.0, 20.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.21792984008789062, -0.20709991455078125, -0.19626998901367188, -0.1854400634765625, -0.17461013793945312, -0.16378021240234375, -0.15295028686523438, -0.142120361328125, -0.13129043579101562, -0.12046051025390625, -0.10963058471679688, -0.0988006591796875, -0.08797073364257812, -0.07714080810546875, -0.06631088256835938, -0.05548095703125, -0.044651031494140625, -0.03382110595703125, -0.022991180419921875, -0.0121612548828125, -0.001331329345703125, 0.00949859619140625, 0.020328521728515625, 0.031158447265625, 0.041988372802734375, 0.05281829833984375, 0.06364822387695312, 0.0744781494140625, 0.08530807495117188, 0.09613800048828125, 0.10696792602539062, 0.1177978515625, 0.12862777709960938, 0.13945770263671875, 0.15028762817382812, 0.1611175537109375, 0.17194747924804688, 0.18277740478515625, 0.19360733032226562, 0.204437255859375, 0.21526718139648438, 0.22609710693359375, 0.23692703247070312, 0.2477569580078125, 0.2585868835449219, 0.26941680908203125, 0.2802467346191406, 0.29107666015625, 0.3019065856933594, 0.31273651123046875, 0.3235664367675781, 0.3343963623046875, 0.3452262878417969, 0.35605621337890625, 0.3668861389160156, 0.377716064453125, 0.3885459899902344, 0.39937591552734375, 0.4102058410644531, 0.4210357666015625, 0.4318656921386719, 0.44269561767578125, 0.4535255432128906, 0.46435546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 14.0, 22.0, 36.0, 48.0, 67.0, 85.0, 127.0, 169.0, 230.0, 381.0, 653.0, 1371.0, 3891.0, 20553.0, 1511419.0, 2625212.0, 22152.0, 4427.0, 1607.0, 714.0, 376.0, 197.0, 170.0, 110.0, 78.0, 55.0, 33.0, 25.0, 19.0, 8.0, 11.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.01953125, -0.9912185668945312, -0.9629058837890625, -0.9345932006835938, -0.906280517578125, -0.8779678344726562, -0.8496551513671875, -0.8213424682617188, -0.79302978515625, -0.7647171020507812, -0.7364044189453125, -0.7080917358398438, -0.679779052734375, -0.6514663696289062, -0.6231536865234375, -0.5948410034179688, -0.5665283203125, -0.5382156372070312, -0.5099029541015625, -0.48159027099609375, -0.453277587890625, -0.42496490478515625, -0.3966522216796875, -0.36833953857421875, -0.34002685546875, -0.31171417236328125, -0.2834014892578125, -0.25508880615234375, -0.226776123046875, -0.19846343994140625, -0.1701507568359375, -0.14183807373046875, -0.113525390625, -0.08521270751953125, -0.0569000244140625, -0.02858734130859375, -0.000274658203125, 0.02803802490234375, 0.0563507080078125, 0.08466339111328125, 0.11297607421875, 0.14128875732421875, 0.1696014404296875, 0.19791412353515625, 0.226226806640625, 0.25453948974609375, 0.2828521728515625, 0.31116485595703125, 0.3394775390625, 0.36779022216796875, 0.3961029052734375, 0.42441558837890625, 0.452728271484375, 0.48104095458984375, 0.5093536376953125, 0.5376663208007812, 0.56597900390625, 0.5942916870117188, 0.6226043701171875, 0.6509170532226562, 0.679229736328125, 0.7075424194335938, 0.7358551025390625, 0.7641677856445312, 0.79248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 11.0, 32.0, 57.0, 240.0, 3055.0, 443.0, 110.0, 52.0, 28.0, 10.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5666122436523438, -0.5507049560546875, -0.5347976684570312, -0.518890380859375, -0.5029830932617188, -0.4870758056640625, -0.47116851806640625, -0.45526123046875, -0.43935394287109375, -0.4234466552734375, -0.40753936767578125, -0.391632080078125, -0.37572479248046875, -0.3598175048828125, -0.34391021728515625, -0.3280029296875, -0.31209564208984375, -0.2961883544921875, -0.28028106689453125, -0.264373779296875, -0.24846649169921875, -0.2325592041015625, -0.21665191650390625, -0.20074462890625, -0.18483734130859375, -0.1689300537109375, -0.15302276611328125, -0.137115478515625, -0.12120819091796875, -0.1053009033203125, -0.08939361572265625, -0.073486328125, -0.05757904052734375, -0.0416717529296875, -0.02576446533203125, -0.009857177734375, 0.00605010986328125, 0.0219573974609375, 0.03786468505859375, 0.05377197265625, 0.06967926025390625, 0.0855865478515625, 0.10149383544921875, 0.117401123046875, 0.13330841064453125, 0.1492156982421875, 0.16512298583984375, 0.1810302734375, 0.19693756103515625, 0.2128448486328125, 0.22875213623046875, 0.244659423828125, 0.26056671142578125, 0.2764739990234375, 0.29238128662109375, 0.30828857421875, 0.32419586181640625, 0.3401031494140625, 0.35601043701171875, 0.371917724609375, 0.38782501220703125, 0.4037322998046875, 0.41963958740234375, 0.435546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 2.0, 12.0, 7.0, 13.0, 20.0, 34.0, 65.0, 92.0, 145.0, 178.0, 137.0, 113.0, 68.0, 30.0, 23.0, 16.0, 12.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5903318524360657, -0.5571885108947754, -0.5240452289581299, -0.4909018874168396, -0.4577585458755493, -0.42461520433425903, -0.39147189259529114, -0.35832858085632324, -0.32518523931503296, -0.2920418977737427, -0.2588985860347748, -0.2257552593946457, -0.1926119327545166, -0.1594686061143875, -0.12632527947425842, -0.09318195283412933, -0.060038626194000244, -0.026895299553871155, 0.006248027086257935, 0.039391353726387024, 0.07253468036651611, 0.1056780070066452, 0.1388213336467743, 0.17196466028690338, 0.20510798692703247, 0.23825131356716156, 0.27139464020729065, 0.30453795194625854, 0.33768129348754883, 0.3708246350288391, 0.403967946767807, 0.4371112585067749, 0.47025465965270996, 0.5033980011940002, 0.5365413427352905, 0.569684624671936, 0.6028279662132263, 0.6359713077545166, 0.6691145896911621, 0.7022579312324524, 0.7354012727737427, 0.768544614315033, 0.8016879558563232, 0.8348312377929688, 0.867974579334259, 0.9011179208755493, 0.9342612028121948, 0.9674045443534851, 1.0005478858947754, 1.033691167831421, 1.066834568977356, 1.0999778509140015, 1.1331212520599365, 1.166264533996582, 1.1994078159332275, 1.2325512170791626, 1.265694499015808, 1.2988377809524536, 1.3319811820983887, 1.3651244640350342, 1.3982677459716797, 1.4314111471176147, 1.4645544290542603, 1.4976978302001953, 1.5308411121368408]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 16.0, 8.0, 17.0, 21.0, 25.0, 30.0, 33.0, 47.0, 42.0, 43.0, 48.0, 51.0, 52.0, 62.0, 65.0, 54.0, 50.0, 58.0, 37.0, 32.0, 42.0, 36.0, 26.0, 21.0, 23.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9422817230224609, -0.9109719395637512, -0.8796621561050415, -0.8483523726463318, -0.8170425891876221, -0.7857328653335571, -0.7544230818748474, -0.7231132984161377, -0.691803514957428, -0.6604937314987183, -0.6291839480400085, -0.5978741645812988, -0.5665644407272339, -0.5352545976638794, -0.5039448738098145, -0.47263509035110474, -0.441325306892395, -0.4100155234336853, -0.3787057399749756, -0.34739598631858826, -0.31608620285987854, -0.2847764194011688, -0.2534666657447815, -0.22215688228607178, -0.19084709882736206, -0.15953731536865234, -0.12822754681110382, -0.0969177708029747, -0.06560799479484558, -0.034298211336135864, -0.0029884427785873413, 0.02832132577896118, 0.0596311092376709, 0.09094088524580002, 0.12225066125392914, 0.15356042981147766, 0.18487021327018738, 0.2161799967288971, 0.24748976528644562, 0.27879953384399414, 0.31010931730270386, 0.3414191007614136, 0.3727288842201233, 0.4040386378765106, 0.43534842133522034, 0.46665820479393005, 0.4979679584503174, 0.5292777419090271, 0.5605875253677368, 0.5918973088264465, 0.6232070922851562, 0.654516875743866, 0.6858266592025757, 0.7171363830566406, 0.7484461665153503, 0.7797559499740601, 0.8110657334327698, 0.8423755168914795, 0.8736853003501892, 0.9049950838088989, 0.9363048076629639, 0.9676146507263184, 0.9989243745803833, 1.0302340984344482, 1.0615439414978027]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 6.0, 10.0, 14.0, 23.0, 34.0, 64.0, 132.0, 286.0, 859.0, 2747.0, 12801.0, 122402.0, 822274.0, 74218.0, 9409.0, 2059.0, 660.0, 252.0, 133.0, 68.0, 33.0, 30.0, 14.0, 9.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0582427978515625, -1.011016845703125, -0.9637908935546875, -0.91656494140625, -0.8693389892578125, -0.822113037109375, -0.7748870849609375, -0.7276611328125, -0.6804351806640625, -0.633209228515625, -0.5859832763671875, -0.53875732421875, -0.4915313720703125, -0.444305419921875, -0.3970794677734375, -0.349853515625, -0.3026275634765625, -0.255401611328125, -0.2081756591796875, -0.16094970703125, -0.1137237548828125, -0.066497802734375, -0.0192718505859375, 0.0279541015625, 0.0751800537109375, 0.122406005859375, 0.1696319580078125, 0.21685791015625, 0.2640838623046875, 0.311309814453125, 0.3585357666015625, 0.40576171875, 0.4529876708984375, 0.500213623046875, 0.5474395751953125, 0.59466552734375, 0.6418914794921875, 0.689117431640625, 0.7363433837890625, 0.7835693359375, 0.8307952880859375, 0.878021240234375, 0.9252471923828125, 0.97247314453125, 1.0196990966796875, 1.066925048828125, 1.1141510009765625, 1.161376953125, 1.2086029052734375, 1.255828857421875, 1.3030548095703125, 1.35028076171875, 1.3975067138671875, 1.444732666015625, 1.4919586181640625, 1.5391845703125, 1.5864105224609375, 1.633636474609375, 1.6808624267578125, 1.72808837890625, 1.7753143310546875, 1.822540283203125, 1.8697662353515625, 1.9169921875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 6.0, 19.0, 46.0, 35.0, 60.0, 82.0, 72.0, 80.0, 81.0, 86.0, 84.0, 70.0, 65.0, 50.0, 37.0, 30.0, 15.0, 22.0, 18.0, 3.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2294921875, -0.2179718017578125, -0.206451416015625, -0.1949310302734375, -0.18341064453125, -0.1718902587890625, -0.160369873046875, -0.1488494873046875, -0.1373291015625, -0.1258087158203125, -0.114288330078125, -0.1027679443359375, -0.09124755859375, -0.0797271728515625, -0.068206787109375, -0.0566864013671875, -0.045166015625, -0.0336456298828125, -0.022125244140625, -0.0106048583984375, 0.00091552734375, 0.0124359130859375, 0.023956298828125, 0.0354766845703125, 0.0469970703125, 0.0585174560546875, 0.070037841796875, 0.0815582275390625, 0.09307861328125, 0.1045989990234375, 0.116119384765625, 0.1276397705078125, 0.13916015625, 0.1506805419921875, 0.162200927734375, 0.1737213134765625, 0.18524169921875, 0.1967620849609375, 0.208282470703125, 0.2198028564453125, 0.2313232421875, 0.2428436279296875, 0.254364013671875, 0.2658843994140625, 0.27740478515625, 0.2889251708984375, 0.300445556640625, 0.3119659423828125, 0.323486328125, 0.3350067138671875, 0.346527099609375, 0.3580474853515625, 0.36956787109375, 0.3810882568359375, 0.392608642578125, 0.4041290283203125, 0.4156494140625, 0.4271697998046875, 0.438690185546875, 0.4502105712890625, 0.46173095703125, 0.4732513427734375, 0.484771728515625, 0.4962921142578125, 0.5078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 8.0, 17.0, 15.0, 19.0, 35.0, 41.0, 56.0, 75.0, 146.0, 314.0, 769.0, 2525.0, 10746.0, 70003.0, 723961.0, 210143.0, 22871.0, 4553.0, 1302.0, 452.0, 218.0, 97.0, 68.0, 31.0, 24.0, 17.0, 13.0, 15.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.783203125, -0.75152587890625, -0.7198486328125, -0.68817138671875, -0.656494140625, -0.62481689453125, -0.5931396484375, -0.56146240234375, -0.52978515625, -0.49810791015625, -0.4664306640625, -0.43475341796875, -0.403076171875, -0.37139892578125, -0.3397216796875, -0.30804443359375, -0.2763671875, -0.24468994140625, -0.2130126953125, -0.18133544921875, -0.149658203125, -0.11798095703125, -0.0863037109375, -0.05462646484375, -0.02294921875, 0.00872802734375, 0.0404052734375, 0.07208251953125, 0.103759765625, 0.13543701171875, 0.1671142578125, 0.19879150390625, 0.23046875, 0.26214599609375, 0.2938232421875, 0.32550048828125, 0.357177734375, 0.38885498046875, 0.4205322265625, 0.45220947265625, 0.48388671875, 0.51556396484375, 0.5472412109375, 0.57891845703125, 0.610595703125, 0.64227294921875, 0.6739501953125, 0.70562744140625, 0.7373046875, 0.76898193359375, 0.8006591796875, 0.83233642578125, 0.864013671875, 0.89569091796875, 0.9273681640625, 0.95904541015625, 0.99072265625, 1.02239990234375, 1.0540771484375, 1.08575439453125, 1.117431640625, 1.14910888671875, 1.1807861328125, 1.21246337890625, 1.244140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 10.0, 10.0, 7.0, 11.0, 18.0, 30.0, 33.0, 52.0, 48.0, 71.0, 73.0, 73.0, 63.0, 64.0, 64.0, 68.0, 68.0, 55.0, 56.0, 30.0, 29.0, 25.0, 10.0, 10.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7759475708007812, -0.7359771728515625, -0.6960067749023438, -0.656036376953125, -0.6160659790039062, -0.5760955810546875, -0.5361251831054688, -0.49615478515625, -0.45618438720703125, -0.4162139892578125, -0.37624359130859375, -0.336273193359375, -0.29630279541015625, -0.2563323974609375, -0.21636199951171875, -0.1763916015625, -0.13642120361328125, -0.0964508056640625, -0.05648040771484375, -0.016510009765625, 0.02346038818359375, 0.0634307861328125, 0.10340118408203125, 0.14337158203125, 0.18334197998046875, 0.2233123779296875, 0.26328277587890625, 0.303253173828125, 0.34322357177734375, 0.3831939697265625, 0.42316436767578125, 0.463134765625, 0.5031051635742188, 0.5430755615234375, 0.5830459594726562, 0.623016357421875, 0.6629867553710938, 0.7029571533203125, 0.7429275512695312, 0.78289794921875, 0.8228683471679688, 0.8628387451171875, 0.9028091430664062, 0.942779541015625, 0.9827499389648438, 1.0227203369140625, 1.0626907348632812, 1.1026611328125, 1.1426315307617188, 1.1826019287109375, 1.2225723266601562, 1.262542724609375, 1.3025131225585938, 1.3424835205078125, 1.3824539184570312, 1.42242431640625, 1.4623947143554688, 1.5023651123046875, 1.5423355102539062, 1.582305908203125, 1.6222763061523438, 1.6622467041015625, 1.7022171020507812, 1.7421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 6.0, 11.0, 12.0, 28.0, 48.0, 93.0, 236.0, 666.0, 2264.0, 28134.0, 951818.0, 60626.0, 3322.0, 744.0, 280.0, 128.0, 65.0, 26.0, 19.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.26430511474609375, -0.2473602294921875, -0.23041534423828125, -0.213470458984375, -0.19652557373046875, -0.1795806884765625, -0.16263580322265625, -0.14569091796875, -0.12874603271484375, -0.1118011474609375, -0.09485626220703125, -0.077911376953125, -0.06096649169921875, -0.0440216064453125, -0.02707672119140625, -0.0101318359375, 0.00681304931640625, 0.0237579345703125, 0.04070281982421875, 0.057647705078125, 0.07459259033203125, 0.0915374755859375, 0.10848236083984375, 0.12542724609375, 0.14237213134765625, 0.1593170166015625, 0.17626190185546875, 0.193206787109375, 0.21015167236328125, 0.2270965576171875, 0.24404144287109375, 0.260986328125, 0.27793121337890625, 0.2948760986328125, 0.31182098388671875, 0.328765869140625, 0.34571075439453125, 0.3626556396484375, 0.37960052490234375, 0.39654541015625, 0.41349029541015625, 0.4304351806640625, 0.44738006591796875, 0.464324951171875, 0.48126983642578125, 0.4982147216796875, 0.5151596069335938, 0.5321044921875, 0.5490493774414062, 0.5659942626953125, 0.5829391479492188, 0.599884033203125, 0.6168289184570312, 0.6337738037109375, 0.6507186889648438, 0.66766357421875, 0.6846084594726562, 0.7015533447265625, 0.7184982299804688, 0.735443115234375, 0.7523880004882812, 0.7693328857421875, 0.7862777709960938, 0.80322265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 18.0, 23.0, 47.0, 73.0, 86.0, 149.0, 155.0, 150.0, 94.0, 71.0, 24.0, 20.0, 17.0, 13.0, 13.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.526708602905273e-05, -6.270594894886017e-05, -6.01448118686676e-05, -5.758367478847504e-05, -5.502253770828247e-05, -5.2461400628089905e-05, -4.990026354789734e-05, -4.733912646770477e-05, -4.477798938751221e-05, -4.221685230731964e-05, -3.9655715227127075e-05, -3.709457814693451e-05, -3.453344106674194e-05, -3.197230398654938e-05, -2.941116690635681e-05, -2.6850029826164246e-05, -2.428889274597168e-05, -2.1727755665779114e-05, -1.9166618585586548e-05, -1.6605481505393982e-05, -1.4044344425201416e-05, -1.148320734500885e-05, -8.922070264816284e-06, -6.360933184623718e-06, -3.7997961044311523e-06, -1.2386590242385864e-06, 1.3224780559539795e-06, 3.883615136146545e-06, 6.444752216339111e-06, 9.005889296531677e-06, 1.1567026376724243e-05, 1.4128163456916809e-05, 1.6689300537109375e-05, 1.925043761730194e-05, 2.1811574697494507e-05, 2.4372711777687073e-05, 2.693384885787964e-05, 2.9494985938072205e-05, 3.205612301826477e-05, 3.4617260098457336e-05, 3.71783971786499e-05, 3.973953425884247e-05, 4.2300671339035034e-05, 4.48618084192276e-05, 4.7422945499420166e-05, 4.998408257961273e-05, 5.25452196598053e-05, 5.5106356739997864e-05, 5.766749382019043e-05, 6.0228630900382996e-05, 6.278976798057556e-05, 6.535090506076813e-05, 6.79120421409607e-05, 7.047317922115326e-05, 7.303431630134583e-05, 7.559545338153839e-05, 7.815659046173096e-05, 8.071772754192352e-05, 8.327886462211609e-05, 8.584000170230865e-05, 8.840113878250122e-05, 9.096227586269379e-05, 9.352341294288635e-05, 9.608455002307892e-05, 9.864568710327148e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 13.0, 25.0, 30.0, 38.0, 41.0, 78.0, 135.0, 288.0, 633.0, 2165.0, 17000.0, 653263.0, 360539.0, 11433.0, 1712.0, 596.0, 256.0, 121.0, 58.0, 40.0, 24.0, 15.0, 13.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5211257934570312, -0.5080718994140625, -0.49501800537109375, -0.481964111328125, -0.46891021728515625, -0.4558563232421875, -0.44280242919921875, -0.42974853515625, -0.41669464111328125, -0.4036407470703125, -0.39058685302734375, -0.377532958984375, -0.36447906494140625, -0.3514251708984375, -0.33837127685546875, -0.3253173828125, -0.31226348876953125, -0.2992095947265625, -0.28615570068359375, -0.273101806640625, -0.26004791259765625, -0.2469940185546875, -0.23394012451171875, -0.22088623046875, -0.20783233642578125, -0.1947784423828125, -0.18172454833984375, -0.168670654296875, -0.15561676025390625, -0.1425628662109375, -0.12950897216796875, -0.116455078125, -0.10340118408203125, -0.0903472900390625, -0.07729339599609375, -0.064239501953125, -0.05118560791015625, -0.0381317138671875, -0.02507781982421875, -0.01202392578125, 0.00102996826171875, 0.0140838623046875, 0.02713775634765625, 0.040191650390625, 0.05324554443359375, 0.0662994384765625, 0.07935333251953125, 0.0924072265625, 0.10546112060546875, 0.1185150146484375, 0.13156890869140625, 0.144622802734375, 0.15767669677734375, 0.1707305908203125, 0.18378448486328125, 0.19683837890625, 0.20989227294921875, 0.2229461669921875, 0.23600006103515625, 0.249053955078125, 0.26210784912109375, 0.2751617431640625, 0.28821563720703125, 0.30126953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 19.0, 22.0, 44.0, 75.0, 136.0, 225.0, 204.0, 130.0, 75.0, 29.0, 13.0, 11.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.8779296875, -0.8599891662597656, -0.8420486450195312, -0.8241081237792969, -0.8061676025390625, -0.7882270812988281, -0.7702865600585938, -0.7523460388183594, -0.734405517578125, -0.7164649963378906, -0.6985244750976562, -0.6805839538574219, -0.6626434326171875, -0.6447029113769531, -0.6267623901367188, -0.6088218688964844, -0.59088134765625, -0.5729408264160156, -0.5550003051757812, -0.5370597839355469, -0.5191192626953125, -0.5011787414550781, -0.48323822021484375, -0.4652976989746094, -0.447357177734375, -0.4294166564941406, -0.41147613525390625, -0.3935356140136719, -0.3755950927734375, -0.3576545715332031, -0.33971405029296875, -0.3217735290527344, -0.3038330078125, -0.2858924865722656, -0.26795196533203125, -0.2500114440917969, -0.2320709228515625, -0.21413040161132812, -0.19618988037109375, -0.17824935913085938, -0.160308837890625, -0.14236831665039062, -0.12442779541015625, -0.10648727416992188, -0.0885467529296875, -0.07060623168945312, -0.05266571044921875, -0.034725189208984375, -0.01678466796875, 0.001155853271484375, 0.01909637451171875, 0.037036895751953125, 0.0549774169921875, 0.07291793823242188, 0.09085845947265625, 0.10879898071289062, 0.126739501953125, 0.14468002319335938, 0.16262054443359375, 0.18056106567382812, 0.1985015869140625, 0.21644210815429688, 0.23438262939453125, 0.2523231506347656, 0.270263671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 23.0, 88.0, 551.0, 312.0, 25.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.654504776000977, -7.104128360748291, -6.5537519454956055, -6.00337553024292, -5.452999114990234, -4.902622699737549, -4.352246284484863, -3.8018698692321777, -3.251493453979492, -2.7011170387268066, -2.150740623474121, -1.6003642082214355, -1.04998779296875, -0.49961137771606445, 0.050765037536621094, 0.6011414527893066, 1.1515178680419922, 1.7018942832946777, 2.2522706985473633, 2.802647113800049, 3.3530235290527344, 3.90339994430542, 4.4537763595581055, 5.004152774810791, 5.554529190063477, 6.104905605316162, 6.655282020568848, 7.205658435821533, 7.756034851074219, 8.306411743164062, 8.85678768157959, 9.407163619995117, 9.957538604736328, 10.507915496826172, 11.0582914352417, 11.608667373657227, 12.15904426574707, 12.709421157836914, 13.259797096252441, 13.810173034667969, 14.360549926757812, 14.910926818847656, 15.461302757263184, 16.01167869567871, 16.562055587768555, 17.1124324798584, 17.66280746459961, 18.213184356689453, 18.763561248779297, 19.31393814086914, 19.864315032958984, 20.414690017700195, 20.96506690979004, 21.515443801879883, 22.065818786621094, 22.616195678710938, 23.16657257080078, 23.716949462890625, 24.26732635498047, 24.81770133972168, 25.368078231811523, 25.918455123901367, 26.468830108642578, 27.019207000732422, 27.569583892822266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 9.0, 3.0, 3.0, 14.0, 11.0, 12.0, 27.0, 33.0, 34.0, 42.0, 38.0, 50.0, 48.0, 41.0, 58.0, 58.0, 43.0, 49.0, 51.0, 57.0, 47.0, 49.0, 38.0, 38.0, 40.0, 22.0, 13.0, 14.0, 19.0, 13.0, 5.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.186199188232422, -6.022626876831055, -5.859055042266846, -5.6954827308654785, -5.5319108963012695, -5.368338584899902, -5.204766750335693, -5.041194438934326, -4.877622604370117, -4.71405029296875, -4.550478458404541, -4.386906147003174, -4.223334312438965, -4.059762001037598, -3.8961901664733887, -3.7326178550720215, -3.5690457820892334, -3.4054737091064453, -3.2419016361236572, -3.078329563140869, -2.914757490158081, -2.751185417175293, -2.587613105773926, -2.424041271209717, -2.2604689598083496, -2.0968968868255615, -1.9333248138427734, -1.7697527408599854, -1.6061806678771973, -1.4426085948944092, -1.2790364027023315, -1.1154643297195435, -0.9518923759460449, -0.7883203029632568, -0.6247482299804688, -0.4611760973930359, -0.2976040244102478, -0.13403195142745972, 0.029540181159973145, 0.19311225414276123, 0.3566843271255493, 0.5202564001083374, 0.6838284730911255, 0.8474006056785583, 1.0109727382659912, 1.1745448112487793, 1.3381168842315674, 1.5016889572143555, 1.6652610301971436, 1.8288331031799316, 1.9924051761627197, 2.155977249145508, 2.319549322128296, 2.483121395111084, 2.646693706512451, 2.81026554107666, 2.9738378524780273, 3.1374099254608154, 3.3009819984436035, 3.4645540714263916, 3.6281261444091797, 3.7916982173919678, 3.955270290374756, 4.118842601776123, 4.282414436340332]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 11.0, 12.0, 13.0, 16.0, 26.0, 36.0, 49.0, 60.0, 132.0, 176.0, 286.0, 536.0, 978.0, 1915.0, 5049.0, 19795.0, 2356383.0, 1779168.0, 20122.0, 5281.0, 1922.0, 873.0, 498.0, 337.0, 177.0, 129.0, 81.0, 77.0, 49.0, 22.0, 22.0, 14.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.229278564453125, -1.17340087890625, -1.117523193359375, -1.0616455078125, -1.005767822265625, -0.94989013671875, -0.894012451171875, -0.838134765625, -0.782257080078125, -0.72637939453125, -0.670501708984375, -0.6146240234375, -0.558746337890625, -0.50286865234375, -0.446990966796875, -0.39111328125, -0.335235595703125, -0.27935791015625, -0.223480224609375, -0.1676025390625, -0.111724853515625, -0.05584716796875, 3.0517578125e-05, 0.055908203125, 0.111785888671875, 0.16766357421875, 0.223541259765625, 0.2794189453125, 0.335296630859375, 0.39117431640625, 0.447052001953125, 0.5029296875, 0.558807373046875, 0.61468505859375, 0.670562744140625, 0.7264404296875, 0.782318115234375, 0.83819580078125, 0.894073486328125, 0.949951171875, 1.005828857421875, 1.06170654296875, 1.117584228515625, 1.1734619140625, 1.229339599609375, 1.28521728515625, 1.341094970703125, 1.39697265625, 1.452850341796875, 1.50872802734375, 1.564605712890625, 1.6204833984375, 1.676361083984375, 1.73223876953125, 1.788116455078125, 1.843994140625, 1.899871826171875, 1.95574951171875, 2.011627197265625, 2.0675048828125, 2.123382568359375, 2.17926025390625, 2.235137939453125, 2.291015625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 2.0, 10.0, 5.0, 5.0, 9.0, 25.0, 27.0, 29.0, 42.0, 51.0, 51.0, 73.0, 73.0, 65.0, 68.0, 72.0, 63.0, 62.0, 55.0, 47.0, 36.0, 30.0, 21.0, 24.0, 19.0, 13.0, 13.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2421875, -0.23142242431640625, -0.2206573486328125, -0.20989227294921875, -0.199127197265625, -0.18836212158203125, -0.1775970458984375, -0.16683197021484375, -0.15606689453125, -0.14530181884765625, -0.1345367431640625, -0.12377166748046875, -0.113006591796875, -0.10224151611328125, -0.0914764404296875, -0.08071136474609375, -0.0699462890625, -0.05918121337890625, -0.0484161376953125, -0.03765106201171875, -0.026885986328125, -0.01612091064453125, -0.0053558349609375, 0.00540924072265625, 0.01617431640625, 0.02693939208984375, 0.0377044677734375, 0.04846954345703125, 0.059234619140625, 0.06999969482421875, 0.0807647705078125, 0.09152984619140625, 0.102294921875, 0.11305999755859375, 0.1238250732421875, 0.13459014892578125, 0.145355224609375, 0.15612030029296875, 0.1668853759765625, 0.17765045166015625, 0.18841552734375, 0.19918060302734375, 0.2099456787109375, 0.22071075439453125, 0.231475830078125, 0.24224090576171875, 0.2530059814453125, 0.26377105712890625, 0.2745361328125, 0.28530120849609375, 0.2960662841796875, 0.30683135986328125, 0.317596435546875, 0.32836151123046875, 0.3391265869140625, 0.34989166259765625, 0.36065673828125, 0.37142181396484375, 0.3821868896484375, 0.39295196533203125, 0.403717041015625, 0.41448211669921875, 0.4252471923828125, 0.43601226806640625, 0.44677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 11.0, 31.0, 42.0, 57.0, 97.0, 111.0, 200.0, 299.0, 637.0, 1550.0, 7039.0, 4028648.0, 149200.0, 4038.0, 1126.0, 464.0, 242.0, 145.0, 99.0, 57.0, 54.0, 31.0, 24.0, 15.0, 12.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.55462646484375, -2.4744873046875, -2.39434814453125, -2.314208984375, -2.23406982421875, -2.1539306640625, -2.07379150390625, -1.99365234375, -1.91351318359375, -1.8333740234375, -1.75323486328125, -1.673095703125, -1.59295654296875, -1.5128173828125, -1.43267822265625, -1.3525390625, -1.27239990234375, -1.1922607421875, -1.11212158203125, -1.031982421875, -0.95184326171875, -0.8717041015625, -0.79156494140625, -0.71142578125, -0.63128662109375, -0.5511474609375, -0.47100830078125, -0.390869140625, -0.31072998046875, -0.2305908203125, -0.15045166015625, -0.0703125, 0.00982666015625, 0.0899658203125, 0.17010498046875, 0.250244140625, 0.33038330078125, 0.4105224609375, 0.49066162109375, 0.57080078125, 0.65093994140625, 0.7310791015625, 0.81121826171875, 0.891357421875, 0.97149658203125, 1.0516357421875, 1.13177490234375, 1.2119140625, 1.29205322265625, 1.3721923828125, 1.45233154296875, 1.532470703125, 1.61260986328125, 1.6927490234375, 1.77288818359375, 1.85302734375, 1.93316650390625, 2.0133056640625, 2.09344482421875, 2.173583984375, 2.25372314453125, 2.3338623046875, 2.41400146484375, 2.494140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 9.0, 15.0, 21.0, 64.0, 3073.0, 775.0, 76.0, 24.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.859375, -1.8228645324707031, -1.7863540649414062, -1.7498435974121094, -1.7133331298828125, -1.6768226623535156, -1.6403121948242188, -1.6038017272949219, -1.567291259765625, -1.5307807922363281, -1.4942703247070312, -1.4577598571777344, -1.4212493896484375, -1.3847389221191406, -1.3482284545898438, -1.3117179870605469, -1.27520751953125, -1.2386970520019531, -1.2021865844726562, -1.1656761169433594, -1.1291656494140625, -1.0926551818847656, -1.0561447143554688, -1.0196342468261719, -0.983123779296875, -0.9466133117675781, -0.9101028442382812, -0.8735923767089844, -0.8370819091796875, -0.8005714416503906, -0.7640609741210938, -0.7275505065917969, -0.6910400390625, -0.6545295715332031, -0.6180191040039062, -0.5815086364746094, -0.5449981689453125, -0.5084877014160156, -0.47197723388671875, -0.4354667663574219, -0.398956298828125, -0.3624458312988281, -0.32593536376953125, -0.2894248962402344, -0.2529144287109375, -0.21640396118164062, -0.17989349365234375, -0.14338302612304688, -0.10687255859375, -0.07036209106445312, -0.03385162353515625, 0.002658843994140625, 0.0391693115234375, 0.07567977905273438, 0.11219024658203125, 0.14870071411132812, 0.185211181640625, 0.22172164916992188, 0.25823211669921875, 0.2947425842285156, 0.3312530517578125, 0.3677635192871094, 0.40427398681640625, 0.4407844543457031, 0.477294921875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 12.0, 20.0, 22.0, 45.0, 123.0, 297.0, 337.0, 97.0, 21.0, 12.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.823479652404785, -4.711548805236816, -4.599617958068848, -4.487687110900879, -4.37575626373291, -4.263825416564941, -4.151894569396973, -4.039963722229004, -3.9280331134796143, -3.8161022663116455, -3.7041714191436768, -3.592240571975708, -3.4803099632263184, -3.3683791160583496, -3.256448268890381, -3.144517421722412, -3.0325865745544434, -2.9206557273864746, -2.808724880218506, -2.696794033050537, -2.5848631858825684, -2.4729323387145996, -2.36100172996521, -2.249070882797241, -2.1371400356292725, -2.0252091884613037, -1.913278341293335, -1.8013476133346558, -1.689416766166687, -1.5774859189987183, -1.465555191040039, -1.3536243438720703, -1.2416934967041016, -1.1297626495361328, -1.017831802368164, -0.9059010744094849, -0.7939702272415161, -0.6820393800735474, -0.5701085925102234, -0.4581778049468994, -0.34624695777893066, -0.2343161404132843, -0.12238532304763794, -0.010454505681991577, 0.10147631168365479, 0.21340715885162354, 0.3253379464149475, 0.4372687339782715, 0.5491995811462402, 0.661130428314209, 0.773061215877533, 0.8849920034408569, 0.9969228506088257, 1.1088536977767944, 1.2207844257354736, 1.3327152729034424, 1.4446461200714111, 1.5565769672393799, 1.6685078144073486, 1.7804385423660278, 1.8923693895339966, 2.004300117492676, 2.1162309646606445, 2.2281618118286133, 2.340092658996582]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 10.0, 23.0, 17.0, 25.0, 34.0, 34.0, 47.0, 61.0, 53.0, 60.0, 80.0, 73.0, 58.0, 52.0, 43.0, 55.0, 51.0, 34.0, 36.0, 27.0, 13.0, 27.0, 18.0, 13.0, 10.0, 9.0, 11.0, 2.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4600982666015625, -2.387486696243286, -2.3148751258850098, -2.2422635555267334, -2.169651985168457, -2.0970401763916016, -2.024428606033325, -1.9518170356750488, -1.8792054653167725, -1.806593894958496, -1.7339823246002197, -1.6613706350326538, -1.5887590646743774, -1.516147494316101, -1.4435358047485352, -1.3709242343902588, -1.2983126640319824, -1.225701093673706, -1.1530895233154297, -1.0804778337478638, -1.0078662633895874, -0.935254693031311, -0.8626430630683899, -0.7900314331054688, -0.7174198627471924, -0.644808292388916, -0.5721966624259949, -0.4995850622653961, -0.42697346210479736, -0.3543618619441986, -0.28175026178359985, -0.2091386318206787, -0.13652682304382324, -0.06391522288322449, 0.008696377277374268, 0.08130797743797302, 0.15391957759857178, 0.22653117775917053, 0.2991427779197693, 0.37175440788269043, 0.4443659782409668, 0.5169775485992432, 0.5895891785621643, 0.6622008085250854, 0.7348123788833618, 0.8074239492416382, 0.8800355792045593, 0.9526472091674805, 1.0252587795257568, 1.0978703498840332, 1.1704819202423096, 1.2430936098098755, 1.3157051801681519, 1.3883167505264282, 1.4609284400939941, 1.5335400104522705, 1.6061515808105469, 1.6787631511688232, 1.7513747215270996, 1.8239864110946655, 1.896597981452942, 1.9692095518112183, 2.041821241378784, 2.1144328117370605, 2.187044382095337]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 4.0, 7.0, 9.0, 26.0, 36.0, 70.0, 120.0, 205.0, 355.0, 726.0, 1536.0, 3857.0, 12485.0, 60500.0, 522967.0, 382560.0, 46666.0, 10326.0, 3303.0, 1318.0, 676.0, 367.0, 166.0, 111.0, 58.0, 27.0, 24.0, 17.0, 11.0, 4.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.177947998046875, -1.14105224609375, -1.104156494140625, -1.0672607421875, -1.030364990234375, -0.99346923828125, -0.956573486328125, -0.919677734375, -0.882781982421875, -0.84588623046875, -0.808990478515625, -0.7720947265625, -0.735198974609375, -0.69830322265625, -0.661407470703125, -0.62451171875, -0.587615966796875, -0.55072021484375, -0.513824462890625, -0.4769287109375, -0.440032958984375, -0.40313720703125, -0.366241455078125, -0.329345703125, -0.292449951171875, -0.25555419921875, -0.218658447265625, -0.1817626953125, -0.144866943359375, -0.10797119140625, -0.071075439453125, -0.0341796875, 0.002716064453125, 0.03961181640625, 0.076507568359375, 0.1134033203125, 0.150299072265625, 0.18719482421875, 0.224090576171875, 0.260986328125, 0.297882080078125, 0.33477783203125, 0.371673583984375, 0.4085693359375, 0.445465087890625, 0.48236083984375, 0.519256591796875, 0.55615234375, 0.593048095703125, 0.62994384765625, 0.666839599609375, 0.7037353515625, 0.740631103515625, 0.77752685546875, 0.814422607421875, 0.851318359375, 0.888214111328125, 0.92510986328125, 0.962005615234375, 0.9989013671875, 1.035797119140625, 1.07269287109375, 1.109588623046875, 1.146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 9.0, 12.0, 17.0, 19.0, 20.0, 29.0, 47.0, 44.0, 46.0, 54.0, 57.0, 55.0, 71.0, 63.0, 59.0, 49.0, 64.0, 46.0, 43.0, 32.0, 38.0, 28.0, 16.0, 15.0, 18.0, 15.0, 9.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2740669250488281, -0.26273345947265625, -0.2513999938964844, -0.2400665283203125, -0.22873306274414062, -0.21739959716796875, -0.20606613159179688, -0.194732666015625, -0.18339920043945312, -0.17206573486328125, -0.16073226928710938, -0.1493988037109375, -0.13806533813476562, -0.12673187255859375, -0.11539840698242188, -0.10406494140625, -0.09273147583007812, -0.08139801025390625, -0.07006454467773438, -0.0587310791015625, -0.047397613525390625, -0.03606414794921875, -0.024730682373046875, -0.013397216796875, -0.002063751220703125, 0.00926971435546875, 0.020603179931640625, 0.0319366455078125, 0.043270111083984375, 0.05460357666015625, 0.06593704223632812, 0.0772705078125, 0.08860397338867188, 0.09993743896484375, 0.11127090454101562, 0.1226043701171875, 0.13393783569335938, 0.14527130126953125, 0.15660476684570312, 0.167938232421875, 0.17927169799804688, 0.19060516357421875, 0.20193862915039062, 0.2132720947265625, 0.22460556030273438, 0.23593902587890625, 0.24727249145507812, 0.25860595703125, 0.2699394226074219, 0.28127288818359375, 0.2926063537597656, 0.3039398193359375, 0.3152732849121094, 0.32660675048828125, 0.3379402160644531, 0.349273681640625, 0.3606071472167969, 0.37194061279296875, 0.3832740783691406, 0.3946075439453125, 0.4059410095214844, 0.41727447509765625, 0.4286079406738281, 0.43994140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 8.0, 11.0, 19.0, 28.0, 44.0, 60.0, 77.0, 134.0, 202.0, 314.0, 561.0, 935.0, 1828.0, 4269.0, 13724.0, 63845.0, 522436.0, 373122.0, 48189.0, 11128.0, 3712.0, 1642.0, 885.0, 488.0, 302.0, 182.0, 132.0, 69.0, 52.0, 39.0, 25.0, 18.0, 12.0, 14.0, 6.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8359375, -0.8079986572265625, -0.780059814453125, -0.7521209716796875, -0.72418212890625, -0.6962432861328125, -0.668304443359375, -0.6403656005859375, -0.6124267578125, -0.5844879150390625, -0.556549072265625, -0.5286102294921875, -0.50067138671875, -0.4727325439453125, -0.444793701171875, -0.4168548583984375, -0.388916015625, -0.3609771728515625, -0.333038330078125, -0.3050994873046875, -0.27716064453125, -0.2492218017578125, -0.221282958984375, -0.1933441162109375, -0.1654052734375, -0.1374664306640625, -0.109527587890625, -0.0815887451171875, -0.05364990234375, -0.0257110595703125, 0.002227783203125, 0.0301666259765625, 0.05810546875, 0.0860443115234375, 0.113983154296875, 0.1419219970703125, 0.16986083984375, 0.1977996826171875, 0.225738525390625, 0.2536773681640625, 0.2816162109375, 0.3095550537109375, 0.337493896484375, 0.3654327392578125, 0.39337158203125, 0.4213104248046875, 0.449249267578125, 0.4771881103515625, 0.505126953125, 0.5330657958984375, 0.561004638671875, 0.5889434814453125, 0.61688232421875, 0.6448211669921875, 0.672760009765625, 0.7006988525390625, 0.7286376953125, 0.7565765380859375, 0.784515380859375, 0.8124542236328125, 0.84039306640625, 0.8683319091796875, 0.896270751953125, 0.9242095947265625, 0.9521484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 13.0, 9.0, 11.0, 24.0, 32.0, 40.0, 42.0, 52.0, 57.0, 50.0, 64.0, 68.0, 62.0, 81.0, 70.0, 63.0, 51.0, 46.0, 36.0, 24.0, 17.0, 25.0, 18.0, 7.0, 6.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.5733642578125, -1.515869140625, -1.4583740234375, -1.40087890625, -1.3433837890625, -1.285888671875, -1.2283935546875, -1.1708984375, -1.1134033203125, -1.055908203125, -0.9984130859375, -0.94091796875, -0.8834228515625, -0.825927734375, -0.7684326171875, -0.7109375, -0.6534423828125, -0.595947265625, -0.5384521484375, -0.48095703125, -0.4234619140625, -0.365966796875, -0.3084716796875, -0.2509765625, -0.1934814453125, -0.135986328125, -0.0784912109375, -0.02099609375, 0.0364990234375, 0.093994140625, 0.1514892578125, 0.208984375, 0.2664794921875, 0.323974609375, 0.3814697265625, 0.43896484375, 0.4964599609375, 0.553955078125, 0.6114501953125, 0.6689453125, 0.7264404296875, 0.783935546875, 0.8414306640625, 0.89892578125, 0.9564208984375, 1.013916015625, 1.0714111328125, 1.12890625, 1.1864013671875, 1.243896484375, 1.3013916015625, 1.35888671875, 1.4163818359375, 1.473876953125, 1.5313720703125, 1.5888671875, 1.6463623046875, 1.703857421875, 1.7613525390625, 1.81884765625, 1.8763427734375, 1.933837890625, 1.9913330078125, 2.048828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 1.0, 8.0, 4.0, 0.0, 12.0, 8.0, 9.0, 13.0, 24.0, 35.0, 36.0, 68.0, 89.0, 181.0, 387.0, 1115.0, 4411.0, 113607.0, 920402.0, 5689.0, 1421.0, 514.0, 193.0, 97.0, 69.0, 47.0, 30.0, 19.0, 19.0, 11.0, 21.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.1868743896484375, -1.124725341796875, -1.0625762939453125, -1.00042724609375, -0.9382781982421875, -0.876129150390625, -0.8139801025390625, -0.7518310546875, -0.6896820068359375, -0.627532958984375, -0.5653839111328125, -0.50323486328125, -0.4410858154296875, -0.378936767578125, -0.3167877197265625, -0.254638671875, -0.1924896240234375, -0.130340576171875, -0.0681915283203125, -0.00604248046875, 0.0561065673828125, 0.118255615234375, 0.1804046630859375, 0.2425537109375, 0.3047027587890625, 0.366851806640625, 0.4290008544921875, 0.49114990234375, 0.5532989501953125, 0.615447998046875, 0.6775970458984375, 0.73974609375, 0.8018951416015625, 0.864044189453125, 0.9261932373046875, 0.98834228515625, 1.0504913330078125, 1.112640380859375, 1.1747894287109375, 1.2369384765625, 1.2990875244140625, 1.361236572265625, 1.4233856201171875, 1.48553466796875, 1.5476837158203125, 1.609832763671875, 1.6719818115234375, 1.734130859375, 1.7962799072265625, 1.858428955078125, 1.9205780029296875, 1.98272705078125, 2.0448760986328125, 2.107025146484375, 2.1691741943359375, 2.2313232421875, 2.2934722900390625, 2.355621337890625, 2.4177703857421875, 2.47991943359375, 2.5420684814453125, 2.604217529296875, 2.6663665771484375, 2.728515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 13.0, 16.0, 22.0, 38.0, 45.0, 41.0, 89.0, 129.0, 171.0, 118.0, 96.0, 46.0, 41.0, 22.0, 26.0, 12.0, 10.0, 10.0, 12.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0001125335693359375, -0.0001097479835152626, -0.00010696239769458771, -0.00010417681187391281, -0.00010139122605323792, -9.860564023256302e-05, -9.582005441188812e-05, -9.303446859121323e-05, -9.024888277053833e-05, -8.746329694986343e-05, -8.467771112918854e-05, -8.189212530851364e-05, -7.910653948783875e-05, -7.632095366716385e-05, -7.353536784648895e-05, -7.074978202581406e-05, -6.796419620513916e-05, -6.517861038446426e-05, -6.239302456378937e-05, -5.960743874311447e-05, -5.6821852922439575e-05, -5.403626710176468e-05, -5.125068128108978e-05, -4.8465095460414886e-05, -4.567950963973999e-05, -4.2893923819065094e-05, -4.01083379983902e-05, -3.73227521777153e-05, -3.4537166357040405e-05, -3.175158053636551e-05, -2.8965994715690613e-05, -2.6180408895015717e-05, -2.339482307434082e-05, -2.0609237253665924e-05, -1.7823651432991028e-05, -1.5038065612316132e-05, -1.2252479791641235e-05, -9.466893970966339e-06, -6.681308150291443e-06, -3.895722329616547e-06, -1.1101365089416504e-06, 1.6754493117332458e-06, 4.461035132408142e-06, 7.246620953083038e-06, 1.0032206773757935e-05, 1.281779259443283e-05, 1.5603378415107727e-05, 1.8388964235782623e-05, 2.117455005645752e-05, 2.3960135877132416e-05, 2.6745721697807312e-05, 2.9531307518482208e-05, 3.2316893339157104e-05, 3.5102479159832e-05, 3.78880649805069e-05, 4.067365080118179e-05, 4.345923662185669e-05, 4.6244822442531586e-05, 4.903040826320648e-05, 5.181599408388138e-05, 5.4601579904556274e-05, 5.738716572523117e-05, 6.017275154590607e-05, 6.295833736658096e-05, 6.574392318725586e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 14.0, 30.0, 52.0, 93.0, 180.0, 643.0, 21112.0, 1024791.0, 1233.0, 182.0, 97.0, 49.0, 40.0, 14.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.412506103515625, -5.27423095703125, -5.135955810546875, -4.9976806640625, -4.859405517578125, -4.72113037109375, -4.582855224609375, -4.444580078125, -4.306304931640625, -4.16802978515625, -4.029754638671875, -3.8914794921875, -3.753204345703125, -3.61492919921875, -3.476654052734375, -3.33837890625, -3.200103759765625, -3.06182861328125, -2.923553466796875, -2.7852783203125, -2.647003173828125, -2.50872802734375, -2.370452880859375, -2.232177734375, -2.093902587890625, -1.95562744140625, -1.817352294921875, -1.6790771484375, -1.540802001953125, -1.40252685546875, -1.264251708984375, -1.1259765625, -0.987701416015625, -0.84942626953125, -0.711151123046875, -0.5728759765625, -0.434600830078125, -0.29632568359375, -0.158050537109375, -0.019775390625, 0.118499755859375, 0.25677490234375, 0.395050048828125, 0.5333251953125, 0.671600341796875, 0.80987548828125, 0.948150634765625, 1.08642578125, 1.224700927734375, 1.36297607421875, 1.501251220703125, 1.6395263671875, 1.777801513671875, 1.91607666015625, 2.054351806640625, 2.192626953125, 2.330902099609375, 2.46917724609375, 2.607452392578125, 2.7457275390625, 2.884002685546875, 3.02227783203125, 3.160552978515625, 3.298828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 6.0, 122.0, 792.0, 52.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.93359375, -7.779296875, -7.625, -7.470703125, -7.31640625, -7.162109375, -7.0078125, -6.853515625, -6.69921875, -6.544921875, -6.390625, -6.236328125, -6.08203125, -5.927734375, -5.7734375, -5.619140625, -5.46484375, -5.310546875, -5.15625, -5.001953125, -4.84765625, -4.693359375, -4.5390625, -4.384765625, -4.23046875, -4.076171875, -3.921875, -3.767578125, -3.61328125, -3.458984375, -3.3046875, -3.150390625, -2.99609375, -2.841796875, -2.6875, -2.533203125, -2.37890625, -2.224609375, -2.0703125, -1.916015625, -1.76171875, -1.607421875, -1.453125, -1.298828125, -1.14453125, -0.990234375, -0.8359375, -0.681640625, -0.52734375, -0.373046875, -0.21875, -0.064453125, 0.08984375, 0.244140625, 0.3984375, 0.552734375, 0.70703125, 0.861328125, 1.015625, 1.169921875, 1.32421875, 1.478515625, 1.6328125, 1.787109375, 1.94140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 20.0, 104.0, 530.0, 325.0, 27.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.638710021972656, -16.455074310302734, -15.271437644958496, -14.087801933288574, -12.904165267944336, -11.720529556274414, -10.536893844604492, -9.353257179260254, -8.169621467590332, -6.985985279083252, -5.802349090576172, -4.61871337890625, -3.43507719039917, -2.25144100189209, -1.067805290222168, 0.11583137512207031, 1.2994670867919922, 2.4831032752990723, 3.6667392253875732, 4.850375175476074, 6.034011363983154, 7.217647552490234, 8.401283264160156, 9.584919929504395, 10.768555641174316, 11.952191352844238, 13.135828018188477, 14.319463729858398, 15.50309944152832, 16.686737060546875, 17.870372772216797, 19.05400848388672, 20.23764419555664, 21.421279907226562, 22.604915618896484, 23.788551330566406, 24.97218894958496, 26.155824661254883, 27.339460372924805, 28.52309799194336, 29.70673370361328, 30.890369415283203, 32.074005126953125, 33.25764083862305, 34.44127655029297, 35.624916076660156, 36.80854797363281, 37.9921875, 39.175819396972656, 40.35945510864258, 41.5430908203125, 42.72672653198242, 43.910362243652344, 45.09400177001953, 46.27763366699219, 47.461273193359375, 48.6449089050293, 49.82854461669922, 51.01218032836914, 52.19581604003906, 53.379451751708984, 54.563087463378906, 55.746726989746094, 56.930362701416016, 58.11399841308594]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 3.0, 12.0, 6.0, 8.0, 14.0, 6.0, 21.0, 23.0, 22.0, 25.0, 22.0, 29.0, 24.0, 36.0, 32.0, 39.0, 38.0, 39.0, 45.0, 43.0, 53.0, 35.0, 54.0, 41.0, 30.0, 26.0, 32.0, 36.0, 29.0, 20.0, 16.0, 20.0, 22.0, 19.0, 10.0, 5.0, 12.0, 11.0, 6.0, 5.0, 0.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0741801261901855, -6.83461856842041, -6.595056533813477, -6.355494976043701, -6.115933418273926, -5.876371383666992, -5.636809825897217, -5.397248268127441, -5.157686233520508, -4.918124675750732, -4.678562641143799, -4.439001083374023, -4.19943904876709, -3.9598774909973145, -3.720315933227539, -3.4807541370391846, -3.24119234085083, -3.0016305446624756, -2.762068748474121, -2.5225071907043457, -2.282945394515991, -2.0433835983276367, -1.8038219213485718, -1.5642602443695068, -1.3246984481811523, -1.0851366519927979, -0.8455749750137329, -0.6060132384300232, -0.3664515018463135, -0.12688970565795898, 0.11267197132110596, 0.3522336483001709, 0.5917949676513672, 0.8313567042350769, 1.0709184408187866, 1.3104801177978516, 1.550041913986206, 1.7896037101745605, 2.029165267944336, 2.2687270641326904, 2.508288860321045, 2.7478506565093994, 2.987412452697754, 3.2269740104675293, 3.466535806655884, 3.7060976028442383, 3.9456591606140137, 4.185220718383789, 4.424782752990723, 4.664344310760498, 4.903906345367432, 5.143467903137207, 5.383029937744141, 5.622591495513916, 5.862153053283691, 6.101715087890625, 6.3412766456604, 6.580838203430176, 6.820400238037109, 7.059961795806885, 7.29952335357666, 7.539085388183594, 7.778646945953369, 8.018208503723145, 8.257770538330078]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 16.0, 7.0, 30.0, 40.0, 59.0, 88.0, 111.0, 174.0, 252.0, 372.0, 554.0, 787.0, 1246.0, 2001.0, 3358.0, 6046.0, 12312.0, 30168.0, 163029.0, 3852956.0, 77000.0, 21924.0, 9367.0, 4924.0, 2725.0, 1631.0, 1018.0, 636.0, 432.0, 309.0, 224.0, 137.0, 96.0, 74.0, 44.0, 36.0, 20.0, 18.0, 16.0, 12.0, 8.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8271484375, -0.7968902587890625, -0.766632080078125, -0.7363739013671875, -0.70611572265625, -0.6758575439453125, -0.645599365234375, -0.6153411865234375, -0.5850830078125, -0.5548248291015625, -0.524566650390625, -0.4943084716796875, -0.46405029296875, -0.4337921142578125, -0.403533935546875, -0.3732757568359375, -0.343017578125, -0.3127593994140625, -0.282501220703125, -0.2522430419921875, -0.22198486328125, -0.1917266845703125, -0.161468505859375, -0.1312103271484375, -0.1009521484375, -0.0706939697265625, -0.040435791015625, -0.0101776123046875, 0.02008056640625, 0.0503387451171875, 0.080596923828125, 0.1108551025390625, 0.14111328125, 0.1713714599609375, 0.201629638671875, 0.2318878173828125, 0.26214599609375, 0.2924041748046875, 0.322662353515625, 0.3529205322265625, 0.3831787109375, 0.4134368896484375, 0.443695068359375, 0.4739532470703125, 0.50421142578125, 0.5344696044921875, 0.564727783203125, 0.5949859619140625, 0.625244140625, 0.6555023193359375, 0.685760498046875, 0.7160186767578125, 0.74627685546875, 0.7765350341796875, 0.806793212890625, 0.8370513916015625, 0.8673095703125, 0.8975677490234375, 0.927825927734375, 0.9580841064453125, 0.98834228515625, 1.0186004638671875, 1.048858642578125, 1.0791168212890625, 1.109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 6.0, 8.0, 11.0, 8.0, 15.0, 19.0, 17.0, 25.0, 26.0, 29.0, 34.0, 48.0, 45.0, 44.0, 53.0, 71.0, 59.0, 74.0, 57.0, 43.0, 52.0, 43.0, 43.0, 45.0, 25.0, 27.0, 13.0, 13.0, 10.0, 6.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443359375, -0.42926025390625, -0.4151611328125, -0.40106201171875, -0.386962890625, -0.37286376953125, -0.3587646484375, -0.34466552734375, -0.33056640625, -0.31646728515625, -0.3023681640625, -0.28826904296875, -0.274169921875, -0.26007080078125, -0.2459716796875, -0.23187255859375, -0.2177734375, -0.20367431640625, -0.1895751953125, -0.17547607421875, -0.161376953125, -0.14727783203125, -0.1331787109375, -0.11907958984375, -0.10498046875, -0.09088134765625, -0.0767822265625, -0.06268310546875, -0.048583984375, -0.03448486328125, -0.0203857421875, -0.00628662109375, 0.0078125, 0.02191162109375, 0.0360107421875, 0.05010986328125, 0.064208984375, 0.07830810546875, 0.0924072265625, 0.10650634765625, 0.12060546875, 0.13470458984375, 0.1488037109375, 0.16290283203125, 0.177001953125, 0.19110107421875, 0.2052001953125, 0.21929931640625, 0.2333984375, 0.24749755859375, 0.2615966796875, 0.27569580078125, 0.289794921875, 0.30389404296875, 0.3179931640625, 0.33209228515625, 0.34619140625, 0.36029052734375, 0.3743896484375, 0.38848876953125, 0.402587890625, 0.41668701171875, 0.4307861328125, 0.44488525390625, 0.458984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 8.0, 17.0, 24.0, 22.0, 31.0, 51.0, 68.0, 106.0, 174.0, 232.0, 356.0, 493.0, 919.0, 2017.0, 6084.0, 40434.0, 4085407.0, 46545.0, 6631.0, 2090.0, 956.0, 567.0, 322.0, 190.0, 166.0, 105.0, 76.0, 46.0, 51.0, 28.0, 22.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.11016845703125, -2.0386962890625, -1.96722412109375, -1.895751953125, -1.82427978515625, -1.7528076171875, -1.68133544921875, -1.60986328125, -1.53839111328125, -1.4669189453125, -1.39544677734375, -1.323974609375, -1.25250244140625, -1.1810302734375, -1.10955810546875, -1.0380859375, -0.96661376953125, -0.8951416015625, -0.82366943359375, -0.752197265625, -0.68072509765625, -0.6092529296875, -0.53778076171875, -0.46630859375, -0.39483642578125, -0.3233642578125, -0.25189208984375, -0.180419921875, -0.10894775390625, -0.0374755859375, 0.03399658203125, 0.10546875, 0.17694091796875, 0.2484130859375, 0.31988525390625, 0.391357421875, 0.46282958984375, 0.5343017578125, 0.60577392578125, 0.67724609375, 0.74871826171875, 0.8201904296875, 0.89166259765625, 0.963134765625, 1.03460693359375, 1.1060791015625, 1.17755126953125, 1.2490234375, 1.32049560546875, 1.3919677734375, 1.46343994140625, 1.534912109375, 1.60638427734375, 1.6778564453125, 1.74932861328125, 1.82080078125, 1.89227294921875, 1.9637451171875, 2.03521728515625, 2.106689453125, 2.17816162109375, 2.2496337890625, 2.32110595703125, 2.392578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 8.0, 22.0, 53.0, 209.0, 3517.0, 152.0, 41.0, 28.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.974609375, -1.9172210693359375, -1.859832763671875, -1.8024444580078125, -1.74505615234375, -1.6876678466796875, -1.630279541015625, -1.5728912353515625, -1.5155029296875, -1.4581146240234375, -1.400726318359375, -1.3433380126953125, -1.28594970703125, -1.2285614013671875, -1.171173095703125, -1.1137847900390625, -1.056396484375, -0.9990081787109375, -0.941619873046875, -0.8842315673828125, -0.82684326171875, -0.7694549560546875, -0.712066650390625, -0.6546783447265625, -0.5972900390625, -0.5399017333984375, -0.482513427734375, -0.4251251220703125, -0.36773681640625, -0.3103485107421875, -0.252960205078125, -0.1955718994140625, -0.13818359375, -0.0807952880859375, -0.023406982421875, 0.0339813232421875, 0.09136962890625, 0.1487579345703125, 0.206146240234375, 0.2635345458984375, 0.3209228515625, 0.3783111572265625, 0.435699462890625, 0.4930877685546875, 0.55047607421875, 0.6078643798828125, 0.665252685546875, 0.7226409912109375, 0.780029296875, 0.8374176025390625, 0.894805908203125, 0.9521942138671875, 1.00958251953125, 1.0669708251953125, 1.124359130859375, 1.1817474365234375, 1.2391357421875, 1.2965240478515625, 1.353912353515625, 1.4113006591796875, 1.46868896484375, 1.5260772705078125, 1.583465576171875, 1.6408538818359375, 1.6982421875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 16.0, 47.0, 220.0, 435.0, 170.0, 66.0, 23.0, 15.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.01068115234375, -7.736680030822754, -7.4626784324646, -7.1886773109436035, -6.914675712585449, -6.640674591064453, -6.366673469543457, -6.092671871185303, -5.818670272827148, -5.544669151306152, -5.270667552947998, -4.996666431427002, -4.722664833068848, -4.448663711547852, -4.1746625900268555, -3.900660991668701, -3.626659870147705, -3.35265851020813, -3.0786571502685547, -2.8046560287475586, -2.5306544303894043, -2.256653308868408, -1.982651948928833, -1.7086505889892578, -1.4346492290496826, -1.1606478691101074, -0.886646568775177, -0.6126452684402466, -0.3386439085006714, -0.06464254856109619, 0.20935869216918945, 0.48336005210876465, 0.7573614120483398, 1.031362771987915, 1.3053641319274902, 1.5793653726577759, 1.853366732597351, 2.1273679733276367, 2.401369333267212, 2.675370693206787, 2.9493720531463623, 3.2233734130859375, 3.4973747730255127, 3.771376132965088, 4.045377254486084, 4.319378852844238, 4.593379974365234, 4.8673810958862305, 5.141382694244385, 5.415383815765381, 5.689385414123535, 5.963386535644531, 6.2373881340026855, 6.511389255523682, 6.785390853881836, 7.059391975402832, 7.333393096923828, 7.607394218444824, 7.8813958168029785, 8.155397415161133, 8.429398536682129, 8.703399658203125, 8.977400779724121, 9.251401901245117, 9.52540397644043]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 12.0, 7.0, 17.0, 20.0, 20.0, 24.0, 25.0, 43.0, 33.0, 47.0, 37.0, 53.0, 48.0, 48.0, 53.0, 37.0, 55.0, 43.0, 38.0, 34.0, 46.0, 34.0, 32.0, 38.0, 28.0, 21.0, 23.0, 8.0, 16.0, 12.0, 12.0, 5.0, 10.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.625326633453369, -2.5382437705993652, -2.4511609077453613, -2.3640780448913574, -2.2769951820373535, -2.1899120807647705, -2.1028292179107666, -2.0157463550567627, -1.9286634922027588, -1.8415806293487549, -1.754497766494751, -1.6674147844314575, -1.5803319215774536, -1.4932490587234497, -1.4061660766601562, -1.3190832138061523, -1.2320003509521484, -1.1449174880981445, -1.0578346252441406, -0.9707516431808472, -0.8836687803268433, -0.7965859174728394, -0.7095029950141907, -0.622420072555542, -0.5353372097015381, -0.4482543170452118, -0.3611714243888855, -0.2740885317325592, -0.1870056390762329, -0.09992274641990662, -0.012839853763580322, 0.07424306869506836, 0.16132616996765137, 0.24840906262397766, 0.33549195528030396, 0.42257484793663025, 0.5096577405929565, 0.5967406034469604, 0.6838235259056091, 0.7709064483642578, 0.8579893112182617, 0.9450721740722656, 1.0321550369262695, 1.119238018989563, 1.206320881843567, 1.2934037446975708, 1.3804867267608643, 1.4675695896148682, 1.554652452468872, 1.641735315322876, 1.7288181781768799, 1.8159011602401733, 1.9029840230941772, 1.9900668859481812, 2.0771498680114746, 2.1642327308654785, 2.2513155937194824, 2.3383984565734863, 2.4254813194274902, 2.512564182281494, 2.599647045135498, 2.686730146408081, 2.773813009262085, 2.860895872116089, 2.9479787349700928]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 10.0, 17.0, 39.0, 47.0, 55.0, 110.0, 179.0, 339.0, 659.0, 1277.0, 2695.0, 5928.0, 15080.0, 44198.0, 196116.0, 601802.0, 125705.0, 32861.0, 11805.0, 5072.0, 2195.0, 1060.0, 552.0, 302.0, 161.0, 127.0, 46.0, 28.0, 22.0, 22.0, 12.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2695770263671875, -1.231536865234375, -1.1934967041015625, -1.15545654296875, -1.1174163818359375, -1.079376220703125, -1.0413360595703125, -1.0032958984375, -0.9652557373046875, -0.927215576171875, -0.8891754150390625, -0.85113525390625, -0.8130950927734375, -0.775054931640625, -0.7370147705078125, -0.698974609375, -0.6609344482421875, -0.622894287109375, -0.5848541259765625, -0.54681396484375, -0.5087738037109375, -0.470733642578125, -0.4326934814453125, -0.3946533203125, -0.3566131591796875, -0.318572998046875, -0.2805328369140625, -0.24249267578125, -0.2044525146484375, -0.166412353515625, -0.1283721923828125, -0.09033203125, -0.0522918701171875, -0.014251708984375, 0.0237884521484375, 0.06182861328125, 0.0998687744140625, 0.137908935546875, 0.1759490966796875, 0.2139892578125, 0.2520294189453125, 0.290069580078125, 0.3281097412109375, 0.36614990234375, 0.4041900634765625, 0.442230224609375, 0.4802703857421875, 0.518310546875, 0.5563507080078125, 0.594390869140625, 0.6324310302734375, 0.67047119140625, 0.7085113525390625, 0.746551513671875, 0.7845916748046875, 0.8226318359375, 0.8606719970703125, 0.898712158203125, 0.9367523193359375, 0.97479248046875, 1.0128326416015625, 1.050872802734375, 1.0889129638671875, 1.126953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 6.0, 14.0, 13.0, 21.0, 16.0, 23.0, 29.0, 37.0, 45.0, 54.0, 51.0, 64.0, 63.0, 65.0, 72.0, 67.0, 64.0, 54.0, 49.0, 42.0, 31.0, 33.0, 14.0, 21.0, 13.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5447540283203125, -0.527496337890625, -0.5102386474609375, -0.49298095703125, -0.4757232666015625, -0.458465576171875, -0.4412078857421875, -0.4239501953125, -0.4066925048828125, -0.389434814453125, -0.3721771240234375, -0.35491943359375, -0.3376617431640625, -0.320404052734375, -0.3031463623046875, -0.285888671875, -0.2686309814453125, -0.251373291015625, -0.2341156005859375, -0.21685791015625, -0.1996002197265625, -0.182342529296875, -0.1650848388671875, -0.1478271484375, -0.1305694580078125, -0.113311767578125, -0.0960540771484375, -0.07879638671875, -0.0615386962890625, -0.044281005859375, -0.0270233154296875, -0.009765625, 0.0074920654296875, 0.024749755859375, 0.0420074462890625, 0.05926513671875, 0.0765228271484375, 0.093780517578125, 0.1110382080078125, 0.1282958984375, 0.1455535888671875, 0.162811279296875, 0.1800689697265625, 0.19732666015625, 0.2145843505859375, 0.231842041015625, 0.2490997314453125, 0.266357421875, 0.2836151123046875, 0.300872802734375, 0.3181304931640625, 0.33538818359375, 0.3526458740234375, 0.369903564453125, 0.3871612548828125, 0.4044189453125, 0.4216766357421875, 0.438934326171875, 0.4561920166015625, 0.47344970703125, 0.4907073974609375, 0.507965087890625, 0.5252227783203125, 0.54248046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 10.0, 16.0, 14.0, 49.0, 54.0, 113.0, 144.0, 262.0, 472.0, 1046.0, 3157.0, 12454.0, 72205.0, 796844.0, 135634.0, 18797.0, 4552.0, 1438.0, 551.0, 295.0, 166.0, 87.0, 61.0, 34.0, 38.0, 11.0, 10.0, 11.0, 7.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.9443359375, -1.880859375, -1.8173828125, -1.75390625, -1.6904296875, -1.626953125, -1.5634765625, -1.5, -1.4365234375, -1.373046875, -1.3095703125, -1.24609375, -1.1826171875, -1.119140625, -1.0556640625, -0.9921875, -0.9287109375, -0.865234375, -0.8017578125, -0.73828125, -0.6748046875, -0.611328125, -0.5478515625, -0.484375, -0.4208984375, -0.357421875, -0.2939453125, -0.23046875, -0.1669921875, -0.103515625, -0.0400390625, 0.0234375, 0.0869140625, 0.150390625, 0.2138671875, 0.27734375, 0.3408203125, 0.404296875, 0.4677734375, 0.53125, 0.5947265625, 0.658203125, 0.7216796875, 0.78515625, 0.8486328125, 0.912109375, 0.9755859375, 1.0390625, 1.1025390625, 1.166015625, 1.2294921875, 1.29296875, 1.3564453125, 1.419921875, 1.4833984375, 1.546875, 1.6103515625, 1.673828125, 1.7373046875, 1.80078125, 1.8642578125, 1.927734375, 1.9912109375, 2.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 14.0, 24.0, 31.0, 37.0, 52.0, 66.0, 89.0, 102.0, 119.0, 100.0, 97.0, 75.0, 52.0, 39.0, 38.0, 22.0, 10.0, 12.0, 5.0, 9.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.680908203125, -4.53369140625, -4.386474609375, -4.2392578125, -4.092041015625, -3.94482421875, -3.797607421875, -3.650390625, -3.503173828125, -3.35595703125, -3.208740234375, -3.0615234375, -2.914306640625, -2.76708984375, -2.619873046875, -2.47265625, -2.325439453125, -2.17822265625, -2.031005859375, -1.8837890625, -1.736572265625, -1.58935546875, -1.442138671875, -1.294921875, -1.147705078125, -1.00048828125, -0.853271484375, -0.7060546875, -0.558837890625, -0.41162109375, -0.264404296875, -0.1171875, 0.030029296875, 0.17724609375, 0.324462890625, 0.4716796875, 0.618896484375, 0.76611328125, 0.913330078125, 1.060546875, 1.207763671875, 1.35498046875, 1.502197265625, 1.6494140625, 1.796630859375, 1.94384765625, 2.091064453125, 2.23828125, 2.385498046875, 2.53271484375, 2.679931640625, 2.8271484375, 2.974365234375, 3.12158203125, 3.268798828125, 3.416015625, 3.563232421875, 3.71044921875, 3.857666015625, 4.0048828125, 4.152099609375, 4.29931640625, 4.446533203125, 4.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 4.0, 11.0, 15.0, 29.0, 73.0, 201.0, 727.0, 5874.0, 916234.0, 121621.0, 3019.0, 483.0, 140.0, 55.0, 29.0, 12.0, 12.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.828125, -2.753448486328125, -2.67877197265625, -2.604095458984375, -2.5294189453125, -2.454742431640625, -2.38006591796875, -2.305389404296875, -2.230712890625, -2.156036376953125, -2.08135986328125, -2.006683349609375, -1.9320068359375, -1.857330322265625, -1.78265380859375, -1.707977294921875, -1.63330078125, -1.558624267578125, -1.48394775390625, -1.409271240234375, -1.3345947265625, -1.259918212890625, -1.18524169921875, -1.110565185546875, -1.035888671875, -0.961212158203125, -0.88653564453125, -0.811859130859375, -0.7371826171875, -0.662506103515625, -0.58782958984375, -0.513153076171875, -0.4384765625, -0.363800048828125, -0.28912353515625, -0.214447021484375, -0.1397705078125, -0.065093994140625, 0.00958251953125, 0.084259033203125, 0.158935546875, 0.233612060546875, 0.30828857421875, 0.382965087890625, 0.4576416015625, 0.532318115234375, 0.60699462890625, 0.681671142578125, 0.75634765625, 0.831024169921875, 0.90570068359375, 0.980377197265625, 1.0550537109375, 1.129730224609375, 1.20440673828125, 1.279083251953125, 1.353759765625, 1.428436279296875, 1.50311279296875, 1.577789306640625, 1.6524658203125, 1.727142333984375, 1.80181884765625, 1.876495361328125, 1.951171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 6.0, 2.0, 12.0, 4.0, 12.0, 15.0, 35.0, 43.0, 52.0, 90.0, 83.0, 129.0, 125.0, 90.0, 78.0, 58.0, 44.0, 28.0, 23.0, 19.0, 14.0, 6.0, 8.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.712841033935547e-05, -7.456168532371521e-05, -7.199496030807495e-05, -6.942823529243469e-05, -6.686151027679443e-05, -6.429478526115417e-05, -6.172806024551392e-05, -5.916133522987366e-05, -5.65946102142334e-05, -5.402788519859314e-05, -5.146116018295288e-05, -4.889443516731262e-05, -4.632771015167236e-05, -4.3760985136032104e-05, -4.1194260120391846e-05, -3.862753510475159e-05, -3.606081008911133e-05, -3.349408507347107e-05, -3.092736005783081e-05, -2.8360635042190552e-05, -2.5793910026550293e-05, -2.3227185010910034e-05, -2.0660459995269775e-05, -1.8093734979629517e-05, -1.5527009963989258e-05, -1.2960284948348999e-05, -1.039355993270874e-05, -7.826834917068481e-06, -5.260109901428223e-06, -2.693384885787964e-06, -1.2665987014770508e-07, 2.4400651454925537e-06, 5.0067901611328125e-06, 7.573515176773071e-06, 1.014024019241333e-05, 1.2706965208053589e-05, 1.5273690223693848e-05, 1.7840415239334106e-05, 2.0407140254974365e-05, 2.2973865270614624e-05, 2.5540590286254883e-05, 2.810731530189514e-05, 3.06740403175354e-05, 3.324076533317566e-05, 3.580749034881592e-05, 3.837421536445618e-05, 4.0940940380096436e-05, 4.3507665395736694e-05, 4.607439041137695e-05, 4.864111542701721e-05, 5.120784044265747e-05, 5.377456545829773e-05, 5.634129047393799e-05, 5.890801548957825e-05, 6.14747405052185e-05, 6.404146552085876e-05, 6.660819053649902e-05, 6.917491555213928e-05, 7.174164056777954e-05, 7.43083655834198e-05, 7.687509059906006e-05, 7.944181561470032e-05, 8.200854063034058e-05, 8.457526564598083e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 11.0, 25.0, 50.0, 94.0, 215.0, 587.0, 2889.0, 86474.0, 949492.0, 7120.0, 1011.0, 329.0, 116.0, 70.0, 29.0, 18.0, 13.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.5905914306640625, -1.522003173828125, -1.4534149169921875, -1.38482666015625, -1.3162384033203125, -1.247650146484375, -1.1790618896484375, -1.1104736328125, -1.0418853759765625, -0.973297119140625, -0.9047088623046875, -0.83612060546875, -0.7675323486328125, -0.698944091796875, -0.6303558349609375, -0.561767578125, -0.4931793212890625, -0.424591064453125, -0.3560028076171875, -0.28741455078125, -0.2188262939453125, -0.150238037109375, -0.0816497802734375, -0.0130615234375, 0.0555267333984375, 0.124114990234375, 0.1927032470703125, 0.26129150390625, 0.3298797607421875, 0.398468017578125, 0.4670562744140625, 0.53564453125, 0.6042327880859375, 0.672821044921875, 0.7414093017578125, 0.80999755859375, 0.8785858154296875, 0.947174072265625, 1.0157623291015625, 1.0843505859375, 1.1529388427734375, 1.221527099609375, 1.2901153564453125, 1.35870361328125, 1.4272918701171875, 1.495880126953125, 1.5644683837890625, 1.633056640625, 1.7016448974609375, 1.770233154296875, 1.8388214111328125, 1.90740966796875, 1.9759979248046875, 2.044586181640625, 2.1131744384765625, 2.1817626953125, 2.2503509521484375, 2.318939208984375, 2.3875274658203125, 2.45611572265625, 2.5247039794921875, 2.593292236328125, 2.6618804931640625, 2.73046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 3.0, 14.0, 16.0, 29.0, 123.0, 400.0, 264.0, 65.0, 39.0, 25.0, 16.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2168426513671875, -1.139739990234375, -1.0626373291015625, -0.98553466796875, -0.9084320068359375, -0.831329345703125, -0.7542266845703125, -0.6771240234375, -0.6000213623046875, -0.522918701171875, -0.4458160400390625, -0.36871337890625, -0.2916107177734375, -0.214508056640625, -0.1374053955078125, -0.060302734375, 0.0167999267578125, 0.093902587890625, 0.1710052490234375, 0.24810791015625, 0.3252105712890625, 0.402313232421875, 0.4794158935546875, 0.5565185546875, 0.6336212158203125, 0.710723876953125, 0.7878265380859375, 0.86492919921875, 0.9420318603515625, 1.019134521484375, 1.0962371826171875, 1.17333984375, 1.2504425048828125, 1.327545166015625, 1.4046478271484375, 1.48175048828125, 1.5588531494140625, 1.635955810546875, 1.7130584716796875, 1.7901611328125, 1.8672637939453125, 1.944366455078125, 2.0214691162109375, 2.09857177734375, 2.1756744384765625, 2.252777099609375, 2.3298797607421875, 2.406982421875, 2.4840850830078125, 2.561187744140625, 2.6382904052734375, 2.71539306640625, 2.7924957275390625, 2.869598388671875, 2.9467010498046875, 3.0238037109375, 3.1009063720703125, 3.178009033203125, 3.2551116943359375, 3.33221435546875, 3.4093170166015625, 3.486419677734375, 3.5635223388671875, 3.640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 32.0, 110.0, 347.0, 388.0, 93.0, 15.0, 17.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.912158966064453, -4.955289840698242, -3.998420476913452, -3.041551113128662, -2.084681987762451, -1.1278128623962402, -0.1709432601928711, 0.7859258651733398, 1.7427949905395508, 2.6996641159057617, 3.6565334796905518, 4.613402843475342, 5.570271968841553, 6.527141094207764, 7.484010696411133, 8.440879821777344, 9.397748947143555, 10.354618072509766, 11.311487197875977, 12.268356323242188, 13.225225448608398, 14.18209457397461, 15.138964653015137, 16.09583282470703, 17.052703857421875, 18.009572982788086, 18.966442108154297, 19.923311233520508, 20.88018035888672, 21.83704948425293, 22.79391860961914, 23.750789642333984, 24.707656860351562, 25.664525985717773, 26.621395111083984, 27.578264236450195, 28.535133361816406, 29.492002487182617, 30.448871612548828, 31.405742645263672, 32.36260986328125, 33.319480895996094, 34.27634811401367, 35.233219146728516, 36.190086364746094, 37.14695739746094, 38.103824615478516, 39.06069564819336, 40.01756286621094, 40.97443389892578, 41.93130111694336, 42.8881721496582, 43.84503936767578, 44.801910400390625, 45.7587776184082, 46.71564865112305, 47.67251968383789, 48.629390716552734, 49.58625793457031, 50.543128967285156, 51.499996185302734, 52.45686721801758, 53.413734436035156, 54.37060546875, 55.32747268676758]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 5.0, 4.0, 6.0, 9.0, 19.0, 11.0, 21.0, 26.0, 26.0, 30.0, 32.0, 38.0, 29.0, 34.0, 47.0, 36.0, 46.0, 36.0, 45.0, 45.0, 39.0, 45.0, 37.0, 38.0, 40.0, 36.0, 32.0, 22.0, 26.0, 18.0, 19.0, 18.0, 11.0, 16.0, 10.0, 6.0, 4.0, 5.0, 8.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.764122009277344, -10.41481876373291, -10.06551456451416, -9.716211318969727, -9.366907119750977, -9.017603874206543, -8.66830062866211, -8.31899642944336, -7.969693183898926, -7.620389461517334, -7.271085739135742, -6.921782493591309, -6.572478771209717, -6.223175048828125, -5.873871803283691, -5.5245680809021, -5.175264358520508, -4.825960636138916, -4.476656913757324, -4.127353668212891, -3.778049945831299, -3.428746223449707, -3.0794427394866943, -2.7301392555236816, -2.38083553314209, -2.031531810760498, -1.6822283267974854, -1.332924723625183, -0.9836211204528809, -0.6343175172805786, -0.28501391410827637, 0.06428956985473633, 0.4135932922363281, 0.7628968954086304, 1.1122004985809326, 1.4615041017532349, 1.810807704925537, 2.160111427307129, 2.5094149112701416, 2.8587183952331543, 3.208022117614746, 3.557325839996338, 3.9066293239593506, 4.255932807922363, 4.605236530303955, 4.954540252685547, 5.3038434982299805, 5.653147220611572, 6.002450942993164, 6.351754665374756, 6.701058387756348, 7.050361633300781, 7.399665355682373, 7.748969078063965, 8.098272323608398, 8.447576522827148, 8.796879768371582, 9.146183013916016, 9.495487213134766, 9.8447904586792, 10.194093704223633, 10.543397903442383, 10.892701148986816, 11.24200439453125, 11.59130859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 4.0, 3.0, 8.0, 9.0, 4.0, 7.0, 19.0, 14.0, 30.0, 29.0, 32.0, 46.0, 35.0, 38.0, 52.0, 72.0, 173.0, 1077.0, 4082449.0, 108795.0, 832.0, 159.0, 77.0, 37.0, 30.0, 50.0, 24.0, 23.0, 23.0, 25.0, 11.0, 15.0, 15.0, 18.0, 6.0, 1.0, 6.0, 8.0, 2.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.75390625, -3.63995361328125, -3.5260009765625, -3.41204833984375, -3.298095703125, -3.18414306640625, -3.0701904296875, -2.95623779296875, -2.84228515625, -2.72833251953125, -2.6143798828125, -2.50042724609375, -2.386474609375, -2.27252197265625, -2.1585693359375, -2.04461669921875, -1.9306640625, -1.81671142578125, -1.7027587890625, -1.58880615234375, -1.474853515625, -1.36090087890625, -1.2469482421875, -1.13299560546875, -1.01904296875, -0.90509033203125, -0.7911376953125, -0.67718505859375, -0.563232421875, -0.44927978515625, -0.3353271484375, -0.22137451171875, -0.107421875, 0.00653076171875, 0.1204833984375, 0.23443603515625, 0.348388671875, 0.46234130859375, 0.5762939453125, 0.69024658203125, 0.80419921875, 0.91815185546875, 1.0321044921875, 1.14605712890625, 1.260009765625, 1.37396240234375, 1.4879150390625, 1.60186767578125, 1.7158203125, 1.82977294921875, 1.9437255859375, 2.05767822265625, 2.171630859375, 2.28558349609375, 2.3995361328125, 2.51348876953125, 2.62744140625, 2.74139404296875, 2.8553466796875, 2.96929931640625, 3.083251953125, 3.19720458984375, 3.3111572265625, 3.42510986328125, 3.5390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 10.0, 12.0, 13.0, 14.0, 21.0, 27.0, 24.0, 32.0, 34.0, 52.0, 55.0, 45.0, 59.0, 55.0, 58.0, 71.0, 68.0, 58.0, 59.0, 56.0, 26.0, 29.0, 17.0, 23.0, 12.0, 14.0, 14.0, 6.0, 11.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.734375, -0.7141265869140625, -0.693878173828125, -0.6736297607421875, -0.65338134765625, -0.6331329345703125, -0.612884521484375, -0.5926361083984375, -0.5723876953125, -0.5521392822265625, -0.531890869140625, -0.5116424560546875, -0.49139404296875, -0.4711456298828125, -0.450897216796875, -0.4306488037109375, -0.410400390625, -0.3901519775390625, -0.369903564453125, -0.3496551513671875, -0.32940673828125, -0.3091583251953125, -0.288909912109375, -0.2686614990234375, -0.2484130859375, -0.2281646728515625, -0.207916259765625, -0.1876678466796875, -0.16741943359375, -0.1471710205078125, -0.126922607421875, -0.1066741943359375, -0.08642578125, -0.0661773681640625, -0.045928955078125, -0.0256805419921875, -0.00543212890625, 0.0148162841796875, 0.035064697265625, 0.0553131103515625, 0.0755615234375, 0.0958099365234375, 0.116058349609375, 0.1363067626953125, 0.15655517578125, 0.1768035888671875, 0.197052001953125, 0.2173004150390625, 0.237548828125, 0.2577972412109375, 0.278045654296875, 0.2982940673828125, 0.31854248046875, 0.3387908935546875, 0.359039306640625, 0.3792877197265625, 0.3995361328125, 0.4197845458984375, 0.440032958984375, 0.4602813720703125, 0.48052978515625, 0.5007781982421875, 0.521026611328125, 0.5412750244140625, 0.5615234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 0.0, 4.0, 3.0, 6.0, 10.0, 14.0, 15.0, 17.0, 15.0, 26.0, 26.0, 21.0, 42.0, 38.0, 32.0, 37.0, 64.0, 113.0, 221.0, 1264.0, 4118172.0, 72715.0, 903.0, 165.0, 67.0, 45.0, 40.0, 38.0, 30.0, 20.0, 21.0, 20.0, 18.0, 16.0, 6.0, 10.0, 11.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.97265625, -3.84417724609375, -3.7156982421875, -3.58721923828125, -3.458740234375, -3.33026123046875, -3.2017822265625, -3.07330322265625, -2.94482421875, -2.81634521484375, -2.6878662109375, -2.55938720703125, -2.430908203125, -2.30242919921875, -2.1739501953125, -2.04547119140625, -1.9169921875, -1.78851318359375, -1.6600341796875, -1.53155517578125, -1.403076171875, -1.27459716796875, -1.1461181640625, -1.01763916015625, -0.88916015625, -0.76068115234375, -0.6322021484375, -0.50372314453125, -0.375244140625, -0.24676513671875, -0.1182861328125, 0.01019287109375, 0.138671875, 0.26715087890625, 0.3956298828125, 0.52410888671875, 0.652587890625, 0.78106689453125, 0.9095458984375, 1.03802490234375, 1.16650390625, 1.29498291015625, 1.4234619140625, 1.55194091796875, 1.680419921875, 1.80889892578125, 1.9373779296875, 2.06585693359375, 2.1943359375, 2.32281494140625, 2.4512939453125, 2.57977294921875, 2.708251953125, 2.83673095703125, 2.9652099609375, 3.09368896484375, 3.22216796875, 3.35064697265625, 3.4791259765625, 3.60760498046875, 3.736083984375, 3.86456298828125, 3.9930419921875, 4.12152099609375, 4.25]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 68.0, 3977.0, 28.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.3203125, -2.2797317504882812, -2.2391510009765625, -2.1985702514648438, -2.157989501953125, -2.1174087524414062, -2.0768280029296875, -2.0362472534179688, -1.99566650390625, -1.9550857543945312, -1.9145050048828125, -1.8739242553710938, -1.833343505859375, -1.7927627563476562, -1.7521820068359375, -1.7116012573242188, -1.6710205078125, -1.6304397583007812, -1.5898590087890625, -1.5492782592773438, -1.508697509765625, -1.4681167602539062, -1.4275360107421875, -1.3869552612304688, -1.34637451171875, -1.3057937622070312, -1.2652130126953125, -1.2246322631835938, -1.184051513671875, -1.1434707641601562, -1.1028900146484375, -1.0623092651367188, -1.021728515625, -0.9811477661132812, -0.9405670166015625, -0.8999862670898438, -0.859405517578125, -0.8188247680664062, -0.7782440185546875, -0.7376632690429688, -0.69708251953125, -0.6565017700195312, -0.6159210205078125, -0.5753402709960938, -0.534759521484375, -0.49417877197265625, -0.4535980224609375, -0.41301727294921875, -0.3724365234375, -0.33185577392578125, -0.2912750244140625, -0.25069427490234375, -0.210113525390625, -0.16953277587890625, -0.1289520263671875, -0.08837127685546875, -0.04779052734375, -0.00720977783203125, 0.0333709716796875, 0.07395172119140625, 0.114532470703125, 0.15511322021484375, 0.1956939697265625, 0.23627471923828125, 0.27685546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 16.0, 26.0, 26.0, 31.0, 45.0, 74.0, 126.0, 217.0, 196.0, 101.0, 58.0, 23.0, 15.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017465829849243, -1.9765594005584717, -1.9356529712677002, -1.8947465419769287, -1.8538401126861572, -1.8129336833953857, -1.7720272541046143, -1.7311207056045532, -1.6902142763137817, -1.6493078470230103, -1.6084014177322388, -1.5674949884414673, -1.5265885591506958, -1.4856820106506348, -1.4447755813598633, -1.4038691520690918, -1.3629627227783203, -1.3220562934875488, -1.2811498641967773, -1.2402434349060059, -1.1993370056152344, -1.158430576324463, -1.1175241470336914, -1.0766175985336304, -1.0357112884521484, -0.994804859161377, -0.9538984298706055, -0.912992000579834, -0.8720855116844177, -0.8311790823936462, -0.7902726531028748, -0.7493661642074585, -0.708459734916687, -0.6675533056259155, -0.626646876335144, -0.5857404470443726, -0.5448339581489563, -0.5039275288581848, -0.46302109956741333, -0.42211464047431946, -0.381208211183548, -0.3403017818927765, -0.2993953227996826, -0.25848889350891113, -0.21758244931697845, -0.17667600512504578, -0.1357695758342743, -0.09486311674118042, -0.053956687450408936, -0.013050246983766556, 0.027856193482875824, 0.0687626302242279, 0.10966907441616058, 0.15057551860809326, 0.19148194789886475, 0.23238840699195862, 0.2732948362827301, 0.3142012655735016, 0.35510772466659546, 0.39601415395736694, 0.4369205832481384, 0.4778270423412323, 0.5187335014343262, 0.5596399307250977, 0.6005463600158691]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 11.0, 5.0, 5.0, 11.0, 5.0, 6.0, 17.0, 10.0, 15.0, 16.0, 32.0, 26.0, 31.0, 25.0, 32.0, 26.0, 31.0, 48.0, 40.0, 30.0, 39.0, 50.0, 51.0, 40.0, 32.0, 35.0, 31.0, 37.0, 35.0, 27.0, 31.0, 24.0, 20.0, 17.0, 26.0, 18.0, 11.0, 5.0, 12.0, 10.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2060596942901611, -1.1651848554611206, -1.1243101358413696, -1.083435297012329, -1.0425605773925781, -1.0016857385635376, -0.9608110189437866, -0.9199361801147461, -0.8790614604949951, -0.8381866812705994, -0.7973119020462036, -0.7564371228218079, -0.7155623435974121, -0.6746875643730164, -0.6338127851486206, -0.5929379463195801, -0.5520631670951843, -0.5111883878707886, -0.4703136086463928, -0.42943882942199707, -0.3885640501976013, -0.34768927097320557, -0.3068144619464874, -0.2659396827220917, -0.22506490349769592, -0.18419012427330017, -0.14331534504890442, -0.10244055092334747, -0.06156577169895172, -0.02069099247455597, 0.020183801651000977, 0.06105858087539673, 0.10193336009979248, 0.14280813932418823, 0.18368291854858398, 0.22455771267414093, 0.2654324769973755, 0.30630725622177124, 0.3471820652484894, 0.38805684447288513, 0.4289316236972809, 0.46980640292167664, 0.5106812119483948, 0.5515559911727905, 0.5924307703971863, 0.633305549621582, 0.6741803288459778, 0.7150551080703735, 0.7559298872947693, 0.796804666519165, 0.8376794457435608, 0.8785542249679565, 0.9194290041923523, 0.960303783416748, 1.0011786222457886, 1.0420533418655396, 1.08292818069458, 1.1238030195236206, 1.1646777391433716, 1.205552577972412, 1.246427297592163, 1.2873021364212036, 1.3281768560409546, 1.3690516948699951, 1.409926414489746]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 1.0, 7.0, 10.0, 2.0, 9.0, 15.0, 12.0, 30.0, 39.0, 48.0, 77.0, 133.0, 283.0, 635.0, 1607.0, 4606.0, 14447.0, 55968.0, 313132.0, 527778.0, 96528.0, 22373.0, 6716.0, 2344.0, 931.0, 380.0, 183.0, 71.0, 60.0, 34.0, 17.0, 18.0, 7.0, 10.0, 8.0, 8.0, 6.0, 3.0, 4.0, 6.0, 0.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.1588592529296875, -1.120452880859375, -1.0820465087890625, -1.04364013671875, -1.0052337646484375, -0.966827392578125, -0.9284210205078125, -0.8900146484375, -0.8516082763671875, -0.813201904296875, -0.7747955322265625, -0.73638916015625, -0.6979827880859375, -0.659576416015625, -0.6211700439453125, -0.582763671875, -0.5443572998046875, -0.505950927734375, -0.4675445556640625, -0.42913818359375, -0.3907318115234375, -0.352325439453125, -0.3139190673828125, -0.2755126953125, -0.2371063232421875, -0.198699951171875, -0.1602935791015625, -0.12188720703125, -0.0834808349609375, -0.045074462890625, -0.0066680908203125, 0.03173828125, 0.0701446533203125, 0.108551025390625, 0.1469573974609375, 0.18536376953125, 0.2237701416015625, 0.262176513671875, 0.3005828857421875, 0.3389892578125, 0.3773956298828125, 0.415802001953125, 0.4542083740234375, 0.49261474609375, 0.5310211181640625, 0.569427490234375, 0.6078338623046875, 0.646240234375, 0.6846466064453125, 0.723052978515625, 0.7614593505859375, 0.79986572265625, 0.8382720947265625, 0.876678466796875, 0.9150848388671875, 0.9534912109375, 0.9918975830078125, 1.030303955078125, 1.0687103271484375, 1.10711669921875, 1.1455230712890625, 1.183929443359375, 1.2223358154296875, 1.2607421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 5.0, 11.0, 12.0, 13.0, 21.0, 29.0, 20.0, 27.0, 38.0, 47.0, 40.0, 45.0, 52.0, 53.0, 56.0, 54.0, 53.0, 52.0, 42.0, 53.0, 41.0, 30.0, 22.0, 42.0, 24.0, 21.0, 17.0, 15.0, 4.0, 8.0, 10.0, 3.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6785354614257812, -0.6568756103515625, -0.6352157592773438, -0.613555908203125, -0.5918960571289062, -0.5702362060546875, -0.5485763549804688, -0.52691650390625, -0.5052566528320312, -0.4835968017578125, -0.46193695068359375, -0.440277099609375, -0.41861724853515625, -0.3969573974609375, -0.37529754638671875, -0.3536376953125, -0.33197784423828125, -0.3103179931640625, -0.28865814208984375, -0.266998291015625, -0.24533843994140625, -0.2236785888671875, -0.20201873779296875, -0.18035888671875, -0.15869903564453125, -0.1370391845703125, -0.11537933349609375, -0.093719482421875, -0.07205963134765625, -0.0503997802734375, -0.02873992919921875, -0.007080078125, 0.01457977294921875, 0.0362396240234375, 0.05789947509765625, 0.079559326171875, 0.10121917724609375, 0.1228790283203125, 0.14453887939453125, 0.16619873046875, 0.18785858154296875, 0.2095184326171875, 0.23117828369140625, 0.252838134765625, 0.27449798583984375, 0.2961578369140625, 0.31781768798828125, 0.3394775390625, 0.36113739013671875, 0.3827972412109375, 0.40445709228515625, 0.426116943359375, 0.44777679443359375, 0.4694366455078125, 0.49109649658203125, 0.51275634765625, 0.5344161987304688, 0.5560760498046875, 0.5777359008789062, 0.599395751953125, 0.6210556030273438, 0.6427154541015625, 0.6643753051757812, 0.68603515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 8.0, 16.0, 21.0, 21.0, 28.0, 52.0, 66.0, 102.0, 155.0, 291.0, 556.0, 1127.0, 2823.0, 9039.0, 38197.0, 322204.0, 593530.0, 61183.0, 12331.0, 3800.0, 1426.0, 673.0, 320.0, 186.0, 128.0, 81.0, 50.0, 32.0, 23.0, 17.0, 10.0, 10.0, 9.0, 4.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3798065185546875, -1.328948974609375, -1.2780914306640625, -1.22723388671875, -1.1763763427734375, -1.125518798828125, -1.0746612548828125, -1.0238037109375, -0.9729461669921875, -0.922088623046875, -0.8712310791015625, -0.82037353515625, -0.7695159912109375, -0.718658447265625, -0.6678009033203125, -0.616943359375, -0.5660858154296875, -0.515228271484375, -0.4643707275390625, -0.41351318359375, -0.3626556396484375, -0.311798095703125, -0.2609405517578125, -0.2100830078125, -0.1592254638671875, -0.108367919921875, -0.0575103759765625, -0.00665283203125, 0.0442047119140625, 0.095062255859375, 0.1459197998046875, 0.19677734375, 0.2476348876953125, 0.298492431640625, 0.3493499755859375, 0.40020751953125, 0.4510650634765625, 0.501922607421875, 0.5527801513671875, 0.6036376953125, 0.6544952392578125, 0.705352783203125, 0.7562103271484375, 0.80706787109375, 0.8579254150390625, 0.908782958984375, 0.9596405029296875, 1.010498046875, 1.0613555908203125, 1.112213134765625, 1.1630706787109375, 1.21392822265625, 1.2647857666015625, 1.315643310546875, 1.3665008544921875, 1.4173583984375, 1.4682159423828125, 1.519073486328125, 1.5699310302734375, 1.62078857421875, 1.6716461181640625, 1.722503662109375, 1.7733612060546875, 1.82421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 8.0, 7.0, 9.0, 10.0, 23.0, 22.0, 30.0, 26.0, 38.0, 48.0, 54.0, 55.0, 62.0, 45.0, 52.0, 55.0, 61.0, 53.0, 40.0, 43.0, 43.0, 34.0, 28.0, 23.0, 22.0, 21.0, 16.0, 6.0, 13.0, 7.0, 9.0, 2.0, 8.0, 9.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.30859375, -4.185028076171875, -4.06146240234375, -3.937896728515625, -3.8143310546875, -3.690765380859375, -3.56719970703125, -3.443634033203125, -3.320068359375, -3.196502685546875, -3.07293701171875, -2.949371337890625, -2.8258056640625, -2.702239990234375, -2.57867431640625, -2.455108642578125, -2.33154296875, -2.207977294921875, -2.08441162109375, -1.960845947265625, -1.8372802734375, -1.713714599609375, -1.59014892578125, -1.466583251953125, -1.343017578125, -1.219451904296875, -1.09588623046875, -0.972320556640625, -0.8487548828125, -0.725189208984375, -0.60162353515625, -0.478057861328125, -0.3544921875, -0.230926513671875, -0.10736083984375, 0.016204833984375, 0.1397705078125, 0.263336181640625, 0.38690185546875, 0.510467529296875, 0.634033203125, 0.757598876953125, 0.88116455078125, 1.004730224609375, 1.1282958984375, 1.251861572265625, 1.37542724609375, 1.498992919921875, 1.62255859375, 1.746124267578125, 1.86968994140625, 1.993255615234375, 2.1168212890625, 2.240386962890625, 2.36395263671875, 2.487518310546875, 2.611083984375, 2.734649658203125, 2.85821533203125, 2.981781005859375, 3.1053466796875, 3.228912353515625, 3.35247802734375, 3.476043701171875, 3.599609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 11.0, 12.0, 15.0, 13.0, 18.0, 16.0, 22.0, 47.0, 118.0, 409.0, 1848.0, 14202.0, 968349.0, 58613.0, 3753.0, 715.0, 183.0, 63.0, 43.0, 24.0, 14.0, 11.0, 12.0, 9.0, 7.0, 5.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8505859375, -1.792205810546875, -1.73382568359375, -1.675445556640625, -1.6170654296875, -1.558685302734375, -1.50030517578125, -1.441925048828125, -1.383544921875, -1.325164794921875, -1.26678466796875, -1.208404541015625, -1.1500244140625, -1.091644287109375, -1.03326416015625, -0.974884033203125, -0.91650390625, -0.858123779296875, -0.79974365234375, -0.741363525390625, -0.6829833984375, -0.624603271484375, -0.56622314453125, -0.507843017578125, -0.449462890625, -0.391082763671875, -0.33270263671875, -0.274322509765625, -0.2159423828125, -0.157562255859375, -0.09918212890625, -0.040802001953125, 0.017578125, 0.075958251953125, 0.13433837890625, 0.192718505859375, 0.2510986328125, 0.309478759765625, 0.36785888671875, 0.426239013671875, 0.484619140625, 0.542999267578125, 0.60137939453125, 0.659759521484375, 0.7181396484375, 0.776519775390625, 0.83489990234375, 0.893280029296875, 0.95166015625, 1.010040283203125, 1.06842041015625, 1.126800537109375, 1.1851806640625, 1.243560791015625, 1.30194091796875, 1.360321044921875, 1.418701171875, 1.477081298828125, 1.53546142578125, 1.593841552734375, 1.6522216796875, 1.710601806640625, 1.76898193359375, 1.827362060546875, 1.8857421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 1.0, 4.0, 4.0, 6.0, 17.0, 25.0, 39.0, 26.0, 50.0, 82.0, 84.0, 114.0, 116.0, 103.0, 81.0, 66.0, 54.0, 37.0, 33.0, 13.0, 13.0, 13.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3763389587402344e-05, -5.156174302101135e-05, -4.936009645462036e-05, -4.715844988822937e-05, -4.495680332183838e-05, -4.275515675544739e-05, -4.0553510189056396e-05, -3.8351863622665405e-05, -3.6150217056274414e-05, -3.394857048988342e-05, -3.174692392349243e-05, -2.954527735710144e-05, -2.734363079071045e-05, -2.5141984224319458e-05, -2.2940337657928467e-05, -2.0738691091537476e-05, -1.8537044525146484e-05, -1.6335397958755493e-05, -1.4133751392364502e-05, -1.193210482597351e-05, -9.73045825958252e-06, -7.528811693191528e-06, -5.327165126800537e-06, -3.125518560409546e-06, -9.238719940185547e-07, 1.2777745723724365e-06, 3.4794211387634277e-06, 5.681067705154419e-06, 7.88271427154541e-06, 1.0084360837936401e-05, 1.2286007404327393e-05, 1.4487653970718384e-05, 1.6689300537109375e-05, 1.8890947103500366e-05, 2.1092593669891357e-05, 2.329424023628235e-05, 2.549588680267334e-05, 2.769753336906433e-05, 2.9899179935455322e-05, 3.2100826501846313e-05, 3.4302473068237305e-05, 3.6504119634628296e-05, 3.870576620101929e-05, 4.090741276741028e-05, 4.310905933380127e-05, 4.531070590019226e-05, 4.751235246658325e-05, 4.971399903297424e-05, 5.1915645599365234e-05, 5.4117292165756226e-05, 5.631893873214722e-05, 5.852058529853821e-05, 6.07222318649292e-05, 6.292387843132019e-05, 6.512552499771118e-05, 6.732717156410217e-05, 6.952881813049316e-05, 7.173046469688416e-05, 7.393211126327515e-05, 7.613375782966614e-05, 7.833540439605713e-05, 8.053705096244812e-05, 8.273869752883911e-05, 8.49403440952301e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 4.0, 2.0, 14.0, 9.0, 23.0, 31.0, 45.0, 93.0, 132.0, 276.0, 546.0, 1268.0, 3216.0, 11760.0, 119480.0, 846424.0, 52734.0, 7965.0, 2520.0, 944.0, 479.0, 233.0, 144.0, 66.0, 50.0, 23.0, 13.0, 12.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75146484375, -0.727508544921875, -0.70355224609375, -0.679595947265625, -0.6556396484375, -0.631683349609375, -0.60772705078125, -0.583770751953125, -0.559814453125, -0.535858154296875, -0.51190185546875, -0.487945556640625, -0.4639892578125, -0.440032958984375, -0.41607666015625, -0.392120361328125, -0.3681640625, -0.344207763671875, -0.32025146484375, -0.296295166015625, -0.2723388671875, -0.248382568359375, -0.22442626953125, -0.200469970703125, -0.176513671875, -0.152557373046875, -0.12860107421875, -0.104644775390625, -0.0806884765625, -0.056732177734375, -0.03277587890625, -0.008819580078125, 0.01513671875, 0.039093017578125, 0.06304931640625, 0.087005615234375, 0.1109619140625, 0.134918212890625, 0.15887451171875, 0.182830810546875, 0.206787109375, 0.230743408203125, 0.25469970703125, 0.278656005859375, 0.3026123046875, 0.326568603515625, 0.35052490234375, 0.374481201171875, 0.3984375, 0.422393798828125, 0.44635009765625, 0.470306396484375, 0.4942626953125, 0.518218994140625, 0.54217529296875, 0.566131591796875, 0.590087890625, 0.614044189453125, 0.63800048828125, 0.661956787109375, 0.6859130859375, 0.709869384765625, 0.73382568359375, 0.757781982421875, 0.78173828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 2.0, 8.0, 14.0, 10.0, 18.0, 31.0, 43.0, 97.0, 140.0, 194.0, 170.0, 92.0, 55.0, 42.0, 22.0, 9.0, 4.0, 10.0, 7.0, 3.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.27734375, -1.2327423095703125, -1.188140869140625, -1.1435394287109375, -1.09893798828125, -1.0543365478515625, -1.009735107421875, -0.9651336669921875, -0.9205322265625, -0.8759307861328125, -0.831329345703125, -0.7867279052734375, -0.74212646484375, -0.6975250244140625, -0.652923583984375, -0.6083221435546875, -0.563720703125, -0.5191192626953125, -0.474517822265625, -0.4299163818359375, -0.38531494140625, -0.3407135009765625, -0.296112060546875, -0.2515106201171875, -0.2069091796875, -0.1623077392578125, -0.117706298828125, -0.0731048583984375, -0.02850341796875, 0.0160980224609375, 0.060699462890625, 0.1053009033203125, 0.14990234375, 0.1945037841796875, 0.239105224609375, 0.2837066650390625, 0.32830810546875, 0.3729095458984375, 0.417510986328125, 0.4621124267578125, 0.5067138671875, 0.5513153076171875, 0.595916748046875, 0.6405181884765625, 0.68511962890625, 0.7297210693359375, 0.774322509765625, 0.8189239501953125, 0.863525390625, 0.9081268310546875, 0.952728271484375, 0.9973297119140625, 1.04193115234375, 1.0865325927734375, 1.131134033203125, 1.1757354736328125, 1.2203369140625, 1.2649383544921875, 1.309539794921875, 1.3541412353515625, 1.39874267578125, 1.4433441162109375, 1.487945556640625, 1.5325469970703125, 1.5771484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 18.0, 14.0, 31.0, 83.0, 145.0, 216.0, 240.0, 117.0, 71.0, 33.0, 11.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.051671981811523, -8.548155784606934, -8.044639587402344, -7.541123390197754, -7.037607192993164, -6.534090995788574, -6.030574798583984, -5.5270586013793945, -5.023542404174805, -4.520026206970215, -4.016510009765625, -3.512993812561035, -3.0094776153564453, -2.5059614181518555, -2.0024452209472656, -1.4989290237426758, -0.9954128265380859, -0.4918966293334961, 0.01161956787109375, 0.5151357650756836, 1.0186519622802734, 1.5221681594848633, 2.025684356689453, 2.529200553894043, 3.032716751098633, 3.5362329483032227, 4.0397491455078125, 4.543265342712402, 5.046781539916992, 5.550297737121582, 6.053813934326172, 6.557330131530762, 7.060848236083984, 7.564364433288574, 8.067880630493164, 8.571396827697754, 9.074913024902344, 9.578429222106934, 10.081945419311523, 10.585461616516113, 11.088977813720703, 11.592494010925293, 12.096010208129883, 12.599526405334473, 13.103042602539062, 13.606558799743652, 14.110074996948242, 14.613591194152832, 15.117107391357422, 15.620623588562012, 16.1241397857666, 16.627655029296875, 17.13117218017578, 17.634689331054688, 18.13820457458496, 18.641719818115234, 19.14523696899414, 19.648754119873047, 20.15226936340332, 20.655784606933594, 21.1593017578125, 21.662818908691406, 22.16633415222168, 22.669849395751953, 23.17336654663086]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 10.0, 12.0, 19.0, 17.0, 28.0, 27.0, 35.0, 33.0, 41.0, 37.0, 49.0, 40.0, 59.0, 63.0, 67.0, 48.0, 63.0, 47.0, 45.0, 33.0, 31.0, 31.0, 18.0, 23.0, 13.0, 13.0, 19.0, 11.0, 6.0, 7.0, 3.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.64791488647461, -20.035354614257812, -19.422792434692383, -18.810232162475586, -18.19767189025879, -17.58510971069336, -16.972549438476562, -16.359989166259766, -15.747427940368652, -15.134866714477539, -14.522306442260742, -13.909745216369629, -13.297183990478516, -12.684623718261719, -12.072062492370605, -11.459501266479492, -10.846940994262695, -10.234379768371582, -9.621819496154785, -9.009258270263672, -8.396697998046875, -7.784136772155762, -7.171575546264648, -6.559014797210693, -5.946454048156738, -5.333893299102783, -4.721332550048828, -4.108771324157715, -3.4962105751037598, -2.8836498260498047, -2.2710888385772705, -1.6585278511047363, -1.0459671020507812, -0.4334062337875366, 0.179154634475708, 0.7917155027389526, 1.4042763710021973, 2.0168371200561523, 2.6293981075286865, 3.2419590950012207, 3.854519844055176, 4.467080593109131, 5.079641342163086, 5.692202568054199, 6.304763317108154, 6.917324066162109, 7.529885292053223, 8.142446517944336, 8.755006790161133, 9.367568016052246, 9.980128288269043, 10.592689514160156, 11.205249786376953, 11.817811012268066, 12.43037223815918, 13.042932510375977, 13.65549373626709, 14.268054962158203, 14.880615234375, 15.493176460266113, 16.105737686157227, 16.718297958374023, 17.33085823059082, 17.94342041015625, 18.555980682373047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 12.0, 15.0, 25.0, 18.0, 20.0, 42.0, 63.0, 76.0, 126.0, 211.0, 420.0, 1109.0, 5395.0, 98154.0, 4074133.0, 11401.0, 1739.0, 551.0, 247.0, 149.0, 82.0, 64.0, 47.0, 43.0, 28.0, 17.0, 14.0, 6.0, 10.0, 13.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.1082305908203125, -2.046539306640625, -1.9848480224609375, -1.92315673828125, -1.8614654541015625, -1.799774169921875, -1.7380828857421875, -1.6763916015625, -1.6147003173828125, -1.553009033203125, -1.4913177490234375, -1.42962646484375, -1.3679351806640625, -1.306243896484375, -1.2445526123046875, -1.182861328125, -1.1211700439453125, -1.059478759765625, -0.9977874755859375, -0.93609619140625, -0.8744049072265625, -0.812713623046875, -0.7510223388671875, -0.6893310546875, -0.6276397705078125, -0.565948486328125, -0.5042572021484375, -0.44256591796875, -0.3808746337890625, -0.319183349609375, -0.2574920654296875, -0.19580078125, -0.1341094970703125, -0.072418212890625, -0.0107269287109375, 0.05096435546875, 0.1126556396484375, 0.174346923828125, 0.2360382080078125, 0.2977294921875, 0.3594207763671875, 0.421112060546875, 0.4828033447265625, 0.54449462890625, 0.6061859130859375, 0.667877197265625, 0.7295684814453125, 0.791259765625, 0.8529510498046875, 0.914642333984375, 0.9763336181640625, 1.03802490234375, 1.0997161865234375, 1.161407470703125, 1.2230987548828125, 1.2847900390625, 1.3464813232421875, 1.408172607421875, 1.4698638916015625, 1.53155517578125, 1.5932464599609375, 1.654937744140625, 1.7166290283203125, 1.7783203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 7.0, 8.0, 8.0, 16.0, 19.0, 22.0, 29.0, 22.0, 41.0, 44.0, 43.0, 53.0, 41.0, 64.0, 75.0, 66.0, 59.0, 47.0, 61.0, 36.0, 34.0, 30.0, 26.0, 23.0, 27.0, 15.0, 14.0, 10.0, 10.0, 7.0, 3.0, 2.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8586959838867188, -0.8316497802734375, -0.8046035766601562, -0.777557373046875, -0.7505111694335938, -0.7234649658203125, -0.6964187622070312, -0.66937255859375, -0.6423263549804688, -0.6152801513671875, -0.5882339477539062, -0.561187744140625, -0.5341415405273438, -0.5070953369140625, -0.48004913330078125, -0.4530029296875, -0.42595672607421875, -0.3989105224609375, -0.37186431884765625, -0.344818115234375, -0.31777191162109375, -0.2907257080078125, -0.26367950439453125, -0.23663330078125, -0.20958709716796875, -0.1825408935546875, -0.15549468994140625, -0.128448486328125, -0.10140228271484375, -0.0743560791015625, -0.04730987548828125, -0.020263671875, 0.00678253173828125, 0.0338287353515625, 0.06087493896484375, 0.087921142578125, 0.11496734619140625, 0.1420135498046875, 0.16905975341796875, 0.19610595703125, 0.22315216064453125, 0.2501983642578125, 0.27724456787109375, 0.304290771484375, 0.33133697509765625, 0.3583831787109375, 0.38542938232421875, 0.4124755859375, 0.43952178955078125, 0.4665679931640625, 0.49361419677734375, 0.520660400390625, 0.5477066040039062, 0.5747528076171875, 0.6017990112304688, 0.62884521484375, 0.6558914184570312, 0.6829376220703125, 0.7099838256835938, 0.737030029296875, 0.7640762329101562, 0.7911224365234375, 0.8181686401367188, 0.84521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 6.0, 6.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 6.0, 11.0, 13.0, 19.0, 17.0, 12.0, 24.0, 23.0, 28.0, 25.0, 39.0, 53.0, 65.0, 67.0, 120.0, 238.0, 687.0, 7092.0, 4167082.0, 16807.0, 945.0, 276.0, 128.0, 98.0, 76.0, 43.0, 36.0, 28.0, 33.0, 27.0, 15.0, 22.0, 17.0, 13.0, 12.0, 12.0, 5.0, 8.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.734375, -3.6162109375, -3.498046875, -3.3798828125, -3.26171875, -3.1435546875, -3.025390625, -2.9072265625, -2.7890625, -2.6708984375, -2.552734375, -2.4345703125, -2.31640625, -2.1982421875, -2.080078125, -1.9619140625, -1.84375, -1.7255859375, -1.607421875, -1.4892578125, -1.37109375, -1.2529296875, -1.134765625, -1.0166015625, -0.8984375, -0.7802734375, -0.662109375, -0.5439453125, -0.42578125, -0.3076171875, -0.189453125, -0.0712890625, 0.046875, 0.1650390625, 0.283203125, 0.4013671875, 0.51953125, 0.6376953125, 0.755859375, 0.8740234375, 0.9921875, 1.1103515625, 1.228515625, 1.3466796875, 1.46484375, 1.5830078125, 1.701171875, 1.8193359375, 1.9375, 2.0556640625, 2.173828125, 2.2919921875, 2.41015625, 2.5283203125, 2.646484375, 2.7646484375, 2.8828125, 3.0009765625, 3.119140625, 3.2373046875, 3.35546875, 3.4736328125, 3.591796875, 3.7099609375, 3.828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 497.0, 3526.0, 39.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.796875, -2.7469444274902344, -2.6970138549804688, -2.647083282470703, -2.5971527099609375, -2.547222137451172, -2.4972915649414062, -2.4473609924316406, -2.397430419921875, -2.3474998474121094, -2.2975692749023438, -2.247638702392578, -2.1977081298828125, -2.147777557373047, -2.0978469848632812, -2.0479164123535156, -1.99798583984375, -1.9480552673339844, -1.8981246948242188, -1.8481941223144531, -1.7982635498046875, -1.7483329772949219, -1.6984024047851562, -1.6484718322753906, -1.598541259765625, -1.5486106872558594, -1.4986801147460938, -1.4487495422363281, -1.3988189697265625, -1.3488883972167969, -1.2989578247070312, -1.2490272521972656, -1.1990966796875, -1.1491661071777344, -1.0992355346679688, -1.0493049621582031, -0.9993743896484375, -0.9494438171386719, -0.8995132446289062, -0.8495826721191406, -0.799652099609375, -0.7497215270996094, -0.6997909545898438, -0.6498603820800781, -0.5999298095703125, -0.5499992370605469, -0.5000686645507812, -0.4501380920410156, -0.40020751953125, -0.3502769470214844, -0.30034637451171875, -0.2504158020019531, -0.2004852294921875, -0.15055465698242188, -0.10062408447265625, -0.050693511962890625, -0.000762939453125, 0.049167633056640625, 0.09909820556640625, 0.14902877807617188, 0.1989593505859375, 0.24888992309570312, 0.29882049560546875, 0.3487510681152344, 0.398681640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 18.0, 45.0, 104.0, 208.0, 281.0, 193.0, 81.0, 34.0, 12.0, 11.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6710002422332764, -3.582590341567993, -3.49418044090271, -3.4057705402374268, -3.3173606395721436, -3.2289507389068604, -3.140540838241577, -3.052130937576294, -2.9637210369110107, -2.8753111362457275, -2.7869012355804443, -2.698491334915161, -2.610081434249878, -2.5216715335845947, -2.4332616329193115, -2.3448517322540283, -2.256441831588745, -2.168031930923462, -2.0796220302581787, -1.9912121295928955, -1.9028022289276123, -1.814392328262329, -1.725982427597046, -1.6375725269317627, -1.5491626262664795, -1.4607527256011963, -1.372342824935913, -1.2839329242706299, -1.1955230236053467, -1.1071131229400635, -1.0187032222747803, -0.9302933216094971, -0.841883659362793, -0.7534737586975098, -0.6650638580322266, -0.5766539573669434, -0.48824405670166016, -0.39983415603637695, -0.31142425537109375, -0.22301435470581055, -0.13460445404052734, -0.04619455337524414, 0.04221534729003906, 0.13062524795532227, 0.21903514862060547, 0.30744504928588867, 0.3958549499511719, 0.4842648506164551, 0.5726747512817383, 0.6610846519470215, 0.7494945526123047, 0.8379044532775879, 0.9263143539428711, 1.0147242546081543, 1.1031341552734375, 1.1915440559387207, 1.279953956604004, 1.368363857269287, 1.4567737579345703, 1.5451836585998535, 1.6335935592651367, 1.72200345993042, 1.8104133605957031, 1.8988232612609863, 1.9872331619262695]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 7.0, 6.0, 5.0, 11.0, 16.0, 22.0, 26.0, 20.0, 20.0, 29.0, 40.0, 47.0, 44.0, 39.0, 45.0, 39.0, 44.0, 31.0, 51.0, 56.0, 45.0, 32.0, 43.0, 41.0, 34.0, 35.0, 29.0, 22.0, 35.0, 18.0, 15.0, 5.0, 8.0, 10.0, 3.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.767348051071167, -1.712867259979248, -1.658386468887329, -1.6039056777954102, -1.5494247674942017, -1.4949439764022827, -1.4404631853103638, -1.3859823942184448, -1.3315014839172363, -1.2770206928253174, -1.2225399017333984, -1.1680591106414795, -1.113578200340271, -1.059097409248352, -1.004616618156433, -0.9501358270645142, -0.8956550359725952, -0.8411742448806763, -0.7866933941841125, -0.7322126030921936, -0.6777317523956299, -0.6232509613037109, -0.568770170211792, -0.514289379119873, -0.4598085284233093, -0.405327707529068, -0.35084688663482666, -0.2963660955429077, -0.24188527464866638, -0.18740445375442505, -0.1329236626625061, -0.07844284176826477, -0.023962020874023438, 0.0305187925696373, 0.08499960601329803, 0.13948041200637817, 0.1939612329006195, 0.24844205379486084, 0.3029228448867798, 0.3574036657810211, 0.41188448667526245, 0.4663653075695038, 0.5208461284637451, 0.5753269195556641, 0.629807710647583, 0.6842885613441467, 0.7387693524360657, 0.7932502031326294, 0.8477309942245483, 0.9022117853164673, 0.956692636013031, 1.0111734867095947, 1.0656542778015137, 1.1201350688934326, 1.1746158599853516, 1.2290966510772705, 1.2835774421691895, 1.3380582332611084, 1.3925390243530273, 1.4470198154449463, 1.5015007257461548, 1.5559815168380737, 1.6104623079299927, 1.6649430990219116, 1.7194240093231201]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 3.0, 13.0, 20.0, 17.0, 28.0, 31.0, 65.0, 68.0, 138.0, 162.0, 270.0, 499.0, 913.0, 1812.0, 3773.0, 8838.0, 23110.0, 72097.0, 280333.0, 462927.0, 130512.0, 38256.0, 13749.0, 5583.0, 2497.0, 1221.0, 643.0, 361.0, 194.0, 125.0, 79.0, 54.0, 41.0, 38.0, 17.0, 14.0, 16.0, 8.0, 3.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9763641357421875, -0.942962646484375, -0.9095611572265625, -0.87615966796875, -0.8427581787109375, -0.809356689453125, -0.7759552001953125, -0.7425537109375, -0.7091522216796875, -0.675750732421875, -0.6423492431640625, -0.60894775390625, -0.5755462646484375, -0.542144775390625, -0.5087432861328125, -0.475341796875, -0.4419403076171875, -0.408538818359375, -0.3751373291015625, -0.34173583984375, -0.3083343505859375, -0.274932861328125, -0.2415313720703125, -0.2081298828125, -0.1747283935546875, -0.141326904296875, -0.1079254150390625, -0.07452392578125, -0.0411224365234375, -0.007720947265625, 0.0256805419921875, 0.05908203125, 0.0924835205078125, 0.125885009765625, 0.1592864990234375, 0.19268798828125, 0.2260894775390625, 0.259490966796875, 0.2928924560546875, 0.3262939453125, 0.3596954345703125, 0.393096923828125, 0.4264984130859375, 0.45989990234375, 0.4933013916015625, 0.526702880859375, 0.5601043701171875, 0.593505859375, 0.6269073486328125, 0.660308837890625, 0.6937103271484375, 0.72711181640625, 0.7605133056640625, 0.793914794921875, 0.8273162841796875, 0.8607177734375, 0.8941192626953125, 0.927520751953125, 0.9609222412109375, 0.99432373046875, 1.0277252197265625, 1.061126708984375, 1.0945281982421875, 1.1279296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 13.0, 13.0, 18.0, 24.0, 25.0, 36.0, 45.0, 37.0, 50.0, 39.0, 58.0, 53.0, 60.0, 59.0, 53.0, 54.0, 51.0, 32.0, 39.0, 30.0, 27.0, 23.0, 26.0, 18.0, 15.0, 10.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.974609375, -0.9465408325195312, -0.9184722900390625, -0.8904037475585938, -0.862335205078125, -0.8342666625976562, -0.8061981201171875, -0.7781295776367188, -0.75006103515625, -0.7219924926757812, -0.6939239501953125, -0.6658554077148438, -0.637786865234375, -0.6097183227539062, -0.5816497802734375, -0.5535812377929688, -0.5255126953125, -0.49744415283203125, -0.4693756103515625, -0.44130706787109375, -0.413238525390625, -0.38516998291015625, -0.3571014404296875, -0.32903289794921875, -0.30096435546875, -0.27289581298828125, -0.2448272705078125, -0.21675872802734375, -0.188690185546875, -0.16062164306640625, -0.1325531005859375, -0.10448455810546875, -0.076416015625, -0.04834747314453125, -0.0202789306640625, 0.00778961181640625, 0.035858154296875, 0.06392669677734375, 0.0919952392578125, 0.12006378173828125, 0.14813232421875, 0.17620086669921875, 0.2042694091796875, 0.23233795166015625, 0.260406494140625, 0.28847503662109375, 0.3165435791015625, 0.34461212158203125, 0.3726806640625, 0.40074920654296875, 0.4288177490234375, 0.45688629150390625, 0.484954833984375, 0.5130233764648438, 0.5410919189453125, 0.5691604614257812, 0.59722900390625, 0.6252975463867188, 0.6533660888671875, 0.6814346313476562, 0.709503173828125, 0.7375717163085938, 0.7656402587890625, 0.7937088012695312, 0.82177734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 3.0, 6.0, 8.0, 15.0, 25.0, 31.0, 59.0, 73.0, 139.0, 237.0, 511.0, 1269.0, 3620.0, 14867.0, 151748.0, 813217.0, 50604.0, 8069.0, 2236.0, 891.0, 423.0, 201.0, 108.0, 70.0, 31.0, 19.0, 18.0, 15.0, 9.0, 3.0, 5.0, 2.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.271484375, -3.176116943359375, -3.08074951171875, -2.985382080078125, -2.8900146484375, -2.794647216796875, -2.69927978515625, -2.603912353515625, -2.508544921875, -2.413177490234375, -2.31781005859375, -2.222442626953125, -2.1270751953125, -2.031707763671875, -1.93634033203125, -1.840972900390625, -1.74560546875, -1.650238037109375, -1.55487060546875, -1.459503173828125, -1.3641357421875, -1.268768310546875, -1.17340087890625, -1.078033447265625, -0.982666015625, -0.887298583984375, -0.79193115234375, -0.696563720703125, -0.6011962890625, -0.505828857421875, -0.41046142578125, -0.315093994140625, -0.2197265625, -0.124359130859375, -0.02899169921875, 0.066375732421875, 0.1617431640625, 0.257110595703125, 0.35247802734375, 0.447845458984375, 0.543212890625, 0.638580322265625, 0.73394775390625, 0.829315185546875, 0.9246826171875, 1.020050048828125, 1.11541748046875, 1.210784912109375, 1.30615234375, 1.401519775390625, 1.49688720703125, 1.592254638671875, 1.6876220703125, 1.782989501953125, 1.87835693359375, 1.973724365234375, 2.069091796875, 2.164459228515625, 2.25982666015625, 2.355194091796875, 2.4505615234375, 2.545928955078125, 2.64129638671875, 2.736663818359375, 2.83203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 7.0, 8.0, 14.0, 23.0, 21.0, 36.0, 50.0, 54.0, 68.0, 80.0, 83.0, 106.0, 75.0, 76.0, 57.0, 51.0, 50.0, 33.0, 19.0, 18.0, 15.0, 7.0, 6.0, 4.0, 4.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.4501953125, -7.205078125, -6.9599609375, -6.71484375, -6.4697265625, -6.224609375, -5.9794921875, -5.734375, -5.4892578125, -5.244140625, -4.9990234375, -4.75390625, -4.5087890625, -4.263671875, -4.0185546875, -3.7734375, -3.5283203125, -3.283203125, -3.0380859375, -2.79296875, -2.5478515625, -2.302734375, -2.0576171875, -1.8125, -1.5673828125, -1.322265625, -1.0771484375, -0.83203125, -0.5869140625, -0.341796875, -0.0966796875, 0.1484375, 0.3935546875, 0.638671875, 0.8837890625, 1.12890625, 1.3740234375, 1.619140625, 1.8642578125, 2.109375, 2.3544921875, 2.599609375, 2.8447265625, 3.08984375, 3.3349609375, 3.580078125, 3.8251953125, 4.0703125, 4.3154296875, 4.560546875, 4.8056640625, 5.05078125, 5.2958984375, 5.541015625, 5.7861328125, 6.03125, 6.2763671875, 6.521484375, 6.7666015625, 7.01171875, 7.2568359375, 7.501953125, 7.7470703125, 7.9921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 27.0, 80.0, 298.0, 3535.0, 1039740.0, 4394.0, 331.0, 89.0, 33.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.449615478515625, -3.25274658203125, -3.055877685546875, -2.8590087890625, -2.662139892578125, -2.46527099609375, -2.268402099609375, -2.071533203125, -1.874664306640625, -1.67779541015625, -1.480926513671875, -1.2840576171875, -1.087188720703125, -0.89031982421875, -0.693450927734375, -0.49658203125, -0.299713134765625, -0.10284423828125, 0.094024658203125, 0.2908935546875, 0.487762451171875, 0.68463134765625, 0.881500244140625, 1.078369140625, 1.275238037109375, 1.47210693359375, 1.668975830078125, 1.8658447265625, 2.062713623046875, 2.25958251953125, 2.456451416015625, 2.6533203125, 2.850189208984375, 3.04705810546875, 3.243927001953125, 3.4407958984375, 3.637664794921875, 3.83453369140625, 4.031402587890625, 4.228271484375, 4.425140380859375, 4.62200927734375, 4.818878173828125, 5.0157470703125, 5.212615966796875, 5.40948486328125, 5.606353759765625, 5.80322265625, 6.000091552734375, 6.19696044921875, 6.393829345703125, 6.5906982421875, 6.787567138671875, 6.98443603515625, 7.181304931640625, 7.378173828125, 7.575042724609375, 7.77191162109375, 7.968780517578125, 8.1656494140625, 8.362518310546875, 8.55938720703125, 8.756256103515625, 8.953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 2.0, 0.0, 11.0, 8.0, 20.0, 23.0, 55.0, 80.0, 92.0, 134.0, 140.0, 150.0, 109.0, 68.0, 41.0, 29.0, 13.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011116266250610352, -0.00010784249752759933, -0.00010452233254909515, -0.00010120216757059097, -9.788200259208679e-05, -9.456183761358261e-05, -9.124167263507843e-05, -8.792150765657425e-05, -8.460134267807007e-05, -8.128117769956589e-05, -7.79610127210617e-05, -7.464084774255753e-05, -7.132068276405334e-05, -6.800051778554916e-05, -6.468035280704498e-05, -6.13601878285408e-05, -5.804002285003662e-05, -5.471985787153244e-05, -5.139969289302826e-05, -4.807952791452408e-05, -4.47593629360199e-05, -4.1439197957515717e-05, -3.8119032979011536e-05, -3.4798868000507355e-05, -3.1478703022003174e-05, -2.8158538043498993e-05, -2.4838373064994812e-05, -2.151820808649063e-05, -1.819804310798645e-05, -1.487787812948227e-05, -1.1557713150978088e-05, -8.237548172473907e-06, -4.9173831939697266e-06, -1.5972182154655457e-06, 1.7229467630386353e-06, 5.043111741542816e-06, 8.363276720046997e-06, 1.1683441698551178e-05, 1.5003606677055359e-05, 1.832377165555954e-05, 2.164393663406372e-05, 2.49641016125679e-05, 2.8284266591072083e-05, 3.1604431569576263e-05, 3.4924596548080444e-05, 3.8244761526584625e-05, 4.1564926505088806e-05, 4.488509148359299e-05, 4.820525646209717e-05, 5.152542144060135e-05, 5.484558641910553e-05, 5.816575139760971e-05, 6.148591637611389e-05, 6.480608135461807e-05, 6.812624633312225e-05, 7.144641131162643e-05, 7.476657629013062e-05, 7.80867412686348e-05, 8.140690624713898e-05, 8.472707122564316e-05, 8.804723620414734e-05, 9.136740118265152e-05, 9.46875661611557e-05, 9.800773113965988e-05, 0.00010132789611816406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 13.0, 16.0, 33.0, 57.0, 111.0, 254.0, 785.0, 5673.0, 947776.0, 90346.0, 2577.0, 526.0, 197.0, 91.0, 41.0, 25.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.693359375, -2.60601806640625, -2.5186767578125, -2.43133544921875, -2.343994140625, -2.25665283203125, -2.1693115234375, -2.08197021484375, -1.99462890625, -1.90728759765625, -1.8199462890625, -1.73260498046875, -1.645263671875, -1.55792236328125, -1.4705810546875, -1.38323974609375, -1.2958984375, -1.20855712890625, -1.1212158203125, -1.03387451171875, -0.946533203125, -0.85919189453125, -0.7718505859375, -0.68450927734375, -0.59716796875, -0.50982666015625, -0.4224853515625, -0.33514404296875, -0.247802734375, -0.16046142578125, -0.0731201171875, 0.01422119140625, 0.1015625, 0.18890380859375, 0.2762451171875, 0.36358642578125, 0.450927734375, 0.53826904296875, 0.6256103515625, 0.71295166015625, 0.80029296875, 0.88763427734375, 0.9749755859375, 1.06231689453125, 1.149658203125, 1.23699951171875, 1.3243408203125, 1.41168212890625, 1.4990234375, 1.58636474609375, 1.6737060546875, 1.76104736328125, 1.848388671875, 1.93572998046875, 2.0230712890625, 2.11041259765625, 2.19775390625, 2.28509521484375, 2.3724365234375, 2.45977783203125, 2.547119140625, 2.63446044921875, 2.7218017578125, 2.80914306640625, 2.896484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 14.0, 25.0, 75.0, 323.0, 401.0, 90.0, 39.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.25006103515625, -6.1173095703125, -5.98455810546875, -5.851806640625, -5.71905517578125, -5.5863037109375, -5.45355224609375, -5.32080078125, -5.18804931640625, -5.0552978515625, -4.92254638671875, -4.789794921875, -4.65704345703125, -4.5242919921875, -4.39154052734375, -4.2587890625, -4.12603759765625, -3.9932861328125, -3.86053466796875, -3.727783203125, -3.59503173828125, -3.4622802734375, -3.32952880859375, -3.19677734375, -3.06402587890625, -2.9312744140625, -2.79852294921875, -2.665771484375, -2.53302001953125, -2.4002685546875, -2.26751708984375, -2.134765625, -2.00201416015625, -1.8692626953125, -1.73651123046875, -1.603759765625, -1.47100830078125, -1.3382568359375, -1.20550537109375, -1.07275390625, -0.94000244140625, -0.8072509765625, -0.67449951171875, -0.541748046875, -0.40899658203125, -0.2762451171875, -0.14349365234375, -0.0107421875, 0.12200927734375, 0.2547607421875, 0.38751220703125, 0.520263671875, 0.65301513671875, 0.7857666015625, 0.91851806640625, 1.05126953125, 1.18402099609375, 1.3167724609375, 1.44952392578125, 1.582275390625, 1.71502685546875, 1.8477783203125, 1.98052978515625, 2.11328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 9.0, 7.0, 18.0, 23.0, 70.0, 203.0, 362.0, 209.0, 57.0, 17.0, 14.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.984283447265625, -42.721195220947266, -41.458106994628906, -40.19501876831055, -38.93193054199219, -37.66884231567383, -36.40575408935547, -35.14266586303711, -33.87957763671875, -32.61648941040039, -31.35340118408203, -30.090312957763672, -28.827224731445312, -27.564136505126953, -26.301048278808594, -25.037960052490234, -23.774869918823242, -22.511781692504883, -21.248693466186523, -19.985605239868164, -18.722517013549805, -17.459428787231445, -16.196338653564453, -14.93325138092041, -13.67016315460205, -12.407074928283691, -11.143986701965332, -9.880897521972656, -8.617809295654297, -7.354721546173096, -6.091632843017578, -4.828544616699219, -3.5654563903808594, -2.3023681640625, -1.0392796993255615, 0.22380876541137695, 1.4868969917297363, 2.7499852180480957, 4.013073921203613, 5.276162147521973, 6.539250373840332, 7.802338600158691, 9.06542682647705, 10.328516006469727, 11.591604232788086, 12.854692459106445, 14.117780685424805, 15.380868911743164, 16.643957138061523, 17.907045364379883, 19.170133590698242, 20.4332218170166, 21.69631004333496, 22.95939826965332, 24.222488403320312, 25.485576629638672, 26.74866485595703, 28.01175308227539, 29.27484130859375, 30.53792953491211, 31.80101776123047, 33.06410598754883, 34.32719421386719, 35.59028244018555, 36.853370666503906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 8.0, 21.0, 10.0, 19.0, 22.0, 31.0, 42.0, 44.0, 48.0, 42.0, 49.0, 64.0, 60.0, 49.0, 59.0, 55.0, 46.0, 48.0, 41.0, 45.0, 23.0, 22.0, 25.0, 26.0, 14.0, 16.0, 7.0, 14.0, 5.0, 4.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.218097686767578, -25.37627601623535, -24.534452438354492, -23.692630767822266, -22.85080909729004, -22.008987426757812, -21.167163848876953, -20.325342178344727, -19.4835205078125, -18.641698837280273, -17.799875259399414, -16.958053588867188, -16.11623191833496, -15.274409294128418, -14.432586669921875, -13.590764999389648, -12.748942375183105, -11.907119750976562, -11.065298080444336, -10.223475456237793, -9.381653785705566, -8.539831161499023, -7.698009014129639, -6.856186866760254, -6.014364719390869, -5.172542572021484, -4.3307204246521, -3.4888980388641357, -2.647075891494751, -1.805253505706787, -0.9634313583374023, -0.12160921096801758, 0.7202129364013672, 1.562035083770752, 2.4038572311401367, 3.2456796169281006, 4.087501525878906, 4.929324150085449, 5.771146297454834, 6.612968444824219, 7.4547905921936035, 8.296612739562988, 9.138435363769531, 9.980257034301758, 10.8220796585083, 11.663902282714844, 12.50572395324707, 13.347545623779297, 14.18936824798584, 15.031190872192383, 15.87301254272461, 16.714834213256836, 17.556657791137695, 18.398479461669922, 19.24030113220215, 20.082122802734375, 20.923946380615234, 21.76576805114746, 22.60759162902832, 23.449413299560547, 24.291234970092773, 25.133056640625, 25.97488021850586, 26.816701889038086, 27.658523559570312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 10.0, 14.0, 22.0, 19.0, 22.0, 53.0, 69.0, 135.0, 292.0, 706.0, 2481.0, 18510.0, 4148766.0, 19280.0, 2588.0, 698.0, 280.0, 125.0, 55.0, 51.0, 29.0, 18.0, 16.0, 13.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.65234375, -3.562164306640625, -3.47198486328125, -3.381805419921875, -3.2916259765625, -3.201446533203125, -3.11126708984375, -3.021087646484375, -2.930908203125, -2.840728759765625, -2.75054931640625, -2.660369873046875, -2.5701904296875, -2.480010986328125, -2.38983154296875, -2.299652099609375, -2.20947265625, -2.119293212890625, -2.02911376953125, -1.938934326171875, -1.8487548828125, -1.758575439453125, -1.66839599609375, -1.578216552734375, -1.488037109375, -1.397857666015625, -1.30767822265625, -1.217498779296875, -1.1273193359375, -1.037139892578125, -0.94696044921875, -0.856781005859375, -0.7666015625, -0.676422119140625, -0.58624267578125, -0.496063232421875, -0.4058837890625, -0.315704345703125, -0.22552490234375, -0.135345458984375, -0.045166015625, 0.045013427734375, 0.13519287109375, 0.225372314453125, 0.3155517578125, 0.405731201171875, 0.49591064453125, 0.586090087890625, 0.67626953125, 0.766448974609375, 0.85662841796875, 0.946807861328125, 1.0369873046875, 1.127166748046875, 1.21734619140625, 1.307525634765625, 1.397705078125, 1.487884521484375, 1.57806396484375, 1.668243408203125, 1.7584228515625, 1.848602294921875, 1.93878173828125, 2.028961181640625, 2.119140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 4.0, 22.0, 31.0, 38.0, 47.0, 60.0, 80.0, 81.0, 95.0, 99.0, 95.0, 69.0, 69.0, 48.0, 34.0, 20.0, 13.0, 20.0, 14.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.294921875, -2.2375640869140625, -2.180206298828125, -2.1228485107421875, -2.06549072265625, -2.0081329345703125, -1.950775146484375, -1.8934173583984375, -1.8360595703125, -1.7787017822265625, -1.721343994140625, -1.6639862060546875, -1.60662841796875, -1.5492706298828125, -1.491912841796875, -1.4345550537109375, -1.377197265625, -1.3198394775390625, -1.262481689453125, -1.2051239013671875, -1.14776611328125, -1.0904083251953125, -1.033050537109375, -0.9756927490234375, -0.9183349609375, -0.8609771728515625, -0.803619384765625, -0.7462615966796875, -0.68890380859375, -0.6315460205078125, -0.574188232421875, -0.5168304443359375, -0.45947265625, -0.4021148681640625, -0.344757080078125, -0.2873992919921875, -0.23004150390625, -0.1726837158203125, -0.115325927734375, -0.0579681396484375, -0.0006103515625, 0.0567474365234375, 0.114105224609375, 0.1714630126953125, 0.22882080078125, 0.2861785888671875, 0.343536376953125, 0.4008941650390625, 0.458251953125, 0.5156097412109375, 0.572967529296875, 0.6303253173828125, 0.68768310546875, 0.7450408935546875, 0.802398681640625, 0.8597564697265625, 0.9171142578125, 0.9744720458984375, 1.031829833984375, 1.0891876220703125, 1.14654541015625, 1.2039031982421875, 1.261260986328125, 1.3186187744140625, 1.3759765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 11.0, 14.0, 19.0, 35.0, 36.0, 45.0, 59.0, 83.0, 107.0, 191.0, 326.0, 645.0, 1813.0, 5995.0, 42238.0, 4104900.0, 29648.0, 4981.0, 1604.0, 613.0, 309.0, 172.0, 99.0, 76.0, 54.0, 53.0, 37.0, 21.0, 22.0, 18.0, 14.0, 7.0, 10.0, 3.0, 3.0, 0.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.6856231689453125, -1.624176025390625, -1.5627288818359375, -1.50128173828125, -1.4398345947265625, -1.378387451171875, -1.3169403076171875, -1.2554931640625, -1.1940460205078125, -1.132598876953125, -1.0711517333984375, -1.00970458984375, -0.9482574462890625, -0.886810302734375, -0.8253631591796875, -0.763916015625, -0.7024688720703125, -0.641021728515625, -0.5795745849609375, -0.51812744140625, -0.4566802978515625, -0.395233154296875, -0.3337860107421875, -0.2723388671875, -0.2108917236328125, -0.149444580078125, -0.0879974365234375, -0.02655029296875, 0.0348968505859375, 0.096343994140625, 0.1577911376953125, 0.21923828125, 0.2806854248046875, 0.342132568359375, 0.4035797119140625, 0.46502685546875, 0.5264739990234375, 0.587921142578125, 0.6493682861328125, 0.7108154296875, 0.7722625732421875, 0.833709716796875, 0.8951568603515625, 0.95660400390625, 1.0180511474609375, 1.079498291015625, 1.1409454345703125, 1.202392578125, 1.2638397216796875, 1.325286865234375, 1.3867340087890625, 1.44818115234375, 1.5096282958984375, 1.571075439453125, 1.6325225830078125, 1.6939697265625, 1.7554168701171875, 1.816864013671875, 1.8783111572265625, 1.93975830078125, 2.0012054443359375, 2.062652587890625, 2.1240997314453125, 2.185546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 21.0, 146.0, 3764.0, 79.0, 25.0, 14.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7280120849609375, -0.703094482421875, -0.6781768798828125, -0.65325927734375, -0.6283416748046875, -0.603424072265625, -0.5785064697265625, -0.5535888671875, -0.5286712646484375, -0.503753662109375, -0.4788360595703125, -0.45391845703125, -0.4290008544921875, -0.404083251953125, -0.3791656494140625, -0.354248046875, -0.3293304443359375, -0.304412841796875, -0.2794952392578125, -0.25457763671875, -0.2296600341796875, -0.204742431640625, -0.1798248291015625, -0.1549072265625, -0.1299896240234375, -0.105072021484375, -0.0801544189453125, -0.05523681640625, -0.0303192138671875, -0.005401611328125, 0.0195159912109375, 0.04443359375, 0.0693511962890625, 0.094268798828125, 0.1191864013671875, 0.14410400390625, 0.1690216064453125, 0.193939208984375, 0.2188568115234375, 0.2437744140625, 0.2686920166015625, 0.293609619140625, 0.3185272216796875, 0.34344482421875, 0.3683624267578125, 0.393280029296875, 0.4181976318359375, 0.443115234375, 0.4680328369140625, 0.492950439453125, 0.5178680419921875, 0.54278564453125, 0.5677032470703125, 0.592620849609375, 0.6175384521484375, 0.6424560546875, 0.6673736572265625, 0.692291259765625, 0.7172088623046875, 0.74212646484375, 0.7670440673828125, 0.791961669921875, 0.8168792724609375, 0.841796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 28.0, 162.0, 500.0, 231.0, 57.0, 16.0, 7.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.982769012451172, -4.844604969024658, -4.706440448760986, -4.568276405334473, -4.430111885070801, -4.291947841644287, -4.153783321380615, -4.015619277954102, -3.877454996109009, -3.739290714263916, -3.6011264324188232, -3.4629621505737305, -3.324798107147217, -3.186633586883545, -3.0484695434570312, -2.9103052616119385, -2.7721409797668457, -2.633976697921753, -2.49581241607666, -2.3576481342315674, -2.2194838523864746, -2.081319808959961, -1.9431555271148682, -1.8049912452697754, -1.6668269634246826, -1.5286626815795898, -1.390498399734497, -1.2523342370986938, -1.114169955253601, -0.9760056734085083, -0.8378414511680603, -0.6996772289276123, -0.5615134239196777, -0.42334917187690735, -0.28518491983413696, -0.14702066779136658, -0.008856415748596191, 0.12930786609649658, 0.2674720883369446, 0.4056363105773926, 0.5438005924224854, 0.6819648742675781, 0.8201290965080261, 0.9582933187484741, 1.096457600593567, 1.2346218824386597, 1.372786045074463, 1.5109503269195557, 1.6491146087646484, 1.7872788906097412, 1.925443172454834, 2.0636074542999268, 2.2017717361450195, 2.339935779571533, 2.478100061416626, 2.6162643432617188, 2.7544286251068115, 2.8925929069519043, 3.030757188796997, 3.16892147064209, 3.3070855140686035, 3.4452500343322754, 3.583414077758789, 3.721578359603882, 3.8597426414489746]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 4.0, 11.0, 18.0, 18.0, 17.0, 24.0, 29.0, 25.0, 34.0, 23.0, 44.0, 39.0, 44.0, 46.0, 41.0, 40.0, 51.0, 50.0, 39.0, 35.0, 37.0, 36.0, 29.0, 36.0, 41.0, 35.0, 21.0, 35.0, 20.0, 16.0, 15.0, 12.0, 11.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1971235275268555, -1.1619635820388794, -1.1268036365509033, -1.0916436910629272, -1.0564837455749512, -1.021323800086975, -0.986163854598999, -0.951003909111023, -0.9158439636230469, -0.8806840181350708, -0.8455240726470947, -0.8103641271591187, -0.7752041816711426, -0.7400442361831665, -0.7048842906951904, -0.6697243452072144, -0.6345644593238831, -0.599404513835907, -0.5642445683479309, -0.5290846228599548, -0.49392467737197876, -0.4587647318840027, -0.423604816198349, -0.3884448707103729, -0.35328492522239685, -0.3181249797344208, -0.2829650342464447, -0.24780510365962982, -0.21264515817165375, -0.17748521268367767, -0.1423252820968628, -0.10716533660888672, -0.07200539112091064, -0.03684544935822487, -0.001685507595539093, 0.033474430441856384, 0.06863437592983246, 0.10379432141780853, 0.1389542520046234, 0.1741141974925995, 0.20927414298057556, 0.24443408846855164, 0.2795940339565277, 0.3147539496421814, 0.34991389513015747, 0.38507384061813354, 0.4202337861061096, 0.4553937315940857, 0.49055367708206177, 0.5257136225700378, 0.5608735680580139, 0.59603351354599, 0.6311934590339661, 0.6663534045219421, 0.7015132904052734, 0.7366732358932495, 0.7718331813812256, 0.8069931268692017, 0.8421530723571777, 0.8773130178451538, 0.9124729633331299, 0.947632908821106, 0.982792854309082, 1.017952799797058, 1.0531127452850342]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 8.0, 15.0, 17.0, 34.0, 38.0, 60.0, 102.0, 133.0, 235.0, 357.0, 617.0, 1107.0, 2232.0, 4634.0, 10752.0, 31606.0, 132102.0, 584197.0, 210543.0, 44005.0, 14045.0, 5834.0, 2613.0, 1410.0, 714.0, 407.0, 272.0, 144.0, 101.0, 67.0, 41.0, 31.0, 15.0, 15.0, 9.0, 9.0, 8.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-1.8544921875, -1.806488037109375, -1.75848388671875, -1.710479736328125, -1.6624755859375, -1.614471435546875, -1.56646728515625, -1.518463134765625, -1.470458984375, -1.422454833984375, -1.37445068359375, -1.326446533203125, -1.2784423828125, -1.230438232421875, -1.18243408203125, -1.134429931640625, -1.08642578125, -1.038421630859375, -0.99041748046875, -0.942413330078125, -0.8944091796875, -0.846405029296875, -0.79840087890625, -0.750396728515625, -0.702392578125, -0.654388427734375, -0.60638427734375, -0.558380126953125, -0.5103759765625, -0.462371826171875, -0.41436767578125, -0.366363525390625, -0.318359375, -0.270355224609375, -0.22235107421875, -0.174346923828125, -0.1263427734375, -0.078338623046875, -0.03033447265625, 0.017669677734375, 0.065673828125, 0.113677978515625, 0.16168212890625, 0.209686279296875, 0.2576904296875, 0.305694580078125, 0.35369873046875, 0.401702880859375, 0.44970703125, 0.497711181640625, 0.54571533203125, 0.593719482421875, 0.6417236328125, 0.689727783203125, 0.73773193359375, 0.785736083984375, 0.833740234375, 0.881744384765625, 0.92974853515625, 0.977752685546875, 1.0257568359375, 1.073760986328125, 1.12176513671875, 1.169769287109375, 1.2177734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 10.0, 12.0, 20.0, 20.0, 28.0, 49.0, 53.0, 73.0, 92.0, 73.0, 87.0, 86.0, 73.0, 62.0, 63.0, 46.0, 27.0, 27.0, 13.0, 16.0, 11.0, 15.0, 8.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.9803466796875, -1.927490234375, -1.8746337890625, -1.82177734375, -1.7689208984375, -1.716064453125, -1.6632080078125, -1.6103515625, -1.5574951171875, -1.504638671875, -1.4517822265625, -1.39892578125, -1.3460693359375, -1.293212890625, -1.2403564453125, -1.1875, -1.1346435546875, -1.081787109375, -1.0289306640625, -0.97607421875, -0.9232177734375, -0.870361328125, -0.8175048828125, -0.7646484375, -0.7117919921875, -0.658935546875, -0.6060791015625, -0.55322265625, -0.5003662109375, -0.447509765625, -0.3946533203125, -0.341796875, -0.2889404296875, -0.236083984375, -0.1832275390625, -0.13037109375, -0.0775146484375, -0.024658203125, 0.0281982421875, 0.0810546875, 0.1339111328125, 0.186767578125, 0.2396240234375, 0.29248046875, 0.3453369140625, 0.398193359375, 0.4510498046875, 0.50390625, 0.5567626953125, 0.609619140625, 0.6624755859375, 0.71533203125, 0.7681884765625, 0.821044921875, 0.8739013671875, 0.9267578125, 0.9796142578125, 1.032470703125, 1.0853271484375, 1.13818359375, 1.1910400390625, 1.243896484375, 1.2967529296875, 1.349609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 12.0, 15.0, 12.0, 19.0, 22.0, 35.0, 69.0, 98.0, 173.0, 315.0, 675.0, 1490.0, 4452.0, 19724.0, 169322.0, 760304.0, 74894.0, 11641.0, 3026.0, 1111.0, 483.0, 286.0, 132.0, 74.0, 44.0, 35.0, 26.0, 12.0, 13.0, 6.0, 4.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.046875, -2.96527099609375, -2.8836669921875, -2.80206298828125, -2.720458984375, -2.63885498046875, -2.5572509765625, -2.47564697265625, -2.39404296875, -2.31243896484375, -2.2308349609375, -2.14923095703125, -2.067626953125, -1.98602294921875, -1.9044189453125, -1.82281494140625, -1.7412109375, -1.65960693359375, -1.5780029296875, -1.49639892578125, -1.414794921875, -1.33319091796875, -1.2515869140625, -1.16998291015625, -1.08837890625, -1.00677490234375, -0.9251708984375, -0.84356689453125, -0.761962890625, -0.68035888671875, -0.5987548828125, -0.51715087890625, -0.435546875, -0.35394287109375, -0.2723388671875, -0.19073486328125, -0.109130859375, -0.02752685546875, 0.0540771484375, 0.13568115234375, 0.21728515625, 0.29888916015625, 0.3804931640625, 0.46209716796875, 0.543701171875, 0.62530517578125, 0.7069091796875, 0.78851318359375, 0.8701171875, 0.95172119140625, 1.0333251953125, 1.11492919921875, 1.196533203125, 1.27813720703125, 1.3597412109375, 1.44134521484375, 1.52294921875, 1.60455322265625, 1.6861572265625, 1.76776123046875, 1.849365234375, 1.93096923828125, 2.0125732421875, 2.09417724609375, 2.17578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 9.0, 7.0, 6.0, 8.0, 11.0, 19.0, 14.0, 21.0, 34.0, 26.0, 40.0, 52.0, 48.0, 43.0, 57.0, 60.0, 70.0, 56.0, 65.0, 56.0, 52.0, 50.0, 34.0, 28.0, 28.0, 20.0, 25.0, 23.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.7984619140625, -7.573486328125, -7.3485107421875, -7.12353515625, -6.8985595703125, -6.673583984375, -6.4486083984375, -6.2236328125, -5.9986572265625, -5.773681640625, -5.5487060546875, -5.32373046875, -5.0987548828125, -4.873779296875, -4.6488037109375, -4.423828125, -4.1988525390625, -3.973876953125, -3.7489013671875, -3.52392578125, -3.2989501953125, -3.073974609375, -2.8489990234375, -2.6240234375, -2.3990478515625, -2.174072265625, -1.9490966796875, -1.72412109375, -1.4991455078125, -1.274169921875, -1.0491943359375, -0.82421875, -0.5992431640625, -0.374267578125, -0.1492919921875, 0.07568359375, 0.3006591796875, 0.525634765625, 0.7506103515625, 0.9755859375, 1.2005615234375, 1.425537109375, 1.6505126953125, 1.87548828125, 2.1004638671875, 2.325439453125, 2.5504150390625, 2.775390625, 3.0003662109375, 3.225341796875, 3.4503173828125, 3.67529296875, 3.9002685546875, 4.125244140625, 4.3502197265625, 4.5751953125, 4.8001708984375, 5.025146484375, 5.2501220703125, 5.47509765625, 5.7000732421875, 5.925048828125, 6.1500244140625, 6.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 15.0, 6.0, 31.0, 55.0, 276.0, 5713.0, 1039732.0, 2453.0, 177.0, 39.0, 18.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.96875, -7.78515625, -7.6015625, -7.41796875, -7.234375, -7.05078125, -6.8671875, -6.68359375, -6.5, -6.31640625, -6.1328125, -5.94921875, -5.765625, -5.58203125, -5.3984375, -5.21484375, -5.03125, -4.84765625, -4.6640625, -4.48046875, -4.296875, -4.11328125, -3.9296875, -3.74609375, -3.5625, -3.37890625, -3.1953125, -3.01171875, -2.828125, -2.64453125, -2.4609375, -2.27734375, -2.09375, -1.91015625, -1.7265625, -1.54296875, -1.359375, -1.17578125, -0.9921875, -0.80859375, -0.625, -0.44140625, -0.2578125, -0.07421875, 0.109375, 0.29296875, 0.4765625, 0.66015625, 0.84375, 1.02734375, 1.2109375, 1.39453125, 1.578125, 1.76171875, 1.9453125, 2.12890625, 2.3125, 2.49609375, 2.6796875, 2.86328125, 3.046875, 3.23046875, 3.4140625, 3.59765625, 3.78125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 10.0, 12.0, 24.0, 18.0, 32.0, 36.0, 67.0, 82.0, 118.0, 95.0, 112.0, 91.0, 71.0, 67.0, 38.0, 27.0, 27.0, 17.0, 15.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.118152618408203e-05, -7.854681462049484e-05, -7.591210305690765e-05, -7.327739149332047e-05, -7.064267992973328e-05, -6.800796836614609e-05, -6.53732568025589e-05, -6.273854523897171e-05, -6.010383367538452e-05, -5.746912211179733e-05, -5.4834410548210144e-05, -5.2199698984622955e-05, -4.9564987421035767e-05, -4.693027585744858e-05, -4.429556429386139e-05, -4.16608527302742e-05, -3.902614116668701e-05, -3.639142960309982e-05, -3.3756718039512634e-05, -3.1122006475925446e-05, -2.8487294912338257e-05, -2.5852583348751068e-05, -2.321787178516388e-05, -2.058316022157669e-05, -1.7948448657989502e-05, -1.5313737094402313e-05, -1.2679025530815125e-05, -1.0044313967227936e-05, -7.409602403640747e-06, -4.774890840053558e-06, -2.1401792764663696e-06, 4.945322871208191e-07, 3.129243850708008e-06, 5.7639554142951965e-06, 8.398666977882385e-06, 1.1033378541469574e-05, 1.3668090105056763e-05, 1.630280166864395e-05, 1.893751323223114e-05, 2.157222479581833e-05, 2.4206936359405518e-05, 2.6841647922992706e-05, 2.9476359486579895e-05, 3.2111071050167084e-05, 3.474578261375427e-05, 3.738049417734146e-05, 4.001520574092865e-05, 4.264991730451584e-05, 4.528462886810303e-05, 4.7919340431690216e-05, 5.0554051995277405e-05, 5.3188763558864594e-05, 5.582347512245178e-05, 5.845818668603897e-05, 6.109289824962616e-05, 6.372760981321335e-05, 6.636232137680054e-05, 6.899703294038773e-05, 7.163174450397491e-05, 7.42664560675621e-05, 7.690116763114929e-05, 7.953587919473648e-05, 8.217059075832367e-05, 8.480530232191086e-05, 8.744001388549805e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 3.0, 7.0, 14.0, 14.0, 28.0, 52.0, 80.0, 225.0, 676.0, 2384.0, 22227.0, 963877.0, 54047.0, 3620.0, 787.0, 273.0, 106.0, 60.0, 28.0, 19.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.712249755859375, -1.66278076171875, -1.613311767578125, -1.5638427734375, -1.514373779296875, -1.46490478515625, -1.415435791015625, -1.365966796875, -1.316497802734375, -1.26702880859375, -1.217559814453125, -1.1680908203125, -1.118621826171875, -1.06915283203125, -1.019683837890625, -0.97021484375, -0.920745849609375, -0.87127685546875, -0.821807861328125, -0.7723388671875, -0.722869873046875, -0.67340087890625, -0.623931884765625, -0.574462890625, -0.524993896484375, -0.47552490234375, -0.426055908203125, -0.3765869140625, -0.327117919921875, -0.27764892578125, -0.228179931640625, -0.1787109375, -0.129241943359375, -0.07977294921875, -0.030303955078125, 0.0191650390625, 0.068634033203125, 0.11810302734375, 0.167572021484375, 0.217041015625, 0.266510009765625, 0.31597900390625, 0.365447998046875, 0.4149169921875, 0.464385986328125, 0.51385498046875, 0.563323974609375, 0.61279296875, 0.662261962890625, 0.71173095703125, 0.761199951171875, 0.8106689453125, 0.860137939453125, 0.90960693359375, 0.959075927734375, 1.008544921875, 1.058013916015625, 1.10748291015625, 1.156951904296875, 1.2064208984375, 1.255889892578125, 1.30535888671875, 1.354827880859375, 1.404296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 3.0, 8.0, 19.0, 36.0, 79.0, 143.0, 196.0, 175.0, 141.0, 83.0, 44.0, 19.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-3.140625, -3.0694122314453125, -2.998199462890625, -2.9269866943359375, -2.85577392578125, -2.7845611572265625, -2.713348388671875, -2.6421356201171875, -2.5709228515625, -2.4997100830078125, -2.428497314453125, -2.3572845458984375, -2.28607177734375, -2.2148590087890625, -2.143646240234375, -2.0724334716796875, -2.001220703125, -1.9300079345703125, -1.858795166015625, -1.7875823974609375, -1.71636962890625, -1.6451568603515625, -1.573944091796875, -1.5027313232421875, -1.4315185546875, -1.3603057861328125, -1.289093017578125, -1.2178802490234375, -1.14666748046875, -1.0754547119140625, -1.004241943359375, -0.9330291748046875, -0.86181640625, -0.7906036376953125, -0.719390869140625, -0.6481781005859375, -0.57696533203125, -0.5057525634765625, -0.434539794921875, -0.3633270263671875, -0.2921142578125, -0.2209014892578125, -0.149688720703125, -0.0784759521484375, -0.00726318359375, 0.0639495849609375, 0.135162353515625, 0.2063751220703125, 0.277587890625, 0.3488006591796875, 0.420013427734375, 0.4912261962890625, 0.56243896484375, 0.6336517333984375, 0.704864501953125, 0.7760772705078125, 0.8472900390625, 0.9185028076171875, 0.989715576171875, 1.0609283447265625, 1.13214111328125, 1.2033538818359375, 1.274566650390625, 1.3457794189453125, 1.4169921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 10.0, 22.0, 58.0, 166.0, 302.0, 251.0, 96.0, 45.0, 19.0, 8.0, 10.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.58250427246094, -35.76725769042969, -34.9520149230957, -34.13676834106445, -33.32152557373047, -32.50627899169922, -31.69103240966797, -30.87578773498535, -30.060543060302734, -29.245298385620117, -28.4300537109375, -27.61480712890625, -26.799562454223633, -25.984317779541016, -25.169071197509766, -24.35382652282715, -23.53858184814453, -22.723337173461914, -21.908092498779297, -21.092845916748047, -20.27760124206543, -19.462356567382812, -18.647109985351562, -17.831865310668945, -17.016620635986328, -16.20137596130371, -15.386130332946777, -14.570884704589844, -13.755640029907227, -12.94039535522461, -12.125149726867676, -11.309904098510742, -10.494659423828125, -9.679414749145508, -8.864169120788574, -8.04892349243164, -7.233678817749023, -6.418433666229248, -5.603188514709473, -4.787943363189697, -3.972698211669922, -3.1574530601501465, -2.342207908630371, -1.5269627571105957, -0.7117176055908203, 0.10352754592895508, 0.9187726974487305, 1.7340178489685059, 2.5492630004882812, 3.3645081520080566, 4.179753303527832, 4.994998455047607, 5.810243606567383, 6.625488758087158, 7.440733909606934, 8.255979537963867, 9.071224212646484, 9.886468887329102, 10.701714515686035, 11.516960144042969, 12.332204818725586, 13.147449493408203, 13.962695121765137, 14.77794075012207, 15.593185424804688]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 8.0, 3.0, 10.0, 3.0, 9.0, 21.0, 14.0, 14.0, 12.0, 22.0, 23.0, 18.0, 32.0, 29.0, 43.0, 43.0, 49.0, 40.0, 37.0, 45.0, 50.0, 66.0, 34.0, 36.0, 39.0, 35.0, 30.0, 24.0, 24.0, 24.0, 28.0, 22.0, 16.0, 24.0, 12.0, 11.0, 6.0, 13.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.886558532714844, -18.200279235839844, -17.514001846313477, -16.827722549438477, -16.14144515991211, -15.45516586303711, -14.76888656616211, -14.082608222961426, -13.396329879760742, -12.710051536560059, -12.023773193359375, -11.337493896484375, -10.651215553283691, -9.964937210083008, -9.278657913208008, -8.592379570007324, -7.906101226806641, -7.219822883605957, -6.533544063568115, -5.847265243530273, -5.16098690032959, -4.474708557128906, -3.7884297370910645, -3.1021509170532227, -2.415872573852539, -1.7295939922332764, -1.0433154106140137, -0.357036828994751, 0.3292417526245117, 1.0155203342437744, 1.701798915863037, 2.388077735900879, 3.0743541717529297, 3.7606327533721924, 4.446911334991455, 5.133190155029297, 5.8194684982299805, 6.505746841430664, 7.192025661468506, 7.878304481506348, 8.564582824707031, 9.250861167907715, 9.937139511108398, 10.623418807983398, 11.309697151184082, 11.995975494384766, 12.682254791259766, 13.36853313446045, 14.054811477661133, 14.741089820861816, 15.4273681640625, 16.1136474609375, 16.7999267578125, 17.486204147338867, 18.172483444213867, 18.858760833740234, 19.545040130615234, 20.231319427490234, 20.9175968170166, 21.6038761138916, 22.29015350341797, 22.97643280029297, 23.66271209716797, 24.34899139404297, 25.035268783569336]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 15.0, 29.0, 42.0, 69.0, 154.0, 350.0, 970.0, 3910.0, 42147.0, 4118848.0, 23551.0, 2834.0, 716.0, 305.0, 133.0, 67.0, 43.0, 25.0, 19.0, 8.0, 10.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-4.21484375, -4.1259307861328125, -4.037017822265625, -3.9481048583984375, -3.85919189453125, -3.7702789306640625, -3.681365966796875, -3.5924530029296875, -3.5035400390625, -3.4146270751953125, -3.325714111328125, -3.2368011474609375, -3.14788818359375, -3.0589752197265625, -2.970062255859375, -2.8811492919921875, -2.792236328125, -2.7033233642578125, -2.614410400390625, -2.5254974365234375, -2.43658447265625, -2.3476715087890625, -2.258758544921875, -2.1698455810546875, -2.0809326171875, -1.9920196533203125, -1.903106689453125, -1.8141937255859375, -1.72528076171875, -1.6363677978515625, -1.547454833984375, -1.4585418701171875, -1.36962890625, -1.2807159423828125, -1.191802978515625, -1.1028900146484375, -1.01397705078125, -0.9250640869140625, -0.836151123046875, -0.7472381591796875, -0.6583251953125, -0.5694122314453125, -0.480499267578125, -0.3915863037109375, -0.30267333984375, -0.2137603759765625, -0.124847412109375, -0.0359344482421875, 0.052978515625, 0.1418914794921875, 0.230804443359375, 0.3197174072265625, 0.40863037109375, 0.4975433349609375, 0.586456298828125, 0.6753692626953125, 0.7642822265625, 0.8531951904296875, 0.942108154296875, 1.0310211181640625, 1.11993408203125, 1.2088470458984375, 1.297760009765625, 1.3866729736328125, 1.4755859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 5.0, 7.0, 24.0, 43.0, 55.0, 92.0, 115.0, 149.0, 113.0, 121.0, 83.0, 65.0, 43.0, 24.0, 19.0, 16.0, 6.0, 3.0, 0.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.3805999755859375, -3.302215576171875, -3.2238311767578125, -3.14544677734375, -3.0670623779296875, -2.988677978515625, -2.9102935791015625, -2.8319091796875, -2.7535247802734375, -2.675140380859375, -2.5967559814453125, -2.51837158203125, -2.4399871826171875, -2.361602783203125, -2.2832183837890625, -2.204833984375, -2.1264495849609375, -2.048065185546875, -1.9696807861328125, -1.89129638671875, -1.8129119873046875, -1.734527587890625, -1.6561431884765625, -1.5777587890625, -1.4993743896484375, -1.420989990234375, -1.3426055908203125, -1.26422119140625, -1.1858367919921875, -1.107452392578125, -1.0290679931640625, -0.95068359375, -0.8722991943359375, -0.793914794921875, -0.7155303955078125, -0.63714599609375, -0.5587615966796875, -0.480377197265625, -0.4019927978515625, -0.3236083984375, -0.2452239990234375, -0.166839599609375, -0.0884552001953125, -0.01007080078125, 0.0683135986328125, 0.146697998046875, 0.2250823974609375, 0.303466796875, 0.3818511962890625, 0.460235595703125, 0.5386199951171875, 0.61700439453125, 0.6953887939453125, 0.773773193359375, 0.8521575927734375, 0.9305419921875, 1.0089263916015625, 1.087310791015625, 1.1656951904296875, 1.24407958984375, 1.3224639892578125, 1.400848388671875, 1.4792327880859375, 1.5576171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 13.0, 10.0, 20.0, 21.0, 24.0, 33.0, 31.0, 47.0, 57.0, 85.0, 88.0, 122.0, 176.0, 290.0, 1036.0, 4178480.0, 12363.0, 509.0, 216.0, 141.0, 99.0, 75.0, 70.0, 45.0, 45.0, 33.0, 31.0, 22.0, 15.0, 12.0, 13.0, 11.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.270263671875, -12.85302734375, -12.435791015625, -12.0185546875, -11.601318359375, -11.18408203125, -10.766845703125, -10.349609375, -9.932373046875, -9.51513671875, -9.097900390625, -8.6806640625, -8.263427734375, -7.84619140625, -7.428955078125, -7.01171875, -6.594482421875, -6.17724609375, -5.760009765625, -5.3427734375, -4.925537109375, -4.50830078125, -4.091064453125, -3.673828125, -3.256591796875, -2.83935546875, -2.422119140625, -2.0048828125, -1.587646484375, -1.17041015625, -0.753173828125, -0.3359375, 0.081298828125, 0.49853515625, 0.915771484375, 1.3330078125, 1.750244140625, 2.16748046875, 2.584716796875, 3.001953125, 3.419189453125, 3.83642578125, 4.253662109375, 4.6708984375, 5.088134765625, 5.50537109375, 5.922607421875, 6.33984375, 6.757080078125, 7.17431640625, 7.591552734375, 8.0087890625, 8.426025390625, 8.84326171875, 9.260498046875, 9.677734375, 10.094970703125, 10.51220703125, 10.929443359375, 11.3466796875, 11.763916015625, 12.18115234375, 12.598388671875, 13.015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3954.0, 119.0, 2.0, 0.0, 2.0], "bins": [-14.9453125, -14.695114135742188, -14.444915771484375, -14.194717407226562, -13.94451904296875, -13.694320678710938, -13.444122314453125, -13.193923950195312, -12.9437255859375, -12.693527221679688, -12.443328857421875, -12.193130493164062, -11.94293212890625, -11.692733764648438, -11.442535400390625, -11.192337036132812, -10.942138671875, -10.691940307617188, -10.441741943359375, -10.191543579101562, -9.94134521484375, -9.691146850585938, -9.440948486328125, -9.190750122070312, -8.9405517578125, -8.690353393554688, -8.440155029296875, -8.189956665039062, -7.93975830078125, -7.6895599365234375, -7.439361572265625, -7.1891632080078125, -6.93896484375, -6.6887664794921875, -6.438568115234375, -6.1883697509765625, -5.93817138671875, -5.6879730224609375, -5.437774658203125, -5.1875762939453125, -4.9373779296875, -4.6871795654296875, -4.436981201171875, -4.1867828369140625, -3.93658447265625, -3.6863861083984375, -3.436187744140625, -3.1859893798828125, -2.935791015625, -2.6855926513671875, -2.435394287109375, -2.1851959228515625, -1.93499755859375, -1.6847991943359375, -1.434600830078125, -1.1844024658203125, -0.9342041015625, -0.6840057373046875, -0.433807373046875, -0.1836090087890625, 0.06658935546875, 0.3167877197265625, 0.566986083984375, 0.8171844482421875, 1.0673828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 50.0, 235.0, 570.0, 117.0, 18.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.92208480834961, -37.209564208984375, -36.49704360961914, -35.784523010253906, -35.07200241088867, -34.35948181152344, -33.6469612121582, -32.93444061279297, -32.221920013427734, -31.5093994140625, -30.796878814697266, -30.08435821533203, -29.371837615966797, -28.659317016601562, -27.946796417236328, -27.23427391052246, -26.521751403808594, -25.80923080444336, -25.096710205078125, -24.38418960571289, -23.671669006347656, -22.959148406982422, -22.246627807617188, -21.53410530090332, -20.82158660888672, -20.109066009521484, -19.39654541015625, -18.684024810791016, -17.97150421142578, -17.258983612060547, -16.546463012695312, -15.833940505981445, -15.121419906616211, -14.408899307250977, -13.696378707885742, -12.983858108520508, -12.271336555480957, -11.558815956115723, -10.846295356750488, -10.133773803710938, -9.42125415802002, -8.708733558654785, -7.996212482452393, -7.283691883087158, -6.571170806884766, -5.858650207519531, -5.146129608154297, -4.433608531951904, -3.72108793258667, -3.0085670948028564, -2.296046257019043, -1.5835256576538086, -0.8710048198699951, -0.15848398208618164, 0.5540366172790527, 1.2665576934814453, 1.9790782928466797, 2.691599130630493, 3.4041199684143066, 4.116640567779541, 4.829161643981934, 5.541682243347168, 6.254202842712402, 6.966723918914795, 7.679244518280029]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 10.0, 10.0, 19.0, 44.0, 66.0, 79.0, 135.0, 181.0, 141.0, 128.0, 84.0, 39.0, 28.0, 17.0, 11.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.86685562133789, -22.047029495239258, -21.227201461791992, -20.40737533569336, -19.587547302246094, -18.76772117614746, -17.947893142700195, -17.128067016601562, -16.308238983154297, -15.488411903381348, -14.668584823608398, -13.84875774383545, -13.0289306640625, -12.209104537963867, -11.389276504516602, -10.569450378417969, -9.74962329864502, -8.92979621887207, -8.109969139099121, -7.290142059326172, -6.470314979553223, -5.650488376617432, -4.830661296844482, -4.010834217071533, -3.191007137298584, -2.3711800575256348, -1.551353096961975, -0.7315261363983154, 0.08830094337463379, 0.9081277847290039, 1.7279548645019531, 2.5477819442749023, 3.3676090240478516, 4.187436103820801, 5.00726318359375, 5.827090263366699, 6.646917343139648, 7.4667439460754395, 8.286571502685547, 9.10639762878418, 9.926225662231445, 10.746052742004395, 11.565879821777344, 12.385706901550293, 13.205533981323242, 14.025360107421875, 14.84518814086914, 15.665014266967773, 16.484840393066406, 17.30466651916504, 18.124494552612305, 18.944320678710938, 19.764148712158203, 20.583974838256836, 21.4038028717041, 22.223628997802734, 23.04345703125, 23.863283157348633, 24.6831111907959, 25.50293731689453, 26.322765350341797, 27.14259147644043, 27.962419509887695, 28.782245635986328, 29.602073669433594]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 16.0, 21.0, 33.0, 51.0, 105.0, 163.0, 283.0, 519.0, 1273.0, 4256.0, 22384.0, 300275.0, 667782.0, 41563.0, 6548.0, 1741.0, 749.0, 306.0, 175.0, 98.0, 69.0, 41.0, 20.0, 26.0, 8.0, 13.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2265625, -3.126190185546875, -3.02581787109375, -2.925445556640625, -2.8250732421875, -2.724700927734375, -2.62432861328125, -2.523956298828125, -2.423583984375, -2.323211669921875, -2.22283935546875, -2.122467041015625, -2.0220947265625, -1.921722412109375, -1.82135009765625, -1.720977783203125, -1.62060546875, -1.520233154296875, -1.41986083984375, -1.319488525390625, -1.2191162109375, -1.118743896484375, -1.01837158203125, -0.917999267578125, -0.817626953125, -0.717254638671875, -0.61688232421875, -0.516510009765625, -0.4161376953125, -0.315765380859375, -0.21539306640625, -0.115020751953125, -0.0146484375, 0.085723876953125, 0.18609619140625, 0.286468505859375, 0.3868408203125, 0.487213134765625, 0.58758544921875, 0.687957763671875, 0.788330078125, 0.888702392578125, 0.98907470703125, 1.089447021484375, 1.1898193359375, 1.290191650390625, 1.39056396484375, 1.490936279296875, 1.59130859375, 1.691680908203125, 1.79205322265625, 1.892425537109375, 1.9927978515625, 2.093170166015625, 2.19354248046875, 2.293914794921875, 2.394287109375, 2.494659423828125, 2.59503173828125, 2.695404052734375, 2.7957763671875, 2.896148681640625, 2.99652099609375, 3.096893310546875, 3.197265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 7.0, 17.0, 19.0, 35.0, 38.0, 69.0, 116.0, 131.0, 135.0, 126.0, 105.0, 69.0, 47.0, 35.0, 22.0, 11.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.58984375, -3.491180419921875, -3.39251708984375, -3.293853759765625, -3.1951904296875, -3.096527099609375, -2.99786376953125, -2.899200439453125, -2.800537109375, -2.701873779296875, -2.60321044921875, -2.504547119140625, -2.4058837890625, -2.307220458984375, -2.20855712890625, -2.109893798828125, -2.01123046875, -1.912567138671875, -1.81390380859375, -1.715240478515625, -1.6165771484375, -1.517913818359375, -1.41925048828125, -1.320587158203125, -1.221923828125, -1.123260498046875, -1.02459716796875, -0.925933837890625, -0.8272705078125, -0.728607177734375, -0.62994384765625, -0.531280517578125, -0.4326171875, -0.333953857421875, -0.23529052734375, -0.136627197265625, -0.0379638671875, 0.060699462890625, 0.15936279296875, 0.258026123046875, 0.356689453125, 0.455352783203125, 0.55401611328125, 0.652679443359375, 0.7513427734375, 0.850006103515625, 0.94866943359375, 1.047332763671875, 1.14599609375, 1.244659423828125, 1.34332275390625, 1.441986083984375, 1.5406494140625, 1.639312744140625, 1.73797607421875, 1.836639404296875, 1.935302734375, 2.033966064453125, 2.13262939453125, 2.231292724609375, 2.3299560546875, 2.428619384765625, 2.52728271484375, 2.625946044921875, 2.724609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 47.0, 132.0, 462.0, 3466.0, 1037031.0, 6623.0, 525.0, 153.0, 46.0, 18.0, 13.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.484375, -17.96484375, -17.4453125, -16.92578125, -16.40625, -15.88671875, -15.3671875, -14.84765625, -14.328125, -13.80859375, -13.2890625, -12.76953125, -12.25, -11.73046875, -11.2109375, -10.69140625, -10.171875, -9.65234375, -9.1328125, -8.61328125, -8.09375, -7.57421875, -7.0546875, -6.53515625, -6.015625, -5.49609375, -4.9765625, -4.45703125, -3.9375, -3.41796875, -2.8984375, -2.37890625, -1.859375, -1.33984375, -0.8203125, -0.30078125, 0.21875, 0.73828125, 1.2578125, 1.77734375, 2.296875, 2.81640625, 3.3359375, 3.85546875, 4.375, 4.89453125, 5.4140625, 5.93359375, 6.453125, 6.97265625, 7.4921875, 8.01171875, 8.53125, 9.05078125, 9.5703125, 10.08984375, 10.609375, 11.12890625, 11.6484375, 12.16796875, 12.6875, 13.20703125, 13.7265625, 14.24609375, 14.765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 13.0, 30.0, 65.0, 131.0, 240.0, 223.0, 164.0, 85.0, 36.0, 17.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.765625, -30.0, -29.234375, -28.46875, -27.703125, -26.9375, -26.171875, -25.40625, -24.640625, -23.875, -23.109375, -22.34375, -21.578125, -20.8125, -20.046875, -19.28125, -18.515625, -17.75, -16.984375, -16.21875, -15.453125, -14.6875, -13.921875, -13.15625, -12.390625, -11.625, -10.859375, -10.09375, -9.328125, -8.5625, -7.796875, -7.03125, -6.265625, -5.5, -4.734375, -3.96875, -3.203125, -2.4375, -1.671875, -0.90625, -0.140625, 0.625, 1.390625, 2.15625, 2.921875, 3.6875, 4.453125, 5.21875, 5.984375, 6.75, 7.515625, 8.28125, 9.046875, 9.8125, 10.578125, 11.34375, 12.109375, 12.875, 13.640625, 14.40625, 15.171875, 15.9375, 16.703125, 17.46875, 18.234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 14.0, 25.0, 82.0, 294.0, 4489.0, 1040174.0, 3145.0, 227.0, 63.0, 20.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.10546875, -6.9381103515625, -6.770751953125, -6.6033935546875, -6.43603515625, -6.2686767578125, -6.101318359375, -5.9339599609375, -5.7666015625, -5.5992431640625, -5.431884765625, -5.2645263671875, -5.09716796875, -4.9298095703125, -4.762451171875, -4.5950927734375, -4.427734375, -4.2603759765625, -4.093017578125, -3.9256591796875, -3.75830078125, -3.5909423828125, -3.423583984375, -3.2562255859375, -3.0888671875, -2.9215087890625, -2.754150390625, -2.5867919921875, -2.41943359375, -2.2520751953125, -2.084716796875, -1.9173583984375, -1.75, -1.5826416015625, -1.415283203125, -1.2479248046875, -1.08056640625, -0.9132080078125, -0.745849609375, -0.5784912109375, -0.4111328125, -0.2437744140625, -0.076416015625, 0.0909423828125, 0.25830078125, 0.4256591796875, 0.593017578125, 0.7603759765625, 0.927734375, 1.0950927734375, 1.262451171875, 1.4298095703125, 1.59716796875, 1.7645263671875, 1.931884765625, 2.0992431640625, 2.2666015625, 2.4339599609375, 2.601318359375, 2.7686767578125, 2.93603515625, 3.1033935546875, 3.270751953125, 3.4381103515625, 3.60546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 14.0, 31.0, 52.0, 84.0, 105.0, 159.0, 186.0, 120.0, 88.0, 51.0, 31.0, 32.0, 14.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.274482727050781e-05, -8.815526962280273e-05, -8.356571197509766e-05, -7.897615432739258e-05, -7.43865966796875e-05, -6.979703903198242e-05, -6.520748138427734e-05, -6.0617923736572266e-05, -5.602836608886719e-05, -5.143880844116211e-05, -4.684925079345703e-05, -4.225969314575195e-05, -3.7670135498046875e-05, -3.30805778503418e-05, -2.849102020263672e-05, -2.390146255493164e-05, -1.9311904907226562e-05, -1.4722347259521484e-05, -1.0132789611816406e-05, -5.543231964111328e-06, -9.5367431640625e-07, 3.635883331298828e-06, 8.225440979003906e-06, 1.2814998626708984e-05, 1.7404556274414062e-05, 2.199411392211914e-05, 2.658367156982422e-05, 3.11732292175293e-05, 3.5762786865234375e-05, 4.035234451293945e-05, 4.494190216064453e-05, 4.953145980834961e-05, 5.412101745605469e-05, 5.8710575103759766e-05, 6.330013275146484e-05, 6.788969039916992e-05, 7.2479248046875e-05, 7.706880569458008e-05, 8.165836334228516e-05, 8.624792098999023e-05, 9.083747863769531e-05, 9.542703628540039e-05, 0.00010001659393310547, 0.00010460615158081055, 0.00010919570922851562, 0.0001137852668762207, 0.00011837482452392578, 0.00012296438217163086, 0.00012755393981933594, 0.00013214349746704102, 0.0001367330551147461, 0.00014132261276245117, 0.00014591217041015625, 0.00015050172805786133, 0.0001550912857055664, 0.00015968084335327148, 0.00016427040100097656, 0.00016885995864868164, 0.00017344951629638672, 0.0001780390739440918, 0.00018262863159179688, 0.00018721818923950195, 0.00019180774688720703, 0.0001963973045349121, 0.0002009868621826172]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 21.0, 70.0, 454.0, 101917.0, 945404.0, 528.0, 104.0, 33.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.551513671875, -4.34521484375, -4.138916015625, -3.9326171875, -3.726318359375, -3.52001953125, -3.313720703125, -3.107421875, -2.901123046875, -2.69482421875, -2.488525390625, -2.2822265625, -2.075927734375, -1.86962890625, -1.663330078125, -1.45703125, -1.250732421875, -1.04443359375, -0.838134765625, -0.6318359375, -0.425537109375, -0.21923828125, -0.012939453125, 0.193359375, 0.399658203125, 0.60595703125, 0.812255859375, 1.0185546875, 1.224853515625, 1.43115234375, 1.637451171875, 1.84375, 2.050048828125, 2.25634765625, 2.462646484375, 2.6689453125, 2.875244140625, 3.08154296875, 3.287841796875, 3.494140625, 3.700439453125, 3.90673828125, 4.113037109375, 4.3193359375, 4.525634765625, 4.73193359375, 4.938232421875, 5.14453125, 5.350830078125, 5.55712890625, 5.763427734375, 5.9697265625, 6.176025390625, 6.38232421875, 6.588623046875, 6.794921875, 7.001220703125, 7.20751953125, 7.413818359375, 7.6201171875, 7.826416015625, 8.03271484375, 8.239013671875, 8.4453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 19.0, 24.0, 56.0, 141.0, 254.0, 254.0, 132.0, 49.0, 27.0, 18.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -0.9873199462890625, -0.911163330078125, -0.8350067138671875, -0.75885009765625, -0.6826934814453125, -0.606536865234375, -0.5303802490234375, -0.4542236328125, -0.3780670166015625, -0.301910400390625, -0.2257537841796875, -0.14959716796875, -0.0734405517578125, 0.002716064453125, 0.0788726806640625, 0.155029296875, 0.2311859130859375, 0.307342529296875, 0.3834991455078125, 0.45965576171875, 0.5358123779296875, 0.611968994140625, 0.6881256103515625, 0.7642822265625, 0.8404388427734375, 0.916595458984375, 0.9927520751953125, 1.06890869140625, 1.1450653076171875, 1.221221923828125, 1.2973785400390625, 1.37353515625, 1.4496917724609375, 1.525848388671875, 1.6020050048828125, 1.67816162109375, 1.7543182373046875, 1.830474853515625, 1.9066314697265625, 1.9827880859375, 2.0589447021484375, 2.135101318359375, 2.2112579345703125, 2.28741455078125, 2.3635711669921875, 2.439727783203125, 2.5158843994140625, 2.592041015625, 2.6681976318359375, 2.744354248046875, 2.8205108642578125, 2.89666748046875, 2.9728240966796875, 3.048980712890625, 3.1251373291015625, 3.2012939453125, 3.2774505615234375, 3.353607177734375, 3.4297637939453125, 3.50592041015625, 3.5820770263671875, 3.658233642578125, 3.7343902587890625, 3.810546875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 33.0, 177.0, 575.0, 163.0, 27.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.12113952636719, -65.1185302734375, -62.11592483520508, -59.113319396972656, -56.11071014404297, -53.10810470581055, -50.105499267578125, -47.10289001464844, -44.10028076171875, -41.09767532348633, -38.09506607055664, -35.09246063232422, -32.08985137939453, -29.08724594116211, -26.084638595581055, -23.08203125, -20.079425811767578, -17.076818466186523, -14.074211120605469, -11.07160472869873, -8.068997383117676, -5.066390037536621, -2.063783645629883, 0.9388236999511719, 3.9414310455322266, 6.944038391113281, 9.946645736694336, 12.949252128601074, 15.951859474182129, 18.9544677734375, 21.957073211669922, 24.959680557250977, 27.96228790283203, 30.964895248413086, 33.96750259399414, 36.97010803222656, 39.97271728515625, 42.97532272338867, 45.977928161621094, 48.98053741455078, 51.98314666748047, 54.98575210571289, 57.98836135864258, 60.990966796875, 63.99357604980469, 66.99618530273438, 69.99878692626953, 73.00139617919922, 76.00399780273438, 79.00660705566406, 82.00920867919922, 85.0118179321289, 88.0144271850586, 91.01703643798828, 94.01963806152344, 97.02224731445312, 100.02485656738281, 103.0274658203125, 106.03006744384766, 109.03267669677734, 112.03528594970703, 115.03789520263672, 118.04049682617188, 121.04310607910156, 124.04571533203125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 10.0, 8.0, 8.0, 14.0, 22.0, 24.0, 23.0, 29.0, 37.0, 46.0, 68.0, 69.0, 65.0, 74.0, 77.0, 81.0, 72.0, 50.0, 43.0, 33.0, 27.0, 28.0, 16.0, 21.0, 17.0, 9.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-62.381324768066406, -60.924861907958984, -59.46839904785156, -58.01193618774414, -56.55547332763672, -55.0990104675293, -53.642547607421875, -52.18608474731445, -50.72962188720703, -49.27315902709961, -47.81669616699219, -46.360233306884766, -44.903770446777344, -43.44730758666992, -41.9908447265625, -40.53438186645508, -39.077919006347656, -37.621456146240234, -36.16499328613281, -34.70853042602539, -33.25206756591797, -31.795604705810547, -30.339141845703125, -28.882678985595703, -27.42621612548828, -25.96975326538086, -24.513290405273438, -23.056827545166016, -21.600364685058594, -20.143901824951172, -18.68743896484375, -17.230976104736328, -15.774515151977539, -14.318052291870117, -12.861589431762695, -11.405126571655273, -9.948663711547852, -8.49220085144043, -7.035737991333008, -5.579275131225586, -4.122812271118164, -2.666349411010742, -1.2098865509033203, 0.24657630920410156, 1.7030391693115234, 3.1595020294189453, 4.615964889526367, 6.072427749633789, 7.528890609741211, 8.985353469848633, 10.441816329956055, 11.898279190063477, 13.354742050170898, 14.81120491027832, 16.267667770385742, 17.724130630493164, 19.180593490600586, 20.637056350708008, 22.09351921081543, 23.54998207092285, 25.006444931030273, 26.462907791137695, 27.919370651245117, 29.37583351135254, 30.83229637145996]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 6.0, 14.0, 6.0, 12.0, 19.0, 26.0, 40.0, 81.0, 122.0, 213.0, 451.0, 1014.0, 2443.0, 7354.0, 28485.0, 476151.0, 3575609.0, 81580.0, 12704.0, 4440.0, 1687.0, 775.0, 381.0, 214.0, 156.0, 70.0, 52.0, 35.0, 35.0, 23.0, 16.0, 10.0, 16.0, 6.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7662506103515625, -1.713165283203125, -1.6600799560546875, -1.60699462890625, -1.5539093017578125, -1.500823974609375, -1.4477386474609375, -1.3946533203125, -1.3415679931640625, -1.288482666015625, -1.2353973388671875, -1.18231201171875, -1.1292266845703125, -1.076141357421875, -1.0230560302734375, -0.969970703125, -0.9168853759765625, -0.863800048828125, -0.8107147216796875, -0.75762939453125, -0.7045440673828125, -0.651458740234375, -0.5983734130859375, -0.5452880859375, -0.4922027587890625, -0.439117431640625, -0.3860321044921875, -0.33294677734375, -0.2798614501953125, -0.226776123046875, -0.1736907958984375, -0.12060546875, -0.0675201416015625, -0.014434814453125, 0.0386505126953125, 0.09173583984375, 0.1448211669921875, 0.197906494140625, 0.2509918212890625, 0.3040771484375, 0.3571624755859375, 0.410247802734375, 0.4633331298828125, 0.51641845703125, 0.5695037841796875, 0.622589111328125, 0.6756744384765625, 0.728759765625, 0.7818450927734375, 0.834930419921875, 0.8880157470703125, 0.94110107421875, 0.9941864013671875, 1.047271728515625, 1.1003570556640625, 1.1534423828125, 1.2065277099609375, 1.259613037109375, 1.3126983642578125, 1.36578369140625, 1.4188690185546875, 1.471954345703125, 1.5250396728515625, 1.578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 17.0, 24.0, 48.0, 53.0, 88.0, 109.0, 120.0, 119.0, 107.0, 95.0, 68.0, 56.0, 29.0, 22.0, 19.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.314788818359375, -2.24090576171875, -2.167022705078125, -2.0931396484375, -2.019256591796875, -1.94537353515625, -1.871490478515625, -1.797607421875, -1.723724365234375, -1.64984130859375, -1.575958251953125, -1.5020751953125, -1.428192138671875, -1.35430908203125, -1.280426025390625, -1.20654296875, -1.132659912109375, -1.05877685546875, -0.984893798828125, -0.9110107421875, -0.837127685546875, -0.76324462890625, -0.689361572265625, -0.615478515625, -0.541595458984375, -0.46771240234375, -0.393829345703125, -0.3199462890625, -0.246063232421875, -0.17218017578125, -0.098297119140625, -0.0244140625, 0.049468994140625, 0.12335205078125, 0.197235107421875, 0.2711181640625, 0.345001220703125, 0.41888427734375, 0.492767333984375, 0.566650390625, 0.640533447265625, 0.71441650390625, 0.788299560546875, 0.8621826171875, 0.936065673828125, 1.00994873046875, 1.083831787109375, 1.15771484375, 1.231597900390625, 1.30548095703125, 1.379364013671875, 1.4532470703125, 1.527130126953125, 1.60101318359375, 1.674896240234375, 1.748779296875, 1.822662353515625, 1.89654541015625, 1.970428466796875, 2.0443115234375, 2.118194580078125, 2.19207763671875, 2.265960693359375, 2.33984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 12.0, 33.0, 42.0, 80.0, 149.0, 264.0, 559.0, 1425.0, 5623.0, 34338.0, 3899904.0, 232847.0, 13932.0, 3044.0, 964.0, 490.0, 232.0, 140.0, 69.0, 38.0, 29.0, 16.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.87628173828125, -2.7857666015625, -2.69525146484375, -2.604736328125, -2.51422119140625, -2.4237060546875, -2.33319091796875, -2.24267578125, -2.15216064453125, -2.0616455078125, -1.97113037109375, -1.880615234375, -1.79010009765625, -1.6995849609375, -1.60906982421875, -1.5185546875, -1.42803955078125, -1.3375244140625, -1.24700927734375, -1.156494140625, -1.06597900390625, -0.9754638671875, -0.88494873046875, -0.79443359375, -0.70391845703125, -0.6134033203125, -0.52288818359375, -0.432373046875, -0.34185791015625, -0.2513427734375, -0.16082763671875, -0.0703125, 0.02020263671875, 0.1107177734375, 0.20123291015625, 0.291748046875, 0.38226318359375, 0.4727783203125, 0.56329345703125, 0.65380859375, 0.74432373046875, 0.8348388671875, 0.92535400390625, 1.015869140625, 1.10638427734375, 1.1968994140625, 1.28741455078125, 1.3779296875, 1.46844482421875, 1.5589599609375, 1.64947509765625, 1.739990234375, 1.83050537109375, 1.9210205078125, 2.01153564453125, 2.10205078125, 2.19256591796875, 2.2830810546875, 2.37359619140625, 2.464111328125, 2.55462646484375, 2.6451416015625, 2.73565673828125, 2.826171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 5.0, 3.0, 5.0, 8.0, 8.0, 22.0, 24.0, 24.0, 74.0, 302.0, 1971.0, 1237.0, 213.0, 49.0, 45.0, 24.0, 15.0, 9.0, 7.0, 12.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.150390625, -3.037078857421875, -2.92376708984375, -2.810455322265625, -2.6971435546875, -2.583831787109375, -2.47052001953125, -2.357208251953125, -2.243896484375, -2.130584716796875, -2.01727294921875, -1.903961181640625, -1.7906494140625, -1.677337646484375, -1.56402587890625, -1.450714111328125, -1.33740234375, -1.224090576171875, -1.11077880859375, -0.997467041015625, -0.8841552734375, -0.770843505859375, -0.65753173828125, -0.544219970703125, -0.430908203125, -0.317596435546875, -0.20428466796875, -0.090972900390625, 0.0223388671875, 0.135650634765625, 0.24896240234375, 0.362274169921875, 0.4755859375, 0.588897705078125, 0.70220947265625, 0.815521240234375, 0.9288330078125, 1.042144775390625, 1.15545654296875, 1.268768310546875, 1.382080078125, 1.495391845703125, 1.60870361328125, 1.722015380859375, 1.8353271484375, 1.948638916015625, 2.06195068359375, 2.175262451171875, 2.28857421875, 2.401885986328125, 2.51519775390625, 2.628509521484375, 2.7418212890625, 2.855133056640625, 2.96844482421875, 3.081756591796875, 3.195068359375, 3.308380126953125, 3.42169189453125, 3.535003662109375, 3.6483154296875, 3.761627197265625, 3.87493896484375, 3.988250732421875, 4.1015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 56.0, 229.0, 410.0, 181.0, 55.0, 20.0, 11.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.08222770690918, -10.297014236450195, -9.511800765991211, -8.726587295532227, -7.941373348236084, -7.1561598777771, -6.370945930480957, -5.585732460021973, -4.800518989562988, -4.015305519104004, -3.2300918102264404, -2.444878101348877, -1.6596646308898926, -0.8744511604309082, -0.08923721313476562, 0.6959762573242188, 1.4811897277832031, 2.2664031982421875, 3.051616907119751, 3.8368306159973145, 4.622044086456299, 5.407257556915283, 6.192471504211426, 6.97768497467041, 7.7628984451293945, 8.548111915588379, 9.333325386047363, 10.118539810180664, 10.903753280639648, 11.688966751098633, 12.474180221557617, 13.259393692016602, 14.044609069824219, 14.829822540283203, 15.615036010742188, 16.400249481201172, 17.185462951660156, 17.97067642211914, 18.755889892578125, 19.54110336303711, 20.326316833496094, 21.111530303955078, 21.896743774414062, 22.681957244873047, 23.46717071533203, 24.252384185791016, 25.03759765625, 25.822811126708984, 26.6080265045166, 27.393239974975586, 28.17845344543457, 28.963666915893555, 29.74888038635254, 30.534093856811523, 31.31930923461914, 32.104522705078125, 32.88973617553711, 33.674949645996094, 34.46016311645508, 35.24537658691406, 36.03059005737305, 36.81580352783203, 37.601016998291016, 38.38623046875, 39.171443939208984]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 24.0, 18.0, 20.0, 49.0, 54.0, 62.0, 53.0, 60.0, 66.0, 93.0, 81.0, 67.0, 64.0, 56.0, 39.0, 32.0, 33.0, 27.0, 25.0, 14.0, 13.0, 15.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.722731590270996, -15.204607963562012, -14.686484336853027, -14.16836166381836, -13.650238037109375, -13.13211441040039, -12.613990783691406, -12.095867156982422, -11.577743530273438, -11.059619903564453, -10.541496276855469, -10.023372650146484, -9.505249977111816, -8.987126350402832, -8.469002723693848, -7.950879096984863, -7.432756423950195, -6.914632797241211, -6.396509647369385, -5.8783860206604, -5.360262870788574, -4.84213924407959, -4.3240156173706055, -3.8058922290802, -3.287768840789795, -2.7696454524993896, -2.2515220642089844, -1.7333984375, -1.2152750492095947, -0.6971516609191895, -0.17902803421020508, 0.3390953540802002, 0.8572177886962891, 1.3753411769866943, 1.8934646844863892, 2.411588191986084, 2.9297115802764893, 3.4478349685668945, 3.965958595275879, 4.484082221984863, 5.0022053718566895, 5.520328998565674, 6.0384521484375, 6.556575775146484, 7.074699401855469, 7.592822551727295, 8.110946655273438, 8.629069328308105, 9.14719295501709, 9.665316581726074, 10.183440208435059, 10.701562881469727, 11.219686508178711, 11.737810134887695, 12.25593376159668, 12.774057388305664, 13.292181015014648, 13.810304641723633, 14.328428268432617, 14.846551895141602, 15.36467456817627, 15.882798194885254, 16.400920867919922, 16.919044494628906, 17.43716812133789]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 8.0, 15.0, 19.0, 40.0, 48.0, 67.0, 129.0, 185.0, 317.0, 549.0, 1053.0, 2079.0, 4462.0, 10664.0, 29679.0, 105483.0, 430112.0, 341303.0, 81369.0, 24129.0, 8930.0, 3790.0, 1824.0, 973.0, 553.0, 278.0, 185.0, 86.0, 77.0, 36.0, 31.0, 20.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.09332275390625, -1.0567626953125, -1.02020263671875, -0.983642578125, -0.94708251953125, -0.9105224609375, -0.87396240234375, -0.83740234375, -0.80084228515625, -0.7642822265625, -0.72772216796875, -0.691162109375, -0.65460205078125, -0.6180419921875, -0.58148193359375, -0.544921875, -0.50836181640625, -0.4718017578125, -0.43524169921875, -0.398681640625, -0.36212158203125, -0.3255615234375, -0.28900146484375, -0.25244140625, -0.21588134765625, -0.1793212890625, -0.14276123046875, -0.106201171875, -0.06964111328125, -0.0330810546875, 0.00347900390625, 0.0400390625, 0.07659912109375, 0.1131591796875, 0.14971923828125, 0.186279296875, 0.22283935546875, 0.2593994140625, 0.29595947265625, 0.33251953125, 0.36907958984375, 0.4056396484375, 0.44219970703125, 0.478759765625, 0.51531982421875, 0.5518798828125, 0.58843994140625, 0.625, 0.66156005859375, 0.6981201171875, 0.73468017578125, 0.771240234375, 0.80780029296875, 0.8443603515625, 0.88092041015625, 0.91748046875, 0.95404052734375, 0.9906005859375, 1.02716064453125, 1.063720703125, 1.10028076171875, 1.1368408203125, 1.17340087890625, 1.2099609375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 13.0, 13.0, 21.0, 17.0, 31.0, 43.0, 51.0, 57.0, 68.0, 85.0, 78.0, 86.0, 80.0, 64.0, 58.0, 60.0, 38.0, 41.0, 32.0, 10.0, 13.0, 7.0, 11.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.143035888671875, -1.09759521484375, -1.052154541015625, -1.0067138671875, -0.961273193359375, -0.91583251953125, -0.870391845703125, -0.824951171875, -0.779510498046875, -0.73406982421875, -0.688629150390625, -0.6431884765625, -0.597747802734375, -0.55230712890625, -0.506866455078125, -0.46142578125, -0.415985107421875, -0.37054443359375, -0.325103759765625, -0.2796630859375, -0.234222412109375, -0.18878173828125, -0.143341064453125, -0.097900390625, -0.052459716796875, -0.00701904296875, 0.038421630859375, 0.0838623046875, 0.129302978515625, 0.17474365234375, 0.220184326171875, 0.265625, 0.311065673828125, 0.35650634765625, 0.401947021484375, 0.4473876953125, 0.492828369140625, 0.53826904296875, 0.583709716796875, 0.629150390625, 0.674591064453125, 0.72003173828125, 0.765472412109375, 0.8109130859375, 0.856353759765625, 0.90179443359375, 0.947235107421875, 0.99267578125, 1.038116455078125, 1.08355712890625, 1.128997802734375, 1.1744384765625, 1.219879150390625, 1.26531982421875, 1.310760498046875, 1.356201171875, 1.401641845703125, 1.44708251953125, 1.492523193359375, 1.5379638671875, 1.583404541015625, 1.62884521484375, 1.674285888671875, 1.7197265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 11.0, 7.0, 9.0, 12.0, 18.0, 23.0, 31.0, 69.0, 77.0, 142.0, 188.0, 318.0, 512.0, 866.0, 1759.0, 4922.0, 30420.0, 692835.0, 292258.0, 17228.0, 3577.0, 1315.0, 725.0, 439.0, 236.0, 181.0, 112.0, 70.0, 45.0, 39.0, 32.0, 19.0, 23.0, 10.0, 11.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.38671875, -2.30108642578125, -2.2154541015625, -2.12982177734375, -2.044189453125, -1.95855712890625, -1.8729248046875, -1.78729248046875, -1.70166015625, -1.61602783203125, -1.5303955078125, -1.44476318359375, -1.359130859375, -1.27349853515625, -1.1878662109375, -1.10223388671875, -1.0166015625, -0.93096923828125, -0.8453369140625, -0.75970458984375, -0.674072265625, -0.58843994140625, -0.5028076171875, -0.41717529296875, -0.33154296875, -0.24591064453125, -0.1602783203125, -0.07464599609375, 0.010986328125, 0.09661865234375, 0.1822509765625, 0.26788330078125, 0.353515625, 0.43914794921875, 0.5247802734375, 0.61041259765625, 0.696044921875, 0.78167724609375, 0.8673095703125, 0.95294189453125, 1.03857421875, 1.12420654296875, 1.2098388671875, 1.29547119140625, 1.381103515625, 1.46673583984375, 1.5523681640625, 1.63800048828125, 1.7236328125, 1.80926513671875, 1.8948974609375, 1.98052978515625, 2.066162109375, 2.15179443359375, 2.2374267578125, 2.32305908203125, 2.40869140625, 2.49432373046875, 2.5799560546875, 2.66558837890625, 2.751220703125, 2.83685302734375, 2.9224853515625, 3.00811767578125, 3.09375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 10.0, 6.0, 13.0, 15.0, 31.0, 29.0, 32.0, 46.0, 27.0, 49.0, 45.0, 46.0, 55.0, 56.0, 50.0, 46.0, 58.0, 47.0, 49.0, 52.0, 29.0, 27.0, 25.0, 27.0, 28.0, 25.0, 15.0, 10.0, 12.0, 7.0, 10.0, 1.0, 4.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -5.0020751953125, -4.855712890625, -4.7093505859375, -4.56298828125, -4.4166259765625, -4.270263671875, -4.1239013671875, -3.9775390625, -3.8311767578125, -3.684814453125, -3.5384521484375, -3.39208984375, -3.2457275390625, -3.099365234375, -2.9530029296875, -2.806640625, -2.6602783203125, -2.513916015625, -2.3675537109375, -2.22119140625, -2.0748291015625, -1.928466796875, -1.7821044921875, -1.6357421875, -1.4893798828125, -1.343017578125, -1.1966552734375, -1.05029296875, -0.9039306640625, -0.757568359375, -0.6112060546875, -0.46484375, -0.3184814453125, -0.172119140625, -0.0257568359375, 0.12060546875, 0.2669677734375, 0.413330078125, 0.5596923828125, 0.7060546875, 0.8524169921875, 0.998779296875, 1.1451416015625, 1.29150390625, 1.4378662109375, 1.584228515625, 1.7305908203125, 1.876953125, 2.0233154296875, 2.169677734375, 2.3160400390625, 2.46240234375, 2.6087646484375, 2.755126953125, 2.9014892578125, 3.0478515625, 3.1942138671875, 3.340576171875, 3.4869384765625, 3.63330078125, 3.7796630859375, 3.926025390625, 4.0723876953125, 4.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 9.0, 20.0, 32.0, 91.0, 341.0, 3459.0, 1031041.0, 12719.0, 603.0, 124.0, 45.0, 23.0, 15.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.400390625, -3.30224609375, -3.2041015625, -3.10595703125, -3.0078125, -2.90966796875, -2.8115234375, -2.71337890625, -2.615234375, -2.51708984375, -2.4189453125, -2.32080078125, -2.22265625, -2.12451171875, -2.0263671875, -1.92822265625, -1.830078125, -1.73193359375, -1.6337890625, -1.53564453125, -1.4375, -1.33935546875, -1.2412109375, -1.14306640625, -1.044921875, -0.94677734375, -0.8486328125, -0.75048828125, -0.65234375, -0.55419921875, -0.4560546875, -0.35791015625, -0.259765625, -0.16162109375, -0.0634765625, 0.03466796875, 0.1328125, 0.23095703125, 0.3291015625, 0.42724609375, 0.525390625, 0.62353515625, 0.7216796875, 0.81982421875, 0.91796875, 1.01611328125, 1.1142578125, 1.21240234375, 1.310546875, 1.40869140625, 1.5068359375, 1.60498046875, 1.703125, 1.80126953125, 1.8994140625, 1.99755859375, 2.095703125, 2.19384765625, 2.2919921875, 2.39013671875, 2.48828125, 2.58642578125, 2.6845703125, 2.78271484375, 2.880859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 7.0, 14.0, 17.0, 20.0, 32.0, 36.0, 51.0, 60.0, 66.0, 105.0, 123.0, 105.0, 93.0, 69.0, 39.0, 35.0, 32.0, 14.0, 8.0, 14.0, 14.0, 7.0, 11.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.875131607055664e-05, -8.638110011816025e-05, -8.401088416576385e-05, -8.164066821336746e-05, -7.927045226097107e-05, -7.690023630857468e-05, -7.453002035617828e-05, -7.215980440378189e-05, -6.97895884513855e-05, -6.74193724989891e-05, -6.504915654659271e-05, -6.267894059419632e-05, -6.030872464179993e-05, -5.7938508689403534e-05, -5.556829273700714e-05, -5.319807678461075e-05, -5.0827860832214355e-05, -4.845764487981796e-05, -4.608742892742157e-05, -4.371721297502518e-05, -4.1346997022628784e-05, -3.897678107023239e-05, -3.6606565117836e-05, -3.4236349165439606e-05, -3.186613321304321e-05, -2.949591726064682e-05, -2.7125701308250427e-05, -2.4755485355854034e-05, -2.238526940345764e-05, -2.001505345106125e-05, -1.7644837498664856e-05, -1.5274621546268463e-05, -1.290440559387207e-05, -1.0534189641475677e-05, -8.163973689079285e-06, -5.793757736682892e-06, -3.423541784286499e-06, -1.0533258318901062e-06, 1.3168901205062866e-06, 3.6871060729026794e-06, 6.057322025299072e-06, 8.427537977695465e-06, 1.0797753930091858e-05, 1.316796988248825e-05, 1.5538185834884644e-05, 1.7908401787281036e-05, 2.027861773967743e-05, 2.2648833692073822e-05, 2.5019049644470215e-05, 2.7389265596866608e-05, 2.9759481549263e-05, 3.212969750165939e-05, 3.4499913454055786e-05, 3.687012940645218e-05, 3.924034535884857e-05, 4.1610561311244965e-05, 4.398077726364136e-05, 4.635099321603775e-05, 4.872120916843414e-05, 5.1091425120830536e-05, 5.346164107322693e-05, 5.583185702562332e-05, 5.8202072978019714e-05, 6.057228893041611e-05, 6.29425048828125e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 5.0, 8.0, 12.0, 23.0, 22.0, 39.0, 104.0, 149.0, 295.0, 754.0, 2630.0, 20874.0, 936566.0, 80762.0, 4367.0, 1097.0, 396.0, 186.0, 91.0, 54.0, 28.0, 16.0, 10.0, 9.0, 6.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8802871704101562, -0.8430938720703125, -0.8059005737304688, -0.768707275390625, -0.7315139770507812, -0.6943206787109375, -0.6571273803710938, -0.61993408203125, -0.5827407836914062, -0.5455474853515625, -0.5083541870117188, -0.471160888671875, -0.43396759033203125, -0.3967742919921875, -0.35958099365234375, -0.3223876953125, -0.28519439697265625, -0.2480010986328125, -0.21080780029296875, -0.173614501953125, -0.13642120361328125, -0.0992279052734375, -0.06203460693359375, -0.02484130859375, 0.01235198974609375, 0.0495452880859375, 0.08673858642578125, 0.123931884765625, 0.16112518310546875, 0.1983184814453125, 0.23551177978515625, 0.272705078125, 0.30989837646484375, 0.3470916748046875, 0.38428497314453125, 0.421478271484375, 0.45867156982421875, 0.4958648681640625, 0.5330581665039062, 0.57025146484375, 0.6074447631835938, 0.6446380615234375, 0.6818313598632812, 0.719024658203125, 0.7562179565429688, 0.7934112548828125, 0.8306045532226562, 0.8677978515625, 0.9049911499023438, 0.9421844482421875, 0.9793777465820312, 1.016571044921875, 1.0537643432617188, 1.0909576416015625, 1.1281509399414062, 1.16534423828125, 1.2025375366210938, 1.2397308349609375, 1.2769241333007812, 1.314117431640625, 1.3513107299804688, 1.3885040283203125, 1.4256973266601562, 1.462890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 3.0, 14.0, 8.0, 35.0, 38.0, 56.0, 73.0, 93.0, 121.0, 102.0, 116.0, 89.0, 68.0, 56.0, 33.0, 20.0, 20.0, 15.0, 10.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8134765625, -0.7805023193359375, -0.747528076171875, -0.7145538330078125, -0.68157958984375, -0.6486053466796875, -0.615631103515625, -0.5826568603515625, -0.5496826171875, -0.5167083740234375, -0.483734130859375, -0.4507598876953125, -0.41778564453125, -0.3848114013671875, -0.351837158203125, -0.3188629150390625, -0.285888671875, -0.2529144287109375, -0.219940185546875, -0.1869659423828125, -0.15399169921875, -0.1210174560546875, -0.088043212890625, -0.0550689697265625, -0.0220947265625, 0.0108795166015625, 0.043853759765625, 0.0768280029296875, 0.10980224609375, 0.1427764892578125, 0.175750732421875, 0.2087249755859375, 0.24169921875, 0.2746734619140625, 0.307647705078125, 0.3406219482421875, 0.37359619140625, 0.4065704345703125, 0.439544677734375, 0.4725189208984375, 0.5054931640625, 0.5384674072265625, 0.571441650390625, 0.6044158935546875, 0.63739013671875, 0.6703643798828125, 0.703338623046875, 0.7363128662109375, 0.769287109375, 0.8022613525390625, 0.835235595703125, 0.8682098388671875, 0.90118408203125, 0.9341583251953125, 0.967132568359375, 1.0001068115234375, 1.0330810546875, 1.0660552978515625, 1.099029541015625, 1.1320037841796875, 1.16497802734375, 1.1979522705078125, 1.230926513671875, 1.2639007568359375, 1.296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 73.0, 685.0, 214.0, 22.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.81246948242188, -93.8814697265625, -91.95046997070312, -90.01947021484375, -88.08847045898438, -86.157470703125, -84.22647094726562, -82.29547119140625, -80.36447143554688, -78.4334716796875, -76.50247192382812, -74.57147216796875, -72.64047241210938, -70.70947265625, -68.77847290039062, -66.84747314453125, -64.9164810180664, -62.98548126220703, -61.054481506347656, -59.12348175048828, -57.192481994628906, -55.26148223876953, -53.330482482910156, -51.39948654174805, -49.468482971191406, -47.53748321533203, -45.606483459472656, -43.67548370361328, -41.744483947753906, -39.81348419189453, -37.882484436035156, -35.95148849487305, -34.02048873901367, -32.0894889831543, -30.158489227294922, -28.227489471435547, -26.296491622924805, -24.36549186706543, -22.434492111206055, -20.503494262695312, -18.572494506835938, -16.641494750976562, -14.710495948791504, -12.779496192932129, -10.84849739074707, -8.917497634887695, -6.98649787902832, -5.055499076843262, -3.1244983673095703, -1.193498969078064, 0.7375004291534424, 2.6684999465942383, 4.599499225616455, 6.530498504638672, 8.461498260498047, 10.392497062683105, 12.32349681854248, 14.254496574401855, 16.185495376586914, 18.11649513244629, 20.047494888305664, 21.978492736816406, 23.90949249267578, 25.840492248535156, 27.77149200439453]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 2.0, 1.0, 8.0, 6.0, 4.0, 11.0, 15.0, 16.0, 10.0, 13.0, 22.0, 17.0, 20.0, 34.0, 29.0, 36.0, 45.0, 31.0, 42.0, 52.0, 64.0, 62.0, 59.0, 53.0, 41.0, 36.0, 29.0, 27.0, 27.0, 31.0, 28.0, 12.0, 18.0, 17.0, 14.0, 13.0, 11.0, 10.0, 7.0, 9.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.046215057373047, -16.564645767211914, -16.08307647705078, -15.601506233215332, -15.1199369430542, -14.638367652893066, -14.156797409057617, -13.675228118896484, -13.193658828735352, -12.712089538574219, -12.230520248413086, -11.748950004577637, -11.267380714416504, -10.785811424255371, -10.304241180419922, -9.822671890258789, -9.341102600097656, -8.859533309936523, -8.37796401977539, -7.896393775939941, -7.414824485778809, -6.933255195617676, -6.451685428619385, -5.970115661621094, -5.488546371459961, -5.006977081298828, -4.525407314300537, -4.043837547302246, -3.5622682571411133, -3.0806987285614014, -2.5991291999816895, -2.1175596714019775, -1.6359891891479492, -1.1544196605682373, -0.6728501319885254, -0.19128060340881348, 0.29028892517089844, 0.7718584537506104, 1.2534279823303223, 1.7349975109100342, 2.216567039489746, 2.698136568069458, 3.17970609664917, 3.661275625228882, 4.142845153808594, 4.624414443969727, 5.105984210968018, 5.587553977966309, 6.069123268127441, 6.550692558288574, 7.032262325286865, 7.513832092285156, 7.995401382446289, 8.476970672607422, 8.958539962768555, 9.440110206604004, 9.921679496765137, 10.40324878692627, 10.884819030761719, 11.366388320922852, 11.847957611083984, 12.329526901245117, 12.81109619140625, 13.2926664352417, 13.774235725402832]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 4.0, 8.0, 15.0, 18.0, 27.0, 22.0, 40.0, 44.0, 70.0, 101.0, 140.0, 303.0, 984.0, 21999.0, 4155650.0, 13243.0, 817.0, 251.0, 147.0, 100.0, 82.0, 47.0, 34.0, 30.0, 24.0, 13.0, 9.0, 10.0, 8.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.986328125, -3.855377197265625, -3.72442626953125, -3.593475341796875, -3.4625244140625, -3.331573486328125, -3.20062255859375, -3.069671630859375, -2.938720703125, -2.807769775390625, -2.67681884765625, -2.545867919921875, -2.4149169921875, -2.283966064453125, -2.15301513671875, -2.022064208984375, -1.89111328125, -1.760162353515625, -1.62921142578125, -1.498260498046875, -1.3673095703125, -1.236358642578125, -1.10540771484375, -0.974456787109375, -0.843505859375, -0.712554931640625, -0.58160400390625, -0.450653076171875, -0.3197021484375, -0.188751220703125, -0.05780029296875, 0.073150634765625, 0.2041015625, 0.335052490234375, 0.46600341796875, 0.596954345703125, 0.7279052734375, 0.858856201171875, 0.98980712890625, 1.120758056640625, 1.251708984375, 1.382659912109375, 1.51361083984375, 1.644561767578125, 1.7755126953125, 1.906463623046875, 2.03741455078125, 2.168365478515625, 2.29931640625, 2.430267333984375, 2.56121826171875, 2.692169189453125, 2.8231201171875, 2.954071044921875, 3.08502197265625, 3.215972900390625, 3.346923828125, 3.477874755859375, 3.60882568359375, 3.739776611328125, 3.8707275390625, 4.001678466796875, 4.13262939453125, 4.263580322265625, 4.39453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 2.0, 4.0, 12.0, 18.0, 20.0, 22.0, 26.0, 37.0, 35.0, 31.0, 46.0, 43.0, 63.0, 54.0, 72.0, 56.0, 61.0, 61.0, 44.0, 39.0, 42.0, 30.0, 36.0, 33.0, 22.0, 18.0, 14.0, 8.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0927734375, -1.0624847412109375, -1.032196044921875, -1.0019073486328125, -0.97161865234375, -0.9413299560546875, -0.911041259765625, -0.8807525634765625, -0.8504638671875, -0.8201751708984375, -0.789886474609375, -0.7595977783203125, -0.72930908203125, -0.6990203857421875, -0.668731689453125, -0.6384429931640625, -0.608154296875, -0.5778656005859375, -0.547576904296875, -0.5172882080078125, -0.48699951171875, -0.4567108154296875, -0.426422119140625, -0.3961334228515625, -0.3658447265625, -0.3355560302734375, -0.305267333984375, -0.2749786376953125, -0.24468994140625, -0.2144012451171875, -0.184112548828125, -0.1538238525390625, -0.12353515625, -0.0932464599609375, -0.062957763671875, -0.0326690673828125, -0.00238037109375, 0.0279083251953125, 0.058197021484375, 0.0884857177734375, 0.1187744140625, 0.1490631103515625, 0.179351806640625, 0.2096405029296875, 0.23992919921875, 0.2702178955078125, 0.300506591796875, 0.3307952880859375, 0.361083984375, 0.3913726806640625, 0.421661376953125, 0.4519500732421875, 0.48223876953125, 0.5125274658203125, 0.542816162109375, 0.5731048583984375, 0.6033935546875, 0.6336822509765625, 0.663970947265625, 0.6942596435546875, 0.72454833984375, 0.7548370361328125, 0.785125732421875, 0.8154144287109375, 0.845703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 13.0, 11.0, 23.0, 21.0, 38.0, 41.0, 79.0, 122.0, 164.0, 295.0, 638.0, 1582.0, 4180.0, 12601.0, 59913.0, 2921858.0, 1133637.0, 41929.0, 10516.0, 3661.0, 1417.0, 644.0, 304.0, 175.0, 109.0, 84.0, 52.0, 61.0, 30.0, 25.0, 17.0, 13.0, 17.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.34765625, -1.30670166015625, -1.2657470703125, -1.22479248046875, -1.183837890625, -1.14288330078125, -1.1019287109375, -1.06097412109375, -1.02001953125, -0.97906494140625, -0.9381103515625, -0.89715576171875, -0.856201171875, -0.81524658203125, -0.7742919921875, -0.73333740234375, -0.6923828125, -0.65142822265625, -0.6104736328125, -0.56951904296875, -0.528564453125, -0.48760986328125, -0.4466552734375, -0.40570068359375, -0.36474609375, -0.32379150390625, -0.2828369140625, -0.24188232421875, -0.200927734375, -0.15997314453125, -0.1190185546875, -0.07806396484375, -0.037109375, 0.00384521484375, 0.0447998046875, 0.08575439453125, 0.126708984375, 0.16766357421875, 0.2086181640625, 0.24957275390625, 0.29052734375, 0.33148193359375, 0.3724365234375, 0.41339111328125, 0.454345703125, 0.49530029296875, 0.5362548828125, 0.57720947265625, 0.6181640625, 0.65911865234375, 0.7000732421875, 0.74102783203125, 0.781982421875, 0.82293701171875, 0.8638916015625, 0.90484619140625, 0.94580078125, 0.98675537109375, 1.0277099609375, 1.06866455078125, 1.109619140625, 1.15057373046875, 1.1915283203125, 1.23248291015625, 1.2734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 7.0, 19.0, 31.0, 53.0, 166.0, 822.0, 2062.0, 621.0, 145.0, 55.0, 21.0, 16.0, 13.0, 13.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.7921600341796875, -1.712249755859375, -1.6323394775390625, -1.55242919921875, -1.4725189208984375, -1.392608642578125, -1.3126983642578125, -1.2327880859375, -1.1528778076171875, -1.072967529296875, -0.9930572509765625, -0.91314697265625, -0.8332366943359375, -0.753326416015625, -0.6734161376953125, -0.593505859375, -0.5135955810546875, -0.433685302734375, -0.3537750244140625, -0.27386474609375, -0.1939544677734375, -0.114044189453125, -0.0341339111328125, 0.0457763671875, 0.1256866455078125, 0.205596923828125, 0.2855072021484375, 0.36541748046875, 0.4453277587890625, 0.525238037109375, 0.6051483154296875, 0.68505859375, 0.7649688720703125, 0.844879150390625, 0.9247894287109375, 1.00469970703125, 1.0846099853515625, 1.164520263671875, 1.2444305419921875, 1.3243408203125, 1.4042510986328125, 1.484161376953125, 1.5640716552734375, 1.64398193359375, 1.7238922119140625, 1.803802490234375, 1.8837127685546875, 1.963623046875, 2.0435333251953125, 2.123443603515625, 2.2033538818359375, 2.28326416015625, 2.3631744384765625, 2.443084716796875, 2.5229949951171875, 2.6029052734375, 2.6828155517578125, 2.762725830078125, 2.8426361083984375, 2.92254638671875, 3.0024566650390625, 3.082366943359375, 3.1622772216796875, 3.2421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 9.0, 13.0, 96.0, 372.0, 338.0, 111.0, 23.0, 13.0, 11.0, 8.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.13895034790039, -7.623050689697266, -7.107151031494141, -6.591251850128174, -6.075352191925049, -5.559452533721924, -5.043553352355957, -4.527653694152832, -4.011754035949707, -3.495854377746582, -2.979954957962036, -2.4640555381774902, -1.9481558799743652, -1.4322562217712402, -0.9163568019866943, -0.40045738220214844, 0.11544227600097656, 0.631341814994812, 1.1472413539886475, 1.663140892982483, 2.1790404319763184, 2.6949400901794434, 3.2108395099639893, 3.726738929748535, 4.24263858795166, 4.758538246154785, 5.27443790435791, 5.790337085723877, 6.306236743927002, 6.822136402130127, 7.338035583496094, 7.853935241699219, 8.369836807250977, 8.885736465454102, 9.401636123657227, 9.917535781860352, 10.433435440063477, 10.949335098266602, 11.46523380279541, 11.981133460998535, 12.49703311920166, 13.012932777404785, 13.52883243560791, 14.044732093811035, 14.560630798339844, 15.076530456542969, 15.592430114746094, 16.10832977294922, 16.624229431152344, 17.14012908935547, 17.656028747558594, 18.17192840576172, 18.687828063964844, 19.20372772216797, 19.719627380371094, 20.23552703857422, 20.751426696777344, 21.26732635498047, 21.783226013183594, 22.29912567138672, 22.815025329589844, 23.33092498779297, 23.846824645996094, 24.36272430419922, 24.87862205505371]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 10.0, 14.0, 17.0, 24.0, 40.0, 51.0, 64.0, 64.0, 65.0, 87.0, 78.0, 94.0, 79.0, 68.0, 37.0, 48.0, 38.0, 28.0, 27.0, 22.0, 12.0, 10.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.893312454223633, -6.58778715133667, -6.282262325286865, -5.976737022399902, -5.6712117195129395, -5.365686416625977, -5.060161590576172, -4.754636287689209, -4.449110984802246, -4.143585681915283, -3.8380606174468994, -3.5325355529785156, -3.2270102500915527, -2.921485185623169, -2.615960121154785, -2.3104348182678223, -2.0049099922180176, -1.6993848085403442, -1.393859624862671, -1.088334560394287, -0.7828093767166138, -0.47728419303894043, -0.17175912857055664, 0.13376617431640625, 0.43929123878479004, 0.7448164224624634, 1.0503416061401367, 1.3558666706085205, 1.6613918542861938, 1.9669170379638672, 2.272442102432251, 2.577967405319214, 2.8834924697875977, 3.1890175342559814, 3.4945428371429443, 3.800067901611328, 4.105593204498291, 4.411118507385254, 4.716643333435059, 5.0221686363220215, 5.327693939208984, 5.633219242095947, 5.938744068145752, 6.244269371032715, 6.549794673919678, 6.855319976806641, 7.160844802856445, 7.466370105743408, 7.771894931793213, 8.077420234680176, 8.38294506072998, 8.688470840454102, 8.993995666503906, 9.299520492553711, 9.605045318603516, 9.910571098327637, 10.216095924377441, 10.521620750427246, 10.827146530151367, 11.132671356201172, 11.438196182250977, 11.743721961975098, 12.049246788024902, 12.354772567749023, 12.660297393798828]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 5.0, 8.0, 15.0, 18.0, 23.0, 32.0, 38.0, 64.0, 110.0, 140.0, 199.0, 374.0, 696.0, 1226.0, 2111.0, 4313.0, 9324.0, 21546.0, 57493.0, 182401.0, 456048.0, 204886.0, 64049.0, 23589.0, 9804.0, 4743.0, 2234.0, 1178.0, 729.0, 373.0, 264.0, 148.0, 95.0, 75.0, 60.0, 26.0, 22.0, 25.0, 18.0, 7.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-0.94775390625, -0.9195022583007812, -0.8912506103515625, -0.8629989624023438, -0.834747314453125, -0.8064956665039062, -0.7782440185546875, -0.7499923706054688, -0.72174072265625, -0.6934890747070312, -0.6652374267578125, -0.6369857788085938, -0.608734130859375, -0.5804824829101562, -0.5522308349609375, -0.5239791870117188, -0.4957275390625, -0.46747589111328125, -0.4392242431640625, -0.41097259521484375, -0.382720947265625, -0.35446929931640625, -0.3262176513671875, -0.29796600341796875, -0.26971435546875, -0.24146270751953125, -0.2132110595703125, -0.18495941162109375, -0.156707763671875, -0.12845611572265625, -0.1002044677734375, -0.07195281982421875, -0.043701171875, -0.01544952392578125, 0.0128021240234375, 0.04105377197265625, 0.069305419921875, 0.09755706787109375, 0.1258087158203125, 0.15406036376953125, 0.18231201171875, 0.21056365966796875, 0.2388153076171875, 0.26706695556640625, 0.295318603515625, 0.32357025146484375, 0.3518218994140625, 0.38007354736328125, 0.4083251953125, 0.43657684326171875, 0.4648284912109375, 0.49308013916015625, 0.521331787109375, 0.5495834350585938, 0.5778350830078125, 0.6060867309570312, 0.63433837890625, 0.6625900268554688, 0.6908416748046875, 0.7190933227539062, 0.747344970703125, 0.7755966186523438, 0.8038482666015625, 0.8320999145507812, 0.8603515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 10.0, 9.0, 16.0, 9.0, 18.0, 16.0, 28.0, 23.0, 34.0, 23.0, 37.0, 45.0, 50.0, 48.0, 44.0, 50.0, 47.0, 43.0, 53.0, 38.0, 34.0, 40.0, 33.0, 35.0, 36.0, 35.0, 20.0, 17.0, 15.0, 18.0, 10.0, 14.0, 8.0, 7.0, 6.0, 1.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.725799560546875, -0.70208740234375, -0.678375244140625, -0.6546630859375, -0.630950927734375, -0.60723876953125, -0.583526611328125, -0.559814453125, -0.536102294921875, -0.51239013671875, -0.488677978515625, -0.4649658203125, -0.441253662109375, -0.41754150390625, -0.393829345703125, -0.3701171875, -0.346405029296875, -0.32269287109375, -0.298980712890625, -0.2752685546875, -0.251556396484375, -0.22784423828125, -0.204132080078125, -0.180419921875, -0.156707763671875, -0.13299560546875, -0.109283447265625, -0.0855712890625, -0.061859130859375, -0.03814697265625, -0.014434814453125, 0.00927734375, 0.032989501953125, 0.05670166015625, 0.080413818359375, 0.1041259765625, 0.127838134765625, 0.15155029296875, 0.175262451171875, 0.198974609375, 0.222686767578125, 0.24639892578125, 0.270111083984375, 0.2938232421875, 0.317535400390625, 0.34124755859375, 0.364959716796875, 0.388671875, 0.412384033203125, 0.43609619140625, 0.459808349609375, 0.4835205078125, 0.507232666015625, 0.53094482421875, 0.554656982421875, 0.578369140625, 0.602081298828125, 0.62579345703125, 0.649505615234375, 0.6732177734375, 0.696929931640625, 0.72064208984375, 0.744354248046875, 0.76806640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 7.0, 12.0, 15.0, 12.0, 34.0, 74.0, 116.0, 153.0, 325.0, 781.0, 1892.0, 9409.0, 194801.0, 809965.0, 25251.0, 3460.0, 1090.0, 530.0, 258.0, 127.0, 82.0, 46.0, 35.0, 20.0, 14.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.03515625, -3.937225341796875, -3.83929443359375, -3.741363525390625, -3.6434326171875, -3.545501708984375, -3.44757080078125, -3.349639892578125, -3.251708984375, -3.153778076171875, -3.05584716796875, -2.957916259765625, -2.8599853515625, -2.762054443359375, -2.66412353515625, -2.566192626953125, -2.46826171875, -2.370330810546875, -2.27239990234375, -2.174468994140625, -2.0765380859375, -1.978607177734375, -1.88067626953125, -1.782745361328125, -1.684814453125, -1.586883544921875, -1.48895263671875, -1.391021728515625, -1.2930908203125, -1.195159912109375, -1.09722900390625, -0.999298095703125, -0.9013671875, -0.803436279296875, -0.70550537109375, -0.607574462890625, -0.5096435546875, -0.411712646484375, -0.31378173828125, -0.215850830078125, -0.117919921875, -0.019989013671875, 0.07794189453125, 0.175872802734375, 0.2738037109375, 0.371734619140625, 0.46966552734375, 0.567596435546875, 0.66552734375, 0.763458251953125, 0.86138916015625, 0.959320068359375, 1.0572509765625, 1.155181884765625, 1.25311279296875, 1.351043701171875, 1.448974609375, 1.546905517578125, 1.64483642578125, 1.742767333984375, 1.8406982421875, 1.938629150390625, 2.03656005859375, 2.134490966796875, 2.232421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 13.0, 9.0, 13.0, 23.0, 33.0, 42.0, 53.0, 59.0, 80.0, 89.0, 89.0, 91.0, 83.0, 64.0, 65.0, 47.0, 45.0, 31.0, 31.0, 16.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.84185791015625, -5.6680908203125, -5.49432373046875, -5.320556640625, -5.14678955078125, -4.9730224609375, -4.79925537109375, -4.62548828125, -4.45172119140625, -4.2779541015625, -4.10418701171875, -3.930419921875, -3.75665283203125, -3.5828857421875, -3.40911865234375, -3.2353515625, -3.06158447265625, -2.8878173828125, -2.71405029296875, -2.540283203125, -2.36651611328125, -2.1927490234375, -2.01898193359375, -1.84521484375, -1.67144775390625, -1.4976806640625, -1.32391357421875, -1.150146484375, -0.97637939453125, -0.8026123046875, -0.62884521484375, -0.455078125, -0.28131103515625, -0.1075439453125, 0.06622314453125, 0.239990234375, 0.41375732421875, 0.5875244140625, 0.76129150390625, 0.93505859375, 1.10882568359375, 1.2825927734375, 1.45635986328125, 1.630126953125, 1.80389404296875, 1.9776611328125, 2.15142822265625, 2.3251953125, 2.49896240234375, 2.6727294921875, 2.84649658203125, 3.020263671875, 3.19403076171875, 3.3677978515625, 3.54156494140625, 3.71533203125, 3.88909912109375, 4.0628662109375, 4.23663330078125, 4.410400390625, 4.58416748046875, 4.7579345703125, 4.93170166015625, 5.10546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 12.0, 10.0, 10.0, 33.0, 43.0, 51.0, 117.0, 310.0, 730.0, 2922.0, 35991.0, 995725.0, 10054.0, 1586.0, 485.0, 192.0, 111.0, 56.0, 38.0, 24.0, 16.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.357086181640625, -2.27667236328125, -2.196258544921875, -2.1158447265625, -2.035430908203125, -1.95501708984375, -1.874603271484375, -1.794189453125, -1.713775634765625, -1.63336181640625, -1.552947998046875, -1.4725341796875, -1.392120361328125, -1.31170654296875, -1.231292724609375, -1.15087890625, -1.070465087890625, -0.99005126953125, -0.909637451171875, -0.8292236328125, -0.748809814453125, -0.66839599609375, -0.587982177734375, -0.507568359375, -0.427154541015625, -0.34674072265625, -0.266326904296875, -0.1859130859375, -0.105499267578125, -0.02508544921875, 0.055328369140625, 0.1357421875, 0.216156005859375, 0.29656982421875, 0.376983642578125, 0.4573974609375, 0.537811279296875, 0.61822509765625, 0.698638916015625, 0.779052734375, 0.859466552734375, 0.93988037109375, 1.020294189453125, 1.1007080078125, 1.181121826171875, 1.26153564453125, 1.341949462890625, 1.42236328125, 1.502777099609375, 1.58319091796875, 1.663604736328125, 1.7440185546875, 1.824432373046875, 1.90484619140625, 1.985260009765625, 2.065673828125, 2.146087646484375, 2.22650146484375, 2.306915283203125, 2.3873291015625, 2.467742919921875, 2.54815673828125, 2.628570556640625, 2.708984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 22.0, 33.0, 53.0, 108.0, 153.0, 199.0, 163.0, 89.0, 59.0, 29.0, 21.0, 8.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001571178436279297, -0.0001529073342680931, -0.00014869682490825653, -0.00014448631554841995, -0.00014027580618858337, -0.0001360652968287468, -0.00013185478746891022, -0.00012764427810907364, -0.00012343376874923706, -0.00011922325938940048, -0.0001150127500295639, -0.00011080224066972733, -0.00010659173130989075, -0.00010238122195005417, -9.817071259021759e-05, -9.396020323038101e-05, -8.974969387054443e-05, -8.553918451070786e-05, -8.132867515087128e-05, -7.71181657910347e-05, -7.290765643119812e-05, -6.869714707136154e-05, -6.448663771152496e-05, -6.0276128351688385e-05, -5.606561899185181e-05, -5.185510963201523e-05, -4.764460027217865e-05, -4.343409091234207e-05, -3.922358155250549e-05, -3.5013072192668915e-05, -3.0802562832832336e-05, -2.6592053472995758e-05, -2.238154411315918e-05, -1.81710347533226e-05, -1.3960525393486023e-05, -9.750016033649445e-06, -5.539506673812866e-06, -1.3289973139762878e-06, 2.8815120458602905e-06, 7.092021405696869e-06, 1.1302530765533447e-05, 1.5513040125370026e-05, 1.9723549485206604e-05, 2.3934058845043182e-05, 2.814456820487976e-05, 3.235507756471634e-05, 3.656558692455292e-05, 4.0776096284389496e-05, 4.4986605644226074e-05, 4.919711500406265e-05, 5.340762436389923e-05, 5.761813372373581e-05, 6.182864308357239e-05, 6.603915244340897e-05, 7.024966180324554e-05, 7.446017116308212e-05, 7.86706805229187e-05, 8.288118988275528e-05, 8.709169924259186e-05, 9.130220860242844e-05, 9.551271796226501e-05, 9.972322732210159e-05, 0.00010393373668193817, 0.00010814424604177475, 0.00011235475540161133]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 15.0, 13.0, 16.0, 24.0, 44.0, 51.0, 81.0, 161.0, 271.0, 577.0, 1311.0, 4363.0, 26317.0, 839317.0, 161852.0, 10027.0, 2337.0, 863.0, 382.0, 179.0, 112.0, 66.0, 49.0, 30.0, 23.0, 9.0, 6.0, 8.0, 8.0, 6.0, 3.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99609375, -0.9647369384765625, -0.933380126953125, -0.9020233154296875, -0.87066650390625, -0.8393096923828125, -0.807952880859375, -0.7765960693359375, -0.7452392578125, -0.7138824462890625, -0.682525634765625, -0.6511688232421875, -0.61981201171875, -0.5884552001953125, -0.557098388671875, -0.5257415771484375, -0.494384765625, -0.4630279541015625, -0.431671142578125, -0.4003143310546875, -0.36895751953125, -0.3376007080078125, -0.306243896484375, -0.2748870849609375, -0.2435302734375, -0.2121734619140625, -0.180816650390625, -0.1494598388671875, -0.11810302734375, -0.0867462158203125, -0.055389404296875, -0.0240325927734375, 0.00732421875, 0.0386810302734375, 0.070037841796875, 0.1013946533203125, 0.13275146484375, 0.1641082763671875, 0.195465087890625, 0.2268218994140625, 0.2581787109375, 0.2895355224609375, 0.320892333984375, 0.3522491455078125, 0.38360595703125, 0.4149627685546875, 0.446319580078125, 0.4776763916015625, 0.509033203125, 0.5403900146484375, 0.571746826171875, 0.6031036376953125, 0.63446044921875, 0.6658172607421875, 0.697174072265625, 0.7285308837890625, 0.7598876953125, 0.7912445068359375, 0.822601318359375, 0.8539581298828125, 0.88531494140625, 0.9166717529296875, 0.948028564453125, 0.9793853759765625, 1.0107421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 11.0, 16.0, 20.0, 39.0, 49.0, 69.0, 75.0, 108.0, 119.0, 133.0, 89.0, 83.0, 50.0, 37.0, 20.0, 19.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79736328125, -0.770416259765625, -0.74346923828125, -0.716522216796875, -0.6895751953125, -0.662628173828125, -0.63568115234375, -0.608734130859375, -0.581787109375, -0.554840087890625, -0.52789306640625, -0.500946044921875, -0.4739990234375, -0.447052001953125, -0.42010498046875, -0.393157958984375, -0.3662109375, -0.339263916015625, -0.31231689453125, -0.285369873046875, -0.2584228515625, -0.231475830078125, -0.20452880859375, -0.177581787109375, -0.150634765625, -0.123687744140625, -0.09674072265625, -0.069793701171875, -0.0428466796875, -0.015899658203125, 0.01104736328125, 0.037994384765625, 0.06494140625, 0.091888427734375, 0.11883544921875, 0.145782470703125, 0.1727294921875, 0.199676513671875, 0.22662353515625, 0.253570556640625, 0.280517578125, 0.307464599609375, 0.33441162109375, 0.361358642578125, 0.3883056640625, 0.415252685546875, 0.44219970703125, 0.469146728515625, 0.49609375, 0.523040771484375, 0.54998779296875, 0.576934814453125, 0.6038818359375, 0.630828857421875, 0.65777587890625, 0.684722900390625, 0.711669921875, 0.738616943359375, 0.76556396484375, 0.792510986328125, 0.8194580078125, 0.846405029296875, 0.87335205078125, 0.900299072265625, 0.92724609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 11.0, 57.0, 350.0, 535.0, 42.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.12767028808594, -64.5235824584961, -62.919490814208984, -61.315399169921875, -59.71131134033203, -58.10721969604492, -56.50313186645508, -54.89904022216797, -53.294952392578125, -51.690860748291016, -50.08677291870117, -48.48268127441406, -46.87859344482422, -45.27450180053711, -43.670413970947266, -42.066322326660156, -40.46223449707031, -38.8581428527832, -37.25405502319336, -35.64996337890625, -34.045875549316406, -32.4417839050293, -30.837696075439453, -29.233604431152344, -27.629512786865234, -26.025423049926758, -24.42133331298828, -22.817243576049805, -21.213153839111328, -19.60906219482422, -18.004974365234375, -16.400882720947266, -14.796794891357422, -13.192705154418945, -11.588615417480469, -9.984525680541992, -8.380435943603516, -6.776345252990723, -5.172255516052246, -3.5681657791137695, -1.964076042175293, -0.35998618602752686, 1.2441036701202393, 2.848193645477295, 4.4522833824157715, 6.056373596191406, 7.660463333129883, 9.26455307006836, 10.868642807006836, 12.472732543945312, 14.076822280883789, 15.680912017822266, 17.285001754760742, 18.88909149169922, 20.493183135986328, 22.097270965576172, 23.70136260986328, 25.305452346801758, 26.909542083740234, 28.51363182067871, 30.117721557617188, 31.721813201904297, 33.32590103149414, 34.92999267578125, 36.534080505371094]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 13.0, 15.0, 20.0, 26.0, 28.0, 41.0, 53.0, 51.0, 66.0, 67.0, 84.0, 96.0, 80.0, 63.0, 52.0, 39.0, 46.0, 32.0, 26.0, 25.0, 24.0, 15.0, 13.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.88701629638672, -18.244409561157227, -17.601804733276367, -16.959197998046875, -16.316593170166016, -15.673986434936523, -15.031379699707031, -14.388773918151855, -13.74616813659668, -13.103562355041504, -12.460956573486328, -11.818349838256836, -11.17574405670166, -10.533138275146484, -9.890531539916992, -9.247925758361816, -8.60531997680664, -7.962714195251465, -7.320107936859131, -6.677501678466797, -6.034895896911621, -5.392290115356445, -4.749683856964111, -4.107077598571777, -3.4644718170166016, -2.8218657970428467, -2.179259777069092, -1.536653757095337, -0.894047737121582, -0.25144171714782715, 0.39116430282592773, 1.0337705612182617, 1.6763763427734375, 2.3189823627471924, 2.9615883827209473, 3.604194402694702, 4.246800422668457, 4.889406204223633, 5.532012462615967, 6.174618721008301, 6.817224502563477, 7.459830284118652, 8.102436065673828, 8.74504280090332, 9.387648582458496, 10.030254364013672, 10.672861099243164, 11.31546688079834, 11.958072662353516, 12.600678443908691, 13.243284225463867, 13.88589096069336, 14.528496742248535, 15.171102523803711, 15.813709259033203, 16.456314086914062, 17.098920822143555, 17.741527557373047, 18.384132385253906, 19.0267391204834, 19.66934585571289, 20.31195068359375, 20.954557418823242, 21.597164154052734, 22.239768981933594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 7.0, 10.0, 13.0, 24.0, 40.0, 67.0, 178.0, 545.0, 2580.0, 21329.0, 3136265.0, 1018422.0, 11923.0, 2084.0, 455.0, 182.0, 86.0, 25.0, 15.0, 7.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.755615234375, -1.69482421875, -1.634033203125, -1.5732421875, -1.512451171875, -1.45166015625, -1.390869140625, -1.330078125, -1.269287109375, -1.20849609375, -1.147705078125, -1.0869140625, -1.026123046875, -0.96533203125, -0.904541015625, -0.84375, -0.782958984375, -0.72216796875, -0.661376953125, -0.6005859375, -0.539794921875, -0.47900390625, -0.418212890625, -0.357421875, -0.296630859375, -0.23583984375, -0.175048828125, -0.1142578125, -0.053466796875, 0.00732421875, 0.068115234375, 0.12890625, 0.189697265625, 0.25048828125, 0.311279296875, 0.3720703125, 0.432861328125, 0.49365234375, 0.554443359375, 0.615234375, 0.676025390625, 0.73681640625, 0.797607421875, 0.8583984375, 0.919189453125, 0.97998046875, 1.040771484375, 1.1015625, 1.162353515625, 1.22314453125, 1.283935546875, 1.3447265625, 1.405517578125, 1.46630859375, 1.527099609375, 1.587890625, 1.648681640625, 1.70947265625, 1.770263671875, 1.8310546875, 1.891845703125, 1.95263671875, 2.013427734375, 2.07421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 13.0, 7.0, 25.0, 39.0, 39.0, 32.0, 37.0, 43.0, 62.0, 62.0, 64.0, 62.0, 68.0, 65.0, 59.0, 45.0, 52.0, 43.0, 34.0, 24.0, 30.0, 17.0, 29.0, 11.0, 6.0, 9.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1953125, -1.1663055419921875, -1.137298583984375, -1.1082916259765625, -1.07928466796875, -1.0502777099609375, -1.021270751953125, -0.9922637939453125, -0.9632568359375, -0.9342498779296875, -0.905242919921875, -0.8762359619140625, -0.84722900390625, -0.8182220458984375, -0.789215087890625, -0.7602081298828125, -0.731201171875, -0.7021942138671875, -0.673187255859375, -0.6441802978515625, -0.61517333984375, -0.5861663818359375, -0.557159423828125, -0.5281524658203125, -0.4991455078125, -0.4701385498046875, -0.441131591796875, -0.4121246337890625, -0.38311767578125, -0.3541107177734375, -0.325103759765625, -0.2960968017578125, -0.26708984375, -0.2380828857421875, -0.209075927734375, -0.1800689697265625, -0.15106201171875, -0.1220550537109375, -0.093048095703125, -0.0640411376953125, -0.0350341796875, -0.0060272216796875, 0.022979736328125, 0.0519866943359375, 0.08099365234375, 0.1100006103515625, 0.139007568359375, 0.1680145263671875, 0.197021484375, 0.2260284423828125, 0.255035400390625, 0.2840423583984375, 0.31304931640625, 0.3420562744140625, 0.371063232421875, 0.4000701904296875, 0.4290771484375, 0.4580841064453125, 0.487091064453125, 0.5160980224609375, 0.54510498046875, 0.5741119384765625, 0.603118896484375, 0.6321258544921875, 0.6611328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 2.0, 8.0, 8.0, 21.0, 20.0, 29.0, 40.0, 52.0, 93.0, 156.0, 270.0, 454.0, 1041.0, 2706.0, 8889.0, 37168.0, 371453.0, 3583019.0, 154559.0, 23214.0, 6513.0, 2345.0, 1005.0, 496.0, 244.0, 165.0, 85.0, 57.0, 47.0, 34.0, 18.0, 15.0, 14.0, 13.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.2383956909179688, -1.2043304443359375, -1.1702651977539062, -1.136199951171875, -1.1021347045898438, -1.0680694580078125, -1.0340042114257812, -0.99993896484375, -0.9658737182617188, -0.9318084716796875, -0.8977432250976562, -0.863677978515625, -0.8296127319335938, -0.7955474853515625, -0.7614822387695312, -0.7274169921875, -0.6933517456054688, -0.6592864990234375, -0.6252212524414062, -0.591156005859375, -0.5570907592773438, -0.5230255126953125, -0.48896026611328125, -0.45489501953125, -0.42082977294921875, -0.3867645263671875, -0.35269927978515625, -0.318634033203125, -0.28456878662109375, -0.2505035400390625, -0.21643829345703125, -0.182373046875, -0.14830780029296875, -0.1142425537109375, -0.08017730712890625, -0.046112060546875, -0.01204681396484375, 0.0220184326171875, 0.05608367919921875, 0.09014892578125, 0.12421417236328125, 0.1582794189453125, 0.19234466552734375, 0.226409912109375, 0.26047515869140625, 0.2945404052734375, 0.32860565185546875, 0.3626708984375, 0.39673614501953125, 0.4308013916015625, 0.46486663818359375, 0.498931884765625, 0.5329971313476562, 0.5670623779296875, 0.6011276245117188, 0.63519287109375, 0.6692581176757812, 0.7033233642578125, 0.7373886108398438, 0.771453857421875, 0.8055191040039062, 0.8395843505859375, 0.8736495971679688, 0.90771484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 7.0, 6.0, 10.0, 12.0, 20.0, 25.0, 32.0, 52.0, 75.0, 158.0, 348.0, 826.0, 1180.0, 675.0, 260.0, 142.0, 58.0, 51.0, 36.0, 17.0, 17.0, 11.0, 11.0, 6.0, 7.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.587890625, -1.5388336181640625, -1.489776611328125, -1.4407196044921875, -1.39166259765625, -1.3426055908203125, -1.293548583984375, -1.2444915771484375, -1.1954345703125, -1.1463775634765625, -1.097320556640625, -1.0482635498046875, -0.99920654296875, -0.9501495361328125, -0.901092529296875, -0.8520355224609375, -0.802978515625, -0.7539215087890625, -0.704864501953125, -0.6558074951171875, -0.60675048828125, -0.5576934814453125, -0.508636474609375, -0.4595794677734375, -0.4105224609375, -0.3614654541015625, -0.312408447265625, -0.2633514404296875, -0.21429443359375, -0.1652374267578125, -0.116180419921875, -0.0671234130859375, -0.01806640625, 0.0309906005859375, 0.080047607421875, 0.1291046142578125, 0.17816162109375, 0.2272186279296875, 0.276275634765625, 0.3253326416015625, 0.3743896484375, 0.4234466552734375, 0.472503662109375, 0.5215606689453125, 0.57061767578125, 0.6196746826171875, 0.668731689453125, 0.7177886962890625, 0.766845703125, 0.8159027099609375, 0.864959716796875, 0.9140167236328125, 0.96307373046875, 1.0121307373046875, 1.061187744140625, 1.1102447509765625, 1.1593017578125, 1.2083587646484375, 1.257415771484375, 1.3064727783203125, 1.35552978515625, 1.4045867919921875, 1.453643798828125, 1.5027008056640625, 1.5517578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 14.0, 21.0, 82.0, 192.0, 309.0, 203.0, 83.0, 38.0, 26.0, 7.0, 3.0, 2.0, 6.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.766538619995117, -16.37188148498535, -15.977226257324219, -15.582569122314453, -15.187912940979004, -14.793256759643555, -14.398600578308105, -14.003944396972656, -13.60928726196289, -13.214631080627441, -12.819974899291992, -12.425317764282227, -12.030661582946777, -11.636005401611328, -11.241349220275879, -10.84669303894043, -10.45203685760498, -10.057380676269531, -9.662724494934082, -9.268068313598633, -8.873411178588867, -8.478754997253418, -8.084098815917969, -7.6894426345825195, -7.294785976409912, -6.900129795074463, -6.5054731369018555, -6.110816955566406, -5.716160774230957, -5.32150411605835, -4.9268479347229, -4.532191276550293, -4.137534141540527, -3.742877721786499, -3.3482213020324707, -2.9535651206970215, -2.558908700942993, -2.164252281188965, -1.7695960998535156, -1.3749396800994873, -0.980283260345459, -0.5856269001960754, -0.1909705400466919, 0.20368576049804688, 0.5983421802520752, 0.9929986000061035, 1.3876547813415527, 1.782311201095581, 2.1769676208496094, 2.5716240406036377, 2.966280460357666, 3.3609366416931152, 3.7555930614471436, 4.150249481201172, 4.544905662536621, 4.93956184387207, 5.334218502044678, 5.728874683380127, 6.123531341552734, 6.518187522888184, 6.912843704223633, 7.30750036239624, 7.7021565437316895, 8.096813201904297, 8.491469383239746]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 8.0, 6.0, 13.0, 12.0, 12.0, 16.0, 22.0, 20.0, 28.0, 32.0, 42.0, 39.0, 54.0, 61.0, 44.0, 48.0, 59.0, 73.0, 37.0, 54.0, 47.0, 54.0, 34.0, 34.0, 18.0, 26.0, 23.0, 16.0, 11.0, 12.0, 5.0, 4.0, 6.0, 6.0, 9.0, 6.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.503739356994629, -6.268802642822266, -6.033865928649902, -5.798929214477539, -5.563992500305176, -5.3290557861328125, -5.094119071960449, -4.859182357788086, -4.624245643615723, -4.389308929443359, -4.154372215270996, -3.919435501098633, -3.6844987869262695, -3.4495620727539062, -3.214625358581543, -2.9796886444091797, -2.7447521686553955, -2.5098154544830322, -2.274878740310669, -2.0399420261383057, -1.8050053119659424, -1.5700687170028687, -1.3351320028305054, -1.100195288658142, -0.8652585744857788, -0.6303218603134155, -0.39538517594337463, -0.16044849157333374, 0.07448822259902954, 0.30942487716674805, 0.5443615913391113, 0.7792983055114746, 1.014235019683838, 1.2491717338562012, 1.4841084480285645, 1.7190451622009277, 1.953981876373291, 2.1889185905456543, 2.4238553047180176, 2.658792018890381, 2.893728733062744, 3.1286654472351074, 3.3636021614074707, 3.598538875579834, 3.8334755897521973, 4.0684123039245605, 4.303349018096924, 4.538285732269287, 4.773221969604492, 5.0081586837768555, 5.243095397949219, 5.478032112121582, 5.712968826293945, 5.947905540466309, 6.182842254638672, 6.417778968811035, 6.652715682983398, 6.887652397155762, 7.122589111328125, 7.357525825500488, 7.592462539672852, 7.827399253845215, 8.062335968017578, 8.297272682189941, 8.532209396362305]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 5.0, 10.0, 14.0, 14.0, 27.0, 29.0, 54.0, 81.0, 119.0, 197.0, 381.0, 722.0, 1284.0, 2430.0, 4807.0, 10140.0, 22175.0, 51641.0, 125806.0, 286138.0, 301889.0, 138373.0, 56386.0, 24080.0, 10814.0, 5136.0, 2620.0, 1388.0, 713.0, 418.0, 226.0, 149.0, 88.0, 64.0, 48.0, 30.0, 18.0, 9.0, 10.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.583984375, -0.566314697265625, -0.54864501953125, -0.530975341796875, -0.5133056640625, -0.495635986328125, -0.47796630859375, -0.460296630859375, -0.442626953125, -0.424957275390625, -0.40728759765625, -0.389617919921875, -0.3719482421875, -0.354278564453125, -0.33660888671875, -0.318939208984375, -0.30126953125, -0.283599853515625, -0.26593017578125, -0.248260498046875, -0.2305908203125, -0.212921142578125, -0.19525146484375, -0.177581787109375, -0.159912109375, -0.142242431640625, -0.12457275390625, -0.106903076171875, -0.0892333984375, -0.071563720703125, -0.05389404296875, -0.036224365234375, -0.0185546875, -0.000885009765625, 0.01678466796875, 0.034454345703125, 0.0521240234375, 0.069793701171875, 0.08746337890625, 0.105133056640625, 0.122802734375, 0.140472412109375, 0.15814208984375, 0.175811767578125, 0.1934814453125, 0.211151123046875, 0.22882080078125, 0.246490478515625, 0.26416015625, 0.281829833984375, 0.29949951171875, 0.317169189453125, 0.3348388671875, 0.352508544921875, 0.37017822265625, 0.387847900390625, 0.405517578125, 0.423187255859375, 0.44085693359375, 0.458526611328125, 0.4761962890625, 0.493865966796875, 0.51153564453125, 0.529205322265625, 0.546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 7.0, 7.0, 24.0, 16.0, 19.0, 23.0, 16.0, 30.0, 33.0, 24.0, 41.0, 31.0, 39.0, 56.0, 50.0, 54.0, 44.0, 47.0, 42.0, 51.0, 48.0, 35.0, 36.0, 34.0, 28.0, 27.0, 18.0, 29.0, 14.0, 13.0, 17.0, 12.0, 6.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67724609375, -0.6570892333984375, -0.636932373046875, -0.6167755126953125, -0.59661865234375, -0.5764617919921875, -0.556304931640625, -0.5361480712890625, -0.5159912109375, -0.4958343505859375, -0.475677490234375, -0.4555206298828125, -0.43536376953125, -0.4152069091796875, -0.395050048828125, -0.3748931884765625, -0.354736328125, -0.3345794677734375, -0.314422607421875, -0.2942657470703125, -0.27410888671875, -0.2539520263671875, -0.233795166015625, -0.2136383056640625, -0.1934814453125, -0.1733245849609375, -0.153167724609375, -0.1330108642578125, -0.11285400390625, -0.0926971435546875, -0.072540283203125, -0.0523834228515625, -0.0322265625, -0.0120697021484375, 0.008087158203125, 0.0282440185546875, 0.04840087890625, 0.0685577392578125, 0.088714599609375, 0.1088714599609375, 0.1290283203125, 0.1491851806640625, 0.169342041015625, 0.1894989013671875, 0.20965576171875, 0.2298126220703125, 0.249969482421875, 0.2701263427734375, 0.290283203125, 0.3104400634765625, 0.330596923828125, 0.3507537841796875, 0.37091064453125, 0.3910675048828125, 0.411224365234375, 0.4313812255859375, 0.4515380859375, 0.4716949462890625, 0.491851806640625, 0.5120086669921875, 0.53216552734375, 0.5523223876953125, 0.572479248046875, 0.5926361083984375, 0.61279296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 15.0, 8.0, 13.0, 21.0, 20.0, 32.0, 44.0, 57.0, 64.0, 110.0, 135.0, 189.0, 244.0, 355.0, 559.0, 874.0, 1953.0, 7472.0, 86994.0, 873482.0, 64970.0, 6522.0, 1786.0, 858.0, 478.0, 361.0, 213.0, 183.0, 142.0, 98.0, 89.0, 52.0, 30.0, 27.0, 22.0, 15.0, 16.0, 10.0, 7.0, 5.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.20703125, -2.142974853515625, -2.07891845703125, -2.014862060546875, -1.9508056640625, -1.886749267578125, -1.82269287109375, -1.758636474609375, -1.694580078125, -1.630523681640625, -1.56646728515625, -1.502410888671875, -1.4383544921875, -1.374298095703125, -1.31024169921875, -1.246185302734375, -1.18212890625, -1.118072509765625, -1.05401611328125, -0.989959716796875, -0.9259033203125, -0.861846923828125, -0.79779052734375, -0.733734130859375, -0.669677734375, -0.605621337890625, -0.54156494140625, -0.477508544921875, -0.4134521484375, -0.349395751953125, -0.28533935546875, -0.221282958984375, -0.1572265625, -0.093170166015625, -0.02911376953125, 0.034942626953125, 0.0989990234375, 0.163055419921875, 0.22711181640625, 0.291168212890625, 0.355224609375, 0.419281005859375, 0.48333740234375, 0.547393798828125, 0.6114501953125, 0.675506591796875, 0.73956298828125, 0.803619384765625, 0.86767578125, 0.931732177734375, 0.99578857421875, 1.059844970703125, 1.1239013671875, 1.187957763671875, 1.25201416015625, 1.316070556640625, 1.380126953125, 1.444183349609375, 1.50823974609375, 1.572296142578125, 1.6363525390625, 1.700408935546875, 1.76446533203125, 1.828521728515625, 1.892578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 19.0, 10.0, 10.0, 15.0, 25.0, 27.0, 33.0, 22.0, 47.0, 45.0, 51.0, 41.0, 45.0, 60.0, 64.0, 55.0, 54.0, 71.0, 38.0, 44.0, 44.0, 38.0, 26.0, 20.0, 21.0, 12.0, 13.0, 9.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.291015625, -3.194854736328125, -3.09869384765625, -3.002532958984375, -2.9063720703125, -2.810211181640625, -2.71405029296875, -2.617889404296875, -2.521728515625, -2.425567626953125, -2.32940673828125, -2.233245849609375, -2.1370849609375, -2.040924072265625, -1.94476318359375, -1.848602294921875, -1.75244140625, -1.656280517578125, -1.56011962890625, -1.463958740234375, -1.3677978515625, -1.271636962890625, -1.17547607421875, -1.079315185546875, -0.983154296875, -0.886993408203125, -0.79083251953125, -0.694671630859375, -0.5985107421875, -0.502349853515625, -0.40618896484375, -0.310028076171875, -0.2138671875, -0.117706298828125, -0.02154541015625, 0.074615478515625, 0.1707763671875, 0.266937255859375, 0.36309814453125, 0.459259033203125, 0.555419921875, 0.651580810546875, 0.74774169921875, 0.843902587890625, 0.9400634765625, 1.036224365234375, 1.13238525390625, 1.228546142578125, 1.32470703125, 1.420867919921875, 1.51702880859375, 1.613189697265625, 1.7093505859375, 1.805511474609375, 1.90167236328125, 1.997833251953125, 2.093994140625, 2.190155029296875, 2.28631591796875, 2.382476806640625, 2.4786376953125, 2.574798583984375, 2.67095947265625, 2.767120361328125, 2.86328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 9.0, 7.0, 19.0, 20.0, 40.0, 80.0, 155.0, 319.0, 828.0, 2451.0, 11295.0, 141698.0, 837830.0, 45356.0, 5804.0, 1539.0, 545.0, 244.0, 115.0, 71.0, 42.0, 30.0, 17.0, 10.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.44976043701171875, -0.4312591552734375, -0.41275787353515625, -0.394256591796875, -0.37575531005859375, -0.3572540283203125, -0.33875274658203125, -0.32025146484375, -0.30175018310546875, -0.2832489013671875, -0.26474761962890625, -0.246246337890625, -0.22774505615234375, -0.2092437744140625, -0.19074249267578125, -0.1722412109375, -0.15373992919921875, -0.1352386474609375, -0.11673736572265625, -0.098236083984375, -0.07973480224609375, -0.0612335205078125, -0.04273223876953125, -0.02423095703125, -0.00572967529296875, 0.0127716064453125, 0.03127288818359375, 0.049774169921875, 0.06827545166015625, 0.0867767333984375, 0.10527801513671875, 0.123779296875, 0.14228057861328125, 0.1607818603515625, 0.17928314208984375, 0.197784423828125, 0.21628570556640625, 0.2347869873046875, 0.25328826904296875, 0.27178955078125, 0.29029083251953125, 0.3087921142578125, 0.32729339599609375, 0.345794677734375, 0.36429595947265625, 0.3827972412109375, 0.40129852294921875, 0.4197998046875, 0.43830108642578125, 0.4568023681640625, 0.47530364990234375, 0.493804931640625, 0.5123062133789062, 0.5308074951171875, 0.5493087768554688, 0.56781005859375, 0.5863113403320312, 0.6048126220703125, 0.6233139038085938, 0.641815185546875, 0.6603164672851562, 0.6788177490234375, 0.6973190307617188, 0.7158203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 7.0, 9.0, 11.0, 11.0, 7.0, 19.0, 16.0, 20.0, 31.0, 42.0, 31.0, 43.0, 70.0, 74.0, 93.0, 95.0, 91.0, 56.0, 63.0, 37.0, 39.0, 23.0, 25.0, 20.0, 17.0, 9.0, 7.0, 10.0, 5.0, 3.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.9723854064941406e-05, -5.791429430246353e-05, -5.610473453998566e-05, -5.429517477750778e-05, -5.248561501502991e-05, -5.067605525255203e-05, -4.886649549007416e-05, -4.705693572759628e-05, -4.524737596511841e-05, -4.3437816202640533e-05, -4.162825644016266e-05, -3.9818696677684784e-05, -3.800913691520691e-05, -3.6199577152729034e-05, -3.439001739025116e-05, -3.2580457627773285e-05, -3.077089786529541e-05, -2.8961338102817535e-05, -2.715177834033966e-05, -2.5342218577861786e-05, -2.353265881538391e-05, -2.1723099052906036e-05, -1.991353929042816e-05, -1.8103979527950287e-05, -1.6294419765472412e-05, -1.4484860002994537e-05, -1.2675300240516663e-05, -1.0865740478038788e-05, -9.056180715560913e-06, -7.246620953083038e-06, -5.4370611906051636e-06, -3.627501428127289e-06, -1.817941665649414e-06, -8.381903171539307e-09, 1.8011778593063354e-06, 3.61073762178421e-06, 5.420297384262085e-06, 7.22985714673996e-06, 9.039416909217834e-06, 1.084897667169571e-05, 1.2658536434173584e-05, 1.4468096196651459e-05, 1.6277655959129333e-05, 1.8087215721607208e-05, 1.9896775484085083e-05, 2.1706335246562958e-05, 2.3515895009040833e-05, 2.5325454771518707e-05, 2.7135014533996582e-05, 2.8944574296474457e-05, 3.075413405895233e-05, 3.2563693821430206e-05, 3.437325358390808e-05, 3.6182813346385956e-05, 3.799237310886383e-05, 3.9801932871341705e-05, 4.161149263381958e-05, 4.3421052396297455e-05, 4.523061215877533e-05, 4.7040171921253204e-05, 4.884973168373108e-05, 5.0659291446208954e-05, 5.246885120868683e-05, 5.42784109711647e-05, 5.608797073364258e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 2.0, 5.0, 7.0, 7.0, 3.0, 10.0, 22.0, 33.0, 42.0, 39.0, 58.0, 79.0, 171.0, 218.0, 428.0, 744.0, 1710.0, 4790.0, 19713.0, 194119.0, 755887.0, 55855.0, 9244.0, 2794.0, 1134.0, 554.0, 331.0, 153.0, 111.0, 82.0, 59.0, 36.0, 36.0, 21.0, 14.0, 17.0, 6.0, 10.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.479248046875, -0.4656562805175781, -0.45206451416015625, -0.4384727478027344, -0.4248809814453125, -0.4112892150878906, -0.39769744873046875, -0.3841056823730469, -0.370513916015625, -0.3569221496582031, -0.34333038330078125, -0.3297386169433594, -0.3161468505859375, -0.3025550842285156, -0.28896331787109375, -0.2753715515136719, -0.26177978515625, -0.24818801879882812, -0.23459625244140625, -0.22100448608398438, -0.2074127197265625, -0.19382095336914062, -0.18022918701171875, -0.16663742065429688, -0.153045654296875, -0.13945388793945312, -0.12586212158203125, -0.11227035522460938, -0.0986785888671875, -0.08508682250976562, -0.07149505615234375, -0.057903289794921875, -0.0443115234375, -0.030719757080078125, -0.01712799072265625, -0.003536224365234375, 0.0100555419921875, 0.023647308349609375, 0.03723907470703125, 0.050830841064453125, 0.064422607421875, 0.07801437377929688, 0.09160614013671875, 0.10519790649414062, 0.1187896728515625, 0.13238143920898438, 0.14597320556640625, 0.15956497192382812, 0.17315673828125, 0.18674850463867188, 0.20034027099609375, 0.21393203735351562, 0.2275238037109375, 0.24111557006835938, 0.25470733642578125, 0.2682991027832031, 0.281890869140625, 0.2954826354980469, 0.30907440185546875, 0.3226661682128906, 0.3362579345703125, 0.3498497009277344, 0.36344146728515625, 0.3770332336425781, 0.390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 15.0, 13.0, 15.0, 22.0, 39.0, 46.0, 44.0, 71.0, 69.0, 78.0, 84.0, 74.0, 63.0, 44.0, 53.0, 47.0, 37.0, 33.0, 26.0, 21.0, 15.0, 10.0, 10.0, 11.0, 2.0, 4.0, 6.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.4017524719238281, -0.38871002197265625, -0.3756675720214844, -0.3626251220703125, -0.3495826721191406, -0.33654022216796875, -0.3234977722167969, -0.310455322265625, -0.2974128723144531, -0.28437042236328125, -0.2713279724121094, -0.2582855224609375, -0.24524307250976562, -0.23220062255859375, -0.21915817260742188, -0.20611572265625, -0.19307327270507812, -0.18003082275390625, -0.16698837280273438, -0.1539459228515625, -0.14090347290039062, -0.12786102294921875, -0.11481857299804688, -0.101776123046875, -0.08873367309570312, -0.07569122314453125, -0.06264877319335938, -0.0496063232421875, -0.036563873291015625, -0.02352142333984375, -0.010478973388671875, 0.0025634765625, 0.015605926513671875, 0.02864837646484375, 0.041690826416015625, 0.0547332763671875, 0.06777572631835938, 0.08081817626953125, 0.09386062622070312, 0.106903076171875, 0.11994552612304688, 0.13298797607421875, 0.14603042602539062, 0.1590728759765625, 0.17211532592773438, 0.18515777587890625, 0.19820022583007812, 0.21124267578125, 0.22428512573242188, 0.23732757568359375, 0.2503700256347656, 0.2634124755859375, 0.2764549255371094, 0.28949737548828125, 0.3025398254394531, 0.315582275390625, 0.3286247253417969, 0.34166717529296875, 0.3547096252441406, 0.3677520751953125, 0.3807945251464844, 0.39383697509765625, 0.4068794250488281, 0.419921875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 22.0, 114.0, 377.0, 332.0, 94.0, 29.0, 14.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.400068283081055, -13.74610710144043, -13.092145919799805, -12.43818473815918, -11.784223556518555, -11.13026237487793, -10.476300239562988, -9.822339057922363, -9.168377876281738, -8.514416694641113, -7.860455513000488, -7.206493854522705, -6.55253267288208, -5.898571491241455, -5.244609832763672, -4.590648651123047, -3.936687469482422, -3.282726287841797, -2.6287648677825928, -1.9748035669326782, -1.3208422660827637, -0.6668810844421387, -0.01291966438293457, 0.6410417556762695, 1.2950029373168945, 1.948964238166809, 2.6029255390167236, 3.2568869590759277, 3.9108481407165527, 4.564809322357178, 5.218770980834961, 5.872732162475586, 6.526695251464844, 7.180656433105469, 7.834617614746094, 8.488578796386719, 9.142539978027344, 9.796501159667969, 10.45046329498291, 11.104424476623535, 11.75838565826416, 12.412346839904785, 13.06630802154541, 13.720269203186035, 14.374231338500977, 15.028192520141602, 15.682153701782227, 16.33611488342285, 16.990076065063477, 17.6440372467041, 18.297998428344727, 18.95195960998535, 19.605920791625977, 20.2598819732666, 20.913843154907227, 21.567806243896484, 22.22176742553711, 22.875728607177734, 23.52968978881836, 24.183650970458984, 24.83761215209961, 25.491573333740234, 26.14553451538086, 26.799495697021484, 27.45345687866211]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 1.0, 10.0, 5.0, 11.0, 12.0, 12.0, 13.0, 17.0, 25.0, 21.0, 26.0, 26.0, 24.0, 34.0, 26.0, 39.0, 45.0, 54.0, 51.0, 49.0, 75.0, 49.0, 49.0, 35.0, 28.0, 28.0, 21.0, 26.0, 29.0, 18.0, 18.0, 16.0, 13.0, 12.0, 11.0, 9.0, 11.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.76205062866211, -8.47878360748291, -8.195515632629395, -7.912248611450195, -7.628981590270996, -7.345714092254639, -7.062446594238281, -6.779179573059082, -6.495912551879883, -6.212645053863525, -5.929378032684326, -5.646110534667969, -5.3628435134887695, -5.079576015472412, -4.796308517456055, -4.5130414962768555, -4.229773998260498, -3.9465067386627197, -3.6632394790649414, -3.379971981048584, -3.0967049598693848, -2.8134374618530273, -2.530170202255249, -2.2469029426574707, -1.9636356830596924, -1.680368423461914, -1.3971011638641357, -1.1138337850570679, -0.8305665254592896, -0.5472992658615112, -0.26403188705444336, 0.01923537254333496, 0.3025026321411133, 0.5857698917388916, 0.8690372109413147, 1.1523045301437378, 1.4355717897415161, 1.7188390493392944, 2.0021064281463623, 2.2853736877441406, 2.568640947341919, 2.8519082069396973, 3.1351754665374756, 3.418442726135254, 3.7017102241516113, 3.9849772453308105, 4.268244743347168, 4.551511764526367, 4.834779262542725, 5.118046760559082, 5.401313781738281, 5.684581279754639, 5.967848300933838, 6.251115798950195, 6.5343828201293945, 6.817650318145752, 7.100917816162109, 7.384185314178467, 7.667452335357666, 7.950719833374023, 8.233986854553223, 8.517253875732422, 8.800521850585938, 9.083788871765137, 9.367055892944336]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 19.0, 18.0, 25.0, 57.0, 81.0, 120.0, 233.0, 374.0, 635.0, 1139.0, 2284.0, 5468.0, 16615.0, 73134.0, 395988.0, 1748553.0, 1530560.0, 334405.0, 60733.0, 14268.0, 4801.0, 2237.0, 1099.0, 598.0, 307.0, 209.0, 123.0, 70.0, 38.0, 27.0, 22.0, 17.0, 9.0, 2.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.56640625, -0.5529022216796875, -0.539398193359375, -0.5258941650390625, -0.51239013671875, -0.4988861083984375, -0.485382080078125, -0.4718780517578125, -0.4583740234375, -0.4448699951171875, -0.431365966796875, -0.4178619384765625, -0.40435791015625, -0.3908538818359375, -0.377349853515625, -0.3638458251953125, -0.350341796875, -0.3368377685546875, -0.323333740234375, -0.3098297119140625, -0.29632568359375, -0.2828216552734375, -0.269317626953125, -0.2558135986328125, -0.2423095703125, -0.2288055419921875, -0.215301513671875, -0.2017974853515625, -0.18829345703125, -0.1747894287109375, -0.161285400390625, -0.1477813720703125, -0.13427734375, -0.1207733154296875, -0.107269287109375, -0.0937652587890625, -0.08026123046875, -0.0667572021484375, -0.053253173828125, -0.0397491455078125, -0.0262451171875, -0.0127410888671875, 0.000762939453125, 0.0142669677734375, 0.02777099609375, 0.0412750244140625, 0.054779052734375, 0.0682830810546875, 0.081787109375, 0.0952911376953125, 0.108795166015625, 0.1222991943359375, 0.13580322265625, 0.1493072509765625, 0.162811279296875, 0.1763153076171875, 0.1898193359375, 0.2033233642578125, 0.216827392578125, 0.2303314208984375, 0.24383544921875, 0.2573394775390625, 0.270843505859375, 0.2843475341796875, 0.2978515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 9.0, 12.0, 13.0, 14.0, 9.0, 14.0, 17.0, 21.0, 23.0, 14.0, 25.0, 26.0, 27.0, 30.0, 34.0, 35.0, 42.0, 38.0, 35.0, 30.0, 47.0, 38.0, 30.0, 36.0, 38.0, 52.0, 32.0, 17.0, 31.0, 25.0, 29.0, 24.0, 15.0, 18.0, 13.0, 9.0, 12.0, 4.0, 8.0, 9.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4443359375, -0.4298858642578125, -0.415435791015625, -0.4009857177734375, -0.38653564453125, -0.3720855712890625, -0.357635498046875, -0.3431854248046875, -0.3287353515625, -0.3142852783203125, -0.299835205078125, -0.2853851318359375, -0.27093505859375, -0.2564849853515625, -0.242034912109375, -0.2275848388671875, -0.213134765625, -0.1986846923828125, -0.184234619140625, -0.1697845458984375, -0.15533447265625, -0.1408843994140625, -0.126434326171875, -0.1119842529296875, -0.0975341796875, -0.0830841064453125, -0.068634033203125, -0.0541839599609375, -0.03973388671875, -0.0252838134765625, -0.010833740234375, 0.0036163330078125, 0.01806640625, 0.0325164794921875, 0.046966552734375, 0.0614166259765625, 0.07586669921875, 0.0903167724609375, 0.104766845703125, 0.1192169189453125, 0.1336669921875, 0.1481170654296875, 0.162567138671875, 0.1770172119140625, 0.19146728515625, 0.2059173583984375, 0.220367431640625, 0.2348175048828125, 0.249267578125, 0.2637176513671875, 0.278167724609375, 0.2926177978515625, 0.30706787109375, 0.3215179443359375, 0.335968017578125, 0.3504180908203125, 0.3648681640625, 0.3793182373046875, 0.393768310546875, 0.4082183837890625, 0.42266845703125, 0.4371185302734375, 0.451568603515625, 0.4660186767578125, 0.48046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 12.0, 21.0, 34.0, 40.0, 61.0, 77.0, 125.0, 193.0, 304.0, 543.0, 1184.0, 3041.0, 11202.0, 71477.0, 3085502.0, 969246.0, 39683.0, 7298.0, 2230.0, 957.0, 451.0, 222.0, 132.0, 83.0, 56.0, 27.0, 21.0, 11.0, 7.0, 12.0, 6.0, 6.0, 1.0, 0.0, 4.0], "bins": [-1.3505859375, -1.319793701171875, -1.28900146484375, -1.258209228515625, -1.2274169921875, -1.196624755859375, -1.16583251953125, -1.135040283203125, -1.104248046875, -1.073455810546875, -1.04266357421875, -1.011871337890625, -0.9810791015625, -0.950286865234375, -0.91949462890625, -0.888702392578125, -0.85791015625, -0.827117919921875, -0.79632568359375, -0.765533447265625, -0.7347412109375, -0.703948974609375, -0.67315673828125, -0.642364501953125, -0.611572265625, -0.580780029296875, -0.54998779296875, -0.519195556640625, -0.4884033203125, -0.457611083984375, -0.42681884765625, -0.396026611328125, -0.365234375, -0.334442138671875, -0.30364990234375, -0.272857666015625, -0.2420654296875, -0.211273193359375, -0.18048095703125, -0.149688720703125, -0.118896484375, -0.088104248046875, -0.05731201171875, -0.026519775390625, 0.0042724609375, 0.035064697265625, 0.06585693359375, 0.096649169921875, 0.12744140625, 0.158233642578125, 0.18902587890625, 0.219818115234375, 0.2506103515625, 0.281402587890625, 0.31219482421875, 0.342987060546875, 0.373779296875, 0.404571533203125, 0.43536376953125, 0.466156005859375, 0.4969482421875, 0.527740478515625, 0.55853271484375, 0.589324951171875, 0.6201171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 6.0, 5.0, 12.0, 25.0, 32.0, 48.0, 107.0, 234.0, 782.0, 1396.0, 839.0, 305.0, 108.0, 60.0, 36.0, 23.0, 16.0, 11.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -2.0072021484375, -1.957763671875, -1.9083251953125, -1.85888671875, -1.8094482421875, -1.760009765625, -1.7105712890625, -1.6611328125, -1.6116943359375, -1.562255859375, -1.5128173828125, -1.46337890625, -1.4139404296875, -1.364501953125, -1.3150634765625, -1.265625, -1.2161865234375, -1.166748046875, -1.1173095703125, -1.06787109375, -1.0184326171875, -0.968994140625, -0.9195556640625, -0.8701171875, -0.8206787109375, -0.771240234375, -0.7218017578125, -0.67236328125, -0.6229248046875, -0.573486328125, -0.5240478515625, -0.474609375, -0.4251708984375, -0.375732421875, -0.3262939453125, -0.27685546875, -0.2274169921875, -0.177978515625, -0.1285400390625, -0.0791015625, -0.0296630859375, 0.019775390625, 0.0692138671875, 0.11865234375, 0.1680908203125, 0.217529296875, 0.2669677734375, 0.31640625, 0.3658447265625, 0.415283203125, 0.4647216796875, 0.51416015625, 0.5635986328125, 0.613037109375, 0.6624755859375, 0.7119140625, 0.7613525390625, 0.810791015625, 0.8602294921875, 0.90966796875, 0.9591064453125, 1.008544921875, 1.0579833984375, 1.107421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 90.0, 401.0, 372.0, 89.0, 17.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.647078514099121, -12.094755172729492, -11.542431831359863, -10.990108489990234, -10.437784194946289, -9.885461807250977, -9.333137512207031, -8.780814170837402, -8.228490829467773, -7.6761674880981445, -7.123844146728516, -6.5715203285217285, -6.0191969871521, -5.466873645782471, -4.914549827575684, -4.362226486206055, -3.809903144836426, -3.257579803466797, -2.705256223678589, -2.152932643890381, -1.600609302520752, -1.048285961151123, -0.49596238136291504, 0.05636119842529297, 0.6086845397949219, 1.1610080003738403, 1.7133314609527588, 2.265655040740967, 2.8179783821105957, 3.3703017234802246, 3.9226253032684326, 4.474948883056641, 5.027273178100586, 5.579596519470215, 6.131919860839844, 6.684243679046631, 7.23656702041626, 7.788890361785889, 8.341214179992676, 8.893537521362305, 9.445860862731934, 9.998184204101562, 10.550507545471191, 11.10283088684082, 11.655155181884766, 12.207477569580078, 12.759801864624023, 13.312125205993652, 13.864448547363281, 14.41677188873291, 14.969095230102539, 15.521418571472168, 16.073741912841797, 16.626066207885742, 17.178388595581055, 17.730712890625, 18.283035278320312, 18.835359573364258, 19.38768196105957, 19.940006256103516, 20.492328643798828, 21.044652938842773, 21.596975326538086, 22.14929962158203, 22.701623916625977]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 1.0, 4.0, 13.0, 11.0, 18.0, 18.0, 27.0, 25.0, 28.0, 37.0, 37.0, 54.0, 40.0, 53.0, 61.0, 54.0, 56.0, 41.0, 53.0, 54.0, 56.0, 43.0, 37.0, 27.0, 24.0, 25.0, 21.0, 15.0, 14.0, 13.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.617569923400879, -4.455904483795166, -4.294239044189453, -4.132573127746582, -3.9709079265594482, -3.8092422485351562, -3.6475768089294434, -3.4859113693237305, -3.3242459297180176, -3.1625804901123047, -3.0009148120880127, -2.8392493724823, -2.677583932876587, -2.515918254852295, -2.354252815246582, -2.192587375640869, -2.030921697616577, -1.8692561388015747, -1.7075906991958618, -1.5459251403808594, -1.3842597007751465, -1.222594141960144, -1.0609285831451416, -0.8992631435394287, -0.7375975847244263, -0.5759320855140686, -0.41426655650138855, -0.2526010274887085, -0.09093552827835083, 0.07072997093200684, 0.23239552974700928, 0.39406096935272217, 0.5557265281677246, 0.7173920273780823, 0.8790575265884399, 1.0407230854034424, 1.2023885250091553, 1.3640540838241577, 1.5257196426391602, 1.687385082244873, 1.8490506410598755, 2.010716199874878, 2.172381639480591, 2.334047317504883, 2.4957127571105957, 2.6573781967163086, 2.8190436363220215, 2.9807090759277344, 3.1423747539520264, 3.3040401935577393, 3.4657058715820312, 3.627371311187744, 3.789036750793457, 3.95070219039917, 4.112367630004883, 4.274033546447754, 4.435698986053467, 4.59736442565918, 4.759029865264893, 4.9206953048706055, 5.082361221313477, 5.2440266609191895, 5.405692100524902, 5.567357540130615, 5.729022979736328]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 12.0, 17.0, 20.0, 30.0, 60.0, 87.0, 156.0, 291.0, 502.0, 930.0, 1812.0, 3577.0, 7714.0, 17740.0, 43727.0, 110019.0, 274764.0, 339045.0, 146833.0, 58651.0, 23283.0, 9953.0, 4517.0, 2304.0, 1134.0, 595.0, 321.0, 181.0, 127.0, 53.0, 33.0, 19.0, 20.0, 9.0, 6.0, 2.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62646484375, -0.608123779296875, -0.58978271484375, -0.571441650390625, -0.5531005859375, -0.534759521484375, -0.51641845703125, -0.498077392578125, -0.479736328125, -0.461395263671875, -0.44305419921875, -0.424713134765625, -0.4063720703125, -0.388031005859375, -0.36968994140625, -0.351348876953125, -0.3330078125, -0.314666748046875, -0.29632568359375, -0.277984619140625, -0.2596435546875, -0.241302490234375, -0.22296142578125, -0.204620361328125, -0.186279296875, -0.167938232421875, -0.14959716796875, -0.131256103515625, -0.1129150390625, -0.094573974609375, -0.07623291015625, -0.057891845703125, -0.03955078125, -0.021209716796875, -0.00286865234375, 0.015472412109375, 0.0338134765625, 0.052154541015625, 0.07049560546875, 0.088836669921875, 0.107177734375, 0.125518798828125, 0.14385986328125, 0.162200927734375, 0.1805419921875, 0.198883056640625, 0.21722412109375, 0.235565185546875, 0.25390625, 0.272247314453125, 0.29058837890625, 0.308929443359375, 0.3272705078125, 0.345611572265625, 0.36395263671875, 0.382293701171875, 0.400634765625, 0.418975830078125, 0.43731689453125, 0.455657958984375, 0.4739990234375, 0.492340087890625, 0.51068115234375, 0.529022216796875, 0.54736328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 7.0, 6.0, 10.0, 10.0, 6.0, 15.0, 21.0, 22.0, 23.0, 14.0, 28.0, 21.0, 20.0, 30.0, 29.0, 37.0, 38.0, 40.0, 34.0, 49.0, 40.0, 39.0, 31.0, 43.0, 44.0, 34.0, 51.0, 25.0, 26.0, 42.0, 19.0, 18.0, 14.0, 17.0, 13.0, 11.0, 15.0, 13.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.447509765625, -0.4329109191894531, -0.41831207275390625, -0.4037132263183594, -0.3891143798828125, -0.3745155334472656, -0.35991668701171875, -0.3453178405761719, -0.330718994140625, -0.3161201477050781, -0.30152130126953125, -0.2869224548339844, -0.2723236083984375, -0.2577247619628906, -0.24312591552734375, -0.22852706909179688, -0.21392822265625, -0.19932937622070312, -0.18473052978515625, -0.17013168334960938, -0.1555328369140625, -0.14093399047851562, -0.12633514404296875, -0.11173629760742188, -0.097137451171875, -0.08253860473632812, -0.06793975830078125, -0.053340911865234375, -0.0387420654296875, -0.024143218994140625, -0.00954437255859375, 0.005054473876953125, 0.0196533203125, 0.034252166748046875, 0.04885101318359375, 0.06344985961914062, 0.0780487060546875, 0.09264755249023438, 0.10724639892578125, 0.12184524536132812, 0.136444091796875, 0.15104293823242188, 0.16564178466796875, 0.18024063110351562, 0.1948394775390625, 0.20943832397460938, 0.22403717041015625, 0.23863601684570312, 0.25323486328125, 0.2678337097167969, 0.28243255615234375, 0.2970314025878906, 0.3116302490234375, 0.3262290954589844, 0.34082794189453125, 0.3554267883300781, 0.370025634765625, 0.3846244812011719, 0.39922332763671875, 0.4138221740722656, 0.4284210205078125, 0.4430198669433594, 0.45761871337890625, 0.4722175598144531, 0.48681640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 10.0, 11.0, 11.0, 23.0, 29.0, 43.0, 34.0, 49.0, 78.0, 96.0, 175.0, 180.0, 235.0, 330.0, 495.0, 859.0, 1531.0, 3849.0, 17865.0, 186442.0, 759138.0, 62650.0, 8498.0, 2465.0, 1145.0, 636.0, 430.0, 306.0, 221.0, 199.0, 121.0, 98.0, 60.0, 66.0, 47.0, 33.0, 23.0, 21.0, 9.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.5869140625, -1.5406341552734375, -1.494354248046875, -1.4480743408203125, -1.40179443359375, -1.3555145263671875, -1.309234619140625, -1.2629547119140625, -1.2166748046875, -1.1703948974609375, -1.124114990234375, -1.0778350830078125, -1.03155517578125, -0.9852752685546875, -0.938995361328125, -0.8927154541015625, -0.846435546875, -0.8001556396484375, -0.753875732421875, -0.7075958251953125, -0.66131591796875, -0.6150360107421875, -0.568756103515625, -0.5224761962890625, -0.4761962890625, -0.4299163818359375, -0.383636474609375, -0.3373565673828125, -0.29107666015625, -0.2447967529296875, -0.198516845703125, -0.1522369384765625, -0.10595703125, -0.0596771240234375, -0.013397216796875, 0.0328826904296875, 0.07916259765625, 0.1254425048828125, 0.171722412109375, 0.2180023193359375, 0.2642822265625, 0.3105621337890625, 0.356842041015625, 0.4031219482421875, 0.44940185546875, 0.4956817626953125, 0.541961669921875, 0.5882415771484375, 0.634521484375, 0.6808013916015625, 0.727081298828125, 0.7733612060546875, 0.81964111328125, 0.8659210205078125, 0.912200927734375, 0.9584808349609375, 1.0047607421875, 1.0510406494140625, 1.097320556640625, 1.1436004638671875, 1.18988037109375, 1.2361602783203125, 1.282440185546875, 1.3287200927734375, 1.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 9.0, 14.0, 8.0, 12.0, 14.0, 25.0, 22.0, 25.0, 34.0, 39.0, 35.0, 47.0, 46.0, 59.0, 50.0, 52.0, 48.0, 41.0, 47.0, 48.0, 45.0, 35.0, 38.0, 24.0, 30.0, 25.0, 28.0, 13.0, 15.0, 12.0, 9.0, 13.0, 13.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.7963714599609375, -1.734344482421875, -1.6723175048828125, -1.61029052734375, -1.5482635498046875, -1.486236572265625, -1.4242095947265625, -1.3621826171875, -1.3001556396484375, -1.238128662109375, -1.1761016845703125, -1.11407470703125, -1.0520477294921875, -0.990020751953125, -0.9279937744140625, -0.865966796875, -0.8039398193359375, -0.741912841796875, -0.6798858642578125, -0.61785888671875, -0.5558319091796875, -0.493804931640625, -0.4317779541015625, -0.3697509765625, -0.3077239990234375, -0.245697021484375, -0.1836700439453125, -0.12164306640625, -0.0596160888671875, 0.002410888671875, 0.0644378662109375, 0.12646484375, 0.1884918212890625, 0.250518798828125, 0.3125457763671875, 0.37457275390625, 0.4365997314453125, 0.498626708984375, 0.5606536865234375, 0.6226806640625, 0.6847076416015625, 0.746734619140625, 0.8087615966796875, 0.87078857421875, 0.9328155517578125, 0.994842529296875, 1.0568695068359375, 1.118896484375, 1.1809234619140625, 1.242950439453125, 1.3049774169921875, 1.36700439453125, 1.4290313720703125, 1.491058349609375, 1.5530853271484375, 1.6151123046875, 1.6771392822265625, 1.739166259765625, 1.8011932373046875, 1.86322021484375, 1.9252471923828125, 1.987274169921875, 2.0493011474609375, 2.111328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 2.0, 5.0, 4.0, 12.0, 11.0, 16.0, 13.0, 16.0, 30.0, 41.0, 39.0, 43.0, 88.0, 143.0, 292.0, 637.0, 1965.0, 8620.0, 58315.0, 743280.0, 207648.0, 21294.0, 3999.0, 1066.0, 432.0, 183.0, 115.0, 64.0, 42.0, 27.0, 21.0, 15.0, 16.0, 12.0, 8.0, 13.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.459716796875, -0.4452400207519531, -0.43076324462890625, -0.4162864685058594, -0.4018096923828125, -0.3873329162597656, -0.37285614013671875, -0.3583793640136719, -0.343902587890625, -0.3294258117675781, -0.31494903564453125, -0.3004722595214844, -0.2859954833984375, -0.2715187072753906, -0.25704193115234375, -0.24256515502929688, -0.22808837890625, -0.21361160278320312, -0.19913482666015625, -0.18465805053710938, -0.1701812744140625, -0.15570449829101562, -0.14122772216796875, -0.12675094604492188, -0.112274169921875, -0.09779739379882812, -0.08332061767578125, -0.06884384155273438, -0.0543670654296875, -0.039890289306640625, -0.02541351318359375, -0.010936737060546875, 0.0035400390625, 0.018016815185546875, 0.03249359130859375, 0.046970367431640625, 0.0614471435546875, 0.07592391967773438, 0.09040069580078125, 0.10487747192382812, 0.119354248046875, 0.13383102416992188, 0.14830780029296875, 0.16278457641601562, 0.1772613525390625, 0.19173812866210938, 0.20621490478515625, 0.22069168090820312, 0.23516845703125, 0.24964523315429688, 0.26412200927734375, 0.2785987854003906, 0.2930755615234375, 0.3075523376464844, 0.32202911376953125, 0.3365058898925781, 0.350982666015625, 0.3654594421386719, 0.37993621826171875, 0.3944129943847656, 0.4088897705078125, 0.4233665466308594, 0.43784332275390625, 0.4523200988769531, 0.466796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 3.0, 4.0, 10.0, 6.0, 17.0, 20.0, 20.0, 25.0, 27.0, 47.0, 51.0, 88.0, 109.0, 99.0, 104.0, 71.0, 59.0, 58.0, 36.0, 18.0, 24.0, 14.0, 14.0, 16.0, 10.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.170438766479492e-05, -6.962940096855164e-05, -6.755441427230835e-05, -6.547942757606506e-05, -6.340444087982178e-05, -6.132945418357849e-05, -5.9254467487335205e-05, -5.717948079109192e-05, -5.510449409484863e-05, -5.302950739860535e-05, -5.095452070236206e-05, -4.8879534006118774e-05, -4.680454730987549e-05, -4.47295606136322e-05, -4.2654573917388916e-05, -4.057958722114563e-05, -3.8504600524902344e-05, -3.642961382865906e-05, -3.435462713241577e-05, -3.2279640436172485e-05, -3.02046537399292e-05, -2.8129667043685913e-05, -2.6054680347442627e-05, -2.397969365119934e-05, -2.1904706954956055e-05, -1.982972025871277e-05, -1.7754733562469482e-05, -1.5679746866226196e-05, -1.360476016998291e-05, -1.1529773473739624e-05, -9.454786777496338e-06, -7.379800081253052e-06, -5.304813385009766e-06, -3.2298266887664795e-06, -1.1548399925231934e-06, 9.201467037200928e-07, 2.995133399963379e-06, 5.070120096206665e-06, 7.145106792449951e-06, 9.220093488693237e-06, 1.1295080184936523e-05, 1.337006688117981e-05, 1.5445053577423096e-05, 1.7520040273666382e-05, 1.9595026969909668e-05, 2.1670013666152954e-05, 2.374500036239624e-05, 2.5819987058639526e-05, 2.7894973754882812e-05, 2.99699604511261e-05, 3.2044947147369385e-05, 3.411993384361267e-05, 3.619492053985596e-05, 3.826990723609924e-05, 4.034489393234253e-05, 4.2419880628585815e-05, 4.44948673248291e-05, 4.656985402107239e-05, 4.8644840717315674e-05, 5.071982741355896e-05, 5.2794814109802246e-05, 5.486980080604553e-05, 5.694478750228882e-05, 5.9019774198532104e-05, 6.109476089477539e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 10.0, 11.0, 21.0, 17.0, 40.0, 29.0, 77.0, 117.0, 142.0, 240.0, 456.0, 897.0, 2026.0, 6468.0, 37401.0, 492028.0, 460739.0, 37292.0, 6554.0, 2047.0, 852.0, 411.0, 240.0, 159.0, 88.0, 57.0, 37.0, 33.0, 14.0, 19.0, 6.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3359031677246094, -0.32390594482421875, -0.3119087219238281, -0.2999114990234375, -0.2879142761230469, -0.27591705322265625, -0.2639198303222656, -0.251922607421875, -0.23992538452148438, -0.22792816162109375, -0.21593093872070312, -0.2039337158203125, -0.19193649291992188, -0.17993927001953125, -0.16794204711914062, -0.15594482421875, -0.14394760131835938, -0.13195037841796875, -0.11995315551757812, -0.1079559326171875, -0.09595870971679688, -0.08396148681640625, -0.07196426391601562, -0.059967041015625, -0.047969818115234375, -0.03597259521484375, -0.023975372314453125, -0.0119781494140625, 1.9073486328125e-05, 0.01201629638671875, 0.024013519287109375, 0.0360107421875, 0.048007965087890625, 0.06000518798828125, 0.07200241088867188, 0.0839996337890625, 0.09599685668945312, 0.10799407958984375, 0.11999130249023438, 0.131988525390625, 0.14398574829101562, 0.15598297119140625, 0.16798019409179688, 0.1799774169921875, 0.19197463989257812, 0.20397186279296875, 0.21596908569335938, 0.22796630859375, 0.23996353149414062, 0.25196075439453125, 0.2639579772949219, 0.2759552001953125, 0.2879524230957031, 0.29994964599609375, 0.3119468688964844, 0.323944091796875, 0.3359413146972656, 0.34793853759765625, 0.3599357604980469, 0.3719329833984375, 0.3839302062988281, 0.39592742919921875, 0.4079246520996094, 0.419921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 10.0, 14.0, 15.0, 26.0, 27.0, 32.0, 43.0, 59.0, 81.0, 92.0, 89.0, 100.0, 91.0, 71.0, 61.0, 45.0, 34.0, 28.0, 23.0, 12.0, 11.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.34314727783203125, -0.3303375244140625, -0.31752777099609375, -0.304718017578125, -0.29190826416015625, -0.2790985107421875, -0.26628875732421875, -0.25347900390625, -0.24066925048828125, -0.2278594970703125, -0.21504974365234375, -0.202239990234375, -0.18943023681640625, -0.1766204833984375, -0.16381072998046875, -0.1510009765625, -0.13819122314453125, -0.1253814697265625, -0.11257171630859375, -0.099761962890625, -0.08695220947265625, -0.0741424560546875, -0.06133270263671875, -0.04852294921875, -0.03571319580078125, -0.0229034423828125, -0.01009368896484375, 0.002716064453125, 0.01552581787109375, 0.0283355712890625, 0.04114532470703125, 0.053955078125, 0.06676483154296875, 0.0795745849609375, 0.09238433837890625, 0.105194091796875, 0.11800384521484375, 0.1308135986328125, 0.14362335205078125, 0.15643310546875, 0.16924285888671875, 0.1820526123046875, 0.19486236572265625, 0.207672119140625, 0.22048187255859375, 0.2332916259765625, 0.24610137939453125, 0.2589111328125, 0.27172088623046875, 0.2845306396484375, 0.29734039306640625, 0.310150146484375, 0.32295989990234375, 0.3357696533203125, 0.34857940673828125, 0.36138916015625, 0.37419891357421875, 0.3870086669921875, 0.39981842041015625, 0.412628173828125, 0.42543792724609375, 0.4382476806640625, 0.45105743408203125, 0.4638671875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 13.0, 42.0, 78.0, 173.0, 301.0, 226.0, 81.0, 32.0, 14.0, 7.0, 7.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7344255447387695, -7.3654351234436035, -6.9964447021484375, -6.62745475769043, -6.2584638595581055, -5.889473915100098, -5.520483493804932, -5.151493072509766, -4.7825026512146, -4.413512229919434, -4.044521808624268, -3.6755316257476807, -3.3065412044525146, -2.9375507831573486, -2.5685606002807617, -2.1995701789855957, -1.8305797576904297, -1.4615893363952637, -1.0925990343093872, -0.7236087322235107, -0.3546183109283447, 0.014372110366821289, 0.3833622932434082, 0.7523527145385742, 1.1213431358337402, 1.4903335571289062, 1.8593238592147827, 2.228314161300659, 2.597304582595825, 2.966295003890991, 3.335285186767578, 3.704275608062744, 4.073266983032227, 4.442257404327393, 4.811247825622559, 5.180237770080566, 5.549228668212891, 5.918218612670898, 6.2872090339660645, 6.6561994552612305, 7.0251898765563965, 7.3941802978515625, 7.7631707191467285, 8.132161140441895, 8.501151084899902, 8.870141983032227, 9.239131927490234, 9.608121871948242, 9.977112770080566, 10.346102714538574, 10.715093612670898, 11.084083557128906, 11.45307445526123, 11.822064399719238, 12.191055297851562, 12.56004524230957, 12.929035186767578, 13.298025131225586, 13.66701602935791, 14.036005973815918, 14.404996871948242, 14.77398681640625, 15.142976760864258, 15.511967658996582, 15.880958557128906]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 10.0, 16.0, 15.0, 11.0, 23.0, 22.0, 26.0, 26.0, 28.0, 34.0, 40.0, 41.0, 47.0, 46.0, 65.0, 73.0, 65.0, 55.0, 52.0, 28.0, 33.0, 29.0, 26.0, 20.0, 33.0, 15.0, 15.0, 19.0, 16.0, 10.0, 11.0, 11.0, 3.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.341265678405762, -8.097949028015137, -7.854632377624512, -7.6113152503967285, -7.3679986000061035, -7.1246819496154785, -6.881364822387695, -6.63804817199707, -6.394731521606445, -6.15141487121582, -5.908098220825195, -5.664781093597412, -5.421464443206787, -5.178147792816162, -4.934830665588379, -4.691514015197754, -4.448197364807129, -4.204880714416504, -3.9615638256073, -3.7182469367980957, -3.4749302864074707, -3.2316136360168457, -2.9882967472076416, -2.7449798583984375, -2.5016632080078125, -2.2583465576171875, -2.0150296688079834, -1.7717128992080688, -1.5283961296081543, -1.2850793600082397, -1.0417625904083252, -0.7984458208084106, -0.5551290512084961, -0.31181228160858154, -0.06849551200866699, 0.17482125759124756, 0.4181380271911621, 0.6614547967910767, 0.9047715663909912, 1.1480883359909058, 1.3914051055908203, 1.6347218751907349, 1.8780386447906494, 2.1213555335998535, 2.3646721839904785, 2.6079888343811035, 2.8513057231903076, 3.0946226119995117, 3.3379392623901367, 3.5812559127807617, 3.824572801589966, 4.06788969039917, 4.311206340789795, 4.55452299118042, 4.797840118408203, 5.041156768798828, 5.284473419189453, 5.527790069580078, 5.771106719970703, 6.014423847198486, 6.257740497589111, 6.501057147979736, 6.7443742752075195, 6.9876909255981445, 7.2310075759887695]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 19.0, 18.0, 28.0, 35.0, 36.0, 43.0, 70.0, 101.0, 123.0, 194.0, 400.0, 808.0, 2169.0, 8523.0, 71374.0, 1097097.0, 2709357.0, 278177.0, 19229.0, 3719.0, 1276.0, 538.0, 269.0, 171.0, 126.0, 100.0, 62.0, 49.0, 34.0, 23.0, 14.0, 14.0, 21.0, 11.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6390304565429688, -0.6179046630859375, -0.5967788696289062, -0.575653076171875, -0.5545272827148438, -0.5334014892578125, -0.5122756958007812, -0.49114990234375, -0.47002410888671875, -0.4488983154296875, -0.42777252197265625, -0.406646728515625, -0.38552093505859375, -0.3643951416015625, -0.34326934814453125, -0.3221435546875, -0.30101776123046875, -0.2798919677734375, -0.25876617431640625, -0.237640380859375, -0.21651458740234375, -0.1953887939453125, -0.17426300048828125, -0.15313720703125, -0.13201141357421875, -0.1108856201171875, -0.08975982666015625, -0.068634033203125, -0.04750823974609375, -0.0263824462890625, -0.00525665283203125, 0.015869140625, 0.03699493408203125, 0.0581207275390625, 0.07924652099609375, 0.100372314453125, 0.12149810791015625, 0.1426239013671875, 0.16374969482421875, 0.18487548828125, 0.20600128173828125, 0.2271270751953125, 0.24825286865234375, 0.269378662109375, 0.29050445556640625, 0.3116302490234375, 0.33275604248046875, 0.3538818359375, 0.37500762939453125, 0.3961334228515625, 0.41725921630859375, 0.438385009765625, 0.45951080322265625, 0.4806365966796875, 0.5017623901367188, 0.52288818359375, 0.5440139770507812, 0.5651397705078125, 0.5862655639648438, 0.607391357421875, 0.6285171508789062, 0.6496429443359375, 0.6707687377929688, 0.69189453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 10.0, 11.0, 18.0, 13.0, 15.0, 25.0, 21.0, 22.0, 28.0, 26.0, 40.0, 36.0, 34.0, 26.0, 54.0, 40.0, 51.0, 45.0, 40.0, 48.0, 39.0, 40.0, 33.0, 29.0, 31.0, 30.0, 31.0, 19.0, 18.0, 14.0, 17.0, 13.0, 16.0, 15.0, 11.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3771018981933594, -0.36284637451171875, -0.3485908508300781, -0.3343353271484375, -0.3200798034667969, -0.30582427978515625, -0.2915687561035156, -0.277313232421875, -0.2630577087402344, -0.24880218505859375, -0.23454666137695312, -0.2202911376953125, -0.20603561401367188, -0.19178009033203125, -0.17752456665039062, -0.16326904296875, -0.14901351928710938, -0.13475799560546875, -0.12050247192382812, -0.1062469482421875, -0.09199142456054688, -0.07773590087890625, -0.06348037719726562, -0.049224853515625, -0.034969329833984375, -0.02071380615234375, -0.006458282470703125, 0.0077972412109375, 0.022052764892578125, 0.03630828857421875, 0.050563812255859375, 0.0648193359375, 0.07907485961914062, 0.09333038330078125, 0.10758590698242188, 0.1218414306640625, 0.13609695434570312, 0.15035247802734375, 0.16460800170898438, 0.178863525390625, 0.19311904907226562, 0.20737457275390625, 0.22163009643554688, 0.2358856201171875, 0.2501411437988281, 0.26439666748046875, 0.2786521911621094, 0.29290771484375, 0.3071632385253906, 0.32141876220703125, 0.3356742858886719, 0.3499298095703125, 0.3641853332519531, 0.37844085693359375, 0.3926963806152344, 0.406951904296875, 0.4212074279785156, 0.43546295166015625, 0.4497184753417969, 0.4639739990234375, 0.4782295227050781, 0.49248504638671875, 0.5067405700683594, 0.52099609375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 9.0, 5.0, 11.0, 18.0, 22.0, 18.0, 44.0, 55.0, 103.0, 149.0, 264.0, 488.0, 1053.0, 2622.0, 9676.0, 143861.0, 3963864.0, 62259.0, 6267.0, 1864.0, 767.0, 354.0, 188.0, 114.0, 87.0, 33.0, 26.0, 23.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1460418701171875, -1.102630615234375, -1.0592193603515625, -1.01580810546875, -0.9723968505859375, -0.928985595703125, -0.8855743408203125, -0.8421630859375, -0.7987518310546875, -0.755340576171875, -0.7119293212890625, -0.66851806640625, -0.6251068115234375, -0.581695556640625, -0.5382843017578125, -0.494873046875, -0.4514617919921875, -0.408050537109375, -0.3646392822265625, -0.32122802734375, -0.2778167724609375, -0.234405517578125, -0.1909942626953125, -0.1475830078125, -0.1041717529296875, -0.060760498046875, -0.0173492431640625, 0.02606201171875, 0.0694732666015625, 0.112884521484375, 0.1562957763671875, 0.19970703125, 0.2431182861328125, 0.286529541015625, 0.3299407958984375, 0.37335205078125, 0.4167633056640625, 0.460174560546875, 0.5035858154296875, 0.5469970703125, 0.5904083251953125, 0.633819580078125, 0.6772308349609375, 0.72064208984375, 0.7640533447265625, 0.807464599609375, 0.8508758544921875, 0.894287109375, 0.9376983642578125, 0.981109619140625, 1.0245208740234375, 1.06793212890625, 1.1113433837890625, 1.154754638671875, 1.1981658935546875, 1.2415771484375, 1.2849884033203125, 1.328399658203125, 1.3718109130859375, 1.41522216796875, 1.4586334228515625, 1.502044677734375, 1.5454559326171875, 1.5888671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 11.0, 26.0, 58.0, 145.0, 418.0, 1272.0, 1374.0, 460.0, 163.0, 50.0, 21.0, 16.0, 9.0, 11.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.0567169189453125, -2.004058837890625, -1.9514007568359375, -1.89874267578125, -1.8460845947265625, -1.793426513671875, -1.7407684326171875, -1.6881103515625, -1.6354522705078125, -1.582794189453125, -1.5301361083984375, -1.47747802734375, -1.4248199462890625, -1.372161865234375, -1.3195037841796875, -1.266845703125, -1.2141876220703125, -1.161529541015625, -1.1088714599609375, -1.05621337890625, -1.0035552978515625, -0.950897216796875, -0.8982391357421875, -0.8455810546875, -0.7929229736328125, -0.740264892578125, -0.6876068115234375, -0.63494873046875, -0.5822906494140625, -0.529632568359375, -0.4769744873046875, -0.42431640625, -0.3716583251953125, -0.319000244140625, -0.2663421630859375, -0.21368408203125, -0.1610260009765625, -0.108367919921875, -0.0557098388671875, -0.0030517578125, 0.0496063232421875, 0.102264404296875, 0.1549224853515625, 0.20758056640625, 0.2602386474609375, 0.312896728515625, 0.3655548095703125, 0.418212890625, 0.4708709716796875, 0.523529052734375, 0.5761871337890625, 0.62884521484375, 0.6815032958984375, 0.734161376953125, 0.7868194580078125, 0.8394775390625, 0.8921356201171875, 0.944793701171875, 0.9974517822265625, 1.05010986328125, 1.1027679443359375, 1.155426025390625, 1.2080841064453125, 1.2607421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 6.0, 8.0, 10.0, 35.0, 144.0, 420.0, 273.0, 64.0, 24.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.080427169799805, -19.587905883789062, -19.095382690429688, -18.602861404418945, -18.110340118408203, -17.617816925048828, -17.125295639038086, -16.632774353027344, -16.14025115966797, -15.64772891998291, -15.155207633972168, -14.66268539428711, -14.17016315460205, -13.677640914916992, -13.18511962890625, -12.692597389221191, -12.20007610321045, -11.70755386352539, -11.215032577514648, -10.72251033782959, -10.229988098144531, -9.737466812133789, -9.24494457244873, -8.752422332763672, -8.25990104675293, -7.767379283905029, -7.274857044219971, -6.78233528137207, -6.289813041687012, -5.797291278839111, -5.304769515991211, -4.812247276306152, -4.31972599029541, -3.8272039890289307, -3.334681987762451, -2.842160224914551, -2.3496382236480713, -1.8571162223815918, -1.3645944595336914, -0.8720724582672119, -0.3795504570007324, 0.1129714846611023, 0.605493426322937, 1.098015308380127, 1.5905373096466064, 2.083059310913086, 2.5755810737609863, 3.068103075027466, 3.5606250762939453, 4.053146839141846, 4.545669078826904, 5.038190841674805, 5.530713081359863, 6.023234844207764, 6.515756607055664, 7.008278846740723, 7.500800609588623, 7.993322372436523, 8.485844612121582, 8.97836685180664, 9.470888137817383, 9.963410377502441, 10.4559326171875, 10.948453903198242, 11.4409761428833]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 7.0, 11.0, 12.0, 20.0, 40.0, 47.0, 65.0, 78.0, 91.0, 85.0, 97.0, 90.0, 77.0, 66.0, 57.0, 46.0, 31.0, 29.0, 12.0, 15.0, 12.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962279319763184, -5.722749710083008, -5.483220100402832, -5.243690490722656, -5.0041608810424805, -4.764631271362305, -4.525101661682129, -4.285572052001953, -4.046042442321777, -3.8065128326416016, -3.566983222961426, -3.32745361328125, -3.087924003601074, -2.8483943939208984, -2.6088647842407227, -2.369335174560547, -2.129805564880371, -1.8902759552001953, -1.6507463455200195, -1.4112167358398438, -1.171687126159668, -0.9321575164794922, -0.6926279067993164, -0.4530982971191406, -0.21356868743896484, 0.025960922241210938, 0.2654905319213867, 0.5050201416015625, 0.7445497512817383, 0.9840793609619141, 1.2236089706420898, 1.4631385803222656, 1.7026681900024414, 1.9421977996826172, 2.181727409362793, 2.4212570190429688, 2.6607866287231445, 2.9003162384033203, 3.139845848083496, 3.379375457763672, 3.6189050674438477, 3.8584346771240234, 4.097964286804199, 4.337493896484375, 4.577023506164551, 4.816553115844727, 5.056082725524902, 5.295612335205078, 5.535141944885254, 5.77467155456543, 6.0142011642456055, 6.253730773925781, 6.493260383605957, 6.732789993286133, 6.972319602966309, 7.211849212646484, 7.45137882232666, 7.690908432006836, 7.930438041687012, 8.169967651367188, 8.409497261047363, 8.649026870727539, 8.888556480407715, 9.12808609008789, 9.367615699768066]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 14.0, 28.0, 46.0, 106.0, 214.0, 528.0, 1281.0, 3825.0, 13666.0, 59597.0, 303962.0, 508586.0, 121035.0, 25855.0, 6527.0, 2029.0, 725.0, 263.0, 117.0, 71.0, 30.0, 14.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.084320068359375, -1.05438232421875, -1.024444580078125, -0.9945068359375, -0.964569091796875, -0.93463134765625, -0.904693603515625, -0.874755859375, -0.844818115234375, -0.81488037109375, -0.784942626953125, -0.7550048828125, -0.725067138671875, -0.69512939453125, -0.665191650390625, -0.63525390625, -0.605316162109375, -0.57537841796875, -0.545440673828125, -0.5155029296875, -0.485565185546875, -0.45562744140625, -0.425689697265625, -0.395751953125, -0.365814208984375, -0.33587646484375, -0.305938720703125, -0.2760009765625, -0.246063232421875, -0.21612548828125, -0.186187744140625, -0.15625, -0.126312255859375, -0.09637451171875, -0.066436767578125, -0.0364990234375, -0.006561279296875, 0.02337646484375, 0.053314208984375, 0.083251953125, 0.113189697265625, 0.14312744140625, 0.173065185546875, 0.2030029296875, 0.232940673828125, 0.26287841796875, 0.292816162109375, 0.32275390625, 0.352691650390625, 0.38262939453125, 0.412567138671875, 0.4425048828125, 0.472442626953125, 0.50238037109375, 0.532318115234375, 0.562255859375, 0.592193603515625, 0.62213134765625, 0.652069091796875, 0.6820068359375, 0.711944580078125, 0.74188232421875, 0.771820068359375, 0.8017578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 9.0, 16.0, 15.0, 15.0, 10.0, 26.0, 20.0, 23.0, 23.0, 26.0, 30.0, 29.0, 27.0, 37.0, 36.0, 40.0, 46.0, 30.0, 50.0, 31.0, 47.0, 31.0, 23.0, 42.0, 24.0, 31.0, 34.0, 28.0, 33.0, 18.0, 21.0, 18.0, 21.0, 9.0, 17.0, 8.0, 6.0, 9.0, 5.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.3828125, -0.3694610595703125, -0.356109619140625, -0.3427581787109375, -0.32940673828125, -0.3160552978515625, -0.302703857421875, -0.2893524169921875, -0.2760009765625, -0.2626495361328125, -0.249298095703125, -0.2359466552734375, -0.22259521484375, -0.2092437744140625, -0.195892333984375, -0.1825408935546875, -0.169189453125, -0.1558380126953125, -0.142486572265625, -0.1291351318359375, -0.11578369140625, -0.1024322509765625, -0.089080810546875, -0.0757293701171875, -0.0623779296875, -0.0490264892578125, -0.035675048828125, -0.0223236083984375, -0.00897216796875, 0.0043792724609375, 0.017730712890625, 0.0310821533203125, 0.04443359375, 0.0577850341796875, 0.071136474609375, 0.0844879150390625, 0.09783935546875, 0.1111907958984375, 0.124542236328125, 0.1378936767578125, 0.1512451171875, 0.1645965576171875, 0.177947998046875, 0.1912994384765625, 0.20465087890625, 0.2180023193359375, 0.231353759765625, 0.2447052001953125, 0.258056640625, 0.2714080810546875, 0.284759521484375, 0.2981109619140625, 0.31146240234375, 0.3248138427734375, 0.338165283203125, 0.3515167236328125, 0.3648681640625, 0.3782196044921875, 0.391571044921875, 0.4049224853515625, 0.41827392578125, 0.4316253662109375, 0.444976806640625, 0.4583282470703125, 0.4716796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 7.0, 16.0, 8.0, 24.0, 31.0, 40.0, 47.0, 83.0, 102.0, 176.0, 358.0, 737.0, 1931.0, 7016.0, 40149.0, 328232.0, 600616.0, 55741.0, 9048.0, 2290.0, 869.0, 391.0, 217.0, 111.0, 80.0, 54.0, 51.0, 26.0, 24.0, 18.0, 12.0, 10.0, 6.0, 3.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1337890625, -1.096099853515625, -1.05841064453125, -1.020721435546875, -0.9830322265625, -0.945343017578125, -0.90765380859375, -0.869964599609375, -0.832275390625, -0.794586181640625, -0.75689697265625, -0.719207763671875, -0.6815185546875, -0.643829345703125, -0.60614013671875, -0.568450927734375, -0.53076171875, -0.493072509765625, -0.45538330078125, -0.417694091796875, -0.3800048828125, -0.342315673828125, -0.30462646484375, -0.266937255859375, -0.229248046875, -0.191558837890625, -0.15386962890625, -0.116180419921875, -0.0784912109375, -0.040802001953125, -0.00311279296875, 0.034576416015625, 0.072265625, 0.109954833984375, 0.14764404296875, 0.185333251953125, 0.2230224609375, 0.260711669921875, 0.29840087890625, 0.336090087890625, 0.373779296875, 0.411468505859375, 0.44915771484375, 0.486846923828125, 0.5245361328125, 0.562225341796875, 0.59991455078125, 0.637603759765625, 0.67529296875, 0.712982177734375, 0.75067138671875, 0.788360595703125, 0.8260498046875, 0.863739013671875, 0.90142822265625, 0.939117431640625, 0.976806640625, 1.014495849609375, 1.05218505859375, 1.089874267578125, 1.1275634765625, 1.165252685546875, 1.20294189453125, 1.240631103515625, 1.2783203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 12.0, 13.0, 15.0, 9.0, 22.0, 23.0, 23.0, 27.0, 39.0, 34.0, 34.0, 53.0, 50.0, 60.0, 48.0, 56.0, 53.0, 46.0, 50.0, 54.0, 45.0, 33.0, 40.0, 31.0, 30.0, 22.0, 14.0, 19.0, 17.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.083984375, -2.0233154296875, -1.962646484375, -1.9019775390625, -1.84130859375, -1.7806396484375, -1.719970703125, -1.6593017578125, -1.5986328125, -1.5379638671875, -1.477294921875, -1.4166259765625, -1.35595703125, -1.2952880859375, -1.234619140625, -1.1739501953125, -1.11328125, -1.0526123046875, -0.991943359375, -0.9312744140625, -0.87060546875, -0.8099365234375, -0.749267578125, -0.6885986328125, -0.6279296875, -0.5672607421875, -0.506591796875, -0.4459228515625, -0.38525390625, -0.3245849609375, -0.263916015625, -0.2032470703125, -0.142578125, -0.0819091796875, -0.021240234375, 0.0394287109375, 0.10009765625, 0.1607666015625, 0.221435546875, 0.2821044921875, 0.3427734375, 0.4034423828125, 0.464111328125, 0.5247802734375, 0.58544921875, 0.6461181640625, 0.706787109375, 0.7674560546875, 0.828125, 0.8887939453125, 0.949462890625, 1.0101318359375, 1.07080078125, 1.1314697265625, 1.192138671875, 1.2528076171875, 1.3134765625, 1.3741455078125, 1.434814453125, 1.4954833984375, 1.55615234375, 1.6168212890625, 1.677490234375, 1.7381591796875, 1.798828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 17.0, 14.0, 32.0, 56.0, 83.0, 126.0, 286.0, 619.0, 1453.0, 4329.0, 14142.0, 58389.0, 304283.0, 562238.0, 76062.0, 18111.0, 5190.0, 1726.0, 643.0, 336.0, 159.0, 97.0, 56.0, 37.0, 23.0, 13.0, 6.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.281005859375, -0.2729969024658203, -0.2649879455566406, -0.25697898864746094, -0.24897003173828125, -0.24096107482910156, -0.23295211791992188, -0.2249431610107422, -0.2169342041015625, -0.2089252471923828, -0.20091629028320312, -0.19290733337402344, -0.18489837646484375, -0.17688941955566406, -0.16888046264648438, -0.1608715057373047, -0.152862548828125, -0.1448535919189453, -0.13684463500976562, -0.12883567810058594, -0.12082672119140625, -0.11281776428222656, -0.10480880737304688, -0.09679985046386719, -0.0887908935546875, -0.08078193664550781, -0.07277297973632812, -0.06476402282714844, -0.05675506591796875, -0.04874610900878906, -0.040737152099609375, -0.03272819519042969, -0.02471923828125, -0.016710281372070312, -0.008701324462890625, -0.0006923675537109375, 0.00731658935546875, 0.015325546264648438, 0.023334503173828125, 0.03134346008300781, 0.0393524169921875, 0.04736137390136719, 0.055370330810546875, 0.06337928771972656, 0.07138824462890625, 0.07939720153808594, 0.08740615844726562, 0.09541511535644531, 0.103424072265625, 0.11143302917480469, 0.11944198608398438, 0.12745094299316406, 0.13545989990234375, 0.14346885681152344, 0.15147781372070312, 0.1594867706298828, 0.1674957275390625, 0.1755046844482422, 0.18351364135742188, 0.19152259826660156, 0.19953155517578125, 0.20754051208496094, 0.21554946899414062, 0.2235584259033203, 0.2315673828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 11.0, 13.0, 30.0, 23.0, 42.0, 36.0, 71.0, 72.0, 79.0, 132.0, 75.0, 74.0, 70.0, 62.0, 49.0, 28.0, 20.0, 23.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.258487701416016e-05, -6.08246773481369e-05, -5.906447768211365e-05, -5.730427801609039e-05, -5.554407835006714e-05, -5.3783878684043884e-05, -5.202367901802063e-05, -5.0263479351997375e-05, -4.850327968597412e-05, -4.674308001995087e-05, -4.498288035392761e-05, -4.322268068790436e-05, -4.1462481021881104e-05, -3.970228135585785e-05, -3.7942081689834595e-05, -3.618188202381134e-05, -3.4421682357788086e-05, -3.266148269176483e-05, -3.090128302574158e-05, -2.9141083359718323e-05, -2.738088369369507e-05, -2.5620684027671814e-05, -2.386048436164856e-05, -2.2100284695625305e-05, -2.034008502960205e-05, -1.8579885363578796e-05, -1.6819685697555542e-05, -1.5059486031532288e-05, -1.3299286365509033e-05, -1.1539086699485779e-05, -9.778887033462524e-06, -8.01868736743927e-06, -6.258487701416016e-06, -4.498288035392761e-06, -2.738088369369507e-06, -9.778887033462524e-07, 7.82310962677002e-07, 2.5425106287002563e-06, 4.302710294723511e-06, 6.062909960746765e-06, 7.82310962677002e-06, 9.583309292793274e-06, 1.1343508958816528e-05, 1.3103708624839783e-05, 1.4863908290863037e-05, 1.662410795688629e-05, 1.8384307622909546e-05, 2.01445072889328e-05, 2.1904706954956055e-05, 2.366490662097931e-05, 2.5425106287002563e-05, 2.7185305953025818e-05, 2.8945505619049072e-05, 3.070570528507233e-05, 3.246590495109558e-05, 3.4226104617118835e-05, 3.598630428314209e-05, 3.7746503949165344e-05, 3.95067036151886e-05, 4.126690328121185e-05, 4.302710294723511e-05, 4.478730261325836e-05, 4.6547502279281616e-05, 4.830770194530487e-05, 5.0067901611328125e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 10.0, 26.0, 35.0, 66.0, 158.0, 506.0, 3228.0, 89074.0, 924128.0, 29080.0, 1672.0, 331.0, 108.0, 69.0, 36.0, 13.0, 10.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7111053466796875, -0.689788818359375, -0.6684722900390625, -0.64715576171875, -0.6258392333984375, -0.604522705078125, -0.5832061767578125, -0.5618896484375, -0.5405731201171875, -0.519256591796875, -0.4979400634765625, -0.47662353515625, -0.4553070068359375, -0.433990478515625, -0.4126739501953125, -0.391357421875, -0.3700408935546875, -0.348724365234375, -0.3274078369140625, -0.30609130859375, -0.2847747802734375, -0.263458251953125, -0.2421417236328125, -0.2208251953125, -0.1995086669921875, -0.178192138671875, -0.1568756103515625, -0.13555908203125, -0.1142425537109375, -0.092926025390625, -0.0716094970703125, -0.05029296875, -0.0289764404296875, -0.007659912109375, 0.0136566162109375, 0.03497314453125, 0.0562896728515625, 0.077606201171875, 0.0989227294921875, 0.1202392578125, 0.1415557861328125, 0.162872314453125, 0.1841888427734375, 0.20550537109375, 0.2268218994140625, 0.248138427734375, 0.2694549560546875, 0.290771484375, 0.3120880126953125, 0.333404541015625, 0.3547210693359375, 0.37603759765625, 0.3973541259765625, 0.418670654296875, 0.4399871826171875, 0.4613037109375, 0.4826202392578125, 0.503936767578125, 0.5252532958984375, 0.54656982421875, 0.5678863525390625, 0.589202880859375, 0.6105194091796875, 0.6318359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 7.0, 16.0, 9.0, 13.0, 19.0, 17.0, 32.0, 27.0, 42.0, 47.0, 60.0, 67.0, 60.0, 73.0, 67.0, 65.0, 58.0, 53.0, 44.0, 38.0, 44.0, 22.0, 21.0, 13.0, 17.0, 9.0, 9.0, 7.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2021484375, -0.1951141357421875, -0.188079833984375, -0.1810455322265625, -0.17401123046875, -0.1669769287109375, -0.159942626953125, -0.1529083251953125, -0.1458740234375, -0.1388397216796875, -0.131805419921875, -0.1247711181640625, -0.11773681640625, -0.1107025146484375, -0.103668212890625, -0.0966339111328125, -0.089599609375, -0.0825653076171875, -0.075531005859375, -0.0684967041015625, -0.06146240234375, -0.0544281005859375, -0.047393798828125, -0.0403594970703125, -0.0333251953125, -0.0262908935546875, -0.019256591796875, -0.0122222900390625, -0.00518798828125, 0.0018463134765625, 0.008880615234375, 0.0159149169921875, 0.02294921875, 0.0299835205078125, 0.037017822265625, 0.0440521240234375, 0.05108642578125, 0.0581207275390625, 0.065155029296875, 0.0721893310546875, 0.0792236328125, 0.0862579345703125, 0.093292236328125, 0.1003265380859375, 0.10736083984375, 0.1143951416015625, 0.121429443359375, 0.1284637451171875, 0.135498046875, 0.1425323486328125, 0.149566650390625, 0.1566009521484375, 0.16363525390625, 0.1706695556640625, 0.177703857421875, 0.1847381591796875, 0.1917724609375, 0.1988067626953125, 0.205841064453125, 0.2128753662109375, 0.21990966796875, 0.2269439697265625, 0.233978271484375, 0.2410125732421875, 0.248046875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 9.0, 14.0, 30.0, 36.0, 72.0, 125.0, 201.0, 306.0, 95.0, 49.0, 27.0, 10.0, 9.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.560540199279785, -8.295269012451172, -8.029998779296875, -7.764727592468262, -7.499456405639648, -7.234185695648193, -6.968914985656738, -6.703643798828125, -6.43837308883667, -6.173102378845215, -5.907831192016602, -5.6425604820251465, -5.377289772033691, -5.112018585205078, -4.846747875213623, -4.581477165222168, -4.316205978393555, -4.0509352684021, -3.7856640815734863, -3.5203933715820312, -3.255122423171997, -2.989851474761963, -2.724580764770508, -2.4593098163604736, -2.1940388679504395, -1.9287679195404053, -1.6634970903396606, -1.398226261138916, -1.1329553127288818, -0.8676843643188477, -0.602413535118103, -0.3371427059173584, -0.07187080383300781, 0.1934000849723816, 0.458670973777771, 0.7239418625831604, 0.9892127513885498, 1.254483699798584, 1.5197545289993286, 1.7850253582000732, 2.0502963066101074, 2.3155672550201416, 2.580838203430176, 2.846108913421631, 3.111379861831665, 3.376650810241699, 3.6419215202331543, 3.9071924686431885, 4.172463417053223, 4.437734127044678, 4.703005313873291, 4.968276023864746, 5.233547210693359, 5.4988179206848145, 5.7640886306762695, 6.029359817504883, 6.294630527496338, 6.559901237487793, 6.825172424316406, 7.090443134307861, 7.355713844299316, 7.62098503112793, 7.886255741119385, 8.15152645111084, 8.416797637939453]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 7.0, 5.0, 6.0, 7.0, 13.0, 17.0, 20.0, 17.0, 20.0, 30.0, 30.0, 32.0, 34.0, 29.0, 57.0, 54.0, 57.0, 85.0, 67.0, 50.0, 51.0, 46.0, 38.0, 23.0, 33.0, 28.0, 17.0, 16.0, 18.0, 11.0, 11.0, 12.0, 9.0, 5.0, 11.0, 2.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312359809875488, -6.098534107208252, -5.884708404541016, -5.670882701873779, -5.457056999206543, -5.243231296539307, -5.02940559387207, -4.815579891204834, -4.601754188537598, -4.387928485870361, -4.174102783203125, -3.9602770805358887, -3.7464513778686523, -3.532625675201416, -3.3187999725341797, -3.1049742698669434, -2.891148567199707, -2.6773228645324707, -2.4634971618652344, -2.249671459197998, -2.0358457565307617, -1.8220200538635254, -1.608194351196289, -1.3943686485290527, -1.1805429458618164, -0.9667172431945801, -0.7528915405273438, -0.5390658378601074, -0.3252401351928711, -0.11141443252563477, 0.10241127014160156, 0.3162369728088379, 0.530062198638916, 0.7438879013061523, 0.9577136039733887, 1.171539306640625, 1.3853650093078613, 1.5991907119750977, 1.813016414642334, 2.0268421173095703, 2.2406678199768066, 2.454493522644043, 2.6683192253112793, 2.8821449279785156, 3.095970630645752, 3.3097963333129883, 3.5236220359802246, 3.737447738647461, 3.9512734413146973, 4.165099143981934, 4.37892484664917, 4.592750549316406, 4.806576251983643, 5.020401954650879, 5.234227657318115, 5.448053359985352, 5.661879062652588, 5.875704765319824, 6.0895304679870605, 6.303356170654297, 6.517181873321533, 6.7310075759887695, 6.944833278656006, 7.158658981323242, 7.3724846839904785]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 14.0, 7.0, 19.0, 32.0, 42.0, 52.0, 116.0, 140.0, 245.0, 369.0, 598.0, 1083.0, 2269.0, 6542.0, 23680.0, 116640.0, 562173.0, 1814739.0, 1276845.0, 309030.0, 59079.0, 12233.0, 4145.0, 1952.0, 860.0, 497.0, 287.0, 204.0, 127.0, 84.0, 54.0, 34.0, 29.0, 16.0, 14.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.34287261962890625, -0.3317413330078125, -0.32061004638671875, -0.309478759765625, -0.29834747314453125, -0.2872161865234375, -0.27608489990234375, -0.26495361328125, -0.25382232666015625, -0.2426910400390625, -0.23155975341796875, -0.220428466796875, -0.20929718017578125, -0.1981658935546875, -0.18703460693359375, -0.1759033203125, -0.16477203369140625, -0.1536407470703125, -0.14250946044921875, -0.131378173828125, -0.12024688720703125, -0.1091156005859375, -0.09798431396484375, -0.08685302734375, -0.07572174072265625, -0.0645904541015625, -0.05345916748046875, -0.042327880859375, -0.03119659423828125, -0.0200653076171875, -0.00893402099609375, 0.002197265625, 0.01332855224609375, 0.0244598388671875, 0.03559112548828125, 0.046722412109375, 0.05785369873046875, 0.0689849853515625, 0.08011627197265625, 0.09124755859375, 0.10237884521484375, 0.1135101318359375, 0.12464141845703125, 0.135772705078125, 0.14690399169921875, 0.1580352783203125, 0.16916656494140625, 0.1802978515625, 0.19142913818359375, 0.2025604248046875, 0.21369171142578125, 0.224822998046875, 0.23595428466796875, 0.2470855712890625, 0.25821685791015625, 0.26934814453125, 0.28047943115234375, 0.2916107177734375, 0.30274200439453125, 0.313873291015625, 0.32500457763671875, 0.3361358642578125, 0.34726715087890625, 0.3583984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 5.0, 7.0, 14.0, 19.0, 13.0, 22.0, 20.0, 30.0, 37.0, 40.0, 34.0, 38.0, 42.0, 60.0, 61.0, 39.0, 56.0, 48.0, 46.0, 40.0, 43.0, 37.0, 37.0, 50.0, 30.0, 22.0, 22.0, 18.0, 17.0, 15.0, 5.0, 10.0, 7.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5664520263671875, -0.550384521484375, -0.5343170166015625, -0.51824951171875, -0.5021820068359375, -0.486114501953125, -0.4700469970703125, -0.4539794921875, -0.4379119873046875, -0.421844482421875, -0.4057769775390625, -0.38970947265625, -0.3736419677734375, -0.357574462890625, -0.3415069580078125, -0.325439453125, -0.3093719482421875, -0.293304443359375, -0.2772369384765625, -0.26116943359375, -0.2451019287109375, -0.229034423828125, -0.2129669189453125, -0.1968994140625, -0.1808319091796875, -0.164764404296875, -0.1486968994140625, -0.13262939453125, -0.1165618896484375, -0.100494384765625, -0.0844268798828125, -0.068359375, -0.0522918701171875, -0.036224365234375, -0.0201568603515625, -0.00408935546875, 0.0119781494140625, 0.028045654296875, 0.0441131591796875, 0.0601806640625, 0.0762481689453125, 0.092315673828125, 0.1083831787109375, 0.12445068359375, 0.1405181884765625, 0.156585693359375, 0.1726531982421875, 0.188720703125, 0.2047882080078125, 0.220855712890625, 0.2369232177734375, 0.25299072265625, 0.2690582275390625, 0.285125732421875, 0.3011932373046875, 0.3172607421875, 0.3333282470703125, 0.349395751953125, 0.3654632568359375, 0.38153076171875, 0.3975982666015625, 0.413665771484375, 0.4297332763671875, 0.44580078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 0.0, 9.0, 5.0, 10.0, 5.0, 12.0, 17.0, 23.0, 39.0, 64.0, 100.0, 193.0, 403.0, 962.0, 3021.0, 12289.0, 127110.0, 3441023.0, 572376.0, 28527.0, 5197.0, 1633.0, 625.0, 243.0, 129.0, 91.0, 44.0, 35.0, 29.0, 17.0, 10.0, 8.0, 6.0, 2.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.76806640625, -0.7445831298828125, -0.721099853515625, -0.6976165771484375, -0.67413330078125, -0.6506500244140625, -0.627166748046875, -0.6036834716796875, -0.5802001953125, -0.5567169189453125, -0.533233642578125, -0.5097503662109375, -0.48626708984375, -0.4627838134765625, -0.439300537109375, -0.4158172607421875, -0.392333984375, -0.3688507080078125, -0.345367431640625, -0.3218841552734375, -0.29840087890625, -0.2749176025390625, -0.251434326171875, -0.2279510498046875, -0.2044677734375, -0.1809844970703125, -0.157501220703125, -0.1340179443359375, -0.11053466796875, -0.0870513916015625, -0.063568115234375, -0.0400848388671875, -0.0166015625, 0.0068817138671875, 0.030364990234375, 0.0538482666015625, 0.07733154296875, 0.1008148193359375, 0.124298095703125, 0.1477813720703125, 0.1712646484375, 0.1947479248046875, 0.218231201171875, 0.2417144775390625, 0.26519775390625, 0.2886810302734375, 0.312164306640625, 0.3356475830078125, 0.359130859375, 0.3826141357421875, 0.406097412109375, 0.4295806884765625, 0.45306396484375, 0.4765472412109375, 0.500030517578125, 0.5235137939453125, 0.5469970703125, 0.5704803466796875, 0.593963623046875, 0.6174468994140625, 0.64093017578125, 0.6644134521484375, 0.687896728515625, 0.7113800048828125, 0.73486328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 6.0, 14.0, 15.0, 23.0, 32.0, 58.0, 73.0, 141.0, 229.0, 382.0, 558.0, 675.0, 590.0, 467.0, 293.0, 170.0, 119.0, 61.0, 40.0, 40.0, 26.0, 15.0, 7.0, 9.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6207656860351562, -0.5999298095703125, -0.5790939331054688, -0.558258056640625, -0.5374221801757812, -0.5165863037109375, -0.49575042724609375, -0.47491455078125, -0.45407867431640625, -0.4332427978515625, -0.41240692138671875, -0.391571044921875, -0.37073516845703125, -0.3498992919921875, -0.32906341552734375, -0.3082275390625, -0.28739166259765625, -0.2665557861328125, -0.24571990966796875, -0.224884033203125, -0.20404815673828125, -0.1832122802734375, -0.16237640380859375, -0.14154052734375, -0.12070465087890625, -0.0998687744140625, -0.07903289794921875, -0.058197021484375, -0.03736114501953125, -0.0165252685546875, 0.00431060791015625, 0.025146484375, 0.04598236083984375, 0.0668182373046875, 0.08765411376953125, 0.108489990234375, 0.12932586669921875, 0.1501617431640625, 0.17099761962890625, 0.19183349609375, 0.21266937255859375, 0.2335052490234375, 0.25434112548828125, 0.275177001953125, 0.29601287841796875, 0.3168487548828125, 0.33768463134765625, 0.3585205078125, 0.37935638427734375, 0.4001922607421875, 0.42102813720703125, 0.441864013671875, 0.46269989013671875, 0.4835357666015625, 0.5043716430664062, 0.52520751953125, 0.5460433959960938, 0.5668792724609375, 0.5877151489257812, 0.608551025390625, 0.6293869018554688, 0.6502227783203125, 0.6710586547851562, 0.69189453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 16.0, 29.0, 113.0, 247.0, 304.0, 189.0, 52.0, 23.0, 13.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.395692825317383, -4.126665115356445, -3.857637405395508, -3.588609457015991, -3.3195817470550537, -3.050554037094116, -2.7815260887145996, -2.512498378753662, -2.2434706687927246, -1.974442958831787, -1.70541512966156, -1.436387300491333, -1.1673595905303955, -0.898331880569458, -0.629304051399231, -0.3602762222290039, -0.0912485122680664, 0.17777925729751587, 0.44680702686309814, 0.7158347964286804, 0.9848625659942627, 1.2538902759552002, 1.5229181051254272, 1.7919459342956543, 2.060973644256592, 2.3300013542175293, 2.599029064178467, 2.8680570125579834, 3.137084722518921, 3.4061124324798584, 3.675140380859375, 3.9441680908203125, 4.21319580078125, 4.4822235107421875, 4.751251220703125, 5.0202789306640625, 5.289306640625, 5.5583343505859375, 5.827362537384033, 6.096390247344971, 6.365417957305908, 6.634445667266846, 6.903473377227783, 7.172501087188721, 7.441529273986816, 7.710556983947754, 7.979584693908691, 8.248612403869629, 8.517640113830566, 8.786667823791504, 9.055695533752441, 9.324723243713379, 9.593750953674316, 9.862778663635254, 10.131806373596191, 10.400835037231445, 10.669862747192383, 10.93889045715332, 11.207918167114258, 11.476945877075195, 11.745973587036133, 12.01500129699707, 12.284029006958008, 12.553056716918945, 12.822084426879883]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 1.0, 5.0, 7.0, 7.0, 10.0, 17.0, 12.0, 18.0, 31.0, 15.0, 32.0, 28.0, 36.0, 37.0, 41.0, 41.0, 46.0, 44.0, 51.0, 66.0, 55.0, 48.0, 41.0, 35.0, 37.0, 34.0, 30.0, 25.0, 19.0, 20.0, 20.0, 19.0, 16.0, 13.0, 8.0, 4.0, 4.0, 3.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.714219331741333, -2.6280808448791504, -2.541942596435547, -2.4558041095733643, -2.3696658611297607, -2.283527374267578, -2.1973891258239746, -2.111250638961792, -2.0251121520996094, -1.9389737844467163, -1.8528354167938232, -1.7666969299316406, -1.680558681488037, -1.5944201946258545, -1.5082818269729614, -1.4221434593200684, -1.3360052108764648, -1.2498668432235718, -1.1637284755706787, -1.077589988708496, -0.9914516806602478, -0.9053133130073547, -0.8191748857498169, -0.7330365180969238, -0.6468981504440308, -0.5607597827911377, -0.47462138533592224, -0.3884829878807068, -0.3023446202278137, -0.21620625257492065, -0.1300678253173828, -0.043929457664489746, 0.04220890998840332, 0.12834729254245758, 0.21448567509651184, 0.3006240725517273, 0.38676244020462036, 0.4729008078575134, 0.5590392351150513, 0.6451776027679443, 0.7313159704208374, 0.8174543380737305, 0.9035927057266235, 0.9897311329841614, 1.0758695602416992, 1.1620078086853027, 1.2481462955474854, 1.3342846632003784, 1.4204230308532715, 1.5065613985061646, 1.5926997661590576, 1.6788382530212402, 1.7649765014648438, 1.8511149883270264, 1.9372533559799194, 2.0233917236328125, 2.109529972076416, 2.1956684589385986, 2.281806707382202, 2.3679451942443848, 2.4540834426879883, 2.540221929550171, 2.6263604164123535, 2.712498664855957, 2.7986371517181396]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 6.0, 18.0, 17.0, 44.0, 62.0, 97.0, 206.0, 432.0, 914.0, 1990.0, 4855.0, 12775.0, 38663.0, 130894.0, 418232.0, 308475.0, 87977.0, 27037.0, 9187.0, 3686.0, 1584.0, 689.0, 324.0, 165.0, 105.0, 47.0, 32.0, 19.0, 16.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455810546875, -0.4358558654785156, -0.41590118408203125, -0.3959465026855469, -0.3759918212890625, -0.3560371398925781, -0.33608245849609375, -0.3161277770996094, -0.296173095703125, -0.2762184143066406, -0.25626373291015625, -0.23630905151367188, -0.2163543701171875, -0.19639968872070312, -0.17644500732421875, -0.15649032592773438, -0.13653564453125, -0.11658096313476562, -0.09662628173828125, -0.07667160034179688, -0.0567169189453125, -0.036762237548828125, -0.01680755615234375, 0.003147125244140625, 0.023101806640625, 0.043056488037109375, 0.06301116943359375, 0.08296585083007812, 0.1029205322265625, 0.12287521362304688, 0.14282989501953125, 0.16278457641601562, 0.1827392578125, 0.20269393920898438, 0.22264862060546875, 0.24260330200195312, 0.2625579833984375, 0.2825126647949219, 0.30246734619140625, 0.3224220275878906, 0.342376708984375, 0.3623313903808594, 0.38228607177734375, 0.4022407531738281, 0.4221954345703125, 0.4421501159667969, 0.46210479736328125, 0.4820594787597656, 0.50201416015625, 0.5219688415527344, 0.5419235229492188, 0.5618782043457031, 0.5818328857421875, 0.6017875671386719, 0.6217422485351562, 0.6416969299316406, 0.661651611328125, 0.6816062927246094, 0.7015609741210938, 0.7215156555175781, 0.7414703369140625, 0.7614250183105469, 0.7813796997070312, 0.8013343811035156, 0.8212890625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 5.0, 5.0, 4.0, 7.0, 6.0, 18.0, 10.0, 15.0, 9.0, 20.0, 26.0, 31.0, 30.0, 38.0, 43.0, 36.0, 48.0, 52.0, 48.0, 36.0, 46.0, 56.0, 36.0, 41.0, 41.0, 38.0, 40.0, 41.0, 27.0, 34.0, 14.0, 20.0, 17.0, 11.0, 18.0, 10.0, 5.0, 2.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5068359375, -0.4920310974121094, -0.47722625732421875, -0.4624214172363281, -0.4476165771484375, -0.4328117370605469, -0.41800689697265625, -0.4032020568847656, -0.388397216796875, -0.3735923767089844, -0.35878753662109375, -0.3439826965332031, -0.3291778564453125, -0.3143730163574219, -0.29956817626953125, -0.2847633361816406, -0.26995849609375, -0.2551536560058594, -0.24034881591796875, -0.22554397583007812, -0.2107391357421875, -0.19593429565429688, -0.18112945556640625, -0.16632461547851562, -0.151519775390625, -0.13671493530273438, -0.12191009521484375, -0.10710525512695312, -0.0923004150390625, -0.07749557495117188, -0.06269073486328125, -0.047885894775390625, -0.0330810546875, -0.018276214599609375, -0.00347137451171875, 0.011333465576171875, 0.0261383056640625, 0.040943145751953125, 0.05574798583984375, 0.07055282592773438, 0.085357666015625, 0.10016250610351562, 0.11496734619140625, 0.12977218627929688, 0.1445770263671875, 0.15938186645507812, 0.17418670654296875, 0.18899154663085938, 0.20379638671875, 0.21860122680664062, 0.23340606689453125, 0.24821090698242188, 0.2630157470703125, 0.2778205871582031, 0.29262542724609375, 0.3074302673339844, 0.322235107421875, 0.3370399475097656, 0.35184478759765625, 0.3666496276855469, 0.3814544677734375, 0.3962593078613281, 0.41106414794921875, 0.4258689880371094, 0.440673828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 11.0, 13.0, 22.0, 22.0, 29.0, 48.0, 71.0, 71.0, 124.0, 149.0, 170.0, 277.0, 421.0, 707.0, 1451.0, 3526.0, 12551.0, 63570.0, 674415.0, 243810.0, 34087.0, 7702.0, 2477.0, 1047.0, 535.0, 335.0, 246.0, 165.0, 133.0, 97.0, 47.0, 48.0, 28.0, 22.0, 23.0, 19.0, 17.0, 12.0, 3.0, 10.0, 10.0, 5.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0329360961914062, -1.0023956298828125, -0.9718551635742188, -0.941314697265625, -0.9107742309570312, -0.8802337646484375, -0.8496932983398438, -0.81915283203125, -0.7886123657226562, -0.7580718994140625, -0.7275314331054688, -0.696990966796875, -0.6664505004882812, -0.6359100341796875, -0.6053695678710938, -0.5748291015625, -0.5442886352539062, -0.5137481689453125, -0.48320770263671875, -0.452667236328125, -0.42212677001953125, -0.3915863037109375, -0.36104583740234375, -0.33050537109375, -0.29996490478515625, -0.2694244384765625, -0.23888397216796875, -0.208343505859375, -0.17780303955078125, -0.1472625732421875, -0.11672210693359375, -0.086181640625, -0.05564117431640625, -0.0251007080078125, 0.00543975830078125, 0.035980224609375, 0.06652069091796875, 0.0970611572265625, 0.12760162353515625, 0.15814208984375, 0.18868255615234375, 0.2192230224609375, 0.24976348876953125, 0.280303955078125, 0.31084442138671875, 0.3413848876953125, 0.37192535400390625, 0.4024658203125, 0.43300628662109375, 0.4635467529296875, 0.49408721923828125, 0.524627685546875, 0.5551681518554688, 0.5857086181640625, 0.6162490844726562, 0.64678955078125, 0.6773300170898438, 0.7078704833984375, 0.7384109497070312, 0.768951416015625, 0.7994918823242188, 0.8300323486328125, 0.8605728149414062, 0.89111328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 10.0, 11.0, 17.0, 18.0, 20.0, 22.0, 23.0, 36.0, 35.0, 33.0, 55.0, 37.0, 52.0, 40.0, 61.0, 63.0, 54.0, 47.0, 48.0, 47.0, 38.0, 38.0, 26.0, 30.0, 20.0, 21.0, 20.0, 12.0, 11.0, 6.0, 9.0, 1.0, 4.0, 1.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.7744140625, -1.722869873046875, -1.67132568359375, -1.619781494140625, -1.5682373046875, -1.516693115234375, -1.46514892578125, -1.413604736328125, -1.362060546875, -1.310516357421875, -1.25897216796875, -1.207427978515625, -1.1558837890625, -1.104339599609375, -1.05279541015625, -1.001251220703125, -0.94970703125, -0.898162841796875, -0.84661865234375, -0.795074462890625, -0.7435302734375, -0.691986083984375, -0.64044189453125, -0.588897705078125, -0.537353515625, -0.485809326171875, -0.43426513671875, -0.382720947265625, -0.3311767578125, -0.279632568359375, -0.22808837890625, -0.176544189453125, -0.125, -0.073455810546875, -0.02191162109375, 0.029632568359375, 0.0811767578125, 0.132720947265625, 0.18426513671875, 0.235809326171875, 0.287353515625, 0.338897705078125, 0.39044189453125, 0.441986083984375, 0.4935302734375, 0.545074462890625, 0.59661865234375, 0.648162841796875, 0.69970703125, 0.751251220703125, 0.80279541015625, 0.854339599609375, 0.9058837890625, 0.957427978515625, 1.00897216796875, 1.060516357421875, 1.112060546875, 1.163604736328125, 1.21514892578125, 1.266693115234375, 1.3182373046875, 1.369781494140625, 1.42132568359375, 1.472869873046875, 1.5244140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 15.0, 20.0, 28.0, 46.0, 67.0, 110.0, 208.0, 454.0, 936.0, 2467.0, 7533.0, 29177.0, 178489.0, 733886.0, 72481.0, 15220.0, 4430.0, 1572.0, 698.0, 295.0, 157.0, 100.0, 45.0, 32.0, 15.0, 13.0, 13.0, 5.0, 9.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3125, -0.30310821533203125, -0.2937164306640625, -0.28432464599609375, -0.274932861328125, -0.26554107666015625, -0.2561492919921875, -0.24675750732421875, -0.23736572265625, -0.22797393798828125, -0.2185821533203125, -0.20919036865234375, -0.199798583984375, -0.19040679931640625, -0.1810150146484375, -0.17162322998046875, -0.1622314453125, -0.15283966064453125, -0.1434478759765625, -0.13405609130859375, -0.124664306640625, -0.11527252197265625, -0.1058807373046875, -0.09648895263671875, -0.08709716796875, -0.07770538330078125, -0.0683135986328125, -0.05892181396484375, -0.049530029296875, -0.04013824462890625, -0.0307464599609375, -0.02135467529296875, -0.011962890625, -0.00257110595703125, 0.0068206787109375, 0.01621246337890625, 0.025604248046875, 0.03499603271484375, 0.0443878173828125, 0.05377960205078125, 0.06317138671875, 0.07256317138671875, 0.0819549560546875, 0.09134674072265625, 0.100738525390625, 0.11013031005859375, 0.1195220947265625, 0.12891387939453125, 0.1383056640625, 0.14769744873046875, 0.1570892333984375, 0.16648101806640625, 0.175872802734375, 0.18526458740234375, 0.1946563720703125, 0.20404815673828125, 0.21343994140625, 0.22283172607421875, 0.2322235107421875, 0.24161529541015625, 0.251007080078125, 0.26039886474609375, 0.2697906494140625, 0.27918243408203125, 0.28857421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 1.0, 6.0, 9.0, 12.0, 10.0, 13.0, 9.0, 18.0, 15.0, 23.0, 36.0, 41.0, 50.0, 68.0, 101.0, 97.0, 88.0, 78.0, 61.0, 55.0, 46.0, 28.0, 26.0, 18.0, 18.0, 15.0, 11.0, 7.0, 10.0, 6.0, 10.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-5.4717063903808594e-05, -5.3306110203266144e-05, -5.1895156502723694e-05, -5.0484202802181244e-05, -4.9073249101638794e-05, -4.7662295401096344e-05, -4.6251341700553894e-05, -4.4840388000011444e-05, -4.3429434299468994e-05, -4.2018480598926544e-05, -4.0607526898384094e-05, -3.9196573197841644e-05, -3.7785619497299194e-05, -3.6374665796756744e-05, -3.4963712096214294e-05, -3.3552758395671844e-05, -3.2141804695129395e-05, -3.0730850994586945e-05, -2.9319897294044495e-05, -2.7908943593502045e-05, -2.6497989892959595e-05, -2.5087036192417145e-05, -2.3676082491874695e-05, -2.2265128791332245e-05, -2.0854175090789795e-05, -1.9443221390247345e-05, -1.8032267689704895e-05, -1.6621313989162445e-05, -1.5210360288619995e-05, -1.3799406588077545e-05, -1.2388452887535095e-05, -1.0977499186992645e-05, -9.566545486450195e-06, -8.155591785907745e-06, -6.744638085365295e-06, -5.3336843848228455e-06, -3.9227306842803955e-06, -2.5117769837379456e-06, -1.1008232831954956e-06, 3.1013041734695435e-07, 1.7210841178894043e-06, 3.1320378184318542e-06, 4.542991518974304e-06, 5.953945219516754e-06, 7.364898920059204e-06, 8.775852620601654e-06, 1.0186806321144104e-05, 1.1597760021686554e-05, 1.3008713722229004e-05, 1.4419667422771454e-05, 1.5830621123313904e-05, 1.7241574823856354e-05, 1.8652528524398804e-05, 2.0063482224941254e-05, 2.1474435925483704e-05, 2.2885389626026154e-05, 2.4296343326568604e-05, 2.5707297027111053e-05, 2.7118250727653503e-05, 2.8529204428195953e-05, 2.9940158128738403e-05, 3.135111182928085e-05, 3.27620655298233e-05, 3.417301923036575e-05, 3.55839729309082e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 11.0, 12.0, 13.0, 20.0, 29.0, 42.0, 70.0, 111.0, 191.0, 337.0, 708.0, 1684.0, 4750.0, 17899.0, 99124.0, 750706.0, 139840.0, 23511.0, 5846.0, 1920.0, 809.0, 424.0, 192.0, 109.0, 62.0, 47.0, 36.0, 17.0, 12.0, 9.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.248626708984375, -0.23992919921875, -0.231231689453125, -0.2225341796875, -0.213836669921875, -0.20513916015625, -0.196441650390625, -0.187744140625, -0.179046630859375, -0.17034912109375, -0.161651611328125, -0.1529541015625, -0.144256591796875, -0.13555908203125, -0.126861572265625, -0.1181640625, -0.109466552734375, -0.10076904296875, -0.092071533203125, -0.0833740234375, -0.074676513671875, -0.06597900390625, -0.057281494140625, -0.048583984375, -0.039886474609375, -0.03118896484375, -0.022491455078125, -0.0137939453125, -0.005096435546875, 0.00360107421875, 0.012298583984375, 0.02099609375, 0.029693603515625, 0.03839111328125, 0.047088623046875, 0.0557861328125, 0.064483642578125, 0.07318115234375, 0.081878662109375, 0.090576171875, 0.099273681640625, 0.10797119140625, 0.116668701171875, 0.1253662109375, 0.134063720703125, 0.14276123046875, 0.151458740234375, 0.16015625, 0.168853759765625, 0.17755126953125, 0.186248779296875, 0.1949462890625, 0.203643798828125, 0.21234130859375, 0.221038818359375, 0.229736328125, 0.238433837890625, 0.24713134765625, 0.255828857421875, 0.2645263671875, 0.273223876953125, 0.28192138671875, 0.290618896484375, 0.29931640625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 4.0, 4.0, 3.0, 10.0, 12.0, 14.0, 23.0, 18.0, 32.0, 47.0, 45.0, 73.0, 85.0, 111.0, 117.0, 97.0, 73.0, 49.0, 50.0, 33.0, 16.0, 23.0, 8.0, 8.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2776527404785156, -0.26844024658203125, -0.2592277526855469, -0.2500152587890625, -0.24080276489257812, -0.23159027099609375, -0.22237777709960938, -0.213165283203125, -0.20395278930664062, -0.19474029541015625, -0.18552780151367188, -0.1763153076171875, -0.16710281372070312, -0.15789031982421875, -0.14867782592773438, -0.13946533203125, -0.13025283813476562, -0.12104034423828125, -0.11182785034179688, -0.1026153564453125, -0.09340286254882812, -0.08419036865234375, -0.07497787475585938, -0.065765380859375, -0.056552886962890625, -0.04734039306640625, -0.038127899169921875, -0.0289154052734375, -0.019702911376953125, -0.01049041748046875, -0.001277923583984375, 0.0079345703125, 0.017147064208984375, 0.02635955810546875, 0.035572052001953125, 0.0447845458984375, 0.053997039794921875, 0.06320953369140625, 0.07242202758789062, 0.081634521484375, 0.09084701538085938, 0.10005950927734375, 0.10927200317382812, 0.1184844970703125, 0.12769699096679688, 0.13690948486328125, 0.14612197875976562, 0.15533447265625, 0.16454696655273438, 0.17375946044921875, 0.18297195434570312, 0.1921844482421875, 0.20139694213867188, 0.21060943603515625, 0.21982192993164062, 0.229034423828125, 0.23824691772460938, 0.24745941162109375, 0.2566719055175781, 0.2658843994140625, 0.2750968933105469, 0.28430938720703125, 0.2935218811035156, 0.302734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 11.0, 16.0, 32.0, 42.0, 92.0, 166.0, 380.0, 142.0, 69.0, 24.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0], "bins": [-15.669515609741211, -15.382220268249512, -15.094923973083496, -14.807628631591797, -14.520333290100098, -14.233037948608398, -13.945741653442383, -13.658446311950684, -13.371150970458984, -13.083855628967285, -12.79655933380127, -12.50926399230957, -12.221968650817871, -11.934673309326172, -11.647377014160156, -11.360081672668457, -11.072785377502441, -10.785490036010742, -10.498193740844727, -10.210898399353027, -9.923603057861328, -9.636306762695312, -9.349011421203613, -9.061716079711914, -8.774419784545898, -8.4871244430542, -8.199828147888184, -7.912532806396484, -7.625237464904785, -7.337941646575928, -7.05064582824707, -6.763350486755371, -6.476055145263672, -6.1887593269348145, -5.901463985443115, -5.614168167114258, -5.326872825622559, -5.039577007293701, -4.752281188964844, -4.4649858474731445, -4.177690505981445, -3.890394926071167, -3.6030993461608887, -3.3158035278320312, -3.028507947921753, -2.7412123680114746, -2.453916549682617, -2.166620969772339, -1.8793251514434814, -1.5920295715332031, -1.3047338724136353, -1.0174381732940674, -0.7301425933837891, -0.44284701347351074, -0.15555131435394287, 0.131744384765625, 0.4190399646759033, 0.7063356041908264, 0.9936312437057495, 1.2809269428253174, 1.5682225227355957, 1.855518102645874, 2.1428136825561523, 2.4301095008850098, 2.717405080795288]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 13.0, 14.0, 16.0, 18.0, 27.0, 21.0, 30.0, 20.0, 35.0, 35.0, 37.0, 54.0, 75.0, 125.0, 103.0, 63.0, 39.0, 40.0, 30.0, 27.0, 29.0, 21.0, 19.0, 15.0, 13.0, 9.0, 12.0, 6.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.655926704406738, -6.458719730377197, -6.261512279510498, -6.064305305480957, -5.867098331451416, -5.669891357421875, -5.472683906555176, -5.275476932525635, -5.078269958496094, -4.881062984466553, -4.6838555335998535, -4.4866485595703125, -4.2894415855407715, -4.0922346115112305, -3.8950271606445312, -3.6978201866149902, -3.500612735748291, -3.303405523300171, -3.10619854927063, -2.9089913368225098, -2.7117843627929688, -2.5145771503448486, -2.3173699378967285, -2.1201629638671875, -1.9229557514190674, -1.7257486581802368, -1.5285415649414062, -1.3313343524932861, -1.1341272592544556, -0.936920166015625, -0.7397129535675049, -0.5425058603286743, -0.34529876708984375, -0.1480916440486908, 0.04911547899246216, 0.2463226318359375, 0.44352972507476807, 0.6407368183135986, 0.8379440307617188, 1.0351511240005493, 1.2323582172393799, 1.4295653104782104, 1.626772403717041, 1.8239796161651611, 2.0211868286132812, 2.2183938026428223, 2.4156010150909424, 2.6128082275390625, 2.8100152015686035, 3.0072224140167236, 3.2044293880462646, 3.4016366004943848, 3.598843574523926, 3.796050786972046, 3.993257999420166, 4.190464973449707, 4.387672424316406, 4.584879398345947, 4.7820868492126465, 4.9792938232421875, 5.1765007972717285, 5.3737077713012695, 5.570915222167969, 5.76812219619751, 5.965329170227051]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 6.0, 11.0, 22.0, 15.0, 27.0, 42.0, 52.0, 56.0, 84.0, 125.0, 206.0, 378.0, 723.0, 1584.0, 6315.0, 48447.0, 648973.0, 2757104.0, 675858.0, 45437.0, 5476.0, 1572.0, 721.0, 338.0, 196.0, 137.0, 92.0, 64.0, 49.0, 37.0, 25.0, 26.0, 13.0, 12.0, 14.0, 10.0, 1.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4665565490722656, -0.44751739501953125, -0.4284782409667969, -0.4094390869140625, -0.3903999328613281, -0.37136077880859375, -0.3523216247558594, -0.333282470703125, -0.3142433166503906, -0.29520416259765625, -0.2761650085449219, -0.2571258544921875, -0.23808670043945312, -0.21904754638671875, -0.20000839233398438, -0.18096923828125, -0.16193008422851562, -0.14289093017578125, -0.12385177612304688, -0.1048126220703125, -0.08577346801757812, -0.06673431396484375, -0.047695159912109375, -0.028656005859375, -0.009616851806640625, 0.00942230224609375, 0.028461456298828125, 0.0475006103515625, 0.06653976440429688, 0.08557891845703125, 0.10461807250976562, 0.1236572265625, 0.14269638061523438, 0.16173553466796875, 0.18077468872070312, 0.1998138427734375, 0.21885299682617188, 0.23789215087890625, 0.2569313049316406, 0.275970458984375, 0.2950096130371094, 0.31404876708984375, 0.3330879211425781, 0.3521270751953125, 0.3711662292480469, 0.39020538330078125, 0.4092445373535156, 0.42828369140625, 0.4473228454589844, 0.46636199951171875, 0.4854011535644531, 0.5044403076171875, 0.5234794616699219, 0.5425186157226562, 0.5615577697753906, 0.580596923828125, 0.5996360778808594, 0.6186752319335938, 0.6377143859863281, 0.6567535400390625, 0.6757926940917969, 0.6948318481445312, 0.7138710021972656, 0.73291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 10.0, 22.0, 13.0, 12.0, 20.0, 14.0, 23.0, 21.0, 35.0, 39.0, 40.0, 44.0, 44.0, 43.0, 51.0, 40.0, 61.0, 39.0, 39.0, 41.0, 35.0, 34.0, 37.0, 33.0, 41.0, 30.0, 20.0, 22.0, 16.0, 11.0, 16.0, 12.0, 10.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3804283142089844, -0.36608123779296875, -0.3517341613769531, -0.3373870849609375, -0.3230400085449219, -0.30869293212890625, -0.2943458557128906, -0.279998779296875, -0.2656517028808594, -0.25130462646484375, -0.23695755004882812, -0.2226104736328125, -0.20826339721679688, -0.19391632080078125, -0.17956924438476562, -0.16522216796875, -0.15087509155273438, -0.13652801513671875, -0.12218093872070312, -0.1078338623046875, -0.09348678588867188, -0.07913970947265625, -0.06479263305664062, -0.050445556640625, -0.036098480224609375, -0.02175140380859375, -0.007404327392578125, 0.0069427490234375, 0.021289825439453125, 0.03563690185546875, 0.049983978271484375, 0.0643310546875, 0.07867813110351562, 0.09302520751953125, 0.10737228393554688, 0.1217193603515625, 0.13606643676757812, 0.15041351318359375, 0.16476058959960938, 0.179107666015625, 0.19345474243164062, 0.20780181884765625, 0.22214889526367188, 0.2364959716796875, 0.2508430480957031, 0.26519012451171875, 0.2795372009277344, 0.29388427734375, 0.3082313537597656, 0.32257843017578125, 0.3369255065917969, 0.3512725830078125, 0.3656196594238281, 0.37996673583984375, 0.3943138122558594, 0.408660888671875, 0.4230079650878906, 0.43735504150390625, 0.4517021179199219, 0.4660491943359375, 0.4803962707519531, 0.49474334716796875, 0.5090904235839844, 0.5234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 9.0, 18.0, 27.0, 59.0, 102.0, 185.0, 565.0, 2715.0, 947866.0, 3238119.0, 3642.0, 611.0, 188.0, 74.0, 57.0, 20.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91796875, -1.8414306640625, -1.764892578125, -1.6883544921875, -1.61181640625, -1.5352783203125, -1.458740234375, -1.3822021484375, -1.3056640625, -1.2291259765625, -1.152587890625, -1.0760498046875, -0.99951171875, -0.9229736328125, -0.846435546875, -0.7698974609375, -0.693359375, -0.6168212890625, -0.540283203125, -0.4637451171875, -0.38720703125, -0.3106689453125, -0.234130859375, -0.1575927734375, -0.0810546875, -0.0045166015625, 0.072021484375, 0.1485595703125, 0.22509765625, 0.3016357421875, 0.378173828125, 0.4547119140625, 0.53125, 0.6077880859375, 0.684326171875, 0.7608642578125, 0.83740234375, 0.9139404296875, 0.990478515625, 1.0670166015625, 1.1435546875, 1.2200927734375, 1.296630859375, 1.3731689453125, 1.44970703125, 1.5262451171875, 1.602783203125, 1.6793212890625, 1.755859375, 1.8323974609375, 1.908935546875, 1.9854736328125, 2.06201171875, 2.1385498046875, 2.215087890625, 2.2916259765625, 2.3681640625, 2.4447021484375, 2.521240234375, 2.5977783203125, 2.67431640625, 2.7508544921875, 2.827392578125, 2.9039306640625, 2.98046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 10.0, 9.0, 17.0, 54.0, 121.0, 384.0, 1115.0, 1416.0, 634.0, 175.0, 81.0, 31.0, 15.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.6424331665039062, -2.5876007080078125, -2.5327682495117188, -2.477935791015625, -2.4231033325195312, -2.3682708740234375, -2.3134384155273438, -2.25860595703125, -2.2037734985351562, -2.1489410400390625, -2.0941085815429688, -2.039276123046875, -1.9844436645507812, -1.9296112060546875, -1.8747787475585938, -1.8199462890625, -1.7651138305664062, -1.7102813720703125, -1.6554489135742188, -1.600616455078125, -1.5457839965820312, -1.4909515380859375, -1.4361190795898438, -1.38128662109375, -1.3264541625976562, -1.2716217041015625, -1.2167892456054688, -1.161956787109375, -1.1071243286132812, -1.0522918701171875, -0.9974594116210938, -0.942626953125, -0.8877944946289062, -0.8329620361328125, -0.7781295776367188, -0.723297119140625, -0.6684646606445312, -0.6136322021484375, -0.5587997436523438, -0.50396728515625, -0.44913482666015625, -0.3943023681640625, -0.33946990966796875, -0.284637451171875, -0.22980499267578125, -0.1749725341796875, -0.12014007568359375, -0.0653076171875, -0.01047515869140625, 0.0443572998046875, 0.09918975830078125, 0.154022216796875, 0.20885467529296875, 0.2636871337890625, 0.31851959228515625, 0.37335205078125, 0.42818450927734375, 0.4830169677734375, 0.5378494262695312, 0.592681884765625, 0.6475143432617188, 0.7023468017578125, 0.7571792602539062, 0.81201171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 41.0, 101.0, 351.0, 352.0, 98.0, 24.0, 12.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.493446350097656, -11.034473419189453, -10.57550048828125, -10.116527557373047, -9.657553672790527, -9.198580741882324, -8.739607810974121, -8.280634880065918, -7.821661472320557, -7.3626885414123535, -6.903715133666992, -6.444742202758789, -5.985769271850586, -5.526795864105225, -5.0678229331970215, -4.60884952545166, -4.149876594543457, -3.690903425216675, -3.2319302558898926, -2.7729573249816895, -2.3139841556549072, -1.855010986328125, -1.3960380554199219, -0.9370648860931396, -0.4780917167663574, -0.01911860704421997, 0.4398545026779175, 0.8988275527954102, 1.3578007221221924, 1.8167738914489746, 2.2757468223571777, 2.73471999168396, 3.193693161010742, 3.6526663303375244, 4.111639499664307, 4.57061243057251, 5.029585838317871, 5.488558769226074, 5.947531700134277, 6.4065046310424805, 6.865478038787842, 7.324450969696045, 7.783424377441406, 8.24239730834961, 8.701370239257812, 9.160343170166016, 9.619316101074219, 10.078289985656738, 10.537262916564941, 10.996235847473145, 11.455208778381348, 11.914182662963867, 12.37315559387207, 12.832128524780273, 13.291101455688477, 13.75007438659668, 14.209047317504883, 14.668020248413086, 15.126993179321289, 15.585966110229492, 16.044939041137695, 16.50391387939453, 16.962886810302734, 17.421859741210938, 17.88083267211914]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 7.0, 15.0, 14.0, 13.0, 27.0, 25.0, 18.0, 35.0, 50.0, 42.0, 45.0, 59.0, 66.0, 54.0, 57.0, 53.0, 60.0, 61.0, 53.0, 46.0, 29.0, 26.0, 27.0, 21.0, 15.0, 15.0, 13.0, 13.0, 7.0, 2.0, 8.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8660454750061035, -4.705453872680664, -4.544862270355225, -4.384270668029785, -4.223679065704346, -4.063087463378906, -3.902495861053467, -3.7419042587280273, -3.581312656402588, -3.4207210540771484, -3.260129451751709, -3.0995378494262695, -2.93894624710083, -2.7783546447753906, -2.617763042449951, -2.4571714401245117, -2.2965798377990723, -2.135988235473633, -1.9753966331481934, -1.814805030822754, -1.6542134284973145, -1.493621826171875, -1.3330302238464355, -1.172438621520996, -1.0118470191955566, -0.8512554168701172, -0.6906638145446777, -0.5300722122192383, -0.36948060989379883, -0.20888900756835938, -0.04829740524291992, 0.11229419708251953, 0.2728853225708008, 0.43347692489624023, 0.5940685272216797, 0.7546601295471191, 0.9152517318725586, 1.075843334197998, 1.2364349365234375, 1.397026538848877, 1.5576181411743164, 1.7182097434997559, 1.8788013458251953, 2.0393929481506348, 2.199984550476074, 2.3605761528015137, 2.521167755126953, 2.6817593574523926, 2.842350959777832, 3.0029425621032715, 3.163534164428711, 3.3241257667541504, 3.48471736907959, 3.6453089714050293, 3.8059005737304688, 3.966492176055908, 4.127083778381348, 4.287675380706787, 4.448266983032227, 4.608858585357666, 4.7694501876831055, 4.930041790008545, 5.090633392333984, 5.251224994659424, 5.411816596984863]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 3.0, 11.0, 14.0, 21.0, 34.0, 39.0, 50.0, 71.0, 139.0, 210.0, 325.0, 463.0, 723.0, 1126.0, 1780.0, 2910.0, 5246.0, 9683.0, 19254.0, 42172.0, 105839.0, 300660.0, 340407.0, 123297.0, 47936.0, 21550.0, 10469.0, 5581.0, 3197.0, 1927.0, 1236.0, 761.0, 490.0, 329.0, 195.0, 134.0, 85.0, 60.0, 37.0, 31.0, 27.0, 9.0, 14.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5620651245117188, -0.5445404052734375, -0.5270156860351562, -0.509490966796875, -0.49196624755859375, -0.4744415283203125, -0.45691680908203125, -0.43939208984375, -0.42186737060546875, -0.4043426513671875, -0.38681793212890625, -0.369293212890625, -0.35176849365234375, -0.3342437744140625, -0.31671905517578125, -0.2991943359375, -0.28166961669921875, -0.2641448974609375, -0.24662017822265625, -0.229095458984375, -0.21157073974609375, -0.1940460205078125, -0.17652130126953125, -0.15899658203125, -0.14147186279296875, -0.1239471435546875, -0.10642242431640625, -0.088897705078125, -0.07137298583984375, -0.0538482666015625, -0.03632354736328125, -0.018798828125, -0.00127410888671875, 0.0162506103515625, 0.03377532958984375, 0.051300048828125, 0.06882476806640625, 0.0863494873046875, 0.10387420654296875, 0.12139892578125, 0.13892364501953125, 0.1564483642578125, 0.17397308349609375, 0.191497802734375, 0.20902252197265625, 0.2265472412109375, 0.24407196044921875, 0.2615966796875, 0.27912139892578125, 0.2966461181640625, 0.31417083740234375, 0.331695556640625, 0.34922027587890625, 0.3667449951171875, 0.38426971435546875, 0.40179443359375, 0.41931915283203125, 0.4368438720703125, 0.45436859130859375, 0.471893310546875, 0.48941802978515625, 0.5069427490234375, 0.5244674682617188, 0.5419921875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 6.0, 8.0, 8.0, 8.0, 8.0, 9.0, 17.0, 9.0, 19.0, 20.0, 19.0, 26.0, 26.0, 24.0, 33.0, 31.0, 41.0, 33.0, 34.0, 47.0, 40.0, 48.0, 42.0, 27.0, 43.0, 28.0, 39.0, 32.0, 42.0, 18.0, 28.0, 22.0, 25.0, 18.0, 18.0, 16.0, 12.0, 11.0, 9.0, 8.0, 6.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.37158203125, -0.3594093322753906, -0.34723663330078125, -0.3350639343261719, -0.3228912353515625, -0.3107185363769531, -0.29854583740234375, -0.2863731384277344, -0.274200439453125, -0.2620277404785156, -0.24985504150390625, -0.23768234252929688, -0.2255096435546875, -0.21333694458007812, -0.20116424560546875, -0.18899154663085938, -0.17681884765625, -0.16464614868164062, -0.15247344970703125, -0.14030075073242188, -0.1281280517578125, -0.11595535278320312, -0.10378265380859375, -0.09160995483398438, -0.079437255859375, -0.06726455688476562, -0.05509185791015625, -0.042919158935546875, -0.0307464599609375, -0.018573760986328125, -0.00640106201171875, 0.005771636962890625, 0.0179443359375, 0.030117034912109375, 0.04228973388671875, 0.054462432861328125, 0.0666351318359375, 0.07880783081054688, 0.09098052978515625, 0.10315322875976562, 0.115325927734375, 0.12749862670898438, 0.13967132568359375, 0.15184402465820312, 0.1640167236328125, 0.17618942260742188, 0.18836212158203125, 0.20053482055664062, 0.21270751953125, 0.22488021850585938, 0.23705291748046875, 0.24922561645507812, 0.2613983154296875, 0.2735710144042969, 0.28574371337890625, 0.2979164123535156, 0.310089111328125, 0.3222618103027344, 0.33443450927734375, 0.3466072082519531, 0.3587799072265625, 0.3709526062011719, 0.38312530517578125, 0.3952980041503906, 0.407470703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 5.0, 7.0, 1.0, 6.0, 11.0, 17.0, 21.0, 24.0, 31.0, 50.0, 63.0, 76.0, 110.0, 190.0, 290.0, 434.0, 751.0, 1681.0, 5499.0, 47037.0, 913946.0, 67775.0, 6484.0, 1808.0, 781.0, 462.0, 305.0, 185.0, 145.0, 92.0, 63.0, 46.0, 39.0, 34.0, 14.0, 19.0, 14.0, 11.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.8525390625, -1.7989349365234375, -1.745330810546875, -1.6917266845703125, -1.63812255859375, -1.5845184326171875, -1.530914306640625, -1.4773101806640625, -1.4237060546875, -1.3701019287109375, -1.316497802734375, -1.2628936767578125, -1.20928955078125, -1.1556854248046875, -1.102081298828125, -1.0484771728515625, -0.994873046875, -0.9412689208984375, -0.887664794921875, -0.8340606689453125, -0.78045654296875, -0.7268524169921875, -0.673248291015625, -0.6196441650390625, -0.5660400390625, -0.5124359130859375, -0.458831787109375, -0.4052276611328125, -0.35162353515625, -0.2980194091796875, -0.244415283203125, -0.1908111572265625, -0.13720703125, -0.0836029052734375, -0.029998779296875, 0.0236053466796875, 0.07720947265625, 0.1308135986328125, 0.184417724609375, 0.2380218505859375, 0.2916259765625, 0.3452301025390625, 0.398834228515625, 0.4524383544921875, 0.50604248046875, 0.5596466064453125, 0.613250732421875, 0.6668548583984375, 0.720458984375, 0.7740631103515625, 0.827667236328125, 0.8812713623046875, 0.93487548828125, 0.9884796142578125, 1.042083740234375, 1.0956878662109375, 1.1492919921875, 1.2028961181640625, 1.256500244140625, 1.3101043701171875, 1.36370849609375, 1.4173126220703125, 1.470916748046875, 1.5245208740234375, 1.578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 8.0, 2.0, 2.0, 7.0, 14.0, 15.0, 15.0, 16.0, 22.0, 26.0, 27.0, 34.0, 35.0, 31.0, 46.0, 55.0, 53.0, 48.0, 62.0, 48.0, 67.0, 41.0, 44.0, 44.0, 41.0, 31.0, 24.0, 29.0, 16.0, 12.0, 17.0, 7.0, 11.0, 6.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.638671875, -1.585662841796875, -1.53265380859375, -1.479644775390625, -1.4266357421875, -1.373626708984375, -1.32061767578125, -1.267608642578125, -1.214599609375, -1.161590576171875, -1.10858154296875, -1.055572509765625, -1.0025634765625, -0.949554443359375, -0.89654541015625, -0.843536376953125, -0.79052734375, -0.737518310546875, -0.68450927734375, -0.631500244140625, -0.5784912109375, -0.525482177734375, -0.47247314453125, -0.419464111328125, -0.366455078125, -0.313446044921875, -0.26043701171875, -0.207427978515625, -0.1544189453125, -0.101409912109375, -0.04840087890625, 0.004608154296875, 0.0576171875, 0.110626220703125, 0.16363525390625, 0.216644287109375, 0.2696533203125, 0.322662353515625, 0.37567138671875, 0.428680419921875, 0.481689453125, 0.534698486328125, 0.58770751953125, 0.640716552734375, 0.6937255859375, 0.746734619140625, 0.79974365234375, 0.852752685546875, 0.90576171875, 0.958770751953125, 1.01177978515625, 1.064788818359375, 1.1177978515625, 1.170806884765625, 1.22381591796875, 1.276824951171875, 1.329833984375, 1.382843017578125, 1.43585205078125, 1.488861083984375, 1.5418701171875, 1.594879150390625, 1.64788818359375, 1.700897216796875, 1.75390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 4.0, 5.0, 7.0, 11.0, 5.0, 17.0, 14.0, 26.0, 55.0, 107.0, 337.0, 1174.0, 6626.0, 1003475.0, 33387.0, 2346.0, 554.0, 149.0, 70.0, 44.0, 31.0, 19.0, 7.0, 7.0, 6.0, 5.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 0.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2802734375, -1.23992919921875, -1.1995849609375, -1.15924072265625, -1.118896484375, -1.07855224609375, -1.0382080078125, -0.99786376953125, -0.95751953125, -0.91717529296875, -0.8768310546875, -0.83648681640625, -0.796142578125, -0.75579833984375, -0.7154541015625, -0.67510986328125, -0.634765625, -0.59442138671875, -0.5540771484375, -0.51373291015625, -0.473388671875, -0.43304443359375, -0.3927001953125, -0.35235595703125, -0.31201171875, -0.27166748046875, -0.2313232421875, -0.19097900390625, -0.150634765625, -0.11029052734375, -0.0699462890625, -0.02960205078125, 0.0107421875, 0.05108642578125, 0.0914306640625, 0.13177490234375, 0.172119140625, 0.21246337890625, 0.2528076171875, 0.29315185546875, 0.33349609375, 0.37384033203125, 0.4141845703125, 0.45452880859375, 0.494873046875, 0.53521728515625, 0.5755615234375, 0.61590576171875, 0.65625, 0.69659423828125, 0.7369384765625, 0.77728271484375, 0.817626953125, 0.85797119140625, 0.8983154296875, 0.93865966796875, 0.97900390625, 1.01934814453125, 1.0596923828125, 1.10003662109375, 1.140380859375, 1.18072509765625, 1.2210693359375, 1.26141357421875, 1.3017578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 23.0, 24.0, 53.0, 109.0, 225.0, 275.0, 125.0, 59.0, 45.0, 9.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.237361907958984e-05, -7.806532084941864e-05, -7.375702261924744e-05, -6.944872438907623e-05, -6.514042615890503e-05, -6.0832127928733826e-05, -5.652382969856262e-05, -5.221553146839142e-05, -4.7907233238220215e-05, -4.359893500804901e-05, -3.929063677787781e-05, -3.4982338547706604e-05, -3.06740403175354e-05, -2.6365742087364197e-05, -2.2057443857192993e-05, -1.774914562702179e-05, -1.3440847396850586e-05, -9.132549166679382e-06, -4.824250936508179e-06, -5.159527063369751e-07, 3.7923455238342285e-06, 8.100643754005432e-06, 1.2408941984176636e-05, 1.671724021434784e-05, 2.1025538444519043e-05, 2.5333836674690247e-05, 2.964213490486145e-05, 3.3950433135032654e-05, 3.825873136520386e-05, 4.256702959537506e-05, 4.6875327825546265e-05, 5.118362605571747e-05, 5.549192428588867e-05, 5.9800222516059875e-05, 6.410852074623108e-05, 6.841681897640228e-05, 7.272511720657349e-05, 7.703341543674469e-05, 8.13417136669159e-05, 8.56500118970871e-05, 8.99583101272583e-05, 9.42666083574295e-05, 9.857490658760071e-05, 0.00010288320481777191, 0.00010719150304794312, 0.00011149980127811432, 0.00011580809950828552, 0.00012011639773845673, 0.00012442469596862793, 0.00012873299419879913, 0.00013304129242897034, 0.00013734959065914154, 0.00014165788888931274, 0.00014596618711948395, 0.00015027448534965515, 0.00015458278357982635, 0.00015889108180999756, 0.00016319938004016876, 0.00016750767827033997, 0.00017181597650051117, 0.00017612427473068237, 0.00018043257296085358, 0.00018474087119102478, 0.00018904916942119598, 0.0001933574676513672]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 2.0, 5.0, 7.0, 17.0, 10.0, 25.0, 28.0, 30.0, 55.0, 98.0, 199.0, 602.0, 2499.0, 21287.0, 953363.0, 64467.0, 4309.0, 843.0, 321.0, 149.0, 69.0, 49.0, 28.0, 21.0, 13.0, 6.0, 11.0, 3.0, 4.0, 7.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4814453125, -0.4640350341796875, -0.446624755859375, -0.4292144775390625, -0.41180419921875, -0.3943939208984375, -0.376983642578125, -0.3595733642578125, -0.3421630859375, -0.3247528076171875, -0.307342529296875, -0.2899322509765625, -0.27252197265625, -0.2551116943359375, -0.237701416015625, -0.2202911376953125, -0.202880859375, -0.1854705810546875, -0.168060302734375, -0.1506500244140625, -0.13323974609375, -0.1158294677734375, -0.098419189453125, -0.0810089111328125, -0.0635986328125, -0.0461883544921875, -0.028778076171875, -0.0113677978515625, 0.00604248046875, 0.0234527587890625, 0.040863037109375, 0.0582733154296875, 0.07568359375, 0.0930938720703125, 0.110504150390625, 0.1279144287109375, 0.14532470703125, 0.1627349853515625, 0.180145263671875, 0.1975555419921875, 0.2149658203125, 0.2323760986328125, 0.249786376953125, 0.2671966552734375, 0.28460693359375, 0.3020172119140625, 0.319427490234375, 0.3368377685546875, 0.354248046875, 0.3716583251953125, 0.389068603515625, 0.4064788818359375, 0.42388916015625, 0.4412994384765625, 0.458709716796875, 0.4761199951171875, 0.4935302734375, 0.5109405517578125, 0.528350830078125, 0.5457611083984375, 0.56317138671875, 0.5805816650390625, 0.597991943359375, 0.6154022216796875, 0.6328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 12.0, 27.0, 61.0, 87.0, 127.0, 181.0, 149.0, 105.0, 98.0, 56.0, 20.0, 19.0, 8.0, 7.0, 10.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51953125, -0.5038719177246094, -0.48821258544921875, -0.4725532531738281, -0.4568939208984375, -0.4412345886230469, -0.42557525634765625, -0.4099159240722656, -0.394256591796875, -0.3785972595214844, -0.36293792724609375, -0.3472785949707031, -0.3316192626953125, -0.3159599304199219, -0.30030059814453125, -0.2846412658691406, -0.26898193359375, -0.2533226013183594, -0.23766326904296875, -0.22200393676757812, -0.2063446044921875, -0.19068527221679688, -0.17502593994140625, -0.15936660766601562, -0.143707275390625, -0.12804794311523438, -0.11238861083984375, -0.09672927856445312, -0.0810699462890625, -0.06541061401367188, -0.04975128173828125, -0.034091949462890625, -0.0184326171875, -0.002773284912109375, 0.01288604736328125, 0.028545379638671875, 0.0442047119140625, 0.059864044189453125, 0.07552337646484375, 0.09118270874023438, 0.106842041015625, 0.12250137329101562, 0.13816070556640625, 0.15382003784179688, 0.1694793701171875, 0.18513870239257812, 0.20079803466796875, 0.21645736694335938, 0.23211669921875, 0.24777603149414062, 0.26343536376953125, 0.2790946960449219, 0.2947540283203125, 0.3104133605957031, 0.32607269287109375, 0.3417320251464844, 0.357391357421875, 0.3730506896972656, 0.38871002197265625, 0.4043693542480469, 0.4200286865234375, 0.4356880187988281, 0.45134735107421875, 0.4670066833496094, 0.482666015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 24.0, 69.0, 661.0, 218.0, 24.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.79591369628906, -48.88642120361328, -47.976924896240234, -47.06743240356445, -46.15793991088867, -45.248443603515625, -44.338951110839844, -43.42945861816406, -42.51996612548828, -41.6104736328125, -40.70097732543945, -39.79148483276367, -38.88199234008789, -37.972496032714844, -37.06300354003906, -36.15351104736328, -35.244014739990234, -34.33452224731445, -33.425025939941406, -32.515533447265625, -31.606040954589844, -30.69654655456543, -29.787052154541016, -28.877559661865234, -27.96806526184082, -27.058570861816406, -26.149078369140625, -25.23958396911621, -24.330089569091797, -23.420597076416016, -22.5111026763916, -21.601608276367188, -20.69211769104004, -19.782623291015625, -18.873130798339844, -17.96363639831543, -17.054141998291016, -16.144649505615234, -15.23515510559082, -14.325661659240723, -13.416168212890625, -12.506674766540527, -11.59718132019043, -10.687686920166016, -9.778193473815918, -8.86870002746582, -7.9592061042785645, -7.049712181091309, -6.140218734741211, -5.230725288391113, -4.321231365203857, -3.4117376804351807, -2.502243995666504, -1.5927505493164062, -0.6832566261291504, 0.22623729705810547, 1.1357307434082031, 2.04522442817688, 2.9547181129455566, 3.8642117977142334, 4.77370548248291, 5.683198928833008, 6.592692852020264, 7.5021867752075195, 8.411680221557617]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 17.0, 6.0, 19.0, 16.0, 16.0, 14.0, 14.0, 34.0, 23.0, 34.0, 28.0, 41.0, 44.0, 109.0, 160.0, 73.0, 44.0, 30.0, 24.0, 33.0, 22.0, 24.0, 22.0, 16.0, 17.0, 11.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.7891411781311035, -7.555935382843018, -7.322729587554932, -7.089523792266846, -6.85631799697876, -6.623112201690674, -6.389906883239746, -6.15670108795166, -5.923495292663574, -5.690289497375488, -5.457083702087402, -5.223877906799316, -4.9906721115112305, -4.7574663162231445, -4.524260520935059, -4.291054725646973, -4.057848930358887, -3.824643135070801, -3.591437339782715, -3.358231544494629, -3.125025749206543, -2.891819953918457, -2.65861439704895, -2.4254086017608643, -2.1922028064727783, -1.9589970111846924, -1.7257912158966064, -1.49258553981781, -1.2593797445297241, -1.0261739492416382, -0.7929682731628418, -0.5597624778747559, -0.3265562057495117, -0.09335044026374817, 0.13985532522201538, 0.37306106090545654, 0.6062668561935425, 0.8394726514816284, 1.0726783275604248, 1.3058841228485107, 1.5390899181365967, 1.7722957134246826, 2.0055015087127686, 2.2387070655822754, 2.4719128608703613, 2.7051186561584473, 2.938324451446533, 3.171530246734619, 3.404736042022705, 3.637941837310791, 3.871147632598877, 4.104353427886963, 4.337559223175049, 4.570765018463135, 4.8039703369140625, 5.037176132202148, 5.270381927490234, 5.50358772277832, 5.736793518066406, 5.969999313354492, 6.203205108642578, 6.436410903930664, 6.66961669921875, 6.902822494506836, 7.136028289794922]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 4.0, 6.0, 18.0, 21.0, 34.0, 72.0, 113.0, 185.0, 287.0, 434.0, 753.0, 1317.0, 2365.0, 4889.0, 12721.0, 49826.0, 239914.0, 900965.0, 1757376.0, 912162.0, 244579.0, 45189.0, 10963.0, 4469.0, 2267.0, 1241.0, 781.0, 460.0, 304.0, 177.0, 147.0, 77.0, 55.0, 39.0, 28.0, 9.0, 11.0, 8.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439208984375, -0.4248085021972656, -0.41040802001953125, -0.3960075378417969, -0.3816070556640625, -0.3672065734863281, -0.35280609130859375, -0.3384056091308594, -0.324005126953125, -0.3096046447753906, -0.29520416259765625, -0.2808036804199219, -0.2664031982421875, -0.2520027160644531, -0.23760223388671875, -0.22320175170898438, -0.20880126953125, -0.19440078735351562, -0.18000030517578125, -0.16559982299804688, -0.1511993408203125, -0.13679885864257812, -0.12239837646484375, -0.10799789428710938, -0.093597412109375, -0.07919692993164062, -0.06479644775390625, -0.050395965576171875, -0.0359954833984375, -0.021595001220703125, -0.00719451904296875, 0.007205963134765625, 0.0216064453125, 0.036006927490234375, 0.05040740966796875, 0.06480789184570312, 0.0792083740234375, 0.09360885620117188, 0.10800933837890625, 0.12240982055664062, 0.136810302734375, 0.15121078491210938, 0.16561126708984375, 0.18001174926757812, 0.1944122314453125, 0.20881271362304688, 0.22321319580078125, 0.23761367797851562, 0.25201416015625, 0.2664146423339844, 0.28081512451171875, 0.2952156066894531, 0.3096160888671875, 0.3240165710449219, 0.33841705322265625, 0.3528175354003906, 0.367218017578125, 0.3816184997558594, 0.39601898193359375, 0.4104194641113281, 0.4248199462890625, 0.4392204284667969, 0.45362091064453125, 0.4680213928222656, 0.482421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 2.0, 11.0, 6.0, 12.0, 5.0, 4.0, 16.0, 17.0, 20.0, 17.0, 22.0, 28.0, 29.0, 32.0, 32.0, 40.0, 47.0, 39.0, 49.0, 57.0, 44.0, 51.0, 34.0, 37.0, 32.0, 43.0, 38.0, 33.0, 29.0, 24.0, 27.0, 22.0, 14.0, 18.0, 16.0, 12.0, 4.0, 6.0, 9.0, 5.0, 5.0, 3.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.346435546875, -0.333343505859375, -0.32025146484375, -0.307159423828125, -0.2940673828125, -0.280975341796875, -0.26788330078125, -0.254791259765625, -0.24169921875, -0.228607177734375, -0.21551513671875, -0.202423095703125, -0.1893310546875, -0.176239013671875, -0.16314697265625, -0.150054931640625, -0.136962890625, -0.123870849609375, -0.11077880859375, -0.097686767578125, -0.0845947265625, -0.071502685546875, -0.05841064453125, -0.045318603515625, -0.0322265625, -0.019134521484375, -0.00604248046875, 0.007049560546875, 0.0201416015625, 0.033233642578125, 0.04632568359375, 0.059417724609375, 0.072509765625, 0.085601806640625, 0.09869384765625, 0.111785888671875, 0.1248779296875, 0.137969970703125, 0.15106201171875, 0.164154052734375, 0.17724609375, 0.190338134765625, 0.20343017578125, 0.216522216796875, 0.2296142578125, 0.242706298828125, 0.25579833984375, 0.268890380859375, 0.281982421875, 0.295074462890625, 0.30816650390625, 0.321258544921875, 0.3343505859375, 0.347442626953125, 0.36053466796875, 0.373626708984375, 0.38671875, 0.399810791015625, 0.41290283203125, 0.425994873046875, 0.4390869140625, 0.452178955078125, 0.46527099609375, 0.478363037109375, 0.491455078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 19.0, 21.0, 25.0, 38.0, 48.0, 60.0, 119.0, 190.0, 428.0, 979.0, 3603.0, 71443.0, 4087198.0, 25223.0, 2908.0, 991.0, 442.0, 217.0, 101.0, 78.0, 39.0, 31.0, 13.0, 14.0, 12.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.154296875, -3.0761566162109375, -2.998016357421875, -2.9198760986328125, -2.84173583984375, -2.7635955810546875, -2.685455322265625, -2.6073150634765625, -2.5291748046875, -2.4510345458984375, -2.372894287109375, -2.2947540283203125, -2.21661376953125, -2.1384735107421875, -2.060333251953125, -1.9821929931640625, -1.904052734375, -1.8259124755859375, -1.747772216796875, -1.6696319580078125, -1.59149169921875, -1.5133514404296875, -1.435211181640625, -1.3570709228515625, -1.2789306640625, -1.2007904052734375, -1.122650146484375, -1.0445098876953125, -0.96636962890625, -0.8882293701171875, -0.810089111328125, -0.7319488525390625, -0.65380859375, -0.5756683349609375, -0.497528076171875, -0.4193878173828125, -0.34124755859375, -0.2631072998046875, -0.184967041015625, -0.1068267822265625, -0.0286865234375, 0.0494537353515625, 0.127593994140625, 0.2057342529296875, 0.28387451171875, 0.3620147705078125, 0.440155029296875, 0.5182952880859375, 0.596435546875, 0.6745758056640625, 0.752716064453125, 0.8308563232421875, 0.90899658203125, 0.9871368408203125, 1.065277099609375, 1.1434173583984375, 1.2215576171875, 1.2996978759765625, 1.377838134765625, 1.4559783935546875, 1.53411865234375, 1.6122589111328125, 1.690399169921875, 1.7685394287109375, 1.8466796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 13.0, 11.0, 30.0, 36.0, 38.0, 108.0, 199.0, 276.0, 468.0, 767.0, 721.0, 457.0, 320.0, 186.0, 125.0, 77.0, 62.0, 40.0, 33.0, 25.0, 24.0, 14.0, 12.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.834808349609375, -0.79071044921875, -0.746612548828125, -0.7025146484375, -0.658416748046875, -0.61431884765625, -0.570220947265625, -0.526123046875, -0.482025146484375, -0.43792724609375, -0.393829345703125, -0.3497314453125, -0.305633544921875, -0.26153564453125, -0.217437744140625, -0.17333984375, -0.129241943359375, -0.08514404296875, -0.041046142578125, 0.0030517578125, 0.047149658203125, 0.09124755859375, 0.135345458984375, 0.179443359375, 0.223541259765625, 0.26763916015625, 0.311737060546875, 0.3558349609375, 0.399932861328125, 0.44403076171875, 0.488128662109375, 0.5322265625, 0.576324462890625, 0.62042236328125, 0.664520263671875, 0.7086181640625, 0.752716064453125, 0.79681396484375, 0.840911865234375, 0.885009765625, 0.929107666015625, 0.97320556640625, 1.017303466796875, 1.0614013671875, 1.105499267578125, 1.14959716796875, 1.193695068359375, 1.23779296875, 1.281890869140625, 1.32598876953125, 1.370086669921875, 1.4141845703125, 1.458282470703125, 1.50238037109375, 1.546478271484375, 1.590576171875, 1.634674072265625, 1.67877197265625, 1.722869873046875, 1.7669677734375, 1.811065673828125, 1.85516357421875, 1.899261474609375, 1.943359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 11.0, 31.0, 116.0, 390.0, 289.0, 105.0, 31.0, 14.0, 1.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.080330848693848, -6.150125026702881, -5.219919204711914, -4.289712905883789, -3.3595073223114014, -2.4293012619018555, -1.4990954399108887, -0.5688896179199219, 0.3613162040710449, 1.2915220260620117, 2.2217278480529785, 3.1519339084625244, 4.08213996887207, 5.012345790863037, 5.942551612854004, 6.872757434844971, 7.8029632568359375, 8.733169555664062, 9.663374900817871, 10.593581199645996, 11.523786544799805, 12.45399284362793, 13.384199142456055, 14.314404487609863, 15.244609832763672, 16.174816131591797, 17.105022430419922, 18.035226821899414, 18.96543312072754, 19.895639419555664, 20.82584571838379, 21.75605010986328, 22.68625831604004, 23.616464614868164, 24.54667091369629, 25.47687530517578, 26.407081604003906, 27.33728790283203, 28.267494201660156, 29.19770050048828, 30.127904891967773, 31.0581111907959, 31.988317489624023, 32.918521881103516, 33.84872817993164, 34.778934478759766, 35.70914077758789, 36.639347076416016, 37.56955337524414, 38.499759674072266, 39.42996597290039, 40.360172271728516, 41.29037857055664, 42.2205810546875, 43.150787353515625, 44.08099365234375, 45.011199951171875, 45.94140625, 46.871612548828125, 47.80181884765625, 48.732025146484375, 49.6622314453125, 50.59243392944336, 51.522640228271484, 52.45284652709961]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 7.0, 7.0, 9.0, 6.0, 18.0, 19.0, 26.0, 38.0, 48.0, 53.0, 41.0, 68.0, 63.0, 56.0, 75.0, 67.0, 78.0, 48.0, 50.0, 46.0, 34.0, 28.0, 32.0, 25.0, 17.0, 6.0, 4.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.032562255859375, -8.712173461914062, -8.391785621643066, -8.071396827697754, -7.751008987426758, -7.430620193481445, -7.110231876373291, -6.789843559265137, -6.469455242156982, -6.149066925048828, -5.828678607940674, -5.5082902908325195, -5.187901496887207, -4.867513656616211, -4.547124862670898, -4.226736545562744, -3.90634822845459, -3.5859599113464355, -3.2655715942382812, -2.945183038711548, -2.6247947216033936, -2.3044064044952393, -1.9840179681777954, -1.6636295318603516, -1.3432412147521973, -1.022852897644043, -0.7024644613265991, -0.38207608461380005, -0.06168770790100098, 0.2587006092071533, 0.5790890455245972, 0.899477481842041, 1.219864845275879, 1.5402531623840332, 1.860641598701477, 2.181030035018921, 2.501418352127075, 2.8218066692352295, 3.142195224761963, 3.462583541870117, 3.7829718589782715, 4.103360176086426, 4.42374849319458, 4.744136810302734, 5.064525604248047, 5.384913444519043, 5.7053022384643555, 6.02569055557251, 6.346078872680664, 6.666467189788818, 6.986855506896973, 7.307243824005127, 7.627632141113281, 7.948020935058594, 8.26840877532959, 8.588797569274902, 8.909185409545898, 9.229574203491211, 9.549962043762207, 9.87035083770752, 10.190738677978516, 10.511127471923828, 10.831515312194824, 11.151904106140137, 11.47229290008545]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 1.0, 11.0, 16.0, 15.0, 10.0, 22.0, 33.0, 56.0, 76.0, 125.0, 233.0, 372.0, 730.0, 1454.0, 2926.0, 7452.0, 23803.0, 124624.0, 736368.0, 114659.0, 22532.0, 7189.0, 2830.0, 1337.0, 682.0, 363.0, 226.0, 148.0, 92.0, 50.0, 21.0, 27.0, 15.0, 7.0, 7.0, 5.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.7451171875, -0.7198410034179688, -0.6945648193359375, -0.6692886352539062, -0.644012451171875, -0.6187362670898438, -0.5934600830078125, -0.5681838989257812, -0.54290771484375, -0.5176315307617188, -0.4923553466796875, -0.46707916259765625, -0.441802978515625, -0.41652679443359375, -0.3912506103515625, -0.36597442626953125, -0.3406982421875, -0.31542205810546875, -0.2901458740234375, -0.26486968994140625, -0.239593505859375, -0.21431732177734375, -0.1890411376953125, -0.16376495361328125, -0.13848876953125, -0.11321258544921875, -0.0879364013671875, -0.06266021728515625, -0.037384033203125, -0.01210784912109375, 0.0131683349609375, 0.03844451904296875, 0.063720703125, 0.08899688720703125, 0.1142730712890625, 0.13954925537109375, 0.164825439453125, 0.19010162353515625, 0.2153778076171875, 0.24065399169921875, 0.26593017578125, 0.29120635986328125, 0.3164825439453125, 0.34175872802734375, 0.367034912109375, 0.39231109619140625, 0.4175872802734375, 0.44286346435546875, 0.4681396484375, 0.49341583251953125, 0.5186920166015625, 0.5439682006835938, 0.569244384765625, 0.5945205688476562, 0.6197967529296875, 0.6450729370117188, 0.67034912109375, 0.6956253051757812, 0.7209014892578125, 0.7461776733398438, 0.771453857421875, 0.7967300415039062, 0.8220062255859375, 0.8472824096679688, 0.87255859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 11.0, 20.0, 27.0, 25.0, 52.0, 70.0, 83.0, 78.0, 83.0, 86.0, 85.0, 88.0, 70.0, 60.0, 45.0, 38.0, 24.0, 17.0, 14.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7853317260742188, -0.7557220458984375, -0.7261123657226562, -0.696502685546875, -0.6668930053710938, -0.6372833251953125, -0.6076736450195312, -0.57806396484375, -0.5484542846679688, -0.5188446044921875, -0.48923492431640625, -0.459625244140625, -0.43001556396484375, -0.4004058837890625, -0.37079620361328125, -0.3411865234375, -0.31157684326171875, -0.2819671630859375, -0.25235748291015625, -0.222747802734375, -0.19313812255859375, -0.1635284423828125, -0.13391876220703125, -0.10430908203125, -0.07469940185546875, -0.0450897216796875, -0.01548004150390625, 0.014129638671875, 0.04373931884765625, 0.0733489990234375, 0.10295867919921875, 0.132568359375, 0.16217803955078125, 0.1917877197265625, 0.22139739990234375, 0.251007080078125, 0.28061676025390625, 0.3102264404296875, 0.33983612060546875, 0.36944580078125, 0.39905548095703125, 0.4286651611328125, 0.45827484130859375, 0.487884521484375, 0.5174942016601562, 0.5471038818359375, 0.5767135620117188, 0.6063232421875, 0.6359329223632812, 0.6655426025390625, 0.6951522827148438, 0.724761962890625, 0.7543716430664062, 0.7839813232421875, 0.8135910034179688, 0.84320068359375, 0.8728103637695312, 0.9024200439453125, 0.9320297241210938, 0.961639404296875, 0.9912490844726562, 1.0208587646484375, 1.0504684448242188, 1.080078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 5.0, 5.0, 13.0, 19.0, 23.0, 31.0, 40.0, 64.0, 76.0, 131.0, 169.0, 285.0, 575.0, 1281.0, 3953.0, 23240.0, 869695.0, 132640.0, 11409.0, 2684.0, 986.0, 454.0, 245.0, 143.0, 103.0, 67.0, 54.0, 41.0, 33.0, 18.0, 13.0, 13.0, 7.0, 16.0, 1.0, 5.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0377197265625, -1.006103515625, -0.9744873046875, -0.94287109375, -0.9112548828125, -0.879638671875, -0.8480224609375, -0.81640625, -0.7847900390625, -0.753173828125, -0.7215576171875, -0.68994140625, -0.6583251953125, -0.626708984375, -0.5950927734375, -0.5634765625, -0.5318603515625, -0.500244140625, -0.4686279296875, -0.43701171875, -0.4053955078125, -0.373779296875, -0.3421630859375, -0.310546875, -0.2789306640625, -0.247314453125, -0.2156982421875, -0.18408203125, -0.1524658203125, -0.120849609375, -0.0892333984375, -0.0576171875, -0.0260009765625, 0.005615234375, 0.0372314453125, 0.06884765625, 0.1004638671875, 0.132080078125, 0.1636962890625, 0.1953125, 0.2269287109375, 0.258544921875, 0.2901611328125, 0.32177734375, 0.3533935546875, 0.385009765625, 0.4166259765625, 0.4482421875, 0.4798583984375, 0.511474609375, 0.5430908203125, 0.57470703125, 0.6063232421875, 0.637939453125, 0.6695556640625, 0.701171875, 0.7327880859375, 0.764404296875, 0.7960205078125, 0.82763671875, 0.8592529296875, 0.890869140625, 0.9224853515625, 0.9541015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 6.0, 7.0, 12.0, 12.0, 14.0, 23.0, 17.0, 20.0, 29.0, 27.0, 28.0, 37.0, 50.0, 65.0, 68.0, 82.0, 73.0, 63.0, 63.0, 41.0, 35.0, 46.0, 23.0, 29.0, 12.0, 19.0, 10.0, 12.0, 11.0, 12.0, 7.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9140625, -1.8535919189453125, -1.793121337890625, -1.7326507568359375, -1.67218017578125, -1.6117095947265625, -1.551239013671875, -1.4907684326171875, -1.4302978515625, -1.3698272705078125, -1.309356689453125, -1.2488861083984375, -1.18841552734375, -1.1279449462890625, -1.067474365234375, -1.0070037841796875, -0.946533203125, -0.8860626220703125, -0.825592041015625, -0.7651214599609375, -0.70465087890625, -0.6441802978515625, -0.583709716796875, -0.5232391357421875, -0.4627685546875, -0.4022979736328125, -0.341827392578125, -0.2813568115234375, -0.22088623046875, -0.1604156494140625, -0.099945068359375, -0.0394744873046875, 0.02099609375, 0.0814666748046875, 0.141937255859375, 0.2024078369140625, 0.26287841796875, 0.3233489990234375, 0.383819580078125, 0.4442901611328125, 0.5047607421875, 0.5652313232421875, 0.625701904296875, 0.6861724853515625, 0.74664306640625, 0.8071136474609375, 0.867584228515625, 0.9280548095703125, 0.988525390625, 1.0489959716796875, 1.109466552734375, 1.1699371337890625, 1.23040771484375, 1.2908782958984375, 1.351348876953125, 1.4118194580078125, 1.4722900390625, 1.5327606201171875, 1.593231201171875, 1.6537017822265625, 1.71417236328125, 1.7746429443359375, 1.835113525390625, 1.8955841064453125, 1.9560546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 9.0, 8.0, 8.0, 11.0, 8.0, 16.0, 21.0, 31.0, 27.0, 51.0, 60.0, 85.0, 137.0, 208.0, 359.0, 731.0, 1414.0, 3419.0, 11484.0, 65448.0, 893143.0, 55206.0, 10485.0, 3328.0, 1233.0, 620.0, 341.0, 190.0, 144.0, 88.0, 53.0, 45.0, 34.0, 21.0, 22.0, 19.0, 17.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.11536693572998047, -0.11116600036621094, -0.1069650650024414, -0.10276412963867188, -0.09856319427490234, -0.09436225891113281, -0.09016132354736328, -0.08596038818359375, -0.08175945281982422, -0.07755851745605469, -0.07335758209228516, -0.06915664672851562, -0.0649557113647461, -0.06075477600097656, -0.05655384063720703, -0.0523529052734375, -0.04815196990966797, -0.04395103454589844, -0.039750099182128906, -0.035549163818359375, -0.031348228454589844, -0.027147293090820312, -0.02294635772705078, -0.01874542236328125, -0.014544486999511719, -0.010343551635742188, -0.006142616271972656, -0.001941680908203125, 0.0022592544555664062, 0.0064601898193359375, 0.010661125183105469, 0.014862060546875, 0.01906299591064453, 0.023263931274414062, 0.027464866638183594, 0.031665802001953125, 0.035866737365722656, 0.04006767272949219, 0.04426860809326172, 0.04846954345703125, 0.05267047882080078, 0.05687141418457031, 0.061072349548339844, 0.06527328491210938, 0.0694742202758789, 0.07367515563964844, 0.07787609100341797, 0.0820770263671875, 0.08627796173095703, 0.09047889709472656, 0.0946798324584961, 0.09888076782226562, 0.10308170318603516, 0.10728263854980469, 0.11148357391357422, 0.11568450927734375, 0.11988544464111328, 0.12408638000488281, 0.12828731536865234, 0.13248825073242188, 0.1366891860961914, 0.14089012145996094, 0.14509105682373047, 0.1492919921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 10.0, 6.0, 11.0, 6.0, 18.0, 16.0, 20.0, 33.0, 55.0, 59.0, 83.0, 100.0, 107.0, 97.0, 94.0, 56.0, 50.0, 35.0, 25.0, 20.0, 13.0, 17.0, 6.0, 15.0, 8.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7477741241455078e-05, -2.6518478989601135e-05, -2.5559216737747192e-05, -2.459995448589325e-05, -2.3640692234039307e-05, -2.2681429982185364e-05, -2.172216773033142e-05, -2.0762905478477478e-05, -1.9803643226623535e-05, -1.8844380974769592e-05, -1.788511872291565e-05, -1.6925856471061707e-05, -1.5966594219207764e-05, -1.500733196735382e-05, -1.4048069715499878e-05, -1.3088807463645935e-05, -1.2129545211791992e-05, -1.117028295993805e-05, -1.0211020708084106e-05, -9.251758456230164e-06, -8.29249620437622e-06, -7.333233952522278e-06, -6.373971700668335e-06, -5.414709448814392e-06, -4.455447196960449e-06, -3.4961849451065063e-06, -2.5369226932525635e-06, -1.5776604413986206e-06, -6.183981895446777e-07, 3.4086406230926514e-07, 1.300126314163208e-06, 2.259388566017151e-06, 3.2186508178710938e-06, 4.177913069725037e-06, 5.1371753215789795e-06, 6.096437573432922e-06, 7.055699825286865e-06, 8.014962077140808e-06, 8.974224328994751e-06, 9.933486580848694e-06, 1.0892748832702637e-05, 1.185201108455658e-05, 1.2811273336410522e-05, 1.3770535588264465e-05, 1.4729797840118408e-05, 1.568906009197235e-05, 1.6648322343826294e-05, 1.7607584595680237e-05, 1.856684684753418e-05, 1.9526109099388123e-05, 2.0485371351242065e-05, 2.1444633603096008e-05, 2.240389585494995e-05, 2.3363158106803894e-05, 2.4322420358657837e-05, 2.528168261051178e-05, 2.6240944862365723e-05, 2.7200207114219666e-05, 2.815946936607361e-05, 2.911873161792755e-05, 3.0077993869781494e-05, 3.103725612163544e-05, 3.199651837348938e-05, 3.295578062534332e-05, 3.3915042877197266e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 8.0, 10.0, 8.0, 14.0, 11.0, 32.0, 39.0, 57.0, 80.0, 121.0, 169.0, 304.0, 531.0, 929.0, 1821.0, 3966.0, 10424.0, 34538.0, 604598.0, 338478.0, 34035.0, 10322.0, 3990.0, 1791.0, 903.0, 500.0, 303.0, 188.0, 130.0, 88.0, 60.0, 26.0, 23.0, 12.0, 13.0, 2.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08740234375, -0.08458232879638672, -0.08176231384277344, -0.07894229888916016, -0.07612228393554688, -0.0733022689819336, -0.07048225402832031, -0.06766223907470703, -0.06484222412109375, -0.06202220916748047, -0.05920219421386719, -0.056382179260253906, -0.053562164306640625, -0.050742149353027344, -0.04792213439941406, -0.04510211944580078, -0.0422821044921875, -0.03946208953857422, -0.03664207458496094, -0.033822059631347656, -0.031002044677734375, -0.028182029724121094, -0.025362014770507812, -0.02254199981689453, -0.01972198486328125, -0.01690196990966797, -0.014081954956054688, -0.011261940002441406, -0.008441925048828125, -0.005621910095214844, -0.0028018951416015625, 1.811981201171875e-05, 0.002838134765625, 0.005658149719238281, 0.008478164672851562, 0.011298179626464844, 0.014118194580078125, 0.016938209533691406, 0.019758224487304688, 0.02257823944091797, 0.02539825439453125, 0.02821826934814453, 0.031038284301757812, 0.033858299255371094, 0.036678314208984375, 0.039498329162597656, 0.04231834411621094, 0.04513835906982422, 0.0479583740234375, 0.05077838897705078, 0.05359840393066406, 0.056418418884277344, 0.059238433837890625, 0.062058448791503906, 0.06487846374511719, 0.06769847869873047, 0.07051849365234375, 0.07333850860595703, 0.07615852355957031, 0.0789785385131836, 0.08179855346679688, 0.08461856842041016, 0.08743858337402344, 0.09025859832763672, 0.09307861328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 4.0, 4.0, 8.0, 9.0, 11.0, 15.0, 19.0, 16.0, 31.0, 47.0, 97.0, 79.0, 117.0, 148.0, 112.0, 85.0, 55.0, 42.0, 18.0, 14.0, 12.0, 11.0, 8.0, 7.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197509765625, -0.19135475158691406, -0.18519973754882812, -0.1790447235107422, -0.17288970947265625, -0.1667346954345703, -0.16057968139648438, -0.15442466735839844, -0.1482696533203125, -0.14211463928222656, -0.13595962524414062, -0.1298046112060547, -0.12364959716796875, -0.11749458312988281, -0.11133956909179688, -0.10518455505371094, -0.099029541015625, -0.09287452697753906, -0.08671951293945312, -0.08056449890136719, -0.07440948486328125, -0.06825447082519531, -0.062099456787109375, -0.05594444274902344, -0.0497894287109375, -0.04363441467285156, -0.037479400634765625, -0.03132438659667969, -0.02516937255859375, -0.019014358520507812, -0.012859344482421875, -0.0067043304443359375, -0.00054931640625, 0.0056056976318359375, 0.011760711669921875, 0.017915725708007812, 0.02407073974609375, 0.030225753784179688, 0.036380767822265625, 0.04253578186035156, 0.0486907958984375, 0.05484580993652344, 0.061000823974609375, 0.06715583801269531, 0.07331085205078125, 0.07946586608886719, 0.08562088012695312, 0.09177589416503906, 0.097930908203125, 0.10408592224121094, 0.11024093627929688, 0.11639595031738281, 0.12255096435546875, 0.1287059783935547, 0.13486099243164062, 0.14101600646972656, 0.1471710205078125, 0.15332603454589844, 0.15948104858398438, 0.1656360626220703, 0.17179107666015625, 0.1779460906982422, 0.18410110473632812, 0.19025611877441406, 0.1964111328125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 14.0, 18.0, 26.0, 54.0, 103.0, 551.0, 123.0, 44.0, 32.0, 13.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.00898551940918, -8.749051094055176, -8.489115715026855, -8.229181289672852, -7.9692463874816895, -7.709311485290527, -7.449377059936523, -7.189442157745361, -6.929507255554199, -6.669572353363037, -6.409637451171875, -6.149703025817871, -5.889768123626709, -5.629833221435547, -5.369898796081543, -5.109963893890381, -4.850028991699219, -4.590094089508057, -4.3301591873168945, -4.070224761962891, -3.8102898597717285, -3.5503549575805664, -3.2904202938079834, -3.0304856300354004, -2.7705507278442383, -2.510615825653076, -2.250681161880493, -1.9907463788986206, -1.730811595916748, -1.4708768129348755, -1.210942029953003, -0.9510072469711304, -0.6910734176635742, -0.43113863468170166, -0.1712038516998291, 0.08873093128204346, 0.348665714263916, 0.6086004972457886, 0.8685352802276611, 1.1284700632095337, 1.3884048461914062, 1.6483396291732788, 1.9082744121551514, 2.1682090759277344, 2.4281439781188965, 2.6880788803100586, 2.9480135440826416, 3.2079482078552246, 3.4678831100463867, 3.727818012237549, 3.987752676010132, 4.247687339782715, 4.507622241973877, 4.767557144165039, 5.027491569519043, 5.287426471710205, 5.547361373901367, 5.807296276092529, 6.067231178283691, 6.327165603637695, 6.587100505828857, 6.8470354080200195, 7.106969833374023, 7.3669047355651855, 7.626839637756348]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 10.0, 4.0, 5.0, 9.0, 4.0, 8.0, 7.0, 12.0, 19.0, 19.0, 13.0, 20.0, 14.0, 23.0, 27.0, 27.0, 81.0, 311.0, 128.0, 42.0, 31.0, 20.0, 19.0, 17.0, 21.0, 17.0, 20.0, 15.0, 11.0, 8.0, 6.0, 10.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8000617027282715, -6.609169960021973, -6.418278217315674, -6.227386474609375, -6.036495208740234, -5.8456034660339355, -5.654711723327637, -5.463819980621338, -5.272928237915039, -5.08203649520874, -4.891144752502441, -4.700253486633301, -4.509361743927002, -4.318470001220703, -4.127578258514404, -3.9366865158081055, -3.745795249938965, -3.554903507232666, -3.3640120029449463, -3.1731202602386475, -2.9822287559509277, -2.791337013244629, -2.60044527053833, -2.4095535278320312, -2.2186620235443115, -2.0277702808380127, -1.836878776550293, -1.6459870338439941, -1.4550954103469849, -1.2642037868499756, -1.0733120441436768, -0.8824204206466675, -0.6915283203125, -0.5006366968154907, -0.30974501371383667, -0.11885333061218262, 0.07203829288482666, 0.26292991638183594, 0.45382165908813477, 0.644713282585144, 0.8356049060821533, 1.0264965295791626, 1.2173881530761719, 1.4082798957824707, 1.59917151927948, 1.7900631427764893, 1.980954885482788, 2.171846389770508, 2.3627381324768066, 2.5536298751831055, 2.744521379470825, 2.935413122177124, 3.1263046264648438, 3.3171963691711426, 3.5080881118774414, 3.6989798545837402, 3.88987135887146, 4.08076286315918, 4.2716546058654785, 4.462546348571777, 4.653438091278076, 4.844329833984375, 5.035221099853516, 5.2261128425598145, 5.417004585266113]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 11.0, 23.0, 26.0, 22.0, 26.0, 31.0, 22.0, 43.0, 64.0, 246.0, 131.0, 51.0, 44.0, 32.0, 28.0, 30.0, 22.0, 21.0, 21.0, 14.0, 10.0, 6.0, 9.0, 3.0, 2.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.3615837097167969, -0.34645843505859375, -0.3313331604003906, -0.3162078857421875, -0.3010826110839844, -0.28595733642578125, -0.2708320617675781, -0.255706787109375, -0.24058151245117188, -0.22545623779296875, -0.21033096313476562, -0.1952056884765625, -0.18008041381835938, -0.16495513916015625, -0.14982986450195312, -0.13470458984375, -0.11957931518554688, -0.10445404052734375, -0.08932876586914062, -0.0742034912109375, -0.059078216552734375, -0.04395294189453125, -0.028827667236328125, -0.013702392578125, 0.001422882080078125, 0.01654815673828125, 0.031673431396484375, 0.0467987060546875, 0.061923980712890625, 0.07704925537109375, 0.09217453002929688, 0.1072998046875, 0.12242507934570312, 0.13755035400390625, 0.15267562866210938, 0.1678009033203125, 0.18292617797851562, 0.19805145263671875, 0.21317672729492188, 0.228302001953125, 0.24342727661132812, 0.25855255126953125, 0.2736778259277344, 0.2888031005859375, 0.3039283752441406, 0.31905364990234375, 0.3341789245605469, 0.34930419921875, 0.3644294738769531, 0.37955474853515625, 0.3946800231933594, 0.4098052978515625, 0.4249305725097656, 0.44005584716796875, 0.4551811218261719, 0.470306396484375, 0.4854316711425781, 0.5005569458007812, 0.5156822204589844, 0.5308074951171875, 0.5459327697753906, 0.5610580444335938, 0.5761833190917969, 0.59130859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 9.0, 4.0, 3.0, 2.0, 1.0, 11.0, 19.0, 41.0, 44.0, 65.0, 128.0, 191.0, 824.0, 5322.0, 8358822.0, 20685.0, 1623.0, 395.0, 147.0, 70.0, 32.0, 31.0, 27.0, 19.0, 17.0, 14.0, 12.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-5.298147201538086, -5.113656997680664, -4.929166793823242, -4.74467658996582, -4.560186386108398, -4.375696182250977, -4.191205978393555, -4.006715774536133, -3.82222580909729, -3.637735605239868, -3.4532454013824463, -3.2687554359436035, -3.0842652320861816, -2.8997750282287598, -2.715284824371338, -2.530794620513916, -2.346304416656494, -2.1618142127990723, -1.9773240089416504, -1.792833924293518, -1.6083437204360962, -1.4238535165786743, -1.239363431930542, -1.0548732280731201, -0.8703830242156982, -0.6858928203582764, -0.5014026761054993, -0.31691253185272217, -0.1324223279953003, 0.05206787586212158, 0.2365579605102539, 0.4210481643676758, 0.6055383682250977, 0.7900285720825195, 0.9745187163352966, 1.1590088605880737, 1.3434990644454956, 1.5279892683029175, 1.7124793529510498, 1.8969695568084717, 2.0814597606658936, 2.2659499645233154, 2.4504401683807373, 2.63493013381958, 2.819420337677002, 3.003910541534424, 3.1884007453918457, 3.3728909492492676, 3.5573811531066895, 3.7418713569641113, 3.926361560821533, 4.110851764678955, 4.295341968536377, 4.479832172393799, 4.6643218994140625, 4.848812103271484, 5.033302307128906, 5.217792510986328, 5.40228271484375, 5.586772918701172, 5.771263122558594, 5.955753326416016, 6.1402435302734375, 6.324733734130859, 6.509223937988281]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.173997402191162, -7.003606796264648, -6.833216190338135, -6.662825584411621, -6.492434978485107, -6.322044372558594, -6.151654243469238, -5.981263637542725, -5.810873031616211, -5.640482425689697, -5.470091819763184, -5.29970121383667, -5.129310607910156, -4.958920478820801, -4.788529396057129, -4.618139266967773, -4.447748184204102, -4.277357578277588, -4.106966972351074, -3.9365763664245605, -3.766185998916626, -3.5957953929901123, -3.4254047870635986, -3.255014419555664, -3.0846238136291504, -2.9142332077026367, -2.743842601776123, -2.5734519958496094, -2.403061628341675, -2.232671022415161, -2.0622804164886475, -1.8918899297714233, -1.7214992046356201, -1.5511085987091064, -1.3807181119918823, -1.2103275060653687, -1.0399370193481445, -0.8695464134216309, -0.6991558074951172, -0.5287653207778931, -0.3583747148513794, -0.1879841536283493, -0.017593592405319214, 0.15279698371887207, 0.32318753004074097, 0.49357807636260986, 0.6639686822891235, 0.8343591690063477, 1.0047497749328613, 1.175140380859375, 1.3455308675765991, 1.5159214735031128, 1.686311960220337, 1.8567025661468506, 2.0270931720733643, 2.197483539581299, 2.3678741455078125, 2.538264751434326, 2.70865535736084, 2.8790459632873535, 3.049436330795288, 3.2198269367218018, 3.3902175426483154, 3.56060791015625, 3.7309987545013428]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 7.0, 6.0, 17.0, 29.0, 29.0, 52.0, 75.0, 94.0, 171.0, 319.0, 549.0, 1379.0, 3720.0, 10970.0, 36040.0, 128077.0, 225116.0, 81096.0, 23669.0, 7563.0, 2767.0, 1218.0, 522.0, 278.0, 156.0, 112.0, 59.0, 51.0, 25.0, 27.0, 18.0, 12.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.462890625, -3.372528076171875, -3.28216552734375, -3.191802978515625, -3.1014404296875, -3.011077880859375, -2.92071533203125, -2.830352783203125, -2.739990234375, -2.649627685546875, -2.55926513671875, -2.468902587890625, -2.3785400390625, -2.288177490234375, -2.19781494140625, -2.107452392578125, -2.01708984375, -1.926727294921875, -1.83636474609375, -1.746002197265625, -1.6556396484375, -1.565277099609375, -1.47491455078125, -1.384552001953125, -1.294189453125, -1.203826904296875, -1.11346435546875, -1.023101806640625, -0.9327392578125, -0.842376708984375, -0.75201416015625, -0.661651611328125, -0.5712890625, -0.480926513671875, -0.39056396484375, -0.300201416015625, -0.2098388671875, -0.119476318359375, -0.02911376953125, 0.061248779296875, 0.151611328125, 0.241973876953125, 0.33233642578125, 0.422698974609375, 0.5130615234375, 0.603424072265625, 0.69378662109375, 0.784149169921875, 0.87451171875, 0.964874267578125, 1.05523681640625, 1.145599365234375, 1.2359619140625, 1.326324462890625, 1.41668701171875, 1.507049560546875, 1.597412109375, 1.687774658203125, 1.77813720703125, 1.868499755859375, 1.9588623046875, 2.049224853515625, 2.13958740234375, 2.229949951171875, 2.3203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 14.0, 8.0, 10.0, 21.0, 36.0, 48.0, 60.0, 83.0, 90.0, 106.0, 116.0, 103.0, 83.0, 74.0, 43.0, 33.0, 24.0, 19.0, 9.0, 10.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8443374633789062, -0.8131866455078125, -0.7820358276367188, -0.750885009765625, -0.7197341918945312, -0.6885833740234375, -0.6574325561523438, -0.62628173828125, -0.5951309204101562, -0.5639801025390625, -0.5328292846679688, -0.501678466796875, -0.47052764892578125, -0.4393768310546875, -0.40822601318359375, -0.3770751953125, -0.34592437744140625, -0.3147735595703125, -0.28362274169921875, -0.252471923828125, -0.22132110595703125, -0.1901702880859375, -0.15901947021484375, -0.12786865234375, -0.09671783447265625, -0.0655670166015625, -0.03441619873046875, -0.003265380859375, 0.02788543701171875, 0.0590362548828125, 0.09018707275390625, 0.121337890625, 0.15248870849609375, 0.1836395263671875, 0.21479034423828125, 0.245941162109375, 0.27709197998046875, 0.3082427978515625, 0.33939361572265625, 0.37054443359375, 0.40169525146484375, 0.4328460693359375, 0.46399688720703125, 0.495147705078125, 0.5262985229492188, 0.5574493408203125, 0.5886001586914062, 0.6197509765625, 0.6509017944335938, 0.6820526123046875, 0.7132034301757812, 0.744354248046875, 0.7755050659179688, 0.8066558837890625, 0.8378067016601562, 0.86895751953125, 0.9001083374023438, 0.9312591552734375, 0.9624099731445312, 0.993560791015625, 1.0247116088867188, 1.0558624267578125, 1.0870132446289062, 1.1181640625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 18.0, 54.0, 144.0, 162.0, 52.0, 19.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0163381099700928, -1.7889056205749512, -1.5614731311798096, -1.3340405225753784, -1.1066080331802368, -0.8791755437850952, -0.6517429351806641, -0.42431044578552246, -0.19687795639038086, 0.03055456280708313, 0.2579870820045471, 0.4854196310043335, 0.7128521203994751, 0.9402846097946167, 1.1677172183990479, 1.3951497077941895, 1.622582197189331, 1.8500146865844727, 2.0774471759796143, 2.304879665374756, 2.5323123931884766, 2.759744644165039, 2.9871773719787598, 3.2146098613739014, 3.442042350769043, 3.6694748401641846, 3.896907329559326, 4.124340057373047, 4.351772308349609, 4.57920503616333, 4.806637763977051, 5.034070014953613, 5.261502265930176, 5.4889349937438965, 5.716367244720459, 5.94379997253418, 6.171232223510742, 6.398664951324463, 6.626097679138184, 6.853529930114746, 7.080962181091309, 7.308394908905029, 7.535827159881592, 7.7632598876953125, 7.990692138671875, 8.218124389648438, 8.445557594299316, 8.672989845275879, 8.900423049926758, 9.12785530090332, 9.3552885055542, 9.582720756530762, 9.810153007507324, 10.037585258483887, 10.265018463134766, 10.492450714111328, 10.71988296508789, 10.947315216064453, 11.174748420715332, 11.402180671691895, 11.629612922668457, 11.85704517364502, 12.084478378295898, 12.311910629272461, 12.539342880249023]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 1.0, 0.0, 2.0, 8.0, 5.0, 5.0, 11.0, 11.0, 13.0, 26.0, 42.0, 47.0, 66.0, 53.0, 65.0, 36.0, 31.0, 11.0, 13.0, 6.0, 4.0, 2.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.1472978591918945, -4.041693687438965, -3.936089515686035, -3.8304853439331055, -3.724881410598755, -3.619277238845825, -3.5136730670928955, -3.408068895339966, -3.3024649620056152, -3.1968607902526855, -3.091256618499756, -2.985652446746826, -2.8800485134124756, -2.774444341659546, -2.668840169906616, -2.5632359981536865, -2.457631826400757, -2.352027654647827, -2.2464234828948975, -2.140819549560547, -2.035215377807617, -1.9296112060546875, -1.8240070343017578, -1.7184028625488281, -1.612798810005188, -1.5071946382522583, -1.4015905857086182, -1.2959864139556885, -1.1903822422027588, -1.0847781896591187, -0.979174017906189, -0.873569905757904, -0.7679657936096191, -0.6623616814613342, -0.5567575693130493, -0.45115339756011963, -0.3455492854118347, -0.2399451732635498, -0.13434100151062012, -0.028736889362335205, 0.07686722278594971, 0.1824713498353958, 0.2880754768848419, 0.3936796188354492, 0.49928373098373413, 0.604887843132019, 0.7104920148849487, 0.8160961270332336, 0.9217002391815186, 1.0273044109344482, 1.1329084634780884, 1.238512635231018, 1.3441166877746582, 1.449720859527588, 1.5553250312805176, 1.6609292030334473, 1.7665332555770874, 1.872137427330017, 1.9777414798736572, 2.083345651626587, 2.1889498233795166, 2.294553756713867, 2.400157928466797, 2.5057621002197266, 2.6113662719726562]}, "train/train_runtime": 5163.9194, "train/train_samples_per_second": 5.526, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.298295111399595, "eval/loss": 4.195079803466797, "eval/wer": 2.3244744149147163, "eval/runtime": 1122.559, "eval/samples_per_second": 2.354, "eval/steps_per_second": 0.295, "_wandb": {"runtime": 6633}}